diff --git a/.agent/self-learning/.gitignore b/.agent/self-learning/.gitignore
new file mode 100644
index 000000000..5b7b12729
--- /dev/null
+++ b/.agent/self-learning/.gitignore
@@ -0,0 +1,2 @@
+fallback-counts.json
+*.bak
diff --git a/.agent/self-learning/INDEX.md b/.agent/self-learning/INDEX.md
new file mode 100644
index 000000000..87ee14155
--- /dev/null
+++ b/.agent/self-learning/INDEX.md
@@ -0,0 +1,10 @@
+# Lessons Index
+
+Read this index every turn. Each entry below is a routing condition.
+If a `Use when ...` condition matches the current task, read the full lesson file.
+
+
+
+
+- [build-before-running-examples](lessons/2026-05-14-build-before-running-examples.md) — Use when starting any tanstack/ai example dev server — build workspace packages first
+
diff --git a/.agent/self-learning/config.yml b/.agent/self-learning/config.yml
new file mode 100644
index 000000000..b9e1e5e96
--- /dev/null
+++ b/.agent/self-learning/config.yml
@@ -0,0 +1,15 @@
+# Self-improve plugin behavior knobs. Edit and commit per repo.
+correction_detection:
+  enabled: true
+  regex_strictness: loose # loose | strict
+coupling_detection:
+  enabled: true
+  regex_strictness: loose
+enforcement:
+  pre_push_block: true # false = warn only, do not block push
+curation:
+  default_interval_days: 30
+promotion:
+  auto_suggest_global: true
+  skill_improve_threshold: 3
+skills_repo: ~/.claude/skills
diff --git a/.agent/self-learning/coupling.json b/.agent/self-learning/coupling.json
new file mode 100644
index 000000000..1a7826a75
--- /dev/null
+++ b/.agent/self-learning/coupling.json
@@ -0,0 +1,4 @@
+{
+  "$schema": "./coupling.schema.json",
+  "couplings": []
+}
diff --git a/.agent/self-learning/curation-state.yml b/.agent/self-learning/curation-state.yml
new file mode 100644
index 000000000..1f8bb0ab5
--- /dev/null
+++ b/.agent/self-learning/curation-state.yml
@@ -0,0 +1,3 @@
+last_curated: 2026-05-14
+next_nag: 2026-06-13
+default_interval_days: 30
diff --git a/.agent/self-learning/lessons/2026-05-14-build-before-running-examples.md b/.agent/self-learning/lessons/2026-05-14-build-before-running-examples.md
new file mode 100644
index 000000000..62bfaaa06
--- /dev/null
+++ b/.agent/self-learning/lessons/2026-05-14-build-before-running-examples.md
@@ -0,0 +1,19 @@
+---
+name: build-before-running-examples
+description: Use when starting any tanstack/ai example dev server — build workspace packages first
+tags: [monorepo, examples, dev-workflow, build]
+scope: repo
+source:
+  type: auto-captured
+  created: 2026-05-14T13:05:00Z
+related_skill: null
+related: []
+---
+
+# Build Workspace Packages Before Running Examples
+
+**Rule:** Run `pnpm -w run build:all` from the repo root before starting any example dev server (`examples/ts-react-chat`, `ts-solid-chat`, `ts-vue-chat`, `ts-svelte-chat`, `vanilla-chat`, `php-slim`, `python-fastapi`, `ts-group-chat`).
+
+**Why:** "this was a mistake by you, you should always build packages inside of this repo before you run the examples" — examples import workspace packages (`@tanstack/ai`, `@tanstack/react-ai-devtools`, `@tanstack/ai-devtools-core`, etc.) via `workspace:*` and resolve through each package's `exports` field pointing at `dist/`. If `dist/` is missing for any package — including transitive ones — vite's dep-scan fails and SSR returns a 500. Fixing the first missing package one at a time wastes round-trips: I tried `pnpm --filter @tanstack/react-ai-devtools build`, hit a missing `@tanstack/ai-devtools-core`, etc. The cure is one command up front.
+
+**How to apply:** Before any `pnpm --filter "<example>" dev` (or running an example via its own directory), run `pnpm -w run build:all` from the worktree root. Nx caches the build so re-runs are cheap. Skip only if the user has just explicitly said the workspace is freshly built.
diff --git a/.agent/self-learning/lessons/promoted/.gitkeep b/.agent/self-learning/lessons/promoted/.gitkeep
new file mode 100644
index 000000000..e69de29bb
diff --git a/.changeset/decouple-openrouter-collapse-openai-base.md b/.changeset/decouple-openrouter-collapse-openai-base.md
deleted file mode 100644
index 3dab48e95..000000000
--- a/.changeset/decouple-openrouter-collapse-openai-base.md
+++ /dev/null
@@ -1,35 +0,0 @@
----
-'@tanstack/openai-base': minor
-'@tanstack/ai-openai': patch
-'@tanstack/ai-grok': patch
-'@tanstack/ai-groq': patch
-'@tanstack/ai-openrouter': patch
----
-
-Decouple `@tanstack/ai-openrouter` from the shared OpenAI base, and collapse the base into a thinner shim over the `openai` SDK.
-
-Three changes that ship together:
-
-**1. Rename `@tanstack/ai-openai-compatible` → `@tanstack/openai-base`.** The previous name implied a multi-vendor protocol surface. After ai-openrouter is decoupled (see below), the only remaining consumers (`ai-openai`, `ai-grok`, `ai-groq`) all back onto the `openai` SDK with a different `baseURL` — "base" describes that role accurately. Imports change:
-
-```diff
-- import { OpenAICompatibleChatCompletionsTextAdapter } from '@tanstack/ai-openai-compatible'
-+ import { OpenAIBaseChatCompletionsTextAdapter } from '@tanstack/openai-base'
-- import { OpenAICompatibleResponsesTextAdapter } from '@tanstack/ai-openai-compatible'
-+ import { OpenAIBaseResponsesTextAdapter } from '@tanstack/openai-base'
-```
-
-`@tanstack/ai-openai-compatible@0.2.x` remains published for anyone with a pinned lockfile reference but will receive no further updates.
-
-**2. `@tanstack/openai-base` adopts the `openai` SDK directly.** The previous package vendored ~720 LOC of hand-written wire-format types (`ChatCompletion`, `ResponseStreamEvent`, etc.) and exposed abstract `callChatCompletion*` / `callResponse*` hooks subclasses had to implement. Both are gone:
-
-- The base now depends on `openai` again and imports types directly from `openai/resources/...`. The vendored `src/types/` directory is removed; consumers that imported wire types from the package (e.g. `import type { ResponseInput } from '@tanstack/ai-openai-compatible'`) should now import from the openai SDK.
-- The abstract SDK-call methods are removed. The base constructor takes a pre-built `OpenAI` client (`new OpenAIBaseChatCompletionsTextAdapter(model, name, openaiClient)`) and calls `client.chat.completions.create` / `client.responses.create` itself. Subclasses (`ai-openai`, `ai-grok`, `ai-groq`) now just construct the SDK with their provider-specific `baseURL` and pass it to `super` — `callChatCompletion*` / `callResponse*` overrides go away.
-
-The other extension hooks (`extractReasoning`, `extractTextFromResponse`, `processStreamChunks`, `makeStructuredOutputCompatible`, `transformStructuredOutput`, `mapOptionsToRequest`, `convertMessage`) remain. Groq's `processStreamChunks` and `makeStructuredOutputCompatible` overrides (for `x_groq.usage` promotion and Groq's structured-output schema quirks) are unchanged.
-
-**3. Decouple `@tanstack/ai-openrouter` from the OpenAI base entirely.** OpenRouter ships its own SDK (`@openrouter/sdk`) with a camelCase shape, so inheriting from the OpenAI-shaped base forced a snake_case ↔ camelCase round-trip on every request and stream event. ai-openrouter now extends `BaseTextAdapter` directly and inlines its own stream processors (`OpenRouterTextAdapter` for chat-completions, `OpenRouterResponsesTextAdapter` for the Responses beta), reading OpenRouter's camelCase types natively. The `@tanstack/openai-base` and `openai` dependencies are removed from ai-openrouter; only `@openrouter/sdk`, `@tanstack/ai`, and `@tanstack/ai-utils` remain.
-
-Public API is unchanged: `openRouterText`, `openRouterResponsesText`, `createOpenRouterText`, `createOpenRouterResponsesText`, the OpenRouter tool factories, provider routing surface (`provider`, `models`, `plugins`, `variant`, `transforms`), app attribution headers (`httpReferer`, `appTitle`), `:variant` model suffixing, `RequestAbortedError` propagation, and the OpenRouter-specific structured-output null-preservation all behave the same. The ~300 LOC of inbound/outbound shape converters (`toOpenRouterRequest`, `toChatCompletion`, `adaptOpenRouterStreamChunks`, `toSnakeResponseResult`, …) are gone.
-
-`ai-ollama` remains on `BaseTextAdapter` directly — its native API uses a different wire format from Chat Completions and was never on the shared base.
diff --git a/.changeset/openrouter-narrow-stream-chunk-types.md b/.changeset/openrouter-narrow-stream-chunk-types.md
deleted file mode 100644
index 2d2e2fc2b..000000000
--- a/.changeset/openrouter-narrow-stream-chunk-types.md
+++ /dev/null
@@ -1,5 +0,0 @@
----
-'@tanstack/ai-openrouter': patch
----
-
-Internal: drop the remaining duck-typed `as { ... }` casts on stream chunks in `OpenRouterResponsesTextAdapter`. Five sites (`response.created/in_progress/incomplete/failed` model + error capture, `response.content_part.added/done` payload, and the `response.completed` function-call detection) now narrow via the SDK's discriminated unions directly. Behaviourally identical; reduces the chance of an SDK type rename silently slipping past us.
diff --git a/.changeset/streaming-structured-output.md b/.changeset/streaming-structured-output.md
new file mode 100644
index 000000000..d5a3d65e8
--- /dev/null
+++ b/.changeset/streaming-structured-output.md
@@ -0,0 +1,95 @@
+---
+'@tanstack/ai': minor
+'@tanstack/openai-base': minor
+'@tanstack/ai-openai': minor
+'@tanstack/ai-grok': minor
+'@tanstack/ai-groq': minor
+'@tanstack/ai-openrouter': minor
+'@tanstack/ai-react': minor
+'@tanstack/ai-vue': minor
+'@tanstack/ai-solid': minor
+'@tanstack/ai-svelte': minor
+'@tanstack/ai-anthropic': patch
+'@tanstack/ai-gemini': patch
+'@tanstack/ai-ollama': patch
+---
+
+Streaming structured output across the OpenAI-compatible providers, an OpenAI Chat Completions sibling adapter, a summarize-subsystem unification, and the decoupling of `@tanstack/ai-openrouter` from the shared OpenAI base.
+
+## Core — `@tanstack/ai`
+
+- New `chat({ outputSchema, stream: true })` overload returning `StructuredOutputStream<InferSchemaType<TSchema>>`. The stream yields raw JSON deltas via `TEXT_MESSAGE_CONTENT` plus a terminal `CUSTOM` `structured-output.complete` event whose `value.object` is typed against the caller's schema with no helper or cast required.
+- `StructuredOutputStream` is a discriminated union over three tagged `CUSTOM` variants — `structured-output.complete`, `approval-requested`, and `tool-input-available` (new `ApprovalRequestedEvent` / `ToolInputAvailableEvent` interfaces exported from `@tanstack/ai`). Narrowing on `chunk.type === 'CUSTOM'` plus the `chunk.name` literal resolves `chunk.value` to the exact shape per variant. The bare `CustomEvent` (with `value: any`) is deliberately excluded to keep the narrow from collapsing to `any`; user-emitted events via the `emitCustomEvent` context API still flow at runtime and are documented as a small residual gap.
+- Activity-layer hardening: always-finalise after the stream loop (no silent hangs on a missing `finishReason`), typed `RUN_ERROR` on empty content, mid-stream provider errors terminate cleanly, and schema-validation failures carry `runId / model / timestamp`.
+- `fallbackStructuredOutputStream` in the activity layer is the single source of truth for adapters that don't implement `structuredOutputStream` natively; `BaseTextAdapter` no longer ships a default.
+- `ChatStreamSummarizeAdapter.summarizeStream` accumulates summary text and emits a terminal `CUSTOM` `generation:result` event before the final `RUN_FINISHED`. Fixes `useSummarize` never populating `result` over streaming connections (the client only sets `result` on that specific CUSTOM event).
+- `SummarizationOptions` is now generic in `TProviderOptions` and `modelOptions` is plumbed through end-to-end (previously silently dropped by `runSummarize` / `runStreamingSummarize`).
+
+## Framework hooks — `@tanstack/ai-react`, `@tanstack/ai-vue`, `@tanstack/ai-solid`, `@tanstack/ai-svelte`
+
+`useChat` (React/Vue/Solid) and `createChat` (Svelte) now accept an `outputSchema` option mirroring `chat({ outputSchema })` on the server. When supplied, the hook's return adds two managed reactive fields:
+
+- `partial` — the live progressive object, typed `DeepPartial<InferSchemaType<TSchema>>`. Updated from `TEXT_MESSAGE_CONTENT` deltas via `parsePartialJSON`. Resets on every new run.
+- `final` — the validated terminal payload from the `structured-output.complete` event, typed `InferSchemaType<TSchema> | null`. `null` until the run completes.
+
+Both fields are typed against the schema with no helper or cast — each hook is generic on `TSchema` and conditionally adds the fields to the return type. Without `outputSchema`, the return type is unchanged. Works the same for streaming and non-streaming endpoints — for non-streaming, `partial` stays `{}` and `final` snaps when the single terminal event arrives. Reasoning text and tool calls aren't surfaced as separate hook fields — they're already on `messages[…].parts` (as `ThinkingPart`, `ToolCallPart`, `ToolResultPart`), same as in a normal chat. When `outputSchema` is set, the assistant's `TextPart` contains the raw JSON the model produced; filter `text` parts out of your message renderer and let the structured view (driven by `partial` / `final`) replace it. A sketch of the React shape follows.
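+
+A minimal sketch (the schema and endpoint are illustrative; the `useChat` / `fetchServerSentEvents` usage matches the docs updated in this PR):
+
+```tsx
+import { useChat, fetchServerSentEvents } from "@tanstack/ai-react";
+import { z } from "zod";
+
+const PersonSchema = z.object({ name: z.string(), age: z.number() });
+
+function Extractor() {
+  // `partial` is DeepPartial<InferSchemaType<typeof PersonSchema>>;
+  // `final` is InferSchemaType<typeof PersonSchema> | null.
+  const { sendMessage, partial, final } = useChat({
+    connection: fetchServerSentEvents("/api/extract"),
+    outputSchema: PersonSchema,
+  });
+
+  return <pre>{final ? JSON.stringify(final) : (partial.name ?? "…")}</pre>;
+}
+```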
+
+Reactivity primitive per framework:
+
+| Framework | `partial` type | `final` type |
+| ------------------------------ | ------------------------------------------------------- | ------------------------------------------------ |
+| React (`@tanstack/ai-react`) | `DeepPartial<T>` (plain state) | `T \| null` (plain state) |
+| Vue (`@tanstack/ai-vue`) | `Readonly<ShallowRef<DeepPartial<T>>>` | `Readonly<ShallowRef<T \| null>>` |
+| Solid (`@tanstack/ai-solid`) | `Accessor<DeepPartial<T>>` | `Accessor<T \| null>` |
+| Svelte (`@tanstack/ai-svelte`) | `readonly partial: DeepPartial<T>` (rune-backed getter) | `readonly final: T \| null` (rune-backed getter) |
+
+`DeepPartial` is exported from each framework package for callers who want to annotate handlers explicitly.
+
+## Base — `@tanstack/openai-base`
+
+- Package renamed from `@tanstack/ai-openai-compatible` (which remains published for pinned lockfiles but receives no further updates). Imports change:
+
+  ```diff
+  - import { OpenAICompatibleChatCompletionsTextAdapter } from '@tanstack/ai-openai-compatible'
+  + import { OpenAIBaseChatCompletionsTextAdapter } from '@tanstack/openai-base'
+  - import { OpenAICompatibleResponsesTextAdapter } from '@tanstack/ai-openai-compatible'
+  + import { OpenAIBaseResponsesTextAdapter } from '@tanstack/openai-base'
+  ```
+
+- Centralised `structuredOutputStream` on both bases. Chat Completions uses `response_format: { type: 'json_schema', strict: true }` + `stream: true`; Responses uses `text.format: { type: 'json_schema', strict: true }` + `stream: true`. Subclasses (`ai-openai`, `ai-grok`, `ai-groq`) inherit it; OpenRouter implements its own (see below).
+- Base now adopts the `openai` SDK directly and imports types from `openai/resources/...`. The previously-vendored ~720 LOC of wire-format types (`ChatCompletion`, `ResponseStreamEvent`, etc.) are removed; consumers that imported wire types from the package should import them from the openai SDK instead. The abstract `callChatCompletion*` / `callResponse*` hooks are gone — the base constructor now takes a pre-built `OpenAI` client (`new OpenAIBaseChatCompletionsTextAdapter(model, name, openaiClient)`) and calls `client.chat.completions.create` / `client.responses.create` itself.
+- New protected `isAbortError(error)` hook duck-types abort detection so `RUN_ERROR { code: 'aborted' }` is emitted consistently across SDK error types — subclasses with proprietary error classes (e.g. `@openrouter/sdk`'s `RequestAbortedError`) override it.
+- Per-chunk `logger.provider(...)` debug logging now fires inside `structuredOutputStream` loops, matching the existing pattern in `chatStream` for end-to-end introspection in debug mode.
+
+The other extension hooks (`extractReasoning`, `extractTextFromResponse`, `processStreamChunks`, `makeStructuredOutputCompatible`, `transformStructuredOutput`, `mapOptionsToRequest`, `convertMessage`) remain. Groq's `processStreamChunks` and `makeStructuredOutputCompatible` overrides (for `x_groq.usage` promotion and Groq's structured-output schema quirks) are unchanged.
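+
+A sketch of the subclass shape the new constructor enables — the class name, adapter name, and `baseURL` here are hypothetical:
+
+```typescript
+import OpenAI from 'openai'
+import { OpenAIBaseChatCompletionsTextAdapter } from '@tanstack/openai-base'
+
+// A provider adapter now just builds the SDK client against its own baseURL
+// and hands it to the base — no callChatCompletion* override to implement.
+class ExampleProviderTextAdapter extends OpenAIBaseChatCompletionsTextAdapter {
+  constructor(model: string, apiKey: string) {
+    super(
+      model,
+      'example-provider',
+      new OpenAI({ apiKey, baseURL: 'https://api.example-provider.com/v1' }),
+    )
+  }
+}
+```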
+
+## Provider adapters
+
+| Adapter | API | Reasoning surface |
+| ----------------------------------------------------------- | ---------------- | ------------------------------------------------------------------------------------------------------------------ |
+| `@tanstack/ai-openai` `openaiText` | Responses | `response.reasoning_text.delta` + `response.reasoning_summary_text.delta` (requires `reasoning.summary: 'auto'`) |
+| `@tanstack/ai-openai` `openaiChatCompletions` (new) | Chat Completions | none — the model still reasons, but Chat Completions has no `reasoning.summary` opt-in to surface it |
+| `@tanstack/ai-grok` `grokText` | Chat Completions | `delta.reasoning_content` (DeepSeek convention; not typed by the OpenAI SDK) |
+| `@tanstack/ai-groq` `groqText` | Chat Completions | `delta.reasoning` (requires `reasoning_format: 'parsed'`; not typed by groq-sdk) |
+| `@tanstack/ai-openrouter` `openRouterText` | Chat Completions | `delta.reasoningDetails` (camelCase) |
+| `@tanstack/ai-openrouter` `openRouterResponsesText` (beta) | Responses (beta) | `response.reasoning_text.delta` + `response.reasoning_summary_text.delta` via `normalizeStreamEvent` |
+
+All six emit the contractual `REASONING_*` lifecycle (`REASONING_START` → `REASONING_MESSAGE_START` → `REASONING_MESSAGE_CONTENT` deltas → `REASONING_MESSAGE_END` → `REASONING_END`) and close it before `TEXT_MESSAGE_START`. Accumulated reasoning is also surfaced on `structured-output.complete.value.reasoning` for consumers that only subscribe to the terminal event. The OpenRouter SDK's proprietary `RequestAbortedError` is mapped (alongside DOM `AbortError`) to `code: 'aborted'` in the two openrouter adapters.
+
+`@tanstack/ai-openai` also exports a new `OpenAIChatCompletionsTextAdapter` / `openaiChatCompletions` / `createOpenaiChatCompletions` factory — a sibling to the existing Responses adapter for callers who want the older `/v1/chat/completions` wire format against the OpenAI SDK.
+
+## Decouple `@tanstack/ai-openrouter` from the OpenAI base
+
+OpenRouter ships its own SDK (`@openrouter/sdk`) with a camelCase shape, so inheriting from the OpenAI-shaped base forced a snake_case ↔ camelCase round-trip on every request and stream event. ai-openrouter now extends `BaseTextAdapter` directly and inlines its own stream processors (`OpenRouterTextAdapter` for chat-completions, `OpenRouterResponsesTextAdapter` for the Responses beta), reading OpenRouter's camelCase types natively. The `@tanstack/openai-base` and `openai` dependencies are removed from ai-openrouter; only `@openrouter/sdk`, `@tanstack/ai`, and `@tanstack/ai-utils` remain. The ~300 LOC of inbound/outbound shape converters (`toOpenRouterRequest`, `toChatCompletion`, `adaptOpenRouterStreamChunks`, `toSnakeResponseResult`, …) are gone. Internal: duck-typed `as { ... }` casts on stream chunks in `OpenRouterResponsesTextAdapter` are replaced with direct narrowing via the SDK's discriminated unions.
+
+Public OpenRouter API is unchanged: `openRouterText`, `openRouterResponsesText`, `createOpenRouterText`, `createOpenRouterResponsesText`, the OpenRouter tool factories, the provider routing surface (`provider`, `models`, `plugins`, `variant`, `transforms`), app attribution headers (`httpReferer`, `appTitle`), `:variant` model suffixing, `RequestAbortedError` propagation, and the OpenRouter-specific structured-output null-preservation all behave the same.
+
+`ai-ollama` remains on `BaseTextAdapter` directly — its native API uses a different wire format from Chat Completions and was never on the shared base.
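+
+A sketch of what "unchanged" means at a call site (the model id is illustrative):
+
+```typescript
+import { chat } from '@tanstack/ai'
+import { openRouterText } from '@tanstack/ai-openrouter'
+
+// Exactly the call that worked before the decoupling — the adapter now reads
+// @openrouter/sdk's camelCase stream natively instead of converting shapes.
+const stream = chat({
+  adapter: openRouterText('anthropic/claude-sonnet-4.6'),
+  messages: [{ role: 'user', content: 'Hello!' }],
+})
+```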
+
+## Summarize subsystem
+
+Anthropic, Gemini, Ollama, and OpenRouter previously each shipped a bespoke 200–300 LOC summarize adapter. They now construct a `ChatStreamSummarizeAdapter` (formerly `ChatStreamWrapperAdapter`, renamed and exported from `@tanstack/ai/activities`) wrapping their own text adapter, matching the existing OpenAI/Grok pattern. Removes ~600 LOC of duplicated logic across the six providers and ensures behavioural parity.
+
+Bespoke `*SummarizeProviderOptions` interfaces (e.g. `OpenAISummarizeProviderOptions`, `AnthropicSummarizeProviderOptions`, `GeminiSummarizeProviderOptions`, `OllamaSummarizeProviderOptions`, `OpenRouterSummarizeProviderOptions`) are removed from the provider packages' public exports. Consumers who imported them should switch to inferring the type from the adapter (`InferTextProviderOptions`) or remove the explicit annotation (it'll be inferred from the adapter argument).
+
+`SummarizeAdapter` interface methods are now generic in `TProviderOptions`. `summarize` and `summarizeStream` previously took a defaulted `SummarizationOptions`, so `modelOptions` was effectively `Record<string, any>` regardless of the adapter's typed shape. They now take `SummarizationOptions<TProviderOptions>`. Source-compatible for callers that didn't specify the generic; type-tighter for implementers and downstream consumers. `SummarizationOptions`, `SummarizeAdapter`, `BaseSummarizeAdapter`, and `ChatStreamSummarizeAdapter` previously had a mixed `Record<string, any>` / `Record<string, unknown>` / `object` set of defaults for `TProviderOptions`; they now uniformly default to `Record<string, unknown>`.
diff --git a/.changeset/summarize-unify-on-chat-stream-wrapper.md b/.changeset/summarize-unify-on-chat-stream-wrapper.md
deleted file mode 100644
index 1e1607888..000000000
--- a/.changeset/summarize-unify-on-chat-stream-wrapper.md
+++ /dev/null
@@ -1,23 +0,0 @@
----
-'@tanstack/ai': patch
-'@tanstack/ai-anthropic': patch
-'@tanstack/ai-gemini': patch
-'@tanstack/ai-grok': patch
-'@tanstack/ai-ollama': patch
-'@tanstack/ai-openai': patch
-'@tanstack/ai-openrouter': patch
----
-
-Unify the summarize subsystem on a shared chat-stream wrapper, plumb `modelOptions` through end-to-end, and tighten the `TProviderOptions` generic.
-
-**Provider summarize adapters now share one implementation.** Anthropic, Gemini, Ollama, and OpenRouter previously each shipped a bespoke 200–300 LOC summarize adapter that re-implemented streaming, error handling, usage accounting, and chunk assembly on top of their text adapter. They now construct a `ChatStreamSummarizeAdapter` (formerly `ChatStreamWrapperAdapter`, renamed and exported from `@tanstack/ai/activities`) wrapping their own text adapter, matching the existing OpenAI/Grok pattern. Removes ~600 LOC of duplicated logic across the six providers and ensures behavioural parity.
-
-**`SummarizationOptions.modelOptions` now reaches the wire.** Previously the activity layer (`runSummarize` / `runStreamingSummarize`) silently dropped `modelOptions` when building the internal `SummarizationOptions` it forwarded to the adapter. Provider-specific knobs (Anthropic cache control, OpenRouter plugins, Gemini safety settings, Groq tuning params, …) now flow through correctly.
-
-**Provider summarize types resolve from the wrapped text adapter.** Each provider previously shipped a bespoke `XSummarizeProviderOptions` interface (a partial copy of its text provider options).
Those interfaces are removed; summarize provider options are now inferred from the text adapter's `~types` via the new `InferTextProviderOptions` helper exported from `@tanstack/ai/activities`. IntelliSense for `modelOptions` on `summarize({ adapter: openai('gpt-4o'), … })` now matches what `chat({ adapter: openai('gpt-4o'), … })` would show.
-
-**`SummarizeAdapter` interface methods are now generic in `TProviderOptions`.** `summarize` and `summarizeStream` previously took a defaulted `SummarizationOptions`, so `modelOptions` was effectively `Record<string, any>` regardless of the adapter's typed shape. They now take `SummarizationOptions<TProviderOptions>`, threading the class's `TProviderOptions` generic through. Source-compatible for callers that didn't specify the generic; type-tighter for implementers and downstream consumers.
-
-**Default aligned across the summarize surface.** `SummarizationOptions`, `SummarizeAdapter`, `BaseSummarizeAdapter`, and `ChatStreamSummarizeAdapter` previously had a mixed `Record<string, any>` / `Record<string, unknown>` / `object` set of defaults for `TProviderOptions`. They now uniformly default to `Record<string, unknown>` so unparameterised consumers narrow before indexed access on `modelOptions`. The `extends object` constraint is unchanged — per-model typed interfaces (e.g. `OpenAIBaseOptions & OpenAIReasoningOptions & ...`) inferred via `InferTextProviderOptions` continue to satisfy it without needing a string index signature. No public-surface signature change for callers that supply a concrete provider-options shape (every shipping adapter does).
-
-Bespoke `*SummarizeProviderOptions` interfaces (e.g. `OpenAISummarizeProviderOptions`, `AnthropicSummarizeProviderOptions`, `GeminiSummarizeProviderOptions`, `OllamaSummarizeProviderOptions`, `OpenRouterSummarizeProviderOptions`) are removed from the provider packages' public exports. Consumers who imported them should switch to inferring the type from the adapter (`InferTextProviderOptions`) or remove the explicit annotation (it'll be inferred from the adapter argument).
diff --git a/docs/adapters/openai.md b/docs/adapters/openai.md
index 122aaf520..1d042c4ac 100644
--- a/docs/adapters/openai.md
+++ b/docs/adapters/openai.md
@@ -35,6 +35,50 @@ const stream = chat({
 });
 ```
 
+## Chat Completions API
+
+`@tanstack/ai-openai` ships two text adapters that hit different OpenAI endpoints. `openaiText` (default) calls the Responses API (`/v1/responses`). `openaiChatCompletions` calls the older Chat Completions API (`/v1/chat/completions`).
+
+Pick whichever fits your wire format and feature needs:
+
+| | `openaiText` (Responses) | `openaiChatCompletions` (Chat Completions) |
+|---|---|---|
+| Endpoint | `/v1/responses` | `/v1/chat/completions` |
+| Reasoning summaries | Yes — set `modelOptions.reasoning.summary: 'auto'` to surface reasoning text via `REASONING_*` events | No — reasoning tokens are still consumed but cannot be exposed |
+| Wire-format compatibility | OpenAI-only | Matches the older de-facto industry shape (Grok, Groq, OpenRouter, many local model servers) |
+| Structured output streaming | `text.format: { type: 'json_schema', strict: true }` + `stream: true` | `response_format: { type: 'json_schema', strict: true }` + `stream: true` |
+
+Use `openaiText` when you want reasoning-summary streaming or OpenAI-specific Responses features. Use `openaiChatCompletions` when you're migrating off a Chat-Completions-style provider, want to share request-building code with other Chat-Completions adapters in your stack, or want the more battle-tested wire format.
+
+```typescript
+import { chat } from "@tanstack/ai";
+import { openaiChatCompletions } from "@tanstack/ai-openai";
+
+const stream = chat({
+  adapter: openaiChatCompletions("gpt-5.2"),
+  messages: [{ role: "user", content: "Hello!" }],
+});
+```
+
+With an explicit API key:
+
+```typescript
+import { chat } from "@tanstack/ai";
+import { createOpenaiChatCompletions } from "@tanstack/ai-openai";
+
+const adapter = createOpenaiChatCompletions("gpt-5.2", {
+  apiKey: process.env.OPENAI_API_KEY!,
+  // organization, baseURL, headers — all optional
+});
+
+const stream = chat({
+  adapter,
+  messages: [{ role: "user", content: "Hello!" }],
+});
+```
+
+Both adapters work identically with [Structured Outputs](../chat/structured-outputs) — including `stream: true` — and accept the same `modelOptions` (temperature, top_p, max_tokens, stop, …). The reasoning section below applies to `openaiText`; `openaiChatCompletions` accepts `modelOptions.reasoning.effort` but cannot stream summary text.
+
 ## Basic Usage - Custom API Key
 
 ```typescript
@@ -289,6 +333,26 @@ Creates an OpenAI chat adapter with an explicit API key.
 
 **Returns:** An OpenAI chat adapter instance.
 
+### `openaiChatCompletions(model)`
+
+Creates an OpenAI chat adapter that targets `/v1/chat/completions` instead of the Responses API. See [Chat Completions API](#chat-completions-api) for when to use this over `openaiText`.
+
+**Returns:** An OpenAI chat adapter instance using the Chat Completions wire format.
+
+### `createOpenaiChatCompletions(model, config)`
+
+Creates an OpenAI chat-completions adapter with an explicit API key.
+
+**Parameters:**
+
+- `model` - OpenAI model id (e.g. `"gpt-5.2"`, `"gpt-4o-mini"`)
+- `config.apiKey` - Your OpenAI API key
+- `config.organization?` - Organization ID (optional)
+- `config.baseURL?` - Custom base URL (optional)
+- `config.headers?` - Additional headers (optional)
+
+**Returns:** An OpenAI chat adapter instance using the Chat Completions wire format.
+
 ### `openaiSummarize(config?)`
 
 Creates an OpenAI summarization adapter using environment variables.
diff --git a/docs/chat/structured-outputs.md b/docs/chat/structured-outputs.md
index 6bcd9c7a7..134a58c24 100644
--- a/docs/chat/structured-outputs.md
+++ b/docs/chat/structured-outputs.md
@@ -83,8 +83,9 @@ The return type of `chat()` changes based on the `outputSchema` prop:
 
 | Configuration | Return Type |
 |--------------|-------------|
-| No `outputSchema` | `AsyncIterable` |
+| No `outputSchema` | `AsyncIterable<StreamChunk>` |
 | With `outputSchema` | `Promise<InferSchemaType<TSchema>>` |
+| With `outputSchema` and `stream: true` | `StructuredOutputStream<InferSchemaType<TSchema>>` |
 
 When you provide an `outputSchema`, TanStack AI automatically infers the TypeScript type from your schema:
 
@@ -181,6 +182,186 @@ console.log(company.headquarters.city);
 console.log(company.employees[0].role);
 ```
 
+## Streaming Structured Output
+
+Pass `stream: true` alongside `outputSchema` to receive incremental JSON deltas while the model is generating, plus a final validated, typed object. This is the path to take when you want a progressive UI — a streaming form, a typewriter-style preview, partial cards filling in field by field — instead of a single blocking await.
+
+You build it in two halves: a server route that runs `chat({ outputSchema, stream: true })` and pipes the result as Server-Sent Events, and a client that wires `useChat` to that endpoint and updates state as chunks arrive.
It's the same flow as regular streaming chat (see [Streaming](./streaming)) — `outputSchema + stream: true` just adds one terminal event with the validated object.
+
+### Server endpoint
+
+```typescript
+// app/api/extract-person/route.ts (or your framework's equivalent)
+import { chat, toServerSentEventsResponse } from "@tanstack/ai";
+import { openaiText } from "@tanstack/ai-openai";
+import { z } from "zod";
+
+const PersonSchema = z.object({
+  name: z.string().meta({ description: "The person's full name" }),
+  age: z.number().meta({ description: "The person's age in years" }),
+  email: z.string().email(),
+});
+
+export async function POST(request: Request) {
+  const { messages } = await request.json();
+
+  const stream = chat({
+    adapter: openaiText("gpt-5.2"),
+    messages,
+    outputSchema: PersonSchema,
+    stream: true,
+  });
+
+  return toServerSentEventsResponse(stream);
+}
+```
+
+That's the entire server side. `chat({ outputSchema, stream: true })` returns a `StructuredOutputStream<InferSchemaType<typeof PersonSchema>>` — the same kind of `AsyncIterable` that `toServerSentEventsResponse` accepts for any streaming chat endpoint. The schema travels in the request as JSON Schema, validation runs server-side after the stream completes, and the validated object is emitted as the terminal `structured-output.complete` event.
+
+### Client with `useChat`
+
+Pass the same schema to `useChat` and the hook tracks the progressive object and the validated terminal object for you — `partial` updates as JSON streams in, `final` snaps when `structured-output.complete` arrives. No external state, no `onChunk` ceremony, no `parsePartialJSON` calls:
+
+```tsx
+import { useChat, fetchServerSentEvents } from "@tanstack/ai-react";
+import { z } from "zod";
+
+const PersonSchema = z.object({
+  name: z.string(),
+  age: z.number(),
+  email: z.string().email(),
+});
+
+function PersonExtractor() {
+  const { sendMessage, isLoading, partial, final } = useChat({
+    connection: fetchServerSentEvents("/api/extract-person"),
+    outputSchema: PersonSchema,
+  });
+
+  return (
+    <form
+      onSubmit={(e) => {
+        e.preventDefault();
+        sendMessage("Extract: John Doe, 30, john@example.com");
+      }}
+    >
+      <button type="submit" disabled={isLoading}>Extract</button>
+
+      {/* `partial` fills in field by field as JSON streams in. */}
+      <div>
+        Name: {partial.name ?? "…"}
+      </div>
+      <div>
+        Age: {partial.age ?? "…"}
+      </div>
+      <div>
+        Email: {partial.email ?? "…"}
+      </div>
+      {final && <pre>Validated: {JSON.stringify(final, null, 2)}</pre>}
+    </form>
+  );
+}
+```
+
+What the hook does for you:
+
+- **`partial`** is `DeepPartial<z.infer<typeof PersonSchema>>` — every property optional, every nested array element optional. Updated from `TEXT_MESSAGE_CONTENT` deltas via `parsePartialJSON`. Resets on every new `sendMessage` / `reload`.
+- **`final`** is `z.infer<typeof PersonSchema> | null` — the validated terminal payload from the `structured-output.complete` event. `null` until the run completes successfully.
+- **`outputSchema`** is used purely for client-side **type inference**. Validation still runs on the server against the schema you pass to `chat({ outputSchema })` on the server route.
+- This same hook shape works for **non-streaming structured output too**. If your server returns a single `structured-output.complete` event (the fallback path for adapters that don't natively stream), `partial` stays `{}` and `final` populates when the event arrives — same consumer code.
+
+The `outputSchema` field is optional: if you omit it, `useChat`'s return type is unchanged, and `partial` / `final` aren't present.
+
+### Rendering reasoning and tool calls
+
+Reasoning tokens and tool calls aren't on `partial` / `final` — they're already where they'd be in a normal chat: on `messages[…].parts`. The stream processor inside `useChat` routes each chunk type to its canonical part:
+
+| Chunk type | Where it lands |
+|---|---|
+| `REASONING_MESSAGE_CONTENT` | `ThinkingPart` on the assistant message |
+| `TOOL_CALL_START` / `_ARGS` / `_END` | `ToolCallPart` on the assistant message |
+| `TOOL_CALL_RESULT` | `ToolResultPart` on the tool message |
+| `TEXT_MESSAGE_CONTENT` | `TextPart` on the assistant message (this is the raw JSON when `outputSchema` is set — see below) |
+
+So render reasoning and tool calls the same way you'd render them in a normal chat UI (`ThinkingBlock`, `ToolCallBlock`, and `StructuredView` below stand in for your own components):
+
+```tsx
+const last = messages.at(-1);
+
+return (
+  <>
+    {last?.parts.map((part, i) => {
+      if (part.type === "thinking") return <ThinkingBlock key={i} part={part} />;
+      if (part.type === "tool-call") return <ToolCallBlock key={i} part={part} />;
+      // Hide raw JSON text — the structured view below replaces it.
+      if (part.type === "text") return null;
+      return null;
+    })}
+    <StructuredView partial={partial} final={final} />
+  </>
+);
+```
+
+> **Note:** When `outputSchema` is set, the assistant's `TextPart` contains the raw JSON the model produced (e.g. `{"name":"John","age":30,…}`). That's not meant to be shown to end users — the structured view powered by `partial` / `final` replaces it. Filter `text` parts out of your message renderer in this mode, as in the snippet above.
+
+> **Going lower-level?** `useChat` still exposes `onChunk` if you want to observe individual chunks alongside the managed `partial` / `final` state (e.g. to drive a custom progress UI). The two paths compose — internal partial/final tracking always runs first, then your `onChunk` callback fires with the same chunk.
+
+`useChat` (React, Vue, Solid) and `createChat` (Svelte) all accept the same `outputSchema` option and expose `partial` / `final` with the same semantics — only the reactivity primitive differs (React state, Vue `shallowRef`, Solid `Accessor`, Svelte reactive getter). See your framework's quick-start for the local idioms.
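+
+For instance, a sketch of the Solid shape — assuming `useChat` and `fetchServerSentEvents` are exported from `@tanstack/ai-solid` the same way as in React; the schema and endpoint are illustrative:
+
+```tsx
+import { useChat, fetchServerSentEvents } from "@tanstack/ai-solid";
+import { z } from "zod";
+
+const PersonSchema = z.object({ name: z.string(), age: z.number() });
+
+function Extractor() {
+  const { partial, final } = useChat({
+    connection: fetchServerSentEvents("/api/extract-person"),
+    outputSchema: PersonSchema,
+  });
+
+  // Solid: `partial` / `final` are Accessors — call them to read.
+  return <pre>{final() ? JSON.stringify(final()) : (partial().name ?? "…")}</pre>;
+}
+```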
+
+### What the stream contains
+
+`chat({ outputSchema, stream: true })` returns a `StructuredOutputStream` — an `AsyncIterable` over the standard `StreamChunk` lifecycle plus a terminal `CUSTOM` event named `structured-output.complete`:
+
+```typescript
+{
+  type: "CUSTOM",
+  name: "structured-output.complete",
+  value: {
+    object: T;          // validated, parsed, typed
+    raw: string;        // full accumulated JSON text
+    reasoning?: string; // present only for thinking/reasoning models
+  },
+  // ...standard event fields (timestamp, model, …)
+}
+```
+
+### Adapter coverage
+
+Streaming structured output works with **every adapter**, but only some support a true single-request streaming wire format:
+
+| Adapter | Behavior with `outputSchema` + `stream: true` |
+|---------|-----------------------------------------------|
+| `@tanstack/ai-openai` | Native single-request stream (Responses API, `text.format: json_schema`) |
+| `@tanstack/ai-openrouter` | Native single-request stream (`response_format: json_schema`) |
+| `@tanstack/ai-grok` | Native single-request stream (Chat Completions, `response_format: json_schema`) |
+| `@tanstack/ai-groq` | Native single-request stream (Chat Completions, `response_format: json_schema`) |
+| Other adapters (anthropic, gemini, ollama, …) | Fallback: runs non-streaming `structuredOutput` and emits the final object as one `structured-output.complete` event |
+
+The fallback path keeps the consumer code identical across providers — you always read the final object off `structured-output.complete` — but you won't see incremental deltas unless the adapter implements `structuredOutputStream` natively.
+
+### Advanced: iterating the stream directly
+
+When you don't need the SSE-over-HTTP boundary — Node scripts, CLIs, server endpoints that respond with a final JSON object instead of a stream, or tests — you can consume `chat({ outputSchema, stream: true })` as a plain async iterable:
+
+```typescript
+import { chat } from "@tanstack/ai";
+import { openaiText } from "@tanstack/ai-openai";
+import { z } from "zod";
+
+const PersonSchema = z.object({ name: z.string(), age: z.number(), email: z.string().email() });
+
+const stream = chat({
+  adapter: openaiText("gpt-5.2"),
+  messages: [{ role: "user", content: "Extract: John Doe is 30, john@example.com" }],
+  outputSchema: PersonSchema,
+  stream: true,
+});
+
+for await (const chunk of stream) {
+  if (chunk.type === "CUSTOM" && chunk.name === "structured-output.complete") {
+    // Validated and typed against PersonSchema.
+    console.log(chunk.value.object.name);
+    console.log(chunk.value.object.age);
+  }
+}
+```
+
+This is the same `StructuredOutputStream` the server endpoint above hands to `toServerSentEventsResponse`. Pick this shape when you're a single process end-to-end; use the server-endpoint-plus-`useChat` shape when there's a network in the middle.
+
 ## Combining with Tools
 
 Structured outputs work seamlessly with the agentic tool loop. When both `outputSchema` and `tools` are provided, TanStack AI will:
@@ -228,6 +409,58 @@ console.log(recommendation.currentPrice);
 console.log(recommendation.reason);
 ```
 
+### Streaming with tools that may pause
+
+When you combine `tools` + `outputSchema` + `stream: true`, the agent loop runs first — its events stream through, and only after all tools complete does the structured output stream emit `structured-output.complete`. Two situations can interrupt that flow before the terminal event arrives:
+
+1. **A server tool with `needsApproval: true` is queued.** The agent loop pauses and the queued tool-call lands on the assistant message as a `ToolCallPart` with `state === "approval-requested"`. You respond by calling `addToolApprovalResponse({ id, approved })` from the hook return — same flow as in a normal chat. See [Tool Approval Flow](../tools/tool-approval) for the full pattern.
+2. **A client tool is invoked.** If you registered the tool with an `execute` function, the client runs it automatically and posts the result back — no extra code on your side. If you want to handle it manually, listen for `onToolCall` and respond with `addToolResult({ toolCallId, tool, output, state })`. See [Client Tools](../tools/client-tools) for details.
+
+There's nothing structured-output-specific in either flow — both reuse the standard chat pause/resume APIs. The structured stream layers on top: once tools complete (or the user approves), the agent loop finishes, the structured-output stream takes over, `partial` fills in, and `final` snaps when `structured-output.complete` arrives. For example, an approval-gated tool inside a structured-output run looks like this (`ApprovalPrompt`, `ThinkingBlock`, `ToolCallBlock`, and `StructuredView` stand in for your own components):
+
+```tsx
+const { messages, sendMessage, partial, final, addToolApprovalResponse } = useChat({
+  connection: fetchServerSentEvents("/api/recommend"),
+  outputSchema: RecommendationSchema,
+  tools: [sendEmail], // server tool with needsApproval: true
+});
+
+const last = messages.at(-1);
+
+return (
+  <>
+    {last?.parts.map((part, i) => {
+      // Surface approval prompts inline, the same way Tool Approval Flow shows it.
+      if (
+        part.type === "tool-call" &&
+        part.state === "approval-requested" &&
+        part.approval
+      ) {
+        return (
+          <ApprovalPrompt
+            key={i}
+            onApprove={() =>
+              addToolApprovalResponse({ id: part.approval!.id, approved: true })
+            }
+            onDeny={() =>
+              addToolApprovalResponse({ id: part.approval!.id, approved: false })
+            }
+          />
+        );
+      }
+      if (part.type === "thinking") return <ThinkingBlock key={i} part={part} />;
+      if (part.type === "tool-call") return <ToolCallBlock key={i} part={part} />;
+      return null; // hide TextPart (raw JSON when outputSchema is set)
+    })}
+    <StructuredView partial={partial} final={final} />
+  </>
+);
+```
+
+While the approval is pending, `partial` stays at its last value and `final` stays `null`. As soon as the user approves (or denies and the loop resumes), the agent loop continues, the structured stream runs, and `partial` / `final` populate.
+
 ## Using Plain JSON Schema
 
 If you prefer not to use a schema library, you can pass a plain JSON Schema object:
diff --git a/examples/ts-react-chat/src/components/Header.tsx b/examples/ts-react-chat/src/components/Header.tsx
index 4cd9fc4d8..7dda9649a 100644
--- a/examples/ts-react-chat/src/components/Header.tsx
+++ b/examples/ts-react-chat/src/components/Header.tsx
@@ -163,7 +163,7 @@ export default function Header() {
         }}
       >
-        Structured Output (OpenRouter)
+        Structured Output
diff --git a/examples/ts-react-chat/src/lib/server-fns.ts b/examples/ts-react-chat/src/lib/server-fns.ts
index c64168d23..51100e9b5 100644
--- a/examples/ts-react-chat/src/lib/server-fns.ts
+++ b/examples/ts-react-chat/src/lib/server-fns.ts
@@ -191,11 +191,12 @@ export const summarizeFn = createServerFn({ method: 'POST' })
       text: z.string(),
       maxLength: z.number().optional(),
       style: z.enum(['bullet-points', 'paragraph', 'concise']).optional(),
+      model: z.string().optional(),
     }),
   )
   .handler(async ({ data }) => {
     return summarize({
-      adapter: openaiSummarize('gpt-4o-mini'),
+      adapter: openaiSummarize((data.model ?? 'gpt-4o-mini') as 'gpt-4o-mini'),
       text: data.text,
       maxLength: data.maxLength,
       style: data.style,
@@ -338,12 +339,15 @@ export const summarizeStreamFn = createServerFn({ method: 'POST' })
       text: z.string(),
       maxLength: z.number().optional(),
       style: z.enum(['bullet-points', 'paragraph', 'concise']).optional(),
+      model: z.string().optional(),
     }),
   )
   .handler(({ data }) => {
     return toServerSentEventsResponse(
       summarize({
-        adapter: openaiSummarize('gpt-4o-mini'),
+        adapter: openaiSummarize(
+          (data.model ?? 'gpt-4o-mini') as 'gpt-4o-mini',
+        ),
         text: data.text,
         maxLength: data.maxLength,
         style: data.style,
diff --git a/examples/ts-react-chat/src/routes/api.structured-output.ts b/examples/ts-react-chat/src/routes/api.structured-output.ts
index aa1d045f2..73d5325c0 100644
--- a/examples/ts-react-chat/src/routes/api.structured-output.ts
+++ b/examples/ts-react-chat/src/routes/api.structured-output.ts
@@ -1,7 +1,14 @@
 import { createFileRoute } from '@tanstack/react-router'
-import { chat } from '@tanstack/ai'
-import { openRouterText } from '@tanstack/ai-openrouter'
+import { chat, toServerSentEventsResponse } from '@tanstack/ai'
+import { openaiChatCompletions, openaiText } from '@tanstack/ai-openai'
+import { grokText } from '@tanstack/ai-grok'
+import { groqText } from '@tanstack/ai-groq'
+import {
+  openRouterResponsesText,
+  openRouterText,
+} from '@tanstack/ai-openrouter'
 import { z } from 'zod'
+import type { AnyTextAdapter, StreamChunk } from '@tanstack/ai'
 
 const GuitarRecommendationSchema = z.object({
   title: z.string().describe('Short headline for the recommendation'),
@@ -21,23 +28,161 @@ const GuitarRecommendationSchema = z.object({
   nextSteps: z.array(z.string()).describe('Practical follow-up actions'),
 })
 
+type Provider =
+  | 'openai'
+  | 'openai-chat'
+  | 'grok'
+  | 'groq'
+  | 'openrouter'
+  | 'openrouter-responses'
+
+const StructuredOutputRequestSchema = z.object({
+  prompt: z.string().min(1),
+  provider: z
+    .enum([
+      'openai',
+      'openai-chat',
+      'grok',
+      'groq',
+      'openrouter',
+      'openrouter-responses',
+    ])
+    .optional(),
+  model: z.string().optional(),
+  stream: z.boolean().optional(),
+})
+
+function adapterFor(provider: Provider, model?: string): AnyTextAdapter {
+  switch (provider) {
+    case 'openai':
+      return openaiText((model || 'gpt-5.2') as 'gpt-5.2')
+    case 'openai-chat':
+      // Same model surface as the Responses adapter, but talks to
+      // `/v1/chat/completions`. Useful for side-by-side comparison of
+      // streaming structured output across the two OpenAI wire formats.
+      return openaiChatCompletions((model || 'gpt-4o') as 'gpt-4o')
+    case 'grok':
+      return grokText(
+        (model || 'grok-4-1-fast-reasoning') as 'grok-4-1-fast-reasoning',
+      )
+    case 'groq':
+      return groqText(
+        (model ||
+          'meta-llama/llama-4-maverick-17b-128e-instruct') as 'meta-llama/llama-4-maverick-17b-128e-instruct',
+      )
+    case 'openrouter':
+      return openRouterText(
+        (model || 'anthropic/claude-opus-4.6') as 'anthropic/claude-opus-4.6',
+      )
+    case 'openrouter-responses':
+      // OpenRouter Responses (beta) endpoint — same model surface as the
+      // chat-completions adapter, but routes through `/v1/responses`. This
+      // is what exercises `OpenRouterResponsesTextAdapter.structuredOutputStream`.
+      return openRouterResponsesText(
+        (model || 'anthropic/claude-opus-4.6') as 'anthropic/claude-opus-4.6',
+      )
+  }
+}
+
+// Per-provider modelOptions to opt into reasoning surfacing. Without these,
+// reasoning models reason silently and the UI never sees REASONING_* events.
+function reasoningOptionsFor(
+  provider: Provider,
+  model: string | undefined,
+): Record<string, unknown> | undefined {
+  switch (provider) {
+    case 'openai':
+      // Responses API: `reasoning.summary: 'auto'` is what makes the API emit
+      // `response.reasoning_summary_text.delta` events. Only valid on
+      // reasoning models (gpt-5.x, o-series); older models (gpt-4o) reject it.
+      if (
+        model?.startsWith('gpt-5') ||
+        model?.startsWith('o3') ||
+        model?.startsWith('o4')
+      ) {
+        return { reasoning: { summary: 'auto' } }
+      }
+      return undefined
+    case 'openai-chat':
+      // Chat Completions API doesn't surface reasoning summaries the way
+      // Responses does. Reasoning models still reason silently; no opt-in
+      // option to inject here.
+      return undefined
+    case 'groq':
+      // Groq's Chat Completions only streams `delta.reasoning` when
+      // `reasoning_format: 'parsed'`. Required for gpt-oss / qwen3 / kimi-k2
+      // to emit reasoning during structured output (json_schema mode).
+      if (
+        model?.startsWith('openai/gpt-oss') ||
+        model?.startsWith('qwen') ||
+        model?.startsWith('moonshotai/kimi')
+      ) {
+        return { reasoning_format: 'parsed' }
+      }
+      return undefined
+    case 'openrouter':
+    case 'openrouter-responses':
+      // OpenRouter normalises across providers. `reasoning.effort` triggers
+      // the upstream model's reasoning + surfaces the deltas. Same option on
+      // both the chat-completions and Responses-beta endpoints.
+      return { reasoning: { effort: 'medium' } }
+    case 'grok':
+      // xAI surfaces `delta.reasoning_content` automatically on reasoning
+      // models (grok-3-mini, grok-4-fast-reasoning, grok-4-1-fast-reasoning).
+      // No request param needed.
+      return undefined
+  }
+}
+
 export const Route = createFileRoute('/api/structured-output')({
   server: {
     handlers: {
       POST: async ({ request }) => {
-        const body = await request.json()
-        const { prompt, model } = body as {
-          prompt: string
-          model?: string
-        }
-
         try {
+          const parsed = StructuredOutputRequestSchema.safeParse(
+            await request.json(),
+          )
+          if (!parsed.success) {
+            return new Response(
+              JSON.stringify({ error: 'Invalid request body' }),
+              {
+                status: 400,
+                headers: { 'Content-Type': 'application/json' },
+              },
+            )
+          }
+          const { prompt, provider, model, stream } = parsed.data
+          const resolvedProvider: Provider = provider || 'openrouter'
+          const modelOptions = reasoningOptionsFor(resolvedProvider, model)
+
+          if (stream) {
+            const abortController = new AbortController()
+            request.signal.addEventListener('abort', () =>
+              abortController.abort(),
+            )
+            const streamIterable = chat({
+              adapter: adapterFor(resolvedProvider, model),
+              modelOptions: modelOptions as never,
+              messages: [{ role: 'user', content: prompt }],
+              outputSchema: GuitarRecommendationSchema,
+              stream: true,
+              abortController,
+            }) as AsyncIterable<StreamChunk>
+            return toServerSentEventsResponse(streamIterable, {
+              abortController,
+            })
+          }
+
+          const abortController = new AbortController()
+          request.signal.addEventListener('abort', () =>
+            abortController.abort(),
+          )
           const result = await chat({
-            adapter: openRouterText(
-              (model || 'openai/gpt-5.2') as 'openai/gpt-5.2',
-            ),
+            adapter: adapterFor(resolvedProvider, model),
+            modelOptions: modelOptions as never,
             messages: [{ role: 'user', content: prompt }],
             outputSchema: GuitarRecommendationSchema,
+            abortController,
           })
 
           return new Response(JSON.stringify({ data: result }), {
diff --git a/examples/ts-react-chat/src/routes/generations.structured-output.tsx b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
index 9b123308f..4049c2a7e 100644
--- a/examples/ts-react-chat/src/routes/generations.structured-output.tsx
+++ b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
@@ -1,98 +1,389 @@
-import { useState } from 'react'
+import { useRef, useState } from 'react'
 import { createFileRoute } from '@tanstack/react-router'
+import { parsePartialJSON } from '@tanstack/ai'
 
 const SAMPLE_PROMPT =
   'I play indie rock and have a $1500 budget. Recommend two electric guitars and one acoustic to round out my rig.'
-const OPENROUTER_MODELS = [
-  { value: 'openai/gpt-5.2', label: 'OpenAI GPT-5.2' },
-  { value: 'openai/gpt-5.2-pro', label: 'OpenAI GPT-5.2 Pro' },
-  { value: 'openai/gpt-5.1', label: 'OpenAI GPT-5.1' },
-  { value: 'anthropic/claude-opus-4.7', label: 'Claude Opus 4.7' },
-  { value: 'anthropic/claude-sonnet-4.6', label: 'Claude Sonnet 4.6' },
-  { value: 'google/gemini-3.1-pro-preview', label: 'Gemini 3.1 Pro (Preview)' },
-  { value: 'x-ai/grok-4.1-fast', label: 'Grok 4.1 Fast' },
-] as const
-
-interface RecommendationResult {
-  title: string
-  summary: string
-  recommendations: Array<{
-    name: string
-    brand: string
-    type: 'acoustic' | 'electric' | 'bass' | 'classical'
-    priceRangeUsd: { min: number; max: number }
-    reason: string
-  }>
-  nextSteps: Array<string>
-}
+type Provider =
+  | 'openai'
+  | 'openai-chat'
+  | 'grok'
+  | 'groq'
+  | 'openrouter'
+  | 'openrouter-responses'
+
+const PROVIDER_MODELS: Record<
+  Provider,
+  Array<{ value: string; label: string }>
+> = {
+  openai: [
+    { value: 'gpt-5.2', label: 'GPT-5.2 (frontier)' },
+    { value: 'gpt-5.2-pro', label: 'GPT-5.2 Pro' },
+    { value: 'gpt-5.1', label: 'GPT-5.1' },
+    { value: 'gpt-5', label: 'GPT-5' },
+    { value: 'gpt-5-mini', label: 'GPT-5 Mini' },
+    { value: 'gpt-4o', label: 'GPT-4o' },
+  ],
+  // OpenAI Chat Completions: same model surface, older `/v1/chat/completions`
+  // wire format. The reasoning-summary opt-in isn't available here, so
+  // streaming reasoning won't be surfaced for gpt-5.x even though the model
+  // is still doing it under the hood.
+  'openai-chat': [
+    { value: 'gpt-4o', label: 'GPT-4o' },
+    { value: 'gpt-5-mini', label: 'GPT-5 Mini' },
+    { value: 'gpt-5', label: 'GPT-5' },
+    { value: 'gpt-5.1', label: 'GPT-5.1' },
+    { value: 'gpt-5.2', label: 'GPT-5.2 (frontier)' },
+  ],
+  grok: [
+    { value: 'grok-4-1-fast-reasoning', label: 'Grok 4.1 Fast (reasoning)' },
+    {
+      value: 'grok-4-1-fast-non-reasoning',
+      label: 'Grok 4.1 Fast (non-reasoning)',
+    },
+    { value: 'grok-4', label: 'Grok 4' },
+    { value: 'grok-3', label: 'Grok 3' },
+  ],
+  groq: [
+    {
+      value: 'meta-llama/llama-4-maverick-17b-128e-instruct',
+      label: 'Llama 4 Maverick 17B',
+    },
+    {
+      value: 'meta-llama/llama-4-scout-17b-16e-instruct',
+      label: 'Llama 4 Scout 17B',
+    },
+    {
+      value: 'moonshotai/kimi-k2-instruct-0905',
+      label: 'Kimi K2 Instruct',
+    },
+    { value: 'llama-3.3-70b-versatile', label: 'Llama 3.3 70B Versatile' },
+    { value: 'openai/gpt-oss-120b', label: 'GPT-OSS 120B' },
+  ],
+  openrouter: [
+    { value: 'anthropic/claude-opus-4.6', label: 'Claude Opus 4.6' },
+    { value: 'anthropic/claude-sonnet-4.6', label: 'Claude Sonnet 4.6' },
+    { value: 'openai/gpt-5.2', label: 'GPT-5.2 (via OpenRouter)' },
+    { value: 'x-ai/grok-4.1-fast', label: 'Grok 4.1 Fast (via OpenRouter)' },
+  ],
+  // OpenRouter Responses (beta) endpoint — same upstream models, but the
+  // request/response uses the Responses API wire format. Useful to compare
+  // streaming behaviour against the chat-completions adapter above.
+  'openrouter-responses': [
+    { value: 'anthropic/claude-opus-4.6', label: 'Claude Opus 4.6' },
+    { value: 'anthropic/claude-sonnet-4.6', label: 'Claude Sonnet 4.6' },
+    { value: 'openai/gpt-5.2', label: 'GPT-5.2 (via OpenRouter)' },
+    { value: 'x-ai/grok-4.1-fast', label: 'Grok 4.1 Fast (via OpenRouter)' },
+  ],
+}
+
+interface PartialRecommendation {
+  name?: string
+  brand?: string
+  type?: 'acoustic' | 'electric' | 'bass' | 'classical' | string
+  priceRangeUsd?: { min?: number; max?: number }
+  reason?: string
+}
+
+interface PartialResult {
+  title?: string
+  summary?: string
+  recommendations?: Array<PartialRecommendation>
+  nextSteps?: Array<string>
+}
+
+interface StreamChunkPayload {
+  type: string
+  delta?: string
+  content?: string
+  name?: string
+  value?: { object?: unknown; raw?: string; reasoning?: string }
+  message?: string
+}
+
+// Pick the last meaningful sentence/line out of an accumulating reasoning
+// stream so the UI can render a single rolling line of "what it's thinking
+// right now" rather than a growing wall of text.
+function latestThought(reasoning: string): string {
+  const trimmed = reasoning.trimEnd()
+  if (!trimmed) return ''
+  // Prefer the last sentence; fall back to the last newline-delimited line.
+  const sentenceMatch = trimmed.match(/[^.!?\n]+[.!?]?\s*$/)
+  const candidate = sentenceMatch ? sentenceMatch[0] : trimmed
+  const last = candidate.split('\n').filter(Boolean).pop() ?? candidate
+  return last.trim()
+}
 
 function StructuredOutputPage() {
+  const providerId = 'structured-output-provider'
+  const modelId = 'structured-output-model'
+  const promptId = 'structured-output-prompt'
   const [prompt, setPrompt] = useState(SAMPLE_PROMPT)
-  const [model, setModel] = useState(OPENROUTER_MODELS[0].value)
-  const [result, setResult] = useState<RecommendationResult | null>(null)
+  const [provider, setProvider] = useState<Provider>('openai')
+  const [model, setModel] = useState(PROVIDER_MODELS.openai[0].value)
+  const [stream, setStream] = useState(true)
+  const [result, setResult] = useState<PartialResult | null>(null)
+  const [rawJson, setRawJson] = useState('')
+  const [deltaCount, setDeltaCount] = useState(0)
+  const [isStreaming, setIsStreaming] = useState(false)
+  const [hasFinalResult, setHasFinalResult] = useState(false)
+  const [reasoningLine, setReasoningLine] = useState('')
+  const [reasoningFull, setReasoningFull] = useState('')
   const [error, setError] = useState<string | null>(null)
   const [isLoading, setIsLoading] = useState(false)
+  const abortRef = useRef<AbortController | null>(null)
+
+  const onProviderChange = (next: Provider) => {
+    setProvider(next)
+    setModel(PROVIDER_MODELS[next][0].value)
+  }
+
+  const reset = () => {
+    setResult(null)
+    setRawJson('')
+    setDeltaCount(0)
+    setHasFinalResult(false)
+    setReasoningLine('')
+    setReasoningFull('')
+    setError(null)
+  }
 
   const handleGenerate = async () => {
     if (!prompt.trim()) return
     setIsLoading(true)
-    setError(null)
-    setResult(null)
+    reset()
+    setIsStreaming(stream)
+
+    const controller = new AbortController()
+    abortRef.current = controller
 
     try {
      const response = await fetch('/api/structured-output', {
        method: 'POST',
        headers: { 'Content-Type': 'application/json' },
-        body: JSON.stringify({ prompt: prompt.trim(), model }),
+        body: JSON.stringify({
+          prompt: prompt.trim(),
+          provider,
+          model,
+          stream,
+        }),
+        signal: controller.signal,
      })
 
-      const payload = await response.json()
      if (!response.ok) {
-        throw new Error(payload.error || 'Request failed')
+        const errPayload = await response.json().catch(() => ({}))
+        throw new Error(
+          errPayload.error || `Request failed (${response.status})`,
+        )
+      }
+
+      if (!stream) {
+        const payload = await response.json()
+        setResult(payload.data as PartialResult)
+        setHasFinalResult(true)
+        return
+      }
+
+      // Streaming path — parse SSE, accumulate raw JSON, render the partially
+      // parsed object live, snap to the validated terminal payload.
+      const reader = response.body!.getReader()
+      const decoder = new TextDecoder()
+      let buffer = ''
+      let accumulated = ''
+      let reasoning = ''
+      let deltas = 0
+      let sawComplete = false
+
+      const processBuffer = () => {
+        let sepIdx = buffer.indexOf('\n\n')
+        while (sepIdx !== -1) {
+          const frame = buffer.slice(0, sepIdx)
+          buffer = buffer.slice(sepIdx + 2)
+          sepIdx = buffer.indexOf('\n\n')
+
+          for (const line of frame.split('\n')) {
+            if (!line.startsWith('data: ')) continue
+            const json = line.slice(6).trim()
+            if (!json) continue
+            let chunk: StreamChunkPayload
+            try {
+              chunk = JSON.parse(json) as StreamChunkPayload
+            } catch {
+              continue
+            }
+
+            if (chunk.type === 'TEXT_MESSAGE_CONTENT' && chunk.delta) {
+              accumulated += chunk.delta
+              deltas += 1
+              setRawJson(accumulated)
+              setDeltaCount(deltas)
+              // partial-json tolerates incomplete JSON — it returns whatever
+              // structure can be inferred. Render it directly so the UI fills
+              // in field by field as the model produces them.
+              const partial = parsePartialJSON(accumulated) as
+                | PartialResult
+                | undefined
+              if (partial && typeof partial === 'object') {
+                setResult(partial)
+              }
+            } else if (
+              chunk.type === 'REASONING_MESSAGE_CONTENT' &&
+              chunk.delta
+            ) {
+              reasoning += chunk.delta
+              setReasoningFull(reasoning)
+              // One-liner: take the last non-empty line/sentence so consumers
+              // see "what it's thinking right now" without a wall of text.
+              setReasoningLine(latestThought(reasoning))
+            } else if (
+              chunk.type === 'CUSTOM' &&
+              chunk.name === 'structured-output.complete' &&
+              chunk.value?.object
+            ) {
+              sawComplete = true
+              setResult(chunk.value.object as PartialResult)
+              setHasFinalResult(true)
+              if (
+                typeof (chunk.value as { reasoning?: string }).reasoning ===
+                'string'
+              ) {
+                const finalReasoning = (chunk.value as { reasoning: string })
+                  .reasoning
+                setReasoningFull(finalReasoning)
+                setReasoningLine(latestThought(finalReasoning))
+              }
+            } else if (chunk.type === 'RUN_ERROR') {
+              throw new Error(chunk.message || 'Stream failed')
+            }
+          }
+        }
+      }
+
+      while (true) {
+        const { done, value } = await reader.read()
+        if (done) break
+        buffer += decoder.decode(value, { stream: true })
+        processBuffer()
+      }
+
+      // Flush any buffered bytes from incomplete multi-byte UTF-8 sequences
+      // so the final SSE frame isn't dropped.
+      buffer += decoder.decode()
+      processBuffer()
+
+      if (!sawComplete) {
+        throw new Error('Stream ended before structured-output.complete')
+      }
     } catch (err) {
-      setError(err instanceof Error ? err.message : 'Unknown error')
+      if (err instanceof Error && err.name === 'AbortError') {
+        setError('Aborted')
+      } else {
+        setError(err instanceof Error ? err.message : 'Unknown error')
+      }
     } finally {
       setIsLoading(false)
+      setIsStreaming(false)
+      abortRef.current = null
     }
   }
 
+  const handleAbort = () => abortRef.current?.abort()
+
+  const renderingPartial = isStreaming && !hasFinalResult
+  const recommendations = result?.recommendations ?? []
+  const nextSteps = result?.nextSteps ?? []
+
   return (
-    <div className="…">
-      <h1 className="…">
-        Structured Output (OpenRouter)
-      </h1>
-      <p className="…">
+    <div className="…">
+      <h1 className="…">Structured Output</h1>
+      <p className="…">
         Calls <code>chat()</code> with an{' '}
-        <code>outputSchema</code> via the{' '}
-        <code>openRouterText</code> adapter and
-        parses the JSON result.
+        <code>outputSchema</code>. Toggle{' '}
+        <code>stream</code> to exercise{' '}
+        <code>structuredOutputStream</code> on the
+        selected provider; the UI fills in progressively via{' '}
+        <code>parsePartialJSON</code>, then snaps
+        to the validated payload from the terminal{' '}
+        <code>structured-output.complete</code>{' '}
+        event. Reasoning models surface a live thinking strip from{' '}
+        <code>REASONING_MESSAGE_CONTENT</code>{' '}
+        deltas — openai (Responses API), openrouter, xAI (
+        <code>delta.reasoning_content</code>), and
+        Groq (<code>delta.reasoning</code>) all
+        stream chain-of-thought.
+      </p>
 
-      <select value={model} onChange={(e) => setModel(e.target.value)}>
-        {OPENROUTER_MODELS.map((m) => (
-          <option key={m.value} value={m.value}>
-            {m.label}
-          </option>
-        ))}
-      </select>
+      <label htmlFor={providerId}>…</label>
+      <select
+        id={providerId}
+        value={provider}
+        onChange={(e) => onProviderChange(e.target.value as Provider)}
+        disabled={isLoading}
+        className="w-full rounded-lg border border-orange-500/20 bg-gray-800/50 px-3 py-2 text-sm text-white focus:outline-none focus:ring-2 focus:ring-orange-500/50 disabled:opacity-50"
+      >
+        {(Object.keys(PROVIDER_MODELS) as Array<Provider>).map((p) => (
+          <option key={p} value={p}>
+            {p}
+          </option>
+        ))}
+      </select>