From bd550bf2a61ae4f77bf0238aef7e6ea633beaa47 Mon Sep 17 00:00:00 2001
From: Tom Beckenham <34339192+tombeckenham@users.noreply.github.com>
Date: Tue, 5 May 2026 11:48:49 +1000
Subject: [PATCH 1/9] feat: streaming structured output (chat outputSchema +
 stream:true)

- @tanstack/ai: typed StructuredOutputStream<T> with terminal CUSTOM
  structured-output.complete event { object, raw, reasoning? }; optional
  TextAdapter.structuredOutputStream + activity-layer fallback;
  orchestrator hardening (always-finalize, typed RUN_ERROR with
  runId/model/timestamp, exactly-one-terminal-pair on tools branch, sync
  pre-flight errors, UI->Model message conversion on no-tools path).
- @tanstack/ai-openrouter: native structuredOutputStream via single
  stream:true + response_format:json_schema request; always-finalize on
  upstream close; empty-response and parse-error surface as typed
  RUN_ERROR; in-stream provider errors terminate the run; chain-of-thought
  reasoning threaded through the final CUSTOM event.
- E2E: structured-output-stream feature in matrix with happy-path + abort
  specs; useChat onCustomEvent/onChunk wiring exposes CUSTOM payload +
  delta count to DOM.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../streaming-structured-output-chat.md       |   5 +
 .../streaming-structured-output-openrouter.md |   5 +
 .../ai-openrouter/src/adapters/text.ts        | 276 ++++++++++++-
 .../tests/openrouter-adapter.test.ts          | 387 ++++++++++++++++++
 .../ai/src/activities/chat/adapter.ts         |  17 +
 .../ai/src/activities/chat/index.ts           | 324 ++++++++++++++-
 packages/typescript/ai/src/types.ts           |  49 +++
 testing/e2e/README.md                         |  41 +-
 .../structured-output-stream/abort.json       |  16 +
 .../structured-output-stream/basic.json       |  12 +
 testing/e2e/src/components/ChatUI.tsx         |  23 ++
 testing/e2e/src/lib/feature-support.ts        |   4 +
 testing/e2e/src/lib/features.ts               |   4 +
 testing/e2e/src/lib/types.ts                  |   2 +
 testing/e2e/src/routes/$provider/$feature.tsx |  22 +
 testing/e2e/src/routes/api.chat.ts            |  34 +-
 .../tests/structured-output-stream.spec.ts    |  87 ++++
 17 files changed, 1265 insertions(+), 43 deletions(-)
 create mode 100644 .changeset/streaming-structured-output-chat.md
 create mode 100644 .changeset/streaming-structured-output-openrouter.md
 create mode 100644 testing/e2e/fixtures/structured-output-stream/abort.json
 create mode 100644 testing/e2e/fixtures/structured-output-stream/basic.json
 create mode 100644 testing/e2e/tests/structured-output-stream.spec.ts
diff --git a/.changeset/streaming-structured-output-chat.md b/.changeset/streaming-structured-output-chat.md
new file mode 100644
index 000000000..68aa7302f
--- /dev/null
+++ b/.changeset/streaming-structured-output-chat.md
@@ -0,0 +1,5 @@
+---
+'@tanstack/ai': minor
+---
+
+feat: `chat({ outputSchema, stream: true })` returns `AsyncIterable<StreamChunk>` with raw JSON deltas plus a final `CUSTOM` `structured-output.complete` event carrying the validated parsed object. The existing `chat({ outputSchema })` (non-streaming) path is unchanged. Adapters expose this via a new optional `structuredOutputStream` method on `TextAdapter`; for adapters that omit it, the activity layer falls back to wrapping the non-streaming `structuredOutput` call, so adapters without native streaming JSON support still satisfy the new combination.
diff --git a/.changeset/streaming-structured-output-openrouter.md b/.changeset/streaming-structured-output-openrouter.md
new file mode 100644
index 000000000..2b0b7fe2b
--- /dev/null
+++ b/.changeset/streaming-structured-output-openrouter.md
@@ -0,0 +1,5 @@
+---
+'@tanstack/ai-openrouter': minor
+---
+
+feat: native streaming structured output. `OpenRouterTextAdapter.structuredOutputStream()` issues a single request with `stream: true` + `response_format: { type: 'json_schema', json_schema: { ..., strict: true } }`, surfacing JSON deltas as `TEXT_MESSAGE_CONTENT` chunks and a final `CUSTOM` `structured-output.complete` event with the parsed object — replacing the previous two-request (streamed text → non-streamed JSON) flow when used with `chat({ outputSchema, stream: true })`.
diff --git a/packages/typescript/ai-openrouter/src/adapters/text.ts b/packages/typescript/ai-openrouter/src/adapters/text.ts
index 29427171c..8ef62a882 100644
--- a/packages/typescript/ai-openrouter/src/adapters/text.ts
+++ b/packages/typescript/ai-openrouter/src/adapters/text.ts
@@ -81,7 +81,7 @@ interface AGUIState {
   hasEmittedRunStarted: boolean
   hasEmittedTextMessageStart: boolean
   hasEmittedTextMessageEnd: boolean
-  hasEmittedRunFinished: boolean
+  hasFinalizedChoice: boolean
   hasEmittedStepStarted: boolean
   deferredUsage:
     | { promptTokens: number; completionTokens: number; totalTokens: number }
@@ -131,7 +131,7 @@ export class OpenRouterTextAdapter<
       hasEmittedRunStarted: false,
       hasEmittedTextMessageStart: false,
       hasEmittedTextMessageEnd: false,
-      hasEmittedRunFinished: false,
+      hasFinalizedChoice: false,
       hasEmittedStepStarted: false,
       deferredUsage: undefined,
       computedFinishReason: undefined,
@@ -204,7 +204,7 @@ export class OpenRouterTextAdapter<
 
       // Emit RUN_FINISHED after the stream ends so we capture usage from
       // any chunk (some SDKs send usage on a separate trailing chunk).
-      if (aguiState.hasEmittedRunFinished && aguiState.computedFinishReason) {
+      if (aguiState.hasFinalizedChoice && aguiState.computedFinishReason) {
         yield asChunk({
           type: 'RUN_FINISHED',
           runId: aguiState.runId,
@@ -263,6 +263,272 @@ export class OpenRouterTextAdapter<
     }
   }
 
+  async *structuredOutputStream(
+    options: StructuredOutputOptions<ResolveProviderOptions<TModel>>,
+  ): AsyncIterable<StreamChunk> {
+    const { chatOptions, outputSchema } = options
+    const { logger } = chatOptions
+    const timestamp = Date.now()
+    const toolCallBuffers = new Map<number, ToolCallBuffer>()
+    let accumulatedReasoning = ''
+    let accumulatedContent = ''
+    let responseId: string | null = null
+    let currentModel = chatOptions.model
+    const aguiState: AGUIState = {
+      runId: chatOptions.runId ?? this.generateId(),
+      threadId: chatOptions.threadId ?? this.generateId(),
+      messageId: this.generateId(),
+      stepId: null,
+      reasoningMessageId: null,
+      hasClosedReasoning: false,
+      hasEmittedRunStarted: false,
+      hasEmittedTextMessageStart: false,
+      hasEmittedTextMessageEnd: false,
+      hasFinalizedChoice: false,
+      hasEmittedStepStarted: false,
+      deferredUsage: undefined,
+      computedFinishReason: undefined,
+    }
+
+    const strictSchema = convertSchemaToJsonSchema(outputSchema, {
+      forStructuredOutput: true,
+    })
+
+    try {
+      // Strip tools — structured-output mode shouldn't mix tool calls into the
+      // request body. Matches the non-streaming `structuredOutput` behavior.
+      const { tools: _tools, ...baseParams } =
+        this.mapTextOptionsToSDK(chatOptions)
+      logger.request(
+        `activity=structured-stream provider=openrouter model=${this.model} messages=${chatOptions.messages.length} stream=true`,
+        { provider: 'openrouter', model: this.model },
+      )
+      const stream = await this.client.chat.send(
+        {
+          chatRequest: {
+            ...baseParams,
+            stream: true,
+            responseFormat: {
+              type: 'json_schema',
+              jsonSchema: {
+                name: 'structured_output',
+                schema: strictSchema,
+                strict: true,
+              },
+            },
+          },
+        },
+        { signal: chatOptions.request?.signal },
+      )
+
+      for await (const chunk of stream) {
+        logger.provider(`provider=openrouter`, { chunk })
+        if (chunk.id) responseId = chunk.id
+        if (chunk.model) currentModel = chunk.model
+
+        if (!aguiState.hasEmittedRunStarted) {
+          aguiState.hasEmittedRunStarted = true
+          yield asChunk({
+            type: 'RUN_STARTED',
+            runId: aguiState.runId,
+            threadId: aguiState.threadId,
+            model: currentModel || chatOptions.model,
+            timestamp,
+          })
+        }
+
+        if (chunk.error) {
+          // Provider error mid-stream is terminal: emit RUN_ERROR and stop.
+          // Continuing risks emitting RUN_FINISHED after RUN_ERROR.
+          yield asChunk({
+            type: 'RUN_ERROR',
+            runId: aguiState.runId,
+            model: currentModel || chatOptions.model,
+            timestamp,
+            message: chunk.error.message || 'Unknown error',
+            code: String(chunk.error.code),
+            error: {
+              message: chunk.error.message || 'Unknown error',
+              code: String(chunk.error.code),
+            },
+          })
+          return
+        }
+
+        for (const choice of chunk.choices) {
+          yield* this.processChoice(
+            choice,
+            toolCallBuffers,
+            {
+              id: responseId || this.generateId(),
+              model: currentModel,
+              timestamp,
+            },
+            { reasoning: accumulatedReasoning, content: accumulatedContent },
+            (r, c) => {
+              accumulatedReasoning = r
+              accumulatedContent = c
+            },
+            chunk.usage,
+            aguiState,
+          )
+        }
+      }
+
+      // Finalize unconditionally. If upstream closed without a finishReason
+      // (truncation, transport drop), processChoice never closed reasoning/text
+      // or computed a finish reason — we still owe CUSTOM + RUN_FINISHED (or
+      // RUN_ERROR). NOTE(review): a zero-chunk stream skips RUN_STARTED here.
+      const resolvedModel = currentModel || chatOptions.model
+
+      if (aguiState.reasoningMessageId && !aguiState.hasClosedReasoning) {
+        aguiState.hasClosedReasoning = true
+        yield asChunk({
+          type: 'REASONING_MESSAGE_END',
+          messageId: aguiState.reasoningMessageId,
+          model: resolvedModel,
+          timestamp,
+        })
+        yield asChunk({
+          type: 'REASONING_END',
+          messageId: aguiState.reasoningMessageId,
+          model: resolvedModel,
+          timestamp,
+        })
+        if (aguiState.stepId) {
+          yield asChunk({
+            type: 'STEP_FINISHED',
+            stepName: aguiState.stepId,
+            stepId: aguiState.stepId,
+            model: resolvedModel,
+            timestamp,
+            content: accumulatedReasoning,
+          })
+        }
+      }
+
+      if (
+        aguiState.hasEmittedTextMessageStart &&
+        !aguiState.hasEmittedTextMessageEnd
+      ) {
+        aguiState.hasEmittedTextMessageEnd = true
+        yield asChunk({
+          type: 'TEXT_MESSAGE_END',
+          messageId: aguiState.messageId,
+          model: resolvedModel,
+          timestamp,
+        })
+      }
+
+      if (!accumulatedContent) {
+        // Mirrors the non-streaming `structuredOutput` empty-content error so
+        // refused/truncated responses surface as failures, not `null` data.
+        const message = 'Structured output response contained no content'
+        logger.errors(message, {
+          source: 'openrouter.structuredOutputStream',
+        })
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId: aguiState.runId,
+          model: resolvedModel,
+          timestamp,
+          message,
+          code: 'empty-response',
+          error: { message, code: 'empty-response' },
+        })
+        return
+      }
+
+      let parsed: unknown
+      try {
+        parsed = JSON.parse(accumulatedContent)
+      } catch (parseError) {
+        const message =
+          parseError instanceof SyntaxError
+            ? `Failed to parse structured output as JSON: ${parseError.message}`
+            : 'Failed to parse structured output as JSON'
+        logger.errors(message, {
+          source: 'openrouter.structuredOutputStream',
+          error: parseError,
+        })
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId: aguiState.runId,
+          model: resolvedModel,
+          timestamp,
+          message,
+          code: 'parse-error',
+          error: { message, code: 'parse-error' },
+        })
+        return
+      }
+
+      yield asChunk({
+        type: 'CUSTOM',
+        name: 'structured-output.complete',
+        value: {
+          object: parsed,
+          raw: accumulatedContent,
+          // Surface accumulated chain-of-thought (if any) on the terminal
+          // event so consumers that only subscribe to the final result can
+          // still recover what the model thought through to get there.
+          ...(accumulatedReasoning ? { reasoning: accumulatedReasoning } : {}),
+        },
+        model: resolvedModel,
+        timestamp,
+      })
+
+      yield asChunk({
+        type: 'RUN_FINISHED',
+        runId: aguiState.runId,
+        threadId: aguiState.threadId,
+        model: resolvedModel,
+        timestamp,
+        usage: aguiState.deferredUsage,
+        finishReason: aguiState.computedFinishReason ?? 'stop',
+      })
+    } catch (error) {
+      logger.errors('openrouter.structuredOutputStream fatal', {
+        error,
+        source: 'openrouter.structuredOutputStream',
+      })
+      if (!aguiState.hasEmittedRunStarted) {
+        aguiState.hasEmittedRunStarted = true
+        yield asChunk({
+          type: 'RUN_STARTED',
+          runId: aguiState.runId,
+          threadId: aguiState.threadId,
+          model: chatOptions.model,
+          timestamp,
+        })
+      }
+
+      if (error instanceof RequestAbortedError) {
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId: aguiState.runId,
+          model: chatOptions.model,
+          timestamp,
+          message: 'Request aborted',
+          code: 'aborted',
+          error: { message: 'Request aborted', code: 'aborted' },
+        })
+        return
+      }
+
+      yield asChunk({
+        type: 'RUN_ERROR',
+        runId: aguiState.runId,
+        model: chatOptions.model,
+        timestamp,
+        message: (error as Error).message || 'Unknown error',
+        error: {
+          message: (error as Error).message || 'Unknown error',
+        },
+      })
+    }
+  }
+
   async structuredOutput(
     options: StructuredOutputOptions<ResolveProviderOptions<TModel>>,
   ): Promise<StructuredOutputResult<unknown>> {
@@ -578,8 +844,8 @@ export class OpenRouterTextAdapter<
       // send two chunks with finishReason (one for the finish, one carrying
       // usage data).  Without this guard TEXT_MESSAGE_END and RUN_FINISHED
       // would be emitted twice.
-      if (!aguiState.hasEmittedRunFinished) {
-        aguiState.hasEmittedRunFinished = true
+      if (!aguiState.hasFinalizedChoice) {
+        aguiState.hasFinalizedChoice = true
 
         // Emit all completed tool calls when finish reason indicates tool usage
         if (finishReason === 'tool_calls' || toolCallBuffers.size > 0) {
diff --git a/packages/typescript/ai-openrouter/tests/openrouter-adapter.test.ts b/packages/typescript/ai-openrouter/tests/openrouter-adapter.test.ts
index 206d16525..53d79e2fd 100644
--- a/packages/typescript/ai-openrouter/tests/openrouter-adapter.test.ts
+++ b/packages/typescript/ai-openrouter/tests/openrouter-adapter.test.ts
@@ -1664,3 +1664,390 @@ describe('OpenRouter STEP event consistency', () => {
     expect(stepFinished).toHaveLength(1)
   })
 })
+
+describe('OpenRouter structuredOutputStream', () => {
+  beforeEach(() => {
+    vi.clearAllMocks()
+  })
+
+  it('issues a single streaming request with response_format json_schema and emits parsed object', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-stream-1',
+        model: 'openai/gpt-4o-mini',
+        choices: [{ delta: { content: '{"name":"Ali' }, finishReason: null }],
+      },
+      {
+        id: 'chatcmpl-stream-1',
+        model: 'openai/gpt-4o-mini',
+        choices: [
+          { delta: { content: 'ce","age":30}' }, finishReason: 'stop' },
+        ],
+        usage: { promptTokens: 5, completionTokens: 9, totalTokens: 14 },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const outputSchema = {
+      type: 'object',
+      properties: {
+        name: { type: 'string' },
+        age: { type: 'number' },
+      },
+      required: ['name', 'age'],
+    }
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'openai/gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema,
+    })) {
+      chunks.push(chunk)
+    }
+
+    // Single SDK call with stream:true + responseFormat
+    expect(mockSend).toHaveBeenCalledTimes(1)
+    const [rawParams] = mockSend.mock.calls[0]!
+    const params = rawParams.chatRequest
+    expect(params.stream).toBe(true)
+    expect(params.responseFormat).toEqual({
+      type: 'json_schema',
+      jsonSchema: {
+        name: 'structured_output',
+        schema: {
+          ...outputSchema,
+          additionalProperties: false,
+        },
+        strict: true,
+      },
+    })
+    expect(params.tools).toBeUndefined()
+
+    // Lifecycle events are present and in the contractual order. Delivering
+    // the CUSTOM `structured-output.complete` payload before RUN_FINISHED is
+    // part of the public contract, so assert it.
+    const types: Array<string> = chunks.map((c) => c.type)
+    const idx = (t: string) => types.indexOf(t)
+    expect(idx('RUN_STARTED')).toBeGreaterThanOrEqual(0)
+    expect(idx('TEXT_MESSAGE_START')).toBeGreaterThan(idx('RUN_STARTED'))
+    expect(idx('TEXT_MESSAGE_CONTENT')).toBeGreaterThan(
+      idx('TEXT_MESSAGE_START'),
+    )
+    expect(idx('TEXT_MESSAGE_END')).toBeGreaterThan(idx('TEXT_MESSAGE_CONTENT'))
+    expect(idx('CUSTOM')).toBeGreaterThan(idx('TEXT_MESSAGE_END'))
+    expect(idx('RUN_FINISHED')).toBeGreaterThan(idx('CUSTOM'))
+
+    // Two CONTENT deltas — one per stream chunk — carrying raw JSON deltas
+    const contentChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'TEXT_MESSAGE_CONTENT' }> =>
+        c.type === 'TEXT_MESSAGE_CONTENT',
+    )
+    expect(contentChunks).toHaveLength(2)
+    expect(contentChunks[0]!.delta).toBe('{"name":"Ali')
+    expect(contentChunks[1]!.delta).toBe('ce","age":30}')
+
+    // Final CUSTOM event carries the parsed object + raw text
+    const customChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]!.name).toBe('structured-output.complete')
+    expect(customChunks[0]!.value).toEqual({
+      object: { name: 'Alice', age: 30 },
+      raw: '{"name":"Alice","age":30}',
+    })
+  })
+
+  it('emits RUN_ERROR when accumulated content is not valid JSON', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-stream-bad',
+        model: 'openai/gpt-4o-mini',
+        choices: [{ delta: { content: 'not json' }, finishReason: 'stop' }],
+        usage: { promptTokens: 1, completionTokens: 1, totalTokens: 2 },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'openai/gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const errorChunks = chunks.filter((c) => c.type === 'RUN_ERROR')
+    expect(errorChunks).toHaveLength(1)
+    expect(errorChunks[0]).toMatchObject({
+      type: 'RUN_ERROR',
+      message: expect.stringContaining('Failed to parse structured output'),
+    })
+
+    const customChunks = chunks.filter((c) => c.type === 'CUSTOM')
+    expect(customChunks).toHaveLength(0)
+  })
+
+  it('emits empty-response RUN_ERROR when no content is streamed', async () => {
+    // Empty content delta plus a finish — mirrors a refused/truncated response.
+    const streamChunks = [
+      {
+        id: 'chatcmpl-stream-empty',
+        model: 'openai/gpt-4o-mini',
+        choices: [{ delta: { content: '' }, finishReason: 'stop' }],
+        usage: { promptTokens: 1, completionTokens: 0, totalTokens: 1 },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'openai/gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const errorChunks = chunks.filter((c) => c.type === 'RUN_ERROR')
+    expect(errorChunks).toHaveLength(1)
+    expect(errorChunks[0]).toMatchObject({
+      type: 'RUN_ERROR',
+      code: 'empty-response',
+    })
+    expect(chunks.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
+  })
+
+  it('finalizes the run when upstream stream closes without finishReason', async () => {
+    // Truncated SDK stream: deltas arrive but no finishReason. The adapter
+    // must still emit the terminal CUSTOM + RUN_FINISHED so consumers
+    // never hang waiting for completion.
+    const streamChunks = [
+      {
+        id: 'chatcmpl-stream-trunc',
+        model: 'openai/gpt-4o-mini',
+        choices: [
+          { delta: { content: '{"name":"Alice"}' }, finishReason: null },
+        ],
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'openai/gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const customChunks = chunks.filter((c) => c.type === 'CUSTOM')
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]).toMatchObject({
+      name: 'structured-output.complete',
+      value: { object: { name: 'Alice' }, raw: '{"name":"Alice"}' },
+    })
+    expect(chunks.filter((c) => c.type === 'RUN_FINISHED')).toHaveLength(1)
+    expect(chunks.filter((c) => c.type === 'RUN_ERROR')).toHaveLength(0)
+  })
+
+  it('terminates on mid-stream provider error without emitting RUN_FINISHED', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-stream-err',
+        model: 'openai/gpt-4o-mini',
+        choices: [{ delta: { content: '{"name":"Al' }, finishReason: null }],
+      },
+      {
+        id: 'chatcmpl-stream-err',
+        model: 'openai/gpt-4o-mini',
+        error: { message: 'Upstream rate limit', code: 429 },
+        choices: [],
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'openai/gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const errorChunks = chunks.filter((c) => c.type === 'RUN_ERROR')
+    expect(errorChunks).toHaveLength(1)
+    // After RUN_ERROR the stream is terminal — no RUN_FINISHED, no CUSTOM.
+    expect(chunks.filter((c) => c.type === 'RUN_FINISHED')).toHaveLength(0)
+    expect(chunks.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
+  })
+
+  it('surfaces accumulated reasoning on the structured-output.complete event', async () => {
+    // Thinking-model stream: reasoning deltas before content. Consumers that
+    // subscribe only to the terminal CUSTOM event should still recover the
+    // chain-of-thought via `value.reasoning`.
+    const streamChunks = [
+      {
+        id: 'chatcmpl-stream-reasoning',
+        model: 'openai/gpt-4o-mini',
+        choices: [
+          {
+            delta: {
+              reasoningDetails: [
+                { type: 'reasoning.text', text: 'Let me think... ' },
+              ],
+            },
+            finishReason: null,
+          },
+        ],
+      },
+      {
+        id: 'chatcmpl-stream-reasoning',
+        model: 'openai/gpt-4o-mini',
+        choices: [
+          {
+            delta: {
+              reasoningDetails: [
+                { type: 'reasoning.text', text: 'a Strat would suit them.' },
+              ],
+            },
+            finishReason: null,
+          },
+        ],
+      },
+      {
+        id: 'chatcmpl-stream-reasoning',
+        model: 'openai/gpt-4o-mini',
+        choices: [
+          {
+            delta: { content: '{"name":"Strat","price":1299}' },
+            finishReason: 'stop',
+          },
+        ],
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'openai/gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Recommend a guitar' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: {
+          name: { type: 'string' },
+          price: { type: 'number' },
+        },
+        required: ['name', 'price'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const customChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]!.value).toEqual({
+      object: { name: 'Strat', price: 1299 },
+      raw: '{"name":"Strat","price":1299}',
+      reasoning: 'Let me think... a Strat would suit them.',
+    })
+  })
+
+  it('omits reasoning from the CUSTOM event when none was streamed', async () => {
+    // Non-thinking model: no reasoning deltas. The `reasoning` field should
+    // be absent (not an empty string) so downstream consumers can branch on
+    // `value.reasoning != null` without false positives.
+    const streamChunks = [
+      {
+        id: 'chatcmpl-stream-noreasoning',
+        model: 'openai/gpt-4o-mini',
+        choices: [
+          {
+            delta: { content: '{"name":"Strat","price":1299}' },
+            finishReason: 'stop',
+          },
+        ],
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'openai/gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Recommend a guitar' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: {
+          name: { type: 'string' },
+          price: { type: 'number' },
+        },
+        required: ['name', 'price'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const customChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]!.value).not.toHaveProperty('reasoning')
+  })
+})
diff --git a/packages/typescript/ai/src/activities/chat/adapter.ts b/packages/typescript/ai/src/activities/chat/adapter.ts
index 4ccc6fc09..198b89ffa 100644
--- a/packages/typescript/ai/src/activities/chat/adapter.ts
+++ b/packages/typescript/ai/src/activities/chat/adapter.ts
@@ -97,6 +97,23 @@ export interface TextAdapter<
   structuredOutput: (
     options: StructuredOutputOptions<TProviderOptions>,
   ) => Promise<StructuredOutputResult<unknown>>
+
+  /**
+   * Stream structured output using the provider's native streaming structured
+   * output API (stream + response_format json_schema in a single request).
+   *
+   * Optional — adapters without native streaming JSON omit this method and the
+   * activity layer synthesizes a stream around the non-streaming
+   * `structuredOutput` call.
+   *
+   * Implementations must emit standard AG-UI lifecycle events (RUN_STARTED,
+   * TEXT_MESSAGE_*, RUN_FINISHED) carrying raw JSON text deltas, plus a
+   * `CUSTOM` event named `structured-output.complete`, emitted before
+   * RUN_FINISHED, whose `value` is `{ object, raw, reasoning? }`.
+   */
+  structuredOutputStream?: (
+    options: StructuredOutputOptions<TProviderOptions>,
+  ) => AsyncIterable<StreamChunk>
 }
 
 /**
diff --git a/packages/typescript/ai/src/activities/chat/index.ts b/packages/typescript/ai/src/activities/chat/index.ts
index e1327fdb5..7a3c332c4 100644
--- a/packages/typescript/ai/src/activities/chat/index.ts
+++ b/packages/typescript/ai/src/activities/chat/index.ts
@@ -38,6 +38,8 @@ import type {
   RunFinishedEvent,
   SchemaInput,
   StreamChunk,
+  StructuredOutputCompleteEvent,
+  StructuredOutputStream,
   TextMessageContentEvent,
   TextOptions,
   Tool,
@@ -213,7 +215,7 @@ export interface TextActivityOptions<
 export function createChatOptions<
   TAdapter extends AnyTextAdapter,
   TSchema extends SchemaInput | undefined = undefined,
-  TStream extends boolean = true,
+  TStream extends boolean = boolean,
 >(
   options: TextActivityOptions<TAdapter, TSchema, TStream>,
 ): TextActivityOptions<TAdapter, TSchema, TStream> {
@@ -226,16 +228,28 @@ export function createChatOptions<
 
 /**
  * Result type for the text activity.
- * - If outputSchema is provided: Promise<InferSchemaType<TSchema>>
- * - If stream is false: Promise<string>
- * - Otherwise (stream is true, default): AsyncIterable<StreamChunk>
+ * - If outputSchema is provided AND stream is explicitly true:
+ *   StructuredOutputStream<InferSchemaType<TSchema>> — yields raw JSON deltas
+ *   via TEXT_MESSAGE_CONTENT plus a terminal StructuredOutputCompleteEvent
+ *   carrying the validated object.
+ * - If outputSchema is provided without explicit stream:true:
+ *   Promise<InferSchemaType<TSchema>>.
+ * - If stream is explicitly false (no schema): Promise<string>.
+ * - Otherwise (default): AsyncIterable<StreamChunk>.
+ *
+ * `[TStream] extends [true]` (not `TStream extends true`) prevents distribution
+ * over the default `boolean` (`true | false`) `TStream`, so it does *not*
+ * match the streaming branch. Otherwise plain `chat({ outputSchema })` would
+ * type as stream | Promise while the runtime returns a Promise (issue #526).
  */
 export type TextActivityResult<
   TSchema extends SchemaInput | undefined,
-  TStream extends boolean = true,
+  TStream extends boolean = boolean,
 > = TSchema extends SchemaInput
-  ? Promise<InferSchemaType<TSchema>>
-  : TStream extends false
+  ? [TStream] extends [true]
+    ? StructuredOutputStream<InferSchemaType<TSchema>>
+    : Promise<InferSchemaType<TSchema>>
+  : [TStream] extends [false]
     ? Promise<string>
     : AsyncIterable<StreamChunk>
 
@@ -1512,13 +1526,26 @@ class TextEngine<
 export function chat<
   TAdapter extends AnyTextAdapter,
   TSchema extends SchemaInput | undefined = undefined,
-  TStream extends boolean = true,
+  TStream extends boolean = boolean,
 >(
   options: TextActivityOptions<TAdapter, TSchema, TStream>,
 ): TextActivityResult<TSchema, TStream> {
   const { outputSchema, stream } = options
 
-  // If outputSchema is provided, run agentic structured output
+  // outputSchema + stream:true is the only branch that streams structured
+  // output. Without an explicit `stream: true`, schema-bearing calls run the
+  // agent loop and resolve to a typed Promise<InferSchemaType<TSchema>>.
+  if (outputSchema && stream === true) {
+    return runStreamingStructuredOutput(
+      options as unknown as TextActivityOptions<
+        AnyTextAdapter,
+        SchemaInput,
+        true
+      >,
+    ) as TextActivityResult<TSchema, TStream>
+  }
+
+  // If outputSchema is provided, run agentic structured output (Promise<T>)
   if (outputSchema) {
     return runAgenticStructuredOutput(
       options as unknown as TextActivityOptions<
@@ -1678,6 +1705,285 @@ async function runAgenticStructuredOutput<TSchema extends SchemaInput>(
   return result.data as InferSchemaType<TSchema>
 }
 
+/**
+ * Synthesize a structured-output stream for adapters lacking a native
+ * `structuredOutputStream`: awaits the non-streaming `structuredOutput`, then
+ * emits the full text as ONE content delta (or RUN_ERROR if the call throws).
+ */
+async function* fallbackStructuredOutputStream(
+  adapter: AnyTextAdapter,
+  options: { chatOptions: TextOptions<any, any>; outputSchema: any },
+): AsyncIterable<StreamChunk> {
+  const { chatOptions } = options
+  const runId = chatOptions.runId ?? `mock-${Date.now()}`
+  const threadId = chatOptions.threadId ?? `mock-${Date.now()}`
+  const messageId = `mock-${Date.now()}-${Math.random().toString(36).slice(2)}`
+  const model = chatOptions.model
+  const timestamp = Date.now()
+
+  yield {
+    type: 'RUN_STARTED',
+    runId,
+    threadId,
+    model,
+    timestamp,
+  } as unknown as StreamChunk
+
+  let result: { data: unknown; rawText: string }
+  try {
+    result = await adapter.structuredOutput(options)
+  } catch (error) {
+    const message = error instanceof Error ? error.message : 'Unknown error'
+    yield {
+      type: 'RUN_ERROR',
+      runId,
+      model,
+      timestamp,
+      message,
+      error: { message },
+    } as unknown as StreamChunk
+    return
+  }
+
+  yield {
+    type: 'TEXT_MESSAGE_START',
+    messageId,
+    role: 'assistant',
+    model,
+    timestamp,
+  } as unknown as StreamChunk
+
+  yield {
+    type: 'TEXT_MESSAGE_CONTENT',
+    messageId,
+    delta: result.rawText,
+    model,
+    timestamp,
+  } as unknown as StreamChunk
+
+  yield {
+    type: 'TEXT_MESSAGE_END',
+    messageId,
+    model,
+    timestamp,
+  } as unknown as StreamChunk
+
+  yield {
+    type: 'CUSTOM',
+    name: 'structured-output.complete',
+    value: { object: result.data, raw: result.rawText },
+    model,
+    timestamp,
+  } as unknown as StreamChunk
+
+  yield {
+    type: 'RUN_FINISHED',
+    runId,
+    threadId,
+    model,
+    timestamp,
+    finishReason: 'stop',
+  } as unknown as StreamChunk
+}
+
+/**
+ * Run streaming structured output:
+ * - Without tools: call adapter.structuredOutputStream (or the synthesized
+ *   fallback) once — JSON deltas followed by a final CUSTOM event.
+ * - With tools: run the agent loop, yield its chunks minus RUN_STARTED /
+ *   RUN_FINISHED, then stream structured output from the final messages; that
+ *   stream's RUN_STARTED/RUN_FINISHED pair is the only one consumers see.
+ *
+ * Validates the parsed object against the original Standard Schema (if
+ * applicable) when forwarding the final `structured-output.complete` event.
+ *
+ * Pre-flight validation (missing schema, unconvertible schema) throws
+ * synchronously at call time rather than as a yielded RUN_ERROR mid-stream —
+ * those are programmer errors, not runtime conditions.
+ */
+function runStreamingStructuredOutput<TSchema extends SchemaInput>(
+  options: TextActivityOptions<AnyTextAdapter, TSchema, true>,
+): StructuredOutputStream<InferSchemaType<TSchema>> {
+  const { outputSchema } = options
+
+  if (!outputSchema) {
+    throw new Error('outputSchema is required for streaming structured output')
+  }
+
+  // forStructuredOutput strict-converts the schema once at the activity
+  // boundary. Adapters can re-convert if their wire format diverges, but the
+  // default flow hands them a strict-ready schema.
+  const jsonSchema = convertSchemaToJsonSchema(outputSchema, {
+    forStructuredOutput: true,
+  })
+  if (!jsonSchema) {
+    throw new Error('Failed to convert output schema to JSON Schema')
+  }
+
+  return runStreamingStructuredOutputImpl(options, jsonSchema)
+}
+
+async function* runStreamingStructuredOutputImpl<TSchema extends SchemaInput>(
+  options: TextActivityOptions<AnyTextAdapter, TSchema, true>,
+  jsonSchema: NonNullable<ReturnType<typeof convertSchemaToJsonSchema>>,
+): StructuredOutputStream<InferSchemaType<TSchema>> {
+  const { adapter, outputSchema, middleware, context, debug, ...textOptions } =
+    options
+  const model = adapter.model
+  const logger = resolveDebugOption(debug)
+  const runId = textOptions.runId
+
+  // Inputs may be UIMessages (from useChat) or ModelMessages (from server-side
+  // callers). The agent-loop branch converts via TextEngine; the no-tools
+  // branch must convert here so the adapter sees a uniform ModelMessage shape.
+  let finalMessages = convertMessagesToModelMessages(
+    (textOptions.messages ?? []) as Array<any>,
+  )
+
+  if (textOptions.tools?.length) {
+    const engine = new TextEngine(
+      {
+        adapter,
+        params: { ...textOptions, model, logger } as TextOptions<
+          Record<string, unknown>,
+          Record<string, unknown>
+        >,
+        middleware,
+        context,
+      },
+      logger,
+    )
+
+    // The structured-output stream emits its own RUN_STARTED + RUN_FINISHED
+    // pair to bracket the run — drop both from the engine's output so
+    // consumers see exactly one terminal lifecycle pair.
+    try {
+      for await (const chunk of engine.run()) {
+        if (chunk.type === 'RUN_STARTED' || chunk.type === 'RUN_FINISHED') {
+          continue
+        }
+        yield chunk
+      }
+    } catch (engineError) {
+      const message = (engineError as Error).message || 'Agent loop failed'
+      logger.errors('runStreamingStructuredOutput agent loop failed', {
+        error: engineError,
+        source: 'runStreamingStructuredOutput',
+      })
+      yield {
+        type: 'RUN_ERROR',
+        runId,
+        model,
+        timestamp: Date.now(),
+        message,
+        code: 'agent-loop-failed',
+        error: { message, code: 'agent-loop-failed' },
+      } as unknown as StreamChunk
+      return
+    }
+
+    finalMessages = engine.getMessages()
+  }
+
+  const {
+    tools: _tools,
+    agentLoopStrategy: _als,
+    ...structuredTextOptions
+  } = textOptions
+
+  const providerName =
+    (adapter as { provider?: string }).provider ?? adapter.name
+  logger.request(
+    `activity=chat-structured-stream provider=${providerName} model=${model} messages=${finalMessages.length}`,
+    {
+      provider: providerName,
+      model,
+      messageCount: finalMessages.length,
+    },
+  )
+
+  const structuredChatOptions = {
+    ...structuredTextOptions,
+    model,
+    messages: finalMessages,
+    logger,
+  }
+
+  // Adapters that don't implement structuredOutputStream natively fall back
+  // to wrapping the non-streaming `structuredOutput` — `fallbackStructuredOutputStream`
+  // synthesizes the AG-UI lifecycle events around it.
+  const stream = adapter.structuredOutputStream
+    ? adapter.structuredOutputStream({
+        chatOptions: structuredChatOptions,
+        outputSchema: jsonSchema,
+      })
+    : fallbackStructuredOutputStream(adapter, {
+        chatOptions: structuredChatOptions,
+        outputSchema: jsonSchema,
+      })
+
+  for await (const chunk of stream) {
+    if (
+      chunk.type === 'CUSTOM' &&
+      chunk.name === 'structured-output.complete'
+    ) {
+      const customChunk = chunk
+      const value = customChunk.value as {
+        object: unknown
+        raw: string
+        reasoning?: string
+      }
+      if (isStandardSchema(outputSchema)) {
+        try {
+          const validated = parseWithStandardSchema(outputSchema, value.object)
+          yield {
+            ...customChunk,
+            // Forward `reasoning` through schema validation so consumers that
+            // only listen for the terminal event don't lose chain-of-thought.
+            value: {
+              object: validated,
+              raw: value.raw,
+              ...(value.reasoning ? { reasoning: value.reasoning } : {}),
+            },
+          } as StructuredOutputCompleteEvent<InferSchemaType<TSchema>>
+          continue
+        } catch (err) {
+          const message = (err as Error).message || 'Schema validation failed'
+          logger.errors(
+            'runStreamingStructuredOutput schema validation failed',
+            {
+              error: err,
+              source: 'runStreamingStructuredOutput',
+              // Include reasoning in error meta so post-mortems can recover
+              // what the model thought through before producing invalid JSON.
+              ...(value.reasoning ? { reasoning: value.reasoning } : {}),
+            },
+          )
+          yield {
+            type: 'RUN_ERROR',
+            runId,
+            model: customChunk.model ?? model,
+            timestamp: customChunk.timestamp ?? Date.now(),
+            message,
+            code: 'schema-validation',
+            error: {
+              message,
+              code: 'schema-validation',
+              ...(value.reasoning ? { reasoning: value.reasoning } : {}),
+            },
+          } as unknown as StreamChunk
+          return
+        }
+      }
+      yield customChunk as StructuredOutputCompleteEvent<
+        InferSchemaType<TSchema>
+      >
+      continue
+    }
+    yield chunk
+  }
+}
+
 // Re-export adapter types
 export type {
   TextAdapter,
diff --git a/packages/typescript/ai/src/types.ts b/packages/typescript/ai/src/types.ts
index e11e7176f..abcca84c1 100644
--- a/packages/typescript/ai/src/types.ts
+++ b/packages/typescript/ai/src/types.ts
@@ -1044,6 +1044,55 @@ export interface CustomEvent extends AGUICustomEvent {
   model?: string
 }
 
+/**
+ * Final event of a streaming structured-output run. Carries the validated
+ * `object` (typed as `T` after the orchestrator runs Standard Schema parsing),
+ * the `raw` JSON text that produced it, and — for thinking/reasoning models —
+ * the accumulated reasoning text. Adapters emit this with `T = unknown`; the
+ * chat orchestrator narrows to the schema's inferred type after validation.
+ *
+ * `reasoning` is `undefined` when the model produced none (most non-thinking
+ * models) and when the underlying adapter doesn't expose reasoning streams.
+ */
+export interface StructuredOutputCompleteEvent<T = unknown> extends Omit<
+  CustomEvent,
+  'name' | 'value'
+> {
+  name: 'structured-output.complete'
+  value: { object: T; raw: string; reasoning?: string }
+}
+
+/**
+ * Public type for streams returned by `chat({ outputSchema, stream: true })`.
+ * Yields all standard `StreamChunk` lifecycle events plus a terminal
+ * `StructuredOutputCompleteEvent<T>` whose `value.object` is typed against the
+ * caller's schema.
+ */
+export type StructuredOutputStream<T = unknown> = AsyncIterable<
+  StreamChunk | StructuredOutputCompleteEvent<T>
+>
+
+/**
+ * Type guard for the terminal `structured-output.complete` event. Use to
+ * narrow chunks while iterating a `StructuredOutputStream<T>`:
+ *
+ * ```ts
+ * for await (const chunk of stream) {
+ *   if (isStructuredOutputCompleteEvent<MySchema>(chunk)) {
+ *     chunk.value.object  // typed as MySchema
+ *   }
+ * }
+ * ```
+ */
+export function isStructuredOutputCompleteEvent<T = unknown>(
+  chunk: StreamChunk | StructuredOutputCompleteEvent<T>,
+): chunk is StructuredOutputCompleteEvent<T> {
+  return (
+    chunk.type === 'CUSTOM' &&
+    (chunk as CustomEvent).name === 'structured-output.complete'
+  )
+}
+
 // ============================================================================
 // AG-UI Reasoning Event Interfaces
 // ============================================================================
diff --git a/testing/e2e/README.md b/testing/e2e/README.md
index cc1fb3873..285620db4 100644
--- a/testing/e2e/README.md
+++ b/testing/e2e/README.md
@@ -12,25 +12,26 @@ End-to-end tests for TanStack AI using Playwright and [aimock](https://github.co
 
 Each test iterates over supported providers using `providersFor('feature')`:
 
-| Feature               | Providers | Spec file                             |
-| --------------------- | --------- | ------------------------------------- |
-| chat                  | 7         | `tests/chat.spec.ts`                  |
-| one-shot-text         | 7         | `tests/one-shot-text.spec.ts`         |
-| multi-turn            | 7         | `tests/multi-turn.spec.ts`            |
-| structured-output     | 7         | `tests/structured-output.spec.ts`     |
-| tool-calling          | 7         | `tests/tool-calling.spec.ts`          |
-| parallel-tool-calls   | 6         | `tests/parallel-tool-calls.spec.ts`   |
-| tool-approval         | 6         | `tests/tool-approval.spec.ts`         |
-| text-tool-text        | 6         | `tests/text-tool-text.spec.ts`        |
-| agentic-structured    | 7         | `tests/agentic-structured.spec.ts`    |
-| reasoning             | 3         | `tests/reasoning.spec.ts`             |
-| multimodal-image      | 5         | `tests/multimodal-image.spec.ts`      |
-| multimodal-structured | 5         | `tests/multimodal-structured.spec.ts` |
-| summarize             | 6         | `tests/summarize.spec.ts`             |
-| summarize-stream      | 6         | `tests/summarize-stream.spec.ts`      |
-| image-gen             | 7         | `tests/image-gen.spec.ts`             |
-| tts                   | 7         | `tests/tts.spec.ts`                   |
-| transcription         | 7         | `tests/transcription.spec.ts`         |
+| Feature                  | Providers | Spec file                                |
+| ------------------------ | --------- | ---------------------------------------- |
+| chat                     | 7         | `tests/chat.spec.ts`                     |
+| one-shot-text            | 7         | `tests/one-shot-text.spec.ts`            |
+| multi-turn               | 7         | `tests/multi-turn.spec.ts`               |
+| structured-output        | 7         | `tests/structured-output.spec.ts`        |
+| structured-output-stream | 1         | `tests/structured-output-stream.spec.ts` |
+| tool-calling             | 7         | `tests/tool-calling.spec.ts`             |
+| parallel-tool-calls      | 6         | `tests/parallel-tool-calls.spec.ts`      |
+| tool-approval            | 6         | `tests/tool-approval.spec.ts`            |
+| text-tool-text           | 6         | `tests/text-tool-text.spec.ts`           |
+| agentic-structured       | 7         | `tests/agentic-structured.spec.ts`       |
+| reasoning                | 3         | `tests/reasoning.spec.ts`                |
+| multimodal-image         | 5         | `tests/multimodal-image.spec.ts`         |
+| multimodal-structured    | 5         | `tests/multimodal-structured.spec.ts`    |
+| summarize                | 6         | `tests/summarize.spec.ts`                |
+| summarize-stream         | 6         | `tests/summarize-stream.spec.ts`         |
+| image-gen                | 7         | `tests/image-gen.spec.ts`                |
+| tts                      | 7         | `tests/tts.spec.ts`                      |
+| transcription            | 7         | `tests/transcription.spec.ts`            |
 
 ### Tools-test page
 
@@ -122,7 +123,7 @@ Clean up the fixture:
 }
 ```
 
-Existing prefixes: `[chat]`, `[oneshot]`, `[reasoning]`, `[multiturn-1]`, `[multiturn-2]`, `[toolcall]`, `[parallel]`, `[approval]`, `[approval-deny]`, `[text-tool-text]`, `[structured]`, `[agentic]`, `[mmimage]`, `[mmstruct]`, `[summarize]`, `[imagegen]`, `[tts]`, `[transcription]`, `[abort-test]`, `[error-test]`.
+Existing prefixes: `[chat]`, `[oneshot]`, `[reasoning]`, `[multiturn-1]`, `[multiturn-2]`, `[toolcall]`, `[parallel]`, `[approval]`, `[approval-deny]`, `[text-tool-text]`, `[structured]`, `[structured-stream]`, `[agentic]`, `[mmimage]`, `[mmstruct]`, `[summarize]`, `[imagegen]`, `[tts]`, `[transcription]`, `[abort-test]`, `[error-test]`.
 
 ## 4. Writing a Test
 
diff --git a/testing/e2e/fixtures/structured-output-stream/abort.json b/testing/e2e/fixtures/structured-output-stream/abort.json
new file mode 100644
index 000000000..6ed750774
--- /dev/null
+++ b/testing/e2e/fixtures/structured-output-stream/abort.json
@@ -0,0 +1,16 @@
+{
+  "fixtures": [
+    {
+      "match": {
+        "userMessage": "[structured-stream-abort] recommend a guitar slowly"
+      },
+      "response": {
+        "content": "{\"name\":\"Fender Stratocaster\",\"price\":1299,\"reason\":\"Versatile tone and comfortable playability across many genres including blues rock jazz country and pop with a wide tonal palette\",\"rating\":5}"
+      },
+      "opts": {
+        "tokensPerSecond": 1,
+        "chunkSize": 2
+      }
+    }
+  ]
+}
diff --git a/testing/e2e/fixtures/structured-output-stream/basic.json b/testing/e2e/fixtures/structured-output-stream/basic.json
new file mode 100644
index 000000000..62ef046fc
--- /dev/null
+++ b/testing/e2e/fixtures/structured-output-stream/basic.json
@@ -0,0 +1,12 @@
+{
+  "fixtures": [
+    {
+      "match": {
+        "userMessage": "[structured-stream] recommend a guitar as json"
+      },
+      "response": {
+        "content": "{\"name\":\"Fender Stratocaster\",\"price\":1299,\"reason\":\"Versatile tone and comfortable playability\",\"rating\":5}"
+      }
+    }
+  ]
+}
diff --git a/testing/e2e/src/components/ChatUI.tsx b/testing/e2e/src/components/ChatUI.tsx
index 7183115ae..da5f0c595 100644
--- a/testing/e2e/src/components/ChatUI.tsx
+++ b/testing/e2e/src/components/ChatUI.tsx
@@ -18,6 +18,13 @@ interface ChatUIProps {
   }) => Promise<void>
   showImageInput?: boolean
   onStop?: () => void
+  /** When the streaming structured-output CUSTOM event lands, the page
+   *  exposes the parsed object here so e2e tests can assert that the event
+   *  reached the client (not just that the JSON text was rendered). */
+  structuredObject?: unknown
+  /** Number of TEXT_MESSAGE_CONTENT chunks observed. Used by streaming e2e
+   *  tests to verify the response actually streamed in multiple deltas. */
+  contentDeltaCount?: number
 }
 
 export function ChatUI({
@@ -28,6 +35,8 @@ export function ChatUI({
   addToolApprovalResponse,
   showImageInput,
   onStop,
+  structuredObject,
+  contentDeltaCount,
 }: ChatUIProps) {
   const [input, setInput] = useState('')
   const messagesRef = useRef<HTMLDivElement>(null)
@@ -46,6 +55,20 @@ export function ChatUI({
 
   return (
     <div className="flex flex-col h-[calc(100vh-60px)]">
+      {structuredObject != null && (
+        <div
+          data-testid="structured-output-complete"
+          data-structured-output={JSON.stringify(structuredObject)}
+          hidden
+        />
+      )}
+      {contentDeltaCount != null && (
+        <div
+          data-testid="content-delta-count"
+          data-count={String(contentDeltaCount)}
+          hidden
+        />
+      )}
       <div
         ref={messagesRef}
         data-testid="message-list"
diff --git a/testing/e2e/src/lib/feature-support.ts b/testing/e2e/src/lib/feature-support.ts
index db0696e4e..8c0779f7d 100644
--- a/testing/e2e/src/lib/feature-support.ts
+++ b/testing/e2e/src/lib/feature-support.ts
@@ -80,6 +80,10 @@ export const matrix: Record<Feature, Set<Provider>> = {
     'grok',
     'openrouter',
   ]),
+  // Streaming structured output: only providers with native streaming JSON
+  // schema support are listed here. Other providers fall back to the default
+  // BaseTextAdapter implementation but aren't exercised by E2E yet.
+  'structured-output-stream': new Set(['openrouter']),
   'agentic-structured': new Set([
     'openai',
     'anthropic',
diff --git a/testing/e2e/src/lib/features.ts b/testing/e2e/src/lib/features.ts
index 15000cd7e..08f7aa6c3 100644
--- a/testing/e2e/src/lib/features.ts
+++ b/testing/e2e/src/lib/features.ts
@@ -49,6 +49,10 @@ export const featureConfigs: Record<Feature, FeatureConfig> = {
     tools: [],
     modelOptions: {},
   },
+  'structured-output-stream': {
+    tools: [],
+    modelOptions: {},
+  },
   'agentic-structured': {
     tools: [getGuitars],
     modelOptions: {},
diff --git a/testing/e2e/src/lib/types.ts b/testing/e2e/src/lib/types.ts
index 00c848157..cca9e4d79 100644
--- a/testing/e2e/src/lib/types.ts
+++ b/testing/e2e/src/lib/types.ts
@@ -19,6 +19,7 @@ export type Feature =
   | 'tool-approval'
   | 'text-tool-text'
   | 'structured-output'
+  | 'structured-output-stream'
   | 'agentic-structured'
   | 'multimodal-image'
   | 'multimodal-structured'
@@ -49,6 +50,7 @@ export const ALL_FEATURES: Feature[] = [
   'tool-approval',
   'text-tool-text',
   'structured-output',
+  'structured-output-stream',
   'agentic-structured',
   'multimodal-image',
   'multimodal-structured',
diff --git a/testing/e2e/src/routes/$provider/$feature.tsx b/testing/e2e/src/routes/$provider/$feature.tsx
index de76993a2..f4c7478e4 100644
--- a/testing/e2e/src/routes/$provider/$feature.tsx
+++ b/testing/e2e/src/routes/$provider/$feature.tsx
@@ -1,4 +1,5 @@
 import { createFileRoute } from '@tanstack/react-router'
+import { useState } from 'react'
 import { fetchServerSentEvents, useChat } from '@tanstack/ai-react'
 import { clientTools } from '@tanstack/ai-client'
 import type { Feature, Mode, Provider } from '@/lib/types'
@@ -137,17 +138,38 @@ function ChatFeature({
 
   const { testId, aimockPort } = Route.useSearch()
 
+  // Tracks streaming-structured-output observability for e2e tests:
+  // - structuredObject: captured from the terminal CUSTOM event
+  // - contentDeltaCount: incremented per TEXT_MESSAGE_CONTENT chunk so tests
+  //   can verify the response actually streamed (rather than silently
+  //   collapsing to a single synthetic delta)
+  const [structuredObject, setStructuredObject] = useState<unknown>(null)
+  const [contentDeltaCount, setContentDeltaCount] = useState(0)
+
   const { messages, sendMessage, isLoading, addToolApprovalResponse, stop } =
     useChat({
       connection: fetchServerSentEvents('/api/chat'),
       tools,
       body: { provider, feature, testId, aimockPort },
+      onCustomEvent: (eventType, data) => {
+        if (eventType === 'structured-output.complete') {
+          const value = data as { object: unknown; raw: string } | undefined
+          setStructuredObject(value?.object ?? null)
+        }
+      },
+      onChunk: (chunk) => {
+        if (chunk.type === 'TEXT_MESSAGE_CONTENT') {
+          setContentDeltaCount((n) => n + 1)
+        }
+      },
     })
 
   return (
     <ChatUI
       messages={messages}
       isLoading={isLoading}
+      structuredObject={structuredObject}
+      contentDeltaCount={contentDeltaCount}
       onSendMessage={(text) => {
         sendMessage(text)
       }}
diff --git a/testing/e2e/src/routes/api.chat.ts b/testing/e2e/src/routes/api.chat.ts
index 30a00f8cc..7ee2bb9eb 100644
--- a/testing/e2e/src/routes/api.chat.ts
+++ b/testing/e2e/src/routes/api.chat.ts
@@ -3,6 +3,7 @@ import { chat, maxIterations, toServerSentEventsResponse } from '@tanstack/ai'
 import type { Feature, Provider } from '@/lib/types'
 import { createTextAdapter } from '@/lib/providers'
 import { featureConfigs } from '@/lib/features'
+import { guitarRecommendationSchema } from '@/lib/schemas'
 
 export const Route = createFileRoute('/api/chat')({
   server: {
@@ -33,15 +34,30 @@ export const Route = createFileRoute('/api/chat')({
         )
 
         try {
-          const stream = chat({
-            ...adapterOptions,
-            tools: config.tools,
-            modelOptions: config.modelOptions,
-            systemPrompts: ['You are a helpful assistant for a guitar store.'],
-            agentLoopStrategy: maxIterations(5),
-            messages,
-            abortController,
-          })
+          const stream =
+            feature === 'structured-output-stream'
+              ? chat({
+                  ...adapterOptions,
+                  modelOptions: config.modelOptions,
+                  systemPrompts: [
+                    'You are a helpful assistant for a guitar store.',
+                  ],
+                  messages,
+                  outputSchema: guitarRecommendationSchema,
+                  stream: true,
+                  abortController,
+                })
+              : chat({
+                  ...adapterOptions,
+                  tools: config.tools,
+                  modelOptions: config.modelOptions,
+                  systemPrompts: [
+                    'You are a helpful assistant for a guitar store.',
+                  ],
+                  agentLoopStrategy: maxIterations(5),
+                  messages,
+                  abortController,
+                })
 
           return toServerSentEventsResponse(stream, { abortController })
         } catch (error: any) {
diff --git a/testing/e2e/tests/structured-output-stream.spec.ts b/testing/e2e/tests/structured-output-stream.spec.ts
new file mode 100644
index 000000000..598355e0a
--- /dev/null
+++ b/testing/e2e/tests/structured-output-stream.spec.ts
@@ -0,0 +1,87 @@
+import { test, expect } from './fixtures'
+import {
+  sendMessage,
+  waitForResponse,
+  getLastAssistantMessage,
+  featureUrl,
+} from './helpers'
+import { providersFor } from './test-matrix'
+
+for (const provider of providersFor('structured-output-stream')) {
+  test.describe(`${provider} — structured-output-stream`, () => {
+    test('streams structured JSON deltas in a single request', async ({
+      page,
+      testId,
+      aimockPort,
+    }) => {
+      await page.goto(
+        featureUrl(provider, 'structured-output-stream', testId, aimockPort),
+      )
+
+      await sendMessage(page, '[structured-stream] recommend a guitar as json')
+      await waitForResponse(page)
+
+      const response = await getLastAssistantMessage(page)
+      expect(response).toContain('Fender Stratocaster')
+      expect(response).toContain('1299')
+
+      // Verify the terminal `structured-output.complete` CUSTOM event
+      // reached the client and carries the parsed object — protects against
+      // a regression where the event is dropped but the JSON text still
+      // happens to render.
+      const completeEl = page.getByTestId('structured-output-complete')
+      await expect(completeEl).toBeAttached()
+      const structuredAttr = await completeEl.getAttribute(
+        'data-structured-output',
+      )
+      expect(structuredAttr).toBeTruthy()
+      const parsed = JSON.parse(structuredAttr!)
+      expect(parsed.name).toContain('Fender Stratocaster')
+      expect(parsed.price).toBe(1299)
+
+      // Verify the response actually streamed (more than one content delta).
+      // A regression that silently fell back to the synthetic single-delta
+      // path would still pass the substring assertion above but fail here.
+      const countAttr = await page
+        .getByTestId('content-delta-count')
+        .getAttribute('data-count')
+      expect(Number(countAttr)).toBeGreaterThan(1)
+    })
+
+    test('aborting mid-stream stops the run cleanly', async ({
+      page,
+      testId,
+      aimockPort,
+    }) => {
+      await page.goto(
+        featureUrl(provider, 'structured-output-stream', testId, aimockPort),
+      )
+
+      // Uses the slow-streaming fixture (tokensPerSecond + small chunkSize)
+      // so the stop button is reliably visible mid-stream.
+      await sendMessage(
+        page,
+        '[structured-stream-abort] recommend a guitar slowly',
+      )
+
+      await expect(page.getByTestId('loading-indicator')).toBeVisible({
+        timeout: 10_000,
+      })
+
+      const stopButton = page.getByTestId('stop-button')
+      await expect(stopButton).toBeVisible({ timeout: 5_000 })
+      await stopButton.click()
+
+      await expect(page.getByTestId('loading-indicator')).not.toBeVisible({
+        timeout: 10_000,
+      })
+
+      // The structured-output.complete event must not have reached the
+      // client — aborting before the JSON finished streaming should leave
+      // the run terminated, not "completed with empty result".
+      await expect(page.getByTestId('structured-output-complete')).toHaveCount(
+        0,
+      )
+    })
+  })
+}

From c83d21bd292b455f7b66b62d8d2d5db3f6cb74b2 Mon Sep 17 00:00:00 2001
From: Tom Beckenham <34339192+tombeckenham@users.noreply.github.com>
Date: Tue, 5 May 2026 14:17:39 +1000
Subject: [PATCH 2/9] feat: native streaming structured output for openai,
 grok, groq
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Adds `structuredOutputStream` to `@tanstack/ai-openai`,
`@tanstack/ai-grok`, and `@tanstack/ai-groq`, mirroring the openrouter
reference: a single request with `stream: true` +
`response_format: json_schema` (Chat Completions for grok/groq) or
`text.format: json_schema` (Responses API for openai), no tools, raw
JSON deltas as `TEXT_MESSAGE_CONTENT` plus a terminal `CUSTOM`
`structured-output.complete` event with `{ object, raw }`.

- Always-finalize on upstream close so truncated streams never hang
  consumers
- Typed `RUN_ERROR` paths: `empty-response`, `parse-error`, `aborted`,
  plus mid-stream provider errors (terminal — no `RUN_FINISHED` after)
- `transformNullsToUndefined` applied on parse for parity with the
  non-streaming `structuredOutput`
- E2E feature-support matrix: openai/grok/groq join openrouter for
  `structured-output-stream`; the existing parameterized spec now runs
  against all four
- ts-react-chat example: `api.structured-output.ts` and the matching
  page gain a provider selector (openai/grok/groq/openrouter) and a
  Stream toggle that consumes SSE, renders deltas live, and snaps to
  the parsed object on the terminal CUSTOM event

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../streaming-structured-output-grok.md       |   5 +
 .../streaming-structured-output-groq.md       |   5 +
 .../streaming-structured-output-openai.md     |   5 +
 .../src/routes/api.structured-output.ts       |  49 ++-
 .../routes/generations.structured-output.tsx  | 252 +++++++++++--
 .../typescript/ai-grok/src/adapters/text.ts   | 258 +++++++++++++
 .../ai-grok/tests/grok-adapter.test.ts        | 321 +++++++++++++++++
 .../typescript/ai-groq/src/adapters/text.ts   | 261 ++++++++++++++
 .../ai-groq/tests/groq-adapter.test.ts        | 338 ++++++++++++++++++
 .../typescript/ai-openai/src/adapters/text.ts | 288 +++++++++++++++
 .../ai-openai/tests/openai-adapter.test.ts    | 325 +++++++++++++++++
 testing/e2e/src/lib/feature-support.ts        |   7 +-
 12 files changed, 2069 insertions(+), 45 deletions(-)
 create mode 100644 .changeset/streaming-structured-output-grok.md
 create mode 100644 .changeset/streaming-structured-output-groq.md
 create mode 100644 .changeset/streaming-structured-output-openai.md

diff --git a/.changeset/streaming-structured-output-grok.md b/.changeset/streaming-structured-output-grok.md
new file mode 100644
index 000000000..48fd94c12
--- /dev/null
+++ b/.changeset/streaming-structured-output-grok.md
@@ -0,0 +1,5 @@
+---
+'@tanstack/ai-grok': minor
+---
+
+feat: native streaming structured output. `GrokTextAdapter.structuredOutputStream()` issues a single Chat Completions request with `stream: true` + `response_format: { type: 'json_schema', json_schema: { name, schema, strict: true } }`, surfacing JSON deltas as `TEXT_MESSAGE_CONTENT` chunks and a final `CUSTOM` `structured-output.complete` event with the parsed object — replacing the previous two-request (streamed text → non-streamed JSON) flow when used with `chat({ outputSchema, stream: true })`.
diff --git a/.changeset/streaming-structured-output-groq.md b/.changeset/streaming-structured-output-groq.md
new file mode 100644
index 000000000..7016872ec
--- /dev/null
+++ b/.changeset/streaming-structured-output-groq.md
@@ -0,0 +1,5 @@
+---
+'@tanstack/ai-groq': minor
+---
+
+feat: native streaming structured output. `GroqTextAdapter.structuredOutputStream()` issues a single Chat Completions request with `stream: true` + `response_format: { type: 'json_schema', json_schema: { name, schema, strict: true } }`, surfacing JSON deltas as `TEXT_MESSAGE_CONTENT` chunks and a final `CUSTOM` `structured-output.complete` event with the parsed object — replacing the previous two-request (streamed text → non-streamed JSON) flow when used with `chat({ outputSchema, stream: true })`.
diff --git a/.changeset/streaming-structured-output-openai.md b/.changeset/streaming-structured-output-openai.md
new file mode 100644
index 000000000..666e24b49
--- /dev/null
+++ b/.changeset/streaming-structured-output-openai.md
@@ -0,0 +1,5 @@
+---
+'@tanstack/ai-openai': minor
+---
+
+feat: native streaming structured output. `OpenAITextAdapter.structuredOutputStream()` issues a single Responses API request with `stream: true` + `text.format: { type: 'json_schema', strict: true }`, surfacing JSON deltas as `TEXT_MESSAGE_CONTENT` chunks and a final `CUSTOM` `structured-output.complete` event with the parsed object — replacing the previous two-request (streamed text → non-streamed JSON) flow when used with `chat({ outputSchema, stream: true })`.
diff --git a/examples/ts-react-chat/src/routes/api.structured-output.ts b/examples/ts-react-chat/src/routes/api.structured-output.ts
index aa1d045f2..3af52568d 100644
--- a/examples/ts-react-chat/src/routes/api.structured-output.ts
+++ b/examples/ts-react-chat/src/routes/api.structured-output.ts
@@ -1,7 +1,11 @@
 import { createFileRoute } from '@tanstack/react-router'
-import { chat } from '@tanstack/ai'
+import { chat, toServerSentEventsResponse } from '@tanstack/ai'
+import { openaiText } from '@tanstack/ai-openai'
+import { grokText } from '@tanstack/ai-grok'
+import { groqText } from '@tanstack/ai-groq'
 import { openRouterText } from '@tanstack/ai-openrouter'
 import { z } from 'zod'
+import type { AnyTextAdapter, StreamChunk } from '@tanstack/ai'
 
 const GuitarRecommendationSchema = z.object({
   title: z.string().describe('Short headline for the recommendation'),
@@ -21,21 +25,68 @@ const GuitarRecommendationSchema = z.object({
   nextSteps: z.array(z.string()).describe('Practical follow-up actions'),
 })
 
+type Provider = 'openai' | 'grok' | 'groq' | 'openrouter'
+
+/**
+ * Build the text adapter for the requested provider, falling back to that
+ * provider's default model when `model` is empty or omitted.
+ *
+ * @throws Error when `provider` is not one of the supported values.
+ */
+function adapterFor(provider: Provider, model?: string): AnyTextAdapter {
+  switch (provider) {
+    case 'openai':
+      return openaiText((model || 'gpt-4o') as 'gpt-4o')
+    case 'grok':
+      return grokText((model || 'grok-3') as 'grok-3')
+    case 'groq':
+      return groqText(
+        (model || 'llama-3.3-70b-versatile') as 'llama-3.3-70b-versatile',
+      )
+    case 'openrouter':
+      return openRouterText((model || 'openai/gpt-5.2') as 'openai/gpt-5.2')
+    default: {
+      // `provider` arrives from an unvalidated JSON body, so the static
+      // union does not hold at runtime; fail loudly on anything else.
+      const unsupported: never = provider
+      throw new Error(`Unsupported provider: ${String(unsupported)}`)
+    }
+  }
+}
+
 export const Route = createFileRoute('/api/structured-output')({
   server: {
     handlers: {
       POST: async ({ request }) => {
         const body = await request.json()
-        const { prompt, model } = body as {
+        const { prompt, provider, model, stream } = body as {
           prompt: string
+          provider?: Provider
           model?: string
+          stream?: boolean
         }
+        const resolvedProvider: Provider = provider || 'openrouter'
 
         try {
+          if (stream) {
+            const abortController = new AbortController()
+            request.signal.addEventListener('abort', () =>
+              abortController.abort(),
+            )
+            const streamIterable = chat({
+              adapter: adapterFor(resolvedProvider, model),
+              messages: [{ role: 'user', content: prompt }],
+              outputSchema: GuitarRecommendationSchema,
+              stream: true,
+              abortController,
+            }) as AsyncIterable<StreamChunk>
+            return toServerSentEventsResponse(streamIterable, {
+              abortController,
+            })
+          }
+
           const result = await chat({
-            adapter: openRouterText(
-              (model || 'openai/gpt-5.2') as 'openai/gpt-5.2',
-            ),
+            adapter: adapterFor(resolvedProvider, model),
             messages: [{ role: 'user', content: prompt }],
             outputSchema: GuitarRecommendationSchema,
           })
diff --git a/examples/ts-react-chat/src/routes/generations.structured-output.tsx b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
index 9b123308f..e247a08a2 100644
--- a/examples/ts-react-chat/src/routes/generations.structured-output.tsx
+++ b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
@@ -1,18 +1,34 @@
-import { useState } from 'react'
+import { useRef, useState } from 'react'
 import { createFileRoute } from '@tanstack/react-router'
 
 const SAMPLE_PROMPT =
   'I play indie rock and have a $1500 budget. Recommend two electric guitars and one acoustic to round out my rig.'
 
-const OPENROUTER_MODELS = [
-  { value: 'openai/gpt-5.2', label: 'OpenAI GPT-5.2' },
-  { value: 'openai/gpt-5.2-pro', label: 'OpenAI GPT-5.2 Pro' },
-  { value: 'openai/gpt-5.1', label: 'OpenAI GPT-5.1' },
-  { value: 'anthropic/claude-opus-4.7', label: 'Claude Opus 4.7' },
-  { value: 'anthropic/claude-sonnet-4.6', label: 'Claude Sonnet 4.6' },
-  { value: 'google/gemini-3.1-pro-preview', label: 'Gemini 3.1 Pro (Preview)' },
-  { value: 'x-ai/grok-4.1-fast', label: 'Grok 4.1 Fast' },
-] as const
+type Provider = 'openai' | 'grok' | 'groq' | 'openrouter'
+
+const PROVIDER_MODELS: Record<
+  Provider,
+  Array<{ value: string; label: string }>
+> = {
+  openai: [
+    { value: 'gpt-4o', label: 'gpt-4o' },
+    { value: 'gpt-4o-mini', label: 'gpt-4o-mini' },
+  ],
+  grok: [
+    { value: 'grok-3', label: 'grok-3' },
+    { value: 'grok-4-0709', label: 'grok-4-0709' },
+  ],
+  groq: [
+    { value: 'llama-3.3-70b-versatile', label: 'llama-3.3-70b-versatile' },
+    { value: 'llama-3.1-8b-instant', label: 'llama-3.1-8b-instant' },
+  ],
+  openrouter: [
+    { value: 'openai/gpt-5.2', label: 'OpenRouter / GPT-5.2' },
+    { value: 'openai/gpt-5.1', label: 'OpenRouter / GPT-5.1' },
+    { value: 'anthropic/claude-sonnet-4.6', label: 'OpenRouter / Sonnet 4.6' },
+    { value: 'x-ai/grok-4.1-fast', label: 'OpenRouter / Grok 4.1 Fast' },
+  ],
+}
 
 interface RecommendationResult {
   title: string
@@ -27,69 +43,192 @@ interface RecommendationResult {
   nextSteps: Array<string>
 }
 
+interface StreamChunk {
+  type: string
+  delta?: string
+  content?: string
+  name?: string
+  value?: { object?: unknown; raw?: string; reasoning?: string }
+  message?: string
+}
+
 function StructuredOutputPage() {
   const [prompt, setPrompt] = useState(SAMPLE_PROMPT)
-  const [model, setModel] = useState<string>(OPENROUTER_MODELS[0].value)
+  const [provider, setProvider] = useState<Provider>('openrouter')
+  const [model, setModel] = useState<string>(PROVIDER_MODELS.openrouter[0].value)
+  const [stream, setStream] = useState(true)
   const [result, setResult] = useState<RecommendationResult | null>(null)
+  const [streamingText, setStreamingText] = useState<string>('')
+  const [deltaCount, setDeltaCount] = useState(0)
   const [error, setError] = useState<string | null>(null)
   const [isLoading, setIsLoading] = useState(false)
+  const abortRef = useRef<AbortController | null>(null)
+
+  const onProviderChange = (next: Provider) => {
+    setProvider(next)
+    setModel(PROVIDER_MODELS[next][0].value)
+  }
 
   const handleGenerate = async () => {
     if (!prompt.trim()) return
     setIsLoading(true)
     setError(null)
     setResult(null)
+    setStreamingText('')
+    setDeltaCount(0)
+
+    const controller = new AbortController()
+    abortRef.current = controller
 
     try {
       const response = await fetch('/api/structured-output', {
         method: 'POST',
         headers: { 'Content-Type': 'application/json' },
-        body: JSON.stringify({ prompt: prompt.trim(), model }),
+        body: JSON.stringify({
+          prompt: prompt.trim(),
+          provider,
+          model,
+          stream,
+        }),
+        signal: controller.signal,
       })
-      const payload = await response.json()
+
       if (!response.ok) {
-        throw new Error(payload.error || 'Request failed')
+        const errPayload = await response.json().catch(() => ({}))
+        throw new Error(errPayload.error || `Request failed (${response.status})`)
+      }
+
+      if (!stream) {
+        const payload = await response.json()
+        setResult(payload.data as RecommendationResult)
+        return
+      }
+
+      // Streaming path: parse SSE, accumulate text deltas live, and capture
+      // the terminal `structured-output.complete` CUSTOM event.
+      const reader = response.body!.getReader()
+      const decoder = new TextDecoder()
+      let buffer = ''
+      let accumulated = ''
+      let deltas = 0
+
+      while (true) {
+        const { done, value } = await reader.read()
+        if (done) break
+        buffer += decoder.decode(value, { stream: true })
+
+        // SSE frames are separated by "\n\n"
+        let sepIdx = buffer.indexOf('\n\n')
+        while (sepIdx !== -1) {
+          const frame = buffer.slice(0, sepIdx)
+          buffer = buffer.slice(sepIdx + 2)
+          sepIdx = buffer.indexOf('\n\n')
+
+          for (const line of frame.split('\n')) {
+            if (!line.startsWith('data: ')) continue
+            const json = line.slice(6).trim()
+            if (!json) continue
+            let chunk: StreamChunk
+            try {
+              chunk = JSON.parse(json) as StreamChunk
+            } catch {
+              continue
+            }
+
+            if (chunk.type === 'TEXT_MESSAGE_CONTENT' && chunk.delta) {
+              accumulated += chunk.delta
+              deltas += 1
+              setStreamingText(accumulated)
+              setDeltaCount(deltas)
+            } else if (
+              chunk.type === 'CUSTOM' &&
+              chunk.name === 'structured-output.complete' &&
+              chunk.value?.object
+            ) {
+              setResult(chunk.value.object as RecommendationResult)
+            } else if (chunk.type === 'RUN_ERROR') {
+              throw new Error(chunk.message || 'Stream failed')
+            }
+          }
+        }
       }
-      setResult(payload.data as RecommendationResult)
     } catch (err) {
-      setError(err instanceof Error ? err.message : 'Unknown error')
+      if (err instanceof Error && err.name === 'AbortError') {
+        setError('Aborted')
+      } else {
+        setError(err instanceof Error ? err.message : 'Unknown error')
+      }
     } finally {
       setIsLoading(false)
+      abortRef.current = null
     }
   }
 
+  const handleAbort = () => abortRef.current?.abort()
+
   return (
     <div className="flex flex-col h-[calc(100vh-72px)] bg-gray-900 text-white">
       <div className="border-b border-orange-500/20 bg-gray-800 px-6 py-4">
-        <h2 className="text-xl font-semibold">
-          Structured Output (OpenRouter)
-        </h2>
+        <h2 className="text-xl font-semibold">Structured Output</h2>
         <p className="text-sm text-gray-400 mt-1">
           Calls <code className="text-orange-400">chat()</code> with an{' '}
-          <code className="text-orange-400">outputSchema</code> via the{' '}
-          <code className="text-orange-400">openRouterText</code> adapter and
-          parses the JSON result.
+          <code className="text-orange-400">outputSchema</code>. Toggle{' '}
+          <code className="text-orange-400">stream</code> to exercise{' '}
+          <code className="text-orange-400">structuredOutputStream</code> on the
+          selected provider; deltas render live while the final{' '}
+          <code className="text-orange-400">structured-output.complete</code>{' '}
+          event populates the parsed result.
         </p>
       </div>
 
       <div className="flex-1 overflow-y-auto p-6">
         <div className="max-w-2xl mx-auto space-y-6">
-          <div className="space-y-3">
-            <label className="text-sm text-gray-400">OpenRouter Model</label>
-            <select
-              value={model}
-              onChange={(e) => setModel(e.target.value)}
-              disabled={isLoading}
-              className="w-full rounded-lg border border-orange-500/20 bg-gray-800/50 px-3 py-2 text-sm text-white focus:outline-none focus:ring-2 focus:ring-orange-500/50 disabled:opacity-50"
-            >
-              {OPENROUTER_MODELS.map((opt) => (
-                <option key={opt.value} value={opt.value}>
-                  {opt.label}
-                </option>
-              ))}
-            </select>
+          <div className="grid grid-cols-2 gap-3">
+            <div className="space-y-2">
+              <label className="text-sm text-gray-400">Provider</label>
+              <select
+                value={provider}
+                onChange={(e) => onProviderChange(e.target.value as Provider)}
+                disabled={isLoading}
+                className="w-full rounded-lg border border-orange-500/20 bg-gray-800/50 px-3 py-2 text-sm text-white focus:outline-none focus:ring-2 focus:ring-orange-500/50 disabled:opacity-50"
+              >
+                <option value="openai">OpenAI</option>
+                <option value="grok">Grok (xAI)</option>
+                <option value="groq">Groq</option>
+                <option value="openrouter">OpenRouter</option>
+              </select>
+            </div>
+            <div className="space-y-2">
+              <label className="text-sm text-gray-400">Model</label>
+              <select
+                value={model}
+                onChange={(e) => setModel(e.target.value)}
+                disabled={isLoading}
+                className="w-full rounded-lg border border-orange-500/20 bg-gray-800/50 px-3 py-2 text-sm text-white focus:outline-none focus:ring-2 focus:ring-orange-500/50 disabled:opacity-50"
+              >
+                {PROVIDER_MODELS[provider].map((opt) => (
+                  <option key={opt.value} value={opt.value}>
+                    {opt.label}
+                  </option>
+                ))}
+              </select>
+            </div>
           </div>
 
+          <label className="flex items-center gap-2 text-sm text-gray-300">
+            <input
+              type="checkbox"
+              checked={stream}
+              onChange={(e) => setStream(e.target.checked)}
+              disabled={isLoading}
+              className="accent-orange-500"
+            />
+            Stream (single-request{' '}
+            <code className="text-orange-400">stream: true</code> +{' '}
+            <code className="text-orange-400">response_format: json_schema</code>
+            )
+          </label>
+
           <div className="space-y-3">
             <label className="text-sm text-gray-400">Prompt</label>
             <textarea
@@ -108,11 +247,27 @@ function StructuredOutputPage() {
               disabled={!prompt.trim() || isLoading}
               className="px-6 py-2 bg-orange-600 hover:bg-orange-700 disabled:bg-gray-700 disabled:text-gray-500 text-white rounded-lg text-sm font-medium transition-colors"
             >
-              {isLoading ? 'Generating...' : 'Generate Structured Output'}
+              {isLoading
+                ? stream
+                  ? 'Streaming...'
+                  : 'Generating...'
+                : 'Generate'}
             </button>
-            {result && (
+            {isLoading && stream && (
               <button
-                onClick={() => setResult(null)}
+                onClick={handleAbort}
+                className="px-6 py-2 bg-red-600 hover:bg-red-700 text-white rounded-lg text-sm font-medium transition-colors"
+              >
+                Abort
+              </button>
+            )}
+            {(result || streamingText) && !isLoading && (
+              <button
+                onClick={() => {
+                  setResult(null)
+                  setStreamingText('')
+                  setDeltaCount(0)
+                }}
                 className="px-6 py-2 bg-gray-700 hover:bg-gray-600 text-white rounded-lg text-sm font-medium transition-colors"
               >
                 Clear
@@ -126,8 +281,27 @@ function StructuredOutputPage() {
             </div>
           )}
 
+          {streamingText && !result && (
+            <div className="p-4 bg-gray-800/30 border border-gray-700/50 rounded-lg">
+              <div className="flex items-center justify-between mb-2">
+                <p className="text-xs text-gray-400 uppercase tracking-wider">
+                  Streaming JSON
+                </p>
+                <p className="text-xs text-orange-400">{deltaCount} deltas</p>
+              </div>
+              <pre className="text-xs text-gray-300 whitespace-pre-wrap break-words">
+                {streamingText}
+              </pre>
+            </div>
+          )}
+
           {result && (
             <div className="space-y-4">
+              {stream && deltaCount > 0 && (
+                <p className="text-xs text-gray-500">
+                  Reassembled from {deltaCount} streamed deltas.
+                </p>
+              )}
               <div className="p-4 bg-gray-800/50 border border-gray-700 rounded-lg">
                 <h3 className="text-lg font-semibold text-white">
                   {result.title}
diff --git a/packages/typescript/ai-grok/src/adapters/text.ts b/packages/typescript/ai-grok/src/adapters/text.ts
index e185c5ecf..c7fdc8287 100644
--- a/packages/typescript/ai-grok/src/adapters/text.ts
+++ b/packages/typescript/ai-grok/src/adapters/text.ts
@@ -1,3 +1,4 @@
+import { APIUserAbortError } from 'openai'
 import { BaseTextAdapter } from '@tanstack/ai/adapters'
 import { validateTextProviderOptions } from '../text/text-provider-options'
 import { convertToolsToProviderFormat } from '../tools'
@@ -223,6 +224,289 @@ export class GrokTextAdapter<
     }
   }
 
+  /**
+   * Stream structured output via a single Chat Completions request with
+   * `stream: true` + `response_format: json_schema`. Emits raw JSON deltas as
+   * `TEXT_MESSAGE_CONTENT` chunks and a terminal `CUSTOM`
+   * `structured-output.complete` event with `{ object, raw }`.
+   *
+   * Every run opens with `RUN_STARTED` and ends with exactly one terminal
+   * event: `RUN_FINISHED` after a successful parse, or `RUN_ERROR` with code
+   * `empty-response`, `parse-error`, `aborted`, or the upstream error code.
+   * Errors raised while issuing or consuming the request are reported
+   * in-band as `RUN_ERROR` chunks rather than thrown.
+   *
+   * @param options - `chatOptions` for the request (any tools are stripped)
+   *   plus the JSON `outputSchema` the response must conform to.
+   * @returns An async iterable of stream chunks for this run.
+   */
+  async *structuredOutputStream(
+    options: StructuredOutputOptions<GrokTextProviderOptions>,
+  ): AsyncIterable<StreamChunk> {
+    const { chatOptions, outputSchema } = options
+    const { logger } = chatOptions
+    const timestamp = Date.now()
+    const aguiState = {
+      runId: chatOptions.runId ?? generateId(this.name),
+      threadId: chatOptions.threadId ?? generateId(this.name),
+      messageId: generateId(this.name),
+      timestamp,
+      hasEmittedRunStarted: false,
+      hasEmittedTextMessageStart: false,
+      hasEmittedTextMessageEnd: false,
+      hasFinalizedChoice: false,
+      deferredUsage: undefined as
+        | { promptTokens: number; completionTokens: number; totalTokens: number }
+        | undefined,
+      computedFinishReason: undefined as string | undefined,
+    }
+
+    const strictSchema = makeGrokStructuredOutputCompatible(
+      outputSchema,
+      outputSchema.required || [],
+    )
+
+    let accumulatedContent = ''
+    let currentModel = chatOptions.model
+
+    try {
+      // Strip tools — structured-output mode shouldn't mix tool calls into the
+      // request body. Matches the non-streaming `structuredOutput` behavior.
+      const { tools: _tools, ...baseParams } =
+        this.mapTextOptionsToGrok(chatOptions)
+      logger.request(
+        `activity=structured-stream provider=grok model=${this.model} messages=${chatOptions.messages.length} stream=true`,
+        { provider: 'grok', model: this.model },
+      )
+      const stream = await this.client.chat.completions.create(
+        {
+          ...baseParams,
+          stream: true,
+          response_format: {
+            type: 'json_schema',
+            json_schema: {
+              name: 'structured_output',
+              schema: strictSchema,
+              strict: true,
+            },
+          },
+        },
+        { signal: chatOptions.request?.signal },
+      )
+
+      for await (const chunk of stream) {
+        logger.provider(`provider=grok`, { chunk })
+        if (chunk.model) currentModel = chunk.model
+
+        if (!aguiState.hasEmittedRunStarted) {
+          aguiState.hasEmittedRunStarted = true
+          yield asChunk({
+            type: 'RUN_STARTED',
+            runId: aguiState.runId,
+            threadId: aguiState.threadId,
+            model: currentModel || chatOptions.model,
+            timestamp,
+          })
+        }
+
+        // Capture usage before the choice guard: OpenAI-compatible streams
+        // may report usage on a trailing chunk whose `choices` array is empty.
+        if (chunk.usage) {
+          aguiState.deferredUsage = {
+            promptTokens: chunk.usage.prompt_tokens || 0,
+            completionTokens: chunk.usage.completion_tokens || 0,
+            totalTokens: chunk.usage.total_tokens || 0,
+          }
+        }
+
+        const choice = chunk.choices[0]
+        if (!choice) continue
+
+        const deltaContent = choice.delta.content
+        if (deltaContent) {
+          if (!aguiState.hasEmittedTextMessageStart) {
+            aguiState.hasEmittedTextMessageStart = true
+            yield asChunk({
+              type: 'TEXT_MESSAGE_START',
+              messageId: aguiState.messageId,
+              model: currentModel || chatOptions.model,
+              timestamp,
+              role: 'assistant',
+            })
+          }
+
+          accumulatedContent += deltaContent
+
+          yield asChunk({
+            type: 'TEXT_MESSAGE_CONTENT',
+            messageId: aguiState.messageId,
+            model: currentModel || chatOptions.model,
+            timestamp,
+            delta: deltaContent,
+            content: accumulatedContent,
+          })
+        }
+
+        if (choice.finish_reason && !aguiState.hasFinalizedChoice) {
+          aguiState.hasFinalizedChoice = true
+          aguiState.computedFinishReason =
+            choice.finish_reason === 'length' ? 'length' : 'stop'
+
+          if (
+            aguiState.hasEmittedTextMessageStart &&
+            !aguiState.hasEmittedTextMessageEnd
+          ) {
+            aguiState.hasEmittedTextMessageEnd = true
+            yield asChunk({
+              type: 'TEXT_MESSAGE_END',
+              messageId: aguiState.messageId,
+              model: currentModel || chatOptions.model,
+              timestamp,
+            })
+          }
+        }
+      }
+
+      // Finalize the run unconditionally. If the upstream stream closed
+      // without a finishReason, we never emitted TEXT_MESSAGE_END or computed
+      // a finish reason — we still owe consumers a CUSTOM + RUN_FINISHED (or
+      // RUN_ERROR), never silence.
+      const resolvedModel = currentModel || chatOptions.model
+
+      // A stream that closed without yielding any chunk never reached the
+      // in-loop RUN_STARTED; emit it now so the terminal event below is
+      // always preceded by RUN_STARTED, as in the catch path.
+      if (!aguiState.hasEmittedRunStarted) {
+        aguiState.hasEmittedRunStarted = true
+        yield asChunk({
+          type: 'RUN_STARTED',
+          runId: aguiState.runId,
+          threadId: aguiState.threadId,
+          model: resolvedModel,
+          timestamp,
+        })
+      }
+
+      if (
+        aguiState.hasEmittedTextMessageStart &&
+        !aguiState.hasEmittedTextMessageEnd
+      ) {
+        aguiState.hasEmittedTextMessageEnd = true
+        yield asChunk({
+          type: 'TEXT_MESSAGE_END',
+          messageId: aguiState.messageId,
+          model: resolvedModel,
+          timestamp,
+        })
+      }
+
+      if (!accumulatedContent) {
+        const message = 'Structured output response contained no content'
+        logger.errors(message, {
+          source: 'grok.structuredOutputStream',
+        })
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId: aguiState.runId,
+          model: resolvedModel,
+          timestamp,
+          message,
+          code: 'empty-response',
+          error: { message, code: 'empty-response' },
+        })
+        return
+      }
+
+      let parsed: unknown
+      try {
+        parsed = JSON.parse(accumulatedContent)
+      } catch (parseError) {
+        const message =
+          parseError instanceof SyntaxError
+            ? `Failed to parse structured output as JSON: ${parseError.message}`
+            : 'Failed to parse structured output as JSON'
+        logger.errors(message, {
+          source: 'grok.structuredOutputStream',
+          error: parseError,
+        })
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId: aguiState.runId,
+          model: resolvedModel,
+          timestamp,
+          message,
+          code: 'parse-error',
+          error: { message, code: 'parse-error' },
+        })
+        return
+      }
+
+      const transformed = transformNullsToUndefined(parsed)
+
+      yield asChunk({
+        type: 'CUSTOM',
+        name: 'structured-output.complete',
+        value: {
+          object: transformed,
+          raw: accumulatedContent,
+        },
+        model: resolvedModel,
+        timestamp,
+      })
+
+      yield asChunk({
+        type: 'RUN_FINISHED',
+        runId: aguiState.runId,
+        threadId: aguiState.threadId,
+        model: resolvedModel,
+        timestamp,
+        usage: aguiState.deferredUsage,
+        finishReason: aguiState.computedFinishReason ?? 'stop',
+      })
+    } catch (error) {
+      logger.errors('grok.structuredOutputStream fatal', {
+        error,
+        source: 'grok.structuredOutputStream',
+      })
+      // Report the upstream-resolved model when chunks were already seen so
+      // error events agree with the RUN_STARTED emitted inside the loop.
+      const errorModel = currentModel || chatOptions.model
+      if (!aguiState.hasEmittedRunStarted) {
+        aguiState.hasEmittedRunStarted = true
+        yield asChunk({
+          type: 'RUN_STARTED',
+          runId: aguiState.runId,
+          threadId: aguiState.threadId,
+          model: errorModel,
+          timestamp,
+        })
+      }
+
+      if (error instanceof APIUserAbortError) {
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId: aguiState.runId,
+          model: errorModel,
+          timestamp,
+          message: 'Request aborted',
+          code: 'aborted',
+          error: { message: 'Request aborted', code: 'aborted' },
+        })
+        return
+      }
+
+      const err = error as Error & { code?: string }
+      yield asChunk({
+        type: 'RUN_ERROR',
+        runId: aguiState.runId,
+        model: errorModel,
+        timestamp,
+        message: err.message || 'Unknown error',
+        code: err.code,
+        error: { message: err.message || 'Unknown error', code: err.code },
+      })
+    }
+  }
+
   private async *processGrokStreamChunks(
     stream: AsyncIterable<OpenAI_SDK.Chat.Completions.ChatCompletionChunk>,
     options: TextOptions,
diff --git a/packages/typescript/ai-grok/tests/grok-adapter.test.ts b/packages/typescript/ai-grok/tests/grok-adapter.test.ts
index f992cfadb..5d2d6a933 100644
--- a/packages/typescript/ai-grok/tests/grok-adapter.test.ts
+++ b/packages/typescript/ai-grok/tests/grok-adapter.test.ts
@@ -13,6 +13,12 @@ let mockCreate: ReturnType<typeof vi.fn>
 
 // Mock the OpenAI SDK
 vi.mock('openai', () => {
+  class APIUserAbortError extends Error {
+    constructor() {
+      super('Request aborted')
+      this.name = 'APIUserAbortError'
+    }
+  }
   return {
     default: class {
       chat = {
@@ -21,6 +27,7 @@ vi.mock('openai', () => {
         },
       }
     },
+    APIUserAbortError,
   }
 })
 
@@ -616,3 +623,317 @@ describe('Grok AG-UI event emission', () => {
     }
   })
 })
+
+describe('Grok structuredOutputStream', () => {
+  beforeEach(() => {
+    vi.clearAllMocks()
+  })
+
+  const createAdapter = () => createGrokText('grok-3', 'test-api-key')
+
+  it('issues a single streaming request with response_format json_schema and emits parsed object', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-stream-1',
+        model: 'grok-3',
+        choices: [{ delta: { content: '{"name":"Ali' }, finish_reason: null }],
+      },
+      {
+        id: 'chatcmpl-stream-1',
+        model: 'grok-3',
+        choices: [
+          { delta: { content: 'ce","age":30}' }, finish_reason: 'stop' },
+        ],
+        usage: {
+          prompt_tokens: 5,
+          completion_tokens: 9,
+          total_tokens: 14,
+        },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const outputSchema = {
+      type: 'object',
+      properties: {
+        name: { type: 'string' },
+        age: { type: 'number' },
+      },
+      required: ['name', 'age'],
+    }
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'grok-3',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema,
+    })) {
+      chunks.push(chunk)
+    }
+
+    expect(mockCreate).toHaveBeenCalledTimes(1)
+    const [params] = mockCreate.mock.calls[0]! as Array<any>
+    expect(params.stream).toBe(true)
+    expect(params.response_format).toEqual({
+      type: 'json_schema',
+      json_schema: {
+        name: 'structured_output',
+        schema: expect.objectContaining({
+          type: 'object',
+          additionalProperties: false,
+        }),
+        strict: true,
+      },
+    })
+    expect(params.tools).toBeUndefined()
+
+    const types: Array<string> = chunks.map((c) => c.type)
+    const idx = (t: string) => types.indexOf(t)
+    expect(idx('RUN_STARTED')).toBeGreaterThanOrEqual(0)
+    expect(idx('TEXT_MESSAGE_START')).toBeGreaterThan(idx('RUN_STARTED'))
+    expect(idx('TEXT_MESSAGE_CONTENT')).toBeGreaterThan(
+      idx('TEXT_MESSAGE_START'),
+    )
+    expect(idx('TEXT_MESSAGE_END')).toBeGreaterThan(idx('TEXT_MESSAGE_CONTENT'))
+    expect(idx('CUSTOM')).toBeGreaterThan(idx('TEXT_MESSAGE_END'))
+    expect(idx('RUN_FINISHED')).toBeGreaterThan(idx('CUSTOM'))
+
+    const contentChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'TEXT_MESSAGE_CONTENT' }> =>
+        c.type === 'TEXT_MESSAGE_CONTENT',
+    )
+    expect(contentChunks).toHaveLength(2)
+    expect(contentChunks[0]!.delta).toBe('{"name":"Ali')
+    expect(contentChunks[1]!.delta).toBe('ce","age":30}')
+
+    const customChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]!.name).toBe('structured-output.complete')
+    expect(customChunks[0]!.value).toEqual({
+      object: { name: 'Alice', age: 30 },
+      raw: '{"name":"Alice","age":30}',
+    })
+  })
+
+  it('emits RUN_ERROR when accumulated content is not valid JSON', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-bad',
+        model: 'grok-3',
+        choices: [{ delta: { content: 'not json' }, finish_reason: 'stop' }],
+        usage: { prompt_tokens: 1, completion_tokens: 1, total_tokens: 2 },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'grok-3',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const errorChunks = chunks.filter((c) => c.type === 'RUN_ERROR')
+    expect(errorChunks).toHaveLength(1)
+    expect(errorChunks[0]).toMatchObject({
+      type: 'RUN_ERROR',
+      code: 'parse-error',
+    })
+    expect(chunks.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
+  })
+
+  it('emits empty-response RUN_ERROR when no content is streamed', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-empty',
+        model: 'grok-3',
+        choices: [{ delta: { content: '' }, finish_reason: 'stop' }],
+        usage: { prompt_tokens: 1, completion_tokens: 0, total_tokens: 1 },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'grok-3',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const errorChunks = chunks.filter((c) => c.type === 'RUN_ERROR')
+    expect(errorChunks).toHaveLength(1)
+    expect(errorChunks[0]).toMatchObject({
+      type: 'RUN_ERROR',
+      code: 'empty-response',
+    })
+    expect(chunks.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
+  })
+
+  it('finalizes the run when upstream stream closes without finish_reason', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-trunc',
+        model: 'grok-3',
+        choices: [
+          { delta: { content: '{"name":"Alice"}' }, finish_reason: null },
+        ],
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'grok-3',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const customChunks = chunks.filter((c) => c.type === 'CUSTOM')
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]).toMatchObject({
+      name: 'structured-output.complete',
+      value: { object: { name: 'Alice' }, raw: '{"name":"Alice"}' },
+    })
+    expect(chunks.filter((c) => c.type === 'RUN_FINISHED')).toHaveLength(1)
+    expect(chunks.filter((c) => c.type === 'RUN_ERROR')).toHaveLength(0)
+  })
+
+  it('terminates on iterator-thrown provider error without emitting RUN_FINISHED', async () => {
+    mockCreate = vi.fn().mockImplementation(() => {
+      const chunks = [
+        {
+          id: 'chatcmpl-err',
+          model: 'grok-3',
+          choices: [
+            { delta: { content: '{"name":"Al' }, finish_reason: null },
+          ],
+        },
+      ] as Array<unknown>
+      return Promise.resolve({
+        [Symbol.asyncIterator]() {
+          let i = 0
+          return {
+            // eslint-disable-next-line @typescript-eslint/require-await
+            async next() {
+              if (i < chunks.length) return { value: chunks[i++], done: false }
+              throw Object.assign(new Error('Upstream rate limit'), {
+                code: '429',
+              })
+            },
+          }
+        },
+      })
+    })
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'grok-3',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const errorChunks = chunks.filter((c) => c.type === 'RUN_ERROR')
+    expect(errorChunks).toHaveLength(1)
+    expect(chunks.filter((c) => c.type === 'RUN_FINISHED')).toHaveLength(0)
+    expect(chunks.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
+  })
+
+  it('transforms null values to undefined on the parsed object', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-null',
+        model: 'grok-3',
+        choices: [
+          {
+            delta: { content: '{"name":"Alice","nickname":null}' },
+            finish_reason: 'stop',
+          },
+        ],
+        usage: { prompt_tokens: 5, completion_tokens: 9, total_tokens: 14 },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'grok-3',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: {
+          name: { type: 'string' },
+          nickname: { type: ['string', 'null'] },
+        },
+        required: ['name', 'nickname'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const customChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    const value = customChunks[0]!.value as { object: Record<string, unknown> }
+    expect(value.object.name).toBe('Alice')
+    expect(value.object.nickname).toBeUndefined()
+    expect((customChunks[0]!.value as { raw: string }).raw).toBe(
+      '{"name":"Alice","nickname":null}',
+    )
+  })
+})
diff --git a/packages/typescript/ai-groq/src/adapters/text.ts b/packages/typescript/ai-groq/src/adapters/text.ts
index 34f44ba81..44bed44b7 100644
--- a/packages/typescript/ai-groq/src/adapters/text.ts
+++ b/packages/typescript/ai-groq/src/adapters/text.ts
@@ -1,3 +1,4 @@
+import { APIUserAbortError } from 'groq-sdk'
 import { BaseTextAdapter } from '@tanstack/ai/adapters'
 import { validateTextProviderOptions } from '../text/text-provider-options'
 import { convertToolsToProviderFormat } from '../tools'
@@ -220,6 +221,266 @@ export class GroqTextAdapter<
     }
   }
 
+  /**
+   * Stream structured output via one Chat Completions request (`stream: true`
+   * + `response_format: json_schema`). Yields raw JSON deltas as
+   * `TEXT_MESSAGE_CONTENT`, then a `CUSTOM` `structured-output.complete` event
+   * (`{ object, raw }`) and `RUN_FINISHED`; failures yield `RUN_ERROR` instead.
+   */
+  async *structuredOutputStream(
+    options: StructuredOutputOptions<GroqTextProviderOptions>,
+  ): AsyncIterable<StreamChunk> {
+    const { chatOptions, outputSchema } = options
+    const { logger } = chatOptions
+    const timestamp = Date.now()
+    const aguiState = {
+      runId: chatOptions.runId ?? generateId(this.name),
+      threadId: chatOptions.threadId ?? generateId(this.name),
+      messageId: generateId(this.name),
+      timestamp,
+      hasEmittedRunStarted: false,
+      hasEmittedTextMessageStart: false,
+      hasEmittedTextMessageEnd: false,
+      hasFinalizedChoice: false,
+      deferredUsage: undefined as
+        | { promptTokens: number; completionTokens: number; totalTokens: number }
+        | undefined,
+      computedFinishReason: undefined as string | undefined,
+    }
+
+    const strictSchema = makeGroqStructuredOutputCompatible(
+      outputSchema,
+      outputSchema.required || [],
+    )
+
+    let accumulatedContent = ''
+    let currentModel = chatOptions.model
+
+    try {
+      // Strip tools — structured-output mode shouldn't mix tool calls into the
+      // request body. Matches the non-streaming `structuredOutput` behavior.
+      const { tools: _tools, ...baseParams } =
+        this.mapTextOptionsToGroq(chatOptions)
+      logger.request(
+        `activity=structured-stream provider=groq model=${this.model} messages=${chatOptions.messages.length} stream=true`,
+        { provider: 'groq', model: this.model },
+      )
+      const stream = await this.client.chat.completions.create(
+        {
+          ...baseParams,
+          stream: true,
+          response_format: {
+            type: 'json_schema',
+            json_schema: {
+              name: 'structured_output',
+              schema: strictSchema,
+              strict: true,
+            },
+          },
+        },
+        { signal: chatOptions.request?.signal },
+      )
+
+      for await (const chunk of stream) {
+        logger.provider(`provider=groq`, { chunk })
+        if (chunk.model) currentModel = chunk.model
+
+        if (!aguiState.hasEmittedRunStarted) {
+          aguiState.hasEmittedRunStarted = true
+          yield asChunk({
+            type: 'RUN_STARTED',
+            runId: aguiState.runId,
+            threadId: aguiState.threadId,
+            model: currentModel || chatOptions.model,
+            timestamp,
+          })
+        }
+
+        const choice = chunk.choices[0]
+        if (!choice) continue
+
+        const deltaContent = choice.delta.content
+        if (deltaContent) {
+          if (!aguiState.hasEmittedTextMessageStart) {
+            aguiState.hasEmittedTextMessageStart = true
+            yield asChunk({
+              type: 'TEXT_MESSAGE_START',
+              messageId: aguiState.messageId,
+              model: currentModel || chatOptions.model,
+              timestamp,
+              role: 'assistant',
+            })
+          }
+
+          accumulatedContent += deltaContent
+
+          yield asChunk({
+            type: 'TEXT_MESSAGE_CONTENT',
+            messageId: aguiState.messageId,
+            model: currentModel || chatOptions.model,
+            timestamp,
+            delta: deltaContent,
+            content: accumulatedContent,
+          })
+        }
+
+        if (choice.finish_reason) {
+          // Capture usage only from a chunk that carries finish_reason (Groq
+          // surfaces it via x_groq.usage on that trailing chunk).
+          const groqUsage = chunk.x_groq?.usage
+          if (groqUsage) {
+            aguiState.deferredUsage = {
+              promptTokens: groqUsage.prompt_tokens || 0,
+              completionTokens: groqUsage.completion_tokens || 0,
+              totalTokens: groqUsage.total_tokens || 0,
+            }
+          }
+
+          if (!aguiState.hasFinalizedChoice) {
+            aguiState.hasFinalizedChoice = true
+            aguiState.computedFinishReason =
+              choice.finish_reason === 'length' ? 'length' : 'stop'
+
+            if (
+              aguiState.hasEmittedTextMessageStart &&
+              !aguiState.hasEmittedTextMessageEnd
+            ) {
+              aguiState.hasEmittedTextMessageEnd = true
+              yield asChunk({
+                type: 'TEXT_MESSAGE_END',
+                messageId: aguiState.messageId,
+                model: currentModel || chatOptions.model,
+                timestamp,
+              })
+            }
+          }
+        }
+      }
+
+      // Finalize the run unconditionally. If the upstream stream closed
+      // without a finishReason, we never emitted TEXT_MESSAGE_END or computed
+      // a finish reason — we still owe consumers a CUSTOM + RUN_FINISHED (or
+      // RUN_ERROR), never silence.
+      const resolvedModel = currentModel || chatOptions.model
+
+      if (
+        aguiState.hasEmittedTextMessageStart &&
+        !aguiState.hasEmittedTextMessageEnd
+      ) {
+        aguiState.hasEmittedTextMessageEnd = true
+        yield asChunk({
+          type: 'TEXT_MESSAGE_END',
+          messageId: aguiState.messageId,
+          model: resolvedModel,
+          timestamp,
+        })
+      }
+
+      if (!accumulatedContent) {
+        const message = 'Structured output response contained no content'
+        logger.errors(message, {
+          source: 'groq.structuredOutputStream',
+        })
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId: aguiState.runId,
+          model: resolvedModel,
+          timestamp,
+          message,
+          code: 'empty-response',
+          error: { message, code: 'empty-response' },
+        })
+        return
+      }
+
+      let parsed: unknown
+      try {
+        parsed = JSON.parse(accumulatedContent)
+      } catch (parseError) {
+        const message =
+          parseError instanceof SyntaxError
+            ? `Failed to parse structured output as JSON: ${parseError.message}`
+            : 'Failed to parse structured output as JSON'
+        logger.errors(message, {
+          source: 'groq.structuredOutputStream',
+          error: parseError,
+        })
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId: aguiState.runId,
+          model: resolvedModel,
+          timestamp,
+          message,
+          code: 'parse-error',
+          error: { message, code: 'parse-error' },
+        })
+        return
+      }
+
+      const transformed = transformNullsToUndefined(parsed)
+
+      yield asChunk({
+        type: 'CUSTOM',
+        name: 'structured-output.complete',
+        value: {
+          object: transformed,
+          raw: accumulatedContent,
+        },
+        model: resolvedModel,
+        timestamp,
+      })
+
+      yield asChunk({
+        type: 'RUN_FINISHED',
+        runId: aguiState.runId,
+        threadId: aguiState.threadId,
+        model: resolvedModel,
+        timestamp,
+        usage: aguiState.deferredUsage,
+        finishReason: aguiState.computedFinishReason ?? 'stop',
+      })
+    } catch (error) {
+      logger.errors('groq.structuredOutputStream fatal', {
+        error,
+        source: 'groq.structuredOutputStream',
+      })
+      if (!aguiState.hasEmittedRunStarted) {
+        aguiState.hasEmittedRunStarted = true
+        yield asChunk({
+          type: 'RUN_STARTED',
+          runId: aguiState.runId,
+          threadId: aguiState.threadId,
+          model: chatOptions.model,
+          timestamp,
+        })
+      }
+
+      if (error instanceof APIUserAbortError) {
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId: aguiState.runId,
+          model: chatOptions.model,
+          timestamp,
+          message: 'Request aborted',
+          code: 'aborted',
+          error: { message: 'Request aborted', code: 'aborted' },
+        })
+        return
+      }
+
+      const err = error as Error & { code?: string }
+      yield asChunk({
+        type: 'RUN_ERROR',
+        runId: aguiState.runId,
+        model: chatOptions.model,
+        timestamp,
+        message: err.message || 'Unknown error',
+        code: err.code,
+        error: { message: err.message || 'Unknown error', code: err.code },
+      })
+    }
+  }
+
   /**
    * Processes streaming chunks from the Groq API and yields AG-UI stream events.
    * Handles text content deltas, tool call assembly, and lifecycle events.
diff --git a/packages/typescript/ai-groq/tests/groq-adapter.test.ts b/packages/typescript/ai-groq/tests/groq-adapter.test.ts
index da421a8b5..1ba1ae897 100644
--- a/packages/typescript/ai-groq/tests/groq-adapter.test.ts
+++ b/packages/typescript/ai-groq/tests/groq-adapter.test.ts
@@ -19,6 +19,12 @@ let mockCreate: Mock<(...args: Array<unknown>) => unknown>
 
 // Mock the Groq SDK
 vi.mock('groq-sdk', () => {
+  class APIUserAbortError extends Error {
+    constructor() {
+      super('Request aborted')
+      this.name = 'APIUserAbortError'
+    }
+  }
   return {
     default: class {
       chat = {
@@ -27,6 +33,7 @@ vi.mock('groq-sdk', () => {
         },
       }
     },
+    APIUserAbortError,
   }
 })
 
@@ -586,3 +593,334 @@ describe('Groq AG-UI event emission', () => {
     }
   })
 })
+
+describe('Groq structuredOutputStream', () => {
+  beforeEach(() => {
+    vi.clearAllMocks()
+  })
+
+  const createAdapter = () =>
+    createGroqText('llama-3.3-70b-versatile', 'test-api-key')
+
+  it('issues a single streaming request with response_format json_schema and emits parsed object', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-stream-1',
+        model: 'llama-3.3-70b-versatile',
+        choices: [
+          { delta: { content: '{"name":"Ali' }, finish_reason: null },
+        ],
+      },
+      {
+        id: 'chatcmpl-stream-1',
+        model: 'llama-3.3-70b-versatile',
+        choices: [
+          { delta: { content: 'ce","age":30}' }, finish_reason: 'stop' },
+        ],
+        x_groq: {
+          usage: {
+            prompt_tokens: 5,
+            completion_tokens: 9,
+            total_tokens: 14,
+          },
+        },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const outputSchema = {
+      type: 'object',
+      properties: {
+        name: { type: 'string' },
+        age: { type: 'number' },
+      },
+      required: ['name', 'age'],
+    }
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'llama-3.3-70b-versatile',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema,
+    })) {
+      chunks.push(chunk)
+    }
+
+    expect(mockCreate).toHaveBeenCalledTimes(1)
+    const [params] = mockCreate.mock.calls[0]! as Array<any>
+    expect(params.stream).toBe(true)
+    expect(params.response_format).toEqual({
+      type: 'json_schema',
+      json_schema: {
+        name: 'structured_output',
+        schema: expect.objectContaining({
+          type: 'object',
+          additionalProperties: false,
+        }),
+        strict: true,
+      },
+    })
+    expect(params.tools).toBeUndefined()
+
+    const types: Array<string> = chunks.map((c) => c.type)
+    const idx = (t: string) => types.indexOf(t)
+    expect(idx('RUN_STARTED')).toBeGreaterThanOrEqual(0)
+    expect(idx('TEXT_MESSAGE_START')).toBeGreaterThan(idx('RUN_STARTED'))
+    expect(idx('TEXT_MESSAGE_CONTENT')).toBeGreaterThan(
+      idx('TEXT_MESSAGE_START'),
+    )
+    expect(idx('TEXT_MESSAGE_END')).toBeGreaterThan(idx('TEXT_MESSAGE_CONTENT'))
+    expect(idx('CUSTOM')).toBeGreaterThan(idx('TEXT_MESSAGE_END'))
+    expect(idx('RUN_FINISHED')).toBeGreaterThan(idx('CUSTOM'))
+
+    const contentChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'TEXT_MESSAGE_CONTENT' }> =>
+        c.type === 'TEXT_MESSAGE_CONTENT',
+    )
+    expect(contentChunks).toHaveLength(2)
+    expect(contentChunks[0]!.delta).toBe('{"name":"Ali')
+    expect(contentChunks[1]!.delta).toBe('ce","age":30}')
+
+    const customChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]!.name).toBe('structured-output.complete')
+    expect(customChunks[0]!.value).toEqual({
+      object: { name: 'Alice', age: 30 },
+      raw: '{"name":"Alice","age":30}',
+    })
+  })
+
+  it('emits RUN_ERROR when accumulated content is not valid JSON', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-bad',
+        model: 'llama-3.3-70b-versatile',
+        choices: [{ delta: { content: 'not json' }, finish_reason: 'stop' }],
+        x_groq: {
+          usage: { prompt_tokens: 1, completion_tokens: 1, total_tokens: 2 },
+        },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'llama-3.3-70b-versatile',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const errorChunks = chunks.filter((c) => c.type === 'RUN_ERROR')
+    expect(errorChunks).toHaveLength(1)
+    expect(errorChunks[0]).toMatchObject({
+      type: 'RUN_ERROR',
+      code: 'parse-error',
+      message: expect.stringContaining('Failed to parse structured output'),
+    })
+    expect(chunks.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
+  })
+
+  it('emits empty-response RUN_ERROR when no content is streamed', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-empty',
+        model: 'llama-3.3-70b-versatile',
+        choices: [{ delta: { content: '' }, finish_reason: 'stop' }],
+        x_groq: {
+          usage: { prompt_tokens: 1, completion_tokens: 0, total_tokens: 1 },
+        },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'llama-3.3-70b-versatile',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const errorChunks = chunks.filter((c) => c.type === 'RUN_ERROR')
+    expect(errorChunks).toHaveLength(1)
+    expect(errorChunks[0]).toMatchObject({
+      type: 'RUN_ERROR',
+      code: 'empty-response',
+    })
+    expect(chunks.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
+  })
+
+  it('finalizes the run when upstream stream closes without finish_reason', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-trunc',
+        model: 'llama-3.3-70b-versatile',
+        choices: [
+          { delta: { content: '{"name":"Alice"}' }, finish_reason: null },
+        ],
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'llama-3.3-70b-versatile',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const customChunks = chunks.filter((c) => c.type === 'CUSTOM')
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]).toMatchObject({
+      name: 'structured-output.complete',
+      value: { object: { name: 'Alice' }, raw: '{"name":"Alice"}' },
+    })
+    expect(chunks.filter((c) => c.type === 'RUN_FINISHED')).toHaveLength(1)
+    expect(chunks.filter((c) => c.type === 'RUN_ERROR')).toHaveLength(0)
+  })
+
+  it('terminates on iterator-thrown provider error without emitting RUN_FINISHED', async () => {
+    // Groq surfaces in-stream provider errors as iterator throws (not inline
+    // error chunks), so the test mirrors that contract.
+    mockCreate = vi.fn().mockImplementation(() => {
+      const chunks = [
+        {
+          id: 'chatcmpl-err',
+          model: 'llama-3.3-70b-versatile',
+          choices: [
+            { delta: { content: '{"name":"Al' }, finish_reason: null },
+          ],
+        },
+      ] as Array<unknown>
+      return Promise.resolve({
+        [Symbol.asyncIterator]() {
+          let i = 0
+          return {
+            // eslint-disable-next-line @typescript-eslint/require-await
+            async next() {
+              if (i < chunks.length) return { value: chunks[i++], done: false }
+              throw Object.assign(new Error('Upstream rate limit'), {
+                code: '429',
+              })
+            },
+          }
+        },
+      })
+    })
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'llama-3.3-70b-versatile',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const errorChunks = chunks.filter((c) => c.type === 'RUN_ERROR')
+    expect(errorChunks).toHaveLength(1)
+    expect(chunks.filter((c) => c.type === 'RUN_FINISHED')).toHaveLength(0)
+    expect(chunks.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
+  })
+
+  it('transforms null values to undefined on the parsed object', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-null',
+        model: 'llama-3.3-70b-versatile',
+        choices: [
+          {
+            delta: { content: '{"name":"Alice","nickname":null}' },
+            finish_reason: 'stop',
+          },
+        ],
+        x_groq: {
+          usage: { prompt_tokens: 5, completion_tokens: 9, total_tokens: 14 },
+        },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'llama-3.3-70b-versatile',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: {
+          name: { type: 'string' },
+          nickname: { type: ['string', 'null'] },
+        },
+        required: ['name', 'nickname'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const customChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    // nickname reads back as undefined after the transform (the null is not
+    // kept) — matches the non-streaming structuredOutput contract.
+    const value = customChunks[0]!.value as { object: Record<string, unknown> }
+    expect(value.object.name).toBe('Alice')
+    expect(value.object.nickname).toBeUndefined()
+    // Raw JSON preserves the original null
+    expect((customChunks[0]!.value as { raw: string }).raw).toBe(
+      '{"name":"Alice","nickname":null}',
+    )
+  })
+})
diff --git a/packages/typescript/ai-openai/src/adapters/text.ts b/packages/typescript/ai-openai/src/adapters/text.ts
index 139629869..619aee580 100644
--- a/packages/typescript/ai-openai/src/adapters/text.ts
+++ b/packages/typescript/ai-openai/src/adapters/text.ts
@@ -1,3 +1,4 @@
+import { APIUserAbortError } from 'openai'
 import { BaseTextAdapter } from '@tanstack/ai/adapters'
 import { toRunErrorPayload } from '@tanstack/ai/adapter-internals'
 import { validateTextProviderOptions } from '../text/text-provider-options'
@@ -251,6 +252,293 @@ export class OpenAITextAdapter<
     }
   }
 
+  /**
+   * Stream structured output via a single Responses API request with
+   * `stream: true` + `text.format: json_schema`. Emits raw JSON deltas as
+   * `TEXT_MESSAGE_CONTENT` chunks and a terminal `CUSTOM`
+   * `structured-output.complete` event with `{ object, raw }`.
+   */
+  async *structuredOutputStream(
+    options: StructuredOutputOptions<TProviderOptions>,
+  ): AsyncIterable<StreamChunk> {
+    const { chatOptions, outputSchema } = options
+    const { logger } = chatOptions
+    const timestamp = Date.now()
+    const runId = chatOptions.runId ?? generateId(this.name)
+    const threadId = chatOptions.threadId ?? generateId(this.name)
+    const messageId = generateId(this.name)
+    let hasEmittedRunStarted = false
+    let hasEmittedTextMessageStart = false
+    let accumulatedContent = ''
+    let model: string = chatOptions.model
+    let usage:
+      | { promptTokens: number; completionTokens: number; totalTokens: number }
+      | undefined
+    let finishReason: string | undefined
+
+    const jsonSchema = makeOpenAIStructuredOutputCompatible(
+      outputSchema,
+      outputSchema.required || [],
+    )
+
+    try {
+      // Strip tools — structured-output mode shouldn't mix tool calls into the
+      // request body. Matches the non-streaming `structuredOutput` behavior.
+      const { tools: _tools, ...baseParams } =
+        this.mapTextOptionsToOpenAI(chatOptions)
+      logger.request(
+        `activity=structured-stream provider=openai model=${this.model} messages=${chatOptions.messages.length} stream=true`,
+        { provider: 'openai', model: this.model },
+      )
+      const stream = await this.client.responses.create(
+        {
+          ...baseParams,
+          stream: true,
+          text: {
+            format: {
+              type: 'json_schema',
+              name: 'structured_output',
+              schema: jsonSchema,
+              strict: true,
+            },
+          },
+        },
+        {
+          headers: chatOptions.request?.headers,
+          signal: chatOptions.request?.signal,
+        },
+      )
+
+      for await (const chunk of stream) {
+        logger.provider(`provider=openai type=${chunk.type}`, { chunk })
+
+        if (!hasEmittedRunStarted) {
+          hasEmittedRunStarted = true
+          yield asChunk({
+            type: 'RUN_STARTED',
+            runId,
+            threadId,
+            model,
+            timestamp,
+          })
+        }
+
+        if (
+          chunk.type === 'response.created' ||
+          chunk.type === 'response.in_progress'
+        ) {
+          model = chunk.response.model
+        }
+
+        if (chunk.type === 'response.failed' || chunk.type === 'error') {
+          const message =
+            chunk.type === 'error'
+              ? chunk.message
+              : (chunk.response.error?.message ?? 'OpenAI request failed')
+          const code =
+            chunk.type === 'error'
+              ? (chunk.code ?? undefined)
+              : (chunk.response.error?.code ?? undefined)
+          yield asChunk({
+            type: 'RUN_ERROR',
+            runId,
+            model,
+            timestamp,
+            message,
+            code,
+            error: { message, code },
+          })
+          return
+        }
+
+        if (chunk.type === 'response.output_text.delta' && chunk.delta) {
+          const textDelta = Array.isArray(chunk.delta)
+            ? chunk.delta.join('')
+            : typeof chunk.delta === 'string'
+              ? chunk.delta
+              : ''
+
+          if (textDelta) {
+            if (!hasEmittedTextMessageStart) {
+              hasEmittedTextMessageStart = true
+              yield asChunk({
+                type: 'TEXT_MESSAGE_START',
+                messageId,
+                model,
+                timestamp,
+                role: 'assistant',
+              })
+            }
+
+            accumulatedContent += textDelta
+
+            yield asChunk({
+              type: 'TEXT_MESSAGE_CONTENT',
+              messageId,
+              model,
+              timestamp,
+              delta: textDelta,
+              content: accumulatedContent,
+            })
+          }
+        }
+
+        // A refusal terminates the structured output run — the model declined
+        // to produce JSON conforming to the schema.
+        if (chunk.type === 'response.refusal.delta' && chunk.delta) {
+          const delta: unknown = chunk.delta
+          const refusalText =
+            typeof delta === 'string'
+              ? delta
+              : Array.isArray(delta)
+                ? delta.join('')
+                : ''
+          const message = `Structured output refused${refusalText ? `: ${refusalText}` : ''}`
+          yield asChunk({
+            type: 'RUN_ERROR',
+            runId,
+            model,
+            timestamp,
+            message,
+            code: 'refusal',
+            error: { message, code: 'refusal' },
+          })
+          return
+        }
+
+        if (chunk.type === 'response.completed') {
+          usage = {
+            promptTokens: chunk.response.usage?.input_tokens ?? 0,
+            completionTokens: chunk.response.usage?.output_tokens ?? 0,
+            totalTokens: chunk.response.usage?.total_tokens ?? 0,
+          }
+          finishReason = 'stop'
+        }
+
+        if (chunk.type === 'response.incomplete') {
+          finishReason =
+            chunk.response.incomplete_details?.reason === 'max_output_tokens'
+              ? 'length'
+              : 'stop'
+        }
+      }
+
+      // Always finalize, even if the upstream stream closed without a
+      // `response.completed` event (truncation, transport drop). Otherwise
+      // consumers wait forever on a missing terminal event.
+      if (hasEmittedTextMessageStart) {
+        yield asChunk({
+          type: 'TEXT_MESSAGE_END',
+          messageId,
+          model,
+          timestamp,
+        })
+      }
+
+      if (!accumulatedContent) {
+        const message = 'Structured output response contained no content'
+        logger.errors(message, { source: 'openai.structuredOutputStream' })
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId,
+          model,
+          timestamp,
+          message,
+          code: 'empty-response',
+          error: { message, code: 'empty-response' },
+        })
+        return
+      }
+
+      let parsed: unknown
+      try {
+        parsed = JSON.parse(accumulatedContent)
+      } catch (parseError) {
+        const message =
+          parseError instanceof SyntaxError
+            ? `Failed to parse structured output as JSON: ${parseError.message}`
+            : 'Failed to parse structured output as JSON'
+        logger.errors(message, {
+          source: 'openai.structuredOutputStream',
+          error: parseError,
+        })
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId,
+          model,
+          timestamp,
+          message,
+          code: 'parse-error',
+          error: { message, code: 'parse-error' },
+        })
+        return
+      }
+
+      const transformed = transformNullsToUndefined(parsed)
+
+      yield asChunk({
+        type: 'CUSTOM',
+        name: 'structured-output.complete',
+        value: {
+          object: transformed,
+          raw: accumulatedContent,
+        },
+        model,
+        timestamp,
+      })
+
+      yield asChunk({
+        type: 'RUN_FINISHED',
+        runId,
+        threadId,
+        model,
+        timestamp,
+        usage,
+        finishReason: finishReason ?? 'stop',
+      })
+    } catch (error) {
+      logger.errors('openai.structuredOutputStream fatal', {
+        error: toRunErrorPayload(error, 'openai.structuredOutputStream failed'),
+        source: 'openai.structuredOutputStream',
+      })
+
+      if (!hasEmittedRunStarted) {
+        hasEmittedRunStarted = true
+        yield asChunk({
+          type: 'RUN_STARTED',
+          runId,
+          threadId,
+          model,
+          timestamp,
+        })
+      }
+
+      if (error instanceof APIUserAbortError) {
+        yield asChunk({
+          type: 'RUN_ERROR',
+          runId,
+          model,
+          timestamp,
+          message: 'Request aborted',
+          code: 'aborted',
+          error: { message: 'Request aborted', code: 'aborted' },
+        })
+        return
+      }
+
+      const err = error as Error & { code?: string }
+      yield asChunk({
+        type: 'RUN_ERROR',
+        runId,
+        model,
+        timestamp,
+        message: err.message || 'Unknown error',
+        code: err.code,
+        error: { message: err.message || 'Unknown error', code: err.code },
+      })
+    }
+  }
+
   /**
    * Extract text content from a non-streaming response
    */
diff --git a/packages/typescript/ai-openai/tests/openai-adapter.test.ts b/packages/typescript/ai-openai/tests/openai-adapter.test.ts
index 552793a2e..1d4b692ee 100644
--- a/packages/typescript/ai-openai/tests/openai-adapter.test.ts
+++ b/packages/typescript/ai-openai/tests/openai-adapter.test.ts
@@ -130,3 +130,328 @@ describe('OpenAI adapter option mapping', () => {
     expect(payload.tools.length).toBeGreaterThan(0)
   })
 })
+
+describe('OpenAI structuredOutputStream', () => {
+  beforeEach(() => {
+    vi.clearAllMocks()
+  })
+
+  const setupAdapter = (
+    chunks: Array<Record<string, unknown>>,
+    overrides?: { responsesCreate?: ReturnType<typeof vi.fn> },
+  ) => {
+    const responsesCreate =
+      overrides?.responsesCreate ??
+      vi.fn().mockResolvedValueOnce(createMockChatCompletionsStream(chunks))
+    const adapter = createAdapter('gpt-4o-mini')
+    ;(adapter as any).client = {
+      responses: { create: responsesCreate },
+    }
+    return { adapter, responsesCreate }
+  }
+
+  it('issues a single streaming Responses API request with text.format json_schema and emits parsed object', async () => {
+    const chunks: Array<Record<string, unknown>> = [
+      {
+        type: 'response.created',
+        response: {
+          id: 'resp-1',
+          model: 'gpt-4o-mini',
+          status: 'in_progress',
+          created_at: 1,
+        },
+      },
+      {
+        type: 'response.output_text.delta',
+        delta: '{"name":"Ali',
+      },
+      {
+        type: 'response.output_text.delta',
+        delta: 'ce","age":30}',
+      },
+      {
+        type: 'response.completed',
+        response: {
+          id: 'resp-1',
+          model: 'gpt-4o-mini',
+          status: 'completed',
+          created_at: 2,
+          output: [],
+          usage: { input_tokens: 5, output_tokens: 9, total_tokens: 14 },
+        },
+      },
+    ]
+
+    const { adapter, responsesCreate } = setupAdapter(chunks)
+
+    const outputSchema = {
+      type: 'object',
+      properties: {
+        name: { type: 'string' },
+        age: { type: 'number' },
+      },
+      required: ['name', 'age'],
+    }
+
+    const collected: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: (await import('@tanstack/ai/adapter-internals')).resolveDebugOption(false),
+      },
+      outputSchema,
+    })) {
+      collected.push(chunk)
+    }
+
+    expect(responsesCreate).toHaveBeenCalledTimes(1)
+    const [payload] = responsesCreate.mock.calls[0]
+    expect(payload.stream).toBe(true)
+    expect(payload.text).toEqual({
+      format: {
+        type: 'json_schema',
+        name: 'structured_output',
+        schema: expect.objectContaining({
+          type: 'object',
+          additionalProperties: false,
+        }),
+        strict: true,
+      },
+    })
+    expect(payload.tools).toBeUndefined()
+
+    const types: Array<string> = collected.map((c) => c.type)
+    const idx = (t: string) => types.indexOf(t)
+    expect(idx('RUN_STARTED')).toBeGreaterThanOrEqual(0)
+    expect(idx('TEXT_MESSAGE_START')).toBeGreaterThan(idx('RUN_STARTED'))
+    expect(idx('TEXT_MESSAGE_CONTENT')).toBeGreaterThan(
+      idx('TEXT_MESSAGE_START'),
+    )
+    expect(idx('TEXT_MESSAGE_END')).toBeGreaterThan(idx('TEXT_MESSAGE_CONTENT'))
+    expect(idx('CUSTOM')).toBeGreaterThan(idx('TEXT_MESSAGE_END'))
+    expect(idx('RUN_FINISHED')).toBeGreaterThan(idx('CUSTOM'))
+
+    const contentChunks = collected.filter(
+      (c): c is Extract<StreamChunk, { type: 'TEXT_MESSAGE_CONTENT' }> =>
+        c.type === 'TEXT_MESSAGE_CONTENT',
+    )
+    expect(contentChunks).toHaveLength(2)
+    expect(contentChunks[0]!.delta).toBe('{"name":"Ali')
+    expect(contentChunks[1]!.delta).toBe('ce","age":30}')
+
+    const customChunks = collected.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]!.name).toBe('structured-output.complete')
+    expect(customChunks[0]!.value).toEqual({
+      object: { name: 'Alice', age: 30 },
+      raw: '{"name":"Alice","age":30}',
+    })
+  })
+
+  it('emits RUN_ERROR when accumulated content is not valid JSON', async () => {
+    const { resolveDebugOption } = await import('@tanstack/ai/adapter-internals')
+    const chunks: Array<Record<string, unknown>> = [
+      { type: 'response.output_text.delta', delta: 'not json' },
+      {
+        type: 'response.completed',
+        response: {
+          id: 'resp-bad',
+          model: 'gpt-4o-mini',
+          status: 'completed',
+          created_at: 1,
+          output: [],
+          usage: { input_tokens: 1, output_tokens: 1, total_tokens: 2 },
+        },
+      },
+    ]
+    const { adapter } = setupAdapter(chunks)
+
+    const collected: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: resolveDebugOption(false),
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      collected.push(chunk)
+    }
+
+    const errors = collected.filter((c) => c.type === 'RUN_ERROR')
+    expect(errors).toHaveLength(1)
+    expect(errors[0]).toMatchObject({ code: 'parse-error' })
+    expect(collected.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
+  })
+
+  it('emits empty-response RUN_ERROR when no content is streamed', async () => {
+    const { resolveDebugOption } = await import('@tanstack/ai/adapter-internals')
+    const chunks: Array<Record<string, unknown>> = [
+      {
+        type: 'response.completed',
+        response: {
+          id: 'resp-empty',
+          model: 'gpt-4o-mini',
+          status: 'completed',
+          created_at: 1,
+          output: [],
+          usage: { input_tokens: 1, output_tokens: 0, total_tokens: 1 },
+        },
+      },
+    ]
+    const { adapter } = setupAdapter(chunks)
+
+    const collected: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: resolveDebugOption(false),
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      collected.push(chunk)
+    }
+
+    const errors = collected.filter((c) => c.type === 'RUN_ERROR')
+    expect(errors).toHaveLength(1)
+    expect(errors[0]).toMatchObject({ code: 'empty-response' })
+    expect(collected.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
+  })
+
+  it('finalizes the run when upstream stream closes without response.completed', async () => {
+    const { resolveDebugOption } = await import('@tanstack/ai/adapter-internals')
+    const chunks: Array<Record<string, unknown>> = [
+      { type: 'response.output_text.delta', delta: '{"name":"Alice"}' },
+    ]
+    const { adapter } = setupAdapter(chunks)
+
+    const collected: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: resolveDebugOption(false),
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      collected.push(chunk)
+    }
+
+    const customChunks = collected.filter((c) => c.type === 'CUSTOM')
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]).toMatchObject({
+      name: 'structured-output.complete',
+      value: { object: { name: 'Alice' }, raw: '{"name":"Alice"}' },
+    })
+    expect(collected.filter((c) => c.type === 'RUN_FINISHED')).toHaveLength(1)
+    expect(collected.filter((c) => c.type === 'RUN_ERROR')).toHaveLength(0)
+  })
+
+  it('terminates on response.failed without emitting RUN_FINISHED', async () => {
+    const { resolveDebugOption } = await import('@tanstack/ai/adapter-internals')
+    const chunks: Array<Record<string, unknown>> = [
+      { type: 'response.output_text.delta', delta: '{"name":"Al' },
+      {
+        type: 'response.failed',
+        response: {
+          id: 'resp-err',
+          model: 'gpt-4o-mini',
+          status: 'failed',
+          created_at: 1,
+          error: { message: 'Upstream rate limit', code: 'rate_limit' },
+          output: [],
+        },
+      },
+    ]
+    const { adapter } = setupAdapter(chunks)
+
+    const collected: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: resolveDebugOption(false),
+      },
+      outputSchema: {
+        type: 'object',
+        properties: { name: { type: 'string' } },
+        required: ['name'],
+      },
+    })) {
+      collected.push(chunk)
+    }
+
+    const errors = collected.filter((c) => c.type === 'RUN_ERROR')
+    expect(errors).toHaveLength(1)
+    expect(collected.filter((c) => c.type === 'RUN_FINISHED')).toHaveLength(0)
+    expect(collected.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
+  })
+
+  it('transforms null values to undefined on the parsed object', async () => {
+    const { resolveDebugOption } = await import('@tanstack/ai/adapter-internals')
+    const chunks: Array<Record<string, unknown>> = [
+      {
+        type: 'response.output_text.delta',
+        delta: '{"name":"Alice","nickname":null}',
+      },
+      {
+        type: 'response.completed',
+        response: {
+          id: 'resp-null',
+          model: 'gpt-4o-mini',
+          status: 'completed',
+          created_at: 1,
+          output: [],
+          usage: { input_tokens: 5, output_tokens: 9, total_tokens: 14 },
+        },
+      },
+    ]
+    const { adapter } = setupAdapter(chunks)
+
+    const collected: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'gpt-4o-mini',
+        messages: [{ role: 'user', content: 'Give me a person' }],
+        logger: resolveDebugOption(false),
+      },
+      outputSchema: {
+        type: 'object',
+        properties: {
+          name: { type: 'string' },
+          nickname: { type: ['string', 'null'] },
+        },
+        required: ['name', 'nickname'],
+      },
+    })) {
+      collected.push(chunk)
+    }
+
+    const customChunks = collected.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    const value = customChunks[0]!.value as { object: Record<string, unknown> }
+    expect(value.object.name).toBe('Alice')
+    expect(value.object.nickname).toBeUndefined()
+    expect((customChunks[0]!.value as { raw: string }).raw).toBe(
+      '{"name":"Alice","nickname":null}',
+    )
+  })
+})
diff --git a/testing/e2e/src/lib/feature-support.ts b/testing/e2e/src/lib/feature-support.ts
index 8c0779f7d..6032009da 100644
--- a/testing/e2e/src/lib/feature-support.ts
+++ b/testing/e2e/src/lib/feature-support.ts
@@ -83,7 +83,12 @@ export const matrix: Record<Feature, Set<Provider>> = {
   // Streaming structured output: only providers with native streaming JSON
   // schema support are listed here. Other providers fall back to the default
   // BaseTextAdapter implementation but aren't exercised by E2E yet.
-  'structured-output-stream': new Set(['openrouter']),
+  'structured-output-stream': new Set([
+    'openai',
+    'groq',
+    'grok',
+    'openrouter',
+  ]),
   'agentic-structured': new Set([
     'openai',
     'anthropic',

From 0087eb9a2758292a9b39351f9d6277ee4e8ca40d Mon Sep 17 00:00:00 2001
From: "autofix-ci[bot]" <114827586+autofix-ci[bot]@users.noreply.github.com>
Date: Tue, 5 May 2026 04:18:54 +0000
Subject: [PATCH 3/9] ci: apply automated fixes

---
 .../routes/generations.structured-output.tsx  | 12 +++++++++---
 .../typescript/ai-grok/src/adapters/text.ts   |  6 +++++-
 .../ai-grok/tests/grok-adapter.test.ts        |  4 +---
 .../typescript/ai-groq/src/adapters/text.ts   |  6 +++++-
 .../ai-groq/tests/groq-adapter.test.ts        |  8 ++------
 .../ai-openai/tests/openai-adapter.test.ts    | 19 +++++++++++++------
 testing/e2e/src/lib/feature-support.ts        |  7 +------
 7 files changed, 36 insertions(+), 26 deletions(-)

diff --git a/examples/ts-react-chat/src/routes/generations.structured-output.tsx b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
index e247a08a2..a9fcac31d 100644
--- a/examples/ts-react-chat/src/routes/generations.structured-output.tsx
+++ b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
@@ -55,7 +55,9 @@ interface StreamChunk {
 function StructuredOutputPage() {
   const [prompt, setPrompt] = useState(SAMPLE_PROMPT)
   const [provider, setProvider] = useState<Provider>('openrouter')
-  const [model, setModel] = useState<string>(PROVIDER_MODELS.openrouter[0].value)
+  const [model, setModel] = useState<string>(
+    PROVIDER_MODELS.openrouter[0].value,
+  )
   const [stream, setStream] = useState(true)
   const [result, setResult] = useState<RecommendationResult | null>(null)
   const [streamingText, setStreamingText] = useState<string>('')
@@ -95,7 +97,9 @@ function StructuredOutputPage() {
 
       if (!response.ok) {
         const errPayload = await response.json().catch(() => ({}))
-        throw new Error(errPayload.error || `Request failed (${response.status})`)
+        throw new Error(
+          errPayload.error || `Request failed (${response.status})`,
+        )
       }
 
       if (!stream) {
@@ -225,7 +229,9 @@ function StructuredOutputPage() {
             />
             Stream (single-request{' '}
             <code className="text-orange-400">stream: true</code> +{' '}
-            <code className="text-orange-400">response_format: json_schema</code>
+            <code className="text-orange-400">
+              response_format: json_schema
+            </code>
             )
           </label>
 
diff --git a/packages/typescript/ai-grok/src/adapters/text.ts b/packages/typescript/ai-grok/src/adapters/text.ts
index c7fdc8287..951c78a6b 100644
--- a/packages/typescript/ai-grok/src/adapters/text.ts
+++ b/packages/typescript/ai-grok/src/adapters/text.ts
@@ -246,7 +246,11 @@ export class GrokTextAdapter<
       hasEmittedTextMessageEnd: false,
       hasFinalizedChoice: false,
       deferredUsage: undefined as
-        | { promptTokens: number; completionTokens: number; totalTokens: number }
+        | {
+            promptTokens: number
+            completionTokens: number
+            totalTokens: number
+          }
         | undefined,
       computedFinishReason: undefined as string | undefined,
     }
diff --git a/packages/typescript/ai-grok/tests/grok-adapter.test.ts b/packages/typescript/ai-grok/tests/grok-adapter.test.ts
index 5d2d6a933..e6b24c3a4 100644
--- a/packages/typescript/ai-grok/tests/grok-adapter.test.ts
+++ b/packages/typescript/ai-grok/tests/grok-adapter.test.ts
@@ -844,9 +844,7 @@ describe('Grok structuredOutputStream', () => {
         {
           id: 'chatcmpl-err',
           model: 'grok-3',
-          choices: [
-            { delta: { content: '{"name":"Al' }, finish_reason: null },
-          ],
+          choices: [{ delta: { content: '{"name":"Al' }, finish_reason: null }],
         },
       ] as Array<unknown>
       return Promise.resolve({
diff --git a/packages/typescript/ai-groq/src/adapters/text.ts b/packages/typescript/ai-groq/src/adapters/text.ts
index 44bed44b7..ae0f3bf3b 100644
--- a/packages/typescript/ai-groq/src/adapters/text.ts
+++ b/packages/typescript/ai-groq/src/adapters/text.ts
@@ -243,7 +243,11 @@ export class GroqTextAdapter<
       hasEmittedTextMessageEnd: false,
       hasFinalizedChoice: false,
       deferredUsage: undefined as
-        | { promptTokens: number; completionTokens: number; totalTokens: number }
+        | {
+            promptTokens: number
+            completionTokens: number
+            totalTokens: number
+          }
         | undefined,
       computedFinishReason: undefined as string | undefined,
     }
diff --git a/packages/typescript/ai-groq/tests/groq-adapter.test.ts b/packages/typescript/ai-groq/tests/groq-adapter.test.ts
index 1ba1ae897..4240aeac4 100644
--- a/packages/typescript/ai-groq/tests/groq-adapter.test.ts
+++ b/packages/typescript/ai-groq/tests/groq-adapter.test.ts
@@ -607,9 +607,7 @@ describe('Groq structuredOutputStream', () => {
       {
         id: 'chatcmpl-stream-1',
         model: 'llama-3.3-70b-versatile',
-        choices: [
-          { delta: { content: '{"name":"Ali' }, finish_reason: null },
-        ],
+        choices: [{ delta: { content: '{"name":"Ali' }, finish_reason: null }],
       },
       {
         id: 'chatcmpl-stream-1',
@@ -826,9 +824,7 @@ describe('Groq structuredOutputStream', () => {
         {
           id: 'chatcmpl-err',
           model: 'llama-3.3-70b-versatile',
-          choices: [
-            { delta: { content: '{"name":"Al' }, finish_reason: null },
-          ],
+          choices: [{ delta: { content: '{"name":"Al' }, finish_reason: null }],
         },
       ] as Array<unknown>
       return Promise.resolve({
diff --git a/packages/typescript/ai-openai/tests/openai-adapter.test.ts b/packages/typescript/ai-openai/tests/openai-adapter.test.ts
index 1d4b692ee..6bd6c73e6 100644
--- a/packages/typescript/ai-openai/tests/openai-adapter.test.ts
+++ b/packages/typescript/ai-openai/tests/openai-adapter.test.ts
@@ -198,7 +198,9 @@ describe('OpenAI structuredOutputStream', () => {
       chatOptions: {
         model: 'gpt-4o-mini',
         messages: [{ role: 'user', content: 'Give me a person' }],
-        logger: (await import('@tanstack/ai/adapter-internals')).resolveDebugOption(false),
+        logger: (
+          await import('@tanstack/ai/adapter-internals')
+        ).resolveDebugOption(false),
       },
       outputSchema,
     })) {
@@ -252,7 +254,8 @@ describe('OpenAI structuredOutputStream', () => {
   })
 
   it('emits RUN_ERROR when accumulated content is not valid JSON', async () => {
-    const { resolveDebugOption } = await import('@tanstack/ai/adapter-internals')
+    const { resolveDebugOption } =
+      await import('@tanstack/ai/adapter-internals')
     const chunks: Array<Record<string, unknown>> = [
       { type: 'response.output_text.delta', delta: 'not json' },
       {
@@ -292,7 +295,8 @@ describe('OpenAI structuredOutputStream', () => {
   })
 
   it('emits empty-response RUN_ERROR when no content is streamed', async () => {
-    const { resolveDebugOption } = await import('@tanstack/ai/adapter-internals')
+    const { resolveDebugOption } =
+      await import('@tanstack/ai/adapter-internals')
     const chunks: Array<Record<string, unknown>> = [
       {
         type: 'response.completed',
@@ -331,7 +335,8 @@ describe('OpenAI structuredOutputStream', () => {
   })
 
   it('finalizes the run when upstream stream closes without response.completed', async () => {
-    const { resolveDebugOption } = await import('@tanstack/ai/adapter-internals')
+    const { resolveDebugOption } =
+      await import('@tanstack/ai/adapter-internals')
     const chunks: Array<Record<string, unknown>> = [
       { type: 'response.output_text.delta', delta: '{"name":"Alice"}' },
     ]
@@ -364,7 +369,8 @@ describe('OpenAI structuredOutputStream', () => {
   })
 
   it('terminates on response.failed without emitting RUN_FINISHED', async () => {
-    const { resolveDebugOption } = await import('@tanstack/ai/adapter-internals')
+    const { resolveDebugOption } =
+      await import('@tanstack/ai/adapter-internals')
     const chunks: Array<Record<string, unknown>> = [
       { type: 'response.output_text.delta', delta: '{"name":"Al' },
       {
@@ -404,7 +410,8 @@ describe('OpenAI structuredOutputStream', () => {
   })
 
   it('transforms null values to undefined on the parsed object', async () => {
-    const { resolveDebugOption } = await import('@tanstack/ai/adapter-internals')
+    const { resolveDebugOption } =
+      await import('@tanstack/ai/adapter-internals')
     const chunks: Array<Record<string, unknown>> = [
       {
         type: 'response.output_text.delta',
diff --git a/testing/e2e/src/lib/feature-support.ts b/testing/e2e/src/lib/feature-support.ts
index 6032009da..e1347c2db 100644
--- a/testing/e2e/src/lib/feature-support.ts
+++ b/testing/e2e/src/lib/feature-support.ts
@@ -83,12 +83,7 @@ export const matrix: Record<Feature, Set<Provider>> = {
   // Streaming structured output: only providers with native streaming JSON
   // schema support are listed here. Other providers fall back to the default
   // BaseTextAdapter implementation but aren't exercised by E2E yet.
-  'structured-output-stream': new Set([
-    'openai',
-    'groq',
-    'grok',
-    'openrouter',
-  ]),
+  'structured-output-stream': new Set(['openai', 'groq', 'grok', 'openrouter']),
   'agentic-structured': new Set([
     'openai',
     'anthropic',

From 2472265654013f45771dae3b5c881e4c074ba3a8 Mon Sep 17 00:00:00 2001
From: Tom Beckenham <34339192+tombeckenham@users.noreply.github.com>
Date: Tue, 5 May 2026 16:41:05 +1000
Subject: [PATCH 4/9] feat: stream reasoning during structured output (openai,
 grok, groq)

Surfaces chain-of-thought as REASONING_MESSAGE_CONTENT during
`structuredOutputStream` for the three OpenAI-compatible adapters,
matching openrouter's existing behavior. Each provider exposes
reasoning differently and none are typed by the upstream SDKs:

- openai: consumes `response.reasoning_text.delta` and
  `response.reasoning_summary_text.delta` Responses API events
- grok (xAI): reads `delta.reasoning_content` (DeepSeek convention) on
  Chat Completions deltas
- groq: reads `delta.reasoning` (mirroring its `message.reasoning` on
  completed responses) on Chat Completions deltas

In all three, reasoning lifecycle is closed cleanly before
TEXT_MESSAGE_START so consumers see the contractual transition.
Accumulated reasoning is also surfaced on the terminal `CUSTOM`
`structured-output.complete` event's `value.reasoning` field.

Tests: 4 new cases covering reasoning surfacing + omission across grok
and groq. 61 grok, 19 groq, 137 openai tests pass.

ts-react-chat structured-output example:
- model lists refreshed to latest per provider
- progressive UI rendering via `parsePartialJSON` so cards/fields fill
  in as JSON streams
- live "Thinking" strip rendering the latest reasoning sentence
- per-provider reasoning opt-ins wired through modelOptions so models
  actually emit reasoning deltas (openai reasoning.summary: 'auto',
  groq reasoning_format: 'parsed', openrouter reasoning.effort)
- debug: true on chat() calls for inspection of provider events

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../src/routes/api.structured-output.ts       |  64 +++-
 .../routes/generations.structured-output.tsx  | 344 +++++++++++++-----
 .../typescript/ai-grok/src/adapters/text.ts   |  74 ++++
 .../ai-grok/tests/grok-adapter.test.ts        | 128 +++++++
 .../typescript/ai-groq/src/adapters/text.ts   |  74 ++++
 .../ai-groq/tests/groq-adapter.test.ts        | 130 +++++++
 .../typescript/ai-openai/src/adapters/text.ts |  86 +++++
 7 files changed, 803 insertions(+), 97 deletions(-)

diff --git a/examples/ts-react-chat/src/routes/api.structured-output.ts b/examples/ts-react-chat/src/routes/api.structured-output.ts
index 3af52568d..43a6fe3db 100644
--- a/examples/ts-react-chat/src/routes/api.structured-output.ts
+++ b/examples/ts-react-chat/src/routes/api.structured-output.ts
@@ -30,15 +30,63 @@ type Provider = 'openai' | 'grok' | 'groq' | 'openrouter'
 function adapterFor(provider: Provider, model?: string): AnyTextAdapter {
   switch (provider) {
     case 'openai':
-      return openaiText((model || 'gpt-4o') as 'gpt-4o')
+      return openaiText((model || 'gpt-5.2') as 'gpt-5.2')
     case 'grok':
-      return grokText((model || 'grok-3') as 'grok-3')
+      return grokText(
+        (model || 'grok-4-1-fast-reasoning') as 'grok-4-1-fast-reasoning',
+      )
     case 'groq':
       return groqText(
-        (model || 'llama-3.3-70b-versatile') as 'llama-3.3-70b-versatile',
+        (model ||
+          'meta-llama/llama-4-maverick-17b-128e-instruct') as 'meta-llama/llama-4-maverick-17b-128e-instruct',
       )
     case 'openrouter':
-      return openRouterText((model || 'openai/gpt-5.2') as 'openai/gpt-5.2')
+      return openRouterText(
+        (model || 'anthropic/claude-opus-4.7') as 'anthropic/claude-opus-4.7',
+      )
+  }
+}
+
+// Per-provider modelOptions to opt into reasoning surfacing. Without these,
+// reasoning models reason silently and the UI never sees REASONING_* events.
+function reasoningOptionsFor(
+  provider: Provider,
+  model: string | undefined,
+): Record<string, unknown> | undefined {
+  switch (provider) {
+    case 'openai':
+      // Responses API: `reasoning.summary: 'auto'` is what makes the API emit
+      // `response.reasoning_summary_text.delta` events. Only valid on
+      // reasoning models (gpt-5.x, o-series); older models (gpt-4o) reject it.
+      if (
+        model?.startsWith('gpt-5') ||
+        model?.startsWith('o3') ||
+        model?.startsWith('o4')
+      ) {
+        return { reasoning: { summary: 'auto' } }
+      }
+      return undefined
+    case 'groq':
+      // Groq's Chat Completions only streams `delta.reasoning` when
+      // `reasoning_format: 'parsed'`. Required for gpt-oss / qwen3 / kimi-k2
+      // to emit reasoning during structured output (json_schema mode).
+      if (
+        model?.startsWith('openai/gpt-oss') ||
+        model?.startsWith('qwen') ||
+        model?.startsWith('moonshotai/kimi')
+      ) {
+        return { reasoning_format: 'parsed' }
+      }
+      return undefined
+    case 'openrouter':
+      // OpenRouter normalises across providers. `reasoning.effort` triggers
+      // the upstream model's reasoning + surfaces the deltas.
+      return { reasoning: { effort: 'medium' } }
+    case 'grok':
+      // xAI surfaces `delta.reasoning_content` automatically on reasoning
+      // models (grok-3-mini, grok-4-fast-reasoning, grok-4-1-fast-reasoning).
+      // No request param needed.
+      return undefined
   }
 }
 
@@ -56,6 +104,8 @@ export const Route = createFileRoute('/api/structured-output')({
         const resolvedProvider: Provider = provider || 'openrouter'
 
         try {
+          const modelOptions = reasoningOptionsFor(resolvedProvider, model)
+
           if (stream) {
             const abortController = new AbortController()
             request.signal.addEventListener('abort', () =>
@@ -63,9 +113,13 @@ export const Route = createFileRoute('/api/structured-output')({
             )
             const streamIterable = chat({
               adapter: adapterFor(resolvedProvider, model),
+              modelOptions: modelOptions as never,
               messages: [{ role: 'user', content: prompt }],
               outputSchema: GuitarRecommendationSchema,
               stream: true,
+              // Surface adapter request/provider/error logs so we can see
+              // exactly which provider events the model is emitting.
+              debug: true,
               abortController,
             }) as AsyncIterable<StreamChunk>
             return toServerSentEventsResponse(streamIterable, {
@@ -75,8 +129,10 @@ export const Route = createFileRoute('/api/structured-output')({
 
           const result = await chat({
             adapter: adapterFor(resolvedProvider, model),
+            modelOptions: modelOptions as never,
             messages: [{ role: 'user', content: prompt }],
             outputSchema: GuitarRecommendationSchema,
+            debug: true,
           })
 
           return new Response(JSON.stringify({ data: result }), {
diff --git a/examples/ts-react-chat/src/routes/generations.structured-output.tsx b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
index a9fcac31d..dd0a4fc8f 100644
--- a/examples/ts-react-chat/src/routes/generations.structured-output.tsx
+++ b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
@@ -1,5 +1,6 @@
 import { useRef, useState } from 'react'
 import { createFileRoute } from '@tanstack/react-router'
+import { parsePartialJSON } from '@tanstack/ai'
 
 const SAMPLE_PROMPT =
   'I play indie rock and have a $1500 budget. Recommend two electric guitars and one acoustic to round out my rig.'
@@ -11,39 +12,62 @@ const PROVIDER_MODELS: Record<
   Array<{ value: string; label: string }>
 > = {
   openai: [
-    { value: 'gpt-4o', label: 'gpt-4o' },
-    { value: 'gpt-4o-mini', label: 'gpt-4o-mini' },
+    { value: 'gpt-5.2', label: 'GPT-5.2 (frontier)' },
+    { value: 'gpt-5.2-pro', label: 'GPT-5.2 Pro' },
+    { value: 'gpt-5.1', label: 'GPT-5.1' },
+    { value: 'gpt-5', label: 'GPT-5' },
+    { value: 'gpt-5-mini', label: 'GPT-5 Mini' },
+    { value: 'gpt-4o', label: 'GPT-4o' },
   ],
   grok: [
-    { value: 'grok-3', label: 'grok-3' },
-    { value: 'grok-4-0709', label: 'grok-4-0709' },
+    { value: 'grok-4-1-fast-reasoning', label: 'Grok 4.1 Fast (reasoning)' },
+    {
+      value: 'grok-4-1-fast-non-reasoning',
+      label: 'Grok 4.1 Fast (non-reasoning)',
+    },
+    { value: 'grok-4', label: 'Grok 4' },
+    { value: 'grok-3', label: 'Grok 3' },
   ],
   groq: [
-    { value: 'llama-3.3-70b-versatile', label: 'llama-3.3-70b-versatile' },
-    { value: 'llama-3.1-8b-instant', label: 'llama-3.1-8b-instant' },
+    {
+      value: 'meta-llama/llama-4-maverick-17b-128e-instruct',
+      label: 'Llama 4 Maverick 17B',
+    },
+    {
+      value: 'meta-llama/llama-4-scout-17b-16e-instruct',
+      label: 'Llama 4 Scout 17B',
+    },
+    {
+      value: 'moonshotai/kimi-k2-instruct-0905',
+      label: 'Kimi K2 Instruct',
+    },
+    { value: 'llama-3.3-70b-versatile', label: 'Llama 3.3 70B Versatile' },
+    { value: 'openai/gpt-oss-120b', label: 'GPT-OSS 120B' },
   ],
   openrouter: [
-    { value: 'openai/gpt-5.2', label: 'OpenRouter / GPT-5.2' },
-    { value: 'openai/gpt-5.1', label: 'OpenRouter / GPT-5.1' },
-    { value: 'anthropic/claude-sonnet-4.6', label: 'OpenRouter / Sonnet 4.6' },
-    { value: 'x-ai/grok-4.1-fast', label: 'OpenRouter / Grok 4.1 Fast' },
+    { value: 'anthropic/claude-opus-4.7', label: 'Claude Opus 4.7' },
+    { value: 'anthropic/claude-sonnet-4.6', label: 'Claude Sonnet 4.6' },
+    { value: 'openai/gpt-5.2', label: 'GPT-5.2 (via OpenRouter)' },
+    { value: 'x-ai/grok-4.1-fast', label: 'Grok 4.1 Fast (via OpenRouter)' },
   ],
 }
 
-interface RecommendationResult {
-  title: string
-  summary: string
-  recommendations: Array<{
-    name: string
-    brand: string
-    type: 'acoustic' | 'electric' | 'bass' | 'classical'
-    priceRangeUsd: { min: number; max: number }
-    reason: string
-  }>
-  nextSteps: Array<string>
+interface PartialRecommendation {
+  name?: string
+  brand?: string
+  type?: 'acoustic' | 'electric' | 'bass' | 'classical' | string
+  priceRangeUsd?: { min?: number; max?: number }
+  reason?: string
+}
+
+interface PartialResult {
+  title?: string
+  summary?: string
+  recommendations?: Array<PartialRecommendation>
+  nextSteps?: Array<string>
 }
 
-interface StreamChunk {
+interface StreamChunkPayload {
   type: string
   delta?: string
   content?: string
@@ -52,6 +76,19 @@ interface StreamChunk {
   message?: string
 }
 
+// Pick the last meaningful sentence/line out of an accumulating reasoning
+// stream so the UI can render a single rolling line of "what it's thinking
+// right now" rather than a growing wall of text.
+function latestThought(reasoning: string): string {
+  const trimmed = reasoning.trimEnd()
+  if (!trimmed) return ''
+  // Prefer the last sentence; fall back to the last newline-delimited line.
+  const sentenceMatch = trimmed.match(/[^.!?\n]+[.!?]?\s*$/)
+  const candidate = sentenceMatch ? sentenceMatch[0] : trimmed
+  const last = candidate.split('\n').filter(Boolean).pop() ?? candidate
+  return last.trim()
+}
+
 function StructuredOutputPage() {
   const [prompt, setPrompt] = useState(SAMPLE_PROMPT)
   const [provider, setProvider] = useState<Provider>('openrouter')
@@ -59,9 +96,13 @@ function StructuredOutputPage() {
     PROVIDER_MODELS.openrouter[0].value,
   )
   const [stream, setStream] = useState(true)
-  const [result, setResult] = useState<RecommendationResult | null>(null)
-  const [streamingText, setStreamingText] = useState<string>('')
+  const [result, setResult] = useState<PartialResult | null>(null)
+  const [rawJson, setRawJson] = useState<string>('')
   const [deltaCount, setDeltaCount] = useState(0)
+  const [isStreaming, setIsStreaming] = useState(false)
+  const [hasFinalResult, setHasFinalResult] = useState(false)
+  const [reasoningLine, setReasoningLine] = useState<string>('')
+  const [reasoningFull, setReasoningFull] = useState<string>('')
   const [error, setError] = useState<string | null>(null)
   const [isLoading, setIsLoading] = useState(false)
   const abortRef = useRef<AbortController | null>(null)
@@ -71,13 +112,21 @@ function StructuredOutputPage() {
     setModel(PROVIDER_MODELS[next][0].value)
   }
 
+  const reset = () => {
+    setResult(null)
+    setRawJson('')
+    setDeltaCount(0)
+    setHasFinalResult(false)
+    setReasoningLine('')
+    setReasoningFull('')
+    setError(null)
+  }
+
   const handleGenerate = async () => {
     if (!prompt.trim()) return
     setIsLoading(true)
-    setError(null)
-    setResult(null)
-    setStreamingText('')
-    setDeltaCount(0)
+    reset()
+    setIsStreaming(stream)
 
     const controller = new AbortController()
     abortRef.current = controller
@@ -104,16 +153,18 @@ function StructuredOutputPage() {
 
       if (!stream) {
         const payload = await response.json()
-        setResult(payload.data as RecommendationResult)
+        setResult(payload.data as PartialResult)
+        setHasFinalResult(true)
         return
       }
 
-      // Streaming path: parse SSE, accumulate text deltas live, and capture
-      // the terminal `structured-output.complete` CUSTOM event.
+      // Streaming path — parse SSE, accumulate raw JSON, render the partially
+      // parsed object live, snap to the validated terminal payload.
       const reader = response.body!.getReader()
       const decoder = new TextDecoder()
       let buffer = ''
       let accumulated = ''
+      let reasoning = ''
       let deltas = 0
 
       while (true) {
@@ -121,7 +172,6 @@ function StructuredOutputPage() {
         if (done) break
         buffer += decoder.decode(value, { stream: true })
 
-        // SSE frames are separated by "\n\n"
         let sepIdx = buffer.indexOf('\n\n')
         while (sepIdx !== -1) {
           const frame = buffer.slice(0, sepIdx)
@@ -132,9 +182,9 @@ function StructuredOutputPage() {
             if (!line.startsWith('data: ')) continue
             const json = line.slice(6).trim()
             if (!json) continue
-            let chunk: StreamChunk
+            let chunk: StreamChunkPayload
             try {
-              chunk = JSON.parse(json) as StreamChunk
+              chunk = JSON.parse(json) as StreamChunkPayload
             } catch {
               continue
             }
@@ -142,14 +192,41 @@ function StructuredOutputPage() {
             if (chunk.type === 'TEXT_MESSAGE_CONTENT' && chunk.delta) {
               accumulated += chunk.delta
               deltas += 1
-              setStreamingText(accumulated)
+              setRawJson(accumulated)
               setDeltaCount(deltas)
+              // partial-json tolerates incomplete JSON — it returns whatever
+              // structure can be inferred. Render it directly so the UI fills
+              // in field by field as the model produces them.
+              const partial = parsePartialJSON(accumulated) as
+                | PartialResult
+                | undefined
+              if (partial && typeof partial === 'object') {
+                setResult(partial)
+              }
+            } else if (
+              chunk.type === 'REASONING_MESSAGE_CONTENT' &&
+              chunk.delta
+            ) {
+              reasoning += chunk.delta
+              setReasoningFull(reasoning)
+              // One-liner: take the last non-empty line/sentence so consumers
+              // see "what it's thinking right now" without a wall of text.
+              setReasoningLine(latestThought(reasoning))
             } else if (
               chunk.type === 'CUSTOM' &&
               chunk.name === 'structured-output.complete' &&
               chunk.value?.object
             ) {
-              setResult(chunk.value.object as RecommendationResult)
+              setResult(chunk.value.object as PartialResult)
+              setHasFinalResult(true)
+              if (
+                typeof (chunk.value as { reasoning?: string }).reasoning ===
+                'string'
+              ) {
+                setReasoningFull(
+                  (chunk.value as { reasoning: string }).reasoning,
+                )
+              }
             } else if (chunk.type === 'RUN_ERROR') {
               throw new Error(chunk.message || 'Stream failed')
             }
@@ -164,12 +241,17 @@ function StructuredOutputPage() {
       }
     } finally {
       setIsLoading(false)
+      setIsStreaming(false)
       abortRef.current = null
     }
   }
 
   const handleAbort = () => abortRef.current?.abort()
 
+  const renderingPartial = isStreaming && !hasFinalResult
+  const recommendations = result?.recommendations ?? []
+  const nextSteps = result?.nextSteps ?? []
+
   return (
     <div className="flex flex-col h-[calc(100vh-72px)] bg-gray-900 text-white">
       <div className="border-b border-orange-500/20 bg-gray-800 px-6 py-4">
@@ -179,9 +261,16 @@ function StructuredOutputPage() {
           <code className="text-orange-400">outputSchema</code>. Toggle{' '}
           <code className="text-orange-400">stream</code> to exercise{' '}
           <code className="text-orange-400">structuredOutputStream</code> on the
-          selected provider; deltas render live while the final{' '}
+          selected provider; the UI fills in progressively via{' '}
+          <code className="text-orange-400">parsePartialJSON</code>, then snaps
+          to the validated payload from the terminal{' '}
           <code className="text-orange-400">structured-output.complete</code>{' '}
-          event populates the parsed result.
+          event. Reasoning models surface a live thinking strip from{' '}
+          <code className="text-orange-400">REASONING_MESSAGE_CONTENT</code>{' '}
+          deltas — openai (Responses API), openrouter, xAI (
+          <code className="text-orange-400">delta.reasoning_content</code>), and
+          Groq (<code className="text-orange-400">delta.reasoning</code>) all
+          stream chain-of-thought.
         </p>
       </div>
 
@@ -267,13 +356,9 @@ function StructuredOutputPage() {
                 Abort
               </button>
             )}
-            {(result || streamingText) && !isLoading && (
+            {(result || rawJson) && !isLoading && (
               <button
-                onClick={() => {
-                  setResult(null)
-                  setStreamingText('')
-                  setDeltaCount(0)
-                }}
+                onClick={reset}
                 className="px-6 py-2 bg-gray-700 hover:bg-gray-600 text-white rounded-lg text-sm font-medium transition-colors"
               >
                 Clear
@@ -287,17 +372,32 @@ function StructuredOutputPage() {
             </div>
           )}
 
-          {streamingText && !result && (
-            <div className="p-4 bg-gray-800/30 border border-gray-700/50 rounded-lg">
-              <div className="flex items-center justify-between mb-2">
-                <p className="text-xs text-gray-400 uppercase tracking-wider">
-                  Streaming JSON
-                </p>
-                <p className="text-xs text-orange-400">{deltaCount} deltas</p>
+          {(reasoningLine || reasoningFull) && (
+            <div className="p-3 bg-purple-500/5 border border-purple-500/20 rounded-lg">
+              <div className="flex items-center gap-2 text-xs text-purple-300/80">
+                <span className="uppercase tracking-wider">Thinking</span>
+                {isStreaming && !hasFinalResult && (
+                  <span className="inline-block w-1.5 h-1.5 rounded-full bg-purple-400 animate-pulse" />
+                )}
               </div>
-              <pre className="text-xs text-gray-300 whitespace-pre-wrap break-words">
-                {streamingText}
-              </pre>
+              <p
+                className="text-sm text-purple-100/90 mt-1 truncate"
+                title={reasoningFull}
+              >
+                {reasoningLine ||
+                  reasoningFull.split('\n').filter(Boolean).slice(-1)[0] ||
+                  '…'}
+              </p>
+              {reasoningFull && reasoningFull !== reasoningLine && (
+                <details className="mt-2">
+                  <summary className="text-xs text-purple-300/60 cursor-pointer">
+                    Full reasoning ({reasoningFull.length} chars)
+                  </summary>
+                  <pre className="text-xs text-purple-100/70 mt-2 whitespace-pre-wrap wrap-break-word">
+                    {reasoningFull}
+                  </pre>
+                </details>
+              )}
             </div>
           )}
 
@@ -305,59 +405,117 @@ function StructuredOutputPage() {
             <div className="space-y-4">
               {stream && deltaCount > 0 && (
                 <p className="text-xs text-gray-500">
-                  Reassembled from {deltaCount} streamed deltas.
+                  {hasFinalResult ? 'Final result' : 'Streaming'} —{' '}
+                  {deltaCount} deltas received
+                  {renderingPartial && (
+                    <span className="ml-1 inline-block w-2 h-2 rounded-full bg-orange-500 animate-pulse" />
+                  )}
                 </p>
               )}
-              <div className="p-4 bg-gray-800/50 border border-gray-700 rounded-lg">
-                <h3 className="text-lg font-semibold text-white">
-                  {result.title}
-                </h3>
-                <p className="text-gray-300 mt-2 text-sm">{result.summary}</p>
-              </div>
 
-              <div className="space-y-3">
-                {result.recommendations.map((rec, i) => (
-                  <div
-                    key={i}
-                    className="p-4 bg-gray-800/50 border border-gray-700 rounded-lg"
-                  >
-                    <div className="flex items-start justify-between gap-3">
-                      <div>
-                        <p className="text-white font-medium">
-                          {rec.brand} {rec.name}
-                        </p>
-                        <p className="text-xs text-orange-400 uppercase tracking-wider mt-0.5">
-                          {rec.type}
-                        </p>
+              {(result.title || renderingPartial) && (
+                <div
+                  className={`p-4 bg-gray-800/50 border border-gray-700 rounded-lg transition-colors ${
+                    renderingPartial && !result.summary
+                      ? 'border-orange-500/30'
+                      : ''
+                  }`}
+                >
+                  <h3 className="text-lg font-semibold text-white">
+                    {result.title || (
+                      <span className="text-gray-500 italic">
+                        Generating title…
+                      </span>
+                    )}
+                    {renderingPartial && result.title && !result.summary && (
+                      <span className="ml-1 inline-block w-1.5 h-4 align-middle bg-orange-400 animate-pulse" />
+                    )}
+                  </h3>
+                  {(result.summary || renderingPartial) && (
+                    <p className="text-gray-300 mt-2 text-sm">
+                      {result.summary || (
+                        <span className="text-gray-500 italic">
+                          Generating summary…
+                        </span>
+                      )}
+                    </p>
+                  )}
+                </div>
+              )}
+
+              {recommendations.length > 0 && (
+                <div className="space-y-3">
+                  {recommendations.map((rec, i) => {
+                    const isLastWhileStreaming =
+                      renderingPartial && i === recommendations.length - 1
+                    return (
+                      <div
+                        key={i}
+                        className={`p-4 bg-gray-800/50 border rounded-lg transition-colors ${
+                          isLastWhileStreaming
+                            ? 'border-orange-500/30'
+                            : 'border-gray-700'
+                        }`}
+                      >
+                        <div className="flex items-start justify-between gap-3">
+                          <div>
+                            <p className="text-white font-medium">
+                              {[rec.brand, rec.name].filter(Boolean).join(' ') ||
+                                (
+                                  <span className="text-gray-500 italic">
+                                    Loading…
+                                  </span>
+                                )}
+                            </p>
+                            {rec.type && (
+                              <p className="text-xs text-orange-400 uppercase tracking-wider mt-0.5">
+                                {rec.type}
+                              </p>
+                            )}
+                          </div>
+                          {rec.priceRangeUsd?.min != null &&
+                            rec.priceRangeUsd.max != null && (
+                              <p className="text-sm text-gray-400 whitespace-nowrap">
+                                ${rec.priceRangeUsd.min} – $
+                                {rec.priceRangeUsd.max}
+                              </p>
+                            )}
+                        </div>
+                        {rec.reason && (
+                          <p className="text-sm text-gray-300 mt-2">
+                            {rec.reason}
+                            {isLastWhileStreaming && (
+                              <span className="ml-1 inline-block w-1.5 h-4 align-middle bg-orange-400 animate-pulse" />
+                            )}
+                          </p>
+                        )}
                       </div>
-                      <p className="text-sm text-gray-400 whitespace-nowrap">
-                        ${rec.priceRangeUsd.min} – ${rec.priceRangeUsd.max}
-                      </p>
-                    </div>
-                    <p className="text-sm text-gray-300 mt-2">{rec.reason}</p>
-                  </div>
-                ))}
-              </div>
+                    )
+                  })}
+                </div>
+              )}
 
-              {result.nextSteps.length > 0 && (
+              {nextSteps.length > 0 && (
                 <div className="p-4 bg-gray-800/50 border border-gray-700 rounded-lg">
                   <p className="text-sm text-gray-400 mb-2">Next Steps</p>
                   <ul className="list-disc list-inside text-sm text-gray-200 space-y-1">
-                    {result.nextSteps.map((step, i) => (
+                    {nextSteps.map((step, i) => (
                       <li key={i}>{step}</li>
                     ))}
                   </ul>
                 </div>
               )}
 
-              <details className="p-4 bg-gray-800/30 border border-gray-700/50 rounded-lg">
-                <summary className="text-sm text-gray-400 cursor-pointer">
-                  Raw JSON
-                </summary>
-                <pre className="text-xs text-gray-300 mt-3 overflow-x-auto">
-                  {JSON.stringify(result, null, 2)}
-                </pre>
-              </details>
+              {rawJson && (
+                <details className="p-4 bg-gray-800/30 border border-gray-700/50 rounded-lg">
+                  <summary className="text-sm text-gray-400 cursor-pointer">
+                    Raw JSON ({rawJson.length} chars)
+                  </summary>
+                  <pre className="text-xs text-gray-300 mt-3 overflow-x-auto wrap-break-word whitespace-pre-wrap">
+                    {rawJson}
+                  </pre>
+                </details>
+              )}
             </div>
           )}
         </div>
diff --git a/packages/typescript/ai-grok/src/adapters/text.ts b/packages/typescript/ai-grok/src/adapters/text.ts
index 951c78a6b..782cefb60 100644
--- a/packages/typescript/ai-grok/src/adapters/text.ts
+++ b/packages/typescript/ai-grok/src/adapters/text.ts
@@ -236,6 +236,7 @@ export class GrokTextAdapter<
     const { chatOptions, outputSchema } = options
     const { logger } = chatOptions
     const timestamp = Date.now()
+    const reasoningMessageId = generateId(this.name)
     const aguiState = {
       runId: chatOptions.runId ?? generateId(this.name),
       threadId: chatOptions.threadId ?? generateId(this.name),
@@ -244,6 +245,7 @@ export class GrokTextAdapter<
       hasEmittedRunStarted: false,
       hasEmittedTextMessageStart: false,
       hasEmittedTextMessageEnd: false,
+      hasEmittedReasoningStart: false,
       hasFinalizedChoice: false,
       deferredUsage: undefined as
         | {
@@ -261,6 +263,7 @@ export class GrokTextAdapter<
     )
 
     let accumulatedContent = ''
+    let accumulatedReasoning = ''
     let currentModel = chatOptions.model
 
     try {
@@ -306,8 +309,62 @@ export class GrokTextAdapter<
         const choice = chunk.choices[0]
         if (!choice) continue
 
+        // xAI reasoning models surface chain-of-thought via `delta.reasoning_content`
+        // (DeepSeek convention); `delta.reasoning` is accepted as a fallback. The
+        // OpenAI SDK doesn't type `reasoning_content`, so both are read via an unknown cast.
+        const deltaUnknown = choice.delta as unknown as {
+          reasoning_content?: string
+          reasoning?: string
+        }
+        const deltaReasoning =
+          deltaUnknown.reasoning_content ?? deltaUnknown.reasoning
+        if (deltaReasoning) {
+          if (!aguiState.hasEmittedReasoningStart) {
+            aguiState.hasEmittedReasoningStart = true
+            yield asChunk({
+              type: 'REASONING_START',
+              messageId: reasoningMessageId,
+              model: currentModel || chatOptions.model,
+              timestamp,
+            })
+            yield asChunk({
+              type: 'REASONING_MESSAGE_START',
+              messageId: reasoningMessageId,
+              role: 'reasoning' as const,
+              model: currentModel || chatOptions.model,
+              timestamp,
+            })
+          }
+          accumulatedReasoning += deltaReasoning
+          yield asChunk({
+            type: 'REASONING_MESSAGE_CONTENT',
+            messageId: reasoningMessageId,
+            delta: deltaReasoning,
+            model: currentModel || chatOptions.model,
+            timestamp,
+          })
+        }
+
         const deltaContent = choice.delta.content
         if (deltaContent) {
+          // Close reasoning before text starts so consumers see the
+          // contractual REASONING_END → TEXT_MESSAGE_START transition.
+          if (aguiState.hasEmittedReasoningStart) {
+            aguiState.hasEmittedReasoningStart = false
+            yield asChunk({
+              type: 'REASONING_MESSAGE_END',
+              messageId: reasoningMessageId,
+              model: currentModel || chatOptions.model,
+              timestamp,
+            })
+            yield asChunk({
+              type: 'REASONING_END',
+              messageId: reasoningMessageId,
+              model: currentModel || chatOptions.model,
+              timestamp,
+            })
+          }
+
           if (!aguiState.hasEmittedTextMessageStart) {
             aguiState.hasEmittedTextMessageStart = true
             yield asChunk({
@@ -367,6 +424,22 @@ export class GrokTextAdapter<
       // RUN_ERROR), never silence.
       const resolvedModel = currentModel || chatOptions.model
 
+      if (aguiState.hasEmittedReasoningStart) {
+        aguiState.hasEmittedReasoningStart = false
+        yield asChunk({
+          type: 'REASONING_MESSAGE_END',
+          messageId: reasoningMessageId,
+          model: resolvedModel,
+          timestamp,
+        })
+        yield asChunk({
+          type: 'REASONING_END',
+          messageId: reasoningMessageId,
+          model: resolvedModel,
+          timestamp,
+        })
+      }
+
       if (
         aguiState.hasEmittedTextMessageStart &&
         !aguiState.hasEmittedTextMessageEnd
@@ -429,6 +502,7 @@ export class GrokTextAdapter<
         value: {
           object: transformed,
           raw: accumulatedContent,
+          ...(accumulatedReasoning ? { reasoning: accumulatedReasoning } : {}),
         },
         model: resolvedModel,
         timestamp,
diff --git a/packages/typescript/ai-grok/tests/grok-adapter.test.ts b/packages/typescript/ai-grok/tests/grok-adapter.test.ts
index e6b24c3a4..1b4cca65e 100644
--- a/packages/typescript/ai-grok/tests/grok-adapter.test.ts
+++ b/packages/typescript/ai-grok/tests/grok-adapter.test.ts
@@ -886,6 +886,134 @@ describe('Grok structuredOutputStream', () => {
     expect(chunks.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
   })
 
+  it('surfaces accumulated reasoning_content on the structured-output.complete event', async () => {
+    // xAI reasoning models stream chain-of-thought via `delta.reasoning_content`
+    // (DeepSeek convention). The OpenAI SDK doesn't type this field but the
+    // runtime payload includes it.
+    const streamChunks = [
+      {
+        id: 'chatcmpl-reason',
+        model: 'grok-4-1-fast-reasoning',
+        choices: [
+          {
+            delta: { reasoning_content: 'Considering the budget... ' },
+            finish_reason: null,
+          },
+        ],
+      },
+      {
+        id: 'chatcmpl-reason',
+        model: 'grok-4-1-fast-reasoning',
+        choices: [
+          {
+            delta: { reasoning_content: 'a Strat would suit them.' },
+            finish_reason: null,
+          },
+        ],
+      },
+      {
+        id: 'chatcmpl-reason',
+        model: 'grok-4-1-fast-reasoning',
+        choices: [
+          {
+            delta: { content: '{"name":"Strat","price":1299}' },
+            finish_reason: 'stop',
+          },
+        ],
+        usage: { prompt_tokens: 10, completion_tokens: 9, total_tokens: 19 },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'grok-4-1-fast-reasoning',
+        messages: [{ role: 'user', content: 'Recommend a guitar' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: {
+          name: { type: 'string' },
+          price: { type: 'number' },
+        },
+        required: ['name', 'price'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    // Reasoning lifecycle events emitted before text
+    const types = chunks.map((c) => c.type)
+    expect(types.indexOf('REASONING_START')).toBeGreaterThanOrEqual(0)
+    expect(types.indexOf('REASONING_MESSAGE_END')).toBeLessThan(
+      types.indexOf('TEXT_MESSAGE_START'),
+    )
+
+    const reasoningChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'REASONING_MESSAGE_CONTENT' }> =>
+        c.type === 'REASONING_MESSAGE_CONTENT',
+    )
+    expect(reasoningChunks).toHaveLength(2)
+
+    const customChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]!.value).toEqual({
+      object: { name: 'Strat', price: 1299 },
+      raw: '{"name":"Strat","price":1299}',
+      reasoning: 'Considering the budget... a Strat would suit them.',
+    })
+  })
+
+  it('omits reasoning from the CUSTOM event when none was streamed', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-noreason',
+        model: 'grok-3',
+        choices: [
+          {
+            delta: { content: '{"name":"Strat","price":1299}' },
+            finish_reason: 'stop',
+          },
+        ],
+        usage: { prompt_tokens: 5, completion_tokens: 9, total_tokens: 14 },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'grok-3',
+        messages: [{ role: 'user', content: 'Recommend a guitar' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: {
+          name: { type: 'string' },
+          price: { type: 'number' },
+        },
+        required: ['name', 'price'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const customChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]!.value).not.toHaveProperty('reasoning')
+  })
+
   it('transforms null values to undefined on the parsed object', async () => {
     const streamChunks = [
       {
diff --git a/packages/typescript/ai-groq/src/adapters/text.ts b/packages/typescript/ai-groq/src/adapters/text.ts
index ae0f3bf3b..1cf33805e 100644
--- a/packages/typescript/ai-groq/src/adapters/text.ts
+++ b/packages/typescript/ai-groq/src/adapters/text.ts
@@ -233,6 +233,7 @@ export class GroqTextAdapter<
     const { chatOptions, outputSchema } = options
     const { logger } = chatOptions
     const timestamp = Date.now()
+    const reasoningMessageId = generateId(this.name)
     const aguiState = {
       runId: chatOptions.runId ?? generateId(this.name),
       threadId: chatOptions.threadId ?? generateId(this.name),
@@ -241,6 +242,7 @@ export class GroqTextAdapter<
       hasEmittedRunStarted: false,
       hasEmittedTextMessageStart: false,
       hasEmittedTextMessageEnd: false,
+      hasEmittedReasoningStart: false,
       hasFinalizedChoice: false,
       deferredUsage: undefined as
         | {
@@ -258,6 +260,7 @@ export class GroqTextAdapter<
     )
 
     let accumulatedContent = ''
+    let accumulatedReasoning = ''
     let currentModel = chatOptions.model
 
     try {
@@ -303,8 +306,62 @@ export class GroqTextAdapter<
         const choice = chunk.choices[0]
         if (!choice) continue
 
+        // With reasoning_format 'parsed', Groq reasoning models (gpt-oss,
+        // qwen3, kimi-k2) stream chain-of-thought via `delta.reasoning`; some
+        // mirror DeepSeek's `delta.reasoning_content`. groq-sdk types neither,
+        // so cast through `unknown` and prefer `reasoning` when both exist.
+        const deltaUnknown = choice.delta as unknown as {
+          reasoning?: string
+          reasoning_content?: string
+        }
+        const deltaReasoning =
+          deltaUnknown.reasoning ?? deltaUnknown.reasoning_content
+        if (deltaReasoning) {
+          if (!aguiState.hasEmittedReasoningStart) {
+            aguiState.hasEmittedReasoningStart = true
+            yield asChunk({
+              type: 'REASONING_START',
+              messageId: reasoningMessageId,
+              model: currentModel || chatOptions.model,
+              timestamp,
+            })
+            yield asChunk({
+              type: 'REASONING_MESSAGE_START',
+              messageId: reasoningMessageId,
+              role: 'reasoning' as const,
+              model: currentModel || chatOptions.model,
+              timestamp,
+            })
+          }
+          accumulatedReasoning += deltaReasoning
+          yield asChunk({
+            type: 'REASONING_MESSAGE_CONTENT',
+            messageId: reasoningMessageId,
+            delta: deltaReasoning,
+            model: currentModel || chatOptions.model,
+            timestamp,
+          })
+        }
+
         const deltaContent = choice.delta.content
         if (deltaContent) {
+          // Close reasoning before text starts.
+          if (aguiState.hasEmittedReasoningStart) {
+            aguiState.hasEmittedReasoningStart = false
+            yield asChunk({
+              type: 'REASONING_MESSAGE_END',
+              messageId: reasoningMessageId,
+              model: currentModel || chatOptions.model,
+              timestamp,
+            })
+            yield asChunk({
+              type: 'REASONING_END',
+              messageId: reasoningMessageId,
+              model: currentModel || chatOptions.model,
+              timestamp,
+            })
+          }
+
           if (!aguiState.hasEmittedTextMessageStart) {
             aguiState.hasEmittedTextMessageStart = true
             yield asChunk({
@@ -367,6 +424,22 @@ export class GroqTextAdapter<
       // RUN_ERROR), never silence.
       const resolvedModel = currentModel || chatOptions.model
 
+      if (aguiState.hasEmittedReasoningStart) {
+        aguiState.hasEmittedReasoningStart = false
+        yield asChunk({
+          type: 'REASONING_MESSAGE_END',
+          messageId: reasoningMessageId,
+          model: resolvedModel,
+          timestamp,
+        })
+        yield asChunk({
+          type: 'REASONING_END',
+          messageId: reasoningMessageId,
+          model: resolvedModel,
+          timestamp,
+        })
+      }
+
       if (
         aguiState.hasEmittedTextMessageStart &&
         !aguiState.hasEmittedTextMessageEnd
@@ -429,6 +502,7 @@ export class GroqTextAdapter<
         value: {
           object: transformed,
           raw: accumulatedContent,
+          ...(accumulatedReasoning ? { reasoning: accumulatedReasoning } : {}),
         },
         model: resolvedModel,
         timestamp,
diff --git a/packages/typescript/ai-groq/tests/groq-adapter.test.ts b/packages/typescript/ai-groq/tests/groq-adapter.test.ts
index 4240aeac4..588772b9c 100644
--- a/packages/typescript/ai-groq/tests/groq-adapter.test.ts
+++ b/packages/typescript/ai-groq/tests/groq-adapter.test.ts
@@ -866,6 +866,136 @@ describe('Groq structuredOutputStream', () => {
     expect(chunks.filter((c) => c.type === 'CUSTOM')).toHaveLength(0)
   })
 
+  it('surfaces accumulated reasoning on the structured-output.complete event', async () => {
+    // Groq reasoning models (gpt-oss, qwen3, kimi-k2) surface reasoning via
+    // `delta.reasoning` when reasoning_format='parsed'. Not typed by groq-sdk.
+    const streamChunks = [
+      {
+        id: 'chatcmpl-reason',
+        model: 'openai/gpt-oss-120b',
+        choices: [
+          {
+            delta: { reasoning: 'Considering the budget... ' },
+            finish_reason: null,
+          },
+        ],
+      },
+      {
+        id: 'chatcmpl-reason',
+        model: 'openai/gpt-oss-120b',
+        choices: [
+          {
+            delta: { reasoning: 'a Strat would suit them.' },
+            finish_reason: null,
+          },
+        ],
+      },
+      {
+        id: 'chatcmpl-reason',
+        model: 'openai/gpt-oss-120b',
+        choices: [
+          {
+            delta: { content: '{"name":"Strat","price":1299}' },
+            finish_reason: 'stop',
+          },
+        ],
+        x_groq: {
+          usage: { prompt_tokens: 10, completion_tokens: 9, total_tokens: 19 },
+        },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createGroqText('openai/gpt-oss-120b', 'test-api-key')
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'openai/gpt-oss-120b',
+        messages: [{ role: 'user', content: 'Recommend a guitar' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: {
+          name: { type: 'string' },
+          price: { type: 'number' },
+        },
+        required: ['name', 'price'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const types = chunks.map((c) => c.type)
+    expect(types.indexOf('REASONING_START')).toBeGreaterThanOrEqual(0)
+    expect(types.indexOf('REASONING_MESSAGE_END')).toBeLessThan(
+      types.indexOf('TEXT_MESSAGE_START'),
+    )
+
+    const reasoningChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'REASONING_MESSAGE_CONTENT' }> =>
+        c.type === 'REASONING_MESSAGE_CONTENT',
+    )
+    expect(reasoningChunks).toHaveLength(2)
+
+    const customChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]!.value).toEqual({
+      object: { name: 'Strat', price: 1299 },
+      raw: '{"name":"Strat","price":1299}',
+      reasoning: 'Considering the budget... a Strat would suit them.',
+    })
+  })
+
+  it('omits reasoning from the CUSTOM event when none was streamed', async () => {
+    const streamChunks = [
+      {
+        id: 'chatcmpl-noreason',
+        model: 'llama-3.3-70b-versatile',
+        choices: [
+          {
+            delta: { content: '{"name":"Strat","price":1299}' },
+            finish_reason: 'stop',
+          },
+        ],
+        x_groq: {
+          usage: { prompt_tokens: 5, completion_tokens: 9, total_tokens: 14 },
+        },
+      },
+    ]
+
+    setupMockSdkClient(streamChunks)
+    const adapter = createAdapter()
+
+    const chunks: Array<StreamChunk> = []
+    for await (const chunk of adapter.structuredOutputStream({
+      chatOptions: {
+        model: 'llama-3.3-70b-versatile',
+        messages: [{ role: 'user', content: 'Recommend a guitar' }],
+        logger: testLogger,
+      },
+      outputSchema: {
+        type: 'object',
+        properties: {
+          name: { type: 'string' },
+          price: { type: 'number' },
+        },
+        required: ['name', 'price'],
+      },
+    })) {
+      chunks.push(chunk)
+    }
+
+    const customChunks = chunks.filter(
+      (c): c is Extract<StreamChunk, { type: 'CUSTOM' }> => c.type === 'CUSTOM',
+    )
+    expect(customChunks).toHaveLength(1)
+    expect(customChunks[0]!.value).not.toHaveProperty('reasoning')
+  })
+
   it('transforms null values to undefined on the parsed object', async () => {
     const streamChunks = [
       {
diff --git a/packages/typescript/ai-openai/src/adapters/text.ts b/packages/typescript/ai-openai/src/adapters/text.ts
index 619aee580..305b7fd65 100644
--- a/packages/typescript/ai-openai/src/adapters/text.ts
+++ b/packages/typescript/ai-openai/src/adapters/text.ts
@@ -269,7 +269,10 @@ export class OpenAITextAdapter<
     const messageId = generateId(this.name)
     let hasEmittedRunStarted = false
     let hasEmittedTextMessageStart = false
+    let hasEmittedReasoningStart = false
+    const reasoningMessageId = generateId(this.name)
     let accumulatedContent = ''
+    let accumulatedReasoning = ''
     let model: string = chatOptions.model
     let usage:
       | { promptTokens: number; completionTokens: number; totalTokens: number }
@@ -351,6 +354,52 @@ export class OpenAITextAdapter<
           return
         }
 
+        // Reasoning deltas (o-series + GPT-5 reasoning models surface a
+        // chain-of-thought stream). Re-emit them as REASONING_MESSAGE_CONTENT
+        // so consumers can show "thinking" UI before any JSON arrives.
+        if (
+          (chunk.type === 'response.reasoning_text.delta' ||
+            chunk.type === 'response.reasoning_summary_text.delta') &&
+          chunk.delta
+        ) {
+          const delta: unknown = chunk.delta
+          const reasoningDelta =
+            typeof delta === 'string'
+              ? delta
+              : Array.isArray(delta)
+                ? delta.join('')
+                : ''
+
+          if (reasoningDelta) {
+            if (!hasEmittedReasoningStart) {
+              hasEmittedReasoningStart = true
+              yield asChunk({
+                type: 'REASONING_START',
+                messageId: reasoningMessageId,
+                model,
+                timestamp,
+              })
+              yield asChunk({
+                type: 'REASONING_MESSAGE_START',
+                messageId: reasoningMessageId,
+                role: 'reasoning' as const,
+                model,
+                timestamp,
+              })
+            }
+
+            accumulatedReasoning += reasoningDelta
+
+            yield asChunk({
+              type: 'REASONING_MESSAGE_CONTENT',
+              messageId: reasoningMessageId,
+              delta: reasoningDelta,
+              model,
+              timestamp,
+            })
+          }
+        }
+
         if (chunk.type === 'response.output_text.delta' && chunk.delta) {
           const textDelta = Array.isArray(chunk.delta)
             ? chunk.delta.join('')
@@ -359,6 +408,24 @@ export class OpenAITextAdapter<
               : ''
 
           if (textDelta) {
+            // Close reasoning before text starts so consumers see the
+            // contractual REASONING_END → TEXT_MESSAGE_START transition.
+            if (hasEmittedReasoningStart) {
+              hasEmittedReasoningStart = false
+              yield asChunk({
+                type: 'REASONING_MESSAGE_END',
+                messageId: reasoningMessageId,
+                model,
+                timestamp,
+              })
+              yield asChunk({
+                type: 'REASONING_END',
+                messageId: reasoningMessageId,
+                model,
+                timestamp,
+              })
+            }
+
             if (!hasEmittedTextMessageStart) {
               hasEmittedTextMessageStart = true
               yield asChunk({
@@ -426,6 +493,22 @@ export class OpenAITextAdapter<
       // Always finalize, even if the upstream stream closed without a
       // `response.completed` event (truncation, transport drop). Otherwise
       // consumers wait forever on a missing terminal event.
+      if (hasEmittedReasoningStart) {
+        hasEmittedReasoningStart = false
+        yield asChunk({
+          type: 'REASONING_MESSAGE_END',
+          messageId: reasoningMessageId,
+          model,
+          timestamp,
+        })
+        yield asChunk({
+          type: 'REASONING_END',
+          messageId: reasoningMessageId,
+          model,
+          timestamp,
+        })
+      }
+
       if (hasEmittedTextMessageStart) {
         yield asChunk({
           type: 'TEXT_MESSAGE_END',
@@ -482,6 +565,9 @@ export class OpenAITextAdapter<
         value: {
           object: transformed,
           raw: accumulatedContent,
+          // Surface accumulated chain-of-thought (if any) for consumers that
+          // only subscribe to the terminal event.
+          ...(accumulatedReasoning ? { reasoning: accumulatedReasoning } : {}),
         },
         model,
         timestamp,

From 0a7f31ab115e50b6888ae77cd22fde1bec5ac8a4 Mon Sep 17 00:00:00 2001
From: "autofix-ci[bot]" <114827586+autofix-ci[bot]@users.noreply.github.com>
Date: Tue, 5 May 2026 06:42:10 +0000
Subject: [PATCH 5/9] ci: apply automated fixes

---
 .../routes/generations.structured-output.tsx    | 17 +++++++++--------
 1 file changed, 9 insertions(+), 8 deletions(-)

diff --git a/examples/ts-react-chat/src/routes/generations.structured-output.tsx b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
index dd0a4fc8f..aa22c244f 100644
--- a/examples/ts-react-chat/src/routes/generations.structured-output.tsx
+++ b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
@@ -405,8 +405,8 @@ function StructuredOutputPage() {
             <div className="space-y-4">
               {stream && deltaCount > 0 && (
                 <p className="text-xs text-gray-500">
-                  {hasFinalResult ? 'Final result' : 'Streaming'} —{' '}
-                  {deltaCount} deltas received
+                  {hasFinalResult ? 'Final result' : 'Streaming'} — {deltaCount}{' '}
+                  deltas received
                   {renderingPartial && (
                     <span className="ml-1 inline-block w-2 h-2 rounded-full bg-orange-500 animate-pulse" />
                   )}
@@ -460,12 +460,13 @@ function StructuredOutputPage() {
                         <div className="flex items-start justify-between gap-3">
                           <div>
                             <p className="text-white font-medium">
-                              {[rec.brand, rec.name].filter(Boolean).join(' ') ||
-                                (
-                                  <span className="text-gray-500 italic">
-                                    Loading…
-                                  </span>
-                                )}
+                              {[rec.brand, rec.name]
+                                .filter(Boolean)
+                                .join(' ') || (
+                                <span className="text-gray-500 italic">
+                                  Loading…
+                                </span>
+                              )}
                             </p>
                             {rec.type && (
                               <p className="text-xs text-orange-400 uppercase tracking-wider mt-0.5">

From b14800e8349d75b2a2cc73ec0638d943195df964 Mon Sep 17 00:00:00 2001
From: Tom Beckenham <34339192+tombeckenham@users.noreply.github.com>
Date: Tue, 5 May 2026 17:27:30 +1000
Subject: [PATCH 6/9] chore(example): default to OpenAI gpt-5.2, drop debug
 logging
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

ts-react-chat /generations/structured-output now opens with the OpenAI
frontier model (gpt-5.2) preselected in both the Provider and Model
dropdowns instead of OpenRouter. Also removes `debug: true` from the
chat() calls — it was only there to inspect provider events while
diagnosing reasoning visibility on gpt-5.2-pro.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 examples/ts-react-chat/src/routes/api.structured-output.ts  | 4 ----
 .../src/routes/generations.structured-output.tsx            | 6 ++----
 2 files changed, 2 insertions(+), 8 deletions(-)

diff --git a/examples/ts-react-chat/src/routes/api.structured-output.ts b/examples/ts-react-chat/src/routes/api.structured-output.ts
index 43a6fe3db..e87a89d70 100644
--- a/examples/ts-react-chat/src/routes/api.structured-output.ts
+++ b/examples/ts-react-chat/src/routes/api.structured-output.ts
@@ -117,9 +117,6 @@ export const Route = createFileRoute('/api/structured-output')({
               messages: [{ role: 'user', content: prompt }],
               outputSchema: GuitarRecommendationSchema,
               stream: true,
-              // Surface adapter request/provider/error logs so we can see
-              // exactly which Responses API events the model is emitting.
-              debug: true,
               abortController,
             }) as AsyncIterable<StreamChunk>
             return toServerSentEventsResponse(streamIterable, {
@@ -132,7 +129,6 @@ export const Route = createFileRoute('/api/structured-output')({
             modelOptions: modelOptions as never,
             messages: [{ role: 'user', content: prompt }],
             outputSchema: GuitarRecommendationSchema,
-            debug: true,
           })
 
           return new Response(JSON.stringify({ data: result }), {
diff --git a/examples/ts-react-chat/src/routes/generations.structured-output.tsx b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
index aa22c244f..74818eb10 100644
--- a/examples/ts-react-chat/src/routes/generations.structured-output.tsx
+++ b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
@@ -91,10 +91,8 @@ function latestThought(reasoning: string): string {
 
 function StructuredOutputPage() {
   const [prompt, setPrompt] = useState(SAMPLE_PROMPT)
-  const [provider, setProvider] = useState<Provider>('openrouter')
-  const [model, setModel] = useState<string>(
-    PROVIDER_MODELS.openrouter[0].value,
-  )
+  const [provider, setProvider] = useState<Provider>('openai')
+  const [model, setModel] = useState<string>(PROVIDER_MODELS.openai[0].value)
   const [stream, setStream] = useState(true)
   const [result, setResult] = useState<PartialResult | null>(null)
   const [rawJson, setRawJson] = useState<string>('')

From 93127701f072f22b7b64e36e36ba54e1abafc4d0 Mon Sep 17 00:00:00 2001
From: Tom Beckenham <34339192+tombeckenham@users.noreply.github.com>
Date: Tue, 5 May 2026 18:02:03 +1000
Subject: [PATCH 7/9] fix(ai): propagate abort signal in streaming structured
 output
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`runStreamingStructuredOutputImpl` never derived `request: { signal }`
from `abortController`, so aborting the SSE response didn't cancel
the upstream provider request — the terminal `structured-output.complete`
event still got yielded after stop. Mirror `TextEngine` and forward
the signal so adapters' underlying network calls actually abort.

Also fix two e2e abort fixtures that wrapped their pacing settings in
`opts: { tokensPerSecond, chunkSize }`, which aimock silently ignores
(the real schema uses a top-level `chunkSize` plus `streamingProfile.tps`).
The fixtures therefore streamed at full speed, so the abort test raced the
response and saw the complete event before the stop could land.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 packages/typescript/ai/src/activities/chat/index.ts      | 7 +++++++
 testing/e2e/fixtures/abort/basic.json                    | 6 ++----
 testing/e2e/fixtures/structured-output-stream/abort.json | 6 ++----
 3 files changed, 11 insertions(+), 8 deletions(-)

diff --git a/packages/typescript/ai/src/activities/chat/index.ts b/packages/typescript/ai/src/activities/chat/index.ts
index 7a3c332c4..0da6fa307 100644
--- a/packages/typescript/ai/src/activities/chat/index.ts
+++ b/packages/typescript/ai/src/activities/chat/index.ts
@@ -1902,11 +1902,18 @@ async function* runStreamingStructuredOutputImpl<TSchema extends SchemaInput>(
     },
   )
 
+  // Adapters consume the abort signal via `chatOptions.request?.signal` and
+  // pass it to the underlying network call. Without this, aborting the SSE
+  // response never cancels the upstream provider request and a terminal
+  // structured-output.complete event still gets yielded after stop.
   const structuredChatOptions = {
     ...structuredTextOptions,
     model,
     messages: finalMessages,
     logger,
+    request: textOptions.abortController
+      ? { signal: textOptions.abortController.signal }
+      : undefined,
   }
 
   // Adapters that don't implement structuredOutputStream natively fall back
diff --git a/testing/e2e/fixtures/abort/basic.json b/testing/e2e/fixtures/abort/basic.json
index 98e112516..312e2bf5b 100644
--- a/testing/e2e/fixtures/abort/basic.json
+++ b/testing/e2e/fixtures/abort/basic.json
@@ -7,10 +7,8 @@
       "response": {
         "content": "Once upon a time in a land far away there lived a guitar maker who spent decades perfecting the art of crafting beautiful instruments from the finest tonewoods available in the forests nearby and each guitar was unique and special and every single one had its own story to tell about the wood and the craftsmanship that went into making it a truly remarkable piece of art and the customers would come from miles around just to see the collection and hear the stories behind each instrument that hung on the walls of the little shop on the corner of Main Street in the small town where everyone knew each other by name and the guitar maker would spend hours talking to each customer about the history and character of every guitar in the shop telling tales of the trees that provided the wood and the journeys those trees had taken before becoming part of something so beautiful and musical"
       },
-      "opts": {
-        "tokensPerSecond": 1,
-        "chunkSize": 2
-      }
+      "chunkSize": 2,
+      "streamingProfile": { "tps": 5 }
     }
   ]
 }
diff --git a/testing/e2e/fixtures/structured-output-stream/abort.json b/testing/e2e/fixtures/structured-output-stream/abort.json
index 6ed750774..f1dd6dfba 100644
--- a/testing/e2e/fixtures/structured-output-stream/abort.json
+++ b/testing/e2e/fixtures/structured-output-stream/abort.json
@@ -7,10 +7,8 @@
       "response": {
         "content": "{\"name\":\"Fender Stratocaster\",\"price\":1299,\"reason\":\"Versatile tone and comfortable playability across many genres including blues rock jazz country and pop with a wide tonal palette\",\"rating\":5}"
       },
-      "opts": {
-        "tokensPerSecond": 1,
-        "chunkSize": 2
-      }
+      "chunkSize": 2,
+      "streamingProfile": { "tps": 5 }
     }
   ]
 }

From 99f4287ae59dfda90743c14aaeb8ea9ddb45a399 Mon Sep 17 00:00:00 2001
From: Tom Beckenham <34339192+tombeckenham@users.noreply.github.com>
Date: Tue, 5 May 2026 18:16:05 +1000
Subject: [PATCH 8/9] fix(ai): address CodeRabbit review feedback on streaming
 structured output

- Short-circuit structured output stream when agent loop yields RUN_ERROR
- Emit RUN_STARTED for empty streams in openrouter finalization path
- Capture trailing usage chunks (empty choices) in grok adapter
- Sanitize SDK errors via toRunErrorPayload in grok structuredOutputStream
- Validate POST body with zod and propagate abort signal through non-streaming chat() in example
- Flush TextDecoder, throw if structured-output.complete missing, sync reasoningLine, link form labels in example UI
- Correct changeset wording and update e2e fallback comment + abort prefix doc

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../streaming-structured-output-chat.md       |  2 +-
 .../src/routes/api.structured-output.ts       | 35 ++++++++----
 .../routes/generations.structured-output.tsx  | 53 +++++++++++++++----
 .../typescript/ai-grok/src/adapters/text.ts   | 23 ++++----
 .../ai-openrouter/src/adapters/text.ts        | 14 +++++
 .../ai/src/activities/chat/index.ts           | 15 ++++++
 testing/e2e/README.md                         |  2 +-
 testing/e2e/src/lib/feature-support.ts        |  5 +-
 8 files changed, 116 insertions(+), 33 deletions(-)

diff --git a/.changeset/streaming-structured-output-chat.md b/.changeset/streaming-structured-output-chat.md
index 68aa7302f..4cdc22452 100644
--- a/.changeset/streaming-structured-output-chat.md
+++ b/.changeset/streaming-structured-output-chat.md
@@ -2,4 +2,4 @@
 '@tanstack/ai': minor
 ---
 
-feat: `chat({ outputSchema, stream: true })` returns `AsyncIterable<StreamChunk>` with raw JSON deltas plus a final `CUSTOM` `structured-output.complete` event carrying the validated parsed object. The existing `chat({ outputSchema })` (non-streaming) path is unchanged. Adapters expose this via a new optional `structuredOutputStream` method on `TextAdapter`; `BaseTextAdapter` provides a default that wraps the non-streaming `structuredOutput` so adapters without native streaming JSON support still satisfy the new combination.
+feat: `chat({ outputSchema, stream: true })` returns `AsyncIterable<StreamChunk>` with raw JSON deltas plus a final `CUSTOM` `structured-output.complete` event carrying the validated parsed object. The existing `chat({ outputSchema })` (non-streaming) path is unchanged. Adapters expose this via a new optional `structuredOutputStream` method on `TextAdapter`. Adapters that omit the method fall back to the activity layer's `fallbackStructuredOutputStream`, which wraps the non-streaming `structuredOutput` call so adapters without native streaming JSON support still satisfy the new combination.
diff --git a/examples/ts-react-chat/src/routes/api.structured-output.ts b/examples/ts-react-chat/src/routes/api.structured-output.ts
index e87a89d70..57618576c 100644
--- a/examples/ts-react-chat/src/routes/api.structured-output.ts
+++ b/examples/ts-react-chat/src/routes/api.structured-output.ts
@@ -27,6 +27,13 @@ const GuitarRecommendationSchema = z.object({
 
 type Provider = 'openai' | 'grok' | 'groq' | 'openrouter'
 
+const StructuredOutputRequestSchema = z.object({
+  prompt: z.string().min(1),
+  provider: z.enum(['openai', 'grok', 'groq', 'openrouter']).optional(),
+  model: z.string().optional(),
+  stream: z.boolean().optional(),
+})
+
 function adapterFor(provider: Provider, model?: string): AnyTextAdapter {
   switch (provider) {
     case 'openai':
@@ -94,16 +101,21 @@ export const Route = createFileRoute('/api/structured-output')({
   server: {
     handlers: {
       POST: async ({ request }) => {
-        const body = await request.json()
-        const { prompt, provider, model, stream } = body as {
-          prompt: string
-          provider?: Provider
-          model?: string
-          stream?: boolean
-        }
-        const resolvedProvider: Provider = provider || 'openrouter'
-
         try {
+          const parsed = StructuredOutputRequestSchema.safeParse(
+            await request.json(),
+          )
+          if (!parsed.success) {
+            return new Response(
+              JSON.stringify({ error: 'Invalid request body' }),
+              {
+                status: 400,
+                headers: { 'Content-Type': 'application/json' },
+              },
+            )
+          }
+          const { prompt, provider, model, stream } = parsed.data
+          const resolvedProvider: Provider = provider || 'openrouter'
           const modelOptions = reasoningOptionsFor(resolvedProvider, model)
 
           if (stream) {
@@ -124,11 +136,16 @@ export const Route = createFileRoute('/api/structured-output')({
             })
           }
 
+          const abortController = new AbortController()
+          request.signal.addEventListener('abort', () =>
+            abortController.abort(),
+          )
           const result = await chat({
             adapter: adapterFor(resolvedProvider, model),
             modelOptions: modelOptions as never,
             messages: [{ role: 'user', content: prompt }],
             outputSchema: GuitarRecommendationSchema,
+            abortController,
           })
 
           return new Response(JSON.stringify({ data: result }), {
diff --git a/examples/ts-react-chat/src/routes/generations.structured-output.tsx b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
index 74818eb10..a081912a3 100644
--- a/examples/ts-react-chat/src/routes/generations.structured-output.tsx
+++ b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
@@ -90,6 +90,9 @@ function latestThought(reasoning: string): string {
 }
 
 function StructuredOutputPage() {
+  const providerId = 'structured-output-provider'
+  const modelId = 'structured-output-model'
+  const promptId = 'structured-output-prompt'
   const [prompt, setPrompt] = useState(SAMPLE_PROMPT)
   const [provider, setProvider] = useState<Provider>('openai')
   const [model, setModel] = useState<string>(PROVIDER_MODELS.openai[0].value)
@@ -164,12 +167,9 @@ function StructuredOutputPage() {
       let accumulated = ''
       let reasoning = ''
       let deltas = 0
+      let sawComplete = false
 
-      while (true) {
-        const { done, value } = await reader.read()
-        if (done) break
-        buffer += decoder.decode(value, { stream: true })
-
+      const processBuffer = () => {
         let sepIdx = buffer.indexOf('\n\n')
         while (sepIdx !== -1) {
           const frame = buffer.slice(0, sepIdx)
@@ -215,15 +215,18 @@ function StructuredOutputPage() {
               chunk.name === 'structured-output.complete' &&
               chunk.value?.object
             ) {
+              sawComplete = true
               setResult(chunk.value.object as PartialResult)
               setHasFinalResult(true)
               if (
                 typeof (chunk.value as { reasoning?: string }).reasoning ===
                 'string'
               ) {
-                setReasoningFull(
-                  (chunk.value as { reasoning: string }).reasoning,
-                )
+                const finalReasoning = (
+                  chunk.value as { reasoning: string }
+                ).reasoning
+                setReasoningFull(finalReasoning)
+                setReasoningLine(latestThought(finalReasoning))
               }
             } else if (chunk.type === 'RUN_ERROR') {
               throw new Error(chunk.message || 'Stream failed')
@@ -231,6 +234,22 @@ function StructuredOutputPage() {
           }
         }
       }
+
+      while (true) {
+        const { done, value } = await reader.read()
+        if (done) break
+        buffer += decoder.decode(value, { stream: true })
+        processBuffer()
+      }
+
+      // Flush any buffered bytes from incomplete multi-byte UTF-8 sequences
+      // so the final SSE frame isn't dropped.
+      buffer += decoder.decode()
+      processBuffer()
+
+      if (!sawComplete) {
+        throw new Error('Stream ended before structured-output.complete')
+      }
     } catch (err) {
       if (err instanceof Error && err.name === 'AbortError') {
         setError('Aborted')
@@ -276,8 +295,14 @@ function StructuredOutputPage() {
         <div className="max-w-2xl mx-auto space-y-6">
           <div className="grid grid-cols-2 gap-3">
             <div className="space-y-2">
-              <label className="text-sm text-gray-400">Provider</label>
+              <label
+                htmlFor={providerId}
+                className="text-sm text-gray-400"
+              >
+                Provider
+              </label>
               <select
+                id={providerId}
                 value={provider}
                 onChange={(e) => onProviderChange(e.target.value as Provider)}
                 disabled={isLoading}
@@ -290,8 +315,11 @@ function StructuredOutputPage() {
               </select>
             </div>
             <div className="space-y-2">
-              <label className="text-sm text-gray-400">Model</label>
+              <label htmlFor={modelId} className="text-sm text-gray-400">
+                Model
+              </label>
               <select
+                id={modelId}
                 value={model}
                 onChange={(e) => setModel(e.target.value)}
                 disabled={isLoading}
@@ -323,8 +351,11 @@ function StructuredOutputPage() {
           </label>
 
           <div className="space-y-3">
-            <label className="text-sm text-gray-400">Prompt</label>
+            <label htmlFor={promptId} className="text-sm text-gray-400">
+              Prompt
+            </label>
             <textarea
+              id={promptId}
               value={prompt}
               onChange={(e) => setPrompt(e.target.value)}
               placeholder="Describe what you want recommendations for..."
diff --git a/packages/typescript/ai-grok/src/adapters/text.ts b/packages/typescript/ai-grok/src/adapters/text.ts
index 782cefb60..95e382e27 100644
--- a/packages/typescript/ai-grok/src/adapters/text.ts
+++ b/packages/typescript/ai-grok/src/adapters/text.ts
@@ -1,5 +1,6 @@
 import { APIUserAbortError } from 'openai'
 import { BaseTextAdapter } from '@tanstack/ai/adapters'
+import { toRunErrorPayload } from '@tanstack/ai/adapter-internals'
 import { validateTextProviderOptions } from '../text/text-provider-options'
 import { convertToolsToProviderFormat } from '../tools'
 import {
@@ -295,6 +296,18 @@ export class GrokTextAdapter<
         logger.provider(`provider=grok`, { chunk })
         if (chunk.model) currentModel = chunk.model
 
+        // OpenAI-compatible streams with `stream_options: { include_usage: true }`
+        // deliver the final usage payload in a trailing chunk whose `choices`
+        // array is empty. Capture usage outside the choice branch so it's
+        // never dropped.
+        if (chunk.usage) {
+          aguiState.deferredUsage = {
+            promptTokens: chunk.usage.prompt_tokens || 0,
+            completionTokens: chunk.usage.completion_tokens || 0,
+            totalTokens: chunk.usage.total_tokens || 0,
+          }
+        }
+
         if (!aguiState.hasEmittedRunStarted) {
           aguiState.hasEmittedRunStarted = true
           yield asChunk({
@@ -389,14 +402,6 @@ export class GrokTextAdapter<
         }
 
         if (choice.finish_reason) {
-          if (chunk.usage) {
-            aguiState.deferredUsage = {
-              promptTokens: chunk.usage.prompt_tokens || 0,
-              completionTokens: chunk.usage.completion_tokens || 0,
-              totalTokens: chunk.usage.total_tokens || 0,
-            }
-          }
-
           if (!aguiState.hasFinalizedChoice) {
             aguiState.hasFinalizedChoice = true
             aguiState.computedFinishReason =
@@ -519,7 +524,7 @@ export class GrokTextAdapter<
       })
     } catch (error) {
       logger.errors('grok.structuredOutputStream fatal', {
-        error,
+        error: toRunErrorPayload(error, 'grok.structuredOutputStream failed'),
         source: 'grok.structuredOutputStream',
       })
       if (!aguiState.hasEmittedRunStarted) {
diff --git a/packages/typescript/ai-openrouter/src/adapters/text.ts b/packages/typescript/ai-openrouter/src/adapters/text.ts
index 8ef62a882..d9004e0d8 100644
--- a/packages/typescript/ai-openrouter/src/adapters/text.ts
+++ b/packages/typescript/ai-openrouter/src/adapters/text.ts
@@ -381,6 +381,20 @@ export class OpenRouterTextAdapter<
       // owe consumers a CUSTOM + RUN_FINISHED (or RUN_ERROR), never silence.
       const resolvedModel = currentModel || chatOptions.model
 
+      // A truly empty stream (zero chunks) never enters processChoice, so
+      // RUN_STARTED was never emitted. Mirror the catch-block guard so the
+      // AG-UI lifecycle (RUN_STARTED → RUN_ERROR/FINISHED) is preserved.
+      if (!aguiState.hasEmittedRunStarted) {
+        aguiState.hasEmittedRunStarted = true
+        yield asChunk({
+          type: 'RUN_STARTED',
+          runId: aguiState.runId,
+          threadId: aguiState.threadId,
+          model: resolvedModel,
+          timestamp,
+        })
+      }
+
       if (aguiState.reasoningMessageId && !aguiState.hasClosedReasoning) {
         aguiState.hasClosedReasoning = true
         yield asChunk({
diff --git a/packages/typescript/ai/src/activities/chat/index.ts b/packages/typescript/ai/src/activities/chat/index.ts
index 0da6fa307..7cc634add 100644
--- a/packages/typescript/ai/src/activities/chat/index.ts
+++ b/packages/typescript/ai/src/activities/chat/index.ts
@@ -1857,11 +1857,22 @@ async function* runStreamingStructuredOutputImpl<TSchema extends SchemaInput>(
     // The structured-output stream emits its own RUN_STARTED + RUN_FINISHED
     // pair to bracket the run — drop both from the engine's output so
     // consumers see exactly one terminal lifecycle pair.
+    let agentLoopErrored = false
     try {
       for await (const chunk of engine.run()) {
         if (chunk.type === 'RUN_STARTED' || chunk.type === 'RUN_FINISHED') {
           continue
         }
+        if (chunk.type === 'RUN_ERROR') {
+          // The engine yielded RUN_ERROR without throwing (provider error mid
+          // agent loop). Forward it and flag the run so the post-loop guard
+          // skips structuredOutputStream — otherwise consumers would see a
+          // confusing RUN_ERROR → RUN_STARTED → structured-output.complete
+          // sequence and we'd bill another provider call after a failed run.
+          agentLoopErrored = true
+          yield chunk
+          continue
+        }
         yield chunk
       }
     } catch (engineError) {
@@ -1882,6 +1893,10 @@ async function* runStreamingStructuredOutputImpl<TSchema extends SchemaInput>(
       return
     }
 
+    if (agentLoopErrored) {
+      return
+    }
+
     finalMessages = engine.getMessages()
   }
 
diff --git a/testing/e2e/README.md b/testing/e2e/README.md
index 285620db4..856631724 100644
--- a/testing/e2e/README.md
+++ b/testing/e2e/README.md
@@ -123,7 +123,7 @@ Clean up the fixture:
 }
 ```
 
-Existing prefixes: `[chat]`, `[oneshot]`, `[reasoning]`, `[multiturn-1]`, `[multiturn-2]`, `[toolcall]`, `[parallel]`, `[approval]`, `[approval-deny]`, `[text-tool-text]`, `[structured]`, `[structured-stream]`, `[agentic]`, `[mmimage]`, `[mmstruct]`, `[summarize]`, `[imagegen]`, `[tts]`, `[transcription]`, `[abort-test]`, `[error-test]`.
+Existing prefixes: `[chat]`, `[oneshot]`, `[reasoning]`, `[multiturn-1]`, `[multiturn-2]`, `[toolcall]`, `[parallel]`, `[approval]`, `[approval-deny]`, `[text-tool-text]`, `[structured]`, `[structured-stream]`, `[structured-stream-abort]`, `[agentic]`, `[mmimage]`, `[mmstruct]`, `[summarize]`, `[imagegen]`, `[tts]`, `[transcription]`, `[abort-test]`, `[error-test]`.
 
 ## 4. Writing a Test
 
diff --git a/testing/e2e/src/lib/feature-support.ts b/testing/e2e/src/lib/feature-support.ts
index e1347c2db..0f1ca4a02 100644
--- a/testing/e2e/src/lib/feature-support.ts
+++ b/testing/e2e/src/lib/feature-support.ts
@@ -81,8 +81,9 @@ export const matrix: Record<Feature, Set<Provider>> = {
     'openrouter',
   ]),
   // Streaming structured output: only providers with native streaming JSON
-  // schema support are listed here. Other providers fall back to the default
-  // BaseTextAdapter implementation but aren't exercised by E2E yet.
+  // schema support are listed here. Other providers fall back to the
+  // activity-layer `fallbackStructuredOutputStream` (which wraps the
+  // non-streaming `structuredOutput`) but aren't exercised by E2E yet.
   'structured-output-stream': new Set(['openai', 'groq', 'grok', 'openrouter']),
   'agentic-structured': new Set([
     'openai',

From c3b9f03733d58ab1e424e5016b099b27e946fd89 Mon Sep 17 00:00:00 2001
From: "autofix-ci[bot]" <114827586+autofix-ci[bot]@users.noreply.github.com>
Date: Tue, 5 May 2026 08:17:18 +0000
Subject: [PATCH 9/9] ci: apply automated fixes

---
 .../src/routes/generations.structured-output.tsx       | 10 +++-------
 1 file changed, 3 insertions(+), 7 deletions(-)

diff --git a/examples/ts-react-chat/src/routes/generations.structured-output.tsx b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
index a081912a3..831bcebdd 100644
--- a/examples/ts-react-chat/src/routes/generations.structured-output.tsx
+++ b/examples/ts-react-chat/src/routes/generations.structured-output.tsx
@@ -222,9 +222,8 @@ function StructuredOutputPage() {
                 typeof (chunk.value as { reasoning?: string }).reasoning ===
                 'string'
               ) {
-                const finalReasoning = (
-                  chunk.value as { reasoning: string }
-                ).reasoning
+                const finalReasoning = (chunk.value as { reasoning: string })
+                  .reasoning
                 setReasoningFull(finalReasoning)
                 setReasoningLine(latestThought(finalReasoning))
               }
@@ -295,10 +294,7 @@ function StructuredOutputPage() {
         <div className="max-w-2xl mx-auto space-y-6">
           <div className="grid grid-cols-2 gap-3">
             <div className="space-y-2">
-              <label
-                htmlFor={providerId}
-                className="text-sm text-gray-400"
-              >
+              <label htmlFor={providerId} className="text-sm text-gray-400">
                 Provider
               </label>
               <select