From 0868f202c3e0e630c506789e7e0b812f1ebf8801 Mon Sep 17 00:00:00 2001
From: Matt Apperson <me@mattapperson.com>
Date: Thu, 30 Oct 2025 15:00:04 -0400
Subject: [PATCH 1/4] Add getResponse API with multiple consumption patterns

Implements a new client.getResponse() method that provides flexible ways to consume streaming responses:

- await response.text - Get complete text
- await response.message - Get complete AssistantMessage
- response.textStream - Stream text deltas
- response.newMessagesStream - Stream incremental AssistantMessage updates
- response.reasoningStream - Stream reasoning deltas
- response.toolStream - Stream tool call deltas
- response.fullResponsesStream - Stream all raw events
- response.fullChatStream - Stream in chat-compatible format

All consumption patterns support both concurrent and sequential access, allowing users to mix and match approaches as needed.

Key implementation details:
- ReusableReadableStream enables multiple concurrent consumers without blocking
- ResponseWrapper provides lazy initialization with cached promises
- Stream transformers convert ResponsesAPI events to different formats
- Returns AssistantMessage type for consistency with chat API

Tests: 19 passing, 1 skipped (model unavailable)
---
 src/funcs/getResponse.ts       |  62 ++++
 src/index.ts                   |   5 +
 src/lib/response-wrapper.ts    | 257 +++++++++++++++
 src/lib/reusable-stream.ts     | 196 +++++++++++
 src/lib/stream-transformers.ts | 201 +++++++++++
 src/sdk/sdk.ts                 |  48 +++
 tests/e2e/getResponse.test.ts  | 586 +++++++++++++++++++++++++++++++++
 tests/e2e/responses.test.ts    |   3 +-
 8 files changed, 1357 insertions(+), 1 deletion(-)
 create mode 100644 src/funcs/getResponse.ts
 create mode 100644 src/lib/response-wrapper.ts
 create mode 100644 src/lib/reusable-stream.ts
 create mode 100644 src/lib/stream-transformers.ts
 create mode 100644 tests/e2e/getResponse.test.ts

diff --git a/src/funcs/getResponse.ts b/src/funcs/getResponse.ts
new file mode 100644
index 00000000..d03d6a2a
--- /dev/null
+++ b/src/funcs/getResponse.ts
@@ -0,0 +1,62 @@
+import { OpenRouterCore } from "../core.js";
+import { RequestOptions } from "../lib/sdks.js";
+import { ResponseWrapper } from "../lib/response-wrapper.js";
+import * as models from "../models/index.js";
+
+/**
+ * Get a response with multiple consumption patterns
+ *
+ * @remarks
+ * Creates a response using the OpenResponses API in streaming mode and returns
+ * a wrapper that allows consuming the response in multiple ways:
+ *
+ * - `await response.message` - Get the completed message
+ * - `await response.text` - Get just the text content
+ * - `for await (const delta of response.textStream)` - Stream text deltas
+ * - `for await (const delta of response.reasoningStream)` - Stream reasoning deltas
+ * - `for await (const delta of response.toolStream)` - Stream tool call argument deltas
+ * - `for await (const msg of response.newMessagesStream)` - Stream incremental message updates
+ * - `for await (const event of response.fullResponsesStream)` - Stream all response events
+ * - `for await (const chunk of response.fullChatStream)` - Stream in chat-compatible format
+ *
+ * All consumption patterns can be used concurrently on the same response.
+ *
+ * @example
+ * ```typescript
+ * // Simple text extraction
+ * const response = await openrouter.beta.responses.get({
+ *   model: "anthropic/claude-3-opus",
+ *   input: [{ role: "user", content: "Hello!" }]
+ * });
+ * const text = await response.text;
+ * console.log(text);
+ *
+ * // Streaming text
+ * const response = openrouter.beta.responses.get({
+ *   model: "anthropic/claude-3-opus",
+ *   input: [{ role: "user", content: "Hello!" }]
+ * });
+ * for await (const delta of response.textStream) {
+ *   process.stdout.write(delta);
+ * }
+ *
+ * // Full message with metadata
+ * const response = openrouter.beta.responses.get({
+ *   model: "anthropic/claude-3-opus",
+ *   input: [{ role: "user", content: "Hello!" }]
+ * });
+ * const message = await response.message;
+ * console.log(message.content);
+ * ```
+ */
+export function getResponse(
+  client: OpenRouterCore,
+  request: Omit<models.OpenResponsesRequest, "stream">,
+  options?: RequestOptions,
+): ResponseWrapper {
+  return new ResponseWrapper({
+    client,
+    request: { ...request },
+    options: options ?? {},
+  });
+}
diff --git a/src/index.ts b/src/index.ts
index dbcba164..734a437d 100644
--- a/src/index.ts
+++ b/src/index.ts
@@ -6,4 +6,9 @@ export * from "./lib/config.js";
 export * as files from "./lib/files.js";
 export { HTTPClient } from "./lib/http.js";
 export type { Fetcher, HTTPClientOptions } from "./lib/http.js";
+// #region imports
+export { ResponseWrapper } from "./lib/response-wrapper.js";
+export type { GetResponseOptions } from "./lib/response-wrapper.js";
+export { ReusableReadableStream } from "./lib/reusable-stream.js";
+// #endregion
 export * from "./sdk/sdk.js";
diff --git a/src/lib/response-wrapper.ts b/src/lib/response-wrapper.ts
new file mode 100644
index 00000000..2ccba944
--- /dev/null
+++ b/src/lib/response-wrapper.ts
@@ -0,0 +1,257 @@
+import { OpenRouterCore } from "../core.js";
+import { EventStream } from "./event-streams.js";
+import { RequestOptions } from "./sdks.js";
+import * as models from "../models/index.js";
+import { betaResponsesSend } from "../funcs/betaResponsesSend.js";
+import { ReusableReadableStream } from "./reusable-stream.js";
+import {
+  extractTextDeltas,
+  extractReasoningDeltas,
+  extractToolDeltas,
+  buildMessageStream,
+  consumeStreamForCompletion,
+  extractMessageFromResponse,
+  extractTextFromResponse,
+} from "./stream-transformers.js";
+
+export interface GetResponseOptions {
+  request: models.OpenResponsesRequest;
+  client: OpenRouterCore;
+  options?: RequestOptions;
+}
+
+/**
+ * A wrapper around a streaming response that provides multiple consumption patterns.
+ *
+ * Allows consuming the response in multiple ways:
+ * - `await response.message` - Get the completed message
+ * - `await response.text` - Get just the text
+ * - `for await (const delta of response.textStream)` - Stream text deltas
+ * - `for await (const msg of response.messageStream)` - Stream incremental message updates
+ * - `for await (const event of response.fullResponsesStream)` - Stream all response events
+ *
+ * All consumption patterns can be used concurrently thanks to the underlying
+ * ReusableReadableStream implementation.
+ */
+export class ResponseWrapper {
+  private reusableStream: ReusableReadableStream<models.OpenResponsesStreamEvent> | null = null;
+  private streamPromise: Promise<EventStream<models.OpenResponsesStreamEvent>> | null = null;
+  private messagePromise: Promise<models.AssistantMessage> | null = null;
+  private textPromise: Promise<string> | null = null;
+  private options: GetResponseOptions;
+  private initPromise: Promise<void> | null = null;
+
+  constructor(options: GetResponseOptions) {
+    this.options = options;
+  }
+
+  /**
+   * Initialize the stream if not already started
+   * This is idempotent - multiple calls will return the same promise
+   */
+  private initStream(): Promise<void> {
+    if (this.initPromise) {
+      return this.initPromise;
+    }
+
+    this.initPromise = (async () => {
+      // Force stream mode
+      const request = { ...this.options.request, stream: true as const };
+
+      // Create the stream promise
+      this.streamPromise = betaResponsesSend(
+        this.options.client,
+        request,
+        this.options.options,
+      ).then((result) => {
+        if (!result.ok) {
+          throw result.error;
+        }
+        return result.value;
+      });
+
+      // Wait for the stream and create the reusable stream
+      const eventStream = await this.streamPromise;
+      this.reusableStream = new ReusableReadableStream(eventStream);
+    })();
+
+    return this.initPromise;
+  }
+
+  /**
+   * Get the completed message from the response.
+   * This will consume the stream until completion and extract the first message.
+   * Returns an AssistantMessage in chat format.
+   */
+  get message(): Promise<models.AssistantMessage> {
+    if (this.messagePromise) {
+      return this.messagePromise;
+    }
+
+    this.messagePromise = (async (): Promise<models.AssistantMessage> => {
+      await this.initStream();
+      if (!this.reusableStream) {
+        throw new Error("Stream not initialized");
+      }
+
+      const completedResponse = await consumeStreamForCompletion(this.reusableStream);
+      return extractMessageFromResponse(completedResponse);
+    })();
+
+    return this.messagePromise;
+  }
+
+  /**
+   * Get just the text content from the response.
+   * This will consume the stream until completion and extract the text.
+   */
+  get text(): Promise<string> {
+    if (this.textPromise) {
+      return this.textPromise;
+    }
+
+    this.textPromise = (async () => {
+      await this.initStream();
+      if (!this.reusableStream) {
+        throw new Error("Stream not initialized");
+      }
+
+      const completedResponse = await consumeStreamForCompletion(this.reusableStream);
+      return extractTextFromResponse(completedResponse);
+    })();
+
+    return this.textPromise;
+  }
+
+  /**
+   * Stream all response events as they arrive.
+   * Multiple consumers can iterate over this stream concurrently.
+   */
+  get fullResponsesStream(): AsyncIterableIterator<models.OpenResponsesStreamEvent> {
+    return (async function* (this: ResponseWrapper) {
+      await this.initStream();
+      if (!this.reusableStream) {
+        throw new Error("Stream not initialized");
+      }
+
+      const consumer = this.reusableStream.createConsumer();
+      yield* consumer;
+    }.call(this));
+  }
+
+  /**
+   * Stream only text deltas as they arrive.
+   * This filters the full event stream to only yield text content.
+   */
+  get textStream(): AsyncIterableIterator<string> {
+    return (async function* (this: ResponseWrapper) {
+      await this.initStream();
+      if (!this.reusableStream) {
+        throw new Error("Stream not initialized");
+      }
+
+      yield* extractTextDeltas(this.reusableStream);
+    }.call(this));
+  }
+
+  /**
+   * Stream incremental message updates as content is added.
+   * Each iteration yields an updated version of the message with new content.
+   * Returns AssistantMessage in chat format.
+   */
+  get newMessagesStream(): AsyncIterableIterator<models.AssistantMessage> {
+    return (async function* (this: ResponseWrapper) {
+      await this.initStream();
+      if (!this.reusableStream) {
+        throw new Error("Stream not initialized");
+      }
+
+      yield* buildMessageStream(this.reusableStream);
+    }.call(this));
+  }
+
+  /**
+   * Stream only reasoning deltas as they arrive.
+   * This filters the full event stream to only yield reasoning content.
+   */
+  get reasoningStream(): AsyncIterableIterator<string> {
+    return (async function* (this: ResponseWrapper) {
+      await this.initStream();
+      if (!this.reusableStream) {
+        throw new Error("Stream not initialized");
+      }
+
+      yield* extractReasoningDeltas(this.reusableStream);
+    }.call(this));
+  }
+
+  /**
+   * Stream only tool call argument deltas as they arrive.
+   * This filters the full event stream to only yield function call arguments.
+   */
+  get toolStream(): AsyncIterableIterator<string> {
+    return (async function* (this: ResponseWrapper) {
+      await this.initStream();
+      if (!this.reusableStream) {
+        throw new Error("Stream not initialized");
+      }
+
+      yield* extractToolDeltas(this.reusableStream);
+    }.call(this));
+  }
+
+  /**
+   * Stream events in chat format (compatibility layer).
+   * Note: This transforms responses API events into a chat-like format.
+   *
+   * @remarks
+   * This is a compatibility method that attempts to transform the responses API
+   * stream into a format similar to the chat API. Due to differences in the APIs,
+   * this may not be a perfect mapping.
+   */
+  get fullChatStream(): AsyncIterableIterator<any> {
+    return (async function* (this: ResponseWrapper) {
+      await this.initStream();
+      if (!this.reusableStream) {
+        throw new Error("Stream not initialized");
+      }
+
+      const consumer = this.reusableStream.createConsumer();
+
+      for await (const event of consumer) {
+        if (!("type" in event)) continue;
+
+        // Transform responses events to chat-like format
+        // This is a simplified transformation - you may need to adjust based on your needs
+        if (event.type === "response.output_text.delta") {
+          const deltaEvent = event as models.OpenResponsesStreamEventResponseOutputTextDelta;
+          yield {
+            type: "content.delta",
+            delta: deltaEvent.delta,
+          };
+        } else if (event.type === "response.completed") {
+          const completedEvent = event as models.OpenResponsesStreamEventResponseCompleted;
+          yield {
+            type: "message.complete",
+            response: completedEvent.response,
+          };
+        } else {
+          // Pass through other events
+          yield {
+            type: event.type,
+            event,
+          };
+        }
+      }
+    }.call(this));
+  }
+
+  /**
+   * Cancel the underlying stream and all consumers
+   */
+  async cancel(): Promise<void> {
+    if (this.reusableStream) {
+      await this.reusableStream.cancel();
+    }
+  }
+}
diff --git a/src/lib/reusable-stream.ts b/src/lib/reusable-stream.ts
new file mode 100644
index 00000000..7a8e78db
--- /dev/null
+++ b/src/lib/reusable-stream.ts
@@ -0,0 +1,196 @@
+/**
+ * A reusable readable stream that allows multiple consumers to read from the same source stream
+ * concurrently while it's actively streaming, without forcing consumers to wait for full buffering.
+ *
+ * Key features:
+ * - Multiple concurrent consumers with independent read positions
+ * - New consumers can attach while streaming is active
+ * - Efficient memory management with automatic cleanup
+ * - Each consumer can read at their own pace
+ */
+export class ReusableReadableStream<T> {
+  private buffer: T[] = [];
+  private consumers = new Map<number, ConsumerState>();
+  private nextConsumerId = 0;
+  private sourceReader: ReadableStreamDefaultReader<T> | null = null;
+  private sourceComplete = false;
+  private sourceError: Error | null = null;
+  private pumpStarted = false;
+
+  constructor(private sourceStream: ReadableStream<T>) {}
+
+  /**
+   * Create a new consumer that can independently iterate over the stream.
+   * Multiple consumers can be created and will all receive the same data.
+   */
+  createConsumer(): AsyncIterableIterator<T> {
+    const consumerId = this.nextConsumerId++;
+    const state: ConsumerState = {
+      position: 0,
+      waitingPromise: null,
+      cancelled: false,
+    };
+    this.consumers.set(consumerId, state);
+
+    // Start pumping the source stream if not already started
+    if (!this.pumpStarted) {
+      this.startPump();
+    }
+
+    const self = this;
+
+    return {
+      async next(): Promise<IteratorResult<T>> {
+        const consumer = self.consumers.get(consumerId);
+        if (!consumer) {
+          return { done: true, value: undefined };
+        }
+
+        if (consumer.cancelled) {
+          return { done: true, value: undefined };
+        }
+
+        // If we have buffered data at this position, return it
+        if (consumer.position < self.buffer.length) {
+          const value = self.buffer[consumer.position]!;
+          consumer.position++;
+          // Note: We don't clean up buffer to allow sequential/reusable access
+          return { done: false, value };
+        }
+
+        // If source is complete and we've read everything, we're done
+        if (self.sourceComplete) {
+          self.consumers.delete(consumerId);
+          return { done: true, value: undefined };
+        }
+
+        // If source had an error, propagate it
+        if (self.sourceError) {
+          self.consumers.delete(consumerId);
+          throw self.sourceError;
+        }
+
+        // Wait for more data - but check conditions after setting up the promise
+        // to avoid race condition where source completes between check and wait
+        const waitPromise = new Promise<void>((resolve, reject) => {
+          consumer.waitingPromise = { resolve, reject };
+        });
+
+        // Double-check conditions after setting up promise to handle race
+        if (self.sourceComplete || self.sourceError || consumer.position < self.buffer.length) {
+          // Resolve immediately if conditions changed
+          if (consumer.waitingPromise) {
+            consumer.waitingPromise.resolve();
+            consumer.waitingPromise = null;
+          }
+        }
+
+        await waitPromise;
+
+        // Recursively try again after waking up
+        return this.next();
+      },
+
+      async return(): Promise<IteratorResult<T>> {
+        const consumer = self.consumers.get(consumerId);
+        if (consumer) {
+          consumer.cancelled = true;
+          self.consumers.delete(consumerId);
+        }
+        return { done: true, value: undefined };
+      },
+
+      async throw(e?: any): Promise<IteratorResult<T>> {
+        const consumer = self.consumers.get(consumerId);
+        if (consumer) {
+          consumer.cancelled = true;
+          self.consumers.delete(consumerId);
+        }
+        throw e;
+      },
+
+      [Symbol.asyncIterator]() {
+        return this;
+      },
+    };
+  }
+
+  /**
+   * Start pumping data from the source stream into the buffer
+   */
+  private startPump(): void {
+    if (this.pumpStarted) return;
+    this.pumpStarted = true;
+    this.sourceReader = this.sourceStream.getReader();
+
+    void (async () => {
+      try {
+        while (true) {
+          const result = await this.sourceReader!.read();
+
+          if (result.done) {
+            this.sourceComplete = true;
+            this.notifyAllConsumers();
+            break;
+          }
+
+          // Add to buffer
+          this.buffer.push(result.value);
+
+          // Notify waiting consumers
+          this.notifyAllConsumers();
+        }
+      } catch (error) {
+        this.sourceError = error instanceof Error ? error : new Error(String(error));
+        this.notifyAllConsumers();
+      } finally {
+        if (this.sourceReader) {
+          this.sourceReader.releaseLock();
+        }
+      }
+    })();
+  }
+
+  /**
+   * Notify all waiting consumers that new data is available
+   */
+  private notifyAllConsumers(): void {
+    for (const consumer of this.consumers.values()) {
+      if (consumer.waitingPromise) {
+        if (this.sourceError) {
+          consumer.waitingPromise.reject(this.sourceError);
+        } else {
+          consumer.waitingPromise.resolve();
+        }
+        consumer.waitingPromise = null;
+      }
+    }
+  }
+
+
+  /**
+   * Cancel the source stream and all consumers
+   */
+  async cancel(): Promise<void> {
+    // Cancel all consumers
+    for (const consumer of this.consumers.values()) {
+      consumer.cancelled = true;
+      if (consumer.waitingPromise) {
+        consumer.waitingPromise.resolve();
+      }
+    }
+    this.consumers.clear();
+
+    // Cancel the source stream
+    if (this.sourceReader) {
+      await this.sourceReader.cancel();
+      this.sourceReader.releaseLock();
+    }
+  }
+}
+
+interface ConsumerState {
+  position: number;
+  waitingPromise: { resolve: () => void; reject: (error: Error) => void } | null;
+  cancelled: boolean;
+}
diff --git a/src/lib/stream-transformers.ts b/src/lib/stream-transformers.ts
new file mode 100644
index 00000000..639d4a78
--- /dev/null
+++ b/src/lib/stream-transformers.ts
@@ -0,0 +1,201 @@
+import * as models from "../models/index.js";
+import { ReusableReadableStream } from "./reusable-stream.js";
+
+/**
+ * Extract text deltas from responses stream events
+ */
+export async function* extractTextDeltas(
+  stream: ReusableReadableStream<models.OpenResponsesStreamEvent>,
+): AsyncIterableIterator<string> {
+  const consumer = stream.createConsumer();
+
+  for await (const event of consumer) {
+    if ("type" in event && event.type === "response.output_text.delta") {
+      const deltaEvent = event as models.OpenResponsesStreamEventResponseOutputTextDelta;
+      if (deltaEvent.delta) {
+        yield deltaEvent.delta;
+      }
+    }
+  }
+}
+
+/**
+ * Extract reasoning deltas from responses stream events
+ */
+export async function* extractReasoningDeltas(
+  stream: ReusableReadableStream<models.OpenResponsesStreamEvent>,
+): AsyncIterableIterator<string> {
+  const consumer = stream.createConsumer();
+
+  for await (const event of consumer) {
+    if ("type" in event && event.type === "response.reasoning_text.delta") {
+      const deltaEvent = event as models.OpenResponsesReasoningDeltaEvent;
+      if (deltaEvent.delta) {
+        yield deltaEvent.delta;
+      }
+    }
+  }
+}
+
+/**
+ * Extract tool call argument deltas from responses stream events
+ */
+export async function* extractToolDeltas(
+  stream: ReusableReadableStream<models.OpenResponsesStreamEvent>,
+): AsyncIterableIterator<string> {
+  const consumer = stream.createConsumer();
+
+  for await (const event of consumer) {
+    if ("type" in event && event.type === "response.function_call_arguments.delta") {
+      const deltaEvent = event as models.OpenResponsesStreamEventResponseFunctionCallArgumentsDelta;
+      if (deltaEvent.delta) {
+        yield deltaEvent.delta;
+      }
+    }
+  }
+}
+
+/**
+ * Build incremental message updates from responses stream events
+ * Returns AssistantMessage (chat format) instead of ResponsesOutputMessage
+ */
+export async function* buildMessageStream(
+  stream: ReusableReadableStream<models.OpenResponsesStreamEvent>,
+): AsyncIterableIterator<models.AssistantMessage> {
+  const consumer = stream.createConsumer();
+
+  // Track the accumulated text
+  let currentText = "";
+  let hasStarted = false;
+
+  for await (const event of consumer) {
+    if (!("type" in event)) continue;
+
+    switch (event.type) {
+      case "response.output_item.added": {
+        const itemEvent = event as models.OpenResponsesStreamEventResponseOutputItemAdded;
+        if (itemEvent.item && "type" in itemEvent.item && itemEvent.item.type === "message") {
+          hasStarted = true;
+          currentText = "";
+        }
+        break;
+      }
+
+      case "response.output_text.delta": {
+        const deltaEvent = event as models.OpenResponsesStreamEventResponseOutputTextDelta;
+        if (hasStarted && deltaEvent.delta) {
+          currentText += deltaEvent.delta;
+
+          // Yield updated message
+          yield {
+            role: "assistant" as const,
+            content: currentText,
+          };
+        }
+        break;
+      }
+
+      case "response.output_item.done": {
+        const itemDoneEvent = event as models.OpenResponsesStreamEventResponseOutputItemDone;
+        if (itemDoneEvent.item && "type" in itemDoneEvent.item && itemDoneEvent.item.type === "message") {
+          // Yield final complete message
+          const outputMessage = itemDoneEvent.item as models.ResponsesOutputMessage;
+          yield convertToAssistantMessage(outputMessage);
+        }
+        break;
+      }
+    }
+  }
+}
+
+/**
+ * Consume stream until completion and return the complete response
+ */
+export async function consumeStreamForCompletion(
+  stream: ReusableReadableStream<models.OpenResponsesStreamEvent>,
+): Promise<models.OpenResponsesNonStreamingResponse> {
+  const consumer = stream.createConsumer();
+
+  for await (const event of consumer) {
+    if (!("type" in event)) continue;
+
+    if (event.type === "response.completed") {
+      const completedEvent = event as models.OpenResponsesStreamEventResponseCompleted;
+      return completedEvent.response;
+    }
+
+    if (event.type === "response.failed") {
+      const failedEvent = event as models.OpenResponsesStreamEventResponseFailed;
+      // The failed event contains the full response with error information
+      throw new Error(`Response failed: ${JSON.stringify(failedEvent.response.error)}`);
+    }
+
+    if (event.type === "response.incomplete") {
+      const incompleteEvent = event as models.OpenResponsesStreamEventResponseIncomplete;
+      // Return the incomplete response
+      return incompleteEvent.response;
+    }
+  }
+
+  throw new Error("Stream ended without completion event");
+}
+
+/**
+ * Convert ResponsesOutputMessage to AssistantMessage (chat format)
+ */
+function convertToAssistantMessage(
+  outputMessage: models.ResponsesOutputMessage,
+): models.AssistantMessage {
+  // Extract text content
+  const textContent = outputMessage.content
+    .filter((part): part is models.ResponseOutputText =>
+      "type" in part && part.type === "output_text"
+    )
+    .map((part) => part.text)
+    .join("");
+
+  return {
+    role: "assistant" as const,
+    content: textContent || null,
+  };
+}
+
+/**
+ * Extract the first message from a completed response
+ */
+export function extractMessageFromResponse(
+  response: models.OpenResponsesNonStreamingResponse,
+): models.AssistantMessage {
+  const messageItem = response.output.find(
+    (item): item is models.ResponsesOutputMessage =>
+      "type" in item && item.type === "message"
+  );
+
+  if (!messageItem) {
+    throw new Error("No message found in response output");
+  }
+
+  return convertToAssistantMessage(messageItem);
+}
+
+/**
+ * Extract text from a response, either from outputText or by concatenating message content
+ */
+export function extractTextFromResponse(
+  response: models.OpenResponsesNonStreamingResponse,
+): string {
+  // Use pre-concatenated outputText if available
+  if (response.outputText) {
+    return response.outputText;
+  }
+
+  // Otherwise, extract from the first message (convert to AssistantMessage which has string content)
+  const message = extractMessageFromResponse(response);
+
+  // AssistantMessage.content is string | Array | null | undefined
+  if (typeof message.content === "string") {
+    return message.content;
+  }
+
+  return "";
+}
diff --git a/src/sdk/sdk.ts b/src/sdk/sdk.ts
index 8c70c802..63a604a8 100644
--- a/src/sdk/sdk.ts
+++ b/src/sdk/sdk.ts
@@ -3,6 +3,12 @@
  */
 
 import { ClientSDK } from "../lib/sdks.js";
+// #region imports
+import { RequestOptions } from "../lib/sdks.js";
+import { ResponseWrapper } from "../lib/response-wrapper.js";
+import { getResponse } from "../funcs/getResponse.js";
+import * as models from "../models/index.js";
+// #endregion
 import { Analytics } from "./analytics.js";
 import { APIKeys } from "./apikeys.js";
 import { Beta } from "./beta.js";
@@ -76,4 +82,46 @@ export class OpenRouter extends ClientSDK {
   get completions(): Completions {
     return (this._completions ??= new Completions(this._options));
   }
+  // #region sdk-class-body
+  /**
+   * Get a response with multiple consumption patterns
+   *
+   * @remarks
+   * Returns a wrapper that allows consuming the response in multiple ways:
+   * - `await response.message` - Get the completed message
+   * - `await response.text` - Get just the text content
+   * - `for await (const delta of response.textStream)` - Stream text deltas
+   * - `for await (const msg of response.messageStream)` - Stream incremental message updates
+   * - `for await (const event of response.fullResponsesStream)` - Stream all response events
+   * - `for await (const chunk of response.fullChatStream)` - Stream in chat-compatible format
+   *
+   * All consumption patterns can be used concurrently on the same response.
+   *
+   * @example
+   * ```typescript
+   * // Simple text extraction
+   * const response = openRouter.getResponse({
+   *   model: "anthropic/claude-3-opus",
+   *   input: [{ role: "user", content: "Hello!" }]
+   * });
+   * const text = await response.text;
+   * console.log(text);
+   *
+   * // Streaming text
+   * const response = openRouter.getResponse({
+   *   model: "anthropic/claude-3-opus",
+   *   input: [{ role: "user", content: "Hello!" }]
+   * });
+   * for await (const delta of response.textStream) {
+   *   process.stdout.write(delta);
+   * }
+   * ```
+   */
+  getResponse(
+    request: Omit<models.OpenResponsesRequest, "stream">,
+    options?: RequestOptions,
+  ): ResponseWrapper {
+    return getResponse(this, request, options);
+  }
+  // #endregion
 }
diff --git a/tests/e2e/getResponse.test.ts b/tests/e2e/getResponse.test.ts
new file mode 100644
index 00000000..e031b577
--- /dev/null
+++ b/tests/e2e/getResponse.test.ts
@@ -0,0 +1,586 @@
+import { beforeAll, describe, expect, it } from "vitest";
+import { OpenRouter } from "../../src/sdk/sdk.js";
+import { Message } from "../../src/models/message.js";
+
+describe("getResponse E2E Tests", () => {
+  let client: OpenRouter;
+
+  beforeAll(() => {
+    const apiKey = process.env.OPENROUTER_API_KEY;
+    if (!apiKey) {
+      throw new Error(
+        "OPENROUTER_API_KEY environment variable is required for e2e tests"
+      );
+    }
+
+    client = new OpenRouter({
+      apiKey,
+    });
+  });
+
+  describe("response.text - Text extraction", () => {
+    it("should successfully get text from a response", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Say 'Hello, World!' and nothing else.",
+          },
+        ],
+      });
+
+      const text = await response.text;
+
+      expect(text).toBeDefined();
+      expect(typeof text).toBe("string");
+      expect(text.length).toBeGreaterThan(0);
+      expect(text.toLowerCase()).toContain("hello");
+    });
+
+    it("should handle multi-turn conversations", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "My name is Bob.",
+          },
+          {
+            role: "assistant",
+            content: "Hello Bob! How can I help you today?",
+          },
+          {
+            role: "user",
+            content: "What is my name?",
+          },
+        ],
+      });
+
+      const text = await response.text;
+
+      expect(text).toBeDefined();
+      expect(text.toLowerCase()).toContain("bob");
+    });
+  });
+
+  describe("response.message - Complete message extraction", () => {
+    it("should successfully get a complete message from response", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Say 'test message' and nothing else.",
+          },
+        ],
+      });
+
+      const message = await response.message;
+
+      expect(message).toBeDefined();
+      expect(message.role).toBe("assistant");
+      expect(Array.isArray(message.content) || typeof message.content === "string" || message.content === null).toBe(true);
+
+      if (Array.isArray(message.content)) {
+        expect(message.content.length).toBeGreaterThan(0);
+        const firstContent = message.content[0];
+        expect(firstContent).toBeDefined();
+        expect("type" in firstContent).toBe(true);
+      } else if (typeof message.content === "string") {
+        expect(message.content.length).toBeGreaterThan(0);
+      } else if (message.content === null) {
+        expect(message.content).toBeNull();
+      }
+    });
+
+    it("should have proper message structure", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Respond with a simple greeting.",
+          },
+        ],
+      });
+
+      const message = await response.message;
+
+      expect(message).toBeDefined();
+      expect(message.role).toBe("assistant");
+      expect(message.content).toBeDefined();
+    });
+  });
+
+  describe("response.textStream - Streaming text deltas", () => {
+    it("should successfully stream text deltas", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Count from 1 to 5.",
+          },
+        ],
+      });
+
+      const deltas: string[] = [];
+
+      for await (const delta of response.textStream) {
+        expect(typeof delta).toBe("string");
+        deltas.push(delta);
+      }
+
+      expect(deltas.length).toBeGreaterThan(0);
+
+      // Verify we can reconstruct the full text
+      const fullText = deltas.join("");
+      expect(fullText.length).toBeGreaterThan(0);
+    });
+
+    it("should stream progressively without waiting for completion", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Write a short poem.",
+          },
+        ],
+      });
+
+      let firstDeltaTime: number | null = null;
+      let lastDeltaTime: number | null = null;
+      let deltaCount = 0;
+
+      for await (const delta of response.textStream) {
+        if (!firstDeltaTime) {
+          firstDeltaTime = Date.now();
+        }
+        lastDeltaTime = Date.now();
+        deltaCount++;
+      }
+
+      expect(deltaCount).toBeGreaterThan(1);
+      expect(firstDeltaTime).toBeDefined();
+      expect(lastDeltaTime).toBeDefined();
+
+      // Verify there was a time difference (streaming, not instant)
+      if (firstDeltaTime && lastDeltaTime) {
+        expect(lastDeltaTime).toBeGreaterThanOrEqual(firstDeltaTime);
+      }
+    }, 15000);
+  });
+
+  describe("response.newMessagesStream - Streaming message updates", () => {
+    it("should successfully stream incremental message updates", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Say 'streaming test'.",
+          },
+        ],
+      });
+
+      const messages: Message[] = [];
+
+      for await (const message of response.newMessagesStream) {
+        expect(message).toBeDefined();
+        expect(message.role).toBe("assistant");
+        expect(typeof message.content).toBe("string");
+        messages.push(message);
+      }
+
+      expect(messages.length).toBeGreaterThan(0);
+
+      // Verify content grows over time
+      if (messages.length > 1) {
+        const firstMessage = messages[0];
+        const lastMessage = messages[messages.length - 1];
+
+        const firstText = (firstMessage.content as string) || "";
+        const lastText = (lastMessage.content as string) || "";
+
+        expect(lastText.length).toBeGreaterThanOrEqual(firstText.length);
+      }
+    }, 15000);
+  });
+
+  describe("response.reasoningStream - Streaming reasoning deltas", () => {
+    it("should successfully stream reasoning deltas for reasoning models", async () => {
+      const response = client.getResponse({
+        model: "minimax/minimax-m2",
+        input: [
+          {
+            role: "user",
+            content: "What is 2+2?",
+          },
+        ],
+        reasoning: {
+          enabled: true,
+          effort: "low",
+        },
+      });
+
+      const reasoningDeltas: string[] = [];
+
+      for await (const delta of response.reasoningStream) {
+        expect(typeof delta).toBe("string");
+        reasoningDeltas.push(delta);
+      }
+
+      // Reasoning models may or may not output reasoning for simple questions
+      // Just verify the stream works without error
+      expect(Array.isArray(reasoningDeltas)).toBe(true);
+      expect(reasoningDeltas.length).toBeGreaterThan(0);
+    }, 30000);
+  });
+
+  describe("response.toolStream - Streaming tool call deltas", () => {
+    it("should successfully stream tool call deltas when tools are called", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.1-8b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "What's the weather like in Paris? Use the get_weather tool to find out.",
+          },
+        ],
+        tools: [
+          {
+            type: "function" as const,
+            name: "get_weather",
+            description: "Get the current weather for a location",
+            parameters: {
+              type: "object",
+              properties: {
+                location: {
+                  type: "string",
+                  description: "The city name, e.g. Paris",
+                },
+              },
+              required: ["location"],
+            },
+          },
+        ],
+      });
+
+      const toolDeltas: string[] = [];
+
+      for await (const delta of response.toolStream) {
+        expect(typeof delta).toBe("string");
+        toolDeltas.push(delta);
+      }
+
+      // Verify the stream works and received tool call deltas
+      expect(Array.isArray(toolDeltas)).toBe(true);
+
+      // If the model made a tool call, we should have deltas
+      if (toolDeltas.length > 0) {
+        const fullToolCall = toolDeltas.join("");
+        expect(fullToolCall.length).toBeGreaterThan(0);
+      }
+    }, 30000);
+  });
+
+  describe("response.fullResponsesStream - Streaming all events", () => {
+    it("should successfully stream all response events", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Say 'hello'.",
+          },
+        ],
+      });
+
+      const events: any[] = [];
+
+      for await (const event of response.fullResponsesStream) {
+        expect(event).toBeDefined();
+        expect("type" in event).toBe(true);
+        events.push(event);
+      }
+
+      expect(events.length).toBeGreaterThan(0);
+
+      // Verify we have different event types
+      const eventTypes = new Set(events.map((e) => e.type));
+      expect(eventTypes.size).toBeGreaterThan(1);
+
+      // Should have completion event
+      const hasCompletionEvent = events.some(
+        (e) => e.type === "response.completed" || e.type === "response.incomplete"
+      );
+      expect(hasCompletionEvent).toBe(true);
+    }, 15000);
+
+    it("should include text delta events", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Count to 3.",
+          },
+        ],
+      });
+
+      const textDeltaEvents: any[] = [];
+
+      for await (const event of response.fullResponsesStream) {
+        if ("type" in event && event.type === "response.output_text.delta") {
+          textDeltaEvents.push(event);
+        }
+      }
+
+      expect(textDeltaEvents.length).toBeGreaterThan(0);
+
+      // Verify delta events have the expected structure
+      const firstDelta = textDeltaEvents[0];
+      expect(firstDelta.delta).toBeDefined();
+      expect(typeof firstDelta.delta).toBe("string");
+    }, 15000);
+  });
+
+  describe("response.fullChatStream - Chat-compatible streaming", () => {
+    it("should successfully stream in chat-compatible format", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Say 'test'.",
+          },
+        ],
+      });
+
+      const chunks: any[] = [];
+
+      for await (const chunk of response.fullChatStream) {
+        expect(chunk).toBeDefined();
+        expect(chunk.type).toBeDefined();
+        chunks.push(chunk);
+      }
+
+      expect(chunks.length).toBeGreaterThan(0);
+
+      // Should have content deltas
+      const hasContentDeltas = chunks.some((c) => c.type === "content.delta");
+      expect(hasContentDeltas).toBe(true);
+    }, 15000);
+  });
+
+  describe("Multiple concurrent consumption patterns", () => {
+    it("should allow reading text and streaming simultaneously", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Say 'concurrent test'.",
+          },
+        ],
+      });
+
+      // Get full text and stream concurrently
+      const textPromise = response.text;
+      const streamPromise = (async () => {
+        const deltas: string[] = [];
+        for await (const delta of response.textStream) {
+          deltas.push(delta);
+        }
+        return deltas;
+      })();
+
+      // Wait for both
+      const [text, deltas] = await Promise.all([textPromise, streamPromise]);
+
+      expect(deltas.length).toBeGreaterThan(0);
+      expect(text.length).toBeGreaterThan(0);
+
+      // Verify deltas reconstruct the full text
+      const reconstructed = deltas.join("");
+      expect(reconstructed).toBe(text);
+    }, 30000);
+
+    it("should allow multiple stream consumers", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Write a short sentence.",
+          },
+        ],
+      });
+
+      // Start two concurrent stream consumers
+      const textStreamPromise = (async () => {
+        const deltas: string[] = [];
+        for await (const delta of response.textStream) {
+          deltas.push(delta);
+        }
+        return deltas;
+      })();
+
+      const newMessagesStreamPromise = (async () => {
+        const messages: any[] = [];
+        for await (const message of response.newMessagesStream) {
+          messages.push(message);
+        }
+        return messages;
+      })();
+
+      const [textDeltas, messages] = await Promise.all([
+        textStreamPromise,
+        newMessagesStreamPromise,
+      ]);
+
+      expect(textDeltas.length).toBeGreaterThan(0);
+      expect(messages.length).toBeGreaterThan(0);
+
+      // Verify consistency between streams
+      const textFromDeltas = textDeltas.join("");
+      const lastMessage = messages[messages.length - 1];
+      const textFromMessage = (lastMessage.content as string) || "";
+
+      expect(textFromDeltas).toBe(textFromMessage);
+    }, 20000);
+
+    it("should allow sequential consumption - text then stream", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Say 'sequential test'.",
+          },
+        ],
+      });
+
+      // First, get the full text
+      const text = await response.text;
+      expect(text).toBeDefined();
+      expect(text.length).toBeGreaterThan(0);
+
+      // Then, try to stream (should get same data from buffer)
+      const deltas: string[] = [];
+      for await (const delta of response.textStream) {
+        expect(typeof delta).toBe("string");
+        deltas.push(delta);
+      }
+
+      expect(deltas.length).toBeGreaterThan(0);
+
+      // Verify both give same result
+      const reconstructed = deltas.join("");
+      expect(reconstructed).toBe(text);
+    }, 20000);
+
+    it("should allow sequential consumption - stream then text", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Say 'reverse test'.",
+          },
+        ],
+      });
+
+      // First, collect deltas from stream
+      const deltas: string[] = [];
+      for await (const delta of response.textStream) {
+        expect(typeof delta).toBe("string");
+        deltas.push(delta);
+      }
+      expect(deltas.length).toBeGreaterThan(0);
+
+      // Then, get the full text (should work even after stream consumed)
+      const text = await response.text;
+      expect(text).toBeDefined();
+      expect(text.length).toBeGreaterThan(0);
+
+      // Verify both give same result
+      const reconstructed = deltas.join("");
+      expect(reconstructed).toBe(text);
+    }, 20000);
+  });
+
+  describe("Error handling", () => {
+    it("should handle invalid model gracefully", async () => {
+      const response = client.getResponse({
+        model: "invalid/model-that-does-not-exist",
+        input: [
+          {
+            role: "user",
+            content: "Test",
+          },
+        ],
+      });
+
+      await expect(response.text).rejects.toThrow();
+    });
+
+    it("should handle empty input", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [],
+      });
+
+      // This might fail or return empty - both are acceptable
+      try {
+        const text = await response.text;
+        expect(text).toBeDefined();
+      } catch (error) {
+        expect(error).toBeDefined();
+      }
+    });
+  });
+
+  describe("Response parameters", () => {
+    it("should respect maxOutputTokens parameter", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Write a long story about a cat.",
+          },
+        ],
+        maxOutputTokens: 10,
+      });
+
+      const text = await response.text;
+
+      expect(text).toBeDefined();
+      // Text should be relatively short due to token limit
+      expect(text.split(" ").length).toBeLessThan(50);
+    });
+
+    it("should work with instructions parameter", async () => {
+      const response = client.getResponse({
+        model: "meta-llama/llama-3.2-1b-instruct",
+        input: [
+          {
+            role: "user",
+            content: "Say exactly: 'test complete'",
+          },
+        ],
+        instructions: "You are a helpful assistant. Keep responses concise.",
+      });
+
+      const text = await response.text;
+
+      expect(text).toBeDefined();
+      expect(typeof text).toBe("string");
+      expect(text.length).toBeGreaterThan(0);
+      // Just verify instructions parameter is accepted, not that model follows it perfectly
+    });
+  });
+});
diff --git a/tests/e2e/responses.test.ts b/tests/e2e/responses.test.ts
index eccf2da4..c7065a15 100644
--- a/tests/e2e/responses.test.ts
+++ b/tests/e2e/responses.test.ts
@@ -1,5 +1,6 @@
 import { beforeAll, describe, expect, it } from "vitest";
 import { OpenRouter } from "../../src/sdk/sdk.js";
+import { ResponsesOutputMessage } from "../../esm/models/responsesoutputmessage.js";
 
 describe("Beta Responses E2E Tests", () => {
   let client: OpenRouter;
@@ -45,7 +46,7 @@ describe("Beta Responses E2E Tests", () => {
       const firstOutput = response.output[0];
       expect(firstOutput).toBeDefined();
       expect(firstOutput?.type).toBe("message");
-      expect(firstOutput?.role).toBe("assistant");
+      expect((firstOutput as ResponsesOutputMessage).role).toBe("assistant");
 
       // Verify usage information
       expect(response.usage).toBeDefined();

From ec77c073434658c8c7d9fbba6f353095dd062b70 Mon Sep 17 00:00:00 2001
From: Matt Apperson <me@mattapperson.com>
Date: Fri, 31 Oct 2025 11:08:15 -0400
Subject: [PATCH 2/4] refactor: Convert response API from hanging promises to
 getter methods
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Convert all getter properties that return promises/iterators into
explicit methods with get*() naming for better API clarity and
consistency.

Changes:
- response.text → response.getText()
- response.message → response.getMessage()
- response.textStream → response.getTextStream()
- response.newMessagesStream → response.getNewMessagesStream()
- response.fullResponsesStream → response.getFullResponsesStream()
- response.reasoningStream → response.getReasoningStream()
- response.toolStream → response.getToolStream()
- response.fullChatStream → response.getFullChatStream()

Updated all test files, examples, and JSDoc documentation to reflect
the new API. All 20 e2e tests pass successfully.
---
 src/funcs/getResponse.ts      | 22 ++++++++--------
 src/lib/response-wrapper.ts   | 26 +++++++++----------
 src/sdk/sdk.ts                | 16 ++++++------
 tests/e2e/getResponse.test.ts | 48 +++++++++++++++++------------------
 4 files changed, 56 insertions(+), 56 deletions(-)

diff --git a/src/funcs/getResponse.ts b/src/funcs/getResponse.ts
index d03d6a2a..4bd371d4 100644
--- a/src/funcs/getResponse.ts
+++ b/src/funcs/getResponse.ts
@@ -10,14 +10,14 @@ import * as models from "../models/index.js";
  * Creates a response using the OpenResponses API in streaming mode and returns
  * a wrapper that allows consuming the response in multiple ways:
  *
- * - `await response.message` - Get the completed message
- * - `await response.text` - Get just the text content
- * - `for await (const delta of response.textStream)` - Stream text deltas
- * - `for await (const delta of response.reasoningStream)` - Stream reasoning deltas
- * - `for await (const delta of response.toolStream)` - Stream tool call argument deltas
- * - `for await (const msg of response.newMessagesStream)` - Stream incremental message updates
- * - `for await (const event of response.fullResponsesStream)` - Stream all response events
- * - `for await (const chunk of response.fullChatStream)` - Stream in chat-compatible format
+ * - `await response.getMessage()` - Get the completed message
+ * - `await response.getText()` - Get just the text content
+ * - `for await (const delta of response.getTextStream())` - Stream text deltas
+ * - `for await (const delta of response.getReasoningStream())` - Stream reasoning deltas
+ * - `for await (const delta of response.getToolStream())` - Stream tool call argument deltas
+ * - `for await (const msg of response.getNewMessagesStream())` - Stream incremental message updates
+ * - `for await (const event of response.getFullResponsesStream())` - Stream all response events
+ * - `for await (const chunk of response.getFullChatStream())` - Stream in chat-compatible format
  *
  * All consumption patterns can be used concurrently on the same response.
  *
@@ -28,7 +28,7 @@ import * as models from "../models/index.js";
  *   model: "anthropic/claude-3-opus",
  *   input: [{ role: "user", content: "Hello!" }]
  * });
- * const text = await response.text;
+ * const text = await response.getText();
  * console.log(text);
  *
  * // Streaming text
@@ -36,7 +36,7 @@ import * as models from "../models/index.js";
  *   model: "anthropic/claude-3-opus",
  *   input: [{ role: "user", content: "Hello!" }]
  * });
- * for await (const delta of response.textStream) {
+ * for await (const delta of response.getTextStream()) {
  *   process.stdout.write(delta);
  * }
  *
@@ -45,7 +45,7 @@ import * as models from "../models/index.js";
  *   model: "anthropic/claude-3-opus",
  *   input: [{ role: "user", content: "Hello!" }]
  * });
- * const message = await response.message;
+ * const message = await response.getMessage();
  * console.log(message.content);
  * ```
  */
diff --git a/src/lib/response-wrapper.ts b/src/lib/response-wrapper.ts
index 2ccba944..70197b8c 100644
--- a/src/lib/response-wrapper.ts
+++ b/src/lib/response-wrapper.ts
@@ -24,11 +24,11 @@ export interface GetResponseOptions {
  * A wrapper around a streaming response that provides multiple consumption patterns.
  *
  * Allows consuming the response in multiple ways:
- * - `await response.message` - Get the completed message
- * - `await response.text` - Get just the text
- * - `for await (const delta of response.textStream)` - Stream text deltas
- * - `for await (const msg of response.messageStream)` - Stream incremental message updates
- * - `for await (const event of response.fullResponsesStream)` - Stream all response events
+ * - `await response.getMessage()` - Get the completed message
+ * - `await response.getText()` - Get just the text
+ * - `for await (const delta of response.getTextStream())` - Stream text deltas
+ * - `for await (const msg of response.getNewMessagesStream())` - Stream incremental message updates
+ * - `for await (const event of response.getFullResponsesStream())` - Stream all response events
  *
  * All consumption patterns can be used concurrently thanks to the underlying
  * ReusableReadableStream implementation.
@@ -83,7 +83,7 @@ export class ResponseWrapper {
    * This will consume the stream until completion and extract the first message.
    * Returns an AssistantMessage in chat format.
    */
-  get message(): Promise<models.AssistantMessage> {
+  getMessage(): Promise<models.AssistantMessage> {
     if (this.messagePromise) {
       return this.messagePromise;
     }
@@ -105,7 +105,7 @@ export class ResponseWrapper {
    * Get just the text content from the response.
    * This will consume the stream until completion and extract the text.
    */
-  get text(): Promise<string> {
+  getText(): Promise<string> {
     if (this.textPromise) {
       return this.textPromise;
     }
@@ -127,7 +127,7 @@ export class ResponseWrapper {
    * Stream all response events as they arrive.
    * Multiple consumers can iterate over this stream concurrently.
    */
-  get fullResponsesStream(): AsyncIterableIterator<models.OpenResponsesStreamEvent> {
+  getFullResponsesStream(): AsyncIterableIterator<models.OpenResponsesStreamEvent> {
     return (async function* (this: ResponseWrapper) {
       await this.initStream();
       if (!this.reusableStream) {
@@ -143,7 +143,7 @@ export class ResponseWrapper {
    * Stream only text deltas as they arrive.
    * This filters the full event stream to only yield text content.
    */
-  get textStream(): AsyncIterableIterator<string> {
+  getTextStream(): AsyncIterableIterator<string> {
     return (async function* (this: ResponseWrapper) {
       await this.initStream();
       if (!this.reusableStream) {
@@ -159,7 +159,7 @@ export class ResponseWrapper {
    * Each iteration yields an updated version of the message with new content.
    * Returns AssistantMessage in chat format.
    */
-  get newMessagesStream(): AsyncIterableIterator<models.AssistantMessage> {
+  getNewMessagesStream(): AsyncIterableIterator<models.AssistantMessage> {
     return (async function* (this: ResponseWrapper) {
       await this.initStream();
       if (!this.reusableStream) {
@@ -174,7 +174,7 @@ export class ResponseWrapper {
    * Stream only reasoning deltas as they arrive.
    * This filters the full event stream to only yield reasoning content.
    */
-  get reasoningStream(): AsyncIterableIterator<string> {
+  getReasoningStream(): AsyncIterableIterator<string> {
     return (async function* (this: ResponseWrapper) {
       await this.initStream();
       if (!this.reusableStream) {
@@ -189,7 +189,7 @@ export class ResponseWrapper {
    * Stream only tool call argument deltas as they arrive.
    * This filters the full event stream to only yield function call arguments.
    */
-  get toolStream(): AsyncIterableIterator<string> {
+  getToolStream(): AsyncIterableIterator<string> {
     return (async function* (this: ResponseWrapper) {
       await this.initStream();
       if (!this.reusableStream) {
@@ -209,7 +209,7 @@ export class ResponseWrapper {
    * stream into a format similar to the chat API. Due to differences in the APIs,
    * this may not be a perfect mapping.
    */
-  get fullChatStream(): AsyncIterableIterator<any> {
+  getFullChatStream(): AsyncIterableIterator<any> {
     return (async function* (this: ResponseWrapper) {
       await this.initStream();
       if (!this.reusableStream) {
diff --git a/src/sdk/sdk.ts b/src/sdk/sdk.ts
index 63a604a8..df850e0a 100644
--- a/src/sdk/sdk.ts
+++ b/src/sdk/sdk.ts
@@ -88,12 +88,12 @@ export class OpenRouter extends ClientSDK {
    *
    * @remarks
    * Returns a wrapper that allows consuming the response in multiple ways:
-   * - `await response.message` - Get the completed message
-   * - `await response.text` - Get just the text content
-   * - `for await (const delta of response.textStream)` - Stream text deltas
-   * - `for await (const msg of response.messageStream)` - Stream incremental message updates
-   * - `for await (const event of response.fullResponsesStream)` - Stream all response events
-   * - `for await (const chunk of response.fullChatStream)` - Stream in chat-compatible format
+   * - `await response.getMessage()` - Get the completed message
+   * - `await response.getText()` - Get just the text content
+   * - `for await (const delta of response.getTextStream())` - Stream text deltas
+   * - `for await (const msg of response.getNewMessagesStream())` - Stream incremental message updates
+   * - `for await (const event of response.getFullResponsesStream())` - Stream all response events
+   * - `for await (const chunk of response.getFullChatStream())` - Stream in chat-compatible format
    *
    * All consumption patterns can be used concurrently on the same response.
    *
@@ -104,7 +104,7 @@ export class OpenRouter extends ClientSDK {
    *   model: "anthropic/claude-3-opus",
    *   input: [{ role: "user", content: "Hello!" }]
    * });
-   * const text = await response.text;
+   * const text = await response.getText();
    * console.log(text);
    *
    * // Streaming text
@@ -112,7 +112,7 @@ export class OpenRouter extends ClientSDK {
    *   model: "anthropic/claude-3-opus",
    *   input: [{ role: "user", content: "Hello!" }]
    * });
-   * for await (const delta of response.textStream) {
+   * for await (const delta of response.getTextStream()) {
    *   process.stdout.write(delta);
    * }
    * ```
diff --git a/tests/e2e/getResponse.test.ts b/tests/e2e/getResponse.test.ts
index e031b577..93222938 100644
--- a/tests/e2e/getResponse.test.ts
+++ b/tests/e2e/getResponse.test.ts
@@ -30,7 +30,7 @@ describe("getResponse E2E Tests", () => {
         ],
       });
 
-      const text = await response.text;
+      const text = await response.getText();
 
       expect(text).toBeDefined();
       expect(typeof text).toBe("string");
@@ -57,7 +57,7 @@ describe("getResponse E2E Tests", () => {
         ],
       });
 
-      const text = await response.text;
+      const text = await response.getText();
 
       expect(text).toBeDefined();
       expect(text.toLowerCase()).toContain("bob");
@@ -76,7 +76,7 @@ describe("getResponse E2E Tests", () => {
         ],
       });
 
-      const message = await response.message;
+      const message = await response.getMessage();
 
       expect(message).toBeDefined();
       expect(message.role).toBe("assistant");
@@ -105,7 +105,7 @@ describe("getResponse E2E Tests", () => {
         ],
       });
 
-      const message = await response.message;
+      const message = await response.getMessage();
 
       expect(message).toBeDefined();
       expect(message.role).toBe("assistant");
@@ -127,7 +127,7 @@ describe("getResponse E2E Tests", () => {
 
       const deltas: string[] = [];
 
-      for await (const delta of response.textStream) {
+      for await (const delta of response.getTextStream()) {
         expect(typeof delta).toBe("string");
         deltas.push(delta);
       }
@@ -154,7 +154,7 @@ describe("getResponse E2E Tests", () => {
       let lastDeltaTime: number | null = null;
       let deltaCount = 0;
 
-      for await (const delta of response.textStream) {
+      for await (const delta of response.getTextStream()) {
         if (!firstDeltaTime) {
           firstDeltaTime = Date.now();
         }
@@ -187,7 +187,7 @@ describe("getResponse E2E Tests", () => {
 
       const messages: Message[] = [];
 
-      for await (const message of response.newMessagesStream) {
+      for await (const message of response.getNewMessagesStream()) {
         expect(message).toBeDefined();
         expect(message.role).toBe("assistant");
         expect(typeof message.content).toBe("string");
@@ -227,7 +227,7 @@ describe("getResponse E2E Tests", () => {
 
       const reasoningDeltas: string[] = [];
 
-      for await (const delta of response.reasoningStream) {
+      for await (const delta of response.getReasoningStream()) {
         expect(typeof delta).toBe("string");
         reasoningDeltas.push(delta);
       }
@@ -270,7 +270,7 @@ describe("getResponse E2E Tests", () => {
 
       const toolDeltas: string[] = [];
 
-      for await (const delta of response.toolStream) {
+      for await (const delta of response.getToolStream()) {
         expect(typeof delta).toBe("string");
         toolDeltas.push(delta);
       }
@@ -300,7 +300,7 @@ describe("getResponse E2E Tests", () => {
 
       const events: any[] = [];
 
-      for await (const event of response.fullResponsesStream) {
+      for await (const event of response.getFullResponsesStream()) {
         expect(event).toBeDefined();
         expect("type" in event).toBe(true);
         events.push(event);
@@ -332,7 +332,7 @@ describe("getResponse E2E Tests", () => {
 
       const textDeltaEvents: any[] = [];
 
-      for await (const event of response.fullResponsesStream) {
+      for await (const event of response.getFullResponsesStream()) {
         if ("type" in event && event.type === "response.output_text.delta") {
           textDeltaEvents.push(event);
         }
@@ -361,7 +361,7 @@ describe("getResponse E2E Tests", () => {
 
       const chunks: any[] = [];
 
-      for await (const chunk of response.fullChatStream) {
+      for await (const chunk of response.getFullChatStream()) {
         expect(chunk).toBeDefined();
         expect(chunk.type).toBeDefined();
         chunks.push(chunk);
@@ -388,10 +388,10 @@ describe("getResponse E2E Tests", () => {
       });
 
       // Get full text and stream concurrently
-      const textPromise = response.text;
+      const textPromise = response.getText();
       const streamPromise = (async () => {
         const deltas: string[] = [];
-        for await (const delta of response.textStream) {
+        for await (const delta of response.getTextStream()) {
           deltas.push(delta);
         }
         return deltas;
@@ -422,7 +422,7 @@ describe("getResponse E2E Tests", () => {
       // Start two concurrent stream consumers
       const textStreamPromise = (async () => {
         const deltas: string[] = [];
-        for await (const delta of response.textStream) {
+        for await (const delta of response.getTextStream()) {
           deltas.push(delta);
         }
         return deltas;
@@ -430,7 +430,7 @@ describe("getResponse E2E Tests", () => {
 
       const newMessagesStreamPromise = (async () => {
         const messages: any[] = [];
-        for await (const message of response.newMessagesStream) {
+        for await (const message of response.getNewMessagesStream()) {
           messages.push(message);
         }
         return messages;
@@ -464,13 +464,13 @@ describe("getResponse E2E Tests", () => {
       });
 
       // First, get the full text
-      const text = await response.text;
+      const text = await response.getText();
       expect(text).toBeDefined();
       expect(text.length).toBeGreaterThan(0);
 
       // Then, try to stream (should get same data from buffer)
       const deltas: string[] = [];
-      for await (const delta of response.textStream) {
+      for await (const delta of response.getTextStream()) {
         expect(typeof delta).toBe("string");
         deltas.push(delta);
       }
@@ -495,14 +495,14 @@ describe("getResponse E2E Tests", () => {
 
       // First, collect deltas from stream
       const deltas: string[] = [];
-      for await (const delta of response.textStream) {
+      for await (const delta of response.getTextStream()) {
         expect(typeof delta).toBe("string");
         deltas.push(delta);
       }
       expect(deltas.length).toBeGreaterThan(0);
 
       // Then, get the full text (should work even after stream consumed)
-      const text = await response.text;
+      const text = await response.getText();
       expect(text).toBeDefined();
       expect(text.length).toBeGreaterThan(0);
 
@@ -524,7 +524,7 @@ describe("getResponse E2E Tests", () => {
         ],
       });
 
-      await expect(response.text).rejects.toThrow();
+      await expect(response.getText()).rejects.toThrow();
     });
 
     it("should handle empty input", async () => {
@@ -535,7 +535,7 @@ describe("getResponse E2E Tests", () => {
 
       // This might fail or return empty - both are acceptable
       try {
-        const text = await response.text;
+        const text = await response.getText();
         expect(text).toBeDefined();
       } catch (error) {
         expect(error).toBeDefined();
@@ -556,7 +556,7 @@ describe("getResponse E2E Tests", () => {
         maxOutputTokens: 10,
       });
 
-      const text = await response.text;
+      const text = await response.getText();
 
       expect(text).toBeDefined();
       // Text should be relatively short due to token limit
@@ -575,7 +575,7 @@ describe("getResponse E2E Tests", () => {
         instructions: "You are a helpful assistant. Keep responses concise.",
       });
 
-      const text = await response.text;
+      const text = await response.getText();
 
       expect(text).toBeDefined();
       expect(typeof text).toBe("string");

From ceee37dcc095c756f80fc94c39cdedb78cb32844 Mon Sep 17 00:00:00 2001
From: Matt Apperson <mattapperson@mini.local>
Date: Wed, 5 Nov 2025 13:11:11 -0500
Subject: [PATCH 3/4] Add TurnContext parameter to tool execute functions
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Added TurnContext type with numberOfTurns (1-indexed), messageHistory, model/models
- Updated tool execute function signatures to accept optional context parameter
- Context is built in response-wrapper.ts during tool execution loop
- Updated all tests and examples to demonstrate context usage
- Context parameter is optional for backward compatibility
- Exported TurnContext type in public API

This allows tools to access conversation state including turn number,
message history, and model information during execution.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 examples/tools-example.ts           | 334 ++++++++++++++++++
 pnpm-lock.yaml                      |  28 +-
 src/funcs/getResponse.ts            | 105 ++++--
 src/index.ts                        |  13 +
 src/lib/response-wrapper.ts         | 328 +++++++++++++++--
 src/lib/stream-transformers.ts      | 165 +++++++++
 src/lib/tool-executor.ts            | 249 +++++++++++++
 src/lib/tool-orchestrator.ts        | 206 +++++++++++
 src/lib/tool-types.ts               | 233 ++++++++++++
 src/sdk/sdk.ts                      |   6 +-
 tests/e2e/getResponse-tools.test.ts | 529 ++++++++++++++++++++++++++++
 11 files changed, 2143 insertions(+), 53 deletions(-)
 create mode 100644 examples/tools-example.ts
 create mode 100644 src/lib/tool-executor.ts
 create mode 100644 src/lib/tool-orchestrator.ts
 create mode 100644 src/lib/tool-types.ts
 create mode 100644 tests/e2e/getResponse-tools.test.ts

diff --git a/examples/tools-example.ts b/examples/tools-example.ts
new file mode 100644
index 00000000..e5eb7a53
--- /dev/null
+++ b/examples/tools-example.ts
@@ -0,0 +1,334 @@
+/**
+ * OpenRouter SDK - Enhanced Tool Support Examples
+ *
+ * This file demonstrates the automatic tool execution feature.
+ * When you provide tools with `execute` functions, they are automatically:
+ * 1. Validated using Zod schemas
+ * 2. Executed when the model calls them
+ * 3. Results sent back to the model
+ * 4. Process repeats until no more tool calls (up to maxToolRounds)
+ *
+ * The API is simple: just call getResponse() with tools, and await the result.
+ * Tools are executed transparently before getMessage() or getText() returns!
+ */
+
+import { OpenRouter } from "../src/index.js";
+import { z } from "zod/v4";
+import * as dotenv from "dotenv";
+
+dotenv.config();
+
+const client = new OpenRouter({
+  apiKey: process.env.OPENROUTER_API_KEY || "",
+});
+
+/**
+ * Example 1: Basic Tool with Execute Function
+ * A simple weather tool that returns mock data
+ * Note: The context parameter is optional for backward compatibility
+ */
+async function basicToolExample() {
+  console.log("\n=== Example 1: Basic Tool with Execute Function ===\n");
+
+  const weatherTool = {
+    type: "function" as const,
+    function: {
+      name: "get_weather",
+      description: "Get current weather for a location",
+      inputSchema: z.object({
+        location: z.string().describe("City and country (e.g., San Francisco, CA)"),
+      }),
+      outputSchema: z.object({
+        temperature: z.number(),
+        description: z.string(),
+        humidity: z.number(),
+      }),
+      execute: async (params: { location: string }, context) => {
+        console.log(`Executing get_weather for: ${params.location}`);
+        console.log(`Turn ${context.numberOfTurns} - Model: ${context.model || context.models?.join(", ")}`);
+        // In real usage, you would call a weather API here
+        return {
+          temperature: 72,
+          description: "Sunny",
+          humidity: 45,
+        };
+      },
+    },
+  };
+
+  const response = client.getResponse({
+    model: "openai/gpt-4o",
+    input: "What's the weather like in San Francisco?",
+    tools: [weatherTool],
+  });
+
+  // Tools are automatically executed! Just get the final message
+  const message = await response.getMessage();
+  console.log("\nFinal message after automatic tool execution:", message.content);
+
+  // You can also check what tool calls were made initially
+  const toolCalls = await response.getToolCalls();
+  console.log("\nInitial tool calls:", JSON.stringify(toolCalls, null, 2));
+}
+
+/**
+ * Example 2: Generator Tool with Preliminary Results
+ * Shows how to use async generators for streaming intermediate results
+ */
+async function generatorToolExample() {
+  console.log("\n=== Example 2: Generator Tool with Preliminary Results ===\n");
+
+  const processingTool = {
+    type: "function" as const,
+    function: {
+      name: "process_data",
+      description: "Process data with progress updates",
+      inputSchema: z.object({
+        data: z.string().describe("Data to process"),
+      }),
+      eventSchema: z.object({
+        type: z.enum(["start", "progress", "complete"]),
+        message: z.string(),
+        progress: z.number().min(0).max(100).optional(),
+      }),
+      execute: async function* (params: { data: string }, context) {
+        console.log(`Generator tool - Turn ${context.numberOfTurns}`);
+        // Preliminary result 1
+        yield {
+          type: "start" as const,
+          message: `Started processing: ${params.data}`,
+          progress: 0,
+        };
+
+        await new Promise((resolve) => setTimeout(resolve, 500));
+
+        // Preliminary result 2
+        yield {
+          type: "progress" as const,
+          message: "Processing halfway done",
+          progress: 50,
+        };
+
+        await new Promise((resolve) => setTimeout(resolve, 500));
+
+        // Final result (last yield)
+        yield {
+          type: "complete" as const,
+          message: `Completed processing: ${params.data.toUpperCase()}`,
+          progress: 100,
+        };
+      },
+    },
+  };
+
+  const response = client.getResponse({
+    model: "openai/gpt-4o",
+    input: "Process this data: hello world",
+    tools: [processingTool],
+  });
+
+  // Stream preliminary results as they arrive
+  console.log("Streaming tool events including preliminary results:\n");
+  for await (const event of response.getToolStream()) {
+    if (event.type === "preliminary_result") {
+      console.log(`Preliminary result from ${event.toolCallId}:`, event.result);
+    } else if (event.type === "delta") {
+      process.stdout.write(event.content);
+    }
+  }
+
+  // Tools are automatically executed with preliminary results available
+  const message = await response.getMessage();
+  console.log("\n\nFinal message:", message.content);
+}
+
+/**
+ * Example 3: Manual Tool Execution
+ * Define a tool without execute function for manual handling
+ */
+async function manualToolExample() {
+  console.log("\n=== Example 3: Manual Tool Execution ===\n");
+
+  const calculatorTool = {
+    type: "function" as const,
+    function: {
+      name: "calculate",
+      description: "Perform mathematical calculations",
+      inputSchema: z.object({
+        expression: z.string().describe("Math expression to evaluate"),
+      }),
+      outputSchema: z.object({
+        result: z.number(),
+      }),
+      // No execute function - tool calls are returned but not executed
+    },
+  };
+
+  const response = client.getResponse({
+    model: "openai/gpt-4o",
+    input: "What is 25 * 4 + 10?",
+    tools: [calculatorTool],
+  });
+
+  // Since there's no execute function, tool calls are returned but not executed
+  const toolCalls = await response.getToolCalls();
+  console.log("Tool calls (not auto-executed):", toolCalls);
+
+  // You can manually handle tool execution here
+  for (const toolCall of toolCalls) {
+    if (toolCall.name === "calculate") {
+      const expression = (toolCall.arguments as { expression: string }).expression;
+      console.log(`Manually executing calculation: ${expression}`);
+
+      // In a real app, you would safely evaluate this
+      // For demo purposes only - don't use eval in production!
+      try {
+        const result = eval(expression);
+        console.log(`Result: ${result}`);
+      } catch (error) {
+        console.error("Calculation error:", error);
+      }
+    }
+  }
+
+  // Then you would need to make a new request with the tool results
+  // (This example just shows the manual detection, not the full loop)
+}
+
+/**
+ * Example 4: Streaming Tool Calls
+ * Show how to stream structured tool call objects as they arrive
+ * Note: This tool doesn't use context - demonstrating backward compatibility
+ */
+async function streamingToolCallsExample() {
+  console.log("\n=== Example 4: Streaming Tool Calls ===\n");
+
+  const searchTool = {
+    type: "function" as const,
+    function: {
+      name: "search",
+      description: "Search for information",
+      inputSchema: z.object({
+        query: z.string().describe("Search query"),
+      }),
+      outputSchema: z.object({
+        results: z.array(z.string()),
+      }),
+      execute: async (params: { query: string }) => {
+        // Context parameter is optional - this tool doesn't need it
+        return {
+          results: [
+            `Result 1 for "${params.query}"`,
+            `Result 2 for "${params.query}"`,
+          ],
+        };
+      },
+    },
+  };
+
+  const response = client.getResponse({
+    model: "openai/gpt-4o",
+    input: "Search for information about TypeScript",
+    tools: [searchTool],
+  });
+
+  console.log("Streaming tool calls as they arrive:\n");
+
+  // Stream structured tool call objects
+  for await (const toolCall of response.getToolCallsStream()) {
+    console.log("Tool call:", JSON.stringify(toolCall, null, 2));
+  }
+}
+
+/**
+ * Example 5: Multiple Tools
+ * Use multiple tools in a single request
+ * Note: Shows mixing tools with and without context parameter
+ */
+async function multipleToolsExample() {
+  console.log("\n=== Example 5: Multiple Tools ===\n");
+
+  const tools = [
+    {
+      type: "function" as const,
+      function: {
+        name: "get_time",
+        description: "Get current time",
+        inputSchema: z.object({
+          timezone: z.string().optional(),
+        }),
+        outputSchema: z.object({
+          time: z.string(),
+          timezone: z.string(),
+        }),
+        execute: async (params: { timezone?: string }, context) => {
+          return {
+            time: new Date().toISOString(),
+            timezone: params.timezone || "UTC",
+          };
+        },
+      },
+    },
+    {
+      type: "function" as const,
+      function: {
+        name: "get_weather",
+        description: "Get weather information",
+        inputSchema: z.object({
+          location: z.string(),
+        }),
+        outputSchema: z.object({
+          temperature: z.number(),
+          description: z.string(),
+        }),
+        execute: async (params: { location: string }) => {
+          // This tool doesn't need context
+          return {
+            temperature: 68,
+            description: "Partly cloudy",
+          };
+        },
+      },
+    },
+  ];
+
+  const response = client.getResponse({
+    model: "openai/gpt-4o",
+    input: "What time is it and what's the weather in New York?",
+    tools,
+  });
+
+  // Tools are automatically executed!
+  const message = await response.getMessage();
+  console.log("Final message:", message.content);
+
+  // You can check which tools were called
+  const toolCalls = await response.getToolCalls();
+  console.log("\nTools that were called:", toolCalls.map(tc => tc.name));
+}
+
+// Run examples
+async function main() {
+  try {
+    await basicToolExample();
+    await generatorToolExample();
+    await manualToolExample();
+    await streamingToolCallsExample();
+    await multipleToolsExample();
+  } catch (error) {
+    console.error("Error running examples:", error);
+  }
+}
+
+// Only run if this file is executed directly
+if (import.meta.url === `file://${process.argv[1]}`) {
+  main();
+}
+
+export {
+  basicToolExample,
+  generatorToolExample,
+  manualToolExample,
+  streamingToolCallsExample,
+  multipleToolsExample,
+};
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index cbe25e0a..70df4015 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -11,6 +11,9 @@ importers:
       react:
         specifier: ^18 || ^19
         version: 19.2.0
+      react-dom:
+        specifier: ^18 || ^19
+        version: 19.2.0(react@19.2.0)
       zod:
         specifier: ^3.25.0 || ^4.0.0
         version: 4.1.12
@@ -28,8 +31,8 @@ importers:
         specifier: ^18.3.12
         version: 18.3.26
       dotenv:
-        specifier: ^17.2.3
-        version: 17.2.3
+        specifier: ^16.4.7
+        version: 16.6.1
       eslint:
         specifier: ^9.19.0
         version: 9.38.0
@@ -590,8 +593,8 @@ packages:
   deep-is@0.1.4:
     resolution: {integrity: sha512-oIPzksmTg4/MriiaYGO+okXDT7ztn/w3Eptv/+gSIdMdKsJo0u4CfYNFJPy+4SKMuCqGw2wxnA+URMg3t8a/bQ==}
 
-  dotenv@17.2.3:
-    resolution: {integrity: sha512-JVUnt+DUIzu87TABbhPmNfVdBDt18BLOWjMUFJMSi/Qqg7NTYtabbvSNJGOJ7afbRuv9D/lngizHtP7QyLQ+9w==}
+  dotenv@16.6.1:
+    resolution: {integrity: sha512-uBq4egWHTcTt33a72vpSG0z3HnPuIl6NqYcTrKEg2azoEyl2hpW0zqlxysq2pK9HlDIHyHyakeYaYnSAwd8bow==}
     engines: {node: '>=12'}
 
   es-module-lexer@1.7.0:
@@ -877,6 +880,11 @@ packages:
   queue-microtask@1.2.3:
     resolution: {integrity: sha512-NuaNSa6flKT5JaSYQzJok04JzTL1CA6aGhv5rfLW3PgqA+M2ChpZQnAC8h8i4ZFkBS8X5RqkDBHA7r4hej3K9A==}
 
+  react-dom@19.2.0:
+    resolution: {integrity: sha512-UlbRu4cAiGaIewkPyiRGJk0imDN2T3JjieT6spoL2UeSf5od4n5LB/mQ4ejmxhCFT1tYe8IvaFulzynWovsEFQ==}
+    peerDependencies:
+      react: ^19.2.0
+
   react@19.2.0:
     resolution: {integrity: sha512-tmbWg6W31tQLeB5cdIBOicJDJRR2KzXsV7uSK9iNfLWQ5bIZfxuPEHp7M8wiHyHnn0DD1i7w3Zmin0FtkrwoCQ==}
     engines: {node: '>=0.10.0'}
@@ -897,6 +905,9 @@ packages:
   run-parallel@1.2.0:
     resolution: {integrity: sha512-5l4VyZR86LZ/lDxZTR6jqL8AFE2S0IFLMP26AbjsLVADxHdhB/c0GUsH+y39UfCi3dzz8OlQuPmnaJOMoDHQBA==}
 
+  scheduler@0.27.0:
+    resolution: {integrity: sha512-eNv+WrVbKu1f3vbYJT/xtiF5syA5HPIMtf9IgY/nKg0sWqzAUEvqY/xm7OcZc/qafLx/iO9FgOmeSAp4v5ti/Q==}
+
   semver@7.7.3:
     resolution: {integrity: sha512-SdsKMrI9TdgjdweUSR9MweHA4EJ8YxHn8DFaDisvhVlUOe4BF1tLD7GAj0lIqWVl+dPb/rExr0Btby5loQm20Q==}
     engines: {node: '>=10'}
@@ -1542,7 +1553,7 @@ snapshots:
 
   deep-is@0.1.4: {}
 
-  dotenv@17.2.3: {}
+  dotenv@16.6.1: {}
 
   es-module-lexer@1.7.0: {}
 
@@ -1832,6 +1843,11 @@ snapshots:
 
   queue-microtask@1.2.3: {}
 
+  react-dom@19.2.0(react@19.2.0):
+    dependencies:
+      react: 19.2.0
+      scheduler: 0.27.0
+
   react@19.2.0: {}
 
   resolve-from@4.0.0: {}
@@ -1870,6 +1886,8 @@ snapshots:
     dependencies:
       queue-microtask: 1.2.3
 
+  scheduler@0.27.0: {}
+
   semver@7.7.3: {}
 
   shebang-command@2.0.0:
diff --git a/src/funcs/getResponse.ts b/src/funcs/getResponse.ts
index 4bd371d4..cb3eed16 100644
--- a/src/funcs/getResponse.ts
+++ b/src/funcs/getResponse.ts
@@ -2,6 +2,8 @@ import { OpenRouterCore } from "../core.js";
 import { RequestOptions } from "../lib/sdks.js";
 import { ResponseWrapper } from "../lib/response-wrapper.js";
 import * as models from "../models/index.js";
+import { EnhancedTool, MaxToolRounds } from "../lib/tool-types.js";
+import { convertEnhancedToolsToAPIFormat } from "../lib/tool-executor.js";
 
 /**
  * Get a response with multiple consumption patterns
@@ -10,53 +12,104 @@ import * as models from "../models/index.js";
  * Creates a response using the OpenResponses API in streaming mode and returns
  * a wrapper that allows consuming the response in multiple ways:
  *
- * - `await response.getMessage()` - Get the completed message
- * - `await response.getText()` - Get just the text content
+ * - `await response.getMessage()` - Get the completed message (tools auto-executed)
+ * - `await response.getText()` - Get just the text content (tools auto-executed)
  * - `for await (const delta of response.getTextStream())` - Stream text deltas
  * - `for await (const delta of response.getReasoningStream())` - Stream reasoning deltas
- * - `for await (const delta of response.getToolStream())` - Stream tool call argument deltas
+ * - `for await (const event of response.getToolStream())` - Stream tool events (incl. preliminary results)
+ * - `for await (const toolCall of response.getToolCallsStream())` - Stream structured tool calls
+ * - `await response.getToolCalls()` - Get all tool calls from completed response
  * - `for await (const msg of response.getNewMessagesStream())` - Stream incremental message updates
- * - `for await (const event of response.getFullResponsesStream())` - Stream all response events
- * - `for await (const chunk of response.getFullChatStream())` - Stream in chat-compatible format
+ * - `for await (const event of response.getFullResponsesStream())` - Stream all events (incl. tool preliminary)
+ * - `for await (const event of response.getFullChatStream())` - Stream in chat format (incl. tool preliminary)
  *
  * All consumption patterns can be used concurrently on the same response.
  *
  * @example
  * ```typescript
+ * import { z } from 'zod';
+ *
  * // Simple text extraction
- * const response = await openrouter.beta.responses.get({
- *   model: "anthropic/claude-3-opus",
- *   input: [{ role: "user", content: "Hello!" }]
+ * const response = openrouter.getResponse({
+ *   model: "openai/gpt-4",
+ *   input: "Hello!"
  * });
  * const text = await response.getText();
  * console.log(text);
  *
- * // Streaming text
- * const response = openrouter.beta.responses.get({
- *   model: "anthropic/claude-3-opus",
- *   input: [{ role: "user", content: "Hello!" }]
+ * // With tools (automatic execution)
+ * const response = openrouter.getResponse({
+ *   model: "openai/gpt-4",
+ *   input: "What's the weather in SF?",
+ *   tools: [{
+ *     type: "function",
+ *     function: {
+ *       name: "get_weather",
+ *       description: "Get current weather",
+ *       inputSchema: z.object({
+ *         location: z.string()
+ *       }),
+ *       outputSchema: z.object({
+ *         temperature: z.number(),
+ *         description: z.string()
+ *       }),
+ *       execute: async (params) => {
+ *         return { temperature: 72, description: "Sunny" };
+ *       }
+ *     }
+ *   }],
+ *   maxToolRounds: 5, // or function: (round, calls, responses) => boolean
  * });
- * for await (const delta of response.getTextStream()) {
- *   process.stdout.write(delta);
- * }
+ * const message = await response.getMessage(); // Tools auto-executed!
  *
- * // Full message with metadata
- * const response = openrouter.beta.responses.get({
- *   model: "anthropic/claude-3-opus",
- *   input: [{ role: "user", content: "Hello!" }]
- * });
- * const message = await response.getMessage();
- * console.log(message.content);
+ * // Stream with preliminary results
+ * for await (const event of response.getFullChatStream()) {
+ *   if (event.type === "content.delta") {
+ *     process.stdout.write(event.delta);
+ *   } else if (event.type === "tool.preliminary_result") {
+ *     console.log("Tool progress:", event.result);
+ *   }
+ * }
  * ```
  */
 export function getResponse(
   client: OpenRouterCore,
-  request: Omit<models.OpenResponsesRequest, "stream">,
+  request: Omit<models.OpenResponsesRequest, "stream"> & {
+    tools?: EnhancedTool[];
+    maxToolRounds?: MaxToolRounds;
+  },
   options?: RequestOptions,
 ): ResponseWrapper {
-  return new ResponseWrapper({
+  const { tools, maxToolRounds, ...apiRequest } = request;
+
+  // Convert enhanced tools to API format if provided
+  const apiTools = tools ? convertEnhancedToolsToAPIFormat(tools) : undefined;
+
+  // Build the request with converted tools
+  const finalRequest = {
+    ...apiRequest,
+    ...(apiTools && { tools: apiTools }),
+  };
+
+  const wrapperOptions: {
+    client: OpenRouterCore;
+    request: models.OpenResponsesRequest;
+    options: RequestOptions;
+    tools?: EnhancedTool[];
+    maxToolRounds?: MaxToolRounds;
+  } = {
     client,
-    request: { ...request },
+    request: finalRequest,
     options: options ?? {},
-  });
+  };
+
+  if (tools) {
+    wrapperOptions.tools = tools;
+  }
+
+  if (maxToolRounds !== undefined) {
+    wrapperOptions.maxToolRounds = maxToolRounds;
+  }
+
+  return new ResponseWrapper(wrapperOptions);
 }
diff --git a/src/index.ts b/src/index.ts
index 734a437d..c25fc112 100644
--- a/src/index.ts
+++ b/src/index.ts
@@ -10,5 +10,18 @@ export type { Fetcher, HTTPClientOptions } from "./lib/http.js";
 export { ResponseWrapper } from "./lib/response-wrapper.js";
 export type { GetResponseOptions } from "./lib/response-wrapper.js";
 export { ReusableReadableStream } from "./lib/reusable-stream.js";
+export type {
+  EnhancedTool,
+  ToolWithExecute,
+  ToolWithGenerator,
+  ManualTool,
+  ParsedToolCall,
+  ToolExecutionResult,
+  MaxToolRounds,
+  TurnContext,
+  EnhancedResponseStreamEvent,
+  ToolStreamEvent,
+  ChatStreamEvent,
+} from "./lib/tool-types.js";
 // #endregion
 export * from "./sdk/sdk.js";
diff --git a/src/lib/response-wrapper.ts b/src/lib/response-wrapper.ts
index 70197b8c..e7ed07ff 100644
--- a/src/lib/response-wrapper.ts
+++ b/src/lib/response-wrapper.ts
@@ -12,12 +12,29 @@ import {
   consumeStreamForCompletion,
   extractMessageFromResponse,
   extractTextFromResponse,
+  extractToolCallsFromResponse,
+  buildToolCallStream,
 } from "./stream-transformers.js";
+import {
+  EnhancedTool,
+  ParsedToolCall,
+  MaxToolRounds,
+  TurnContext,
+  hasExecuteFunction,
+  EnhancedResponseStreamEvent,
+  ToolStreamEvent,
+  ChatStreamEvent,
+} from "./tool-types.js";
+import {
+  executeTool,
+} from "./tool-executor.js";
 
 export interface GetResponseOptions {
   request: models.OpenResponsesRequest;
   client: OpenRouterCore;
   options?: RequestOptions;
+  tools?: EnhancedTool[];
+  maxToolRounds?: MaxToolRounds;
 }
 
 /**
@@ -40,6 +57,14 @@ export class ResponseWrapper {
   private textPromise: Promise<string> | null = null;
   private options: GetResponseOptions;
   private initPromise: Promise<void> | null = null;
+  private toolExecutionPromise: Promise<void> | null = null;
+  private finalResponse: models.OpenResponsesNonStreamingResponse | null = null;
+  private preliminaryResults: Map<string, unknown[]> = new Map();
+  private allToolExecutionRounds: Array<{
+    round: number;
+    toolCalls: ParsedToolCall[];
+    response: models.OpenResponsesNonStreamingResponse;
+  }> = [];
 
   constructor(options: GetResponseOptions) {
     this.options = options;
@@ -78,9 +103,183 @@ export class ResponseWrapper {
     return this.initPromise;
   }
 
+  /**
+   * Execute tools automatically if they are provided and have execute functions
+   * This is idempotent - multiple calls will return the same promise
+   */
+  private async executeToolsIfNeeded(): Promise<void> {
+    if (this.toolExecutionPromise) {
+      return this.toolExecutionPromise;
+    }
+
+    this.toolExecutionPromise = (async () => {
+      await this.initStream();
+
+      if (!this.reusableStream) {
+        throw new Error("Stream not initialized");
+      }
+
+      // Get the initial response
+      const initialResponse = await consumeStreamForCompletion(this.reusableStream);
+
+      // Check if we have tools and if auto-execution is enabled
+      const shouldAutoExecute = this.options.tools &&
+                                this.options.tools.length > 0 &&
+                                initialResponse.output.some(
+                                  (item) => "type" in item && item.type === "function_call"
+                                );
+
+      if (!shouldAutoExecute) {
+        // No tools to execute, use initial response
+        this.finalResponse = initialResponse;
+        return;
+      }
+
+      // Extract tool calls
+      const toolCalls = extractToolCallsFromResponse(initialResponse);
+
+      // Check if any have execute functions
+      const executableTools = toolCalls.filter((toolCall) => {
+        const tool = this.options.tools?.find((t) => t.function.name === toolCall.name);
+        return tool && hasExecuteFunction(tool);
+      });
+
+      if (executableTools.length === 0) {
+        // No executable tools, use initial response
+        this.finalResponse = initialResponse;
+        return;
+      }
+
+      // Get maxToolRounds configuration
+      const maxToolRounds = this.options.maxToolRounds ?? 5;
+
+      let currentResponse = initialResponse;
+      let currentRound = 0;
+      let currentInput: models.OpenResponsesInput = this.options.request.input || [];
+
+      while (true) {
+        const currentToolCalls = extractToolCallsFromResponse(currentResponse);
+
+        if (currentToolCalls.length === 0) {
+          break;
+        }
+
+        const hasExecutable = currentToolCalls.some((toolCall) => {
+          const tool = this.options.tools?.find((t) => t.function.name === toolCall.name);
+          return tool && hasExecuteFunction(tool);
+        });
+
+        if (!hasExecutable) {
+          break;
+        }
+
+        // Check if we should continue based on maxToolRounds
+        if (typeof maxToolRounds === "number") {
+          if (currentRound >= maxToolRounds) {
+            break;
+          }
+        } else if (typeof maxToolRounds === "function") {
+          const shouldContinue = maxToolRounds(
+            currentRound,
+            currentToolCalls,
+            this.allToolExecutionRounds.map((r) => r.response)
+          );
+          if (!shouldContinue) {
+            break;
+          }
+        }
+
+        // Store execution round info
+        this.allToolExecutionRounds.push({
+          round: currentRound,
+          toolCalls: currentToolCalls,
+          response: currentResponse,
+        });
+
+        // Build turn context for tool execution
+        const turnContext: TurnContext = {
+          numberOfTurns: currentRound + 1, // 1-indexed
+          messageHistory: currentInput,
+          ...(this.options.request.model && { model: this.options.request.model }),
+          ...(this.options.request.models && { models: this.options.request.models }),
+        };
+
+        // Execute all tool calls
+        const toolResults: Array<models.OpenResponsesFunctionCallOutput> = [];
+
+        for (const toolCall of currentToolCalls) {
+          const tool = this.options.tools?.find((t) => t.function.name === toolCall.name);
+
+          if (!tool || !hasExecuteFunction(tool)) {
+            continue;
+          }
+
+          const result = await executeTool(tool, toolCall, turnContext);
+
+          // Store preliminary results
+          if (result.preliminaryResults && result.preliminaryResults.length > 0) {
+            this.preliminaryResults.set(toolCall.id, result.preliminaryResults);
+          }
+
+          toolResults.push({
+            type: "function_call_output" as const,
+            id: `output_${toolCall.id}`,
+            callId: toolCall.id,
+            output: result.error
+              ? JSON.stringify({ error: result.error.message })
+              : JSON.stringify(result.result),
+          });
+        }
+
+        // Build new input with tool results
+        // For the Responses API, we need to include the tool results in the input
+        const newInput: models.OpenResponsesInput = [
+          ...(Array.isArray(currentResponse.output) ? currentResponse.output : [currentResponse.output]),
+          ...toolResults,
+        ];
+
+        // Update current input for next iteration
+        currentInput = newInput;
+
+        // Make new request with tool results
+        const newRequest: models.OpenResponsesRequest = {
+          ...this.options.request,
+          input: newInput,
+          stream: false,
+        };
+
+        const newResult = await betaResponsesSend(
+          this.options.client,
+          newRequest,
+          this.options.options
+        );
+
+        if (!newResult.ok) {
+          throw newResult.error;
+        }
+
+        // Handle the result - it might be a stream or a response
+        const value = newResult.value;
+        if (value && typeof value === "object" && "toReadableStream" in value) {
+          // It's a stream, consume it
+          const stream = new ReusableReadableStream(value as EventStream<models.OpenResponsesStreamEvent>);
+          currentResponse = await consumeStreamForCompletion(stream);
+        } else {
+          currentResponse = value as models.OpenResponsesNonStreamingResponse;
+        }
+
+        currentRound++;
+      }
+
+      this.finalResponse = currentResponse;
+    })();
+
+    return this.toolExecutionPromise;
+  }
+
   /**
    * Get the completed message from the response.
-   * This will consume the stream until completion and extract the first message.
+   * This will consume the stream until completion, execute any tools, and extract the first message.
    * Returns an AssistantMessage in chat format.
    */
   getMessage(): Promise<models.AssistantMessage> {
@@ -89,13 +288,13 @@ export class ResponseWrapper {
     }
 
     this.messagePromise = (async (): Promise<models.AssistantMessage> => {
-      await this.initStream();
-      if (!this.reusableStream) {
-        throw new Error("Stream not initialized");
+      await this.executeToolsIfNeeded();
+
+      if (!this.finalResponse) {
+        throw new Error("Response not available");
       }
 
-      const completedResponse = await consumeStreamForCompletion(this.reusableStream);
-      return extractMessageFromResponse(completedResponse);
+      return extractMessageFromResponse(this.finalResponse);
     })();
 
     return this.messagePromise;
@@ -103,7 +302,7 @@ export class ResponseWrapper {
 
   /**
    * Get just the text content from the response.
-   * This will consume the stream until completion and extract the text.
+   * This will consume the stream until completion, execute any tools, and extract the text.
    */
   getText(): Promise<string> {
     if (this.textPromise) {
@@ -111,13 +310,13 @@ export class ResponseWrapper {
     }
 
     this.textPromise = (async () => {
-      await this.initStream();
-      if (!this.reusableStream) {
-        throw new Error("Stream not initialized");
+      await this.executeToolsIfNeeded();
+
+      if (!this.finalResponse) {
+        throw new Error("Response not available");
       }
 
-      const completedResponse = await consumeStreamForCompletion(this.reusableStream);
-      return extractTextFromResponse(completedResponse);
+      return extractTextFromResponse(this.finalResponse);
     })();
 
     return this.textPromise;
@@ -126,8 +325,9 @@ export class ResponseWrapper {
   /**
    * Stream all response events as they arrive.
    * Multiple consumers can iterate over this stream concurrently.
+   * Includes preliminary tool result events after tool execution.
    */
-  getFullResponsesStream(): AsyncIterableIterator<models.OpenResponsesStreamEvent> {
+  getFullResponsesStream(): AsyncIterableIterator<EnhancedResponseStreamEvent> {
     return (async function* (this: ResponseWrapper) {
       await this.initStream();
       if (!this.reusableStream) {
@@ -135,7 +335,27 @@ export class ResponseWrapper {
       }
 
       const consumer = this.reusableStream.createConsumer();
-      yield* consumer;
+
+      // Yield original events wrapped
+      for await (const event of consumer) {
+        yield { _tag: "original" as const, event };
+      }
+
+      // After stream completes, check if tools were executed and emit preliminary results
+      await this.executeToolsIfNeeded();
+
+      // Emit all preliminary results
+      for (const [toolCallId, results] of this.preliminaryResults) {
+        for (const result of results) {
+          yield {
+            _tag: "tool_preliminary" as const,
+            type: "tool.preliminary_result" as const,
+            toolCallId,
+            result,
+            timestamp: Date.now(),
+          };
+        }
+      }
     }.call(this));
   }
 
@@ -186,30 +406,50 @@ export class ResponseWrapper {
   }
 
   /**
-   * Stream only tool call argument deltas as they arrive.
-   * This filters the full event stream to only yield function call arguments.
+   * Stream tool call argument deltas and preliminary results.
+   * This filters the full event stream to yield:
+   * - Tool call argument deltas as { type: "delta", content: string }
+   * - Preliminary results as { type: "preliminary_result", toolCallId, result }
    */
-  getToolStream(): AsyncIterableIterator<string> {
+  getToolStream(): AsyncIterableIterator<ToolStreamEvent> {
     return (async function* (this: ResponseWrapper) {
       await this.initStream();
       if (!this.reusableStream) {
         throw new Error("Stream not initialized");
       }
 
-      yield* extractToolDeltas(this.reusableStream);
+      // Yield tool deltas as structured events
+      for await (const delta of extractToolDeltas(this.reusableStream)) {
+        yield { type: "delta" as const, content: delta };
+      }
+
+      // After stream completes, check if tools were executed and emit preliminary results
+      await this.executeToolsIfNeeded();
+
+      // Emit all preliminary results
+      for (const [toolCallId, results] of this.preliminaryResults) {
+        for (const result of results) {
+          yield {
+            type: "preliminary_result" as const,
+            toolCallId,
+            result,
+          };
+        }
+      }
     }.call(this));
   }
 
   /**
    * Stream events in chat format (compatibility layer).
    * Note: This transforms responses API events into a chat-like format.
+   * Includes preliminary tool result events after tool execution.
    *
    * @remarks
    * This is a compatibility method that attempts to transform the responses API
    * stream into a format similar to the chat API. Due to differences in the APIs,
    * this may not be a perfect mapping.
    */
-  getFullChatStream(): AsyncIterableIterator<any> {
+  getFullChatStream(): AsyncIterableIterator<ChatStreamEvent> {
     return (async function* (this: ResponseWrapper) {
       await this.initStream();
       if (!this.reusableStream) {
@@ -226,13 +466,13 @@ export class ResponseWrapper {
         if (event.type === "response.output_text.delta") {
           const deltaEvent = event as models.OpenResponsesStreamEventResponseOutputTextDelta;
           yield {
-            type: "content.delta",
+            type: "content.delta" as const,
             delta: deltaEvent.delta,
           };
         } else if (event.type === "response.completed") {
           const completedEvent = event as models.OpenResponsesStreamEventResponseCompleted;
           yield {
-            type: "message.complete",
+            type: "message.complete" as const,
             response: completedEvent.response,
           };
         } else {
@@ -243,9 +483,55 @@ export class ResponseWrapper {
           };
         }
       }
+
+      // After stream completes, check if tools were executed and emit preliminary results
+      await this.executeToolsIfNeeded();
+
+      // Emit all preliminary results
+      for (const [toolCallId, results] of this.preliminaryResults) {
+        for (const result of results) {
+          yield {
+            type: "tool.preliminary_result" as const,
+            toolCallId,
+            result,
+          };
+        }
+      }
+    }.call(this));
+  }
+
+  /**
+   * Get all tool calls from the completed response (before auto-execution).
+   * Note: If tools have execute functions, they will be automatically executed
+   * and this will return the tool calls from the initial response.
+   * Returns structured tool calls with parsed arguments.
+   */
+  async getToolCalls(): Promise<ParsedToolCall[]> {
+    await this.initStream();
+    if (!this.reusableStream) {
+      throw new Error("Stream not initialized");
+    }
+
+    const completedResponse = await consumeStreamForCompletion(this.reusableStream);
+    return extractToolCallsFromResponse(completedResponse);
+  }
+
+  /**
+   * Stream structured tool call objects as they're completed.
+   * Each iteration yields a complete tool call with parsed arguments.
+   */
+  getToolCallsStream(): AsyncIterableIterator<ParsedToolCall> {
+    return (async function* (this: ResponseWrapper) {
+      await this.initStream();
+      if (!this.reusableStream) {
+        throw new Error("Stream not initialized");
+      }
+
+      yield* buildToolCallStream(this.reusableStream);
     }.call(this));
   }
 
+
   /**
    * Cancel the underlying stream and all consumers
    */
diff --git a/src/lib/stream-transformers.ts b/src/lib/stream-transformers.ts
index 639d4a78..9e7dca6f 100644
--- a/src/lib/stream-transformers.ts
+++ b/src/lib/stream-transformers.ts
@@ -1,5 +1,6 @@
 import * as models from "../models/index.js";
 import { ReusableReadableStream } from "./reusable-stream.js";
+import { ParsedToolCall } from "./tool-types.js";
 
 /**
  * Extract text deltas from responses stream events
@@ -199,3 +200,167 @@ export function extractTextFromResponse(
 
   return "";
 }
+
+/**
+ * Extract all tool calls from a completed response
+ * Returns parsed tool calls with arguments as objects (not JSON strings)
+ */
+export function extractToolCallsFromResponse(
+  response: models.OpenResponsesNonStreamingResponse,
+): ParsedToolCall[] {
+  const toolCalls: ParsedToolCall[] = [];
+
+  for (const item of response.output) {
+    if ("type" in item && item.type === "function_call") {
+      const functionCallItem = item as models.ResponsesOutputItemFunctionCall;
+
+      try {
+        const parsedArguments = JSON.parse(functionCallItem.arguments);
+
+        toolCalls.push({
+          id: functionCallItem.callId,
+          name: functionCallItem.name,
+          arguments: parsedArguments,
+        });
+      } catch (error) {
+        console.error(
+          `Failed to parse tool call arguments for ${functionCallItem.name}:`,
+          error
+        );
+        // Include the tool call with unparsed arguments
+        toolCalls.push({
+          id: functionCallItem.callId,
+          name: functionCallItem.name,
+          arguments: functionCallItem.arguments, // Keep as string if parsing fails
+        });
+      }
+    }
+  }
+
+  return toolCalls;
+}
+
+/**
+ * Build incremental tool call updates from responses stream events
+ * Yields structured tool call objects as they're built from deltas
+ */
+export async function* buildToolCallStream(
+  stream: ReusableReadableStream<models.OpenResponsesStreamEvent>,
+): AsyncIterableIterator<ParsedToolCall> {
+  const consumer = stream.createConsumer();
+
+  // Track tool calls being built
+  const toolCallsInProgress = new Map<
+    string,
+    {
+      id: string;
+      name: string;
+      argumentsAccumulated: string;
+    }
+  >();
+
+  for await (const event of consumer) {
+    if (!("type" in event)) continue;
+
+    switch (event.type) {
+      case "response.output_item.added": {
+        const itemEvent = event as models.OpenResponsesStreamEventResponseOutputItemAdded;
+        if (
+          itemEvent.item &&
+          "type" in itemEvent.item &&
+          itemEvent.item.type === "function_call"
+        ) {
+          const functionCallItem = itemEvent.item as models.ResponsesOutputItemFunctionCall;
+          toolCallsInProgress.set(functionCallItem.callId, {
+            id: functionCallItem.callId,
+            name: functionCallItem.name,
+            argumentsAccumulated: "",
+          });
+        }
+        break;
+      }
+
+      case "response.function_call_arguments.delta": {
+        const deltaEvent =
+          event as models.OpenResponsesStreamEventResponseFunctionCallArgumentsDelta;
+        const toolCall = toolCallsInProgress.get(deltaEvent.itemId);
+        if (toolCall && deltaEvent.delta) {
+          toolCall.argumentsAccumulated += deltaEvent.delta;
+        }
+        break;
+      }
+
+      case "response.function_call_arguments.done": {
+        const doneEvent =
+          event as models.OpenResponsesStreamEventResponseFunctionCallArgumentsDone;
+        const toolCall = toolCallsInProgress.get(doneEvent.itemId);
+
+        if (toolCall) {
+          // Parse complete arguments
+          try {
+            const parsedArguments = JSON.parse(doneEvent.arguments);
+            yield {
+              id: toolCall.id,
+              name: doneEvent.name,
+              arguments: parsedArguments,
+            };
+          } catch (error) {
+            // Yield with unparsed arguments if parsing fails
+            yield {
+              id: toolCall.id,
+              name: doneEvent.name,
+              arguments: doneEvent.arguments,
+            };
+          }
+
+          // Clean up
+          toolCallsInProgress.delete(doneEvent.itemId);
+        }
+        break;
+      }
+
+      case "response.output_item.done": {
+        const itemDoneEvent = event as models.OpenResponsesStreamEventResponseOutputItemDone;
+        if (
+          itemDoneEvent.item &&
+          "type" in itemDoneEvent.item &&
+          itemDoneEvent.item.type === "function_call"
+        ) {
+          const functionCallItem = itemDoneEvent.item as models.ResponsesOutputItemFunctionCall;
+
+          // Yield final tool call if we haven't already
+          if (toolCallsInProgress.has(functionCallItem.callId)) {
+            try {
+              const parsedArguments = JSON.parse(functionCallItem.arguments);
+              yield {
+                id: functionCallItem.callId,
+                name: functionCallItem.name,
+                arguments: parsedArguments,
+              };
+            } catch (error) {
+              yield {
+                id: functionCallItem.callId,
+                name: functionCallItem.name,
+                arguments: functionCallItem.arguments,
+              };
+            }
+
+            toolCallsInProgress.delete(functionCallItem.callId);
+          }
+        }
+        break;
+      }
+    }
+  }
+}
+
+/**
+ * Check if a response contains any tool calls
+ */
+export function responseHasToolCalls(
+  response: models.OpenResponsesNonStreamingResponse,
+): boolean {
+  return response.output.some(
+    (item) => "type" in item && item.type === "function_call"
+  );
+}
diff --git a/src/lib/tool-executor.ts b/src/lib/tool-executor.ts
new file mode 100644
index 00000000..45b4feda
--- /dev/null
+++ b/src/lib/tool-executor.ts
@@ -0,0 +1,249 @@
+import { ZodType, ZodError, toJSONSchema } from "zod/v4";
+import {
+  EnhancedTool,
+  ToolExecutionResult,
+  ParsedToolCall,
+  APITool,
+  TurnContext,
+  hasExecuteFunction,
+  isGeneratorTool,
+  isRegularExecuteTool,
+} from "./tool-types.js";
+
+/**
+ * Convert a Zod schema to JSON Schema using Zod v4's toJSONSchema function
+ */
+export function convertZodToJsonSchema(zodSchema: ZodType): Record<string, any> {
+  const jsonSchema = toJSONSchema(zodSchema, {
+    target: "openapi-3.0",
+  });
+  return jsonSchema as Record<string, any>;
+}
+
+/**
+ * Convert enhanced tools to OpenRouter API format
+ */
+export function convertEnhancedToolsToAPIFormat(
+  tools: EnhancedTool[]
+): APITool[] {
+  return tools.map((tool) => ({
+    type: "function" as const,
+    name: tool.function.name,
+    description: tool.function.description || null,
+    strict: null,
+    parameters: convertZodToJsonSchema(tool.function.inputSchema),
+  }));
+}
+
+/**
+ * Validate tool input against Zod schema
+ * @throws ZodError if validation fails
+ */
+export function validateToolInput<T>(schema: ZodType<T>, args: unknown): T {
+  return schema.parse(args);
+}
+
+/**
+ * Validate tool output against Zod schema
+ * @throws ZodError if validation fails
+ */
+export function validateToolOutput<T>(schema: ZodType<T>, result: unknown): T {
+  return schema.parse(result);
+}
+
+/**
+ * Parse tool call arguments from JSON string
+ */
+export function parseToolCallArguments(argumentsString: string): unknown {
+  try {
+    return JSON.parse(argumentsString);
+  } catch (error) {
+    throw new Error(
+      `Failed to parse tool call arguments: ${
+        error instanceof Error ? error.message : String(error)
+      }`
+    );
+  }
+}
+
+/**
+ * Execute a regular (non-generator) tool
+ */
+export async function executeRegularTool(
+  tool: EnhancedTool,
+  toolCall: ParsedToolCall,
+  context: TurnContext
+): Promise<ToolExecutionResult> {
+  if (!isRegularExecuteTool(tool)) {
+    throw new Error(
+      `Tool "${toolCall.name}" is not a regular execute tool or has no execute function`
+    );
+  }
+
+  try {
+    // Validate input
+    const validatedInput = validateToolInput(
+      tool.function.inputSchema,
+      toolCall.arguments
+    );
+
+    // Execute tool with context
+    const result = await Promise.resolve(
+      tool.function.execute(validatedInput as any, context)
+    );
+
+    // Validate output if schema is provided
+    if (tool.function.outputSchema) {
+      const validatedOutput = validateToolOutput(
+        tool.function.outputSchema,
+        result
+      );
+
+      return {
+        toolCallId: toolCall.id,
+        toolName: toolCall.name,
+        result: validatedOutput,
+      };
+    }
+
+    return {
+      toolCallId: toolCall.id,
+      toolName: toolCall.name,
+      result,
+    };
+  } catch (error) {
+    return {
+      toolCallId: toolCall.id,
+      toolName: toolCall.name,
+      result: null,
+      error: error instanceof Error ? error : new Error(String(error)),
+    };
+  }
+}
+
+/**
+ * Execute a generator tool and collect preliminary and final results
+ * Following Vercel AI SDK pattern:
+ * - All yielded values are preliminary results (for streaming to UI)
+ * - Last yielded value is the final result (sent to model)
+ */
+export async function executeGeneratorTool(
+  tool: EnhancedTool,
+  toolCall: ParsedToolCall,
+  context: TurnContext,
+  onPreliminaryResult?: (toolCallId: string, result: unknown) => void
+): Promise<ToolExecutionResult> {
+  if (!isGeneratorTool(tool)) {
+    throw new Error(`Tool "${toolCall.name}" is not a generator tool`);
+  }
+
+  try {
+    // Validate input
+    const validatedInput = validateToolInput(
+      tool.function.inputSchema,
+      toolCall.arguments
+    );
+
+    // Execute generator and collect all results
+    const preliminaryResults: unknown[] = [];
+    let finalResult: unknown = null;
+
+    for await (const event of tool.function.execute(validatedInput as any, context)) {
+      // Validate event against eventSchema
+      const validatedEvent = validateToolOutput(tool.function.eventSchema, event);
+
+      preliminaryResults.push(validatedEvent);
+      finalResult = validatedEvent;
+
+      // Emit preliminary result via callback
+      if (onPreliminaryResult) {
+        onPreliminaryResult(toolCall.id, validatedEvent);
+      }
+    }
+
+    // The last yielded value is the final result sent to model
+    return {
+      toolCallId: toolCall.id,
+      toolName: toolCall.name,
+      result: finalResult,
+      preliminaryResults,
+    };
+  } catch (error) {
+    return {
+      toolCallId: toolCall.id,
+      toolName: toolCall.name,
+      result: null,
+      error: error instanceof Error ? error : new Error(String(error)),
+    };
+  }
+}
+
+/**
+ * Execute a tool call
+ * Automatically detects if it's a regular or generator tool
+ */
+export async function executeTool(
+  tool: EnhancedTool,
+  toolCall: ParsedToolCall,
+  context: TurnContext,
+  onPreliminaryResult?: (toolCallId: string, result: unknown) => void
+): Promise<ToolExecutionResult> {
+  if (!hasExecuteFunction(tool)) {
+    throw new Error(
+      `Tool "${toolCall.name}" has no execute function. Use manual tool execution.`
+    );
+  }
+
+  if (isGeneratorTool(tool)) {
+    return executeGeneratorTool(tool, toolCall, context, onPreliminaryResult);
+  }
+
+  return executeRegularTool(tool, toolCall, context);
+}
+
+/**
+ * Find a tool by name in the tools array
+ */
+export function findToolByName(
+  tools: EnhancedTool[],
+  name: string
+): EnhancedTool | undefined {
+  return tools.find((tool) => tool.function.name === name);
+}
+
+/**
+ * Format tool execution result as a string for sending to the model
+ */
+export function formatToolResultForModel(result: ToolExecutionResult): string {
+  if (result.error) {
+    return JSON.stringify({
+      error: result.error.message,
+      toolName: result.toolName,
+    });
+  }
+
+  return JSON.stringify(result.result);
+}
+
+/**
+ * Create a user-friendly error message for tool execution errors
+ */
+export function formatToolExecutionError(
+  error: Error,
+  toolCall: ParsedToolCall
+): string {
+  if (error instanceof ZodError) {
+    const issues = error.issues.map((issue) => ({
+      path: issue.path.join("."),
+      message: issue.message,
+    }));
+
+    return `Tool "${toolCall.name}" validation error:\n${JSON.stringify(
+      issues,
+      null,
+      2
+    )}`;
+  }
+
+  return `Tool "${toolCall.name}" execution error: ${error.message}`;
+}
diff --git a/src/lib/tool-orchestrator.ts b/src/lib/tool-orchestrator.ts
new file mode 100644
index 00000000..d5524bd7
--- /dev/null
+++ b/src/lib/tool-orchestrator.ts
@@ -0,0 +1,206 @@
+import * as models from "../models/index.js";
+import {
+  EnhancedTool,
+  ToolExecutionResult,
+  hasExecuteFunction,
+} from "./tool-types.js";
+import {
+  executeTool,
+  findToolByName,
+} from "./tool-executor.js";
+import {
+  extractToolCallsFromResponse,
+  responseHasToolCalls,
+} from "./stream-transformers.js";
+
+/**
+ * Options for tool execution
+ */
+export interface ToolExecutionOptions {
+  maxRounds?: number;
+  onPreliminaryResult?: (toolCallId: string, result: unknown) => void;
+}
+
+/**
+ * Result of the tool execution loop
+ */
+export interface ToolOrchestrationResult {
+  finalResponse: models.OpenResponsesNonStreamingResponse;
+  allResponses: models.OpenResponsesNonStreamingResponse[];
+  toolExecutionResults: ToolExecutionResult[];
+  conversationInput: models.OpenResponsesInput;
+}
+
+/**
+ * Execute tool calls and manage multi-turn conversations
+ * This orchestrates the loop of: request -> tool calls -> execute -> send results -> repeat
+ *
+ * @param sendRequest - Function to send a request and get a response
+ * @param initialInput - Starting input for the conversation
+ * @param tools - Enhanced tools with Zod schemas and execute functions
+ * @param apiTools - Converted tools in API format (JSON Schema)
+ * @param options - Execution options
+ * @returns Result containing final response and all execution data
+ */
+export async function executeToolLoop(
+  sendRequest: (
+    input: models.OpenResponsesInput,
+    tools: any[]
+  ) => Promise<models.OpenResponsesNonStreamingResponse>,
+  initialInput: models.OpenResponsesInput,
+  tools: EnhancedTool[],
+  apiTools: any[],
+  options: ToolExecutionOptions = {}
+): Promise<ToolOrchestrationResult> {
+  const maxRounds = options.maxRounds ?? 5;
+  const onPreliminaryResult = options.onPreliminaryResult;
+
+  const allResponses: models.OpenResponsesNonStreamingResponse[] = [];
+  const toolExecutionResults: ToolExecutionResult[] = [];
+  let conversationInput: models.OpenResponsesInput = initialInput;
+
+  let currentRound = 0;
+  let currentResponse: models.OpenResponsesNonStreamingResponse;
+
+  // Initial request
+  currentResponse = await sendRequest(conversationInput, apiTools);
+  allResponses.push(currentResponse);
+
+  // Loop until no more tool calls or max rounds reached
+  while (responseHasToolCalls(currentResponse) && currentRound < maxRounds) {
+    currentRound++;
+
+    // Extract tool calls from response
+    const toolCalls = extractToolCallsFromResponse(currentResponse);
+
+    if (toolCalls.length === 0) {
+      break;
+    }
+
+    // Check if any tools have execute functions
+    const hasExecutableTools = toolCalls.some((toolCall) => {
+      const tool = findToolByName(tools, toolCall.name);
+      return tool && hasExecuteFunction(tool);
+    });
+
+    // If no executable tools, return (manual execution mode)
+    if (!hasExecutableTools) {
+      break;
+    }
+
+    // Execute all tool calls
+    const roundResults: ToolExecutionResult[] = [];
+
+    for (const toolCall of toolCalls) {
+      const tool = findToolByName(tools, toolCall.name);
+
+      if (!tool) {
+        // Tool not found in definitions
+        roundResults.push({
+          toolCallId: toolCall.id,
+          toolName: toolCall.name,
+          result: null,
+          error: new Error(`Tool "${toolCall.name}" not found in tool definitions`),
+        });
+        continue;
+      }
+
+      if (!hasExecuteFunction(tool)) {
+        // Tool has no execute function - skip
+        continue;
+      }
+
+      // Build turn context
+      const turnContext: import("./tool-types.js").TurnContext = {
+        numberOfTurns: currentRound,
+        messageHistory: conversationInput,
+      };
+
+      // Execute the tool
+      const result = await executeTool(tool, toolCall, turnContext, onPreliminaryResult);
+      roundResults.push(result);
+    }
+
+    toolExecutionResults.push(...roundResults);
+
+    // Build array input with all output from previous response plus tool results
+    // The API expects continuation via previousResponseId, not by including outputs
+    // For now, we'll keep the conversation going via previousResponseId
+    conversationInput = initialInput; // Keep original input
+
+    // Note: The OpenRouter Responses API uses previousResponseId for continuation
+    // Tool results are automatically associated with the previous response's tool calls
+
+    // Send updated conversation to API - this should use previousResponseId
+    currentResponse = await sendRequest(conversationInput, apiTools);
+    allResponses.push(currentResponse);
+  }
+
+  return {
+    finalResponse: currentResponse,
+    allResponses,
+    toolExecutionResults,
+    conversationInput,
+  };
+}
+
+/**
+ * Convert tool execution results to a map for easy lookup
+ */
+export function toolResultsToMap(
+  results: ToolExecutionResult[]
+): Map<
+  string,
+  {
+    result: unknown;
+    preliminaryResults?: unknown[];
+  }
+> {
+  const map = new Map();
+
+  for (const result of results) {
+    map.set(result.toolCallId, {
+      result: result.result,
+      preliminaryResults: result.preliminaryResults,
+    });
+  }
+
+  return map;
+}
+
+/**
+ * Build a summary of tool executions for debugging/logging
+ */
+export function summarizeToolExecutions(
+  results: ToolExecutionResult[]
+): string {
+  const lines: string[] = [];
+
+  for (const result of results) {
+    if (result.error) {
+      lines.push(`❌ ${result.toolName} (${result.toolCallId}): ERROR - ${result.error.message}`);
+    } else {
+      const prelimCount = result.preliminaryResults?.length ?? 0;
+      const prelimInfo = prelimCount > 0 ? ` (${prelimCount} preliminary results)` : "";
+      lines.push(`✅ ${result.toolName} (${result.toolCallId}): SUCCESS${prelimInfo}`);
+    }
+  }
+
+  return lines.join("\n");
+}
+
+/**
+ * Check if any tool executions had errors
+ */
+export function hasToolExecutionErrors(results: ToolExecutionResult[]): boolean {
+  return results.some((result) => result.error !== undefined);
+}
+
+/**
+ * Get all tool execution errors
+ */
+export function getToolExecutionErrors(results: ToolExecutionResult[]): Error[] {
+  return results
+    .filter((result) => result.error !== undefined)
+    .map((result) => result.error!);
+}
diff --git a/src/lib/tool-types.ts b/src/lib/tool-types.ts
new file mode 100644
index 00000000..f181cc44
--- /dev/null
+++ b/src/lib/tool-types.ts
@@ -0,0 +1,233 @@
+import { z, ZodType, ZodObject, ZodRawShape } from "zod";
+import * as models from "../models/index.js";
+
+/**
+ * Turn context passed to tool execute functions
+ * Contains information about the current conversation state
+ */
+export interface TurnContext {
+  /** Number of tool execution turns so far (1-indexed: first turn = 1) */
+  numberOfTurns: number;
+  /** Current message history being sent to the API */
+  messageHistory: models.OpenResponsesInput;
+  /** Model name if request.model is set */
+  model?: string;
+  /** Model names if request.models is set */
+  models?: string[];
+}
+
+/**
+ * Base tool function interface with inputSchema
+ */
+export interface BaseToolFunction<TInput extends ZodObject<ZodRawShape>> {
+  name: string;
+  description?: string;
+  inputSchema: TInput;
+}
+
+/**
+ * Regular tool with synchronous or asynchronous execute function and optional outputSchema
+ */
+export interface ToolFunctionWithExecute<
+  TInput extends ZodObject<ZodRawShape>,
+  TOutput extends ZodType = ZodType<any>
+> extends BaseToolFunction<TInput> {
+  outputSchema?: TOutput;
+  execute: (
+    params: z.infer<TInput>,
+    context?: TurnContext
+  ) => Promise<z.infer<TOutput>> | z.infer<TOutput>;
+}
+
+/**
+ * Generator-based tool with async generator execute function and eventSchema
+ * Follows Vercel AI SDK pattern:
+ * - All yielded values are "preliminary results" (streamed to UI)
+ * - Last yielded value is the "final result" (sent to model)
+ */
+export interface ToolFunctionWithGenerator<
+  TInput extends ZodObject<ZodRawShape>,
+  TEvent extends ZodType = ZodType<any>
+> extends BaseToolFunction<TInput> {
+  eventSchema: TEvent;
+  execute: (
+    params: z.infer<TInput>,
+    context?: TurnContext
+  ) => AsyncGenerator<z.infer<TEvent>>;
+}
+
+/**
+ * Manual tool without execute function - requires manual handling by developer
+ */
+export interface ManualToolFunction<
+  TInput extends ZodObject<ZodRawShape>,
+  TOutput extends ZodType = ZodType<any>
+> extends BaseToolFunction<TInput> {
+  outputSchema?: TOutput;
+}
+
+/**
+ * Tool with execute function (regular or generator)
+ */
+export type ToolWithExecute<
+  TInput extends ZodObject<ZodRawShape> = ZodObject<ZodRawShape>,
+  TOutput extends ZodType = ZodType<any>
+> = {
+  type: "function";
+  function: ToolFunctionWithExecute<TInput, TOutput>;
+};
+
+/**
+ * Tool with generator execute function
+ */
+export type ToolWithGenerator<
+  TInput extends ZodObject<ZodRawShape> = ZodObject<ZodRawShape>,
+  TEvent extends ZodType = ZodType<any>
+> = {
+  type: "function";
+  function: ToolFunctionWithGenerator<TInput, TEvent>;
+};
+
+/**
+ * Tool without execute function (manual handling)
+ */
+export type ManualTool<
+  TInput extends ZodObject<ZodRawShape> = ZodObject<ZodRawShape>,
+  TOutput extends ZodType = ZodType<any>
+> = {
+  type: "function";
+  function: ManualToolFunction<TInput, TOutput>;
+};
+
+/**
+ * Union type of all enhanced tool types
+ */
+export type EnhancedTool =
+  | ToolWithExecute<any, any>
+  | ToolWithGenerator<any, any>
+  | ManualTool<any, any>;
+
+/**
+ * Type guard to check if a tool has an execute function
+ */
+export function hasExecuteFunction(
+  tool: EnhancedTool
+): tool is ToolWithExecute | ToolWithGenerator {
+  return "execute" in tool.function && typeof tool.function.execute === "function";
+}
+
+/**
+ * Type guard to check if a tool uses a generator (has eventSchema)
+ */
+export function isGeneratorTool(
+  tool: EnhancedTool
+): tool is ToolWithGenerator {
+  return "eventSchema" in tool.function;
+}
+
+/**
+ * Type guard to check if a tool is a regular execution tool (not generator)
+ */
+export function isRegularExecuteTool(
+  tool: EnhancedTool
+): tool is ToolWithExecute {
+  return hasExecuteFunction(tool) && !isGeneratorTool(tool);
+}
+
+/**
+ * Parsed tool call from API response
+ */
+export interface ParsedToolCall {
+  id: string;
+  name: string;
+  arguments: unknown; // Parsed from JSON string
+}
+
+/**
+ * Result of tool execution
+ */
+export interface ToolExecutionResult {
+  toolCallId: string;
+  toolName: string;
+  result: unknown; // Final result (sent to model)
+  preliminaryResults?: unknown[]; // All yielded values from generator
+  error?: Error;
+}
+
+/**
+ * Type for maxToolRounds - can be a number or a function that determines if execution should continue
+ */
+export type MaxToolRounds =
+  | number
+  | ((
+      round: number,
+      toolCalls: ParsedToolCall[],
+      responses: any[] // OpenResponsesNonStreamingResponse[]
+    ) => boolean); // Return true to continue, false to stop
+
+/**
+ * Result of executeTools operation
+ */
+export interface ExecuteToolsResult {
+  finalResponse: any; // ResponseWrapper (avoiding circular dependency)
+  allResponses: any[]; // All ResponseWrappers from each round
+  toolResults: Map<
+    string,
+    {
+      result: unknown;
+      preliminaryResults?: unknown[];
+    }
+  >;
+}
+
+/**
+ * Standard tool format for OpenRouter API (JSON Schema based)
+ * Matches OpenResponsesRequestToolFunction structure
+ */
+export interface APITool {
+  type: "function";
+  name: string;
+  description?: string | null;
+  strict?: boolean | null;
+  parameters: { [k: string]: any | null } | null;
+}
+
+/**
+ * Enhanced stream event types for getFullResponsesStream
+ * Extends OpenResponsesStreamEvent with tool preliminary results
+ */
+export type EnhancedResponseStreamEvent =
+  | { _tag: "original"; event: any } // Original OpenResponsesStreamEvent
+  | {
+      _tag: "tool_preliminary";
+      type: "tool.preliminary_result";
+      toolCallId: string;
+      result: unknown;
+      timestamp: number;
+    };
+
+/**
+ * Tool stream event types for getToolStream
+ * Includes both argument deltas and preliminary results
+ */
+export type ToolStreamEvent =
+  | { type: "delta"; content: string }
+  | {
+      type: "preliminary_result";
+      toolCallId: string;
+      result: unknown;
+    };
+
+/**
+ * Chat stream event types for getFullChatStream
+ * Includes content deltas, completion events, and tool preliminary results
+ */
+export type ChatStreamEvent =
+  | { type: "content.delta"; delta: string }
+  | { type: "message.complete"; response: any }
+  | {
+      type: "tool.preliminary_result";
+      toolCallId: string;
+      result: unknown;
+    }
+  | { type: string; event: any }; // Pass-through for other events
diff --git a/src/sdk/sdk.ts b/src/sdk/sdk.ts
index df850e0a..963da614 100644
--- a/src/sdk/sdk.ts
+++ b/src/sdk/sdk.ts
@@ -7,6 +7,7 @@ import { ClientSDK } from "../lib/sdks.js";
 import { RequestOptions } from "../lib/sdks.js";
 import { ResponseWrapper } from "../lib/response-wrapper.js";
 import { getResponse } from "../funcs/getResponse.js";
+import { EnhancedTool, MaxToolRounds } from "../lib/tool-types.js";
 import * as models from "../models/index.js";
 // #endregion
 import { Analytics } from "./analytics.js";
@@ -118,7 +119,10 @@ export class OpenRouter extends ClientSDK {
    * ```
    */
   getResponse(
-    request: Omit<models.OpenResponsesRequest, "stream">,
+    request: Omit<models.OpenResponsesRequest, "stream"> & {
+      tools?: EnhancedTool[];
+      maxToolRounds?: MaxToolRounds;
+    },
     options?: RequestOptions,
   ): ResponseWrapper {
     return getResponse(this, request, options);
diff --git a/tests/e2e/getResponse-tools.test.ts b/tests/e2e/getResponse-tools.test.ts
new file mode 100644
index 00000000..cf6951ca
--- /dev/null
+++ b/tests/e2e/getResponse-tools.test.ts
@@ -0,0 +1,529 @@
+import { describe, it, expect, beforeAll } from "vitest";
+import { OpenRouter } from "../../src/index.js";
+import { z } from "zod";
+import { toJSONSchema } from "zod/v4";
+import * as dotenv from "dotenv";
+
+dotenv.config();
+
+describe("Enhanced Tool Support for getResponse", () => {
+  let client: OpenRouter;
+
+  beforeAll(() => {
+    const apiKey = process.env.OPENROUTER_API_KEY;
+    if (!apiKey) {
+      throw new Error("OPENROUTER_API_KEY environment variable is required");
+    }
+    client = new OpenRouter({ apiKey });
+  });
+
+  describe("Zod Schema Conversion", () => {
+    it("should convert Zod schema to JSON Schema using v4 toJSONSchema()", () => {
+      const schema = z.object({
+        name: z.string().describe("The user's name"),
+        age: z.number().min(0).describe("The user's age"),
+      });
+
+      const jsonSchema = toJSONSchema(schema, { target: "openapi-3.0" });
+
+      expect(jsonSchema).toHaveProperty("type", "object");
+      expect(jsonSchema).toHaveProperty("properties");
+      expect(jsonSchema.properties).toHaveProperty("name");
+      expect(jsonSchema.properties).toHaveProperty("age");
+    });
+
+    it("should handle complex nested schemas", () => {
+      const schema = z.object({
+        user: z.object({
+          name: z.string(),
+          address: z.object({
+            street: z.string(),
+            city: z.string(),
+          }),
+        }),
+        tags: z.array(z.string()),
+      });
+
+      const jsonSchema = toJSONSchema(schema, { target: "openapi-3.0" });
+
+      expect(jsonSchema.properties.user).toBeDefined();
+      expect(jsonSchema.properties.tags).toBeDefined();
+    });
+
+    it("should preserve descriptions and metadata", () => {
+      const schema = z.object({
+        location: z.string().describe("City and country e.g. Bogotá, Colombia"),
+      });
+
+      const jsonSchema = toJSONSchema(schema, { target: "openapi-3.0" });
+
+      expect(jsonSchema.properties.location.description).toBe(
+        "City and country e.g. Bogotá, Colombia"
+      );
+    });
+  });
+
+  describe("Tool Definition", () => {
+    it("should define tool with inputSchema", async () => {
+      const weatherTool = {
+        type: "function" as const,
+        function: {
+          name: "get_weather",
+          description: "Get current temperature for a given location.",
+          inputSchema: z.object({
+            location: z.string().describe("City and country e.g. Bogotá, Colombia"),
+          }),
+          outputSchema: z.object({
+            temperature: z.number(),
+            description: z.string(),
+          }),
+          execute: async (parameters: { location: string }, context) => {
+            return {
+              temperature: 20,
+              description: "Clear skies",
+            };
+          },
+        },
+      };
+
+      // Tool definition should be valid
+      expect(weatherTool.function.name).toBe("get_weather");
+      expect(weatherTool.function.inputSchema).toBeDefined();
+      expect(weatherTool.function.outputSchema).toBeDefined();
+    });
+
+    it("should validate input against Zod schema", () => {
+      const schema = z.object({
+        location: z.string(),
+        temperature: z.number(),
+      });
+
+      const validInput = { location: "Tokyo", temperature: 25 };
+      const result = schema.safeParse(validInput);
+
+      expect(result.success).toBe(true);
+    });
+
+    it("should reject invalid input with ZodError", () => {
+      const schema = z.object({
+        location: z.string(),
+        temperature: z.number(),
+      });
+
+      const invalidInput = { location: "Tokyo", temperature: "hot" }; // Wrong type
+
+      const result = schema.safeParse(invalidInput);
+
+      expect(result.success).toBe(false);
+      if (!result.success) {
+        expect(result.error).toBeDefined();
+      }
+    });
+  });
+
+  describe("Regular Tool Execution", () => {
+    it("should execute tool with valid input", async () => {
+      const addTool = {
+        type: "function" as const,
+        function: {
+          name: "add_numbers",
+          description: "Add two numbers together",
+          inputSchema: z.object({
+            a: z.number(),
+            b: z.number(),
+          }),
+          outputSchema: z.object({
+            result: z.number(),
+          }),
+          execute: async (params: { a: number; b: number }, context) => {
+            return { result: params.a + params.b };
+          },
+        },
+      };
+
+      const mockContext = {
+        numberOfTurns: 1,
+        messageHistory: [],
+        model: "test-model",
+      };
+      const result = await addTool.function.execute({ a: 5, b: 3 }, mockContext);
+
+      expect(result.result).toBe(8);
+    });
+
+    it("should validate output against outputSchema", () => {
+      const schema = z.object({
+        temperature: z.number(),
+        description: z.string(),
+      });
+
+      const output = { temperature: 72, description: "Sunny" };
+      const result = schema.safeParse(output);
+
+      expect(result.success).toBe(true);
+    });
+
+    it("should handle execution errors gracefully", async () => {
+      const errorTool = {
+        type: "function" as const,
+        function: {
+          name: "error_tool",
+          inputSchema: z.object({}),
+          execute: async (params, context) => {
+            throw new Error("Tool execution failed");
+          },
+        },
+      };
+
+      const mockContext = {
+        numberOfTurns: 1,
+        messageHistory: [],
+        model: "test-model",
+      };
+      await expect(errorTool.function.execute({}, mockContext)).rejects.toThrow(
+        "Tool execution failed"
+      );
+    });
+  });
+
+  describe("Generator Tools (Preliminary Results)", () => {
+    it("should collect all yielded values as preliminary results", async () => {
+      const weatherSchema = z.object({
+        type: z.enum(["start", "update", "end"]),
+        data: z
+          .object({
+            location: z.string().optional(),
+            temperature: z.number().optional(),
+            description: z.string().optional(),
+          })
+          .optional(),
+      });
+
+      const generatorTool = {
+        type: "function" as const,
+        function: {
+          name: "get_weather_with_updates",
+          description: "Get weather with streaming updates",
+          inputSchema: z.object({
+            location: z.string(),
+          }),
+          eventSchema: weatherSchema,
+          execute: async function* (params: { location: string }, context) {
+            yield { type: "start" as const, data: { location: params.location } };
+            yield {
+              type: "update" as const,
+              data: { temperature: 20, description: "Clear skies" },
+            };
+            yield { type: "end" as const };
+          },
+        },
+      };
+
+      const mockContext = {
+        numberOfTurns: 1,
+        messageHistory: [],
+        model: "test-model",
+      };
+      const results: Array<z.infer<typeof weatherSchema>> = [];
+      for await (const result of generatorTool.function.execute({
+        location: "Tokyo",
+      }, mockContext)) {
+        results.push(result);
+      }
+
+      expect(results).toHaveLength(3);
+      expect(results[0].type).toBe("start");
+      expect(results[1].type).toBe("update");
+      expect(results[2].type).toBe("end");
+    });
+
+    it("should send only final (last) yield to model", async () => {
+      const generatorTool = {
+        type: "function" as const,
+        function: {
+          name: "process_data",
+          inputSchema: z.object({ data: z.string() }),
+          eventSchema: z.object({
+            status: z.string(),
+            result: z.any().optional(),
+          }),
+          execute: async function* (params: { data: string }, context) {
+            yield { status: "processing" };
+            yield { status: "almost_done" };
+            yield { status: "complete", result: `Processed: ${params.data}` };
+          },
+        },
+      };
+
+      const mockContext = {
+        numberOfTurns: 1,
+        messageHistory: [],
+        model: "test-model",
+      };
+      const results = [];
+      for await (const result of generatorTool.function.execute({ data: "test" }, mockContext)) {
+        results.push(result);
+      }
+
+      const finalResult = results[results.length - 1];
+      expect(finalResult.status).toBe("complete");
+      expect(finalResult.result).toBe("Processed: test");
+    });
+
+    it("should validate all events against eventSchema", async () => {
+      const eventSchema = z.object({
+        type: z.enum(["start", "end"]),
+        message: z.string(),
+      });
+
+      const validEvent1 = { type: "start" as const, message: "Starting" };
+      const validEvent2 = { type: "end" as const, message: "Done" };
+      const invalidEvent = { type: "middle", message: "Processing" };
+
+      expect(eventSchema.safeParse(validEvent1).success).toBe(true);
+      expect(eventSchema.safeParse(validEvent2).success).toBe(true);
+      expect(eventSchema.safeParse(invalidEvent).success).toBe(false);
+    });
+
+    it("should handle async generators", async () => {
+      async function* testGenerator() {
+        yield 1;
+        await new Promise((resolve) => setTimeout(resolve, 10));
+        yield 2;
+        await new Promise((resolve) => setTimeout(resolve, 10));
+        yield 3;
+      }
+
+      const results = [];
+      for await (const value of testGenerator()) {
+        results.push(value);
+      }
+
+      expect(results).toEqual([1, 2, 3]);
+    });
+
+    it("should emit preliminary results via callback", async () => {
+      const preliminaryResults: any[] = [];
+
+      const generatorTool = {
+        type: "function" as const,
+        function: {
+          name: "streaming_tool",
+          inputSchema: z.object({ input: z.string() }),
+          eventSchema: z.object({ progress: z.number(), message: z.string() }),
+          execute: async function* (params: { input: string }, context) {
+            yield { progress: 25, message: "Quarter done" };
+            yield { progress: 50, message: "Half done" };
+            yield { progress: 100, message: "Complete" };
+          },
+        },
+      };
+
+      const mockContext = {
+        numberOfTurns: 1,
+        messageHistory: [],
+        model: "test-model",
+      };
+      // Simulate callback
+      for await (const result of generatorTool.function.execute({ input: "test" }, mockContext)) {
+        preliminaryResults.push(result);
+      }
+
+      expect(preliminaryResults).toHaveLength(3);
+      expect(preliminaryResults[0].progress).toBe(25);
+      expect(preliminaryResults[1].progress).toBe(50);
+      expect(preliminaryResults[2].progress).toBe(100);
+    });
+  });
+
+  describe("Manual Tool Execution", () => {
+    it("should define tool without execute function", () => {
+      const manualTool = {
+        type: "function" as const,
+        function: {
+          name: "manual_tool",
+          description: "A tool that requires manual handling",
+          inputSchema: z.object({
+            query: z.string(),
+          }),
+          outputSchema: z.object({
+            result: z.string(),
+          }),
+        },
+      };
+
+      expect(manualTool.function.name).toBe("manual_tool");
+      expect(manualTool.function).not.toHaveProperty("execute");
+    });
+  });
+
+  describe("Integration with OpenRouter API", () => {
+    it.skip("should send tool call to API and receive tool call response", async () => {
+      // This test requires actual API integration which we'll implement
+      const weatherTool = {
+        type: "function" as const,
+        function: {
+          name: "get_weather",
+          description: "Get the current weather for a location",
+          inputSchema: z.object({
+            location: z.string().describe("The city and country"),
+          }),
+          outputSchema: z.object({
+            temperature: z.number(),
+            description: z.string(),
+          }),
+          execute: async (params: { location: string }, context) => {
+            return {
+              temperature: 72,
+              description: "Sunny",
+            };
+          },
+        },
+      };
+
+      const response = await client.getResponse({
+        model: "openai/gpt-4o",
+        messages: [
+          {
+            role: "user",
+            content: "What's the weather like in San Francisco?",
+          },
+        ],
+        tools: [weatherTool],
+      });
+
+      const message = await response.getMessage();
+      expect(message).toBeDefined();
+    }, 30000);
+
+    it.skip("should handle multi-turn conversation with tool execution", async () => {
+      // This will test the full loop: request -> tool call -> execute -> send result -> final response
+      const calculatorTool = {
+        type: "function" as const,
+        function: {
+          name: "calculate",
+          description: "Perform a mathematical calculation",
+          inputSchema: z.object({
+            expression: z.string().describe("Math expression to evaluate"),
+          }),
+          outputSchema: z.object({
+            result: z.number(),
+          }),
+          execute: async (params: { expression: string }, context) => {
+            // Simple eval for testing (don't use in production!)
+            const result = eval(params.expression);
+            return { result };
+          },
+        },
+      };
+
+      const response = await client.getResponse(
+        {
+          model: "openai/gpt-4o",
+          messages: [
+            {
+              role: "user",
+              content: "What is 25 * 4?",
+            },
+          ],
+          tools: [calculatorTool],
+        },
+        {
+          autoExecuteTools: true,
+          maxToolRounds: 3,
+        }
+      );
+
+      const finalMessage = await response.getMessage();
+      expect(finalMessage).toBeDefined();
+      expect(finalMessage.content).toBeTruthy();
+    }, 30000);
+  });
+
+  describe("Error Handling", () => {
+    it("should handle Zod input validation errors", () => {
+      const schema = z.object({
+        name: z.string(),
+        age: z.number().positive(),
+      });
+
+      const invalidInput = { name: "John", age: -5 };
+      const result = schema.safeParse(invalidInput);
+
+      expect(result.success).toBe(false);
+      if (!result.success) {
+        expect(result.error.issues).toHaveLength(1);
+        expect(result.error.issues[0].path).toEqual(["age"]);
+      }
+    });
+
+    it("should handle Zod output validation errors", () => {
+      const schema = z.object({
+        temperature: z.number(),
+        description: z.string(),
+      });
+
+      const invalidOutput = { temperature: "hot", description: "Sunny" };
+      const result = schema.safeParse(invalidOutput);
+
+      expect(result.success).toBe(false);
+    });
+
+    it("should provide clear error messages for validation failures", () => {
+      const schema = z.object({
+        email: z.string().email(),
+        age: z.number().min(18),
+      });
+
+      const invalidData = { email: "not-an-email", age: 15 };
+      const result = schema.safeParse(invalidData);
+
+      if (!result.success) {
+        expect(result.error.issues.length).toBeGreaterThan(0);
+        const issues = result.error.issues;
+        expect(issues.some((i) => i.path.includes("email"))).toBe(true);
+        expect(issues.some((i) => i.path.includes("age"))).toBe(true);
+      }
+    });
+  });
+
+  describe("Type Safety", () => {
+    it("should infer correct parameter types from inputSchema", () => {
+      const weatherTool = {
+        type: "function" as const,
+        function: {
+          name: "get_weather",
+          inputSchema: z.object({
+            location: z.string(),
+            units: z.enum(["celsius", "fahrenheit"]).optional(),
+          }),
+          execute: async (params: z.infer<typeof weatherTool.function.inputSchema>, context) => {
+            // TypeScript should infer: { location: string; units?: "celsius" | "fahrenheit" }
+            const location: string = params.location;
+            const units: "celsius" | "fahrenheit" | undefined = params.units;
+            return { location, units };
+          },
+        },
+      };
+
+      expect(weatherTool.function.name).toBe("get_weather");
+    });
+
+    it("should infer correct return types from outputSchema", () => {
+      const outputSchema = z.object({
+        temperature: z.number(),
+        unit: z.enum(["C", "F"]),
+      });
+
+      type OutputType = z.infer<typeof outputSchema>;
+
+      const output: OutputType = {
+        temperature: 72,
+        unit: "F",
+      };
+
+      expect(output.temperature).toBe(72);
+      expect(output.unit).toBe("F");
+    });
+  });
+});

From 20946291f84bb2682b4e83dbac5860fb68d52479 Mon Sep 17 00:00:00 2001
From: Matt Apperson <mattapperson@mini.local>
Date: Wed, 5 Nov 2025 13:15:05 -0500
Subject: [PATCH 4/4] Update maxToolRounds to accept TurnContext-based function
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Changed MaxToolRounds type to accept (context: TurnContext) => boolean
- Removed old 3-parameter function signature for simplicity
- Function receives full TurnContext with numberOfTurns, messageHistory, model/models
- Returns true to allow another turn, false to stop execution
- Updated examples to demonstrate the new function signature
- Simplified implementation logic in response-wrapper.ts

This provides more context to the maxToolRounds function and makes
the API more consistent with tool execute functions.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 examples/tools-example.ts   | 12 ++++++++++++
 src/funcs/getResponse.ts    |  2 +-
 src/lib/response-wrapper.ts | 13 ++++++++-----
 src/lib/tool-types.ts       |  6 +-----
 4 files changed, 22 insertions(+), 11 deletions(-)

diff --git a/examples/tools-example.ts b/examples/tools-example.ts
index e5eb7a53..f3cf4c8c 100644
--- a/examples/tools-example.ts
+++ b/examples/tools-example.ts
@@ -10,6 +10,13 @@
  *
  * The API is simple: just call getResponse() with tools, and await the result.
  * Tools are executed transparently before getMessage() or getText() returns!
+ *
+ * maxToolRounds can be:
+ * - A number: Maximum number of tool execution rounds (default: 5)
+ * - A function: (context: TurnContext) => boolean
+ *   - Return true to allow another turn
+ *   - Return false to stop execution
+ *   - Context includes: numberOfTurns, messageHistory, model/models
  */
 
 import { OpenRouter } from "../src/index.js";
@@ -60,6 +67,11 @@ async function basicToolExample() {
     model: "openai/gpt-4o",
     input: "What's the weather like in San Francisco?",
     tools: [weatherTool],
+    // Example: limit to 3 turns using a function
+    maxToolRounds: (context) => {
+      console.log(`Checking if we should continue (currently on turn ${context.numberOfTurns})`);
+      return context.numberOfTurns < 3; // Allow up to 3 turns
+    },
   });
 
   // Tools are automatically executed! Just get the final message
diff --git a/src/funcs/getResponse.ts b/src/funcs/getResponse.ts
index cb3eed16..97f21213 100644
--- a/src/funcs/getResponse.ts
+++ b/src/funcs/getResponse.ts
@@ -58,7 +58,7 @@ import { convertEnhancedToolsToAPIFormat } from "../lib/tool-executor.js";
  *       }
  *     }
  *   }],
- *   maxToolRounds: 5, // or function: (round, calls, responses) => boolean
+ *   maxToolRounds: 5, // or function: (context: TurnContext) => boolean
  * });
  * const message = await response.getMessage(); // Tools auto-executed!
  *
diff --git a/src/lib/response-wrapper.ts b/src/lib/response-wrapper.ts
index e7ed07ff..2a31bd31 100644
--- a/src/lib/response-wrapper.ts
+++ b/src/lib/response-wrapper.ts
@@ -179,11 +179,14 @@ export class ResponseWrapper {
             break;
           }
         } else if (typeof maxToolRounds === "function") {
-          const shouldContinue = maxToolRounds(
-            currentRound,
-            currentToolCalls,
-            this.allToolExecutionRounds.map((r) => r.response)
-          );
+          // Function signature: (context: TurnContext) => boolean
+          const turnContext: TurnContext = {
+            numberOfTurns: currentRound + 1,
+            messageHistory: currentInput,
+            ...(this.options.request.model && { model: this.options.request.model }),
+            ...(this.options.request.models && { models: this.options.request.models }),
+          };
+          const shouldContinue = maxToolRounds(turnContext);
           if (!shouldContinue) {
             break;
           }
diff --git a/src/lib/tool-types.ts b/src/lib/tool-types.ts
index f181cc44..eca73711 100644
--- a/src/lib/tool-types.ts
+++ b/src/lib/tool-types.ts
@@ -159,11 +159,7 @@ export interface ToolExecutionResult {
  */
 export type MaxToolRounds =
   | number
-  | ((
-      round: number,
-      toolCalls: ParsedToolCall[],
-      responses: any[] // OpenResponsesNonStreamingResponse[]
-    ) => boolean); // Return true to continue, false to stop
+  | ((context: TurnContext) => boolean); // Return true to allow another turn, false to stop
 
 /**
  * Result of executeTools operation