8 changes: 7 additions & 1 deletion libs/langchain-openai/src/chat_models.ts
@@ -107,6 +107,7 @@ import {
  ResponsesTool,
  ResponsesToolChoice,
} from "./utils/tools.js";
+import { handleMultiModalOutput } from "./utils/output.js";

const _FUNCTION_CALL_IDS_MAP_KEY = "__openai_function_call_ids__";

@@ -2721,8 +2722,13 @@ export class ChatOpenAICompletions<
      additional_kwargs.audio = message.audio;
    }

+   const content = handleMultiModalOutput(
+     message.content || "",
+     rawResponse.choices?.[0]?.message
+   );
+
    return new AIMessage({
-     content: message.content || "",
+     content,
      tool_calls: toolCalls,
      invalid_tool_calls: invalidToolCalls,
      additional_kwargs,
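For context, a minimal sketch of what this change means for callers, assuming OpenRouter is reached through its OpenAI-compatible endpoint. The base URL, model name, and environment variable below are illustrative assumptions, not part of this diff:

import { ChatOpenAI } from "@langchain/openai";

// Assumed setup: point the OpenAI-compatible client at OpenRouter
// (illustrative; this PR does not change how the client is configured).
const model = new ChatOpenAI({
  model: "google/gemini-2.5-flash-image-preview",
  apiKey: process.env.OPENROUTER_API_KEY,
  configuration: { baseURL: "https://openrouter.ai/api/v1" },
});

const response = await model.invoke("Draw a cute cat");

// With this change, `content` may be an array of structured blocks rather
// than a plain string when the provider attached generated images.
if (Array.isArray(response.content)) {
  for (const block of response.content) {
    if (typeof block === "object" && block.type === "image" && "url" in block) {
      console.log("image data URL:", (block as { url: string }).url);
    }
  }
}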
143 changes: 143 additions & 0 deletions libs/langchain-openai/src/tests/chat_models.test.ts
@@ -370,6 +370,149 @@ describe("ChatOpenAI", () => {
    ]);
  });

describe("OpenRouter image response handling", () => {
it("Should correctly parse OpenRouter-style image responses", () => {
// Create a minimal ChatOpenAI instance to test the method
const model = new ChatOpenAI({
model: "test-model",
apiKey: "test-key",
});

// Access the completions object to test the method
const { completions } = model as any;

// Mock message with images from OpenRouter
const mockMessage = {
role: "assistant" as const,
content: "Here is your image of a cute cat:",
};

const mockRawResponse = {
id: "chatcmpl-12345",
object: "chat.completion",
created: 1234567890,
model: "google/gemini-2.5-flash-image-preview",
choices: [
{
index: 0,
message: {
...mockMessage,
// OpenRouter includes images in a separate array
images: [
{
type: "image_url",
image_url: {
url: "data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mP8/5+hHgAHggJ/PchI7wAAAABJRU5ErkJggg==",
},
},
],
},
finish_reason: "stop",
},
],
usage: {
prompt_tokens: 10,
completion_tokens: 20,
total_tokens: 30,
},
};

// Test the _convertCompletionsMessageToBaseMessage method
const result = completions._convertCompletionsMessageToBaseMessage(
mockMessage,
mockRawResponse
);

// Verify the result is an AIMessage with structured content
expect(result.constructor.name).toBe("AIMessage");
expect(result.content).toEqual([
{
source_type: "text",
type: "text",
text: "Here is your image of a cute cat:",
},
{
source_type: "url",
type: "image",
url: "data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mP8/5+hHgAHggJ/PchI7wAAAABJRU5ErkJggg==",
},
]);
});

it("Should handle OpenRouter responses with multiple images", () => {
const model = new ChatOpenAI({
model: "test-model",
apiKey: "test-key",
});

const { completions } = model as any;

const mockMessage = {
role: "assistant" as const,
content: "Here are multiple images:",
};

const mockRawResponse = {
id: "chatcmpl-12345",
object: "chat.completion",
created: 1234567890,
model: "google/gemini-2.5-flash-image-preview",
choices: [
{
index: 0,
message: {
...mockMessage,
images: [
{
type: "image_url",
image_url: {
url: "data:image/png;base64,image1",
},
},
{
type: "image_url",
image_url: {
url: "data:image/png;base64,image2",
},
},
],
},
finish_reason: "stop",
},
],
usage: {
prompt_tokens: 10,
completion_tokens: 20,
total_tokens: 30,
},
};

const result = completions._convertCompletionsMessageToBaseMessage(
mockMessage,
mockRawResponse
);

// Verify the response contains structured content with multiple image_urls
expect(result.content).toEqual([
{
source_type: "text",
type: "text",
text: "Here are multiple images:",
},
{
source_type: "url",
type: "image",
url: "data:image/png;base64,image1",
},
{
source_type: "url",
type: "image",
url: "data:image/png;base64,image2",
},
]);
});
});

test("can be constructed with reasoningEffort", async () => {
const model = new ChatOpenAI({
model: "gpt-4o-2024-08-06",
41 changes: 41 additions & 0 deletions libs/langchain-openai/src/utils/output.ts
@@ -0,0 +1,41 @@
import {
  StandardImageBlock,
  StandardTextBlock,
} from "@langchain/core/messages";

/**
 * Handle multimodal response content.
 *
 * @param content The text content of the message.
 * @param messages The raw assistant message from the completions response,
 *   which may carry a provider-specific `images` array.
 * @returns Structured content blocks when images are present, otherwise the
 *   original string content.
 */
export function handleMultiModalOutput(
  content: string,
  messages: unknown
): (StandardImageBlock | StandardTextBlock)[] | string {
  /**
   * Handle OpenRouter image responses
   * @see https://openrouter.ai/docs/features/multimodal/image-generation#api-usage
   */
  if (
    messages &&
    typeof messages === "object" &&
    "images" in messages &&
    Array.isArray(messages.images)
  ) {
    const images = messages.images
      .filter((image) => typeof image?.image_url?.url === "string")
      .map(
        (image) =>
          ({
            type: "image",
            url: image.image_url.url as string,
            source_type: "url",
          } as const)
      );
    return [{ type: "text", text: content, source_type: "text" }, ...images];
  }

  return content;
}
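The helper's behavior in isolation, as a quick sketch built from the shapes exercised in the tests above:

import { handleMultiModalOutput } from "./output.js";

// An assistant message carrying an OpenRouter-style `images` array.
const message = {
  role: "assistant",
  content: "Here is your image:",
  images: [
    { type: "image_url", image_url: { url: "data:image/png;base64,image1" } },
  ],
};

// With images present, the plain string is promoted to structured blocks:
// [
//   { type: "text", text: "Here is your image:", source_type: "text" },
//   { type: "image", url: "data:image/png;base64,image1", source_type: "url" },
// ]
console.log(handleMultiModalOutput(message.content, message));

// Without an `images` array, the original string passes through unchanged.
console.log(handleMultiModalOutput("No images here", { role: "assistant" }));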