theopenco · steebchen · May 5, 2026 · Apr 7, 2026 · Apr 7, 2026 · Apr 7, 2026
diff --git a/apps/gateway/src/responses.e2e.ts b/apps/gateway/src/responses.e2e.ts
@@ -0,0 +1,262 @@
+import "dotenv/config";
+import { beforeAll, beforeEach, describe, expect, test } from "vitest";
+
+import { app } from "@/app.js";
+import {
+	beforeAllHook,
+	beforeEachHook,
+	generateTestRequestId,
+	getConcurrentTestOptions,
+	getTestOptions,
+	logMode,
+	testModels,
+	toolCallModels,
+	validateLogByRequestId,
+} from "@/chat-helpers.e2e.js";
+
+// Pick one model per provider to keep CI cost manageable while still
+// validating the Responses API conversion layer across every provider.
+function oneModelPerProvider<T extends { model: string }>(list: T[]): T[] {
+	const seen = new Set<string>();
+	const out: T[] = [];
+	for (const item of list) {
+		const provider = item.model.split("/")[0];
+		if (seen.has(provider)) {
+			continue;
+		}
+		seen.add(provider);
+		out.push(item);
+	}
+	return out;
+}
+
+const responsesTestModels = oneModelPerProvider(testModels);
+const responsesToolCallModels = oneModelPerProvider(toolCallModels);
+
+interface ResponsesOutputItem {
+	type: string;
+	role?: string;
+	content?: { type: string; text?: string }[];
+	call_id?: string;
+	name?: string;
+	arguments?: string;
+}
+
+function getOutputText(json: { output?: ResponsesOutputItem[] }): string {
+	const items = json.output ?? [];
+	const parts: string[] = [];
+	for (const item of items) {
+		if (item.type === "message" && Array.isArray(item.content)) {
+			for (const c of item.content) {
+				if (c.type === "output_text" && typeof c.text === "string") {
+					parts.push(c.text);
+				}
+			}
+		}
+	}
+	return parts.join("");
+}
+
+function getFunctionCall(json: {
+	output?: ResponsesOutputItem[];
+}): ResponsesOutputItem | undefined {
+	return (json.output ?? []).find((i) => i.type === "function_call");
+}
+
+async function postResponses(body: unknown, requestId: string) {
+	return await app.request("/v1/responses", {
+		method: "POST",
+		headers: {
+			"Content-Type": "application/json",
+			"x-request-id": requestId,
+			"x-no-fallback": "true",
+			Authorization: `Bearer real-token`,
+		},
+		body: JSON.stringify(body),
+	});
+}
+
+describe("e2e", getConcurrentTestOptions(), () => {
+	beforeAll(beforeAllHook);
+
+	beforeEach(beforeEachHook);
+
+	test("empty", () => {
+		expect(true).toBe(true);
+	});
+
+	test.each(responsesTestModels)(
+		"responses single-turn $model",
+		getTestOptions(),
+		async ({ model }) => {
+			const requestId = generateTestRequestId();
+			const res = await postResponses(
+				{
+					model,
+					input: "Say hello in one short sentence.",
+				},
+				requestId,
+			);
+
+			const json = await res.json();
+			if (logMode) {
+				console.log(
+					"responses single-turn response:",
+					JSON.stringify(json, null, 2),
+				);
+			}
+
+			expect(res.status).toBe(200);
+			expect(json).toHaveProperty("id");
+			expect(typeof json.id).toBe("string");
+			expect(json.id.startsWith("resp_")).toBe(true);
+			expect(Array.isArray(json.output)).toBe(true);
+
+			const text = getOutputText(json);
+			expect(text.length).toBeGreaterThan(0);
+
+			expect(json).toHaveProperty("usage");
+			expect(typeof json.usage.input_tokens).toBe("number");
+			expect(typeof json.usage.output_tokens).toBe("number");
+			expect(json.usage.input_tokens).toBeGreaterThan(0);
+			expect(json.usage.output_tokens).toBeGreaterThan(0);
+
+			await validateLogByRequestId(requestId);
+		},
+	);
+
+	test.each(responsesTestModels)(
+		"responses multi-turn $model",
+		getTestOptions(),
+		async ({ model }) => {
+			const firstRequestId = generateTestRequestId();
+			const firstRes = await postResponses(
+				{
+					model,
+					input:
+						"My name is Ada. Please remember it. Reply with a brief acknowledgement.",
+				},
+				firstRequestId,
+			);
+			const firstJson = await firstRes.json();
+			if (logMode) {
+				console.log(
+					"responses multi-turn first:",
+					JSON.stringify(firstJson, null, 2),
+				);
+			}
+			expect(firstRes.status).toBe(200);
+			expect(typeof firstJson.id).toBe("string");
+
+			const secondRequestId = generateTestRequestId();
+			const secondRes = await postResponses(
+				{
+					model,
+					input: "What is my name? Reply with just the name.",
+					previous_response_id: firstJson.id,
+				},
+				secondRequestId,
+			);
+			const secondJson = await secondRes.json();
+			if (logMode) {
+				console.log(
+					"responses multi-turn second:",
+					JSON.stringify(secondJson, null, 2),
+				);
+			}
+			expect(secondRes.status).toBe(200);
+			const text = getOutputText(secondJson);
+			expect(text.toLowerCase()).toContain("ada");
+		},
+	);
+
+	test.each(responsesToolCallModels)(
+		"responses tool calls $model",
+		getTestOptions(),
+		async ({ model }) => {
+			const tools = [
+				{
+					type: "function",
+					name: "get_weather",
+					description: "Get the current weather for a given city",
+					parameters: {
+						type: "object",
+						properties: {
+							city: {
+								type: "string",
+								description: "The city name to get weather for",
+							},
+						},
+						required: ["city"],
+					},
+				},
+			];
+
+			const firstRequestId = generateTestRequestId();
+			const firstRes = await postResponses(
+				{
+					model,
+					input: [
+						{
+							role: "user",
+							content: "What's the weather like in San Francisco?",
+						},
+					],
+					tools,
+					tool_choice: "required",
+				},
+				firstRequestId,
+			);
+			const firstJson = await firstRes.json();
+			if (logMode) {
+				console.log(
+					"responses tool calls first:",
+					JSON.stringify(firstJson, null, 2),
+				);
+			}
+
+			expect(firstRes.status).toBe(200);
+			const fnCall = getFunctionCall(firstJson);
+			expect(fnCall).toBeDefined();
+			expect(fnCall?.name).toBe("get_weather");
+			expect(typeof fnCall?.call_id).toBe("string");
+			expect(typeof fnCall?.arguments).toBe("string");
+			const parsedArgs = JSON.parse(fnCall?.arguments ?? "{}");
+			expect(typeof parsedArgs.city).toBe("string");
+			expect(parsedArgs.city.toLowerCase()).toContain("san francisco");
+
+			const secondRequestId = generateTestRequestId();
+			const secondRes = await postResponses(
+				{
+					model,
+					previous_response_id: firstJson.id,
+					input: [
+						{
+							type: "function_call_output",
+							call_id: fnCall?.call_id,
+							output: "72F and sunny",
-			expect(firstRes.status).toBe(200);
-			const fnCall = getFunctionCall(firstJson);
-			expect(fnCall).toBeDefined();
-			expect(fnCall?.name).toBe("get_weather");
-			expect(typeof fnCall?.call_id).toBe("string");
-			expect(typeof fnCall?.arguments).toBe("string");
-			const parsedArgs = JSON.parse(fnCall?.arguments ?? "{}");
-			expect(typeof parsedArgs.city).toBe("string");
-			expect(parsedArgs.city.toLowerCase()).toContain("san francisco");
-
-			const secondRequestId = generateTestRequestId();
-			const secondRes = await postResponses(
-				{
-					model,
-					previous_response_id: firstJson.id,
-					input: [
-						{
-							type: "function_call_output",
-							call_id: fnCall?.call_id,
-							output: "72F and sunny",
+			expect(firstRes.status).toBe(200);
+			expect(typeof firstJson.id).toBe("string");
+			expect(firstJson.id.startsWith("resp_")).toBe(true);
+			const fnCall = getFunctionCall(firstJson);
+			expect(fnCall).toBeDefined();
+			expect(fnCall?.name).toBe("get_weather");
+			expect(typeof fnCall?.call_id).toBe("string");
+			expect(fnCall?.call_id).toBeTruthy();
+			expect(typeof fnCall?.arguments).toBe("string");
+			const parsedArgs = JSON.parse(fnCall?.arguments ?? "{}");
+			expect(typeof parsedArgs.city).toBe("string");
+			expect(parsedArgs.city.toLowerCase()).toContain("san francisco");
+
+			const secondRequestId = generateTestRequestId();
+			const secondRes = await postResponses(
+				{
+					model,
+					previous_response_id: firstJson.id,
+					input: [
+						{
+							type: "function_call_output",
+							call_id: fnCall?.call_id,
+							output: "72F and sunny",
-			expect(firstRes.status).toBe(200);
-			const fnCall = getFunctionCall(firstJson);
-			expect(fnCall).toBeDefined();
-			expect(fnCall?.name).toBe("get_weather");
-			expect(typeof fnCall?.call_id).toBe("string");
-			expect(typeof fnCall?.arguments).toBe("string");
-			const parsedArgs = JSON.parse(fnCall?.arguments ?? "{}");
-			expect(typeof parsedArgs.city).toBe("string");
-			expect(parsedArgs.city.toLowerCase()).toContain("san francisco");
-
-			const secondRequestId = generateTestRequestId();
-			const secondRes = await postResponses(
-				{
-					model,
-					previous_response_id: firstJson.id,
-					input: [
-						{
-							type: "function_call_output",
-							call_id: fnCall?.call_id,
-							output: "72F and sunny",
+			expect(firstRes.status).toBe(200);
+			expect(typeof firstJson.id).toBe("string");
+			expect(firstJson.id.startsWith("resp_")).toBe(true);
+			const fnCall = getFunctionCall(firstJson);
+			expect(fnCall).toBeDefined();
+			expect(fnCall?.name).toBe("get_weather");
+			expect(typeof fnCall?.call_id).toBe("string");
+			expect(fnCall?.call_id).toBeTruthy();
+			expect(typeof fnCall?.arguments).toBe("string");
+			const parsedArgs = JSON.parse(fnCall?.arguments ?? "{}");
+			expect(typeof parsedArgs.city).toBe("string");
+			expect(parsedArgs.city.toLowerCase()).toContain("san francisco");
+
+			const secondRequestId = generateTestRequestId();
+			const secondRes = await postResponses(
+				{
+					model,
+					previous_response_id: firstJson.id,
+					input: [
+						{
+							type: "function_call_output",
+							call_id: fnCall?.call_id,
+							output: "72F and sunny",
+						},
+					],
+					tools,
+				},
+				secondRequestId,
+			);
+			const secondJson = await secondRes.json();
+			if (logMode) {
+				console.log(
+					"responses tool calls second:",
+					JSON.stringify(secondJson, null, 2),
+				);
+			}
+
+			expect(secondRes.status).toBe(200);
+			const finalText = getOutputText(secondJson).toLowerCase();
+			expect(finalText.length).toBeGreaterThan(0);
+			expect(
+				finalText.includes("sunny") ||
+					finalText.includes("72") ||
+					finalText.includes("weather"),
+			).toBe(true);
+		},
+	);
+});