theopenco · steebchen · Apr 7, 2026 · Apr 7, 2026 · Apr 7, 2026 · Apr 8, 2026
diff --git a/apps/gateway/src/chat/chat.ts b/apps/gateway/src/chat/chat.ts
@@ -364,9 +364,9 @@ function isContentFilterProvider(providerId: string): boolean {
 
 function getContentFilterRoutingDecision(
 	availableModelProviders: ProviderModelMapping[],
-	contentFilterMatched: boolean,
+	shouldAvoidContentFilterProviders: boolean,
 ): ContentFilterRoutingDecision {
-	if (!contentFilterMatched) {
+	if (!shouldAvoidContentFilterProviders) {
 		return {
 			candidates: availableModelProviders,
 			excludedProviders: [],
@@ -408,11 +408,12 @@ function getContentFilterRoutingDecision(
 function addContentFilterRoutingMetadata(
 	routingMetadata: RoutingMetadata,
 	contentFilterMatched: boolean,
+	contentFilterUnavailable: boolean,
 	excludedProviders: ProviderModelMapping[],
 	modelId: string | undefined,
 	metricsMap: Map<string, ProviderMetrics>,
 ): RoutingMetadata {
-	if (!contentFilterMatched) {
+	if (!contentFilterMatched && !contentFilterUnavailable) {
 		return routingMetadata;
 	}
 
@@ -438,15 +439,18 @@ function addContentFilterRoutingMetadata(
 							throughput: metrics?.throughput ?? 0,
 							price: getProviderSelectionPrice(provider),
 							contentFilterProvider: true,
-							excludedByContentFilter: true,
+							...(contentFilterMatched
+								? { excludedByContentFilter: true }
+								: { excludedByModerationFailure: true }),
 						};
 					}),
 					...routingMetadata.providerScores,
 				];
 
 	return {
 		...routingMetadata,
-		contentFilterMatched: true,
+		...(contentFilterMatched ? { contentFilterMatched: true } : {}),
+		...(contentFilterUnavailable ? { contentFilterUnavailable: true } : {}),
 		contentFilterRerouted: contentFilterExcludedProviders.length > 0,
 		contentFilterExcludedProviders:
 			contentFilterExcludedProviders.length > 0
@@ -1899,8 +1903,11 @@ chat.openapi(completions, async (c) => {
 	const contentFilterMatched =
 		keywordContentFilterMatch !== null ||
 		openAIContentFilterResult?.flagged === true;
-	const shouldRerouteContentFilter =
-		contentFilterMode === "enabled" && contentFilterMatched;
+	const contentFilterUnavailable =
+		openAIContentFilterResult?.unavailable === true;
+	const shouldAvoidContentFilterProviders =
+		contentFilterMode === "enabled" &&
+		(contentFilterMatched || contentFilterUnavailable);
 	let contentFilterRoutingExcludedProviders: ProviderModelMapping[] = [];
 	let contentFilterRoutingApplied = false;
 
@@ -2311,7 +2318,7 @@ chat.openapi(completions, async (c) => {
 
 			const contentFilterRoutingDecision = getContentFilterRoutingDecision(
 				availableModelProviders,
-				shouldRerouteContentFilter,
+				shouldAvoidContentFilterProviders,
 			);
 			const contentFilterPreferredProviders =
 				contentFilterRoutingDecision.candidates;
@@ -2382,6 +2389,7 @@ chat.openapi(completions, async (c) => {
 							...(noFallback ? { noFallback: true } : {}),
 						},
 						contentFilterMatched,
+						contentFilterUnavailable,
 						contentFilterRoutingExcludedProviders,
 						modelWithPricing.id,
 						metricsMap,
@@ -2569,6 +2577,7 @@ chat.openapi(completions, async (c) => {
 				...(noFallback ? { noFallback: true } : {}),
 			},
 			contentFilterMatched,
+			contentFilterUnavailable,
 			contentFilterRoutingExcludedProviders,
 			baseModelId,
 			metricsMap,
@@ -2868,6 +2877,158 @@ chat.openapi(completions, async (c) => {
 		);
 	}
 
+	if (!usedToken) {
+		throw new HTTPException(500, {
+			message: `No token`,
+		});
+	}
+
+	usedApiKeyHash = getApiKeyFingerprint(usedToken);
+	routingMetadata = withUsedApiKeyHash(routingMetadata, usedApiKeyHash);
+
+	const contentFilterBlocked =
+		contentFilterMode === "enabled" &&
+		contentFilterMatched &&
+		!contentFilterRoutingApplied;
+	const contentFilterSensitiveProviderBlocked =
+		contentFilterMode === "enabled" &&
+		contentFilterUnavailable &&
+		isContentFilterProvider(usedProvider);
+
+	// Preserve monitor tagging, and also tag successful reroutes triggered by a
+	// gateway content-filter match so the decision remains visible in logs.
+	const shouldTagContentFilter =
+		(contentFilterMode === "monitor" && contentFilterMatched) ||
+		contentFilterRoutingApplied;
+	const gatewayContentFilterResponse = openAIContentFilterResult?.responses
+		.length
+		? openAIContentFilterResult.responses
+		: null;
+	const insertLog = (
+		logData: Parameters<typeof _insertLog>[0],
+		options?: Parameters<typeof _insertLog>[1],
+	) =>
+		_insertLog(
+			{
+				...logData,
+				internalContentFilter: shouldTagContentFilter
+					? true
+					: logData.internalContentFilter,
+				gatewayContentFilterResponse:
+					logData.gatewayContentFilterResponse ?? gatewayContentFilterResponse,
+			},
+			options,
+		);
+
+	if (contentFilterSensitiveProviderBlocked) {
+		const moderationOutageMessage =
+			"OpenAI moderation is unavailable and no eligible provider without provider-side content filtering is available.";
+		const baseLogEntry = createLogEntry(
+			requestId,
+			project,
+			apiKey,
+			providerKey?.id,
+			usedModelFormatted,
+			usedModelMapping,
+			usedProvider,
+			initialRequestedModel,
+			requestedProvider,
+			messages,
+			temperature,
+			max_tokens,
+			top_p,
+			frequency_penalty,
+			presence_penalty,
+			reasoning_effort,
+			reasoning_max_tokens,
+			effort,
+			response_format,
+			tools,
+			tool_choice,
+			source,
+			customHeaders,
+			debugMode,
+			userAgent,
+			image_config,
+			routingMetadata,
+			rawBody,
+			null,
+			null,
+			null,
+			undefined,
+			undefined,
+		);
+
+		logger.warn(
+			"Blocking request because OpenAI moderation is unavailable and selected provider is content-filter-sensitive",
+			{
+				requestId,
+				organizationId: project.organizationId,
+				projectId: project.id,
+				apiKeyId: apiKey.id,
+				usedProvider,
+				usedModel,
+				requestedModel: initialRequestedModel,
+				routingMetadata,
+			},
+		);
+
+		try {
+			await insertLogEntry({
+				...baseLogEntry,
+				duration: 0,
+				timeToFirstToken: null,
+				timeToFirstReasoningToken: null,
+				responseSize: 0,
+				content: null,
+				reasoningContent: null,
+				finishReason: "upstream_error",
+				promptTokens: null,
+				completionTokens: null,
+				totalTokens: null,
+				reasoningTokens: null,
+				cachedTokens: null,
+				hasError: true,
+				streamed: !!stream,
+				canceled: false,
+				errorDetails: {
+					statusCode: 503,
+					statusText: "Service Unavailable",
+					responseText: moderationOutageMessage,
+				},
+				cachedInputCost: null,
+				requestCost: null,
+				webSearchCost: null,
+				imageInputTokens: null,
+				imageOutputTokens: null,
+				imageInputCost: null,
+				imageOutputCost: null,
+				estimatedCost: false,
+				discount: null,
+				dataStorageCost: "0",
+				cached: false,
+				toolResults: null,
+				unifiedFinishReason: "upstream_error",
+			});
+		} catch (error) {
+			logger.error(
+				"Failed to persist moderation outage block log",
+				{
+					requestId,
+					organizationId: project.organizationId,
+					projectId: project.id,
+					apiKeyId: apiKey.id,
+					usedProvider,
+				},
+				error as Error,
+			);
+		}
+
+		throw new HTTPException(503, {
+			message: moderationOutageMessage,
+		});
+	}
+
 	// Consume a rate-limit slot for the chosen provider (routing already filtered rate-limited ones)
 	{
 		const providerRateLimitResult = await checkProviderRateLimit(
@@ -2971,52 +3132,13 @@ chat.openapi(completions, async (c) => {
 		}
 	}
 
-	if (!usedToken) {
-		throw new HTTPException(500, {
-			message: `No token`,
-		});
-	}
-
-	usedApiKeyHash = getApiKeyFingerprint(usedToken);
-	routingMetadata = withUsedApiKeyHash(routingMetadata, usedApiKeyHash);
-
-	const contentFilterBlocked =
-		contentFilterMode === "enabled" &&
-		contentFilterMatched &&
-		!contentFilterRoutingApplied;
-
-	// Preserve monitor tagging, and also tag successful reroutes triggered by a
-	// gateway content-filter match so the decision remains visible in logs.
-	const shouldTagContentFilter =
-		(contentFilterMode === "monitor" && contentFilterMatched) ||
-		contentFilterRoutingApplied;
-	const gatewayContentFilterResponse = openAIContentFilterResult?.responses
-		.length
-		? openAIContentFilterResult.responses
-		: null;
-	const insertLog = (
-		logData: Parameters<typeof _insertLog>[0],
-		options?: Parameters<typeof _insertLog>[1],
-	) =>
-		_insertLog(
-			{
-				...logData,
-				internalContentFilter: shouldTagContentFilter
-					? true
-					: logData.internalContentFilter,
-				gatewayContentFilterResponse:
-					logData.gatewayContentFilterResponse ?? gatewayContentFilterResponse,
-			},
-			options,
-		);
-
 	if (contentFilterBlocked) {
 		const contentFilterResponseId = `chatcmpl-${Date.now()}`;
 		const contentFilterCreated = Math.floor(Date.now() / 1000);
 
 		// Log the filtered request
 		try {
-			await insertLog({
+			await insertLogEntry({
 				...createLogEntry(
 					requestId,
 					project,

diff --git a/apps/gateway/src/chat/tools/openai-content-filter.spec.ts b/apps/gateway/src/chat/tools/openai-content-filter.spec.ts
@@ -582,6 +582,7 @@ describe("checkOpenAIContentFilter", () => {
 
 		expect(result).toEqual({
 			flagged: false,
+			unavailable: true,
 			model: "omni-moderation-latest",
 			upstreamRequestId: null,
 			results: [],
@@ -631,6 +632,7 @@ describe("checkOpenAIContentFilter", () => {
 
 		expect(result).toEqual({
 			flagged: false,
+			unavailable: true,
 			model: "omni-moderation-latest",
 			upstreamRequestId: null,
 			results: [],
@@ -715,6 +717,7 @@ describe("checkOpenAIContentFilter", () => {
 
 		expect(result).toEqual({
 			flagged: false,
+			unavailable: true,
 			model: "omni-moderation-latest",
 			upstreamRequestId: null,
 			results: [],

diff --git a/apps/gateway/src/chat/tools/openai-content-filter.ts b/apps/gateway/src/chat/tools/openai-content-filter.ts
@@ -53,6 +53,7 @@ interface OpenAIModerationResult {
 
 export interface OpenAIContentFilterCheckResult {
 	flagged: boolean;
+	unavailable: boolean;
 	model: string;
 	upstreamRequestId: string | null;
 	results: OpenAIModerationResult[];
@@ -339,9 +340,11 @@ function buildModerationErrorDetails(error: unknown): Record<string, string> {
 
 function createFailedOpenAIContentFilterResult(
 	upstreamRequestId: string | null = null,
+	unavailable = true,
 ): OpenAIContentFilterCheckResult {
 	return {
 		flagged: false,
+		unavailable,
 		model: OPENAI_MODERATION_MODEL,
 		upstreamRequestId,
 		results: [],
@@ -446,6 +449,7 @@ async function runOpenAIContentFilterRequest(
 			flagged: (moderationResponse.results ?? []).some((result) =>
 				isOpenAIModerationResultFlagged(result),
 			),
+			unavailable: false,
 			model: moderationResponse.model ?? OPENAI_MODERATION_MODEL,
 			upstreamRequestId,
 			results: moderationResponse.results ?? [],
@@ -476,7 +480,7 @@ export async function checkOpenAIContentFilter(
 			results: [],
 		});
 
-		return createFailedOpenAIContentFilterResult();
+		return createFailedOpenAIContentFilterResult(null, false);
 	}
 
 	const signal = requestSignal
@@ -530,6 +534,7 @@ export async function checkOpenAIContentFilter(
 
 		return {
 			flagged,
+			unavailable: moderationResults.some((result) => !result.success),
 			model,
 			upstreamRequestId,
 			results,

diff --git a/apps/gateway/src/chat/tools/retry-with-fallback.ts b/apps/gateway/src/chat/tools/retry-with-fallback.ts
@@ -85,6 +85,7 @@ export function selectNextProvider(
 		score: number;
 		region?: string;
 		excludedByContentFilter?: boolean;
+		excludedByModerationFailure?: boolean;
 	}>,
 	failedProviders: Set<string>,
 	modelProviders: Array<{
@@ -95,7 +96,7 @@ export function selectNextProvider(
 ): { providerId: string; modelName: string; region?: string } | null {
 	const sorted = [...providerScores].sort((a, b) => a.score - b.score);
 	for (const score of sorted) {
-		if (score.excludedByContentFilter) {
+		if (score.excludedByContentFilter || score.excludedByModerationFailure) {
 			continue;
 		}