35 changes: 8 additions & 27 deletions apps/gateway/src/chat/chat.ts
@@ -3011,25 +3011,11 @@ chat.openapi(completions, async (c) => {
images,
} = parseProviderResponse(usedProvider, json, messages);

// Debug: Log images found in response
logger.debug("Gateway - parseProviderResponse extracted images", { images });
logger.debug("Gateway - Used provider", { usedProvider });
logger.debug("Gateway - Used model", { usedModel });

// Estimate tokens if not provided by the API
const { calculatedPromptTokens, calculatedCompletionTokens } = estimateTokens(
usedProvider,
messages,
content,
promptTokens,
completionTokens,
);

const costs = calculateCosts(
usedModel,
usedProvider,
calculatedPromptTokens,
calculatedCompletionTokens,
promptTokens,
completionTokens,
cachedTokens,
Comment on lines +3017 to 3019

⚠️ Potential issue

Ensure costs/response use tokens even when providers omit them.

When prompt/completion tokens are null, derive them once and pass consistent numbers into calculateCosts and transformResponseToOpenai.

Apply this diff to use safe values in the two calls:

   const costs = calculateCosts(
     usedModel,
     usedProvider,
-    promptTokens,
-    completionTokens,
+    safePromptTokens,
+    safeCompletionTokens,
     cachedTokens,
   const transformedResponse = transformResponseToOpenai(
     usedProvider,
     usedModel,
     json,
     content,
     reasoningContent,
     finishReason,
-    promptTokens,
-    completionTokens,
-    (promptTokens || 0) + (completionTokens || 0) + (reasoningTokens || 0),
+    safePromptTokens ?? 0,
+    safeCompletionTokens ?? 0,
+    (safePromptTokens ?? 0) + (safeCompletionTokens ?? 0) + (reasoningTokens || 0),

Add these helpers right before the calculateCosts call:

// Compute safe token values only if missing
let safePromptTokens = promptTokens ?? null;
let safeCompletionTokens = completionTokens ?? null;

if (safePromptTokens === null && messages?.length) {
  try {
    const chatMsgs: ChatMessage[] = messages.map((m) => ({
      role: m.role as "user" | "assistant" | "system" | undefined,
      content: typeof m.content === "string" ? m.content : JSON.stringify(m.content ?? ""),
      name: m.name,
    }));
    safePromptTokens = encodeChat(chatMsgs, DEFAULT_TOKENIZER_MODEL).length;
  } catch (e) {
    logger.error("Failed to encode messages (non-streaming)", e instanceof Error ? e : new Error(String(e)));
    safePromptTokens = estimateTokensFromContent(messages.map((m) => String(m.content ?? "")).join("\n"));
  }
}

if (safeCompletionTokens === null && content) {
  try {
    safeCompletionTokens = encode(content).length;
  } catch (e) {
    logger.error("Failed to encode completion (non-streaming)", e instanceof Error ? e : new Error(String(e)));
    safeCompletionTokens = estimateTokensFromContent(content);
  }
}

Also applies to: 3035-3038

🤖 Prompt for AI Agents
In apps/gateway/src/chat/chat.ts around lines 3017-3019 (and similarly
3035-3038), promptTokens/completionTokens can be null from providers so derive
safe values once and reuse them: add helpers just before the calculateCosts call
to set let safePromptTokens = promptTokens ?? null and let safeCompletionTokens
= completionTokens ?? null, then if safePromptTokens is null and messages exist
compute it by encoding messages via encodeChat with DEFAULT_TOKENIZER_MODEL
falling back to estimateTokensFromContent on error (logging via logger.error);
if safeCompletionTokens is null and content exists compute it via encode with
fallback to estimateTokensFromContent (also logging on error). Finally replace
direct promptTokens/completionTokens uses in calculateCosts and
transformResponseToOpenai with safePromptTokens and safeCompletionTokens so both
functions receive consistent, non-null token counts.
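
As a rough standalone sketch of the derivation described above (not the gateway's actual helpers): it assumes the gpt-tokenizer package, uses "gpt-4o" in place of DEFAULT_TOKENIZER_MODEL, and estimateTokensFromContent is a hypothetical characters/4 stand-in for the gateway's fallback.

```ts
import { encode, encodeChat } from "gpt-tokenizer";

// Hypothetical stand-in for the gateway's fallback: roughly 4 characters per token.
function estimateTokensFromContent(text: string): number {
  return Math.round(text.length / 4);
}

type Msg = { role?: "user" | "assistant" | "system"; content: string; name?: string };

// Fill in prompt tokens only when the provider omitted them.
function derivePromptTokens(promptTokens: number | null, messages: Msg[]): number {
  if (promptTokens !== null) return promptTokens;
  try {
    // encodeChat counts tokens for the whole chat, including per-message overhead.
    return encodeChat(messages, "gpt-4o").length;
  } catch {
    return estimateTokensFromContent(messages.map((m) => m.content).join("\n"));
  }
}

// Fill in completion tokens the same way, using plain encode() on the text.
function deriveCompletionTokens(completionTokens: number | null, content: string): number {
  if (completionTokens !== null) return completionTokens;
  try {
    return encode(content).length;
  } catch {
    return estimateTokensFromContent(content);
  }
}
```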

{
prompt: messages.map((m) => m.content).join("\n"),
@@ -3046,11 +3032,9 @@ chat.openapi(completions, async (c) => {
content,
reasoningContent,
finishReason,
calculatedPromptTokens,
calculatedCompletionTokens,
(calculatedPromptTokens || 0) +
(calculatedCompletionTokens || 0) +
(reasoningTokens || 0),
promptTokens,
completionTokens,
(promptTokens || 0) + (completionTokens || 0) + (reasoningTokens || 0),
reasoningTokens,
cachedTokens,
toolResults,
@@ -3097,13 +3081,10 @@ chat.openapi(completions, async (c) => {
content: content,
reasoningContent: reasoningContent,
finishReason: finishReason,
promptTokens: calculatedPromptTokens?.toString() || null,
completionTokens: calculatedCompletionTokens?.toString() || null,
promptTokens: promptTokens?.toString() || null,
completionTokens: completionTokens?.toString() || null,
totalTokens:
totalTokens ||
(
(calculatedPromptTokens || 0) + (calculatedCompletionTokens || 0)
).toString(),
totalTokens || ((promptTokens || 0) + (completionTokens || 0)).toString(),
reasoningTokens: reasoningTokens,
Comment on lines +3084 to 3088

⚠️ Potential issue

Fix totalTokens type/consistency and include reasoning tokens in the fallback.

Currently totalTokens may be stored as a number (not a string), and the fallback sum ignores reasoning tokens; align it with the other token fields.

Apply this diff:

-    promptTokens: promptTokens?.toString() || null,
-    completionTokens: completionTokens?.toString() || null,
-    totalTokens:
-      totalTokens || ((promptTokens || 0) + (completionTokens || 0)).toString(),
+    promptTokens: (safePromptTokens ?? promptTokens)?.toString() || null,
+    completionTokens: (safeCompletionTokens ?? completionTokens)?.toString() || null,
+    totalTokens: (
+      (totalTokens ?? ((safePromptTokens ?? promptTokens ?? 0) + (safeCompletionTokens ?? completionTokens ?? 0) + (reasoningTokens ?? 0)))
+    ).toString(),

Committable suggestion skipped: line range outside the PR's diff.

🤖 Prompt for AI Agents
In apps/gateway/src/chat/chat.ts around lines 3084 to 3088, totalTokens can be a
number and currently ignores reasoningTokens when falling back; change
totalTokens to follow the same string-or-null pattern as
promptTokens/completionTokens by ensuring it is computed and stored as a string
(or null) and include reasoningTokens in the fallback sum (i.e., sum
promptTokens, completionTokens and reasoningTokens treating missing values as 0,
then call toString() or set null appropriately) so types and formatting match
the other token fields.
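
A minimal sketch of the string-or-null convention the suggestion describes, with reasoning tokens folded into the fallback sum (names are illustrative, not the gateway's):

```ts
// Illustrative only: totalTokens stored as a string, like the other token fields,
// with reasoning tokens counted when the provider omits a total.
function formatTotalTokens(
  totalTokens: number | null,
  promptTokens: number | null,
  completionTokens: number | null,
  reasoningTokens: number | null,
): string {
  const fallback =
    (promptTokens ?? 0) + (completionTokens ?? 0) + (reasoningTokens ?? 0);
  return (totalTokens ?? fallback).toString();
}
```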

cachedTokens: cachedTokens?.toString() || null,
hasError: false,
74 changes: 35 additions & 39 deletions apps/gateway/src/chat/tools/estimate-tokens.ts
@@ -19,47 +19,43 @@ export function estimateTokens(
let calculatedPromptTokens = promptTokens;
let calculatedCompletionTokens = completionTokens;

// Always estimate missing tokens for any provider
if (!promptTokens || !completionTokens) {
// Estimate prompt tokens using encodeChat for better accuracy
if (!promptTokens && messages && messages.length > 0) {
try {
// Convert messages to the format expected by gpt-tokenizer
const chatMessages: ChatMessage[] = messages.map((m) => ({
role: m.role,
content:
typeof m.content === "string"
? m.content
: JSON.stringify(m.content),
name: m.name,
}));
calculatedPromptTokens = encodeChat(
chatMessages,
DEFAULT_TOKENIZER_MODEL,
).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode chat messages in estimate tokens",
error instanceof Error ? error : new Error(String(error)),
);
calculatedPromptTokens =
messages.reduce((acc, m) => acc + (m.content?.length || 0), 0) / 4;
}
// Estimate prompt tokens only if not provided by the API
if (!promptTokens && messages && messages.length > 0) {
try {
// Convert messages to the format expected by gpt-tokenizer
const chatMessages: ChatMessage[] = messages.map((m) => ({
role: m.role,
content:
typeof m.content === "string" ? m.content : JSON.stringify(m.content),
name: m.name,
}));
calculatedPromptTokens = encodeChat(
chatMessages,
DEFAULT_TOKENIZER_MODEL,
).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode chat messages in estimate tokens",
error instanceof Error ? error : new Error(String(error)),
);
calculatedPromptTokens = Math.round(
messages.reduce((acc, m) => acc + (m.content?.length || 0), 0) / 4,
);
}
}

// Estimate completion tokens using encode for better accuracy
if (!completionTokens && content) {
try {
calculatedCompletionTokens = encode(JSON.stringify(content)).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode completion text",
error instanceof Error ? error : new Error(String(error)),
);
calculatedCompletionTokens = content.length / 4;
}
// Estimate completion tokens only if not provided by the API
if (!completionTokens && content) {
try {
calculatedCompletionTokens = encode(JSON.stringify(content)).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode completion text",
error instanceof Error ? error : new Error(String(error)),
);
calculatedCompletionTokens = Math.round(content.length / 4);
}
}
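
A hedged usage sketch of the revised estimator, assuming the call shape seen in chat.ts above (provider, messages, content, promptTokens, completionTokens), that null is accepted for missing counts, and a sibling import path:

```ts
import { estimateTokens } from "./estimate-tokens"; // assumed relative path

// Provider returned no usage block, so both counts are estimated.
const { calculatedPromptTokens, calculatedCompletionTokens } = estimateTokens(
  "openai",                                    // usedProvider
  [{ role: "user", content: "Hello there!" }], // messages
  "Hi! How can I help you today?",             // completion content
  null,                                        // promptTokens missing from the API
  null,                                        // completionTokens missing from the API
);

// If the tokenizer throws, the characters/4 fallback now returns whole numbers:
// e.g. 103 characters -> Math.round(103 / 4) = 26 rather than 25.75.
```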

2 changes: 1 addition & 1 deletion packages/models/src/process-image-url.ts
@@ -28,7 +28,7 @@ export async function processImageUrl(
const base64Data = isBase64 ? data : btoa(data);

// Validate size (estimate: base64 adds ~33% overhead)
const estimatedSize = (base64Data.length * 3) / 4;
const estimatedSize = Math.round((base64Data.length * 3) / 4);

⚠️ Potential issue

Compute the base64 byte size precisely (handle padding and whitespace).

Math.round(len * 3 / 4) can over- or under-estimate the decoded size and cause false 20MB limit rejections. Account for '=' padding and possible whitespace without decoding the payload.

Apply this diff:

-    const estimatedSize = Math.round((base64Data.length * 3) / 4);
+    const sanitized = base64Data.replace(/\s/g, "");
+    const padding = sanitized.endsWith("==") ? 2 : sanitized.endsWith("=") ? 1 : 0;
+    const estimatedSize = Math.floor((sanitized.length * 3) / 4) - padding;
📝 Committable suggestion

‼️ IMPORTANT
Carefully review the code before committing. Ensure that it accurately replaces the highlighted code, contains no missing lines, and has no issues with indentation. Thoroughly test & benchmark the code to ensure it meets the requirements.

Suggested change
const estimatedSize = Math.round((base64Data.length * 3) / 4);
const sanitized = base64Data.replace(/\s/g, "");
const padding = sanitized.endsWith("==") ? 2 : sanitized.endsWith("=") ? 1 : 0;
const estimatedSize = Math.floor((sanitized.length * 3) / 4) - padding;
🤖 Prompt for AI Agents
In packages/models/src/process-image-url.ts around line 31, the current size
estimate uses Math.round(base64.length*3/4) which miscounts when padding or
whitespace are present; instead strip any data URL prefix and all whitespace
from the base64 string, count trailing '=' padding characters (0,1,2) and
compute exact byte length as (cleanLen * 3) / 4 - paddingCount (use integer
math, no decoding), then use that value to enforce the 20MB limit; update the
code to perform these steps so padding/whitespace are handled precisely.
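
A quick worked check of the padded-length formula from the suggestion (helper name is hypothetical):

```ts
// Exact decoded size of a base64 payload without decoding it:
// every 4 characters encode 3 bytes, minus one byte per trailing '='.
const exactBase64Bytes = (b64: string): number => {
  const s = b64.replace(/\s/g, "");
  const padding = s.endsWith("==") ? 2 : s.endsWith("=") ? 1 : 0;
  return Math.floor((s.length * 3) / 4) - padding;
};

exactBase64Bytes("Zm9v"); // "foo" -> 4 * 3 / 4 - 0 = 3 bytes
exactBase64Bytes("Zm8="); // "fo"  -> 4 * 3 / 4 - 1 = 2 bytes
exactBase64Bytes("Zg=="); // "f"   -> 4 * 3 / 4 - 2 = 1 byte
```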

if (estimatedSize > 20 * 1024 * 1024) {
logger.warn("Data URL image size exceeds limit", { estimatedSize });
throw new Error("Image size exceeds 20MB limit");