73 changes: 34 additions & 39 deletions apps/gateway/src/chat/tools/estimate-tokens.ts
@@ -19,47 +19,42 @@ export function estimateTokens(
let calculatedPromptTokens = promptTokens;
let calculatedCompletionTokens = completionTokens;

// Always estimate missing tokens for any provider
if (!promptTokens || !completionTokens) {
// Estimate prompt tokens using encodeChat for better accuracy
if (!promptTokens && messages && messages.length > 0) {
try {
// Convert messages to the format expected by gpt-tokenizer
const chatMessages: ChatMessage[] = messages.map((m) => ({
role: m.role,
content:
typeof m.content === "string"
? m.content
: JSON.stringify(m.content),
name: m.name,
}));
calculatedPromptTokens = encodeChat(
chatMessages,
DEFAULT_TOKENIZER_MODEL,
).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode chat messages in estimate tokens",
error instanceof Error ? error : new Error(String(error)),
);
calculatedPromptTokens =
messages.reduce((acc, m) => acc + (m.content?.length || 0), 0) / 4;
}
// Estimate prompt tokens only if not provided by the API
if (!promptTokens && messages && messages.length > 0) {
try {
// Convert messages to the format expected by gpt-tokenizer
const chatMessages: ChatMessage[] = messages.map((m) => ({
role: m.role,
content:
typeof m.content === "string" ? m.content : JSON.stringify(m.content),
name: m.name,
}));
calculatedPromptTokens = encodeChat(
chatMessages,
DEFAULT_TOKENIZER_MODEL,
).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode chat messages in estimate tokens",
error instanceof Error ? error : new Error(String(error)),
);
calculatedPromptTokens =
messages.reduce((acc, m) => acc + (m.content?.length || 0), 0) / 4;
}
}
Comment on lines 22 to 46
Contributor

⚠️ Potential issue

Guard for “missing” must not treat 0 as missing; fix fallback undercount and return integers

  • Line 23: Using !promptTokens re-estimates when the API legitimately returns 0. Use a null/undefined check (see the sketch after this list).
  • Lines 42-44: Fallback undercounts when content is non-string (objects/arrays). Mirror the encoding path and stringify per‑message before length. Also round to an integer token count.
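
A tiny standalone illustration of the first bullet (a sketch only, not part of the suggested change):

// Illustrative only: how each guard treats a prompt token count of 0 reported by the API.
function wouldReestimate(promptTokens: number | undefined) {
  return {
    falsyGuard: !promptTokens,       // true for 0  -> re-estimates a legitimate zero
    nullGuard: promptTokens == null, // false for 0 -> keeps the reported zero
  };
}

console.log(wouldReestimate(0));         // { falsyGuard: true, nullGuard: false }
console.log(wouldReestimate(undefined)); // { falsyGuard: true, nullGuard: true }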

Apply this diff:

- // Estimate prompt tokens only if not provided by the API
- if (!promptTokens && messages && messages.length > 0) {
+ // Estimate prompt tokens only if not provided by the API
+ if (promptTokens == null && messages?.length > 0) {
   try {
@@
-      calculatedPromptTokens =
-        messages.reduce((acc, m) => acc + (m.content?.length || 0), 0) / 4;
+      calculatedPromptTokens = Math.round(
+        messages.reduce((acc, m) => {
+          const text =
+            typeof m.content === "string" ? m.content : JSON.stringify(m.content);
+          return acc + text.length;
+        }, 0) / 4
+      );
   }
 }

Additionally: the parameter messages: any[] violates the project guideline to avoid any. Consider typing it (e.g., a ChatMessageLike with content: unknown) and narrowing in place.
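
A rough sketch of that typing (ChatMessageLike follows the name suggested above; contentToText is a hypothetical helper, and the role union is an assumption to be aligned with the gateway's own message type):

// Sketch only: a minimal message shape to replace messages: any[].
interface ChatMessageLike {
  role: "system" | "user" | "assistant"; // assumption; match the real role union used in this codebase
  content: unknown;
  name?: string;
}

// Narrow content in place: strings pass through, everything else is stringified,
// mirroring the mapping already used for the encodeChat path.
function contentToText(content: unknown): string {
  return typeof content === "string" ? content : JSON.stringify(content);
}

// estimateTokens(..., messages: ChatMessageLike[], ...) could then build the tokenizer input as:
//   messages.map((m) => ({ role: m.role, content: contentToText(m.content), name: m.name }))
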

📝 Committable suggestion

‼️ IMPORTANT
Carefully review the code before committing. Ensure that it accurately replaces the highlighted code, contains no missing lines, and has no issues with indentation. Thoroughly test & benchmark the code to ensure it meets the requirements.

Suggested change
// Estimate prompt tokens only if not provided by the API
if (!promptTokens && messages && messages.length > 0) {
try {
// Convert messages to the format expected by gpt-tokenizer
const chatMessages: ChatMessage[] = messages.map((m) => ({
role: m.role,
content:
typeof m.content === "string" ? m.content : JSON.stringify(m.content),
name: m.name,
}));
calculatedPromptTokens = encodeChat(
chatMessages,
DEFAULT_TOKENIZER_MODEL,
).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode chat messages in estimate tokens",
error instanceof Error ? error : new Error(String(error)),
);
calculatedPromptTokens =
messages.reduce((acc, m) => acc + (m.content?.length || 0), 0) / 4;
}
}
// Estimate prompt tokens only if not provided by the API
if (promptTokens == null && messages?.length > 0) {
try {
// Convert messages to the format expected by gpt-tokenizer
const chatMessages: ChatMessage[] = messages.map((m) => ({
role: m.role,
content:
typeof m.content === "string" ? m.content : JSON.stringify(m.content),
name: m.name,
}));
calculatedPromptTokens = encodeChat(
chatMessages,
DEFAULT_TOKENIZER_MODEL,
).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode chat messages in estimate tokens",
error instanceof Error ? error : new Error(String(error)),
);
calculatedPromptTokens = Math.round(
messages.reduce((acc, m) => {
const text =
typeof m.content === "string" ? m.content : JSON.stringify(m.content);
return acc + text.length;
}, 0) / 4
);
}
}


// Estimate completion tokens using encode for better accuracy
if (!completionTokens && content) {
try {
calculatedCompletionTokens = encode(JSON.stringify(content)).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode completion text",
error instanceof Error ? error : new Error(String(error)),
);
calculatedCompletionTokens = content.length / 4;
}
// Estimate completion tokens only if not provided by the API
if (!completionTokens && content) {
try {
calculatedCompletionTokens = encode(JSON.stringify(content)).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode completion text",
error instanceof Error ? error : new Error(String(error)),
);
calculatedCompletionTokens = content.length / 4;
}
}
Comment on lines 48 to 60
Contributor

⚠️ Potential issue

Fix completion-path guard and encoding; avoid JSON.stringify and round fallback

  • Line 48: !completionTokens incorrectly treats 0 as missing and skips empty-string content. Use a null/undefined check and allow empty strings.
  • Line 50: encode(JSON.stringify(content)) overcounts by adding quotes/escapes; pass the string directly (see the sketch after this list).
  • Line 57: Round the heuristic to an integer.
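
A standalone sketch of the second bullet, assuming the same encode export from gpt-tokenizer that this file already uses:

import { encode } from "gpt-tokenizer";

// Illustrative only: JSON.stringify wraps the text in quotes and escapes characters
// such as newlines, so the encoder is handed extra characters and typically
// reports a higher count than for the raw string.
const content = 'He said "hello"\nacross two lines';

const direct = encode(content).length;
const viaStringify = encode(JSON.stringify(content)).length;

console.log({ direct, viaStringify }); // viaStringify is typically the larger of the two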

Apply this diff:

- // Estimate completion tokens only if not provided by the API
- if (!completionTokens && content) {
+ // Estimate completion tokens only if not provided by the API
+ if (completionTokens == null && content != null) {
   try {
-    calculatedCompletionTokens = encode(JSON.stringify(content)).length;
+    calculatedCompletionTokens = encode(content).length;
   } catch (error) {
@@
-    calculatedCompletionTokens = content.length / 4;
+    calculatedCompletionTokens = Math.round(content.length / 4);
   }
 }
📝 Committable suggestion

‼️ IMPORTANT
Carefully review the code before committing. Ensure that it accurately replaces the highlighted code, contains no missing lines, and has no issues with indentation. Thoroughly test & benchmark the code to ensure it meets the requirements.

Suggested change
// Estimate completion tokens only if not provided by the API
if (!completionTokens && content) {
try {
calculatedCompletionTokens = encode(JSON.stringify(content)).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode completion text",
error instanceof Error ? error : new Error(String(error)),
);
calculatedCompletionTokens = content.length / 4;
}
}
// Estimate completion tokens only if not provided by the API
if (completionTokens == null && content != null) {
try {
calculatedCompletionTokens = encode(content).length;
} catch (error) {
// Fallback to simple estimation if encoding fails
logger.error(
"Failed to encode completion text",
error instanceof Error ? error : new Error(String(error)),
);
calculatedCompletionTokens = Math.round(content.length / 4);
}
}
🤖 Prompt for AI Agents
In apps/gateway/src/chat/tools/estimate-tokens.ts around lines 47 to 59, the
guard `!completionTokens` treats 0 as missing and the encoder call uses
JSON.stringify which inflates token count and the fallback heuristic isn't
rounded; change the guard to check for null/undefined (e.g., completionTokens ==
null) so zero is allowed, only run the block when content is not null/undefined
(allow empty strings), call encode on the string content directly (e.g.,
encode(String(content))) instead of JSON.stringify(content), and round the
fallback heuristic to an integer (e.g., Math.round(content.length / 4)).

