From a4b4eac220b861bd80cb797869cc62aa3ed5416e Mon Sep 17 00:00:00 2001
From: Oleg Ivaniv <me@olegivaniv.com>
Date: Thu, 7 May 2026 09:03:48 +0200
Subject: [PATCH] fix(instance-ai): avoid trace token double counting

---
 .../__tests__/langsmith-tracing.test.ts       |  54 +++++-
 .../src/tracing/langsmith-tracing.ts          | 157 ++++++++++++++++--
 2 files changed, 196 insertions(+), 15 deletions(-)

diff --git a/packages/@n8n/instance-ai/src/tracing/__tests__/langsmith-tracing.test.ts b/packages/@n8n/instance-ai/src/tracing/__tests__/langsmith-tracing.test.ts
index fadf1c6da26..2213e131293 100644
--- a/packages/@n8n/instance-ai/src/tracing/__tests__/langsmith-tracing.test.ts
+++ b/packages/@n8n/instance-ai/src/tracing/__tests__/langsmith-tracing.test.ts
@@ -635,6 +635,7 @@ describe('createInstanceAiTraceContext', () => {
 	it('redacts secret-bearing native telemetry span attributes', () => {
 		const span = {
 			attributes: {
+				'ai.operationId': 'ai.streamText.doStream',
 				'ai.prompt.messages': JSON.stringify([
 					{
 						role: 'user',
@@ -657,10 +658,12 @@ describe('createInstanceAiTraceContext', () => {
 			},
 		};
 
-		const redacted = redactLangSmithTelemetrySpan(span);
+		const redacted = redactLangSmithTelemetrySpan(span) as {
+			attributes: Record<string, unknown>;
+		};
 
-		expect(redacted).toEqual({
-			attributes: {
+		expect(redacted.attributes).toEqual(
+			expect.objectContaining({
 				'ai.prompt.messages': JSON.stringify([
 					{
 						role: 'user',
@@ -675,22 +678,62 @@ describe('createInstanceAiTraceContext', () => {
 				'ai.usage.cachedInputTokens': 67,
 				'ai.usage.inputTokenDetails.cacheReadTokens': 67,
 				'gen_ai.usage.input_tokens': 56,
+				'gen_ai.usage.output_tokens': 45,
+				'gen_ai.usage.total_tokens': 101,
 				'gen_ai.usage.input_token_details': JSON.stringify({
 					cache_read: 67,
 					cache_creation: 0,
 					regular: 56,
 					original_input_tokens: 123,
 				}),
+				'langsmith.usage_metadata': JSON.stringify({
+					input_tokens: 56,
+					output_tokens: 45,
+					total_tokens: 101,
+					input_token_details: { cache_read: 67 },
+				}),
 				'headers.authorization': '[redacted]',
 				'metadata.access_token': '[redacted]',
 				'langsmith.span.parent_id': 'parent-run-1',
+				'langsmith.span.kind': 'llm',
 				'langsmith.is_root': true,
 				'langsmith.metadata.anthropic_original_input_tokens': 123,
 				'langsmith.metadata.anthropic_regular_input_tokens': 56,
 				'langsmith.metadata.anthropic_cache_read_input_tokens': 67,
 				'langsmith.metadata.anthropic_cache_creation_input_tokens': 0,
+				'ai_sdk.operation': 'ai.streamText.doStream',
+			}),
+		);
+		expect(redacted.attributes['ai.operationId']).toBeUndefined();
+		expect(redacted.attributes['instance_ai.usage.ai.usage.inputTokens']).toBeUndefined();
+	});
+
+	it('moves counted usage attributes off non-LLM spans', () => {
+		const span = {
+			attributes: {
+				'langsmith.span.kind': 'chain',
+				'gen_ai.usage.input_tokens': 100,
+				'ai.usage.outputTokens': 5,
+				'langsmith.usage_metadata': JSON.stringify({
+					input_tokens: 100,
+					output_tokens: 5,
+					total_tokens: 105,
+				}),
 			},
-		});
+		};
+
+		const redacted = redactLangSmithTelemetrySpan(span) as {
+			attributes: Record<string, unknown>;
+		};
+
+		expect(redacted.attributes['gen_ai.usage.input_tokens']).toBeUndefined();
+		expect(redacted.attributes['ai.usage.outputTokens']).toBeUndefined();
+		expect(redacted.attributes['langsmith.usage_metadata']).toBeUndefined();
+		expect(redacted.attributes['instance_ai.usage.gen_ai.usage.input_tokens']).toBe(100);
+		expect(redacted.attributes['instance_ai.usage.ai.usage.outputTokens']).toBe(5);
+		expect(redacted.attributes['instance_ai.usage.langsmith.usage_metadata']).toBe(
+			JSON.stringify({ input_tokens: 100, output_tokens: 5, total_tokens: 105 }),
+		);
 	});
 
 	it('adds LangSmith prompt input with tool specs for native AI SDK spans', () => {
@@ -770,7 +813,10 @@ describe('createInstanceAiTraceContext', () => {
 
 		expect(redacted.name).toBe('llm: workflow-builder');
 		expect(redacted.attributes['langsmith.trace.name']).toBe('llm: workflow-builder');
+		expect(redacted.attributes['langsmith.span.kind']).toBe('llm');
+		expect(redacted.attributes['gen_ai.operation.name']).toBe('chat');
 		expect(redacted.attributes['ai_sdk.operation']).toBe('ai.streamText.doStream');
+		expect(redacted.attributes['ai.operationId']).toBeUndefined();
 		expect(redacted.attributes['instance_ai.canonical_name']).toBe('ai.streamText.doStream');
 		expect(redacted.attributes.display_kind).toBe('llm');
 		expect(redacted.attributes.display_group).toBe('workflow-builder');
diff --git a/packages/@n8n/instance-ai/src/tracing/langsmith-tracing.ts b/packages/@n8n/instance-ai/src/tracing/langsmith-tracing.ts
index 9b3eeb00c8f..016eb744a05 100644
--- a/packages/@n8n/instance-ai/src/tracing/langsmith-tracing.ts
+++ b/packages/@n8n/instance-ai/src/tracing/langsmith-tracing.ts
@@ -84,8 +84,15 @@ const LANGSMITH_TRACEABLE = 'langsmith.traceable';
 const LANGSMITH_TRACE_NAME = 'langsmith.trace.name';
 const LANGSMITH_SPAN_KIND = 'langsmith.span.kind';
 const LANGSMITH_SPAN_TAGS = 'langsmith.span.tags';
+const LANGSMITH_USAGE_METADATA = 'langsmith.usage_metadata';
 const GEN_AI_PROMPT = 'gen_ai.prompt';
 const GEN_AI_COMPLETION = 'gen_ai.completion';
+const GEN_AI_OPERATION_NAME = 'gen_ai.operation.name';
+const GEN_AI_USAGE_INPUT_TOKENS = 'gen_ai.usage.input_tokens';
+const GEN_AI_USAGE_OUTPUT_TOKENS = 'gen_ai.usage.output_tokens';
+const GEN_AI_USAGE_TOTAL_TOKENS = 'gen_ai.usage.total_tokens';
+const GEN_AI_USAGE_INPUT_TOKEN_DETAILS = 'gen_ai.usage.input_token_details';
+const AI_OPERATION_ID = 'ai.operationId';
 const LLM_AI_SDK_OPERATION_IDS = new Set([
 	'ai.generateText.doGenerate',
 	'ai.streamText.doStream',
@@ -1051,6 +1058,27 @@ function readTokenDetail(details: unknown, keys: string[]): number | undefined {
 	return undefined;
 }
 
+function readNestedRecord(
+	record: Record<string, unknown>,
+	keys: string[],
+): Record<string, unknown> {
+	let current: unknown = record;
+	for (const key of keys) {
+		if (!isRecord(current)) {
+			return {};
+		}
+		current = current[key];
+	}
+	return isRecord(current) ? current : {};
+}
+
+function readProviderAnthropicUsage(attributes: Record<string, unknown>): Record<string, unknown> {
+	const providerMetadata = parseTelemetryJson(attributes['ai.response.providerMetadata']);
+	return isRecord(providerMetadata)
+		? readNestedRecord(providerMetadata, ['anthropic', 'usage'])
+		: {};
+}
+
 function firstNumberAttribute(
 	attributes: Record<string, unknown>,
 	keys: string[],
@@ -1064,23 +1092,34 @@ function firstNumberAttribute(
 	return undefined;
 }
 
-function normalizeAnthropicUsageForLangSmith(attributes: Record<string, unknown>): void {
+function buildLangSmithUsageMetadata(
+	attributes: Record<string, unknown>,
+): Record<string, unknown> | undefined {
 	const inputTokens = firstNumberAttribute(attributes, [
-		'gen_ai.usage.input_tokens',
+		GEN_AI_USAGE_INPUT_TOKENS,
 		'ai.usage.inputTokens',
 		'ai.usage.promptTokens',
 	]);
-	if (inputTokens === undefined) {
+
+	const outputTokens =
+		firstNumberAttribute(attributes, [
+			GEN_AI_USAGE_OUTPUT_TOKENS,
+			'ai.usage.outputTokens',
+			'ai.usage.completionTokens',
+		]) ?? 0;
+	if (inputTokens === undefined && outputTokens === 0) {
 		return;
 	}
 
-	const inputDetails = attributes['gen_ai.usage.input_token_details'];
+	const providerAnthropicUsage = readProviderAnthropicUsage(attributes);
+	const inputDetails = attributes[GEN_AI_USAGE_INPUT_TOKEN_DETAILS];
 	const cacheReadTokens =
 		firstNumberAttribute(attributes, [
 			'ai.usage.inputTokenDetails.cacheReadTokens',
 			'ai.usage.cachedInputTokens',
 			'ai.usage.cacheReadInputTokens',
 		]) ??
+		firstNumberAttribute(providerAnthropicUsage, ['cache_read_input_tokens']) ??
 		readTokenDetail(inputDetails, [
 			'cache_read',
 			'cache_read_tokens',
@@ -1095,6 +1134,10 @@ function normalizeAnthropicUsageForLangSmith(attributes: Record<string, unknown>
 			'ai.usage.inputTokenDetails.cacheWriteTokens',
 			'ai.usage.cacheWriteInputTokens',
 		]) ??
+		firstNumberAttribute(providerAnthropicUsage, [
+			'cache_creation_input_tokens',
+			'cache_write_input_tokens',
+		]) ??
 		readTokenDetail(inputDetails, [
 			'cache_creation',
 			'cache_creation_tokens',
@@ -1105,22 +1148,67 @@ function normalizeAnthropicUsageForLangSmith(attributes: Record<string, unknown>
 		]) ??
 		0;
 
-	if (cacheReadTokens === 0 && cacheCreationTokens === 0) {
+	const regularInputTokens =
+		inputTokens === undefined
+			? 0
+			: Math.max(0, inputTokens - cacheReadTokens - cacheCreationTokens);
+	const inputTokenDetails: Record<string, number> = {};
+	if (cacheReadTokens > 0) {
+		inputTokenDetails.cache_read = cacheReadTokens;
+	}
+	if (cacheCreationTokens > 0) {
+		inputTokenDetails.cache_creation = cacheCreationTokens;
+		inputTokenDetails.ephemeral_5m_input_tokens = cacheCreationTokens;
+	}
+
+	return {
+		input_tokens: regularInputTokens,
+		output_tokens: outputTokens,
+		total_tokens: regularInputTokens + outputTokens,
+		...(Object.keys(inputTokenDetails).length > 0
+			? { input_token_details: inputTokenDetails }
+			: {}),
+	};
+}
+
+function normalizeAnthropicUsageForLangSmith(attributes: Record<string, unknown>): void {
+	const usageMetadata = buildLangSmithUsageMetadata(attributes);
+	if (!usageMetadata) {
 		return;
 	}
 
-	const regularInputTokens = Math.max(0, inputTokens - cacheReadTokens - cacheCreationTokens);
-	attributes['gen_ai.usage.input_tokens'] = regularInputTokens;
+	const inputTokens = firstNumberAttribute(attributes, [
+		GEN_AI_USAGE_INPUT_TOKENS,
+		'ai.usage.inputTokens',
+		'ai.usage.promptTokens',
+	]);
+	const regularInputTokens = numberFromAttribute(usageMetadata.input_tokens) ?? 0;
+	const outputTokens = numberFromAttribute(usageMetadata.output_tokens) ?? 0;
+	const inputTokenDetails = isRecord(usageMetadata.input_token_details)
+		? usageMetadata.input_token_details
+		: {};
+	const cacheReadTokens = numberFromAttribute(inputTokenDetails.cache_read) ?? 0;
+	const cacheCreationTokens =
+		numberFromAttribute(inputTokenDetails.cache_creation) ??
+		numberFromAttribute(inputTokenDetails.ephemeral_5m_input_tokens) ??
+		0;
+
+	attributes[GEN_AI_USAGE_INPUT_TOKENS] = regularInputTokens;
+	attributes[GEN_AI_USAGE_OUTPUT_TOKENS] = outputTokens;
+	attributes[GEN_AI_USAGE_TOTAL_TOKENS] = regularInputTokens + outputTokens;
 	attributes['ai.usage.inputTokens'] = regularInputTokens;
-	attributes['langsmith.metadata.anthropic_original_input_tokens'] = inputTokens;
+	attributes[LANGSMITH_USAGE_METADATA] = JSON.stringify(usageMetadata);
+	if (inputTokens !== undefined) {
+		attributes['langsmith.metadata.anthropic_original_input_tokens'] = inputTokens;
+	}
 	attributes['langsmith.metadata.anthropic_regular_input_tokens'] = regularInputTokens;
 	attributes['langsmith.metadata.anthropic_cache_read_input_tokens'] = cacheReadTokens;
 	attributes['langsmith.metadata.anthropic_cache_creation_input_tokens'] = cacheCreationTokens;
-	attributes['gen_ai.usage.input_token_details'] = JSON.stringify({
+	attributes[GEN_AI_USAGE_INPUT_TOKEN_DETAILS] = JSON.stringify({
 		cache_read: cacheReadTokens,
 		cache_creation: cacheCreationTokens,
 		regular: regularInputTokens,
-		original_input_tokens: inputTokens,
+		...(inputTokens !== undefined ? { original_input_tokens: inputTokens } : {}),
 	});
 }
 
@@ -1182,7 +1270,7 @@ function renameNativeLlmSpanForLangSmith(
 	span: Record<string, unknown>,
 	attributes: Record<string, unknown>,
 ): void {
-	const operationId = readStringAttribute(attributes, ['ai.operationId']);
+	const operationId = readStringAttribute(attributes, [AI_OPERATION_ID]);
 	if (!operationId || !LLM_AI_SDK_OPERATION_IDS.has(operationId)) {
 		return;
 	}
@@ -1190,6 +1278,8 @@ function renameNativeLlmSpanForLangSmith(
 	const displayName = displayNameForNativeLlmSpan(attributes);
 	span.name = displayName;
 	attributes[LANGSMITH_TRACE_NAME] = displayName;
+	attributes[LANGSMITH_SPAN_KIND] = 'llm';
+	attributes[GEN_AI_OPERATION_NAME] = 'chat';
 	const displayGroup = inferNativeLlmRole(attributes);
 	setLangSmithMetadataAttribute(attributes, 'display_name', displayName);
 	setLangSmithMetadataAttribute(attributes, 'display_kind', 'llm');
@@ -1210,6 +1300,50 @@ function renameNativeLlmSpanForLangSmith(
 	setLangSmithMetadataAttribute(attributes, 'instance_ai.display_name', displayName);
 	setLangSmithMetadataAttribute(attributes, 'instance_ai.canonical_name', operationId);
 	setLangSmithMetadataAttribute(attributes, 'instance_ai.run_name', operationId);
+	delete attributes[AI_OPERATION_ID];
+}
+
+function isLangSmithLlmSpan(attributes: Record<string, unknown>): boolean {
+	const operationId = readStringAttribute(attributes, [AI_OPERATION_ID]);
+	return (
+		attributes[LANGSMITH_SPAN_KIND] === 'llm' ||
+		attributes.display_kind === 'llm' ||
+		(typeof operationId === 'string' && LLM_AI_SDK_OPERATION_IDS.has(operationId))
+	);
+}
+
+function isCountedUsageAttribute(key: string): boolean {
+	return (
+		key === LANGSMITH_USAGE_METADATA ||
+		key === 'usage_metadata' ||
+		key === 'prompt_tokens' ||
+		key === 'completion_tokens' ||
+		key === 'total_tokens' ||
+		key === 'input_tokens' ||
+		key === 'output_tokens' ||
+		key.startsWith('gen_ai.usage.') ||
+		key.startsWith('ai.usage.') ||
+		key.startsWith('llm.usage.')
+	);
+}
+
+function neutralUsageAttributeKey(key: string): string {
+	return `instance_ai.usage.${key}`;
+}
+
+function moveNonLlmUsageAttributes(attributes: Record<string, unknown>): void {
+	if (isLangSmithLlmSpan(attributes)) {
+		return;
+	}
+
+	for (const key of Object.keys(attributes)) {
+		if (!isCountedUsageAttribute(key)) {
+			continue;
+		}
+
+		attributes[neutralUsageAttributeKey(key)] = attributes[key];
+		delete attributes[key];
+	}
 }
 
 export function redactLangSmithTelemetrySpan(span: unknown): unknown {
@@ -1224,6 +1358,7 @@ export function redactLangSmithTelemetrySpan(span: unknown): unknown {
 	enrichLangSmithPromptAttribute(attributes);
 	normalizeAnthropicUsageForLangSmith(attributes);
 	renameNativeLlmSpanForLangSmith(span, attributes);
+	moveNonLlmUsageAttributes(attributes);
 	span.attributes = attributes;
 	return span;
 }