feat: add opt-in API usage logging for write endpoint

Anthony Bailey · claude · Anthony Bailey · commit 25865555851f · 2025-06-27T07:28:16.000+01:00
- Implement comprehensive usage logging with rate limit tracking - Opt-in via write-usage.log file existence - Capture token usage, rate limits, duration, and errors - Clean wrapper pattern keeps server code uncluttered - Logs both successful API calls and rate limit errors - No performance impact when logging disabled This helps monitor API usage patterns and debug rate limit issues during conference demos and multi-user testing. 🤖 Generated with [Claude Code](https://claude.ai/code) Co-Authored-By: Claude <noreply@anthropic.com>
diff --git a/src/lib/usage-logger.ts b/src/lib/usage-logger.ts
@@ -0,0 +1,226 @@
+import { writeFileSync, existsSync } from 'fs'
+import { join } from 'path'
+
+const USAGE_LOG_FILE = 'write-usage.log'
+
+interface UsageLogEntry {
+	[requestId: string]: {
+		timestamp: string // ISO format for lexical sorting
+		stepName: string
+		model: string
+		orgId?: string
+		usage: {
+			input_tokens: number
+			cache_creation_input_tokens: number
+			cache_read_input_tokens: number
+			output_tokens: number
+			service_tier: string
+		}
+		rateLimits: {
+			input_tokens_remaining: number
+			output_tokens_remaining: number
+			requests_remaining: number
+			input_tokens_limit: number
+			output_tokens_limit: number
+			requests_limit: number
+		}
+		durationMs: number
+		toolsUsed: boolean
+		webSearchCount?: number
+	}
+}
+
+/**
+ * Log API usage information if write-usage.log file exists
+ * Uses JSON blob per line format for easy parsing
+ */
+export function logApiUsage(
+	requestId: string,
+	stepName: string,
+	model: string,
+	response: any, // Anthropic API response
+	headers: Record<string, string>, // Response headers
+	durationMs: number,
+	toolsUsed: boolean = false,
+	webSearchCount: number = 0
+): void {
+	// Only log if the log file exists (opt-in)
+	if (!existsSync(USAGE_LOG_FILE)) {
+		return
+	}
+
+	try {
+		const logEntry: UsageLogEntry = {
+			[requestId]: {
+				timestamp: new Date().toISOString(),
+				stepName,
+				model,
+				orgId: headers['anthropic-organization-id'],
+				usage: response.usage || {
+					input_tokens: 0,
+					cache_creation_input_tokens: 0,
+					cache_read_input_tokens: 0,
+					output_tokens: 0,
+					service_tier: 'unknown'
+				},
+				rateLimits: {
+					input_tokens_remaining: parseInt(
+						headers['anthropic-ratelimit-input-tokens-remaining'] || '0'
+					),
+					output_tokens_remaining: parseInt(
+						headers['anthropic-ratelimit-output-tokens-remaining'] || '0'
+					),
+					requests_remaining: parseInt(headers['anthropic-ratelimit-requests-remaining'] || '0'),
+					input_tokens_limit: parseInt(headers['anthropic-ratelimit-input-tokens-limit'] || '0'),
+					output_tokens_limit: parseInt(headers['anthropic-ratelimit-output-tokens-limit'] || '0'),
+					requests_limit: parseInt(headers['anthropic-ratelimit-requests-limit'] || '0')
+				},
+				durationMs,
+				toolsUsed,
+				...(webSearchCount > 0 && { webSearchCount })
+			}
+		}
+
+		// Append JSON blob as single line
+		const logLine = JSON.stringify(logEntry) + '\n'
+		writeFileSync(USAGE_LOG_FILE, logLine, { flag: 'a' })
+	} catch (error) {
+		// Silently fail to avoid breaking the API
+		console.warn('Failed to log API usage:', error)
+	}
+}
+
+/**
+ * Wrap an Anthropic API promise to optionally add logging with rate limit headers
+ * If logging is disabled, returns the original response
+ * If logging is enabled, uses .withResponse() to capture headers and logs usage
+ */
+export function optionallyLogUsage<T>(
+	originalPromise: any, // The anthropic.messages.create() promise
+	stepName: string,
+	model: string,
+	startTime: number,
+	toolsUsed: boolean = false,
+	webSearchCount: number = 0
+): Promise<T> {
+	// If logging is disabled, return original promise unchanged
+	if (!existsSync(USAGE_LOG_FILE)) {
+		return originalPromise
+	}
+
+	// If logging is enabled, use withResponse() to get headers
+	return originalPromise
+		.withResponse()
+		.then((responseWithMeta: any) => {
+			const response = responseWithMeta.data
+			const headers = responseWithMeta.response.headers
+			const durationMs = Date.now() - startTime
+
+			// Log in background (don't block)
+			try {
+				const logEntry: UsageLogEntry = {
+					[response.id]: {
+						timestamp: new Date().toISOString(),
+						stepName,
+						model,
+						usage: response.usage || {
+							input_tokens: 0,
+							cache_creation_input_tokens: 0,
+							cache_read_input_tokens: 0,
+							output_tokens: 0,
+							service_tier: 'unknown'
+						},
+						rateLimits: {
+							input_tokens_remaining: parseInt(
+								headers.get('anthropic-ratelimit-input-tokens-remaining') || '0'
+							),
+							output_tokens_remaining: parseInt(
+								headers.get('anthropic-ratelimit-output-tokens-remaining') || '0'
+							),
+							requests_remaining: parseInt(
+								headers.get('anthropic-ratelimit-requests-remaining') || '0'
+							),
+							input_tokens_limit: parseInt(
+								headers.get('anthropic-ratelimit-input-tokens-limit') || '0'
+							),
+							output_tokens_limit: parseInt(
+								headers.get('anthropic-ratelimit-output-tokens-limit') || '0'
+							),
+							requests_limit: parseInt(headers.get('anthropic-ratelimit-requests-limit') || '0'),
+							// Check for potential web search rate limit headers (may not exist)
+							web_search_remaining:
+								parseInt(headers.get('anthropic-ratelimit-web-search-remaining') || '0') || null,
+							web_search_limit:
+								parseInt(headers.get('anthropic-ratelimit-web-search-limit') || '0') || null,
+							// Also capture web search usage from response body if available
+							web_search_requests_used: response.usage?.server_tool_use?.web_search_requests || null
+						},
+						durationMs,
+						toolsUsed,
+						...(webSearchCount > 0 && { webSearchCount })
+					}
+				}
+
+				// Append JSON blob as single line
+				const logLine = JSON.stringify(logEntry) + '\n'
+				writeFileSync(USAGE_LOG_FILE, logLine, { flag: 'a' })
+			} catch (error) {
+				// Silently fail to avoid breaking the API
+				console.warn('Failed to log API usage:', error)
+			}
+
+			// Return the original response (not the withResponse wrapper)
+			return response
+		})
+		.catch((error: any) => {
+			// Log errors with headers if possible
+			const durationMs = Date.now() - startTime
+
+			try {
+				const errorId = `error_${Date.now()}_${Math.random().toString(36).substr(2, 9)}`
+				const logEntry = {
+					[errorId]: {
+						timestamp: new Date().toISOString(),
+						stepName,
+						model,
+						error: error?.message || String(error),
+						durationMs,
+						toolsUsed,
+						// Try to get rate limits from error response if available
+						rateLimits: error?.headers
+							? {
+									input_tokens_remaining: parseInt(
+										error.headers['anthropic-ratelimit-input-tokens-remaining'] || '0'
+									),
+									output_tokens_remaining: parseInt(
+										error.headers['anthropic-ratelimit-output-tokens-remaining'] || '0'
+									),
+									requests_remaining: parseInt(
+										error.headers['anthropic-ratelimit-requests-remaining'] || '0'
+									),
+									input_tokens_limit: parseInt(
+										error.headers['anthropic-ratelimit-input-tokens-limit'] || '0'
+									),
+									output_tokens_limit: parseInt(
+										error.headers['anthropic-ratelimit-output-tokens-limit'] || '0'
+									),
+									requests_limit: parseInt(
+										error.headers['anthropic-ratelimit-requests-limit'] || '0'
+									)
+								}
+							: null
+					}
+				}
+
+				// Append JSON blob as single line
+				const logLine = JSON.stringify(logEntry) + '\n'
+				writeFileSync(USAGE_LOG_FILE, logLine, { flag: 'a' })
+			} catch (logError) {
+				// Silently fail to avoid breaking the API
+				console.warn('Failed to log API error:', logError)
+			}
+
+			// Rethrow the original error
+			throw error
+		})
+}
diff --git a/src/routes/api/write/+server.ts b/src/routes/api/write/+server.ts
@@ -1,6 +1,7 @@
 import { error, json } from '@sveltejs/kit'
 import { env } from '$env/dynamic/private'
 import Anthropic from '@anthropic-ai/sdk'
+import { optionallyLogUsage } from '$lib/usage-logger'
 
 // Safely access the API key, will be undefined if not set
 const ANTHROPIC_API_KEY_FOR_WRITE = env.ANTHROPIC_API_KEY_FOR_WRITE || undefined
@@ -52,7 +53,7 @@ const stepConfigs: Record<StepName, StepConfig> = {
 	// Research-focused steps that benefit from web search
 	findTarget: {
 		toolsEnabled: true,
-		maxToolCalls: 5,
+		maxToolCalls: 3,
 		description: 'Find possible targets (using web search)'
 	},
 	webSearch: {
@@ -287,12 +288,13 @@ Search for and provide:
 7. Contact information (professional email or official channels if publicly available)
 
 Please cite all sources you use and only include information you can verify through your internet search. If you encounter conflicting information, note this and provide the most reliable source.
-
-BE BRIEF! This is extremely important. Try to output only a few lines of text for each questions.
-BE FAST! You do not have a lot of time to answer this query before it times out!
-ANSWER QUICKLY!!!
 `
 
+//BE BRIEF! This is extremely important. Try to output only a few lines of text for each questions.
+//BE FAST! You do not have a lot of time to answer this query before it times out!
+//ANSWER QUICKLY!!!
+//`
+
 // Only initialize the client if we have an API key
 const anthropic = IS_API_AVAILABLE
 	? new Anthropic({
@@ -358,6 +360,10 @@ async function callClaude(
 		// Combine all the specified prompts
 		const systemPrompt = promptNames.map((name) => System_Prompts[name]).join('')
 
+		// TEMP: Log the full request prompt for debugging
+		console.debug(`${logPrefix} system prompt:\n---\n${systemPrompt}\n---`)
+		console.debug(`${logPrefix} user content:\n---\n${userContent}\n---`)
+
 		// NEW: Determine if tools should be included in this call
 		const shouldUseTools = toolsEnabled && ENABLE_WEB_SEARCH && IS_API_AVAILABLE
 
@@ -372,14 +378,14 @@ async function callClaude(
 					{
 						type: 'web_search_20250305', // CHANGED: Use correct tool type from API docs
 						name: 'web_search',
-						max_uses: 1 // ADDED: Limit searches per request
+						max_uses: 5 // ADDED: Limit searches per request
 					}
 				]
 			: undefined
 
 		// ENHANCED: Create API request with conditional tool support
 		const requestParams: any = {
-			model: 'claude-3-7-sonnet-20250219',
+			model: 'claude-sonnet-4-20250514',
 			max_tokens: 4096,
 			system: systemPrompt,
 			messages: [{ role: 'user', content: userContent }]
@@ -406,7 +412,14 @@ async function callClaude(
 				messages: currentMessages
 			}
 
-			const response = await anthropic.messages.create(currentRequest)
+			const response = await optionallyLogUsage(
+				anthropic.messages.create(currentRequest),
+				stepName,
+				requestParams.model,
+				startTime,
+				shouldUseTools,
+				toolCallCount
+			)
 
 			// Log the request ID at debug level
 			console.debug(`${logPrefix} requestId: ${response.id}`)
@@ -468,6 +481,9 @@ async function callClaude(
 
 		// Log the full response text at debug level
 		console.debug(`${logPrefix} full response:\n---\n${finalText}\n---`)
+
+		// Logging is handled by optionallyLogUsage wrapper
+
 		return { text: finalText, durationSec: elapsed }
 	} catch (error) {
 		// ENHANCED: Better error handling for tool-related failures