npm - @hatchway/cli - Versions diffs - 0.50.63 → 0.50.64 - Mend

@hatchway/cli 0.50.63 → 0.50.64

This diff shows the changes between two publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the contents of each package version as they appear in their respective public registries.

Files changed (3) hide show

package/dist/index.js CHANGED Viewed

@@ -4335,9 +4335,10 @@ function buildPromptWithImages(prompt, messageParts) {
  * query() SDK function -> minimal transformation -> output
  *
  * Sentry Integration:
- * - The query() function is auto-instrumented by Sentry's claudeCodeAgentSdkIntegration
- * - Instrumentation hooks into @anthropic-ai/claude-agent-sdk via OpenTelemetry
- * - IMPORTANT: Sentry must be initialized BEFORE claude-agent-sdk is imported
+ * - Manual gen_ai.* spans for AI Agent Monitoring in Sentry
+ * - gen_ai.invoke_agent wraps the full query lifecycle
+ * - gen_ai.execute_tool spans are emitted per tool call
+ * - Token usage and cost are captured from the SDK result message
  */
 function createNativeClaudeQuery(modelId = DEFAULT_CLAUDE_MODEL_ID, abortController) {
     return async function* nativeClaudeQuery(prompt, workingDirectory, systemPrompt, _agent, _codexThreadId, messageParts) {
@@ -4423,20 +4424,44 @@ function createNativeClaudeQuery(modelId = DEFAULT_CLAUDE_MODEL_ID, abortControl
         let messageCount = 0;
         let toolCallCount = 0;
         let textBlockCount = 0;
+        // Wrap the entire agent execution in a gen_ai.invoke_agent span for Sentry AI monitoring
+        const agentSpan = Sentry.startInactiveSpan({
+            op: 'gen_ai.invoke_agent',
+            name: `Claude Agent (${modelId})`,
+            attributes: {
+                'gen_ai.agent.name': 'hatchway-builder',
+                'gen_ai.request.model': modelId,
+                'gen_ai.agent.input': finalPrompt.substring(0, 500),
+                'gen_ai.system_prompt.length': appendedSystemPrompt.length,
+                'gen_ai.agent.available_tools': JSON.stringify(['Bash', 'Read', 'Write', 'Edit', 'Glob', 'Grep', 'Task', 'TodoWrite', 'WebFetch']),
+            },
+        });
         try {
             // Stream messages directly from the SDK
-            // NOTE: query() is auto-instrumented by Sentry's claudeCodeAgentSdkIntegration
             for await (const sdkMessage of query({ prompt: finalPrompt, options })) {
                 messageCount++;
                 // Transform SDK message to our internal format
                 const transformed = transformSDKMessage(sdkMessage);
                 if (transformed) {
-                    // Track stats for logging
+                    // Track stats and emit gen_ai.execute_tool spans for tool calls
                     if (transformed.type === 'assistant' && transformed.message?.content) {
                         for (const block of transformed.message.content) {
                             if (block.type === 'tool_use') {
                                 toolCallCount++;
                                 debugLog$4(`[runner] [native-sdk] 🔧 Tool call: ${block.name}\n`);
+                                // Emit a gen_ai.execute_tool span for each tool invocation
+                                const toolSpan = Sentry.startInactiveSpan({
+                                    op: 'gen_ai.execute_tool',
+                                    name: `Tool: ${block.name}`,
+                                    attributes: {
+                                        'gen_ai.tool.name': block.name,
+                                        'gen_ai.tool.call_id': block.id,
+                                        'gen_ai.tool.input': JSON.stringify(block.input).substring(0, 1000),
+                                    },
+                                });
+                                // Tool spans are completed immediately since we get input and output
+                                // as separate messages — the output is captured in the tool_result handler below
+                                toolSpan?.end();
                             }
                             else if (block.type === 'text') {
                                 textBlockCount++;
@@ -4485,13 +4510,31 @@ function createNativeClaudeQuery(modelId = DEFAULT_CLAUDE_MODEL_ID, abortControl
                         process.stderr.write(`[native-sdk] Tool use summary: ${summaryMsg.summary}\n`);
                     }
                 }
-                // Log result messages
+                // Capture result messages — record token usage and cost on the agent span
                 if (sdkMessage.type === 'result') {
-                    if (sdkMessage.subtype === 'success') {
-                        debugLog$4(`[runner] [native-sdk] ✅ Query complete - ${sdkMessage.num_turns} turns, $${sdkMessage.total_cost_usd?.toFixed(4)} USD\n`);
+                    const resultMsg = sdkMessage;
+                    if (agentSpan) {
+                        agentSpan.setAttribute('gen_ai.usage.input_tokens', resultMsg.usage?.input_tokens ?? 0);
+                        agentSpan.setAttribute('gen_ai.usage.output_tokens', resultMsg.usage?.output_tokens ?? 0);
+                        agentSpan.setAttribute('gen_ai.usage.total_tokens', (resultMsg.usage?.input_tokens ?? 0) + (resultMsg.usage?.output_tokens ?? 0));
+                        agentSpan.setAttribute('gen_ai.usage.cost_usd', resultMsg.total_cost_usd ?? 0);
+                        agentSpan.setAttribute('gen_ai.agent.num_turns', resultMsg.num_turns ?? 0);
+                        agentSpan.setAttribute('gen_ai.agent.num_tool_calls', toolCallCount);
+                        agentSpan.setAttribute('gen_ai.agent.result', resultMsg.subtype ?? 'unknown');
+                        agentSpan.setAttribute('gen_ai.agent.duration_ms', resultMsg.duration_ms ?? 0);
+                        agentSpan.setAttribute('gen_ai.agent.duration_api_ms', resultMsg.duration_api_ms ?? 0);
+                        if (resultMsg.usage?.cache_read_input_tokens) {
+                            agentSpan.setAttribute('gen_ai.usage.cache_read_tokens', resultMsg.usage.cache_read_input_tokens);
+                        }
+                        if (resultMsg.usage?.cache_creation_input_tokens) {
+                            agentSpan.setAttribute('gen_ai.usage.cache_creation_tokens', resultMsg.usage.cache_creation_input_tokens);
+                        }
+                    }
+                    if (resultMsg.subtype === 'success') {
+                        debugLog$4(`[runner] [native-sdk] ✅ Query complete - ${resultMsg.num_turns} turns, $${resultMsg.total_cost_usd?.toFixed(4)} USD\n`);
                     }
                     else {
-                        debugLog$4(`[runner] [native-sdk] ⚠️  Query ended with: ${sdkMessage.subtype}\n`);
+                        debugLog$4(`[runner] [native-sdk] ⚠️  Query ended with: ${resultMsg.subtype}\n`);
                     }
                 }
             }
@@ -4499,9 +4542,16 @@ function createNativeClaudeQuery(modelId = DEFAULT_CLAUDE_MODEL_ID, abortControl
         }
         catch (error) {
             debugLog$4(`[runner] [native-sdk] ❌ Error: ${error instanceof Error ? error.message : String(error)}\n`);
+            if (agentSpan) {
+                agentSpan.setStatus({ code: 2, message: error instanceof Error ? error.message : String(error) });
+            }
             Sentry.captureException(error);
             throw error;
         }
+        finally {
+            // End the agent span regardless of success/failure
+            agentSpan?.end();
+        }
     };
 }