npm - @voltagent/core - Versions diffs - 2.6.7 → 2.6.10 - Mend

@voltagent/core 2.6.7 → 2.6.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8)

package/dist/index.d.mts +4 -0
package/dist/index.d.ts +4 -0
package/dist/index.js +223 -13
package/dist/index.js.map +1 -1
package/dist/index.mjs +221 -10
package/dist/index.mjs.map +1 -1
package/docs/observability-platform/llm-usage-and-costs.md +122 -2
package/package.json +1 -1

package/dist/index.d.mts CHANGED Viewed

@@ -8796,6 +8796,7 @@ declare class Memory {
      * Get messages by their IDs
      */
     private getMessagesByIds;
+    private getMessageVectorIdsForClear;
     /**
      * Merge two arrays of messages, removing duplicates
      */
@@ -9369,6 +9370,7 @@ declare class Agent {
      */
     private prepareExecution;
     private collectToolDataFromResult;
+    private ensureStructuredOutputGenerated;
     /**
      * Create execution context
      */
@@ -9404,6 +9406,7 @@ declare class Agent {
     private createLLMSpanFinalizer;
     private buildLLMSpanAttributes;
     private recordLLMUsage;
+    private recordProviderCost;
     private createEvalHost;
     /**
      * Get observability instance (lazy initialization)
@@ -9682,6 +9685,7 @@ declare class Agent {
      * Maps AI SDK's LanguageModelUsage to trace context format
      */
     private setTraceContextUsage;
+    private recordRootSpanUsageAndProviderCost;
     /**
      * Create working memory tools if configured
      */

package/dist/index.d.ts CHANGED Viewed

@@ -8796,6 +8796,7 @@ declare class Memory {
      * Get messages by their IDs
      */
     private getMessagesByIds;
+    private getMessageVectorIdsForClear;
     /**
      * Merge two arrays of messages, removing duplicates
      */
@@ -9369,6 +9370,7 @@ declare class Agent {
      */
     private prepareExecution;
     private collectToolDataFromResult;
+    private ensureStructuredOutputGenerated;
     /**
      * Create execution context
      */
@@ -9404,6 +9406,7 @@ declare class Agent {
     private createLLMSpanFinalizer;
     private buildLLMSpanAttributes;
     private recordLLMUsage;
+    private recordProviderCost;
     private createEvalHost;
     /**
      * Get observability instance (lazy initialization)
@@ -9682,6 +9685,7 @@ declare class Agent {
      * Maps AI SDK's LanguageModelUsage to trace context format
      */
     private setTraceContextUsage;
+    private recordRootSpanUsageAndProviderCost;
     /**
      * Create working memory tools if configured
      */

package/dist/index.js CHANGED Viewed

@@ -352,7 +352,7 @@ __export(index_exports, {
   hasFilePart: () => hasFilePart,
   hasImagePart: () => hasImagePart,
   hasTextPart: () => hasTextPart,
-  hasToolCall: () => import_ai8.hasToolCall,
+  hasToolCall: () => import_ai9.hasToolCall,
   isAbortError: () => isAbortError,
   isMiddlewareAbortError: () => isMiddlewareAbortError,
   isNodeRuntime: () => isNodeRuntime,
@@ -375,7 +375,7 @@ __export(index_exports, {
   serializeValueForDebug: () => serializeValueForDebug,
   setWaitUntil: () => setWaitUntil,
   shouldSample: () => shouldSample,
-  stepCountIs: () => import_ai8.stepCountIs,
+  stepCountIs: () => import_ai9.stepCountIs,
   tool: () => tool,
   trace: () => import_api9.trace,
   transformTextContent: () => transformTextContent,
@@ -5248,6 +5248,7 @@ __name(cosineSimilarity, "cosineSimilarity");
 // src/memory/index.ts
 var isEmbeddingAdapter = /* @__PURE__ */ __name((value) => typeof value === "object" && value !== null && "embed" in value && typeof value.embed === "function" && "embedBatch" in value && typeof value.embedBatch === "function", "isEmbeddingAdapter");
 var isEmbeddingAdapterConfig = /* @__PURE__ */ __name((value) => typeof value === "object" && value !== null && "model" in value && !isEmbeddingAdapter(value), "isEmbeddingAdapterConfig");
+var VECTOR_CLEAR_CONVERSATION_PAGE_SIZE = 200;
 var resolveEmbeddingAdapter = /* @__PURE__ */ __name((embedding) => {
   if (!embedding) {
     return void 0;
@@ -5333,6 +5334,19 @@ var Memory = class {
    * Clear messages for a user
    */
   async clearMessages(userId, conversationId, context8) {
+    if (this.vector) {
+      try {
+        const vectorIds = await this.getMessageVectorIdsForClear(userId, conversationId);
+        if (vectorIds.length > 0) {
+          await this.vector.deleteBatch(vectorIds);
+        }
+      } catch (error) {
+        console.warn(
+          `Failed to delete vectors while clearing messages for user ${userId}${conversationId ? ` conversation ${conversationId}` : ""}:`,
+          error
+        );
+      }
+    }
     return this.storage.clearMessages(userId, conversationId, context8);
   }
   /**
@@ -5469,6 +5483,36 @@ var Memory = class {
     const ordered = messageIds.map((id) => byId.get(id)).filter((m) => Boolean(m));
     return ordered;
   }
+  async getMessageVectorIdsForClear(userId, conversationId) {
+    const vectorIds = /* @__PURE__ */ new Set();
+    if (conversationId) {
+      const messages = await this.storage.getMessages(userId, conversationId);
+      for (const message of messages) {
+        vectorIds.add(`msg_${conversationId}_${message.id}`);
+      }
+      return Array.from(vectorIds);
+    }
+    const totalConversations = await this.storage.countConversations({ userId });
+    let offset = 0;
+    while (offset < totalConversations) {
+      const conversations = await this.storage.queryConversations({
+        userId,
+        limit: VECTOR_CLEAR_CONVERSATION_PAGE_SIZE,
+        offset
+      });
+      for (const conversation of conversations) {
+        const messages = await this.storage.getMessages(userId, conversation.id);
+        for (const message of messages) {
+          vectorIds.add(`msg_${conversation.id}_${message.id}`);
+        }
+      }
+      if (conversations.length === 0) {
+        break;
+      }
+      offset += conversations.length;
+    }
+    return Array.from(vectorIds);
+  }
   /**
    * Merge two arrays of messages, removing duplicates
    */
@@ -26315,6 +26359,10 @@ var AgentTraceContext = class {
 function addModelAttributesToSpan(span, modelName, options, defaultMaxOutputTokens, defaultTemperature) {
   if (!span) return;
   span.setAttribute("ai.model.name", modelName);
+  const provider = typeof modelName === "string" && modelName.includes("/") ? modelName.split("/")[0] : void 0;
+  if (provider) {
+    span.setAttribute("ai.model.provider", provider);
+  }
   const temperature = options?.temperature ?? options?.providerOptions?.temperature ?? defaultTemperature;
   if (temperature !== void 0 && typeof temperature === "number") {
     span.setAttribute("ai.model.temperature", temperature);
@@ -30028,6 +30076,7 @@ var DEFAULT_CONVERSATION_PERSISTENCE_OPTIONS = {
   flushOnToolResult: true
 };
 var isRecord4 = /* @__PURE__ */ __name((value) => typeof value === "object" && value !== null, "isRecord");
+var isPlainObject = /* @__PURE__ */ __name((value) => isRecord4(value) && !Array.isArray(value), "isPlainObject");
 var hasNonEmptyString2 = /* @__PURE__ */ __name((value) => typeof value === "string" && value.trim().length > 0, "hasNonEmptyString");
 var firstNonBlank = /* @__PURE__ */ __name((...values) => {
   for (const value of values) {
@@ -30045,6 +30094,58 @@ var firstDefined = /* @__PURE__ */ __name((...values) => {
   }
   return void 0;
 }, "firstDefined");
+var toFiniteNumber = /* @__PURE__ */ __name((value) => {
+  if (typeof value === "number") {
+    return Number.isFinite(value) ? value : void 0;
+  }
+  if (typeof value === "string") {
+    const parsed = Number(value);
+    return Number.isFinite(parsed) ? parsed : void 0;
+  }
+  return void 0;
+}, "toFiniteNumber");
+var toBoolean = /* @__PURE__ */ __name((value) => {
+  if (typeof value === "boolean") {
+    return value;
+  }
+  if (typeof value === "string") {
+    const normalized = value.trim().toLowerCase();
+    if (normalized === "true") return true;
+    if (normalized === "false") return false;
+  }
+  return void 0;
+}, "toBoolean");
+var extractOpenRouterUsageCost = /* @__PURE__ */ __name((providerMetadata) => {
+  if (!isPlainObject(providerMetadata)) {
+    return void 0;
+  }
+  const openRouterMetadata = isPlainObject(providerMetadata.openrouter) ? providerMetadata.openrouter : void 0;
+  const usage = openRouterMetadata && isPlainObject(openRouterMetadata.usage) ? openRouterMetadata.usage : void 0;
+  if (!usage) {
+    return void 0;
+  }
+  const costDetails = firstDefined(
+    isPlainObject(usage.costDetails) ? usage.costDetails : void 0,
+    isPlainObject(usage.cost_details) ? usage.cost_details : void 0
+  );
+  const result = {
+    cost: toFiniteNumber(usage.cost),
+    isByok: firstDefined(toBoolean(usage.isByok), toBoolean(usage.is_byok)),
+    upstreamInferenceCost: firstDefined(
+      toFiniteNumber(costDetails?.upstreamInferenceCost),
+      toFiniteNumber(costDetails?.upstream_inference_cost)
+    ),
+    upstreamInferenceInputCost: firstDefined(
+      toFiniteNumber(costDetails?.upstreamInferenceInputCost),
+      toFiniteNumber(costDetails?.upstream_inference_input_cost)
+    ),
+    upstreamInferenceOutputCost: firstDefined(
+      toFiniteNumber(costDetails?.upstreamInferenceOutputCost),
+      toFiniteNumber(costDetails?.upstream_inference_output_cost)
+    )
+  };
+  return Object.values(result).some((value) => value !== void 0) ? result : void 0;
+}, "extractOpenRouterUsageCost");
 var isAssistantContentPart = /* @__PURE__ */ __name((value) => {
   if (!isRecord4(value)) {
     return false;
@@ -30604,10 +30705,17 @@ var Agent = class {
                       onStepFinish: this.createStepHandler(oc, options)
                     })
                   );
+                  this.ensureStructuredOutputGenerated({
+                    result: response,
+                    output,
+                    tools,
+                    maxSteps
+                  });
                   const resolvedProviderUsage = response.usage ? await Promise.resolve(response.usage) : void 0;
                   finalizeLLMSpan(import_api16.SpanStatusCode.OK, {
                     usage: resolvedProviderUsage,
-                    finishReason: response.finishReason
+                    finishReason: response.finishReason,
+                    providerMetadata: response.providerMetadata
                   });
                   return response;
                 } catch (error) {
@@ -30629,6 +30737,11 @@ var Agent = class {
               usage: providerUsage,
               totalUsage: result.totalUsage
             });
+            this.recordRootSpanUsageAndProviderCost(
+              oc.traceContext,
+              usageForFinish,
+              result.providerMetadata
+            );
             const { toolCalls: aggregatedToolCalls, toolResults: aggregatedToolResults } = this.collectToolDataFromResult(result);
             const usageInfo = convertUsage(usageForFinish);
             const middlewareText = await runOutputMiddlewares(
@@ -30690,7 +30803,6 @@ var Agent = class {
                 text: finalText
               }
             );
-            this.setTraceContextUsage(oc.traceContext, usageForFinish);
             oc.traceContext.setOutput(finalText);
             oc.traceContext.setFinishReason(result.finishReason);
             if (result.steps && result.steps.length >= maxSteps) {
@@ -31164,14 +31276,19 @@ var Agent = class {
                   usage: providerUsage,
                   totalUsage: finalResult.totalUsage
                 });
+                this.recordRootSpanUsageAndProviderCost(
+                  oc.traceContext,
+                  usageForFinish,
+                  finalResult.providerMetadata
+                );
                 finalizeLLMSpan(import_api16.SpanStatusCode.OK, {
                   usage: providerUsage,
-                  finishReason: finalResult.finishReason
+                  finishReason: finalResult.finishReason,
+                  providerMetadata: finalResult.providerMetadata
                 });
                 if (!shouldDeferPersist && shouldPersistMemory) {
                   await persistQueue.flush(buffer, oc);
                 }
-                this.setTraceContextUsage(oc.traceContext, usageForFinish);
                 const usage = convertUsage(usageForFinish);
                 let finalText;
                 const bailedResult = oc.systemContext.get("bailedResult");
@@ -31273,7 +31390,8 @@ var Agent = class {
                 });
                 finalizeLLMSpan(import_api16.SpanStatusCode.OK, {
                   usage: usageForFinish,
-                  finishReason: finalResult.finishReason
+                  finishReason: finalResult.finishReason,
+                  providerMetadata: finalResult.providerMetadata
                 });
                 oc.traceContext.end("completed");
                 feedbackFinalizeRequested = true;
@@ -31729,6 +31847,11 @@ var Agent = class {
               usage: providerUsage,
               totalUsage: result.totalUsage
             });
+            this.recordRootSpanUsageAndProviderCost(
+              oc.traceContext,
+              usageForFinish,
+              result.providerMetadata
+            );
             const usageInfo = convertUsage(usageForFinish);
             const middlewareObject = await runOutputMiddlewares(
               result.object,
@@ -31776,7 +31899,6 @@ var Agent = class {
               };
               this.addStepToHistory(step, oc);
             }
-            this.setTraceContextUsage(oc.traceContext, usageForFinish);
             oc.traceContext.setOutput(finalObject);
             oc.output = finalObject;
             this.enqueueEvalScoring({
@@ -32084,6 +32206,11 @@ var Agent = class {
                     usage: providerUsage,
                     totalUsage: finalResult.totalUsage
                   });
+                  this.recordRootSpanUsageAndProviderCost(
+                    oc.traceContext,
+                    usageForFinish,
+                    finalResult.providerMetadata
+                  );
                   const usageInfo = convertUsage(usageForFinish);
                   let finalObject = finalResult.object;
                   if (guardrailSet.output.length > 0) {
@@ -32122,7 +32249,6 @@ var Agent = class {
                     };
                     this.addStepToHistory(step, oc);
                   }
-                  this.setTraceContextUsage(oc.traceContext, usageForFinish);
                   oc.traceContext.setOutput(finalObject);
                   oc.output = finalObject;
                   await this.getMergedHooks(options).onEnd?.({
@@ -32345,6 +32471,42 @@ Metadata: ${(0, import_utils33.safeStringify)(metadata)}`;
       toolResults: stepToolResults.length > 0 ? stepToolResults : result.toolResults ?? []
     };
   }
+  ensureStructuredOutputGenerated(params) {
+    const { result, output, tools, maxSteps } = params;
+    if (!output) {
+      return;
+    }
+    try {
+      void result.output;
+    } catch (error) {
+      const isNoOutputGeneratedError = error instanceof import_ai7.NoOutputGeneratedError || error instanceof Error && error.name === "AI_NoOutputGeneratedError";
+      if (!isNoOutputGeneratedError) {
+        throw error;
+      }
+      const { toolCalls } = this.collectToolDataFromResult(result);
+      const configuredToolCount = Object.keys(tools ?? {}).length;
+      const stepCount = result.steps?.length ?? 0;
+      const finishReason = result.finishReason ?? "unknown";
+      const reachedMaxSteps = stepCount >= maxSteps;
+      const guidance = configuredToolCount > 0 || toolCalls.length > 0 ? "When tools are enabled, ensure the model emits a final non-tool response that matches the output schema, or split this into two calls (tools first, schema formatting second)." : "Ensure the model emits a final response that matches the requested output schema.";
+      const maxStepHint = reachedMaxSteps ? ` Generation stopped after ${stepCount} steps (maxSteps=${maxSteps}).` : "";
+      throw createVoltAgentError(
+        `Structured output was requested but no final output was generated (finishReason: ${finishReason}). ${guidance}${maxStepHint}`,
+        {
+          stage: "response_parsing",
+          code: "STRUCTURED_OUTPUT_NOT_GENERATED",
+          originalError: error,
+          metadata: {
+            finishReason,
+            stepCount,
+            maxSteps,
+            configuredToolCount,
+            toolCallCount: toolCalls.length
+          }
+        }
+      );
+    }
+  }
   /**
    * Create execution context
    */
@@ -32693,6 +32855,9 @@ Metadata: ${(0, import_utils33.safeStringify)(metadata)}`;
       if (details?.usage) {
         this.recordLLMUsage(span, details.usage);
       }
+      if (details?.providerMetadata !== void 0) {
+        this.recordProviderCost(span, details.providerMetadata);
+      }
       if (details?.finishReason) {
         span.setAttribute("llm.finish_reason", String(details.finishReason));
       }
@@ -32798,6 +32963,36 @@ Metadata: ${(0, import_utils33.safeStringify)(metadata)}`;
       span.setAttribute("llm.usage.total_tokens", totalTokens);
     }
   }
+  recordProviderCost(span, providerMetadata) {
+    const openRouterUsageCost = extractOpenRouterUsageCost(providerMetadata);
+    if (!openRouterUsageCost) {
+      return;
+    }
+    if (openRouterUsageCost.cost !== void 0) {
+      span.setAttribute("usage.cost", openRouterUsageCost.cost);
+    }
+    if (openRouterUsageCost.isByok !== void 0) {
+      span.setAttribute("usage.is_byok", openRouterUsageCost.isByok);
+    }
+    if (openRouterUsageCost.upstreamInferenceCost !== void 0) {
+      span.setAttribute(
+        "usage.cost_details.upstream_inference_cost",
+        openRouterUsageCost.upstreamInferenceCost
+      );
+    }
+    if (openRouterUsageCost.upstreamInferenceInputCost !== void 0) {
+      span.setAttribute(
+        "usage.cost_details.upstream_inference_input_cost",
+        openRouterUsageCost.upstreamInferenceInputCost
+      );
+    }
+    if (openRouterUsageCost.upstreamInferenceOutputCost !== void 0) {
+      span.setAttribute(
+        "usage.cost_details.upstream_inference_output_cost",
+        openRouterUsageCost.upstreamInferenceOutputCost
+      );
+    }
+  }
   createEvalHost() {
     return {
       id: this.id,
@@ -33002,7 +33197,8 @@ Metadata: ${(0, import_utils33.safeStringify)(metadata)}`;
           }
           finalizeLLMSpan(import_api16.SpanStatusCode.OK, {
             usage: resolvedUsage,
-            finishReason: result.finishReason
+            finishReason: result.finishReason,
+            providerMetadata: result.providerMetadata
           });
           return title || null;
         } catch (error) {
@@ -33651,6 +33847,9 @@ ${retrieverContext}`;
     return true;
   }
   isRetryableError(error) {
+    if (isVoltAgentError(error) && error.code === "STRUCTURED_OUTPUT_NOT_GENERATED") {
+      return true;
+    }
     const retryable = error?.isRetryable;
     if (typeof retryable === "boolean") {
       return retryable;
@@ -34779,7 +34978,8 @@ ${retrieverContext}`;
       const resolvedUsage = response.usage ? await Promise.resolve(response.usage) : void 0;
       finalizeLLMSpan(import_api16.SpanStatusCode.OK, {
         usage: resolvedUsage,
-        finishReason: response.finishReason
+        finishReason: response.finishReason,
+        providerMetadata: response.providerMetadata
       });
       return response;
     } catch (error) {
@@ -35796,6 +35996,10 @@ ${retrieverContext}`;
       reasoningTokens: resolvedUsage.reasoningTokens
     });
   }
+  recordRootSpanUsageAndProviderCost(traceContext, usage, providerMetadata) {
+    this.setTraceContextUsage(traceContext, usage);
+    this.recordProviderCost(traceContext.getRootSpan(), providerMetadata);
+  }
   /**
    * Create working memory tools if configured
    */
@@ -41315,6 +41519,9 @@ var TriggerRegistry = class _TriggerRegistry {
   }
 };
+// src/voltagent.ts
+var import_ai8 = require("ai");
 // src/utils/voltops-validation.ts
 function isValidVoltOpsKeys(publicKey, secretKey) {
   if (!publicKey || !secretKey) {
@@ -41635,9 +41842,12 @@ var VoltAgent = class {
     process.once("SIGTERM", () => handleSignal("SIGTERM"));
     process.once("SIGINT", () => handleSignal("SIGINT"));
     process.on("unhandledRejection", (reason) => {
+      const isStructuredOutputWrapperError = isVoltAgentError(reason) && reason.code === "STRUCTURED_OUTPUT_NOT_GENERATED";
+      const isNoOutputGeneratedError = isStructuredOutputWrapperError || reason instanceof import_ai8.NoOutputGeneratedError || reason instanceof Error && reason.name === "AI_NoOutputGeneratedError";
       this.logger.error("[VoltAgent] Unhandled Promise Rejection:", {
         reason: reason instanceof Error ? reason.message : reason,
-        stack: reason instanceof Error ? reason.stack : void 0
+        stack: reason instanceof Error ? reason.stack : void 0,
+        hint: isNoOutputGeneratedError ? "Structured output was requested but no final output was generated. If tools are enabled, ensure a final schema-matching response or split into two calls." : void 0
       });
     });
   }
@@ -41943,7 +42153,7 @@ var VoltAgent = class {
 // src/index.ts
 var import_utils40 = require("@voltagent/internal/utils");
-var import_ai8 = require("ai");
+var import_ai9 = require("ai");
 // Annotate the CommonJS export names for ESM import in node:
 0 && (module.exports = {
   A2AServerRegistry,