@hebo-ai/gateway 0.5.1 → 0.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@hebo-ai/gateway",
3
- "version": "0.5.1",
3
+ "version": "0.5.2",
4
4
  "description": "AI gateway as a framework. For full control over models, routing & lifecycle. OpenAI-compatible /chat/completions, /embeddings & /models.",
5
5
  "keywords": [
6
6
  "ai",
@@ -36,7 +36,7 @@ import {
36
36
  getChatRequestAttributes,
37
37
  getChatResponseAttributes,
38
38
  } from "./otel";
39
- import { ChatCompletionsBodySchema } from "./schema";
39
+ import { ChatCompletionsBodySchema, type ChatCompletionsBody } from "./schema";
40
40
 
41
41
  export const chatCompletions = (config: GatewayConfig): Endpoint => {
42
42
  const hooks = config.hooks;
@@ -57,6 +57,7 @@ export const chatCompletions = (config: GatewayConfig): Endpoint => {
57
57
  } catch {
58
58
  throw new GatewayError("Invalid JSON", 400);
59
59
  }
60
+ logger.trace({ requestId: ctx.requestId, body: ctx.body }, "[chat] ChatCompletionsBody");
60
61
  addSpanEvent("hebo.request.deserialized");
61
62
 
62
63
  const parsed = ChatCompletionsBodySchema.safeParse(ctx.body);
@@ -68,7 +69,8 @@ export const chatCompletions = (config: GatewayConfig): Endpoint => {
68
69
  addSpanEvent("hebo.request.parsed");
69
70
 
70
71
  if (hooks?.before) {
71
- ctx.body = (await hooks.before(ctx as BeforeHookContext)) ?? ctx.body;
72
+ ctx.body =
73
+ ((await hooks.before(ctx as BeforeHookContext)) as ChatCompletionsBody) ?? ctx.body;
72
74
  addSpanEvent("hebo.hooks.before.completed");
73
75
  }
74
76
 
@@ -110,7 +112,7 @@ export const chatCompletions = (config: GatewayConfig): Endpoint => {
110
112
  "[chat] AI SDK options",
111
113
  );
112
114
  addSpanEvent("hebo.options.prepared");
113
- setSpanAttributes(getChatRequestAttributes(inputs, genAiSignalLevel));
115
+ setSpanAttributes(getChatRequestAttributes(ctx.body, genAiSignalLevel));
114
116
 
115
117
  // Build middleware chain (model -> forward params -> provider).
116
118
  const languageModelWithMiddleware = wrapLanguageModel({
@@ -138,6 +140,10 @@ export const chatCompletions = (config: GatewayConfig): Endpoint => {
138
140
  res as unknown as GenerateTextResult<ToolSet, Output.Output>,
139
141
  ctx.resolvedModelId!,
140
142
  );
143
+ logger.trace(
144
+ { requestId: ctx.requestId, result: streamResult },
145
+ "[chat] ChatCompletions",
146
+ );
141
147
  addSpanEvent("hebo.result.transformed");
142
148
 
143
149
  const genAiResponseAttrs = getChatResponseAttributes(streamResult, genAiSignalLevel);
@@ -180,6 +186,7 @@ export const chatCompletions = (config: GatewayConfig): Endpoint => {
180
186
 
181
187
  // Transform result.
182
188
  ctx.result = toChatCompletions(result, ctx.resolvedModelId);
189
+ logger.trace({ requestId: ctx.requestId, result: ctx.result }, "[chat] ChatCompletions");
183
190
  addSpanEvent("hebo.result.transformed");
184
191
 
185
192
  const genAiResponseAttrs = getChatResponseAttributes(ctx.result, genAiSignalLevel);
@@ -29,7 +29,7 @@ import {
29
29
  getEmbeddingsRequestAttributes,
30
30
  getEmbeddingsResponseAttributes,
31
31
  } from "./otel";
32
- import { EmbeddingsBodySchema } from "./schema";
32
+ import { EmbeddingsBodySchema, type EmbeddingsBody } from "./schema";
33
33
 
34
34
  export const embeddings = (config: GatewayConfig): Endpoint => {
35
35
  const hooks = config.hooks;
@@ -50,6 +50,7 @@ export const embeddings = (config: GatewayConfig): Endpoint => {
50
50
  } catch {
51
51
  throw new GatewayError("Invalid JSON", 400);
52
52
  }
53
+ logger.trace({ requestId: ctx.requestId, body: ctx.body }, "[embeddings] EmbeddingsBody");
53
54
  addSpanEvent("hebo.request.deserialized");
54
55
 
55
56
  const parsed = EmbeddingsBodySchema.safeParse(ctx.body);
@@ -61,7 +62,7 @@ export const embeddings = (config: GatewayConfig): Endpoint => {
61
62
  addSpanEvent("hebo.request.parsed");
62
63
 
63
64
  if (hooks?.before) {
64
- ctx.body = (await hooks.before(ctx as BeforeHookContext)) ?? ctx.body;
65
+ ctx.body = ((await hooks.before(ctx as BeforeHookContext)) as EmbeddingsBody) ?? ctx.body;
65
66
  addSpanEvent("hebo.hooks.before.completed");
66
67
  }
67
68
 
@@ -100,7 +101,7 @@ export const embeddings = (config: GatewayConfig): Endpoint => {
100
101
  "[embeddings] AI SDK options",
101
102
  );
102
103
  addSpanEvent("hebo.options.prepared");
103
- setSpanAttributes(getEmbeddingsRequestAttributes(inputs, genAiSignalLevel));
104
+ setSpanAttributes(getEmbeddingsRequestAttributes(ctx.body, genAiSignalLevel));
104
105
 
105
106
  // Build middleware chain (model -> forward params -> provider).
106
107
  const embeddingModelWithMiddleware = wrapEmbeddingModel({
@@ -121,6 +122,7 @@ export const embeddings = (config: GatewayConfig): Endpoint => {
121
122
 
122
123
  // Transform result.
123
124
  ctx.result = toEmbeddings(result, ctx.modelId);
125
+ logger.trace({ requestId: ctx.requestId, result: ctx.result }, "[embeddings] Embeddings");
124
126
  addSpanEvent("hebo.result.transformed");
125
127
  const genAiResponseAttrs = getEmbeddingsResponseAttributes(ctx.result, genAiSignalLevel);
126
128
  recordTokenUsage(genAiResponseAttrs, genAiGeneralAttrs, genAiSignalLevel);
@@ -0,0 +1,37 @@
1
+ import type { EmbeddingModelMiddleware, LanguageModelMiddleware } from "ai";
2
+
3
+ import { logger } from "../logger";
4
+
5
+ export const debugLanguageFinalParamsMiddleware: LanguageModelMiddleware = {
6
+ specificationVersion: "v3",
7
+ // eslint-disable-next-line require-await
8
+ transformParams: async ({ params, model }) => {
9
+ logger.trace(
10
+ {
11
+ kind: "text",
12
+ modelId: model.modelId,
13
+ providerId: model.provider,
14
+ params,
15
+ },
16
+ "[middleware] final params",
17
+ );
18
+ return params;
19
+ },
20
+ };
21
+
22
+ export const debugEmbeddingFinalParamsMiddleware: EmbeddingModelMiddleware = {
23
+ specificationVersion: "v3",
24
+ // eslint-disable-next-line require-await
25
+ transformParams: async ({ params, model }) => {
26
+ logger.trace(
27
+ {
28
+ kind: "embedding",
29
+ modelId: model.modelId,
30
+ providerId: model.provider,
31
+ params,
32
+ },
33
+ "[middleware] final params",
34
+ );
35
+ return params;
36
+ },
37
+ };
@@ -6,6 +6,7 @@ import type { ProviderId } from "../providers/types";
6
6
  import { logger } from "../logger";
7
7
  import { addSpanEvent } from "../telemetry/span";
8
8
  import { forwardParamsEmbeddingMiddleware, forwardParamsMiddleware } from "./common";
9
+ import { debugEmbeddingFinalParamsMiddleware, debugLanguageFinalParamsMiddleware } from "./debug";
9
10
 
10
11
  type MiddlewareEntries = {
11
12
  language?: LanguageModelMiddleware[];
@@ -110,6 +111,9 @@ class ModelMiddlewareMatcher {
110
111
  if (providerId) {
111
112
  out.push(...this.collect(this.provider.match(providerId), kind));
112
113
  }
114
+ out.push(
115
+ kind === "text" ? debugLanguageFinalParamsMiddleware : debugEmbeddingFinalParamsMiddleware,
116
+ );
113
117
 
114
118
  if (this.cache.size >= ModelMiddlewareMatcher.MAX_CACHE) {
115
119
  let n = Math.ceil(ModelMiddlewareMatcher.MAX_CACHE * 0.2);