@hebo-ai/gateway 0.6.2 → 0.8.0-rc0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +134 -7
- package/package.json +46 -1
- package/dist/config.d.ts +0 -2
- package/dist/config.js +0 -81
- package/dist/endpoints/chat-completions/converters.d.ts +0 -43
- package/dist/endpoints/chat-completions/converters.js +0 -625
- package/dist/endpoints/chat-completions/handler.d.ts +0 -2
- package/dist/endpoints/chat-completions/handler.js +0 -149
- package/dist/endpoints/chat-completions/index.d.ts +0 -4
- package/dist/endpoints/chat-completions/index.js +0 -4
- package/dist/endpoints/chat-completions/otel.d.ts +0 -5
- package/dist/endpoints/chat-completions/otel.js +0 -171
- package/dist/endpoints/chat-completions/schema.d.ts +0 -1188
- package/dist/endpoints/chat-completions/schema.js +0 -298
- package/dist/endpoints/embeddings/converters.d.ts +0 -10
- package/dist/endpoints/embeddings/converters.js +0 -31
- package/dist/endpoints/embeddings/handler.d.ts +0 -2
- package/dist/endpoints/embeddings/handler.js +0 -104
- package/dist/endpoints/embeddings/index.d.ts +0 -4
- package/dist/endpoints/embeddings/index.js +0 -4
- package/dist/endpoints/embeddings/otel.d.ts +0 -5
- package/dist/endpoints/embeddings/otel.js +0 -29
- package/dist/endpoints/embeddings/schema.d.ts +0 -44
- package/dist/endpoints/embeddings/schema.js +0 -29
- package/dist/endpoints/models/converters.d.ts +0 -6
- package/dist/endpoints/models/converters.js +0 -42
- package/dist/endpoints/models/handler.d.ts +0 -2
- package/dist/endpoints/models/handler.js +0 -29
- package/dist/endpoints/models/index.d.ts +0 -3
- package/dist/endpoints/models/index.js +0 -3
- package/dist/endpoints/models/schema.d.ts +0 -42
- package/dist/endpoints/models/schema.js +0 -31
- package/dist/errors/ai-sdk.d.ts +0 -2
- package/dist/errors/ai-sdk.js +0 -52
- package/dist/errors/gateway.d.ts +0 -5
- package/dist/errors/gateway.js +0 -13
- package/dist/errors/openai.d.ts +0 -20
- package/dist/errors/openai.js +0 -40
- package/dist/errors/utils.d.ts +0 -22
- package/dist/errors/utils.js +0 -44
- package/dist/gateway.d.ts +0 -9
- package/dist/gateway.js +0 -40
- package/dist/index.d.ts +0 -14
- package/dist/index.js +0 -13
- package/dist/lifecycle.d.ts +0 -2
- package/dist/lifecycle.js +0 -98
- package/dist/logger/default.d.ts +0 -4
- package/dist/logger/default.js +0 -81
- package/dist/logger/index.d.ts +0 -11
- package/dist/logger/index.js +0 -25
- package/dist/middleware/common.d.ts +0 -12
- package/dist/middleware/common.js +0 -146
- package/dist/middleware/debug.d.ts +0 -3
- package/dist/middleware/debug.js +0 -27
- package/dist/middleware/matcher.d.ts +0 -28
- package/dist/middleware/matcher.js +0 -118
- package/dist/middleware/utils.d.ts +0 -2
- package/dist/middleware/utils.js +0 -24
- package/dist/models/amazon/index.d.ts +0 -2
- package/dist/models/amazon/index.js +0 -2
- package/dist/models/amazon/middleware.d.ts +0 -3
- package/dist/models/amazon/middleware.js +0 -68
- package/dist/models/amazon/presets.d.ts +0 -345
- package/dist/models/amazon/presets.js +0 -80
- package/dist/models/anthropic/index.d.ts +0 -2
- package/dist/models/anthropic/index.js +0 -2
- package/dist/models/anthropic/middleware.d.ts +0 -5
- package/dist/models/anthropic/middleware.js +0 -127
- package/dist/models/anthropic/presets.d.ts +0 -711
- package/dist/models/anthropic/presets.js +0 -135
- package/dist/models/catalog.d.ts +0 -4
- package/dist/models/catalog.js +0 -8
- package/dist/models/cohere/index.d.ts +0 -2
- package/dist/models/cohere/index.js +0 -2
- package/dist/models/cohere/middleware.d.ts +0 -3
- package/dist/models/cohere/middleware.js +0 -62
- package/dist/models/cohere/presets.d.ts +0 -411
- package/dist/models/cohere/presets.js +0 -134
- package/dist/models/google/index.d.ts +0 -2
- package/dist/models/google/index.js +0 -2
- package/dist/models/google/middleware.d.ts +0 -8
- package/dist/models/google/middleware.js +0 -111
- package/dist/models/google/presets.d.ts +0 -375
- package/dist/models/google/presets.js +0 -82
- package/dist/models/meta/index.d.ts +0 -1
- package/dist/models/meta/index.js +0 -1
- package/dist/models/meta/presets.d.ts +0 -483
- package/dist/models/meta/presets.js +0 -95
- package/dist/models/openai/index.d.ts +0 -2
- package/dist/models/openai/index.js +0 -2
- package/dist/models/openai/middleware.d.ts +0 -4
- package/dist/models/openai/middleware.js +0 -88
- package/dist/models/openai/presets.d.ts +0 -959
- package/dist/models/openai/presets.js +0 -213
- package/dist/models/types.d.ts +0 -20
- package/dist/models/types.js +0 -84
- package/dist/models/voyage/index.d.ts +0 -2
- package/dist/models/voyage/index.js +0 -2
- package/dist/models/voyage/middleware.d.ts +0 -2
- package/dist/models/voyage/middleware.js +0 -19
- package/dist/models/voyage/presets.d.ts +0 -436
- package/dist/models/voyage/presets.js +0 -85
- package/dist/providers/anthropic/canonical.d.ts +0 -3
- package/dist/providers/anthropic/canonical.js +0 -9
- package/dist/providers/anthropic/index.d.ts +0 -1
- package/dist/providers/anthropic/index.js +0 -1
- package/dist/providers/bedrock/canonical.d.ts +0 -17
- package/dist/providers/bedrock/canonical.js +0 -61
- package/dist/providers/bedrock/index.d.ts +0 -2
- package/dist/providers/bedrock/index.js +0 -2
- package/dist/providers/bedrock/middleware.d.ts +0 -4
- package/dist/providers/bedrock/middleware.js +0 -104
- package/dist/providers/cohere/canonical.d.ts +0 -3
- package/dist/providers/cohere/canonical.js +0 -17
- package/dist/providers/cohere/index.d.ts +0 -1
- package/dist/providers/cohere/index.js +0 -1
- package/dist/providers/groq/canonical.d.ts +0 -3
- package/dist/providers/groq/canonical.js +0 -12
- package/dist/providers/groq/index.d.ts +0 -1
- package/dist/providers/groq/index.js +0 -1
- package/dist/providers/openai/canonical.d.ts +0 -3
- package/dist/providers/openai/canonical.js +0 -8
- package/dist/providers/openai/index.d.ts +0 -1
- package/dist/providers/openai/index.js +0 -1
- package/dist/providers/registry.d.ts +0 -24
- package/dist/providers/registry.js +0 -103
- package/dist/providers/types.d.ts +0 -7
- package/dist/providers/types.js +0 -11
- package/dist/providers/vertex/canonical.d.ts +0 -3
- package/dist/providers/vertex/canonical.js +0 -8
- package/dist/providers/vertex/index.d.ts +0 -1
- package/dist/providers/vertex/index.js +0 -1
- package/dist/providers/voyage/canonical.d.ts +0 -3
- package/dist/providers/voyage/canonical.js +0 -7
- package/dist/providers/voyage/index.d.ts +0 -1
- package/dist/providers/voyage/index.js +0 -1
- package/dist/telemetry/ai-sdk.d.ts +0 -2
- package/dist/telemetry/ai-sdk.js +0 -31
- package/dist/telemetry/baggage.d.ts +0 -1
- package/dist/telemetry/baggage.js +0 -24
- package/dist/telemetry/fetch.d.ts +0 -2
- package/dist/telemetry/fetch.js +0 -49
- package/dist/telemetry/gen-ai.d.ts +0 -6
- package/dist/telemetry/gen-ai.js +0 -78
- package/dist/telemetry/http.d.ts +0 -3
- package/dist/telemetry/http.js +0 -54
- package/dist/telemetry/index.d.ts +0 -1
- package/dist/telemetry/index.js +0 -1
- package/dist/telemetry/memory.d.ts +0 -2
- package/dist/telemetry/memory.js +0 -43
- package/dist/telemetry/span.d.ts +0 -13
- package/dist/telemetry/span.js +0 -60
- package/dist/telemetry/stream.d.ts +0 -3
- package/dist/telemetry/stream.js +0 -58
- package/dist/types.d.ts +0 -176
- package/dist/types.js +0 -1
- package/dist/utils/env.d.ts +0 -2
- package/dist/utils/env.js +0 -7
- package/dist/utils/headers.d.ts +0 -4
- package/dist/utils/headers.js +0 -22
- package/dist/utils/preset.d.ts +0 -10
- package/dist/utils/preset.js +0 -42
- package/dist/utils/request.d.ts +0 -2
- package/dist/utils/request.js +0 -43
- package/dist/utils/response.d.ts +0 -3
- package/dist/utils/response.js +0 -70
- package/dist/utils/url.d.ts +0 -4
- package/dist/utils/url.js +0 -21
package/dist/telemetry/memory.js
DELETED
|
@@ -1,43 +0,0 @@
|
|
|
1
|
-
import { metrics } from "@opentelemetry/api";
|
|
2
|
-
/** Attributes attached to every observation recorded by this module. */
const defaultHeapSpaceAttrs = { "v8js.heap.space.name": "total" };

/** Flipped to true once the gauges exist so later registration calls are no-ops. */
let registered = false;

/** Resolves the gateway meter on demand instead of at module load. */
function getMeter() {
  return metrics.getMeter("@hebo/gateway");
}

/** Reports whether a signal level is "recommended" or "full". */
function isEnabled(level) {
  return level === "full" || level === "recommended";
}
|
|
6
|
-
/**
 * Reads the current process memory usage and hands `heapUsed` and `rss` to
 * the callback. Does nothing when `process.memoryUsage` is unavailable,
 * throws, or returns a falsy value.
 *
 * @param {(heapUsed: number, rss: number) => void} observe
 */
const observeMemory = (observe) => {
  const readUsage = () => {
    try {
      return globalThis.process?.memoryUsage?.();
    } catch {
      // Treat a failing runtime API the same as a missing one.
      return undefined;
    }
  };
  const snapshot = readUsage();
  if (snapshot) {
    observe(snapshot.heapUsed, snapshot.rss);
  }
};
|
|
18
|
-
/**
 * Registers the two memory gauges on the gateway meter.
 *
 * Registration happens at most once, and only for the "recommended" and
 * "full" signal levels. Each gauge callback samples memory through
 * `observeMemory` and records one value with `defaultHeapSpaceAttrs`.
 *
 * @param {string | undefined} level telemetry signal level
 */
export const observeV8jsMemoryMetrics = (level) => {
  if (!isEnabled(level) || registered) {
    return;
  }
  registered = true;

  const meter = getMeter();
  // One entry per gauge: the metric name, its description, and which of the
  // two sampled values (heapUsed, rss) it reports.
  const gauges = [
    {
      name: "v8js.memory.heap.used",
      description: "Used bytes in the V8 heap",
      select: (heapUsed) => heapUsed,
    },
    {
      name: "v8js.memory.heap.space.physical_size",
      description: "Physical bytes allocated for the V8 heap space",
      select: (_, rss) => rss,
    },
  ];

  for (const { name, description, select } of gauges) {
    meter.createObservableGauge(name, { description, unit: "By" }).addCallback((result) => {
      observeMemory((heapUsed, rss) => {
        result.observe(select(heapUsed, rss), defaultHeapSpaceAttrs);
      });
    });
  }
};
|
package/dist/telemetry/span.d.ts
DELETED
|
@@ -1,13 +0,0 @@
|
|
|
1
|
-
import type { Attributes, SpanOptions, Tracer } from "@opentelemetry/api";
|
|
2
|
-
import type { TelemetrySignalLevel } from "../types";
|
|
3
|
-
/**
 * Installs the tracer used by `startSpan` / `withSpan`. When no tracer is
 * passed, the implementation falls back to the global "@hebo/gateway" tracer.
 */
export declare const setSpanTracer: (tracer?: Tracer) => void;
/**
 * Turns span events on for the "recommended" and "full" levels and off for
 * every other value.
 */
export declare const setSpanEventsEnabled: (level?: TelemetrySignalLevel) => void;
/**
 * Starts a span and returns it extended with gateway helpers.
 * While no tracer is configured the result is a wrapper around an invalid
 * span context whose helpers do nothing and whose `isExisting` is `true`.
 */
export declare const startSpan: (name: string, options?: SpanOptions) => import("@opentelemetry/api").Span & {
    /** Runs `fn` with this span set as the active span. */
    runWithContext: <T>(fn: () => Promise<T> | T) => T | Promise<T>;
    /** Records the error on the span and marks the span status as ERROR. */
    recordError: (_error: unknown) => void;
    /** Ends the span. */
    finish: () => void;
    /** True when another span was already active at the time this one started. */
    isExisting: boolean;
};
/**
 * Runs `run` inside a new span: errors are recorded and rethrown, and the
 * span is always finished. Without a configured tracer `run` is called directly.
 */
export declare const withSpan: <T>(name: string, run: () => Promise<T> | T, options?: SpanOptions) => Promise<T>;
/** Adds an event to the active span; ignored while span events are disabled. */
export declare const addSpanEvent: (name: string, attributes?: Attributes) => void;
/** Sets attributes on the active span; ignored when `attributes` is omitted. */
export declare const setSpanAttributes: (attributes?: Attributes) => void;
|
package/dist/telemetry/span.js
DELETED
|
@@ -1,60 +0,0 @@
|
|
|
1
|
-
import { INVALID_SPAN_CONTEXT, SpanKind, SpanStatusCode, context, trace } from "@opentelemetry/api";
|
|
2
|
-
/** Tracer name used when `setSpanTracer` is called without an explicit tracer. */
const DEFAULT_TRACER_NAME = "@hebo/gateway";

/** Tracer used to start spans; stays undefined until `setSpanTracer` runs. */
let spanTracer;

/** Whether `addSpanEvent` forwards events to the active span. */
let spanEventsEnabled = false;

/** Helper set merged onto the span returned while no tracer is configured. */
const NOOP_SPAN = {
  runWithContext(fn) {
    return fn();
  },
  recordError(_error) {},
  finish() {},
  isExisting: true,
};
|
|
11
|
-
/**
 * Stores the tracer used for gateway spans.
 *
 * @param {import("@opentelemetry/api").Tracer} [tracer] custom tracer; when
 *   null or undefined the global tracer named DEFAULT_TRACER_NAME is used.
 */
export const setSpanTracer = (tracer) => {
  if (tracer === null || tracer === undefined) {
    spanTracer = trace.getTracer(DEFAULT_TRACER_NAME);
    return;
  }
  spanTracer = tracer;
};
|
|
14
|
-
/**
 * Enables span events for the "recommended" and "full" signal levels and
 * disables them for any other value.
 *
 * @param {string} [level] telemetry signal level
 */
export const setSpanEventsEnabled = (level) => {
  const wantsEvents = level === "full" || level === "recommended";
  spanEventsEnabled = wantsEvents;
};
|
|
17
|
-
/**
 * Starts a span under the currently active context and returns it extended
 * with `runWithContext`, `recordError`, `finish` and `isExisting`.
 *
 * The span kind defaults to INTERNAL when a span is already active and to
 * SERVER otherwise; a `kind` supplied through `options` overrides the default.
 * While no tracer is configured, a wrapper around INVALID_SPAN_CONTEXT
 * carrying the NOOP_SPAN helpers is returned instead.
 *
 * @param {string} name span name
 * @param {import("@opentelemetry/api").SpanOptions} [options]
 */
export const startSpan = (name, options) => {
  if (!spanTracer) {
    const inert = trace.wrapSpanContext(INVALID_SPAN_CONTEXT);
    return Object.assign(inert, NOOP_SPAN);
  }

  const parentContext = context.active();
  const activeSpan = trace.getActiveSpan();
  const defaultKind = activeSpan ? SpanKind.INTERNAL : SpanKind.SERVER;
  const span = spanTracer.startSpan(name, { kind: defaultKind, ...options }, parentContext);

  return Object.assign(span, {
    // Runs fn with the new span installed as the active span.
    runWithContext: (fn) => context.with(trace.setSpan(parentContext, span), fn),
    // Non-Error values are wrapped so the exception always carries a message.
    recordError: (error) => {
      const failure = error instanceof Error ? error : new Error(String(error));
      span.recordException(failure);
      span.setStatus({ code: SpanStatusCode.ERROR, message: failure.message });
    },
    finish: () => {
      span.end();
    },
    isExisting: Boolean(activeSpan),
  });
};
|
|
35
|
-
/**
 * Runs `run` inside a freshly started span.
 *
 * A thrown or rejected error is recorded on the span and rethrown unchanged;
 * the span is finished in every case. When no tracer is configured, `run` is
 * invoked directly without creating a span.
 *
 * @param {string} name span name
 * @param {() => unknown} run work to execute inside the span
 * @param {import("@opentelemetry/api").SpanOptions} [options]
 * @returns {Promise<unknown>} whatever `run` resolves to
 */
export const withSpan = async (name, run, options) => {
  if (!spanTracer) {
    return run();
  }

  const span = startSpan(name, options);
  try {
    const outcome = await span.runWithContext(run);
    return outcome;
  } catch (failure) {
    span.recordError(failure);
    throw failure;
  } finally {
    span.finish();
  }
};
|
|
51
|
-
/**
 * Adds an event to the active span. Does nothing while span events are
 * disabled or when there is no active span.
 *
 * @param {string} name event name
 * @param {import("@opentelemetry/api").Attributes} [attributes]
 */
export const addSpanEvent = (name, attributes) => {
  if (spanEventsEnabled) {
    const current = trace.getActiveSpan();
    current?.addEvent(name, attributes);
  }
};
|
|
56
|
-
/**
 * Sets attributes on the active span. Does nothing when `attributes` is
 * falsy or when there is no active span.
 *
 * @param {import("@opentelemetry/api").Attributes} [attributes]
 */
export const setSpanAttributes = (attributes) => {
  if (attributes) {
    const current = trace.getActiveSpan();
    current?.setAttributes(attributes);
  }
};
|
package/dist/telemetry/stream.js
DELETED
|
@@ -1,58 +0,0 @@
|
|
|
1
|
-
import { toOpenAIError } from "../errors/openai";
|
|
2
|
-
/** True for Error instances and for non-null objects that have an `error` property. */
const isErrorChunk = (v) => {
  if (v instanceof Error) {
    return true;
  }
  return typeof v === "object" && v !== null && "error" in v;
};

/**
 * Re-emits every chunk of `src` on a new ReadableStream and reports how the
 * stream ended through `hooks.onDone(status, reason)`, which fires at most once:
 *
 * - 200 when the source is read to the end;
 * - 422 or 502 when an error chunk is seen (422 if `toOpenAIError` classifies
 *   it as "invalid_request_error"); the chunk is still forwarded first;
 * - 502 when reading throws; the converted error is enqueued if possible;
 * - 499 when the consumer cancels the returned stream.
 *
 * For every outcome other than 200 the source reader is cancelled.
 *
 * @param {ReadableStream} src source stream
 * @param {{ onDone?: (status: number, reason?: unknown) => void }} hooks
 * @returns {ReadableStream}
 */
export const wrapStream = (src, hooks) => {
  let reader;
  let finished = false;

  // Best-effort cancellation of the source; rejections are ignored on purpose.
  const cancelSource = (reason) => {
    reader?.cancel(reason).catch(() => { });
  };

  const done = (controller, status, reason) => {
    if (finished) {
      return;
    }
    finished = true;
    hooks.onDone?.(status, reason);
    if (status !== 200) {
      cancelSource(reason);
    }
    try {
      controller.close();
    } catch {
      // The controller may already be closed or errored.
    }
  };

  return new ReadableStream({
    async start(controller) {
      reader = src.getReader();
      try {
        while (true) {
          // oxlint-disable-next-line no-await-in-loop, no-unsafe-assignment
          const chunk = await reader.read();
          if (chunk.done) {
            break;
          }
          controller.enqueue(chunk.value);
          if (!isErrorChunk(chunk.value)) {
            continue;
          }
          const { type } = toOpenAIError(chunk.value).error;
          done(controller, type === "invalid_request_error" ? 422 : 502, chunk.value);
          return;
        }
        done(controller, 200);
      } catch (err) {
        try {
          controller.enqueue(toOpenAIError(err));
        } catch {
          // Enqueue fails once the stream is closed; the status is still reported.
        }
        done(controller, 502, err);
      } finally {
        try {
          reader?.releaseLock();
        } catch {
          // Releasing can throw; there is nothing left to clean up.
        }
      }
    },
    cancel(reason) {
      if (finished) {
        return;
      }
      finished = true;
      hooks.onDone?.(499, reason);
      cancelSource(reason);
    },
  });
};
|
package/dist/types.d.ts
DELETED
|
@@ -1,176 +0,0 @@
|
|
|
1
|
-
import type { ProviderV3 } from "@ai-sdk/provider";
|
|
2
|
-
import type { Tracer } from "@opentelemetry/api";
|
|
3
|
-
import type { ChatCompletions, ChatCompletionsBody, ChatCompletionsChunk } from "./endpoints/chat-completions/schema";
|
|
4
|
-
import type { Embeddings, EmbeddingsBody } from "./endpoints/embeddings/schema";
|
|
5
|
-
import type { Model, ModelList } from "./endpoints/models";
|
|
6
|
-
import type { Logger, LoggerConfig } from "./logger";
|
|
7
|
-
import type { ModelCatalog, ModelId } from "./models/types";
|
|
8
|
-
import type { ProviderId, ProviderRegistry } from "./providers/types";
|
|
9
|
-
/**
|
|
10
|
-
* Per-request context shared across handlers and hooks.
|
|
11
|
-
*/
|
|
12
|
-
export type GatewayContext = {
|
|
13
|
-
/**
|
|
14
|
-
* Mutable bag for passing data between hooks.
|
|
15
|
-
*/
|
|
16
|
-
state: Record<string, unknown>;
|
|
17
|
-
/**
|
|
18
|
-
* Provider registry from config.
|
|
19
|
-
*/
|
|
20
|
-
providers: ProviderRegistry;
|
|
21
|
-
/**
|
|
22
|
-
* Model catalog from config.
|
|
23
|
-
*/
|
|
24
|
-
models: ModelCatalog;
|
|
25
|
-
/**
|
|
26
|
-
* Incoming request for the handler.
|
|
27
|
-
*/
|
|
28
|
-
request: Request;
|
|
29
|
-
/**
|
|
30
|
-
* Resolved request ID for logging and telemetry.
|
|
31
|
-
*/
|
|
32
|
-
requestId: string;
|
|
33
|
-
/**
|
|
34
|
-
* Parsed body from the request.
|
|
35
|
-
*/
|
|
36
|
-
body?: ChatCompletionsBody | EmbeddingsBody;
|
|
37
|
-
/**
|
|
38
|
-
* Incoming model ID.
|
|
39
|
-
*/
|
|
40
|
-
modelId?: ModelId;
|
|
41
|
-
/**
|
|
42
|
-
* Resolved model ID.
|
|
43
|
-
*/
|
|
44
|
-
resolvedModelId?: ModelId;
|
|
45
|
-
/**
|
|
46
|
-
* Operation type.
|
|
47
|
-
*/
|
|
48
|
-
operation?: "chat" | "embeddings" | "models";
|
|
49
|
-
/**
|
|
50
|
-
* Resolved provider instance.
|
|
51
|
-
*/
|
|
52
|
-
provider?: ProviderV3;
|
|
53
|
-
/**
|
|
54
|
-
* Resolved provider ID.
|
|
55
|
-
*/
|
|
56
|
-
resolvedProviderId?: ProviderId;
|
|
57
|
-
/**
|
|
58
|
-
* Result returned by the handler (pre-response).
|
|
59
|
-
*/
|
|
60
|
-
result?: ChatCompletions | ReadableStream<ChatCompletionsChunk | Error> | Embeddings | Model | ModelList;
|
|
61
|
-
/**
|
|
62
|
-
* Response object returned by the handler.
|
|
63
|
-
*/
|
|
64
|
-
response?: Response;
|
|
65
|
-
};
|
|
66
|
-
/**
|
|
67
|
-
* Hook context: all fields readonly except `state`.
|
|
68
|
-
*/
|
|
69
|
-
export type HookContext = Omit<Readonly<GatewayContext>, "state"> & {
|
|
70
|
-
state: GatewayContext["state"];
|
|
71
|
-
};
|
|
72
|
-
/** HookContext in which the listed keys are required instead of optional. */
type RequiredHookContext<K extends keyof GatewayContext> = Omit<HookContext, K> & Required<Pick<HookContext, K>>;
/** Context passed to `onRequest`: `request` is guaranteed. */
export type OnRequestHookContext = RequiredHookContext<"request">;
/** Context passed to `before`: adds `operation` and `body`. */
export type BeforeHookContext = RequiredHookContext<"request" | "operation" | "body">;
/** Context passed to `resolveModelId`: adds `modelId`. */
export type ResolveModelHookContext = RequiredHookContext<"request" | "operation" | "body" | "modelId">;
/** Context passed to `resolveProvider`: adds `resolvedModelId`. */
export type ResolveProviderHookContext = RequiredHookContext<"request" | "operation" | "body" | "modelId" | "resolvedModelId">;
/** Context passed to `after`: adds `provider`, `resolvedProviderId` and `result`. */
export type AfterHookContext = RequiredHookContext<"request" | "operation" | "body" | "modelId" | "resolvedModelId" | "provider" | "resolvedProviderId" | "result">;
/** Context passed to `onResponse`: `request` and `response` are guaranteed. */
export type OnResponseHookContext = RequiredHookContext<"request" | "response">;
|
|
79
|
-
/**
|
|
80
|
-
* Hooks to plug into the gateway lifecycle.
|
|
81
|
-
*/
|
|
82
|
-
export type GatewayHooks = {
|
|
83
|
-
/**
|
|
84
|
-
* Runs before any endpoint handler logic.
|
|
85
|
-
* @returns Optional Response to short-circuit the request.
|
|
86
|
-
*/
|
|
87
|
-
onRequest?: (ctx: OnRequestHookContext) => void | Response | Promise<void | Response>;
|
|
88
|
-
/**
|
|
89
|
-
* Runs after request JSON is parsed and validated for chat completions / embeddings.
|
|
90
|
-
* @returns Replacement parsed body, or undefined to keep original.
|
|
91
|
-
*/
|
|
92
|
-
before?: (ctx: BeforeHookContext) => void | ChatCompletionsBody | EmbeddingsBody | Promise<void | ChatCompletionsBody | EmbeddingsBody>;
|
|
93
|
-
/**
|
|
94
|
-
* Maps a user-provided model ID or alias to a canonical ID.
|
|
95
|
-
* @returns Canonical model ID or undefined to keep original.
|
|
96
|
-
*/
|
|
97
|
-
resolveModelId?: (ctx: ResolveModelHookContext) => ModelId | void | Promise<ModelId | void>;
|
|
98
|
-
/**
|
|
99
|
-
* Picks a provider instance for the request.
|
|
100
|
-
* @returns ProviderV3 to override, or undefined to use default.
|
|
101
|
-
*/
|
|
102
|
-
resolveProvider?: (ctx: ResolveProviderHookContext) => ProviderV3 | void | Promise<ProviderV3 | void>;
|
|
103
|
-
/**
|
|
104
|
-
* Runs after the endpoint handler.
|
|
105
|
-
* @returns Result to replace, or undefined to keep original.
|
|
106
|
-
*/
|
|
107
|
-
after?: (ctx: AfterHookContext) => void | ChatCompletions | ReadableStream<ChatCompletionsChunk | Error> | Embeddings | Promise<void | ChatCompletions | ReadableStream<ChatCompletionsChunk | Error> | Embeddings>;
|
|
108
|
-
/**
|
|
109
|
-
* Runs after the lifecycle has produced the final Response.
|
|
110
|
-
* @returns Replacement Response, or undefined to keep original.
|
|
111
|
-
*/
|
|
112
|
-
onResponse?: (ctx: OnResponseHookContext) => void | Response | Promise<void | Response>;
|
|
113
|
-
};
|
|
114
|
-
export type TelemetrySignalLevel = "off" | "required" | "recommended" | "full";
|
|
115
|
-
/**
|
|
116
|
-
* Main configuration object for the gateway.
|
|
117
|
-
*/
|
|
118
|
-
export type GatewayConfig = {
|
|
119
|
-
/**
|
|
120
|
-
* Optional base path the gateway is mounted under (e.g. "/v1/gateway").
|
|
121
|
-
*/
|
|
122
|
-
basePath?: string;
|
|
123
|
-
/**
|
|
124
|
-
* Provider registry keyed by canonical provider IDs.
|
|
125
|
-
*/
|
|
126
|
-
providers: ProviderRegistry;
|
|
127
|
-
/**
|
|
128
|
-
* Model catalog keyed by canonical model IDs.
|
|
129
|
-
*/
|
|
130
|
-
models: ModelCatalog;
|
|
131
|
-
/**
|
|
132
|
-
* Optional lifecycle hooks for routing, auth, and response shaping.
|
|
133
|
-
*/
|
|
134
|
-
hooks?: GatewayHooks;
|
|
135
|
-
/**
|
|
136
|
-
* Preferred logger configuration: custom logger or default logger settings.
|
|
137
|
-
*/
|
|
138
|
-
logger?: Logger | LoggerConfig | null;
|
|
139
|
-
/**
|
|
140
|
-
* Optional AI SDK telemetry configuration.
|
|
141
|
-
*/
|
|
142
|
-
telemetry?: {
|
|
143
|
-
/**
|
|
144
|
-
* Enable AI SDK OpenTelemetry instrumentation.
|
|
145
|
-
* Disabled by default.
|
|
146
|
-
*/
|
|
147
|
-
enabled?: boolean;
|
|
148
|
-
/**
|
|
149
|
-
* Optional custom OpenTelemetry tracer passed to AI SDK telemetry.
|
|
150
|
-
*/
|
|
151
|
-
tracer?: Tracer;
|
|
152
|
-
/**
|
|
153
|
-
* Telemetry signal levels by namespace.
|
|
154
|
-
* - off: disable the namespace
|
|
155
|
-
* - required: minimal baseline
|
|
156
|
-
* - recommended: practical defaults
|
|
157
|
-
* - full: include all available details
|
|
158
|
-
*/
|
|
159
|
-
signals?: {
|
|
160
|
-
gen_ai?: TelemetrySignalLevel;
|
|
161
|
-
http?: TelemetrySignalLevel;
|
|
162
|
-
hebo?: TelemetrySignalLevel;
|
|
163
|
-
};
|
|
164
|
-
};
|
|
165
|
-
};
|
|
166
|
-
/** Unique symbol key that brands a GatewayConfigParsed. */
export declare const kParsed: unique symbol;
/** A GatewayConfig carrying the `kParsed` brand. */
export type GatewayConfigParsed = GatewayConfig & {
    [kParsed]: true;
};
/** Anything that turns a Request (plus optional shared state) into a Response. */
export interface Endpoint {
    handler: (request: Request, state?: Record<string, unknown>) => Promise<Response>;
}
/** A gateway: itself an Endpoint, and also exposes its per-route endpoints. */
export interface HeboGateway<Routes extends Record<string, Endpoint>> extends Endpoint {
    routes: Routes;
}
|
|
176
|
-
export {};
|
package/dist/types.js
DELETED
|
@@ -1 +0,0 @@
|
|
|
1
|
-
/** Symbol key that brands a parsed gateway configuration object. */
export const kParsed = Symbol("hebo.gateway.parsed");
|
package/dist/utils/env.d.ts
DELETED
package/dist/utils/env.js
DELETED
|
@@ -1,7 +0,0 @@
|
|
|
1
|
-
/**
 * Reads NODE_ENV from `process.env` when a `process` global exists; otherwise
 * falls back to `globalThis.NODE_ENV`, then `globalThis.ENV.NODE_ENV`.
 */
const readNodeEnv = () => {
  if (typeof process !== "undefined") {
    // oxlint-disable-next-line no-unsafe-assignment
    return process.env?.NODE_ENV;
  }
  // oxlint-disable-next-line no-unsafe-member-access
  return globalThis.NODE_ENV ?? globalThis.ENV?.NODE_ENV;
};

/** Environment name, resolved once when the module is loaded. */
const NODE_ENV = readNodeEnv();

/** True when the resolved environment is exactly "production". */
export const isProduction = () => NODE_ENV === "production";

/** True when the resolved environment is exactly "test". */
export const isTest = () => NODE_ENV === "test";
|
package/dist/utils/headers.d.ts
DELETED
package/dist/utils/headers.js
DELETED
|
@@ -1,22 +0,0 @@
|
|
|
1
|
-
/** Lower-case name of the header that carries the request ID. */
export const REQUEST_ID_HEADER = "x-request-id";

/**
 * Extracts the request ID from a Request or from any object with a `headers`
 * property. `headers` may be a Headers instance, an array of
 * `[name, value]` pairs, or a plain object.
 *
 * Header names are matched case-insensitively for every shape. For plain
 * objects the exact lower-case key is tried first, then the own enumerable
 * keys are scanned so that e.g. `X-Request-Id` is also found.
 *
 * @param {Request | { headers?: unknown } | null | undefined} source
 * @returns the header value, or undefined when it is absent
 */
export const resolveRequestId = (source) => {
  if (!source) {
    return undefined;
  }
  if (source instanceof Request) {
    return source.headers.get(REQUEST_ID_HEADER) ?? undefined;
  }

  const headers = source.headers;
  if (!headers) {
    return undefined;
  }
  if (headers instanceof Headers) {
    return headers.get(REQUEST_ID_HEADER) ?? undefined;
  }

  if (Array.isArray(headers)) {
    for (const [key, value] of headers) {
      if (key.toLowerCase() === REQUEST_ID_HEADER) {
        return value;
      }
    }
    return undefined;
  }

  // Plain object: a lower-case key is the common case, so check it first.
  const exact = headers[REQUEST_ID_HEADER];
  if (exact !== undefined) {
    return exact;
  }
  // Plain objects keep the caller's casing, so match the remaining keys
  // case-insensitively, like the array branch above.
  for (const [key, value] of Object.entries(headers)) {
    if (key.toLowerCase() === REQUEST_ID_HEADER) {
      return value;
    }
  }
  return undefined;
};
|
package/dist/utils/preset.d.ts
DELETED
|
@@ -1,10 +0,0 @@
|
|
|
1
|
-
/**
 * Recursively optional version of T. Function types are kept as they are,
 * arrays become readonly arrays of DeepPartial elements, and every property
 * of an object type becomes optional.
 */
export type DeepPartial<T> = T extends (...args: unknown[]) => unknown ? T : T extends readonly (infer U)[] ? readonly DeepPartial<U>[] : T extends object ? {
    [K in keyof T]?: DeepPartial<T[K]>;
} : T;
/**
 * Deep merge where overrides win.
 * Arrays are replaced.
 */
export declare function deepMerge<A extends object, B extends object>(base: A, override?: B): A & B;
/**
 * A preset: called with an optional override, it returns a single-entry
 * record that maps `Id` to the base value combined with the override.
 */
export type Preset<Id extends string, T extends Record<string, unknown>, Base extends DeepPartial<T>> = <O extends DeepPartial<T>>(override?: O) => Record<Id, Base & O>;
/**
 * Creates a preset builder for the given ID union and value shape; the
 * builder takes an ID and a base value and returns a Preset.
 */
export declare function presetFor<Ids extends string, T extends Record<string, unknown>>(): <const Id extends Ids, const Base extends DeepPartial<T>>(id: Id, base: Base) => Preset<Id, T, Base>;
|
package/dist/utils/preset.js
DELETED
|
@@ -1,42 +0,0 @@
|
|
|
1
|
-
/**
 * True for objects whose prototype is `Object.prototype` or `null`.
 * Arrays, class instances, null and primitives are rejected.
 */
function isPlainObject(v) {
  if (!v || typeof v !== "object" || Array.isArray(v)) {
    return false;
  }
  // oxlint-disable-next-line no-unsafe-assignment
  const proto = Object.getPrototypeOf(v);
  return proto === Object.prototype || proto === null;
}

/**
 * Deep merge where overrides win.
 * Arrays are replaced.
 *
 * - A null or undefined override returns `base` unchanged.
 * - If either side is not a plain object, the override is returned as is.
 * - Override properties whose value is `undefined` are skipped.
 * - An own `__proto__` key in the override is ignored. Assigning it would go
 *   through the prototype setter and swap the merged object's prototype
 *   (possible when the override comes from `JSON.parse`).
 *
 * Neither input is mutated; a new object is returned whenever merging happens.
 *
 * @param {object} base
 * @param {object} [override]
 * @returns {object} merged value
 */
export function deepMerge(base, override) {
  if (override === null || override === undefined) {
    return base;
  }
  if (!isPlainObject(base) || !isPlainObject(override)) {
    return override;
  }

  const out = { ...base };
  for (const [key, ov] of Object.entries(override)) {
    if (ov === undefined) {
      continue;
    }
    if (key === "__proto__") {
      // Never let an override reach the prototype setter.
      continue;
    }
    const bv = out[key];
    // Only plain-object pairs are merged recursively; arrays and all other
    // values replace the base value outright.
    out[key] = isPlainObject(bv) && isPlainObject(ov) ? deepMerge(bv, ov) : ov;
  }
  return out;
}
|
|
35
|
-
/**
 * Returns a preset builder. The builder takes an `id` and a `base` value and
 * produces a function that deep-merges an optional override into the base
 * and returns the result as a single-entry object keyed by `id`.
 */
export function presetFor() {
  return function preset(id, base) {
    // A missing override is treated as an empty object.
    return (override) => ({ [id]: deepMerge(base, override ?? {}) });
  };
}
|
package/dist/utils/request.d.ts
DELETED
package/dist/utils/request.js
DELETED
|
@@ -1,43 +0,0 @@
|
|
|
1
|
-
import pkg from "../../package.json" with { type: "json" };
|
|
2
|
-
import { resolveRequestId } from "./headers";
|
|
3
|
-
/** Package version read from package.json. */
const GATEWAY_VERSION = pkg.version;

/**
 * Lower-case names of the request headers that may be copied onto outgoing
 * provider requests, grouped by the provider they belong to.
 */
const FORWARD_HEADER_ALLOWLIST = [
  // --- OpenAI + OpenAI-compatible providers (Azure, Groq, Together, Fireworks, etc.)
  "openai-beta",
  "openai-organization",
  "openai-project",

  // --- OpenRouter
  "x-openrouter-categories",
  "x-openrouter-title",
  "x-title",

  // --- Anthropic
  "anthropic-beta",

  // --- AWS Bedrock
  "x-amzn-bedrock-guardrailidentifier",
  "x-amzn-bedrock-guardrailversion",
  "x-amzn-bedrock-performanceconfig-latency",
  "x-amzn-bedrock-trace",

  // --- Cohere
  "x-client-name",

  // --- Vertex provisioned throughput / endpoint routing
  "x-vertex-ai-endpoint-id",
  "x-vertex-ai-llm-request-type",
  "x-vertex-ai-llm-shared-request-type",
];
|
|
27
|
-
/**
 * Builds a new request ID: "req_" followed by two random 32-bit integers,
 * each written in base 36 and concatenated without padding.
 */
const createRequestId = () => {
  const words = crypto.getRandomValues(new Uint32Array(2));
  let suffix = "";
  for (const word of words) {
    suffix += word.toString(36);
  }
  return "req_" + suffix;
};

/**
 * Returns the request ID found on the incoming request, or a freshly
 * generated one when `resolveRequestId` yields null or undefined.
 */
export const resolveOrCreateRequestId = (request) => {
  const existing = resolveRequestId(request);
  return existing ?? createRequestId();
};
|
|
29
|
-
/**
 * Builds the header object sent along to the upstream provider.
 *
 * The result always contains a `user-agent`: the caller's user agent (when
 * present) followed by `@hebo-ai/gateway/<version>`. Every header named in
 * FORWARD_HEADER_ALLOWLIST that is present on the request is copied as well.
 *
 * @param {Request} request incoming request
 * @returns {Record<string, string>} headers to forward
 */
export const prepareForwardHeaders = (request) => {
  const gatewayAgent = `@hebo-ai/gateway/${GATEWAY_VERSION}`;
  const incomingAgent = request.headers.get("user-agent");

  const forwarded = {
    "user-agent": incomingAgent ? `${incomingAgent} ${gatewayAgent}` : gatewayAgent,
  };

  for (const name of FORWARD_HEADER_ALLOWLIST) {
    const value = request.headers.get(name);
    if (value === null) {
      continue;
    }
    forwarded[name] = value;
  }
  return forwarded;
};
|
package/dist/utils/response.d.ts
DELETED
|
@@ -1,3 +0,0 @@
|
|
|
1
|
-
/** Builds a ResponseInit whose only content is the request-ID header. */
export declare const prepareResponseInit: (requestId: string) => ResponseInit;
/**
 * Combines default headers with an optional ResponseInit: headers from the
 * init override the defaults, and its `status` / `statusText` are carried over.
 */
export declare const mergeResponseInit: (defaultHeaders: HeadersInit, responseInit?: ResponseInit) => ResponseInit;
/**
 * Wraps a result in a Response. Streams are sent as server-sent events;
 * bytes, strings and objects are sent as a body with a JSON content type.
 */
export declare const toResponse: (result: ReadableStream | Uint8Array<ArrayBuffer> | object | string, responseInit?: ResponseInit) => Response;
|
package/dist/utils/response.js
DELETED
|
@@ -1,70 +0,0 @@
|
|
|
1
|
-
import { REQUEST_ID_HEADER } from "./headers";
|
|
2
|
-
/** Shared encoder used to turn string bodies into bytes. */
const TEXT_ENCODER = new TextEncoder();

/**
 * Transform stream that serializes each incoming chunk as JSON inside a
 * server-sent-event `data:` frame and emits a final `data: [DONE]` frame
 * when the input ends.
 */
class JsonToSseTransformStream extends TransformStream {
  constructor() {
    const toFrame = (payload) => `data: ${payload}\n\n`;
    super({
      transform: (part, controller) => {
        controller.enqueue(toFrame(JSON.stringify(part)));
      },
      flush: (controller) => {
        controller.enqueue(toFrame("[DONE]"));
      },
    });
  }
}
|
|
15
|
-
/**
 * Creates a ResponseInit that carries the request ID under REQUEST_ID_HEADER.
 *
 * @param {string} requestId
 * @returns {{ headers: Record<string, string> }}
 */
export const prepareResponseInit = (requestId) => {
  const headers = { [REQUEST_ID_HEADER]: requestId };
  return { headers };
};
|
|
18
|
-
/**
 * Merges default headers with an optional ResponseInit.
 *
 * Headers from `responseInit` replace defaults of the same name. When
 * `responseInit` is given, its `status` and `statusText` are copied even if
 * undefined; otherwise only `headers` is returned.
 *
 * @param {HeadersInit} defaultHeaders
 * @param {ResponseInit} [responseInit]
 * @returns {ResponseInit}
 */
export const mergeResponseInit = (defaultHeaders, responseInit) => {
  const headers = new Headers(defaultHeaders);

  const overrides = responseInit?.headers;
  if (overrides) {
    // Normalise through Headers so every accepted HeadersInit shape works.
    for (const [name, value] of new Headers(overrides)) {
      headers.set(name, value);
    }
  }

  return responseInit
    ? { status: responseInit.status, statusText: responseInit.statusText, headers }
    : { headers };
};
|
|
34
|
-
/**
 * Converts a handler result into a Response.
 *
 * Body:
 * - ReadableStream: each chunk becomes an SSE frame, then is UTF-8 encoded;
 * - Uint8Array: used as is;
 * - string: UTF-8 encoded;
 * - Error: encoded as JSON `{ message }`;
 * - anything else: encoded with JSON.stringify.
 *
 * Status: when `responseInit` has no `statusText`, the status defaults to
 * 500 for errors and 200 otherwise (an explicit `status` wins), and the
 * status text becomes "REQUEST_FAILED" or "OK".
 *
 * Headers: streams get event-stream defaults, everything else gets a JSON
 * content type plus content length; headers from `responseInit` override these.
 *
 * @param {ReadableStream | Uint8Array | object | string} result
 * @param {ResponseInit} [responseInit]
 * @returns {Response}
 */
export const toResponse = (result, responseInit) => {
  const isStream = result instanceof ReadableStream;
  const isError = result instanceof Error;

  let body;
  if (isStream) {
    body = result.pipeThrough(new JsonToSseTransformStream()).pipeThrough(new TextEncoderStream());
  } else if (result instanceof Uint8Array) {
    body = result;
  } else if (typeof result === "string") {
    body = TEXT_ENCODER.encode(result);
  } else {
    const payload = isError ? { message: result.message } : result;
    body = TEXT_ENCODER.encode(JSON.stringify(payload));
  }

  let effectiveInit = responseInit;
  if (!effectiveInit?.statusText) {
    const status = effectiveInit?.status ?? (isError ? 500 : 200);
    const statusText = isError ? "REQUEST_FAILED" : "OK";
    const headers = effectiveInit?.headers;
    effectiveInit = headers ? { status, statusText, headers } : { status, statusText };
  }

  let defaultHeaders;
  if (isStream) {
    defaultHeaders = {
      "content-type": "text/event-stream",
      "cache-control": "no-cache",
      connection: "keep-alive",
    };
  } else {
    defaultHeaders = {
      "content-type": "application/json",
      "content-length": String(body.byteLength),
    };
  }

  return new Response(body, mergeResponseInit(defaultHeaders, effectiveInit));
};
|
package/dist/utils/url.d.ts
DELETED
package/dist/utils/url.js
DELETED
|
@@ -1,21 +0,0 @@
|
|
|
1
|
-
/**
 * Extracts the MIME type and the payload offset from a `data:` URL.
 *
 * The scheme is matched case-insensitively. The comma that ends the header
 * must come after at least one header character and no later than 1024
 * characters past the scheme. The MIME type is the trimmed text between the
 * scheme and the first `;` (if it precedes the comma) or the comma.
 *
 * @param {string} url
 * @returns {{ mimeType: string, dataStart: number }} `dataStart` is the index
 *   just past the comma; `{ mimeType: "", dataStart: 0 }` is returned when the
 *   input is not a usable data URL or has no MIME type.
 */
export const parseDataUrl = (url) => {
  const SCHEME_LENGTH = 5; // length of "data:"
  const MAX_HEADER_LENGTH = 1024;
  const invalid = () => ({ mimeType: "", dataStart: 0 });

  if (url.slice(0, SCHEME_LENGTH).toLowerCase() !== "data:") {
    return invalid();
  }

  const headerLimit = Math.min(url.length, SCHEME_LENGTH + MAX_HEADER_LENGTH);
  const commaAt = url.indexOf(",", SCHEME_LENGTH);
  const commaInHeader = commaAt > SCHEME_LENGTH && commaAt <= headerLimit;
  if (!commaInHeader) {
    return invalid();
  }

  const semiAt = url.indexOf(";", SCHEME_LENGTH);
  const mimeEnd = semiAt === -1 || semiAt >= commaAt ? commaAt : semiAt;
  const mimeType = url.slice(SCHEME_LENGTH, mimeEnd).trim();

  return mimeType ? { mimeType, dataStart: commaAt + 1 } : invalid();
};
|