@llmops/app 0.1.3 → 0.1.5-beta.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/.vite/manifest.json +535 -168
- package/dist/assets/Form-B1rZ0Hvr.js +1 -0
- package/dist/assets/InternalBackdrop-CXjGP6a9.js +12 -0
- package/dist/assets/_environment-zVjmOhBI.js +1 -0
- package/dist/assets/_observability-CQ4Ll_WT.js +1 -0
- package/dist/assets/_observability-DPSeR4-h.css +1 -0
- package/dist/assets/_settings-B87EsM9n.css +1 -0
- package/dist/assets/_settings-Bv8acMq8.js +1 -0
- package/dist/assets/{_tabs-DqcWXw0k.js → _tabs-Bi-rsAVV.js} +1 -1
- package/dist/assets/{_tabs-f2ku-dN-.js → _tabs-oKfgxR5m.js} +1 -1
- package/dist/assets/_variant-Zg5HjNSN.js +30 -0
- package/dist/assets/{_variants-B0pPx_AW.js → _variants-B36Lo8m_.js} +1 -1
- package/dist/assets/area.css-DTnbbu5M.js +1 -0
- package/dist/assets/button-DftzA6-1.js +1 -0
- package/dist/assets/check-PaWYhFn6.js +1 -0
- package/dist/assets/chevron-down-BjDiaa62.js +1 -0
- package/dist/assets/{chevron-right-C4hlJkjh.js → chevron-right-Dz77YeP_.js} +1 -1
- package/dist/assets/configs-CtNuMmVR.js +1 -0
- package/dist/assets/{copy-8RnLMadS.js → copy-D-DZB-6Z.js} +1 -1
- package/dist/assets/costs-DwVSRTwW.js +1 -0
- package/dist/assets/en-US-C8ut0f5H.js +1 -0
- package/dist/assets/environments-BB95BiC0.js +1 -0
- package/dist/assets/formatDistance-Bok3-MB1.js +1 -0
- package/dist/assets/getDisabledMountTransitionStyles-CKUvhO4q.js +1 -0
- package/dist/assets/index-BCY9aD4r.js +16 -0
- package/dist/assets/index-BS3B2BG5.js +1 -0
- package/dist/assets/{index-CzBp_9q8.css → index-BiCR_Kj2.css} +1 -1
- package/dist/assets/index-CnOYeKc1.js +1 -0
- package/dist/assets/index-CpAxLUl2.js +1 -0
- package/dist/assets/index-D841new6.js +1 -0
- package/dist/assets/index-DvzXLQL6.js +4 -0
- package/dist/assets/index-xdhK5tU9.js +1 -0
- package/dist/assets/{index.esm-Du3lv78y.js → index.esm-COTq2pHX.js} +1 -1
- package/dist/assets/info-box-JXSyJ9E4.css +1 -0
- package/dist/assets/info-box.css-HIaMvhbC.js +1 -0
- package/dist/assets/llmops-B3IIte87.css +1 -0
- package/dist/assets/llmops-C5uyvq6E.js +1 -0
- package/dist/assets/observability-C5jdcUSg.css +1 -0
- package/dist/assets/observability.css-dztiak5K.js +1 -0
- package/dist/assets/overview-BwCF8A1G.js +1 -0
- package/dist/assets/{plus-BNVL12hi.js → plus-C_L0BpbU.js} +1 -1
- package/dist/assets/popover-CSR0ctop.js +1 -0
- package/dist/assets/popupStateMapping-DkOpwBhG.js +1 -0
- package/dist/assets/requests-D8wE_E2M.js +1 -0
- package/dist/assets/{route-DCt595Gm.js → route-CI77gokb.js} +1 -1
- package/dist/assets/{route-D_ra2qKi.js → route-CZ2yCnzN.js} +1 -1
- package/dist/assets/route-vfMzB8KR.js +1 -0
- package/dist/assets/route-wrnLt3bn.js +1 -0
- package/dist/assets/secrets-B9u5jvFm.js +1 -0
- package/dist/assets/settings-24qWHZEq.js +1 -0
- package/dist/assets/settings-BLt538aO.js +1 -0
- package/dist/assets/{table-6j4oSY37.js → table-xLf4iXV8.js} +1 -1
- package/dist/assets/{tabs.css-BDs200M3.js → tabs.css-fttLH8Xj.js} +1 -1
- package/dist/assets/{targeting-BOZ8PRbu.js → targeting-DZIwwaYV.js} +1 -1
- package/dist/assets/tooltip-BKoDpdAC.js +1 -0
- package/dist/assets/update-or-create-name-ChWLK2jI.js +1 -0
- package/dist/assets/useButton-Ct8hIyjz.js +1 -0
- package/dist/assets/useConfigList-Du__Gu7q.js +1 -0
- package/dist/assets/{useConfigVariants-DoAiT4HN.js → useConfigVariants-C8frrCcZ.js} +1 -1
- package/dist/assets/useEnvironments-CYkrqAdO.js +1 -0
- package/dist/assets/useFocus-Du1aH2j1.js +1 -0
- package/dist/assets/{useMutation-B5RT6zjK.js → useMutation-VUB-GXkv.js} +1 -1
- package/dist/assets/usePopupAutoResize-ddPHogUJ.js +1 -0
- package/dist/assets/useRole-DP91D1OX.js +1 -0
- package/dist/assets/useSetTargeting-CQWutQzN.css +1 -0
- package/dist/assets/useSetTargeting-D1rPM8vz.js +1 -0
- package/dist/assets/useSyncedFloatingRootContext-BzuhbdSw.js +1 -0
- package/dist/assets/useTargetingRules-DS57orU0.js +1 -0
- package/dist/assets/useValueChanged-vz8uKgCk.js +1 -0
- package/dist/assets/user-profile-Bt3_D9Gr.js +1 -0
- package/dist/assets/variants-CYXSNKzX.js +1 -0
- package/dist/assets/variants.css-BjGKD3Nv.js +1 -0
- package/dist/assets/workspace-general-BRMpUqb-.js +1 -0
- package/dist/assets/workspace-general-ET4CEZQV.css +1 -0
- package/dist/index.cjs +763 -23
- package/dist/index.mjs +764 -24
- package/package.json +3 -3
- package/dist/assets/Form-CR9iKNJV.js +0 -1
- package/dist/assets/_environment-DUWlgl3c.js +0 -1
- package/dist/assets/_variant-D5crm4Ds.js +0 -30
- package/dist/assets/button-DO9sNXVT.js +0 -1
- package/dist/assets/check-DqI6mrEe.js +0 -1
- package/dist/assets/configs-D7rrXGVw.js +0 -1
- package/dist/assets/environments-CQ_2r1iM.js +0 -1
- package/dist/assets/formatDistance-fxR--uRk.js +0 -1
- package/dist/assets/index-8q56yhPq.js +0 -16
- package/dist/assets/index-CAAXzvj0.js +0 -1
- package/dist/assets/index-Cr1VB5iR.js +0 -1
- package/dist/assets/index-Dd3OazzV.js +0 -1
- package/dist/assets/new-config-state-B8sMe-TC.css +0 -1
- package/dist/assets/new-config-state.css-BkrgBLVT.js +0 -1
- package/dist/assets/secrets-DoNAc8Mo.js +0 -1
- package/dist/assets/settings-C9bl_jrl.js +0 -1
- package/dist/assets/settings-CdtZpv34.js +0 -1
- package/dist/assets/update-or-create-name-B72U1gm0.js +0 -4
- package/dist/assets/useButton-CAZmhHhe.js +0 -1
- package/dist/assets/useConfigList-DVy2f9Ka.js +0 -1
- package/dist/assets/useEnvironments-B9zdgoPZ.js +0 -1
- package/dist/assets/useRole-BBEFofTs.js +0 -1
- package/dist/assets/useSetTargeting-DIyb-zyZ.css +0 -1
- package/dist/assets/useSetTargeting-x-2mNQAV.js +0 -1
- package/dist/assets/useTargetingRules-DWyIfOXq.js +0 -1
- package/dist/assets/useValueChanged-DLCw33hO.js +0 -12
- package/dist/assets/variants-CLcQicJ2.js +0 -1
- package/dist/assets/variants.css-CRQAZpOT.js +0 -1
- package/dist/assets/{formatDistance-DoOD1Loz.css → area-DoOD1Loz.css} +0 -0
package/dist/index.cjs
CHANGED
|
@@ -56,13 +56,14 @@ let __hono_zod_validator = require("@hono/zod-validator");
|
|
|
56
56
|
let hono_pretty_json = require("hono/pretty-json");
|
|
57
57
|
let hono_http_exception = require("hono/http-exception");
|
|
58
58
|
let hono_cors = require("hono/cors");
|
|
59
|
+
let node_crypto = require("node:crypto");
|
|
59
60
|
let __llmops_gateway = require("@llmops/gateway");
|
|
60
61
|
__llmops_gateway = __toESM(__llmops_gateway);
|
|
61
62
|
let node_process = require("node:process");
|
|
62
63
|
let __llmops_core_db = require("@llmops/core/db");
|
|
63
64
|
|
|
64
65
|
//#region src/client/index.tsx?url
|
|
65
|
-
var client_default = "/assets/index-
|
|
66
|
+
var client_default = "/assets/index-BCY9aD4r.js";
|
|
66
67
|
|
|
67
68
|
//#endregion
|
|
68
69
|
//#region src/client/styles/styles.css?url
|
|
@@ -93,7 +94,7 @@ const ReactRefresh = () => {
|
|
|
93
94
|
const { renderToString } = react_dom_server.default;
|
|
94
95
|
const manifestPath = (0, node_path.join)((0, node_path.dirname)((0, node_url.fileURLToPath)(require("url").pathToFileURL(__filename).href)), "./.vite/manifest.json");
|
|
95
96
|
const manifest = (0, node_fs.existsSync)(manifestPath) ? JSON.parse((0, node_fs.readFileSync)(manifestPath, "utf-8")) : {};
|
|
96
|
-
const renderer = ({ basePath = "", dev = false, llmProviders }) => {
|
|
97
|
+
const renderer = ({ basePath = "", dev = false, llmProviders, authType }) => {
|
|
97
98
|
const stylesPath = basePath === "/" ? styles_default : basePath + styles_default;
|
|
98
99
|
const clientPath = basePath === "/" ? client_default : basePath + client_default;
|
|
99
100
|
const faviconPath = basePath === "/" ? "/favicon.ico" : basePath + "/assets/favicon.ico";
|
|
@@ -356,7 +357,8 @@ const renderer = ({ basePath = "", dev = false, llmProviders }) => {
|
|
|
356
357
|
/* @__PURE__ */ (0, react_jsx_runtime.jsx)("script", { children: `
|
|
357
358
|
window.bootstrapData = {
|
|
358
359
|
basePath: "${basePath}",
|
|
359
|
-
llmProviders: ${JSON.stringify(llmProviders || [])}
|
|
360
|
+
llmProviders: ${JSON.stringify(llmProviders || [])},
|
|
361
|
+
authType: "${authType || "basic"}"
|
|
360
362
|
};
|
|
361
363
|
` }),
|
|
362
364
|
dev && /* @__PURE__ */ (0, react_jsx_runtime.jsx)(ReactRefresh, {})
|
|
@@ -12707,11 +12709,13 @@ var zod_default = external_exports;
|
|
|
12707
12709
|
//#endregion
|
|
12708
12710
|
//#region src/server/lib/zv.ts
|
|
12709
12711
|
const zv = (target, schema) => (0, __hono_zod_validator.zValidator)(target, schema, (result, c) => {
|
|
12710
|
-
if (!result.success)
|
|
12711
|
-
|
|
12712
|
-
|
|
12713
|
-
|
|
12714
|
-
|
|
12712
|
+
if (!result.success) return c.json({
|
|
12713
|
+
message: "Bad Request",
|
|
12714
|
+
errors: result.error.issues.map((issue$1) => ({
|
|
12715
|
+
path: issue$1.path.join("."),
|
|
12716
|
+
message: issue$1.message
|
|
12717
|
+
}))
|
|
12718
|
+
}, 400);
|
|
12715
12719
|
});
|
|
12716
12720
|
|
|
12717
12721
|
//#endregion
|
|
@@ -12738,9 +12742,228 @@ const internalServerError = (message, code) => {
|
|
|
12738
12742
|
};
|
|
12739
12743
|
};
|
|
12740
12744
|
|
|
12745
|
+
//#endregion
|
|
12746
|
+
//#region src/server/handlers/analytics/index.ts
|
|
12747
|
+
/**
|
|
12748
|
+
* Convert micro-dollars to formatted dollar string
|
|
12749
|
+
*/
|
|
12750
|
+
function formatCost(microDollars, decimals = 6) {
|
|
12751
|
+
return `$${(microDollars / 1e6).toFixed(decimals)}`;
|
|
12752
|
+
}
|
|
12753
|
+
/**
 * Parse a date string into a Date object.
 * Accepts full ISO 8601 strings (2026-01-02T10:30:00.000Z) and date-only
 * strings (2026-01-02).
 *
 * @param dateStr - Date string to parse
 * @returns The parsed Date
 * @throws Error with message `Invalid date string: <input>` when the string
 *   cannot be parsed by the Date constructor
 */
function parseDate(dateStr) {
  const date = new Date(dateStr);
  if (Number.isNaN(date.getTime())) throw new Error(`Invalid date string: ${dateStr}`);
  return date;
}
/**
 * Parse date string for start of range.
 * - ISO strings are used as-is
 * - Date-only strings (YYYY-MM-DD) need no adjustment: the Date constructor
 *   already interprets that form as midnight UTC
 *
 * @param dateStr - Date string to parse
 * @returns The parsed Date
 * @throws Error when the string cannot be parsed (see parseDate)
 */
function parseStartDate(dateStr) {
  return parseDate(dateStr);
}
/**
 * Parse date string for end of range.
 * - Date-only strings (exactly YYYY-MM-DD) are moved to the end of that day
 *   (23:59:59.999 UTC) so the whole day is included in the range
 * - Every other parseable string is used as-is
 *
 * @param dateStr - Date string to parse
 * @returns The parsed Date, adjusted to end of day for date-only input
 * @throws Error when the string cannot be parsed (see parseDate)
 */
function parseEndDate(dateStr) {
  const date = parseDate(dateStr);
  // Match the date-only shape explicitly. Checking for the absence of "T"
  // also matched timestamps such as "2026-01-02 10:30:00" and silently
  // replaced their time of day with 23:59:59.999 UTC.
  if (/^\d{4}-\d{2}-\d{2}$/.test(dateStr)) date.setUTCHours(23, 59, 59, 999);
  return date;
}
|
|
12780
|
+
/**
|
|
12781
|
+
* Zod schema for ISO date strings
|
|
12782
|
+
* Validates that the string can be parsed as a valid date
|
|
12783
|
+
*/
|
|
12784
|
+
const isoDateString = zod_default.string().refine((val) => !isNaN(new Date(val).getTime()), { message: "Invalid date format. Expected ISO 8601 string (e.g., 2026-01-02T10:30:00.000Z) or date string (e.g., 2026-01-02)" });
|
|
12785
|
+
/**
|
|
12786
|
+
* Date range query schema
|
|
12787
|
+
* Accepts ISO 8601 date strings or date-only strings (YYYY-MM-DD)
|
|
12788
|
+
* - startDate: Used as-is for ISO strings, start of day for date-only
|
|
12789
|
+
* - endDate: Used as-is for ISO strings, end of day (23:59:59.999) for date-only
|
|
12790
|
+
*/
|
|
12791
|
+
const dateRangeSchema = zod_default.object({
|
|
12792
|
+
startDate: isoDateString.transform(parseStartDate),
|
|
12793
|
+
endDate: isoDateString.transform(parseEndDate)
|
|
12794
|
+
});
|
|
12795
|
+
/**
|
|
12796
|
+
* Analytics API routes for cost and usage tracking
|
|
12797
|
+
*/
|
|
12798
|
+
const app$10 = new hono.Hono().get("/requests", zv("query", zod_default.object({
|
|
12799
|
+
limit: zod_default.string().transform(Number).optional(),
|
|
12800
|
+
offset: zod_default.string().transform(Number).optional(),
|
|
12801
|
+
configId: zod_default.string().uuid().optional(),
|
|
12802
|
+
provider: zod_default.string().optional(),
|
|
12803
|
+
model: zod_default.string().optional(),
|
|
12804
|
+
startDate: isoDateString.optional(),
|
|
12805
|
+
endDate: isoDateString.optional()
|
|
12806
|
+
})), async (c) => {
|
|
12807
|
+
const db = c.get("db");
|
|
12808
|
+
const query = c.req.valid("query");
|
|
12809
|
+
try {
|
|
12810
|
+
const requests = await db.listRequests({
|
|
12811
|
+
limit: query.limit,
|
|
12812
|
+
offset: query.offset,
|
|
12813
|
+
configId: query.configId,
|
|
12814
|
+
provider: query.provider,
|
|
12815
|
+
model: query.model,
|
|
12816
|
+
startDate: query.startDate ? parseStartDate(query.startDate) : void 0,
|
|
12817
|
+
endDate: query.endDate ? parseEndDate(query.endDate) : void 0
|
|
12818
|
+
});
|
|
12819
|
+
return c.json(successResponse(requests, 200));
|
|
12820
|
+
} catch (error$45) {
|
|
12821
|
+
console.error("Error fetching requests:", error$45);
|
|
12822
|
+
return c.json(internalServerError("Failed to fetch requests", 500), 500);
|
|
12823
|
+
}
|
|
12824
|
+
}).get("/requests/:requestId", zv("param", zod_default.object({ requestId: zod_default.string().uuid() })), async (c) => {
|
|
12825
|
+
const db = c.get("db");
|
|
12826
|
+
const { requestId } = c.req.valid("param");
|
|
12827
|
+
try {
|
|
12828
|
+
const request = await db.getRequestByRequestId(requestId);
|
|
12829
|
+
if (!request) return c.json({ error: "Request not found" }, 404);
|
|
12830
|
+
return c.json(successResponse(request, 200));
|
|
12831
|
+
} catch (error$45) {
|
|
12832
|
+
console.error("Error fetching request:", error$45);
|
|
12833
|
+
return c.json(internalServerError("Failed to fetch request", 500), 500);
|
|
12834
|
+
}
|
|
12835
|
+
}).get("/costs/total", zv("query", dateRangeSchema), async (c) => {
|
|
12836
|
+
const db = c.get("db");
|
|
12837
|
+
const { startDate, endDate } = c.req.valid("query");
|
|
12838
|
+
try {
|
|
12839
|
+
const data = await db.getTotalCost({
|
|
12840
|
+
startDate,
|
|
12841
|
+
endDate
|
|
12842
|
+
});
|
|
12843
|
+
if (!data) return c.json(successResponse({
|
|
12844
|
+
totalCost: 0,
|
|
12845
|
+
totalCostFormatted: "$0.000000",
|
|
12846
|
+
totalInputCost: 0,
|
|
12847
|
+
totalOutputCost: 0,
|
|
12848
|
+
totalPromptTokens: 0,
|
|
12849
|
+
totalCompletionTokens: 0,
|
|
12850
|
+
totalTokens: 0,
|
|
12851
|
+
requestCount: 0
|
|
12852
|
+
}, 200));
|
|
12853
|
+
return c.json(successResponse({
|
|
12854
|
+
...data,
|
|
12855
|
+
totalCostFormatted: formatCost(data.totalCost),
|
|
12856
|
+
totalInputCostFormatted: formatCost(data.totalInputCost),
|
|
12857
|
+
totalOutputCostFormatted: formatCost(data.totalOutputCost)
|
|
12858
|
+
}, 200));
|
|
12859
|
+
} catch (error$45) {
|
|
12860
|
+
console.error("Error fetching total costs:", error$45);
|
|
12861
|
+
return c.json(internalServerError("Failed to fetch total costs", 500), 500);
|
|
12862
|
+
}
|
|
12863
|
+
}).get("/costs/by-model", zv("query", dateRangeSchema), async (c) => {
|
|
12864
|
+
const db = c.get("db");
|
|
12865
|
+
const { startDate, endDate } = c.req.valid("query");
|
|
12866
|
+
try {
|
|
12867
|
+
const data = await db.getCostByModel({
|
|
12868
|
+
startDate,
|
|
12869
|
+
endDate
|
|
12870
|
+
});
|
|
12871
|
+
return c.json(successResponse(data, 200));
|
|
12872
|
+
} catch (error$45) {
|
|
12873
|
+
console.error("Error fetching costs by model:", error$45);
|
|
12874
|
+
return c.json(internalServerError("Failed to fetch costs by model", 500), 500);
|
|
12875
|
+
}
|
|
12876
|
+
}).get("/costs/by-provider", zv("query", dateRangeSchema), async (c) => {
|
|
12877
|
+
const db = c.get("db");
|
|
12878
|
+
const { startDate, endDate } = c.req.valid("query");
|
|
12879
|
+
try {
|
|
12880
|
+
const data = await db.getCostByProvider({
|
|
12881
|
+
startDate,
|
|
12882
|
+
endDate
|
|
12883
|
+
});
|
|
12884
|
+
return c.json(successResponse(data, 200));
|
|
12885
|
+
} catch (error$45) {
|
|
12886
|
+
console.error("Error fetching costs by provider:", error$45);
|
|
12887
|
+
return c.json(internalServerError("Failed to fetch costs by provider", 500), 500);
|
|
12888
|
+
}
|
|
12889
|
+
}).get("/costs/by-config", zv("query", dateRangeSchema), async (c) => {
|
|
12890
|
+
const db = c.get("db");
|
|
12891
|
+
const { startDate, endDate } = c.req.valid("query");
|
|
12892
|
+
try {
|
|
12893
|
+
const data = await db.getCostByConfig({
|
|
12894
|
+
startDate,
|
|
12895
|
+
endDate
|
|
12896
|
+
});
|
|
12897
|
+
return c.json(successResponse(data, 200));
|
|
12898
|
+
} catch (error$45) {
|
|
12899
|
+
console.error("Error fetching costs by config:", error$45);
|
|
12900
|
+
return c.json(internalServerError("Failed to fetch costs by config", 500), 500);
|
|
12901
|
+
}
|
|
12902
|
+
}).get("/costs/daily", zv("query", dateRangeSchema), async (c) => {
|
|
12903
|
+
const db = c.get("db");
|
|
12904
|
+
const { startDate, endDate } = c.req.valid("query");
|
|
12905
|
+
try {
|
|
12906
|
+
const data = await db.getDailyCosts({
|
|
12907
|
+
startDate,
|
|
12908
|
+
endDate
|
|
12909
|
+
});
|
|
12910
|
+
return c.json(successResponse(data, 200));
|
|
12911
|
+
} catch (error$45) {
|
|
12912
|
+
console.error("Error fetching daily costs:", error$45);
|
|
12913
|
+
return c.json(internalServerError("Failed to fetch daily costs", 500), 500);
|
|
12914
|
+
}
|
|
12915
|
+
}).get("/costs/summary", zv("query", dateRangeSchema.extend({ groupBy: zod_default.enum([
|
|
12916
|
+
"day",
|
|
12917
|
+
"hour",
|
|
12918
|
+
"model",
|
|
12919
|
+
"provider",
|
|
12920
|
+
"config"
|
|
12921
|
+
]).optional() })), async (c) => {
|
|
12922
|
+
const db = c.get("db");
|
|
12923
|
+
const { startDate, endDate, groupBy } = c.req.valid("query");
|
|
12924
|
+
try {
|
|
12925
|
+
const data = await db.getCostSummary({
|
|
12926
|
+
startDate,
|
|
12927
|
+
endDate,
|
|
12928
|
+
groupBy
|
|
12929
|
+
});
|
|
12930
|
+
return c.json(successResponse(data, 200));
|
|
12931
|
+
} catch (error$45) {
|
|
12932
|
+
console.error("Error fetching cost summary:", error$45);
|
|
12933
|
+
return c.json(internalServerError("Failed to fetch cost summary", 500), 500);
|
|
12934
|
+
}
|
|
12935
|
+
}).get("/stats", zv("query", dateRangeSchema), async (c) => {
|
|
12936
|
+
const db = c.get("db");
|
|
12937
|
+
const { startDate, endDate } = c.req.valid("query");
|
|
12938
|
+
try {
|
|
12939
|
+
const data = await db.getRequestStats({
|
|
12940
|
+
startDate,
|
|
12941
|
+
endDate
|
|
12942
|
+
});
|
|
12943
|
+
if (!data) return c.json(successResponse({
|
|
12944
|
+
totalRequests: 0,
|
|
12945
|
+
successfulRequests: 0,
|
|
12946
|
+
failedRequests: 0,
|
|
12947
|
+
streamingRequests: 0,
|
|
12948
|
+
avgLatencyMs: 0,
|
|
12949
|
+
maxLatencyMs: 0,
|
|
12950
|
+
minLatencyMs: 0,
|
|
12951
|
+
successRate: 0
|
|
12952
|
+
}, 200));
|
|
12953
|
+
return c.json(successResponse({
|
|
12954
|
+
...data,
|
|
12955
|
+
successRate: data.totalRequests > 0 ? (data.successfulRequests / data.totalRequests * 100).toFixed(2) : 0
|
|
12956
|
+
}, 200));
|
|
12957
|
+
} catch (error$45) {
|
|
12958
|
+
console.error("Error fetching request stats:", error$45);
|
|
12959
|
+
return c.json(internalServerError("Failed to fetch request stats", 500), 500);
|
|
12960
|
+
}
|
|
12961
|
+
});
|
|
12962
|
+
var analytics_default = app$10;
|
|
12963
|
+
|
|
12741
12964
|
//#endregion
|
|
12742
12965
|
//#region src/server/handlers/configs/index.ts
|
|
12743
|
-
const app$
|
|
12966
|
+
const app$9 = new hono.Hono().post("/", zv("json", zod_default.object({ name: zod_default.string().min(1) })), async (c) => {
|
|
12744
12967
|
const db = c.get("db");
|
|
12745
12968
|
try {
|
|
12746
12969
|
const value = await db.createNewConfig({ name: c.req.valid("json").name });
|
|
@@ -12844,7 +13067,7 @@ const app$8 = new hono.Hono().post("/", zv("json", zod_default.object({ name: zo
|
|
|
12844
13067
|
return c.json(internalServerError("Failed to delete config", 500), 500);
|
|
12845
13068
|
}
|
|
12846
13069
|
});
|
|
12847
|
-
var configs_default = app$
|
|
13070
|
+
var configs_default = app$9;
|
|
12848
13071
|
|
|
12849
13072
|
//#endregion
|
|
12850
13073
|
//#region src/server/handlers/environments/index.ts
|
|
@@ -12855,7 +13078,7 @@ var configs_default = app$8;
|
|
|
12855
13078
|
const generateSecretKey$1 = (slug) => {
|
|
12856
13079
|
return `sec_${slug.slice(0, 4).toLowerCase()}_${(0, __llmops_core.generateId)(24)}`;
|
|
12857
13080
|
};
|
|
12858
|
-
const app$
|
|
13081
|
+
const app$8 = new hono.Hono().post("/", zv("json", zod_default.object({
|
|
12859
13082
|
name: zod_default.string().min(1),
|
|
12860
13083
|
slug: zod_default.string().min(1),
|
|
12861
13084
|
isProd: zod_default.boolean().optional()
|
|
@@ -12940,7 +13163,7 @@ const app$7 = new hono.Hono().post("/", zv("json", zod_default.object({
|
|
|
12940
13163
|
return c.json(internalServerError("Failed to fetch environment secrets", 500), 500);
|
|
12941
13164
|
}
|
|
12942
13165
|
});
|
|
12943
|
-
var environments_default = app$
|
|
13166
|
+
var environments_default = app$8;
|
|
12944
13167
|
|
|
12945
13168
|
//#endregion
|
|
12946
13169
|
//#region src/server/handlers/providers/index.ts
|
|
@@ -12960,7 +13183,7 @@ async function fetchModelsDevData() {
|
|
|
12960
13183
|
cacheTimestamp = now;
|
|
12961
13184
|
return modelsCache;
|
|
12962
13185
|
}
|
|
12963
|
-
const app$
|
|
13186
|
+
const app$7 = new hono.Hono().get("/", async (c) => {
|
|
12964
13187
|
try {
|
|
12965
13188
|
const data = await fetchModelsDevData();
|
|
12966
13189
|
const providers = Object.values(data).map((provider) => ({
|
|
@@ -13068,11 +13291,11 @@ const app$6 = new hono.Hono().get("/", async (c) => {
|
|
|
13068
13291
|
return c.json(internalServerError("Failed to fetch models", 500), 500);
|
|
13069
13292
|
}
|
|
13070
13293
|
});
|
|
13071
|
-
var providers_default = app$
|
|
13294
|
+
var providers_default = app$7;
|
|
13072
13295
|
|
|
13073
13296
|
//#endregion
|
|
13074
13297
|
//#region src/server/handlers/targeting/index.ts
|
|
13075
|
-
const app$
|
|
13298
|
+
const app$6 = new hono.Hono().post("/", zv("json", zod_default.object({
|
|
13076
13299
|
environmentId: zod_default.string().uuid(),
|
|
13077
13300
|
configId: zod_default.string().uuid(),
|
|
13078
13301
|
configVariantId: zod_default.string().uuid(),
|
|
@@ -13199,11 +13422,11 @@ const app$5 = new hono.Hono().post("/", zv("json", zod_default.object({
|
|
|
13199
13422
|
return c.json(internalServerError("Failed to set targeting for environment", 500), 500);
|
|
13200
13423
|
}
|
|
13201
13424
|
});
|
|
13202
|
-
var targeting_default = app$
|
|
13425
|
+
var targeting_default = app$6;
|
|
13203
13426
|
|
|
13204
13427
|
//#endregion
|
|
13205
13428
|
//#region src/server/handlers/variants.ts
|
|
13206
|
-
const app$
|
|
13429
|
+
const app$5 = new hono.Hono().get("/:id", zv("param", zod_default.object({ id: zod_default.string().uuid() })), async (c) => {
|
|
13207
13430
|
const db = c.get("db");
|
|
13208
13431
|
const { id } = c.req.valid("param");
|
|
13209
13432
|
const versionParam = c.req.query("version");
|
|
@@ -13350,7 +13573,31 @@ const app$4 = new hono.Hono().get("/:id", zv("param", zod_default.object({ id: z
|
|
|
13350
13573
|
return c.json(internalServerError("Failed to fetch variant version", 500), 500);
|
|
13351
13574
|
}
|
|
13352
13575
|
});
|
|
13353
|
-
var variants_default = app$
|
|
13576
|
+
var variants_default = app$5;
|
|
13577
|
+
|
|
13578
|
+
//#endregion
|
|
13579
|
+
//#region src/server/handlers/workspace-settings/index.ts
|
|
13580
|
+
const app$4 = new hono.Hono().get("/", async (c) => {
|
|
13581
|
+
const db = c.get("db");
|
|
13582
|
+
try {
|
|
13583
|
+
const settings = await db.getWorkspaceSettings();
|
|
13584
|
+
return c.json(successResponse(settings, 200));
|
|
13585
|
+
} catch (error$45) {
|
|
13586
|
+
console.error("Error fetching workspace settings:", error$45);
|
|
13587
|
+
return c.json(internalServerError("Failed to fetch workspace settings", 500), 500);
|
|
13588
|
+
}
|
|
13589
|
+
}).patch("/", zv("json", zod_default.object({ name: zod_default.string().nullable().optional() })), async (c) => {
|
|
13590
|
+
const db = c.get("db");
|
|
13591
|
+
const body = c.req.valid("json");
|
|
13592
|
+
try {
|
|
13593
|
+
const settings = await db.updateWorkspaceSettings(body);
|
|
13594
|
+
return c.json(successResponse(settings, 200));
|
|
13595
|
+
} catch (error$45) {
|
|
13596
|
+
console.error("Error updating workspace settings:", error$45);
|
|
13597
|
+
return c.json(internalServerError("Failed to update workspace settings", 500), 500);
|
|
13598
|
+
}
|
|
13599
|
+
});
|
|
13600
|
+
var workspace_settings_default = app$4;
|
|
13354
13601
|
|
|
13355
13602
|
//#endregion
|
|
13356
13603
|
//#region src/server/handlers/v1.ts
|
|
@@ -13371,7 +13618,7 @@ const app$3 = new hono.Hono().use("*", async (c, next) => {
|
|
|
13371
13618
|
error: "Auth middleware not configured",
|
|
13372
13619
|
message: `Auth type "${config$1.auth.type}" requires @llmops/enterprise middleware. Either use basicAuth() from @llmops/sdk or install @llmops/enterprise and add the auth middleware.`
|
|
13373
13620
|
}, 501);
|
|
13374
|
-
}).route("/configs", configs_default).route("/environments", environments_default).route("/providers", providers_default).route("/targeting", targeting_default).route("/variants", variants_default);
|
|
13621
|
+
}).route("/analytics", analytics_default).route("/configs", configs_default).route("/environments", environments_default).route("/providers", providers_default).route("/targeting", targeting_default).route("/variants", variants_default).route("/workspace-settings", workspace_settings_default);
|
|
13375
13622
|
var v1_default = app$3;
|
|
13376
13623
|
|
|
13377
13624
|
//#endregion
|
|
@@ -13541,7 +13788,7 @@ const createGatewayAdapterMiddleware = () => {
|
|
|
13541
13788
|
if (method === "POST" && contentType === "application/json" && (path$1.endsWith("/chat/completions") || path$1.endsWith("/completions"))) {
|
|
13542
13789
|
const mergedBody = mergeChatCompletionBody(await c.req.json(), variantConfig, data.modelName);
|
|
13543
13790
|
const newHeaders = new Headers(c.req.raw.headers);
|
|
13544
|
-
newHeaders.set("x-
|
|
13791
|
+
newHeaders.set("x-llmops-config", JSON.stringify(portkeyConfig));
|
|
13545
13792
|
const newRequest = new Request(c.req.raw.url, {
|
|
13546
13793
|
method: c.req.raw.method,
|
|
13547
13794
|
headers: newHeaders,
|
|
@@ -13554,9 +13801,11 @@ const createGatewayAdapterMiddleware = () => {
|
|
|
13554
13801
|
configurable: true
|
|
13555
13802
|
});
|
|
13556
13803
|
c.req.bodyCache = {};
|
|
13557
|
-
} else c.req.raw.headers.set("x-
|
|
13804
|
+
} else c.req.raw.headers.set("x-llmops-config", JSON.stringify(portkeyConfig));
|
|
13558
13805
|
c.set("variantConfig", variantConfig);
|
|
13559
13806
|
c.set("variantModel", variantConfig.model || data.modelName);
|
|
13807
|
+
c.set("configId", data.configId);
|
|
13808
|
+
c.set("variantId", data.variantId);
|
|
13560
13809
|
await next();
|
|
13561
13810
|
} catch (error$45) {
|
|
13562
13811
|
console.error("Gateway adapter error:", error$45);
|
|
@@ -13568,12 +13817,501 @@ const createGatewayAdapterMiddleware = () => {
|
|
|
13568
13817
|
};
|
|
13569
13818
|
};
|
|
13570
13819
|
|
|
13820
|
+
//#endregion
|
|
13821
|
+
//#region src/server/lib/streamingCostExtractor.ts
|
|
13822
|
+
/**
 * Creates a TransformStream that passes SSE bytes through unchanged while
 * watching the decoded text for a `usage` object in the event payloads.
 *
 * Takes no arguments. Every chunk is forwarded to the readable side before it
 * is inspected, so the extractor never alters or withholds response data.
 *
 * @returns An object with:
 *   - `stream`: the pass-through TransformStream
 *   - `usagePromise`: resolves when the stream finishes (or is cancelled) with
 *     `{ promptTokens, completionTokens, totalTokens, cachedTokens }` taken
 *     from the last payload that carried `usage`, or `null` if none did
 *
 * @example
 * ```typescript
 * const { stream, usagePromise } = createStreamingCostExtractor();
 *
 * // Pipe the response through the extractor
 * const transformedResponse = originalResponse.body.pipeThrough(stream);
 *
 * // Later, get the usage
 * const usage = await usagePromise;
 * if (usage) {
 *   console.log(`Tokens used: ${usage.totalTokens}`);
 * }
 * ```
 */
function createStreamingCostExtractor() {
  let extractedUsage = null;
  let buffer = "";
  let resolveUsage;
  const usagePromise = new Promise((resolve) => {
    resolveUsage = resolve;
  });
  const decoder = new TextDecoder();
  // SSE allows LF, CRLF or CR line endings; an event ends at a blank line.
  const eventBoundary = /\r\n\r\n|\n\n|\r\r/;
  const lineBreak = /\r\n|\r|\n/;
  // Returns the payload strings worth trying to parse for one raw event.
  const payloadCandidates = (rawEvent) => {
    const trimmed = rawEvent.trim();
    const candidates = [];
    // Whole-event form: everything after a leading "data:". Kept so payloads
    // that span several lines without repeating the prefix still parse.
    if (trimmed.startsWith("data:")) candidates.push(trimmed.slice(5).trim());
    // Field-aware form: collect only the data lines, so events that begin
    // with "event:", "id:" or a comment line are no longer skipped.
    const dataLines = [];
    for (const rawLine of trimmed.split(lineBreak)) {
      const line = rawLine.trim();
      if (line.startsWith("data:")) dataLines.push(line.slice(5).trim());
    }
    if (dataLines.length > 0) {
      const joined = dataLines.join("\n");
      if (!candidates.includes(joined)) candidates.push(joined);
    }
    return candidates;
  };
  // Records usage from one raw event, if it carries any.
  const inspectEvent = (rawEvent) => {
    for (const payload of payloadCandidates(rawEvent)) {
      if (!payload || payload === "[DONE]") continue;
      let parsed;
      try {
        parsed = JSON.parse(payload);
      } catch {
        // Not JSON in this form; usage tracking is best-effort.
        continue;
      }
      if (parsed && parsed.usage) extractedUsage = {
        promptTokens: parsed.usage.prompt_tokens ?? 0,
        completionTokens: parsed.usage.completion_tokens ?? 0,
        totalTokens: parsed.usage.total_tokens ?? 0,
        cachedTokens: parsed.usage.prompt_tokens_details?.cached_tokens
      };
      return;
    }
  };
  return {
    stream: new TransformStream({
      transform(chunk, controller) {
        // Forward first so inspection can never delay or drop client data.
        controller.enqueue(chunk);
        buffer += decoder.decode(chunk, { stream: true });
        const events = buffer.split(eventBoundary);
        // The last piece may be an incomplete event; keep it for later.
        buffer = events.pop() || "";
        for (const rawEvent of events) inspectEvent(rawEvent);
      },
      flush() {
        // Drain bytes the decoder was holding for an incomplete sequence.
        buffer += decoder.decode();
        for (const rawEvent of buffer.split(eventBoundary)) inspectEvent(rawEvent);
        buffer = "";
        resolveUsage(extractedUsage);
      },
      cancel() {
        // flush() does not run when the consumer aborts; settle the promise
        // here so awaiting callers do not hang. Runtimes without transformer
        // cancel support simply ignore this hook.
        resolveUsage(extractedUsage);
      }
    }),
    usagePromise
  };
}
|
|
13897
|
+
/**
 * Routes a streaming Response body through the usage extractor so token usage
 * can be collected while the bytes are forwarded unchanged in status and headers.
 *
 * A response without a body is handed back untouched, paired with a promise
 * that is already resolved to `null`.
 *
 * @param response - Original streaming Response
 * @returns `{ response, usagePromise }`: the response to send onward and a
 * promise for the usage data produced by the extractor
 *
 * @example
 * ```typescript
 * const { response, usagePromise } = wrapStreamingResponse(upstream);
 *
 * // Kick off cost tracking; it completes once the extractor resolves
 * usagePromise.then((usage) => {
 *   if (usage) {
 *     trackCost(usage);
 *   }
 * });
 *
 * // Hand the wrapped response to the client
 * return response;
 * ```
 */
function wrapStreamingResponse(response) {
	const sourceBody = response.body;
	if (!sourceBody) {
		return {
			response,
			usagePromise: Promise.resolve(null)
		};
	}
	const extractor = createStreamingCostExtractor();
	const pipedBody = sourceBody.pipeThrough(extractor.stream);
	const { status, statusText, headers } = response;
	const wrapped = new Response(pipedBody, {
		status,
		statusText,
		headers
	});
	return {
		response: wrapped,
		usagePromise: extractor.usagePromise
	};
}
|
|
13934
|
+
/**
 * Turns on `stream_options.include_usage` for streaming requests so usage can
 * be tracked. Only bodies whose `stream` is exactly `true` are touched; any
 * existing `stream_options` entries are kept and `include_usage` is forced on.
 * The body object is mutated in place.
 *
 * @param body - Request body (will be modified)
 * @returns The same body object that was passed in
 */
function ensureStreamUsageEnabled(body) {
	if (body.stream !== true) return body;
	const existingOptions = body.stream_options || {};
	body.stream_options = {
		...existingOptions,
		include_usage: true
	};
	return body;
}
|
|
13948
|
+
|
|
13949
|
+
//#endregion
|
|
13950
|
+
//#region src/server/services/batchWriter.ts
|
|
13951
|
+
/**
 * Creates a BatchWriter instance that buffers request records in memory and
 * writes them through `deps.batchInsertRequests` in batches.
 *
 * The periodic timer starts on the first `enqueue` call. A batch is written
 * when the timer fires, when the queue reaches `maxBatchSize`, or when
 * `flush`/`stop` is called. A failed write puts the batch back at the front
 * of the queue so it is retried by the next flush.
 *
 * @param deps - Object exposing `batchInsertRequests(batch)`, which must
 * resolve to an object with a `count` property
 * @param config$1 - Optional settings: `flushIntervalMs` (default 2000),
 * `maxBatchSize` (default 100), `debug` (default false)
 * @returns `{ enqueue, flush, stop, queueLength, isRunning }`
 *
 * @example
 * ```typescript
 * const writer = createBatchWriter(
 *   { batchInsertRequests: db.batchInsertRequests },
 *   { flushIntervalMs: 2000 }
 * );
 *
 * // Enqueue a request
 * writer.enqueue({
 *   requestId: 'req-123',
 *   provider: 'openai',
 *   model: 'gpt-4o',
 *   // ... other fields
 * });
 *
 * // When shutting down
 * await writer.stop();
 * ```
 */
function createBatchWriter(deps, config$1 = {}) {
	const { flushIntervalMs = 2e3, maxBatchSize = 100, debug = false } = config$1;
	let queue = [];
	let flushTimer = null;
	let running = false;
	/** Promise of the write currently in progress, or null when idle. */
	let inFlight = null;
	const log = debug ? (msg) => __llmops_core.logger.debug(msg) : () => {};
	/**
	 * Write one batch; on failure the batch is put back in front of anything
	 * enqueued in the meantime so ordering is preserved for the retry.
	 */
	async function writeBatch(batch) {
		try {
			log(`[BatchWriter] Flushing ${batch.length} requests`);
			log(`[BatchWriter] Flushed ${(await deps.batchInsertRequests(batch)).count} requests successfully`);
		} catch (error$45) {
			const errorMsg = error$45 instanceof Error ? error$45.message : String(error$45);
			__llmops_core.logger.error(`[BatchWriter] Flush failed, re-queuing requests: ${errorMsg}`);
			queue = [...batch, ...queue];
		}
	}
	/**
	 * Flush all queued requests to the database.
	 *
	 * Only one write runs at a time: while a write is in progress, callers get
	 * the promise of that write instead of starting a second one.
	 */
	function flush() {
		if (inFlight) return inFlight;
		if (queue.length === 0) return Promise.resolve();
		const batch = queue;
		queue = [];
		inFlight = writeBatch(batch).finally(() => {
			inFlight = null;
		});
		return inFlight;
	}
	/**
	 * Start the periodic flush timer
	 */
	function start() {
		if (running) return;
		running = true;
		flushTimer = setInterval(() => {
			flush().catch((err) => {
				const errorMsg = err instanceof Error ? err.message : String(err);
				__llmops_core.logger.error(`[BatchWriter] Periodic flush error: ${errorMsg}`);
			});
		}, flushIntervalMs);
		log(`[BatchWriter] Started with ${flushIntervalMs}ms flush interval`);
	}
	/**
	 * Stop the batch writer and flush remaining items
	 */
	async function stop() {
		if (!running) return;
		running = false;
		if (flushTimer) {
			clearInterval(flushTimer);
			flushTimer = null;
		}
		// Wait for a write that is already running before the final drain;
		// otherwise items enqueued during that write would be left behind.
		if (inFlight) await inFlight;
		await flush();
		log("[BatchWriter] Stopped");
	}
	/**
	 * Add a request to the batch queue
	 */
	function enqueue(request) {
		queue.push(request);
		log(`[BatchWriter] Enqueued request ${request.requestId}, queue size: ${queue.length}`);
		if (!running) start();
		if (queue.length >= maxBatchSize) {
			log(`[BatchWriter] Max batch size reached, forcing flush`);
			flush().catch((err) => {
				const errorMsg = err instanceof Error ? err.message : String(err);
				__llmops_core.logger.error(`[BatchWriter] Forced flush error: ${errorMsg}`);
			});
		}
	}
	return {
		enqueue,
		flush,
		stop,
		queueLength: () => queue.length,
		isRunning: () => running
	};
}
|
|
14049
|
+
/**
 * Module-level BatchWriter shared by all callers.
 * Remains null until getGlobalBatchWriter creates it.
 */
let globalWriter = null;
/**
 * Returns the shared BatchWriter, creating it the first time it is requested.
 * Once an instance exists, `deps` and `config` passed on later calls are not used.
 *
 * @param deps - Database dependencies (required on first call)
 * @param config - Optional configuration
 * @returns The global BatchWriter instance
 * @throws Error when no instance exists yet and `deps` is missing
 */
function getGlobalBatchWriter(deps, config$1) {
	if (globalWriter) return globalWriter;
	if (!deps) throw new Error("BatchWriter dependencies required on first initialization");
	globalWriter = createBatchWriter(deps, config$1);
	return globalWriter;
}
|
|
14068
|
+
|
|
14069
|
+
//#endregion
|
|
14070
|
+
//#region src/server/middlewares/costTracking.ts
|
|
14071
|
+
/**
 * Computes input, output and total cost in micro-dollars
 * (1 dollar = 1,000,000 micro-dollars).
 *
 * Each side is the token count multiplied by the matching per-1M price and
 * rounded to the nearest integer; the total is the sum of the two rounded
 * values. (Presumably the per-1M prices are in dollars, which is why no
 * further scaling is applied; confirm against the pricing source.)
 *
 * @param usage - Object with `promptTokens` and `completionTokens`
 * @param pricing - Object with `inputCostPer1M` and `outputCostPer1M`
 * @returns `{ inputCost, outputCost, totalCost }`
 */
function calculateCost(usage, pricing) {
	const toRoundedCost = (tokens, pricePer1M) => Math.round(tokens * pricePer1M);
	const inputCost = toRoundedCost(usage.promptTokens, pricing.inputCostPer1M);
	const outputCost = toRoundedCost(usage.completionTokens, pricing.outputCostPer1M);
	const totalCost = inputCost + outputCost;
	return {
		inputCost,
		outputCost,
		totalCost
	};
}
|
|
14084
|
+
/**
 * Simple pricing provider that fetches from models.dev
 *
 * Pricing is kept in an in-memory map keyed by lower-cased
 * `provider:model`. The map is refreshed when it is empty or older than
 * `cacheTTL`; concurrent lookups share a single refresh. A refresh that fails
 * (network error, timeout, non-OK status, or a payload with no usable entries)
 * leaves the previous map in place and is not retried until `retryDelay` has
 * elapsed, so a broken upstream is not hit on every lookup.
 */
var PricingProvider = class {
	cache = /* @__PURE__ */ new Map();
	lastFetch = 0;
	cacheTTL = 300 * 1e3;
	/** Time (ms since epoch) of the latest failed refresh; 0 when the latest refresh succeeded. */
	lastFailure = 0;
	/** Minimum wait after a failed refresh before trying again. */
	retryDelay = 30 * 1e3;
	/** Upper bound for a single pricing download. */
	fetchTimeout = 10 * 1e3;
	fetchPromise = null;
	/** Build the case-insensitive cache key for a provider/model pair. */
	getCacheKey(provider, model) {
		return `${provider.toLowerCase()}:${model.toLowerCase()}`;
	}
	/**
	 * Download the pricing catalogue and replace the cache with it.
	 * Never rejects: failures are recorded in `lastFailure` instead.
	 */
	async fetchPricingData() {
		try {
			// Bound the request so a hung connection cannot stall every caller
			// awaiting the shared refresh promise.
			const signal = typeof AbortSignal !== "undefined" && typeof AbortSignal.timeout === "function" ? AbortSignal.timeout(this.fetchTimeout) : void 0;
			const response = await fetch("https://models.dev/api.json", { signal });
			if (!response.ok) {
				this.lastFailure = Date.now();
				return;
			}
			const data = await response.json();
			// Build into a fresh map and swap it in only once parsing finished,
			// so a malformed payload can never leave a half-filled cache behind.
			const fresh = /* @__PURE__ */ new Map();
			for (const [providerId, provider] of Object.entries(data ?? {})) {
				const models = provider?.models;
				if (!models) continue;
				for (const model of Object.values(models)) {
					// Entries without pricing or without a string id cannot be keyed.
					if (!model?.cost || typeof model.id !== "string") continue;
					fresh.set(this.getCacheKey(providerId, model.id), {
						inputCostPer1M: model.cost.input ?? 0,
						outputCostPer1M: model.cost.output ?? 0
					});
				}
			}
			if (fresh.size === 0) {
				this.lastFailure = Date.now();
				return;
			}
			this.cache = fresh;
			this.lastFetch = Date.now();
			this.lastFailure = 0;
		} catch {
			// Pricing is best-effort: keep whatever is cached and back off.
			this.lastFailure = Date.now();
		}
	}
	/** Refresh the cache when it is empty or stale, unless a recent refresh failed. */
	async ensureFreshCache() {
		const now = Date.now();
		if (now - this.lastFetch < this.cacheTTL && this.cache.size > 0) return;
		if (!this.fetchPromise) {
			if (now - this.lastFailure < this.retryDelay) return;
			this.fetchPromise = this.fetchPricingData().finally(() => {
				this.fetchPromise = null;
			});
		}
		await this.fetchPromise;
	}
	/**
	 * Look up pricing for a provider/model pair.
	 *
	 * @returns `{ inputCostPer1M, outputCostPer1M }`, or `null` when unknown
	 */
	async getModelPricing(provider, model) {
		await this.ensureFreshCache();
		return this.cache.get(this.getCacheKey(provider, model)) || null;
	}
};
const pricingProvider = new PricingProvider();
|
|
14129
|
+
/**
 * Creates cost tracking middleware that logs LLM requests with usage and cost data.
 *
 * Features:
 * - Tracks both streaming and non-streaming requests
 * - Calculates costs using models.dev pricing data
 * - Batches database writes for performance
 * - Adds x-llmops-request-id header for tracing
 *
 * Only paths ending in `/completions` (which includes `/chat/completions`)
 * are tracked; everything else is passed straight to `next()`.
 *
 * For streaming requests the body is rewritten so `stream_options.include_usage`
 * is enabled, and the response body is wrapped so usage can be read from the
 * stream; logging then happens asynchronously once usage is available. For
 * non-streaming requests usage is read from a clone of the JSON response.
 *
 * @param config$1 - Optional settings: `enabled` (default true), `trackErrors`
 * (default true), `flushIntervalMs` (default 2000), `debug` (default false)
 * @returns An async `(c, next)` middleware function
 */
function createCostTrackingMiddleware(config$1 = {}) {
	const { enabled = true, trackErrors = true, flushIntervalMs = 2e3, debug = false } = config$1;
	const log = debug ? (msg) => __llmops_core.logger.debug(`[CostTracking] ${msg}`) : () => {};
	return async (c, next) => {
		if (!enabled) return next();
		const path$1 = c.req.path;
		// "/chat/completions" also ends with "/completions", so one suffix check covers both endpoints.
		if (!path$1.endsWith("/completions")) return next();
		const requestId = (0, node_crypto.randomUUID)();
		const startTime = Date.now();
		c.header("x-llmops-request-id", requestId);
		let body = {};
		let isStreaming = false;
		try {
			const parsedBody = await c.req.raw.clone().json();
			// A JSON body of literal `null` must not replace the default object:
			// property reads on it below would throw and fail the request.
			if (parsedBody !== null && typeof parsedBody === "object") body = parsedBody;
			else log("Request body is not a JSON object");
			isStreaming = body.stream === true;
			if (isStreaming) {
				body = ensureStreamUsageEnabled(body);
				const newHeaders = new Headers(c.req.raw.headers);
				// The serialized body differs from the original one, so the
				// original Content-Length no longer describes it.
				newHeaders.delete("content-length");
				const newRequest = new Request(c.req.raw.url, {
					method: c.req.raw.method,
					headers: newHeaders,
					body: JSON.stringify(body),
					duplex: "half"
				});
				Object.defineProperty(c.req, "raw", {
					value: newRequest,
					writable: true,
					configurable: true
				});
				// Reset the cached body so later readers see the rewritten request.
				c.req.bodyCache = {};
			}
		} catch {
			log("Failed to parse request body");
		}
		const context = {
			requestId,
			startTime,
			provider: "",
			model: body.model || "",
			configId: c.get("configId"),
			endpoint: path$1,
			isStreaming
		};
		c.set("__costTrackingContext", context);
		await next();
		const response = c.res;
		const statusCode = response.status;
		// Measured when next() returns; for streaming responses this is taken
		// before the usage promise settles.
		const latencyMs = Date.now() - startTime;
		const variantModel = c.get("variantModel") || context.model;
		let provider = "unknown";
		const llmopsConfigHeader = c.req.header("x-llmops-config");
		if (llmopsConfigHeader) try {
			provider = JSON.parse(llmopsConfigHeader).provider || provider;
		} catch {}
		if (!variantModel) {
			log(`Skipping request tracking - no model info`);
			return;
		}
		const db = c.get("db");
		const batchWriter = getGlobalBatchWriter({ batchInsertRequests: (requests) => db.batchInsertRequests(requests) }, {
			flushIntervalMs,
			debug
		});
		if (isStreaming && response.body) {
			const { response: wrappedResponse, usagePromise } = wrapStreamingResponse(response);
			c.res = wrappedResponse;
			// Not awaited: usage only becomes available after the stream has been consumed.
			usagePromise.then(async (usage) => {
				await processUsageAndLog({
					requestId,
					provider,
					model: variantModel,
					configId: c.get("configId"),
					variantId: c.get("variantId"),
					endpoint: context.endpoint,
					statusCode,
					latencyMs,
					isStreaming: true,
					usage: usage ? {
						promptTokens: usage.promptTokens,
						completionTokens: usage.completionTokens,
						totalTokens: usage.totalTokens,
						cachedTokens: usage.cachedTokens
					} : null,
					batchWriter,
					trackErrors,
					log
				});
			}).catch((err) => {
				__llmops_core.logger.error(`[CostTracking] Failed to process streaming usage: ${err}`);
			});
		} else {
			let usage = null;
			try {
				// Read from a clone so the original response body stays unread.
				const responseBody = await response.clone().json();
				if (responseBody.usage) usage = {
					promptTokens: responseBody.usage.prompt_tokens || 0,
					completionTokens: responseBody.usage.completion_tokens || 0,
					totalTokens: responseBody.usage.total_tokens || 0,
					cachedTokens: responseBody.usage.prompt_tokens_details?.cached_tokens
				};
			} catch {
				log("Failed to parse response body for usage");
			}
			await processUsageAndLog({
				requestId,
				provider,
				model: variantModel,
				configId: c.get("configId"),
				variantId: c.get("variantId"),
				endpoint: context.endpoint,
				statusCode,
				latencyMs,
				isStreaming: false,
				usage,
				batchWriter,
				trackErrors,
				log
			});
		}
	};
}
|
|
14259
|
+
/**
 * Builds the request record for one tracked call and hands it to the batch
 * writer.
 *
 * Error responses (status >= 400) are dropped when `trackErrors` is off.
 * Cost is looked up only when usage reports at least one prompt or completion
 * token; if pricing is missing or the lookup throws, all cost fields stay 0
 * and the record is still enqueued.
 *
 * @param params - Request metadata (`requestId`, `provider`, `model`,
 * `configId`, `variantId`, `endpoint`, `statusCode`, `latencyMs`,
 * `isStreaming`), the `usage` object or null, plus the `batchWriter`,
 * `trackErrors` flag and `log` function to use
 */
async function processUsageAndLog(params) {
	const { requestId, provider, model, configId, variantId, endpoint, statusCode, latencyMs, isStreaming, usage, batchWriter, trackErrors, log } = params;
	const isErrorResponse = statusCode >= 400;
	if (isErrorResponse && !trackErrors) {
		log(`Skipping error response (${statusCode})`);
		return;
	}
	let cost = 0;
	let inputCost = 0;
	let outputCost = 0;
	const hasBillableTokens = Boolean(usage && usage.promptTokens + usage.completionTokens > 0);
	if (hasBillableTokens) {
		try {
			const pricing = await pricingProvider.getModelPricing(provider, model);
			if (!pricing) {
				log(`No pricing found for ${provider}/${model}`);
			} else {
				const { promptTokens, completionTokens } = usage;
				const breakdown = calculateCost({
					promptTokens,
					completionTokens
				}, pricing);
				cost = breakdown.totalCost;
				inputCost = breakdown.inputCost;
				outputCost = breakdown.outputCost;
				log(`Calculated cost: ${cost} micro-dollars for ${provider}/${model}`);
			}
		} catch (err) {
			__llmops_core.logger.error(`[CostTracking] Failed to calculate cost: ${err}`);
		}
	}
	// Missing ids become null and missing token counts become 0 in the record.
	batchWriter.enqueue({
		requestId,
		configId: configId || null,
		variantId: variantId || null,
		provider,
		model,
		promptTokens: usage?.promptTokens || 0,
		completionTokens: usage?.completionTokens || 0,
		totalTokens: usage?.totalTokens || 0,
		cachedTokens: usage?.cachedTokens || 0,
		cost,
		inputCost,
		outputCost,
		endpoint,
		statusCode,
		latencyMs,
		isStreaming,
		tags: {}
	});
	log(`Enqueued request ${requestId} for logging`);
}
|
|
14308
|
+
|
|
13571
14309
|
//#endregion
|
|
13572
14310
|
//#region src/server/handlers/genai/index.ts
|
|
13573
14311
|
const app$2 = new hono.Hono();
|
|
13574
14312
|
app$2.use("*", (0, hono_pretty_json.prettyJSON)()).get("/health", async (c) => {
|
|
13575
14313
|
return c.json({ status: "healthy" });
|
|
13576
|
-
}).use("*", requestValidator).use("*", createRequestGuardMiddleware()).use("*", createGatewayAdapterMiddleware()).route("/", __llmops_gateway.default).notFound((c) => c.json({ error: {
|
|
14314
|
+
}).use("*", requestValidator).use("*", createRequestGuardMiddleware()).use("*", createCostTrackingMiddleware()).use("*", createGatewayAdapterMiddleware()).route("/", __llmops_gateway.default).notFound((c) => c.json({ error: {
|
|
13577
14315
|
message: "Not Found",
|
|
13578
14316
|
type: "invalid_request_error"
|
|
13579
14317
|
} }, 404)).onError((err, c) => {
|
|
@@ -13604,10 +14342,12 @@ app.use("/assets/*", (0, hono_serve_static.serveStatic)({
|
|
|
13604
14342
|
if (!c.req.path.startsWith("/api")) {
|
|
13605
14343
|
const basePath = c.var.llmopsConfig?.basePath || "";
|
|
13606
14344
|
const llmProviders = c.var.llmProviders || [];
|
|
14345
|
+
const authType = c.var.llmopsConfig?.auth?.type || "basic";
|
|
13607
14346
|
return c.html(renderer({
|
|
13608
14347
|
basePath,
|
|
13609
14348
|
dev: node_process.env.LLMOPS_DEV === "true",
|
|
13610
|
-
llmProviders
|
|
14349
|
+
llmProviders,
|
|
14350
|
+
authType
|
|
13611
14351
|
}));
|
|
13612
14352
|
}
|
|
13613
14353
|
await next();
|