steroids-cli 0.10.62 → 0.11.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +1 -0
- package/dist/commands/hf.d.ts +11 -0
- package/dist/commands/hf.d.ts.map +1 -0
- package/dist/commands/hf.js +51 -0
- package/dist/commands/hf.js.map +1 -0
- package/dist/config/ai-setup.d.ts +1 -1
- package/dist/config/ai-setup.d.ts.map +1 -1
- package/dist/config/loader.d.ts +1 -1
- package/dist/config/loader.d.ts.map +1 -1
- package/dist/config/loader.js +3 -1
- package/dist/config/loader.js.map +1 -1
- package/dist/config/schema.js +3 -3
- package/dist/config/schema.js.map +1 -1
- package/dist/huggingface/auth.d.ts +25 -0
- package/dist/huggingface/auth.d.ts.map +1 -0
- package/dist/huggingface/auth.js +120 -0
- package/dist/huggingface/auth.js.map +1 -0
- package/dist/huggingface/hub-client.d.ts +101 -0
- package/dist/huggingface/hub-client.d.ts.map +1 -0
- package/dist/huggingface/hub-client.js +119 -0
- package/dist/huggingface/hub-client.js.map +1 -0
- package/dist/huggingface/metrics.d.ts +58 -0
- package/dist/huggingface/metrics.d.ts.map +1 -0
- package/dist/huggingface/metrics.js +272 -0
- package/dist/huggingface/metrics.js.map +1 -0
- package/dist/huggingface/model-registry.d.ts +74 -0
- package/dist/huggingface/model-registry.d.ts.map +1 -0
- package/dist/huggingface/model-registry.js +334 -0
- package/dist/huggingface/model-registry.js.map +1 -0
- package/dist/index.js +5 -0
- package/dist/index.js.map +1 -1
- package/dist/ollama/api-client.d.ts +138 -0
- package/dist/ollama/api-client.d.ts.map +1 -0
- package/dist/ollama/api-client.js +229 -0
- package/dist/ollama/api-client.js.map +1 -0
- package/dist/ollama/connection.d.ts +35 -0
- package/dist/ollama/connection.d.ts.map +1 -0
- package/dist/ollama/connection.js +243 -0
- package/dist/ollama/connection.js.map +1 -0
- package/dist/ollama/metrics.d.ts +32 -0
- package/dist/ollama/metrics.d.ts.map +1 -0
- package/dist/ollama/metrics.js +70 -0
- package/dist/ollama/metrics.js.map +1 -0
- package/dist/ollama/model-registry.d.ts +33 -0
- package/dist/ollama/model-registry.d.ts.map +1 -0
- package/dist/ollama/model-registry.js +117 -0
- package/dist/ollama/model-registry.js.map +1 -0
- package/dist/providers/huggingface.d.ts +40 -0
- package/dist/providers/huggingface.d.ts.map +1 -0
- package/dist/providers/huggingface.js +391 -0
- package/dist/providers/huggingface.js.map +1 -0
- package/dist/providers/index.d.ts +1 -0
- package/dist/providers/index.d.ts.map +1 -1
- package/dist/providers/index.js +5 -1
- package/dist/providers/index.js.map +1 -1
- package/dist/providers/interface.d.ts +1 -1
- package/dist/providers/interface.d.ts.map +1 -1
- package/dist/providers/interface.js +9 -0
- package/dist/providers/interface.js.map +1 -1
- package/dist/providers/ollama-error-utils.d.ts +12 -0
- package/dist/providers/ollama-error-utils.d.ts.map +1 -0
- package/dist/providers/ollama-error-utils.js +60 -0
- package/dist/providers/ollama-error-utils.js.map +1 -0
- package/dist/providers/ollama-utils.d.ts +17 -0
- package/dist/providers/ollama-utils.d.ts.map +1 -0
- package/dist/providers/ollama-utils.js +115 -0
- package/dist/providers/ollama-utils.js.map +1 -0
- package/dist/providers/ollama.d.ts +15 -34
- package/dist/providers/ollama.d.ts.map +1 -1
- package/dist/providers/ollama.js +365 -206
- package/dist/providers/ollama.js.map +1 -1
- package/dist/providers/registry.d.ts.map +1 -1
- package/dist/providers/registry.js +2 -0
- package/dist/providers/registry.js.map +1 -1
- package/dist/runners/global-db-connection.d.ts.map +1 -1
- package/dist/runners/global-db-connection.js +7 -0
- package/dist/runners/global-db-connection.js.map +1 -1
- package/dist/runners/global-db-schema-migrations-v17-v20.d.ts +10 -0
- package/dist/runners/global-db-schema-migrations-v17-v20.d.ts.map +1 -0
- package/dist/runners/global-db-schema-migrations-v17-v20.js +104 -0
- package/dist/runners/global-db-schema-migrations-v17-v20.js.map +1 -0
- package/dist/runners/global-db-schema.d.ts +2 -4
- package/dist/runners/global-db-schema.d.ts.map +1 -1
- package/dist/runners/global-db-schema.js +15 -50
- package/dist/runners/global-db-schema.js.map +1 -1
- package/dist/runners/global-db.d.ts +1 -1
- package/dist/runners/global-db.d.ts.map +1 -1
- package/dist/runners/global-db.js +3 -1
- package/dist/runners/global-db.js.map +1 -1
- package/package.json +1 -1
|
@@ -0,0 +1,58 @@
|
|
|
1
|
+
import type { TokenUsage } from '../providers/interface.js';
|
|
2
|
+
import { HuggingFaceModelRegistry } from './model-registry.js';
|
|
3
|
+
export interface HFRouteSelection {
|
|
4
|
+
baseModel: string;
|
|
5
|
+
routingPolicy: string;
|
|
6
|
+
explicitProvider: string | null;
|
|
7
|
+
}
|
|
8
|
+
export interface HFHubRateLimitSnapshot {
|
|
9
|
+
remaining: number | null;
|
|
10
|
+
limit: number | null;
|
|
11
|
+
resetSeconds: number | null;
|
|
12
|
+
windowSeconds: number | null;
|
|
13
|
+
observedAtMs: number;
|
|
14
|
+
}
|
|
15
|
+
export interface HFUsageSummary {
|
|
16
|
+
promptTokens: number;
|
|
17
|
+
completionTokens: number;
|
|
18
|
+
totalTokens: number;
|
|
19
|
+
requests: number;
|
|
20
|
+
estimatedCostUsd: number;
|
|
21
|
+
}
|
|
22
|
+
export interface HFUsageByModel {
|
|
23
|
+
model: string;
|
|
24
|
+
provider: string | null;
|
|
25
|
+
routingPolicy: string;
|
|
26
|
+
promptTokens: number;
|
|
27
|
+
completionTokens: number;
|
|
28
|
+
totalTokens: number;
|
|
29
|
+
requests: number;
|
|
30
|
+
estimatedCostUsd: number;
|
|
31
|
+
}
|
|
32
|
+
export interface HFUsageDashboard {
|
|
33
|
+
today: HFUsageSummary;
|
|
34
|
+
byModel7d: HFUsageByModel[];
|
|
35
|
+
}
|
|
36
|
+
export declare function parseRoutedModel(model: string): HFRouteSelection;
|
|
37
|
+
export declare function parseHubRateLimitHeaders(headers: Headers | {
|
|
38
|
+
rateLimit?: string | null;
|
|
39
|
+
rateLimitPolicy?: string | null;
|
|
40
|
+
}, nowMs?: number): HFHubRateLimitSnapshot | null;
|
|
41
|
+
export declare function extractInferenceProviderFromHeaders(headers: Headers): string | null;
|
|
42
|
+
export declare class HuggingFaceUsageMetrics {
|
|
43
|
+
private readonly registry;
|
|
44
|
+
constructor(options?: {
|
|
45
|
+
registry?: Pick<HuggingFaceModelRegistry, 'getCachedModel'>;
|
|
46
|
+
});
|
|
47
|
+
recordInvocationUsage(input: {
|
|
48
|
+
requestedModel: string;
|
|
49
|
+
role?: 'orchestrator' | 'coder' | 'reviewer';
|
|
50
|
+
tokenUsage?: TokenUsage;
|
|
51
|
+
providerHint?: string | null;
|
|
52
|
+
createdAtMs?: number;
|
|
53
|
+
}): void;
|
|
54
|
+
getDashboardUsage(): HFUsageDashboard;
|
|
55
|
+
getUsageSummary(hours: number): HFUsageSummary;
|
|
56
|
+
getUsageByModel(hours: number, limit?: number): HFUsageByModel[];
|
|
57
|
+
}
|
|
58
|
+
//# sourceMappingURL=metrics.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"metrics.d.ts","sourceRoot":"","sources":["../../src/huggingface/metrics.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,UAAU,EAAE,MAAM,2BAA2B,CAAC;AAE5D,OAAO,EAAE,wBAAwB,EAAsB,MAAM,qBAAqB,CAAC;AAInF,MAAM,WAAW,gBAAgB;IAC/B,SAAS,EAAE,MAAM,CAAC;IAClB,aAAa,EAAE,MAAM,CAAC;IACtB,gBAAgB,EAAE,MAAM,GAAG,IAAI,CAAC;CACjC;AAED,MAAM,WAAW,sBAAsB;IACrC,SAAS,EAAE,MAAM,GAAG,IAAI,CAAC;IACzB,KAAK,EAAE,MAAM,GAAG,IAAI,CAAC;IACrB,YAAY,EAAE,MAAM,GAAG,IAAI,CAAC;IAC5B,aAAa,EAAE,MAAM,GAAG,IAAI,CAAC;IAC7B,YAAY,EAAE,MAAM,CAAC;CACtB;AAED,MAAM,WAAW,cAAc;IAC7B,YAAY,EAAE,MAAM,CAAC;IACrB,gBAAgB,EAAE,MAAM,CAAC;IACzB,WAAW,EAAE,MAAM,CAAC;IACpB,QAAQ,EAAE,MAAM,CAAC;IACjB,gBAAgB,EAAE,MAAM,CAAC;CAC1B;AAED,MAAM,WAAW,cAAc;IAC7B,KAAK,EAAE,MAAM,CAAC;IACd,QAAQ,EAAE,MAAM,GAAG,IAAI,CAAC;IACxB,aAAa,EAAE,MAAM,CAAC;IACtB,YAAY,EAAE,MAAM,CAAC;IACrB,gBAAgB,EAAE,MAAM,CAAC;IACzB,WAAW,EAAE,MAAM,CAAC;IACpB,QAAQ,EAAE,MAAM,CAAC;IACjB,gBAAgB,EAAE,MAAM,CAAC;CAC1B;AAED,MAAM,WAAW,gBAAgB;IAC/B,KAAK,EAAE,cAAc,CAAC;IACtB,SAAS,EAAE,cAAc,EAAE,CAAC;CAC7B;AAYD,wBAAgB,gBAAgB,CAAC,KAAK,EAAE,MAAM,GAAG,gBAAgB,CAqChE;AAED,wBAAgB,wBAAwB,CACtC,OAAO,EACH,OAAO,GACP;IACA,SAAS,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAC1B,eAAe,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;CACjC,EACH,KAAK,SAAa,GACjB,sBAAsB,GAAG,IAAI,CAe/B;AAED,wBAAgB,mCAAmC,CAAC,OAAO,EAAE,OAAO,GAAG,MAAM,GAAG,IAAI,CAgBnF;AAED,qBAAa,uBAAuB;IAClC,OAAO,CAAC,QAAQ,CAAC,QAAQ,CAAmD;gBAEhE,OAAO,GAAE;QAAE,QAAQ,CAAC,EAAE,IAAI,CAAC,wBAAwB,EAAE,gBAAgB,CAAC,CAAA;KAAO;IAIzF,qBAAqB,CAAC,KAAK,EAAE;QAC3B,cAAc,EAAE,MAAM,CAAC;QACvB,IAAI,CAAC,EAAE,cAAc,GAAG,OAAO,GAAG,UAAU,CAAC;QAC7C,UAAU,CAAC,EAAE,UAAU,CAAC;QACxB,YAAY,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;QAC7B,WAAW,CAAC,EAAE,MAAM,CAAC;KACtB,GAAG,IAAI;IAsCR,iBAAiB,IAAI,gBAAgB;IAOrC,eAAe,CAAC,KAAK,EAAE,MAAM,GAAG,cAAc;IA4B9C,eAAe,CAAC,KAAK,EAAE,MAAM,EAAE,KAAK,SAAI,GAAG,cAAc,EAAE;CAyC5D"}
|
|
@@ -0,0 +1,272 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
|
3
|
+
exports.HuggingFaceUsageMetrics = void 0;
|
|
4
|
+
exports.parseRoutedModel = parseRoutedModel;
|
|
5
|
+
exports.parseHubRateLimitHeaders = parseHubRateLimitHeaders;
|
|
6
|
+
exports.extractInferenceProviderFromHeaders = extractInferenceProviderFromHeaders;
|
|
7
|
+
const global_db_js_1 = require("../runners/global-db.js");
|
|
8
|
+
const model_registry_js_1 = require("./model-registry.js");
|
|
9
|
+
const BASE_ROUTING_POLICIES = new Set(['fastest', 'cheapest', 'preferred']);
|
|
10
|
+
function parseRoutedModel(model) {
|
|
11
|
+
const trimmed = model.trim();
|
|
12
|
+
if (!trimmed) {
|
|
13
|
+
return {
|
|
14
|
+
baseModel: '',
|
|
15
|
+
routingPolicy: 'fastest',
|
|
16
|
+
explicitProvider: null,
|
|
17
|
+
};
|
|
18
|
+
}
|
|
19
|
+
const suffixIndex = trimmed.lastIndexOf(':');
|
|
20
|
+
if (suffixIndex <= 0) {
|
|
21
|
+
return {
|
|
22
|
+
baseModel: trimmed,
|
|
23
|
+
routingPolicy: 'fastest',
|
|
24
|
+
explicitProvider: null,
|
|
25
|
+
};
|
|
26
|
+
}
|
|
27
|
+
const baseModel = trimmed.slice(0, suffixIndex).trim();
|
|
28
|
+
const suffix = trimmed.slice(suffixIndex + 1).trim();
|
|
29
|
+
if (!suffix) {
|
|
30
|
+
return {
|
|
31
|
+
baseModel,
|
|
32
|
+
routingPolicy: 'fastest',
|
|
33
|
+
explicitProvider: null,
|
|
34
|
+
};
|
|
35
|
+
}
|
|
36
|
+
const routingPolicy = suffix.toLowerCase();
|
|
37
|
+
const explicitProvider = BASE_ROUTING_POLICIES.has(routingPolicy) ? null : routingPolicy;
|
|
38
|
+
return {
|
|
39
|
+
baseModel,
|
|
40
|
+
routingPolicy,
|
|
41
|
+
explicitProvider,
|
|
42
|
+
};
|
|
43
|
+
}
|
|
44
|
+
function parseHubRateLimitHeaders(headers, nowMs = Date.now()) {
|
|
45
|
+
const rateLimit = getHeaderValue(headers, 'ratelimit');
|
|
46
|
+
const rateLimitPolicy = getHeaderValue(headers, 'ratelimit-policy');
|
|
47
|
+
if (!rateLimit && !rateLimitPolicy) {
|
|
48
|
+
return null;
|
|
49
|
+
}
|
|
50
|
+
return {
|
|
51
|
+
remaining: parseHeaderMetric(rateLimit, 'r'),
|
|
52
|
+
limit: parseHeaderMetric(rateLimitPolicy, 'q'),
|
|
53
|
+
resetSeconds: parseHeaderMetric(rateLimit, 't'),
|
|
54
|
+
windowSeconds: parseHeaderMetric(rateLimitPolicy, 'w'),
|
|
55
|
+
observedAtMs: nowMs,
|
|
56
|
+
};
|
|
57
|
+
}
|
|
58
|
+
function extractInferenceProviderFromHeaders(headers) {
|
|
59
|
+
const candidates = [
|
|
60
|
+
'x-hf-inference-provider',
|
|
61
|
+
'x-inference-provider',
|
|
62
|
+
'x-provider',
|
|
63
|
+
'huggingface-inference-provider',
|
|
64
|
+
];
|
|
65
|
+
for (const key of candidates) {
|
|
66
|
+
const value = headers.get(key);
|
|
67
|
+
if (!value)
|
|
68
|
+
continue;
|
|
69
|
+
const provider = value.trim().toLowerCase();
|
|
70
|
+
if (provider)
|
|
71
|
+
return provider;
|
|
72
|
+
}
|
|
73
|
+
return null;
|
|
74
|
+
}
|
|
75
|
+
class HuggingFaceUsageMetrics {
|
|
76
|
+
registry;
|
|
77
|
+
constructor(options = {}) {
|
|
78
|
+
this.registry = options.registry ?? new model_registry_js_1.HuggingFaceModelRegistry();
|
|
79
|
+
}
|
|
80
|
+
recordInvocationUsage(input) {
|
|
81
|
+
const usage = input.tokenUsage;
|
|
82
|
+
if (!usage)
|
|
83
|
+
return;
|
|
84
|
+
const promptTokens = toSafeInt(usage.inputTokens);
|
|
85
|
+
const completionTokens = toSafeInt(usage.outputTokens);
|
|
86
|
+
if (promptTokens === null || completionTokens === null)
|
|
87
|
+
return;
|
|
88
|
+
const route = parseRoutedModel(input.requestedModel);
|
|
89
|
+
if (!route.baseModel)
|
|
90
|
+
return;
|
|
91
|
+
const model = this.registry.getCachedModel(route.baseModel);
|
|
92
|
+
const pricingSelection = selectPricing(model, route.routingPolicy, route.explicitProvider, input.providerHint);
|
|
93
|
+
const estimatedCostUsd = pricingSelection.pricing
|
|
94
|
+
? estimateCostUsd(promptTokens, completionTokens, pricingSelection.pricing.input, pricingSelection.pricing.output)
|
|
95
|
+
: null;
|
|
96
|
+
const { db, close } = (0, global_db_js_1.openGlobalDatabase)();
|
|
97
|
+
try {
|
|
98
|
+
db.prepare(`INSERT INTO hf_usage (
|
|
99
|
+
model, provider, routing_policy, role, prompt_tokens, completion_tokens, estimated_cost_usd, created_at
|
|
100
|
+
) VALUES (?, ?, ?, ?, ?, ?, ?, ?)`).run(route.baseModel, pricingSelection.provider, route.routingPolicy, input.role ?? null, promptTokens, completionTokens, estimatedCostUsd, input.createdAtMs ?? Date.now());
|
|
101
|
+
}
|
|
102
|
+
finally {
|
|
103
|
+
close();
|
|
104
|
+
}
|
|
105
|
+
}
|
|
106
|
+
getDashboardUsage() {
|
|
107
|
+
return {
|
|
108
|
+
today: this.getUsageSummary(24),
|
|
109
|
+
byModel7d: this.getUsageByModel(24 * 7, 8),
|
|
110
|
+
};
|
|
111
|
+
}
|
|
112
|
+
getUsageSummary(hours) {
|
|
113
|
+
const sinceMs = Date.now() - (Math.max(1, hours) * 60 * 60 * 1000);
|
|
114
|
+
const { db, close } = (0, global_db_js_1.openGlobalDatabase)();
|
|
115
|
+
try {
|
|
116
|
+
const row = db.prepare(`SELECT
|
|
117
|
+
COALESCE(SUM(prompt_tokens), 0) AS prompt_tokens,
|
|
118
|
+
COALESCE(SUM(completion_tokens), 0) AS completion_tokens,
|
|
119
|
+
COUNT(*) AS requests,
|
|
120
|
+
COALESCE(SUM(estimated_cost_usd), 0) AS estimated_cost_usd
|
|
121
|
+
FROM hf_usage
|
|
122
|
+
WHERE created_at >= ?`).get(sinceMs);
|
|
123
|
+
const promptTokens = row.prompt_tokens ?? 0;
|
|
124
|
+
const completionTokens = row.completion_tokens ?? 0;
|
|
125
|
+
return {
|
|
126
|
+
promptTokens,
|
|
127
|
+
completionTokens,
|
|
128
|
+
totalTokens: promptTokens + completionTokens,
|
|
129
|
+
requests: row.requests ?? 0,
|
|
130
|
+
estimatedCostUsd: row.estimated_cost_usd ?? 0,
|
|
131
|
+
};
|
|
132
|
+
}
|
|
133
|
+
finally {
|
|
134
|
+
close();
|
|
135
|
+
}
|
|
136
|
+
}
|
|
137
|
+
getUsageByModel(hours, limit = 8) {
|
|
138
|
+
const sinceMs = Date.now() - (Math.max(1, hours) * 60 * 60 * 1000);
|
|
139
|
+
const cappedLimit = Math.max(1, Math.min(50, limit));
|
|
140
|
+
const { db, close } = (0, global_db_js_1.openGlobalDatabase)();
|
|
141
|
+
try {
|
|
142
|
+
const rows = db.prepare(`SELECT
|
|
143
|
+
model,
|
|
144
|
+
provider,
|
|
145
|
+
COALESCE(routing_policy, 'fastest') AS routing_policy,
|
|
146
|
+
COALESCE(SUM(prompt_tokens), 0) AS prompt_tokens,
|
|
147
|
+
COALESCE(SUM(completion_tokens), 0) AS completion_tokens,
|
|
148
|
+
COUNT(*) AS requests,
|
|
149
|
+
COALESCE(SUM(estimated_cost_usd), 0) AS estimated_cost_usd
|
|
150
|
+
FROM hf_usage
|
|
151
|
+
WHERE created_at >= ?
|
|
152
|
+
GROUP BY model, provider, routing_policy
|
|
153
|
+
ORDER BY (COALESCE(SUM(prompt_tokens), 0) + COALESCE(SUM(completion_tokens), 0)) DESC,
|
|
154
|
+
COUNT(*) DESC,
|
|
155
|
+
model ASC
|
|
156
|
+
LIMIT ?`).all(sinceMs, cappedLimit);
|
|
157
|
+
return rows.map((row) => {
|
|
158
|
+
const promptTokens = row.prompt_tokens ?? 0;
|
|
159
|
+
const completionTokens = row.completion_tokens ?? 0;
|
|
160
|
+
return {
|
|
161
|
+
model: row.model,
|
|
162
|
+
provider: row.provider,
|
|
163
|
+
routingPolicy: row.routing_policy ?? 'fastest',
|
|
164
|
+
promptTokens,
|
|
165
|
+
completionTokens,
|
|
166
|
+
totalTokens: promptTokens + completionTokens,
|
|
167
|
+
requests: row.requests ?? 0,
|
|
168
|
+
estimatedCostUsd: row.estimated_cost_usd ?? 0,
|
|
169
|
+
};
|
|
170
|
+
});
|
|
171
|
+
}
|
|
172
|
+
finally {
|
|
173
|
+
close();
|
|
174
|
+
}
|
|
175
|
+
}
|
|
176
|
+
}
|
|
177
|
+
exports.HuggingFaceUsageMetrics = HuggingFaceUsageMetrics;
|
|
178
|
+
function getHeaderValue(headers, key) {
|
|
179
|
+
if (headers instanceof Headers) {
|
|
180
|
+
return headers.get(key);
|
|
181
|
+
}
|
|
182
|
+
if (key === 'ratelimit')
|
|
183
|
+
return headers.rateLimit ?? null;
|
|
184
|
+
return headers.rateLimitPolicy ?? null;
|
|
185
|
+
}
|
|
186
|
+
function parseHeaderMetric(raw, token) {
|
|
187
|
+
if (!raw)
|
|
188
|
+
return null;
|
|
189
|
+
const match = raw.match(new RegExp(`(?:^|[;,\\s])${token}=(\\d+)`, 'i'));
|
|
190
|
+
if (!match)
|
|
191
|
+
return null;
|
|
192
|
+
const parsed = Number.parseInt(match[1], 10);
|
|
193
|
+
return Number.isFinite(parsed) ? parsed : null;
|
|
194
|
+
}
|
|
195
|
+
function toSafeInt(value) {
|
|
196
|
+
if (typeof value !== 'number' || !Number.isFinite(value))
|
|
197
|
+
return null;
|
|
198
|
+
const normalized = Math.round(value);
|
|
199
|
+
return normalized >= 0 ? normalized : null;
|
|
200
|
+
}
|
|
201
|
+
function estimateCostUsd(promptTokens, completionTokens, inputPerMillion, outputPerMillion) {
|
|
202
|
+
return (promptTokens * inputPerMillion / 1_000_000) + (completionTokens * outputPerMillion / 1_000_000);
|
|
203
|
+
}
|
|
204
|
+
function selectPricing(model, routingPolicy, explicitProvider, providerHint) {
|
|
205
|
+
const pricing = model?.pricing;
|
|
206
|
+
if (!pricing || Object.keys(pricing).length === 0) {
|
|
207
|
+
return { provider: explicitProvider ?? providerHint ?? null, pricing: null };
|
|
208
|
+
}
|
|
209
|
+
const providerMap = normalizeProviderMap(pricing);
|
|
210
|
+
const selectedByHint = providerHint ? providerMap.get(providerHint.toLowerCase()) : undefined;
|
|
211
|
+
if (selectedByHint) {
|
|
212
|
+
return {
|
|
213
|
+
provider: selectedByHint.provider,
|
|
214
|
+
pricing: selectedByHint.pricing,
|
|
215
|
+
};
|
|
216
|
+
}
|
|
217
|
+
if (explicitProvider) {
|
|
218
|
+
const byExplicitProvider = providerMap.get(explicitProvider.toLowerCase());
|
|
219
|
+
if (byExplicitProvider) {
|
|
220
|
+
return {
|
|
221
|
+
provider: byExplicitProvider.provider,
|
|
222
|
+
pricing: byExplicitProvider.pricing,
|
|
223
|
+
};
|
|
224
|
+
}
|
|
225
|
+
}
|
|
226
|
+
if (routingPolicy === 'cheapest') {
|
|
227
|
+
const cheapest = Array.from(providerMap.values()).sort((a, b) => {
|
|
228
|
+
const aCost = a.pricing.input + a.pricing.output;
|
|
229
|
+
const bCost = b.pricing.input + b.pricing.output;
|
|
230
|
+
return aCost - bCost || a.provider.localeCompare(b.provider);
|
|
231
|
+
})[0];
|
|
232
|
+
if (cheapest) {
|
|
233
|
+
return {
|
|
234
|
+
provider: cheapest.provider,
|
|
235
|
+
pricing: cheapest.pricing,
|
|
236
|
+
};
|
|
237
|
+
}
|
|
238
|
+
}
|
|
239
|
+
const prices = Array.from(providerMap.values());
|
|
240
|
+
if (prices.length === 0) {
|
|
241
|
+
return { provider: explicitProvider ?? providerHint ?? null, pricing: null };
|
|
242
|
+
}
|
|
243
|
+
const avgInput = prices.reduce((sum, p) => sum + p.pricing.input, 0) / prices.length;
|
|
244
|
+
const avgOutput = prices.reduce((sum, p) => sum + p.pricing.output, 0) / prices.length;
|
|
245
|
+
return {
|
|
246
|
+
provider: explicitProvider ?? providerHint ?? null,
|
|
247
|
+
pricing: {
|
|
248
|
+
input: avgInput,
|
|
249
|
+
output: avgOutput,
|
|
250
|
+
},
|
|
251
|
+
};
|
|
252
|
+
}
|
|
253
|
+
function normalizeProviderMap(pricing) {
|
|
254
|
+
const result = new Map();
|
|
255
|
+
for (const [provider, rate] of Object.entries(pricing)) {
|
|
256
|
+
if (typeof rate.input !== 'number' ||
|
|
257
|
+
typeof rate.output !== 'number' ||
|
|
258
|
+
!Number.isFinite(rate.input) ||
|
|
259
|
+
!Number.isFinite(rate.output)) {
|
|
260
|
+
continue;
|
|
261
|
+
}
|
|
262
|
+
result.set(provider.toLowerCase(), {
|
|
263
|
+
provider,
|
|
264
|
+
pricing: {
|
|
265
|
+
input: rate.input,
|
|
266
|
+
output: rate.output,
|
|
267
|
+
},
|
|
268
|
+
});
|
|
269
|
+
}
|
|
270
|
+
return result;
|
|
271
|
+
}
|
|
272
|
+
//# sourceMappingURL=metrics.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"metrics.js","sourceRoot":"","sources":["../../src/huggingface/metrics.ts"],"names":[],"mappings":";;;AAsDA,4CAqCC;AAED,4DAuBC;AAED,kFAgBC;AArID,0DAA6D;AAC7D,2DAAmF;AAEnF,MAAM,qBAAqB,GAAG,IAAI,GAAG,CAAC,CAAC,SAAS,EAAE,UAAU,EAAE,WAAW,CAAC,CAAC,CAAC;AAkD5E,SAAgB,gBAAgB,CAAC,KAAa;IAC5C,MAAM,OAAO,GAAG,KAAK,CAAC,IAAI,EAAE,CAAC;IAC7B,IAAI,CAAC,OAAO,EAAE,CAAC;QACb,OAAO;YACL,SAAS,EAAE,EAAE;YACb,aAAa,EAAE,SAAS;YACxB,gBAAgB,EAAE,IAAI;SACvB,CAAC;IACJ,CAAC;IAED,MAAM,WAAW,GAAG,OAAO,CAAC,WAAW,CAAC,GAAG,CAAC,CAAC;IAC7C,IAAI,WAAW,IAAI,CAAC,EAAE,CAAC;QACrB,OAAO;YACL,SAAS,EAAE,OAAO;YAClB,aAAa,EAAE,SAAS;YACxB,gBAAgB,EAAE,IAAI;SACvB,CAAC;IACJ,CAAC;IAED,MAAM,SAAS,GAAG,OAAO,CAAC,KAAK,CAAC,CAAC,EAAE,WAAW,CAAC,CAAC,IAAI,EAAE,CAAC;IACvD,MAAM,MAAM,GAAG,OAAO,CAAC,KAAK,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC;IACrD,IAAI,CAAC,MAAM,EAAE,CAAC;QACZ,OAAO;YACL,SAAS;YACT,aAAa,EAAE,SAAS;YACxB,gBAAgB,EAAE,IAAI;SACvB,CAAC;IACJ,CAAC;IAED,MAAM,aAAa,GAAG,MAAM,CAAC,WAAW,EAAE,CAAC;IAC3C,MAAM,gBAAgB,GAAG,qBAAqB,CAAC,GAAG,CAAC,aAAa,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,aAAa,CAAC;IAEzF,OAAO;QACL,SAAS;QACT,aAAa;QACb,gBAAgB;KACjB,CAAC;AACJ,CAAC;AAED,SAAgB,wBAAwB,CACtC,OAKG,EACH,KAAK,GAAG,IAAI,CAAC,GAAG,EAAE;IAElB,MAAM,SAAS,GAAG,cAAc,CAAC,OAAO,EAAE,WAAW,CAAC,CAAC;IACvD,MAAM,eAAe,GAAG,cAAc,CAAC,OAAO,EAAE,kBAAkB,CAAC,CAAC;IAEpE,IAAI,CAAC,SAAS,IAAI,CAAC,eAAe,EAAE,CAAC;QACnC,OAAO,IAAI,CAAC;IACd,CAAC;IAED,OAAO;QACL,SAAS,EAAE,iBAAiB,CAAC,SAAS,EAAE,GAAG,CAAC;QAC5C,KAAK,EAAE,iBAAiB,CAAC,eAAe,EAAE,GAAG,CAAC;QAC9C,YAAY,EAAE,iBAAiB,CAAC,SAAS,EAAE,GAAG,CAAC;QAC/C,aAAa,EAAE,iBAAiB,CAAC,eAAe,EAAE,GAAG,CAAC;QACtD,YAAY,EAAE,KAAK;KACpB,CAAC;AACJ,CAAC;AAED,SAAgB,mCAAmC,CAAC,OAAgB;IAClE,MAAM,UAAU,GAAG;QACjB,yBAAyB;QACzB,sBAAsB;QACtB,YAAY;QACZ,gCAAgC;KACjC,CAAC;IAEF,KAAK,MAAM,GAAG,IAAI,UAAU,EAAE,CAAC;QAC7B,MAAM,KAAK,GAAG,OAAO,CAAC,GAAG,CAAC,GAAG,CAAC,CAAC;QAC/B,IAAI,CAAC,KAAK;YAAE,SAAS;QACrB,MAAM,QAAQ,GAAG,KAAK,CAAC,IAAI,EAAE,CAAC,WAAW,EAAE,CAAC;QAC5C,IAAI,QAAQ;YAAE,OAAO,QAAQ,CAAC;IAChC,CAAC;IAED,OAAO,IAAI,CAAC;AACd,CAAC;AAED,MAAa,uBAAuB;IACjB,QAAQ,CAAmD;IAE5E,YAAY,UAA2E,EAAE;QACvF,IAAI,CAAC,QAAQ,GAAG,OAAO,CAAC,QAAQ,IAAI,IAAI,4CAAwB,EAAE,CAAC;IACrE,CAAC;IAED,qBAAqB,CAAC,KAMrB;QACC,MAAM,KAAK,GAAG,KAAK,CAAC,UAAU,CAAC;QAC/B,IAAI,CAAC,KAAK;YAAE,OAAO;QAEnB,MAAM,YAAY,GAAG,SAAS,CAAC,KAAK,CAAC,WAAW,CAAC,CAAC;QAClD,MAAM,gBAAgB,GAAG,SAAS,CAAC,KAAK,CAAC,YAAY,CAAC,CAAC;QACvD,IAAI,YAAY,KAAK,IAAI,IAAI,gBAAgB,KAAK,IAAI;YAAE,OAAO;QAE/D,MAAM,KAAK,GAAG,gBAAgB,CAAC,KAAK,CAAC,cAAc,CAAC,CAAC;QACrD,IAAI,CAAC,KAAK,CAAC,SAAS;YAAE,OAAO;QAE7B,MAAM,KAAK,GAAG,IAAI,CAAC,QAAQ,CAAC,cAAc,CAAC,KAAK,CAAC,SAAS,CAAC,CAAC;QAC5D,MAAM,gBAAgB,GAAG,aAAa,CAAC,KAAK,EAAE,KAAK,CAAC,aAAa,EAAE,KAAK,CAAC,gBAAgB,EAAE,KAAK,CAAC,YAAY,CAAC,CAAC;QAC/G,MAAM,gBAAgB,GAAG,gBAAgB,CAAC,OAAO;YAC/C,CAAC,CAAC,eAAe,CAAC,YAAY,EAAE,gBAAgB,EAAE,gBAAgB,CAAC,OAAO,CAAC,KAAK,EAAE,gBAAgB,CAAC,OAAO,CAAC,MAAM,CAAC;YAClH,CAAC,CAAC,IAAI,CAAC;QAET,MAAM,EAAE,EAAE,EAAE,KAAK,EAAE,GAAG,IAAA,iCAAkB,GAAE,CAAC;QAC3C,IAAI,CAAC;YACH,EAAE,CAAC,OAAO,CACR;;0CAEkC,CACnC,CAAC,GAAG,CACH,KAAK,CAAC,SAAS,EACf,gBAAgB,CAAC,QAAQ,EACzB,KAAK,CAAC,aAAa,EACnB,KAAK,CAAC,IAAI,IAAI,IAAI,EAClB,YAAY,EACZ,gBAAgB,EAChB,gBAAgB,EAChB,KAAK,CAAC,WAAW,IAAI,IAAI,CAAC,GAAG,EAAE,CAChC,CAAC;QACJ,CAAC;gBAAS,CAAC;YACT,KAAK,EAAE,CAAC;QACV,CAAC;IACH,CAAC;IAED,iBAAiB;QACf,OAAO;YACL,KAAK,EAAE,IAAI,CAAC,eAAe,CAAC,EAAE,CAAC;YAC/B,SAAS,EAAE,IAAI,CAAC,eAAe,CAAC,EAAE,GAAG,CAAC,EAAE,CAAC,CAAC;SAC3C,CAAC;IACJ,CAAC;IAED,eAAe,CAAC,KAAa;QAC3B,MAAM,OAAO,GAAG,IAAI,CAAC,GAAG,EAAE,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,IAAI,CAAC,CAAC;QACnE,MAAM,EAAE,EAAE,EAAE,KAAK,EAAE,GAAG,IAAA,iCAAkB,GAAE,CAAC;QAC3C,IAAI,CAAC;YACH,MAAM,GAAG,GAAG,EAAE,CAAC,OAAO,CACpB;;;;;;+BAMuB,CACxB,CAAC,GAAG,CAAC,OAAO,CAAe,CAAC;YAE7B,MAAM,YAAY,GAAG,GAAG,CAAC,aAAa,IAAI,CAAC,CAAC;YAC5C,MAAM,gBAAgB,GAAG,GAAG,CAAC,iBAAiB,IAAI,CAAC,CAAC;YACpD,OAAO;gBACL,YAAY;gBACZ,gBAAgB;gBAChB,WAAW,EAAE,YAAY,GAAG,gBAAgB;gBAC5C,QAAQ,EAAE,GAAG,CAAC,QAAQ,IAAI,CAAC;gBAC3B,gBAAgB,EAAE,GAAG,CAAC,kBAAkB,IAAI,CAAC;aAC9C,CAAC;QACJ,CAAC;gBAAS,CAAC;YACT,KAAK,EAAE,CAAC;QACV,CAAC;IACH,CAAC;IAED,eAAe,CAAC,KAAa,EAAE,KAAK,GAAG,CAAC;QACtC,MAAM,OAAO,GAAG,IAAI,CAAC,GAAG,EAAE,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,IAAI,CAAC,CAAC;QACnE,MAAM,WAAW,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,EAAE,EAAE,KAAK,CAAC,CAAC,CAAC;QACrD,MAAM,EAAE,EAAE,EAAE,KAAK,EAAE,GAAG,IAAA,iCAAkB,GAAE,CAAC;QAC3C,IAAI,CAAC;YACH,MAAM,IAAI,GAAG,EAAE,CAAC,OAAO,CACrB;;;;;;;;;;;;;;iBAcS,CACV,CAAC,GAAG,CAAC,OAAO,EAAE,WAAW,CAAiB,CAAC;YAE5C,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,GAAG,EAAE,EAAE;gBACtB,MAAM,YAAY,GAAG,GAAG,CAAC,aAAa,IAAI,CAAC,CAAC;gBAC5C,MAAM,gBAAgB,GAAG,GAAG,CAAC,iBAAiB,IAAI,CAAC,CAAC;gBACpD,OAAO;oBACL,KAAK,EAAE,GAAG,CAAC,KAAK;oBAChB,QAAQ,EAAE,GAAG,CAAC,QAAQ;oBACtB,aAAa,EAAE,GAAG,CAAC,cAAc,IAAI,SAAS;oBAC9C,YAAY;oBACZ,gBAAgB;oBAChB,WAAW,EAAE,YAAY,GAAG,gBAAgB;oBAC5C,QAAQ,EAAE,GAAG,CAAC,QAAQ,IAAI,CAAC;oBAC3B,gBAAgB,EAAE,GAAG,CAAC,kBAAkB,IAAI,CAAC;iBAC9C,CAAC;YACJ,CAAC,CAAC,CAAC;QACL,CAAC;gBAAS,CAAC;YACT,KAAK,EAAE,CAAC;QACV,CAAC;IACH,CAAC;CACF;AA/HD,0DA+HC;AAED,SAAS,cAAc,CACrB,OAKG,EACH,GAAqC;IAErC,IAAI,OAAO,YAAY,OAAO,EAAE,CAAC;QAC/B,OAAO,OAAO,CAAC,GAAG,CAAC,GAAG,CAAC,CAAC;IAC1B,CAAC;IAED,IAAI,GAAG,KAAK,WAAW;QAAE,OAAO,OAAO,CAAC,SAAS,IAAI,IAAI,CAAC;IAC1D,OAAO,OAAO,CAAC,eAAe,IAAI,IAAI,CAAC;AACzC,CAAC;AAED,SAAS,iBAAiB,CAAC,GAAkB,EAAE,KAA4B;IACzE,IAAI,CAAC,GAAG;QAAE,OAAO,IAAI,CAAC;IACtB,MAAM,KAAK,GAAG,GAAG,CAAC,KAAK,CAAC,IAAI,MAAM,CAAC,gBAAgB,KAAK,SAAS,EAAE,GAAG,CAAC,CAAC,CAAC;IACzE,IAAI,CAAC,KAAK;QAAE,OAAO,IAAI,CAAC;IACxB,MAAM,MAAM,GAAG,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;IAC7C,OAAO,MAAM,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,IAAI,CAAC;AACjD,CAAC;AAED,SAAS,SAAS,CAAC,KAAc;IAC/B,IAAI,OAAO,KAAK,KAAK,QAAQ,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC;QAAE,OAAO,IAAI,CAAC;IACtE,MAAM,UAAU,GAAG,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC;IACrC,OAAO,UAAU,IAAI,CAAC,CAAC,CAAC,CAAC,UAAU,CAAC,CAAC,CAAC,IAAI,CAAC;AAC7C,CAAC;AAED,SAAS,eAAe,CACtB,YAAoB,EACpB,gBAAwB,EACxB,eAAuB,EACvB,gBAAwB;IAExB,OAAO,CAAC,YAAY,GAAG,eAAe,GAAG,SAAS,CAAC,GAAG,CAAC,gBAAgB,GAAG,gBAAgB,GAAG,SAAS,CAAC,CAAC;AAC1G,CAAC;AAED,SAAS,aAAa,CACpB,KAA2B,EAC3B,aAAqB,EACrB,gBAA+B,EAC/B,YAA4B;IAK5B,MAAM,OAAO,GAAG,KAAK,EAAE,OAAO,CAAC;IAC/B,IAAI,CAAC,OAAO,IAAI,MAAM,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QAClD,OAAO,EAAE,QAAQ,EAAE,gBAAgB,IAAI,YAAY,IAAI,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,CAAC;IAC/E,CAAC;IAED,MAAM,WAAW,GAAG,oBAAoB,CAAC,OAAO,CAAC,CAAC;IAClD,MAAM,cAAc,GAAG,YAAY,CAAC,CAAC,CAAC,WAAW,CAAC,GAAG,CAAC,YAAY,CAAC,WAAW,EAAE,CAAC,CAAC,CAAC,CAAC,SAAS,CAAC;IAC9F,IAAI,cAAc,EAAE,CAAC;QACnB,OAAO;YACL,QAAQ,EAAE,cAAc,CAAC,QAAQ;YACjC,OAAO,EAAE,cAAc,CAAC,OAAO;SAChC,CAAC;IACJ,CAAC;IAED,IAAI,gBAAgB,EAAE,CAAC;QACrB,MAAM,kBAAkB,GAAG,WAAW,CAAC,GAAG,CAAC,gBAAgB,CAAC,WAAW,EAAE,CAAC,CAAC;QAC3E,IAAI,kBAAkB,EAAE,CAAC;YACvB,OAAO;gBACL,QAAQ,EAAE,kBAAkB,CAAC,QAAQ;gBACrC,OAAO,EAAE,kBAAkB,CAAC,OAAO;aACpC,CAAC;QACJ,CAAC;IACH,CAAC;IAED,IAAI,aAAa,KAAK,UAAU,EAAE,CAAC;QACjC,MAAM,QAAQ,GAAG,KAAK,CAAC,IAAI,CAAC,WAAW,CAAC,MAAM,EAAE,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE;YAC9D,MAAM,KAAK,GAAG,CAAC,CAAC,OAAO,CAAC,KAAK,GAAG,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC;YACjD,MAAM,KAAK,GAAG,CAAC,CAAC,OAAO,CAAC,KAAK,GAAG,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC;YACjD,OAAO,KAAK,GAAG,KAAK,IAAI,CAAC,CAAC,QAAQ,CAAC,aAAa,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC;QAC/D,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;QAEN,IAAI,QAAQ,EAAE,CAAC;YACb,OAAO;gBACL,QAAQ,EAAE,QAAQ,CAAC,QAAQ;gBAC3B,OAAO,EAAE,QAAQ,CAAC,OAAO;aAC1B,CAAC;QACJ,CAAC;IACH,CAAC;IAED,MAAM,MAAM,GAAG,KAAK,CAAC,IAAI,CAAC,WAAW,CAAC,MAAM,EAAE,CAAC,CAAC;IAChD,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QACxB,OAAO,EAAE,QAAQ,EAAE,gBAAgB,IAAI,YAAY,IAAI,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,CAAC;IAC/E,CAAC;IAED,MAAM,QAAQ,GAAG,MAAM,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,CAAC,EAAE,EAAE,CAAC,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,KAAK,EAAE,CAAC,CAAC,GAAG,MAAM,CAAC,MAAM,CAAC;IACrF,MAAM,SAAS,GAAG,MAAM,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,CAAC,EAAE,EAAE,CAAC,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC,GAAG,MAAM,CAAC,MAAM,CAAC;IAEvF,OAAO;QACL,QAAQ,EAAE,gBAAgB,IAAI,YAAY,IAAI,IAAI;QAClD,OAAO,EAAE;YACP,KAAK,EAAE,QAAQ;YACf,MAAM,EAAE,SAAS;SAClB;KACF,CAAC;AACJ,CAAC;AAED,SAAS,oBAAoB,CAC3B,OAA0D;IAE1D,MAAM,MAAM,GAAG,IAAI,GAAG,EAA4E,CAAC;IAEnG,KAAK,MAAM,CAAC,QAAQ,EAAE,IAAI,CAAC,IAAI,MAAM,CAAC,OAAO,CAAC,OAAO,CAAC,EAAE,CAAC;QACvD,IACE,OAAO,IAAI,CAAC,KAAK,KAAK,QAAQ;YAC9B,OAAO,IAAI,CAAC,MAAM,KAAK,QAAQ;YAC/B,CAAC,MAAM,CAAC,QAAQ,CAAC,IAAI,CAAC,KAAK,CAAC;YAC5B,CAAC,MAAM,CAAC,QAAQ,CAAC,IAAI,CAAC,MAAM,CAAC,EAC7B,CAAC;YACD,SAAS;QACX,CAAC;QACD,MAAM,CAAC,GAAG,CAAC,QAAQ,CAAC,WAAW,EAAE,EAAE;YACjC,QAAQ;YACR,OAAO,EAAE;gBACP,KAAK,EAAE,IAAI,CAAC,KAAK;gBACjB,MAAM,EAAE,IAAI,CAAC,MAAM;aACpB;SACF,CAAC,CAAC;IACL,CAAC;IAED,OAAO,MAAM,CAAC;AAChB,CAAC"}
|
|
@@ -0,0 +1,74 @@
|
|
|
1
|
+
import { HuggingFaceHubClient } from './hub-client.js';
|
|
2
|
+
export type HFModelSource = 'curated' | 'search' | 'manual';
|
|
3
|
+
export interface HFCachedModel {
|
|
4
|
+
id: string;
|
|
5
|
+
pipelineTag: string;
|
|
6
|
+
downloads: number;
|
|
7
|
+
likes: number;
|
|
8
|
+
tags: string[];
|
|
9
|
+
providers: string[];
|
|
10
|
+
providerDetails?: HFProviderDetail[];
|
|
11
|
+
contextLength?: number;
|
|
12
|
+
pricing?: Record<string, {
|
|
13
|
+
input: number;
|
|
14
|
+
output: number;
|
|
15
|
+
}>;
|
|
16
|
+
supportsTools?: boolean;
|
|
17
|
+
providerContextLengths?: Record<string, number>;
|
|
18
|
+
addedAt: number;
|
|
19
|
+
source: HFModelSource;
|
|
20
|
+
}
|
|
21
|
+
export interface HFProviderDetail {
|
|
22
|
+
provider: string;
|
|
23
|
+
contextLength?: number;
|
|
24
|
+
pricing?: {
|
|
25
|
+
input: number;
|
|
26
|
+
output: number;
|
|
27
|
+
};
|
|
28
|
+
supportsTools?: boolean;
|
|
29
|
+
supportsStructuredOutput?: boolean;
|
|
30
|
+
isModelAuthor?: boolean;
|
|
31
|
+
}
|
|
32
|
+
export interface HFModelCache {
|
|
33
|
+
lastUpdated: number;
|
|
34
|
+
models: HFCachedModel[];
|
|
35
|
+
}
|
|
36
|
+
export declare class HuggingFaceModelRegistry {
|
|
37
|
+
private readonly client;
|
|
38
|
+
private readonly cacheFilePath;
|
|
39
|
+
private readonly cacheTtlMs;
|
|
40
|
+
private readonly curatedLimit;
|
|
41
|
+
private readonly nowFn;
|
|
42
|
+
constructor(options?: {
|
|
43
|
+
client?: HuggingFaceHubClient;
|
|
44
|
+
cacheFilePath?: string;
|
|
45
|
+
cacheTtlMs?: number;
|
|
46
|
+
curatedLimit?: number;
|
|
47
|
+
nowFn?: () => number;
|
|
48
|
+
});
|
|
49
|
+
getCuratedModels(options?: {
|
|
50
|
+
forceRefresh?: boolean;
|
|
51
|
+
token?: string;
|
|
52
|
+
}): Promise<HFCachedModel[]>;
|
|
53
|
+
refreshCuratedModels(options?: {
|
|
54
|
+
token?: string;
|
|
55
|
+
}): Promise<HFCachedModel[]>;
|
|
56
|
+
searchModels(query: string, options?: {
|
|
57
|
+
limit?: number;
|
|
58
|
+
token?: string;
|
|
59
|
+
}): Promise<HFCachedModel[]>;
|
|
60
|
+
getCachedModel(modelId: string): HFCachedModel | null;
|
|
61
|
+
private fetchTrendingList;
|
|
62
|
+
private mergeCandidates;
|
|
63
|
+
private rankCandidates;
|
|
64
|
+
private enrichProviders;
|
|
65
|
+
private extractProviders;
|
|
66
|
+
private toCachedModel;
|
|
67
|
+
private getRouterModelMap;
|
|
68
|
+
private toProviderStats;
|
|
69
|
+
private toTimestamp;
|
|
70
|
+
private readCache;
|
|
71
|
+
private writeCache;
|
|
72
|
+
private upsertModelsIntoCache;
|
|
73
|
+
}
|
|
74
|
+
//# sourceMappingURL=model-registry.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"model-registry.d.ts","sourceRoot":"","sources":["../../src/huggingface/model-registry.ts"],"names":[],"mappings":"AAGA,OAAO,EACL,oBAAoB,EAMrB,MAAM,iBAAiB,CAAC;AAKzB,MAAM,MAAM,aAAa,GAAG,SAAS,GAAG,QAAQ,GAAG,QAAQ,CAAC;AAE5D,MAAM,WAAW,aAAa;IAC5B,EAAE,EAAE,MAAM,CAAC;IACX,WAAW,EAAE,MAAM,CAAC;IACpB,SAAS,EAAE,MAAM,CAAC;IAClB,KAAK,EAAE,MAAM,CAAC;IACd,IAAI,EAAE,MAAM,EAAE,CAAC;IACf,SAAS,EAAE,MAAM,EAAE,CAAC;IACpB,eAAe,CAAC,EAAE,gBAAgB,EAAE,CAAC;IACrC,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE;QAAE,KAAK,EAAE,MAAM,CAAC;QAAC,MAAM,EAAE,MAAM,CAAA;KAAE,CAAC,CAAC;IAC5D,aAAa,CAAC,EAAE,OAAO,CAAC;IACxB,sBAAsB,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IAChD,OAAO,EAAE,MAAM,CAAC;IAChB,MAAM,EAAE,aAAa,CAAC;CACvB;AAED,MAAM,WAAW,gBAAgB;IAC/B,QAAQ,EAAE,MAAM,CAAC;IACjB,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,OAAO,CAAC,EAAE;QAAE,KAAK,EAAE,MAAM,CAAC;QAAC,MAAM,EAAE,MAAM,CAAA;KAAE,CAAC;IAC5C,aAAa,CAAC,EAAE,OAAO,CAAC;IACxB,wBAAwB,CAAC,EAAE,OAAO,CAAC;IACnC,aAAa,CAAC,EAAE,OAAO,CAAC;CACzB;AAED,MAAM,WAAW,YAAY;IAC3B,WAAW,EAAE,MAAM,CAAC;IACpB,MAAM,EAAE,aAAa,EAAE,CAAC;CACzB;AASD,qBAAa,wBAAwB;IACnC,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAuB;IAC9C,OAAO,CAAC,QAAQ,CAAC,aAAa,CAAS;IACvC,OAAO,CAAC,QAAQ,CAAC,UAAU,CAAS;IACpC,OAAO,CAAC,QAAQ,CAAC,YAAY,CAAS;IACtC,OAAO,CAAC,QAAQ,CAAC,KAAK,CAAe;gBAEzB,OAAO,GAAE;QACnB,MAAM,CAAC,EAAE,oBAAoB,CAAC;QAC9B,aAAa,CAAC,EAAE,MAAM,CAAC;QACvB,UAAU,CAAC,EAAE,MAAM,CAAC;QACpB,YAAY,CAAC,EAAE,MAAM,CAAC;QACtB,KAAK,CAAC,EAAE,MAAM,MAAM,CAAC;KACjB;IAQA,gBAAgB,CAAC,OAAO,GAAE;QAAE,YAAY,CAAC,EAAE,OAAO,CAAC;QAAC,KAAK,CAAC,EAAE,MAAM,CAAA;KAAO,GAAG,OAAO,CAAC,aAAa,EAAE,CAAC;IAYpG,oBAAoB,CAAC,OAAO,GAAE;QAAE,KAAK,CAAC,EAAE,MAAM,CAAA;KAAO,GAAG,OAAO,CAAC,aAAa,EAAE,CAAC;IA2ChF,YAAY,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,GAAE;QAAE,KAAK,CAAC,EAAE,MAAM,CAAC;QAAC,KAAK,CAAC,EAAE,MAAM,CAAA;KAAO,GAAG,OAAO,CAAC,aAAa,EAAE,CAAC;IAU7G,cAAc,CAAC,OAAO,EAAE,MAAM,GAAG,aAAa,GAAG,IAAI;YAMvC,iBAAiB;IAgB/B,OAAO,CAAC,eAAe;IAuCvB,OAAO,CAAC,cAAc;YAkCR,eAAe;IAqB7B,OAAO,CAAC,gBAAgB;IAQxB,OAAO,CAAC,aAAa;YA2BP,iBAAiB;IAS/B,OAAO,CAAC,eAAe;IAkEvB,OAAO,CAAC,WAAW;IAMnB,OAAO,CAAC,SAAS;IAmBjB,OAAO,CAAC,UAAU;IAMlB,OAAO,CAAC,qBAAqB;CAY9B"}
|