@jsonstudio/llms 0.6.2979 → 0.6.3238
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/conversion/args-mapping.js +8 -0
- package/dist/conversion/{shared/bridge-actions.js → bridge-actions.js} +2 -1
- package/dist/conversion/{shared/bridge-id-utils.js → bridge-id-utils.js} +1 -1
- package/dist/conversion/{shared/bridge-instructions.js → bridge-instructions.js} +1 -1
- package/dist/conversion/{shared/bridge-message-utils.d.ts → bridge-message-utils.d.ts} +1 -1
- package/dist/conversion/{shared/bridge-message-utils.js → bridge-message-utils.js} +5 -149
- package/dist/conversion/{shared/bridge-metadata.js → bridge-metadata.js} +1 -1
- package/dist/conversion/{shared/bridge-policies.js → bridge-policies.js} +1 -1
- package/dist/conversion/codecs/gemini-openai-codec.js +27 -8
- package/dist/conversion/codecs/responses-openai-codec.js +1 -1
- package/dist/conversion/{shared/compaction-detect.d.ts → compaction-detect.d.ts} +1 -1
- package/dist/conversion/compaction-detect.js +4 -0
- package/dist/conversion/compat/actions/apply-patch-fixer.js +2 -2
- package/dist/conversion/compat/actions/deepseek-web-response.d.ts +0 -1
- package/dist/conversion/compat/actions/deepseek-web-response.js +15 -405
- package/dist/conversion/compat/actions/harvest-tool-calls-from-text.js +1 -1
- package/dist/conversion/compat/actions/lmstudio-responses-fc-ids.js +1 -1
- package/dist/conversion/compat/actions/qwen-transform.js +74 -2
- package/dist/conversion/compat/actions/snapshot.js +1 -1
- package/dist/conversion/compat/antigravity-session-signature.js +36 -0
- package/dist/conversion/compat/profiles/chat-deepseek-web.json +0 -22
- package/dist/conversion/compat/profiles/chat-glm.json +251 -72
- package/dist/conversion/compat/profiles/chat-iflow.json +174 -39
- package/dist/conversion/compat/profiles/chat-lmstudio.json +43 -14
- package/dist/conversion/hub/operation-table/operation-table-runner.js +2 -2
- package/dist/conversion/hub/operation-table/semantic-mappers/anthropic-mapper.js +1 -1
- package/dist/conversion/hub/operation-table/semantic-mappers/archive/chat-mapper.archive.d.ts +8 -0
- package/dist/conversion/hub/operation-table/semantic-mappers/archive/chat-mapper.archive.js +404 -0
- package/dist/conversion/hub/operation-table/semantic-mappers/chat-mapper.js +5 -381
- package/dist/conversion/hub/operation-table/semantic-mappers/gemini-mapper.js +2 -2
- package/dist/conversion/hub/operation-table/semantic-mappers/responses-mapper.js +2 -8
- package/dist/conversion/hub/pipeline/hub-pipeline.d.ts +1 -0
- package/dist/conversion/hub/pipeline/hub-pipeline.js +50 -3
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage2_semantic_map/index.d.ts +1 -1
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage2_semantic_map/index.js +62 -0
- package/dist/conversion/hub/pipeline/stages/req_process/req_process_stage2_route_select/index.js +3 -1
- package/dist/conversion/hub/pipeline/stages/resp_inbound/resp_inbound_stage1_sse_decode/index.js +1 -1
- package/dist/conversion/hub/pipeline/stages/resp_outbound/resp_outbound_stage1_client_remap/chat-process-semantics-bridge.d.ts +1 -1
- package/dist/conversion/hub/pipeline/stages/resp_process/resp_process_stage1_tool_governance/index.js +42 -29
- package/dist/conversion/hub/pipeline/stages/resp_process/resp_process_stage2_finalize/index.js +12 -0
- package/dist/conversion/hub/policy/protocol-spec.js +1 -1
- package/dist/conversion/hub/process/chat-process-clock-reminders.js +1 -1
- package/dist/conversion/hub/process/chat-process-clock-tools.js +1 -1
- package/dist/conversion/hub/process/chat-process-continue-execution.js +1 -1
- package/dist/conversion/hub/process/chat-process-servertool-orchestration.js +1 -1
- package/dist/conversion/hub/process/chat-process-web-search.js +1 -1
- package/dist/conversion/hub/response/provider-response.js +14 -5
- package/dist/conversion/hub/response/response-mappers.js +23 -1
- package/dist/conversion/hub/response/response-runtime.js +28 -5
- package/dist/conversion/hub/snapshot-recorder.js +3 -92
- package/dist/conversion/hub/tool-governance/engine.d.ts +8 -0
- package/dist/conversion/hub/tool-governance/engine.js +40 -193
- package/dist/conversion/hub/tool-governance/rules.js +73 -69
- package/dist/conversion/hub/tool-surface/tool-surface-engine.js +1 -1
- package/dist/conversion/index.d.ts +1 -2
- package/dist/conversion/index.js +1 -2
- package/dist/conversion/{shared/jsonish.js → jsonish.js} +1 -1
- package/dist/conversion/{shared/mcp-injection.js → mcp-injection.js} +1 -1
- package/dist/conversion/media.js +4 -0
- package/dist/conversion/{shared/metadata-passthrough.d.ts → metadata-passthrough.d.ts} +1 -1
- package/dist/conversion/{shared/metadata-passthrough.js → metadata-passthrough.js} +2 -2
- package/dist/conversion/payload-budget.js +47 -0
- package/dist/conversion/protocol-field-allowlists.d.ts +7 -0
- package/dist/conversion/protocol-field-allowlists.js +9 -0
- package/dist/conversion/{shared/protocol-state.d.ts → protocol-state.d.ts} +2 -2
- package/dist/conversion/{shared/protocol-state.js → protocol-state.js} +2 -2
- package/dist/conversion/{shared/errors.d.ts → provider-protocol-error.d.ts} +0 -3
- package/dist/conversion/provider-protocol-error.js +25 -0
- package/dist/conversion/responses/responses-openai-bridge/response-payload.js +8 -5
- package/dist/conversion/responses/responses-openai-bridge/types.d.ts +1 -1
- package/dist/conversion/responses/responses-openai-bridge.d.ts +1 -1
- package/dist/conversion/responses/responses-openai-bridge.js +43 -10
- package/dist/conversion/{shared/runtime-metadata.d.ts → runtime-metadata.d.ts} +1 -1
- package/dist/conversion/{shared/runtime-metadata.js → runtime-metadata.js} +2 -2
- package/dist/conversion/shared/anthropic-message-utils.js +19 -8
- package/dist/conversion/shared/chat-request-filters.d.ts +3 -4
- package/dist/conversion/shared/chat-request-filters.js +22 -78
- package/dist/conversion/shared/gemini-tool-utils.d.ts +1 -1
- package/dist/conversion/shared/openai-finalizer.js +1 -0
- package/dist/conversion/shared/openai-message-normalize.js +2 -2
- package/dist/conversion/shared/reasoning-normalizer.js +6 -0
- package/dist/conversion/shared/reasoning-utils.js +5 -2
- package/dist/conversion/shared/responses-conversation-store.js +1 -1
- package/dist/conversion/shared/responses-output-builder.js +55 -11
- package/dist/conversion/shared/responses-reasoning-registry.d.ts +14 -2
- package/dist/conversion/shared/responses-reasoning-registry.js +34 -6
- package/dist/conversion/shared/responses-response-utils.js +99 -9
- package/dist/conversion/shared/responses-tool-utils.js +1 -1
- package/dist/conversion/shared/text-markup-normalizer/normalize.d.ts +1 -1
- package/dist/conversion/shared/text-markup-normalizer.d.ts +2 -2
- package/dist/conversion/shared/text-markup-normalizer.js +1 -1
- package/dist/conversion/shared/tool-filter-pipeline.js +1 -1
- package/dist/conversion/shared/tool-governor.js +3 -3
- package/dist/conversion/shared/tool-mapping.d.ts +1 -1
- package/dist/conversion/{shared/snapshot-utils.d.ts → snapshot-utils.d.ts} +11 -0
- package/dist/conversion/{shared/snapshot-utils.js → snapshot-utils.js} +14 -23
- package/dist/conversion/types/text-markup-normalizer.d.ts +13 -0
- package/dist/conversion/types/text-markup-normalizer.js +1 -0
- package/dist/filters/special/request-tools-normalize.js +1 -1
- package/dist/filters/special/response-tool-text-canonicalize.js +2 -2
- package/dist/native/router_hotpath_napi.node +0 -0
- package/dist/quota/quota-manager.js +31 -59
- package/dist/quota/quota-state.js +14 -7
- package/dist/router/virtual-router/bootstrap/profile-builder.d.ts +1 -0
- package/dist/router/virtual-router/bootstrap/profile-builder.js +13 -0
- package/dist/router/virtual-router/bootstrap/provider-normalization.d.ts +2 -0
- package/dist/router/virtual-router/bootstrap/provider-normalization.js +4 -1
- package/dist/router/virtual-router/bootstrap/streaming-helpers.d.ts +7 -0
- package/dist/router/virtual-router/bootstrap/streaming-helpers.js +44 -0
- package/dist/router/virtual-router/bootstrap.js +2 -0
- package/dist/router/virtual-router/engine/routing-state/store.d.ts +1 -2
- package/dist/router/virtual-router/engine/routing-state/store.js +2 -2
- package/dist/router/virtual-router/engine-legacy/config.d.ts +11 -0
- package/dist/router/virtual-router/engine-legacy/config.js +108 -0
- package/dist/router/virtual-router/engine-legacy/direct-model.d.ts +10 -0
- package/dist/router/virtual-router/engine-legacy/direct-model.js +38 -0
- package/dist/router/virtual-router/engine-legacy/health.d.ts +13 -0
- package/dist/router/virtual-router/engine-legacy/health.js +104 -0
- package/dist/router/virtual-router/engine-legacy/helpers.d.ts +16 -0
- package/dist/router/virtual-router/engine-legacy/helpers.js +226 -0
- package/dist/router/virtual-router/engine-legacy/route-finalize.d.ts +9 -0
- package/dist/router/virtual-router/engine-legacy/route-finalize.js +84 -0
- package/dist/router/virtual-router/engine-legacy/route-selection.d.ts +17 -0
- package/dist/router/virtual-router/engine-legacy/route-selection.js +205 -0
- package/dist/router/virtual-router/engine-legacy/route-state-allowlist.d.ts +3 -0
- package/dist/router/virtual-router/engine-legacy/route-state-allowlist.js +36 -0
- package/dist/router/virtual-router/engine-legacy/route-state.d.ts +12 -0
- package/dist/router/virtual-router/engine-legacy/route-state.js +386 -0
- package/dist/router/virtual-router/engine-legacy/route-utils.d.ts +19 -0
- package/dist/router/virtual-router/engine-legacy/route-utils.js +212 -0
- package/dist/router/virtual-router/engine-legacy/routing.d.ts +8 -0
- package/dist/router/virtual-router/engine-legacy/routing.js +8 -0
- package/dist/router/virtual-router/engine-legacy/selection-core.d.ts +28 -0
- package/dist/router/virtual-router/engine-legacy/selection-core.js +112 -0
- package/dist/router/virtual-router/engine-legacy/selection-state.d.ts +16 -0
- package/dist/router/virtual-router/engine-legacy/selection-state.js +187 -0
- package/dist/router/virtual-router/engine-legacy/state-accessors.d.ts +21 -0
- package/dist/router/virtual-router/engine-legacy/state-accessors.js +118 -0
- package/dist/router/virtual-router/engine-legacy.d.ts +123 -0
- package/dist/router/virtual-router/engine-legacy.js +194 -0
- package/dist/router/virtual-router/engine-logging.d.ts +2 -0
- package/dist/router/virtual-router/engine-logging.js +7 -2
- package/dist/router/virtual-router/engine-selection/key-parsing.js +0 -3
- package/dist/router/virtual-router/engine-selection/native-chat-request-filter-semantics.d.ts +1 -0
- package/dist/router/virtual-router/engine-selection/native-chat-request-filter-semantics.js +54 -0
- package/dist/router/virtual-router/engine-selection/native-hub-bridge-policy-semantics.d.ts +10 -0
- package/dist/router/virtual-router/engine-selection/native-hub-bridge-policy-semantics.js +67 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-governance-semantics.d.ts +30 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-governance-semantics.js +202 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-semantic-mappers.d.ts +2 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-semantic-mappers.js +83 -0
- package/dist/router/virtual-router/engine-selection/native-router-hotpath-loader.js +43 -2
- package/dist/router/virtual-router/engine-selection/native-shared-conversion-semantics.d.ts +75 -0
- package/dist/router/virtual-router/engine-selection/native-shared-conversion-semantics.js +205 -0
- package/dist/router/virtual-router/engine-selection/native-snapshot-hooks.d.ts +3 -0
- package/dist/router/virtual-router/engine-selection/native-snapshot-hooks.js +109 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-engine-proxy.d.ts +16 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-engine-proxy.js +14 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-routing-instructions-semantics.d.ts +2 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-routing-instructions-semantics.js +86 -0
- package/dist/router/virtual-router/engine-selection/tier-selection-quota-integration.js +100 -0
- package/dist/router/virtual-router/engine-selection/tier-selection-select.js +99 -0
- package/dist/router/virtual-router/engine.d.ts +22 -105
- package/dist/router/virtual-router/engine.js +274 -1641
- package/dist/router/virtual-router/load-balancer.d.ts +8 -0
- package/dist/router/virtual-router/load-balancer.js +65 -2
- package/dist/router/virtual-router/provider-registry.js +2 -0
- package/dist/router/virtual-router/routing-instructions/clean.d.ts +3 -0
- package/dist/router/virtual-router/routing-instructions/clean.js +34 -0
- package/dist/router/virtual-router/routing-instructions/parse.d.ts +18 -0
- package/dist/router/virtual-router/routing-instructions/parse.js +377 -0
- package/dist/router/virtual-router/routing-instructions/state.d.ts +4 -0
- package/dist/router/virtual-router/routing-instructions/state.js +245 -0
- package/dist/router/virtual-router/routing-instructions/types.d.ts +70 -0
- package/dist/router/virtual-router/routing-instructions/types.js +2 -0
- package/dist/router/virtual-router/routing-instructions.d.ts +5 -89
- package/dist/router/virtual-router/routing-instructions.js +4 -655
- package/dist/router/virtual-router/sticky-session-store.d.ts +4 -0
- package/dist/router/virtual-router/sticky-session-store.js +19 -81
- package/dist/router/virtual-router/tool-signals.js +21 -3
- package/dist/router/virtual-router/types.d.ts +4 -0
- package/dist/servertool/clock/session-scope.js +32 -1
- package/dist/servertool/engine.js +79 -8
- package/dist/servertool/handlers/antigravity-thought-signature-bootstrap.js +1 -1
- package/dist/servertool/handlers/clock-auto.js +1 -1
- package/dist/servertool/handlers/clock.js +1 -1
- package/dist/servertool/handlers/compaction-detect.d.ts +1 -1
- package/dist/servertool/handlers/compaction-detect.js +1 -1
- package/dist/servertool/handlers/gemini-empty-reply-continue.js +1 -1
- package/dist/servertool/handlers/iflow-model-error-retry.js +1 -1
- package/dist/servertool/handlers/recursive-detection-guard.js +1 -1
- package/dist/servertool/handlers/review.js +1 -1
- package/dist/servertool/handlers/stop-message-auto/iflow-followup.js +1 -1
- package/dist/servertool/handlers/stop-message-auto/runtime-utils.js +1 -1
- package/dist/servertool/handlers/stop-message-auto.js +1 -1
- package/dist/servertool/handlers/vision.js +1 -1
- package/dist/servertool/handlers/web-search.js +1 -1
- package/dist/servertool/reenter-backend.js +1 -1
- package/dist/servertool/server-side-tools.js +2 -2
- package/dist/servertool/stop-gateway-context.js +1 -1
- package/dist/servertool/stop-message-compare-context.js +1 -1
- package/dist/sse/json-to-sse/event-generators/responses.d.ts +4 -0
- package/dist/sse/json-to-sse/event-generators/responses.js +95 -1
- package/dist/sse/json-to-sse/sequencers/responses-sequencer.js +6 -4
- package/dist/sse/sse-to-json/builders/response-builder.d.ts +8 -0
- package/dist/sse/sse-to-json/builders/response-builder.js +162 -4
- package/dist/sse/sse-to-json/responses-sse-to-json-converter.js +2 -0
- package/dist/sse/types/responses-types.d.ts +6 -2
- package/dist/tools/apply-patch/structured/coercion.js +5 -0
- package/dist/tools/args-json.js +29 -0
- package/package.json +8 -5
- package/dist/conversion/shared/args-mapping.js +0 -77
- package/dist/conversion/shared/compaction-detect.js +0 -4
- package/dist/conversion/shared/errors.js +0 -31
- package/dist/conversion/shared/media.js +0 -4
- package/dist/conversion/shared/payload-budget.js +0 -165
- package/dist/conversion/shared/protocol-field-allowlists.d.ts +0 -7
- package/dist/conversion/shared/protocol-field-allowlists.js +0 -149
- package/dist/conversion/shared/snapshot-hooks.d.ts +0 -11
- package/dist/conversion/shared/snapshot-hooks.js +0 -503
- package/dist/conversion/shared/text-markup-normalizer/extractors-apply-patch.d.ts +0 -2
- package/dist/conversion/shared/text-markup-normalizer/extractors-apply-patch.js +0 -129
- package/dist/conversion/shared/text-markup-normalizer/extractors-json.d.ts +0 -4
- package/dist/conversion/shared/text-markup-normalizer/extractors-json.js +0 -637
- package/dist/conversion/shared/text-markup-normalizer/extractors-shared.d.ts +0 -21
- package/dist/conversion/shared/text-markup-normalizer/extractors-shared.js +0 -177
- package/dist/conversion/shared/text-markup-normalizer/extractors-transcript.d.ts +0 -5
- package/dist/conversion/shared/text-markup-normalizer/extractors-transcript.js +0 -385
- package/dist/conversion/shared/text-markup-normalizer/extractors-xml.d.ts +0 -10
- package/dist/conversion/shared/text-markup-normalizer/extractors-xml.js +0 -602
- package/dist/conversion/shared/text-markup-normalizer/extractors.d.ts +0 -5
- package/dist/conversion/shared/text-markup-normalizer/extractors.js +0 -4
- package/dist/conversion/shared/tool-canonicalizer.d.ts +0 -2
- package/dist/conversion/shared/tool-canonicalizer.js +0 -38
- /package/dist/conversion/{shared/args-mapping.d.ts → args-mapping.d.ts} +0 -0
- /package/dist/conversion/{shared/bridge-actions.d.ts → bridge-actions.d.ts} +0 -0
- /package/dist/conversion/{shared/bridge-id-utils.d.ts → bridge-id-utils.d.ts} +0 -0
- /package/dist/conversion/{shared/bridge-instructions.d.ts → bridge-instructions.d.ts} +0 -0
- /package/dist/conversion/{shared/bridge-metadata.d.ts → bridge-metadata.d.ts} +0 -0
- /package/dist/conversion/{shared/bridge-policies.d.ts → bridge-policies.d.ts} +0 -0
- /package/dist/conversion/{shared/jsonish.d.ts → jsonish.d.ts} +0 -0
- /package/dist/conversion/{shared/mcp-injection.d.ts → mcp-injection.d.ts} +0 -0
- /package/dist/conversion/{shared/media.d.ts → media.d.ts} +0 -0
- /package/dist/conversion/{shared/payload-budget.d.ts → payload-budget.d.ts} +0 -0
- /package/dist/conversion/{shared → types}/bridge-message-types.d.ts +0 -0
- /package/dist/conversion/{shared → types}/bridge-message-types.js +0 -0
|
@@ -0,0 +1,84 @@
|
|
|
1
|
+
import { resolveRoutingMode } from '../engine/routing-state/metadata.js';
|
|
2
|
+
import { buildHitReason, createVirtualRouterHitRecord, formatVirtualRouterHit, toVirtualRouterHitEvent } from '../engine-logging.js';
|
|
3
|
+
import { recordAntigravitySessionLease } from '../engine/antigravity/alias-lease.js';
|
|
4
|
+
/**
 * Turns a completed provider selection into the final routing result.
 *
 * In order, this function:
 *  1. builds the provider target and layers `forceWebSearch`, `forceVision` and
 *     `processMode` on top of it when applicable,
 *  2. records the Antigravity session lease for the selected provider key
 *     (with `commitSessionBinding: false`),
 *  3. creates a hit record, passes it to route analytics and, best effort,
 *     to the stats center,
 *  4. logs the formatted hit through `engine.debug`,
 *  5. returns the target together with `decision` and `diagnostics` summaries.
 *
 * @param engine Router engine; supplies the provider registry, sticky-session
 *   manager, analytics, stats center and debug logger used below.
 * @param metadata Request metadata; `requestId` and `entryEndpoint` are read here
 *   and it is used to resolve the sticky scope.
 * @param routingState Routing-instruction state used for the process mode,
 *   the routing mode and the hit record.
 * @param metadataInstructions First group of routing instructions; concatenated
 *   ahead of `instructions` when resolving the routing mode.
 * @param instructions Second group of routing instructions.
 * @param selectionResult Output of the selection phase: `selection`,
 *   `classification`, `requestedRoute` and `features`.
 * @returns An object with `target`, `decision` and `diagnostics`.
 */
export function finalizeRoutingDecision(engine, metadata, routingState, metadataInstructions, instructions, selectionResult) {
    const { selection, classification, requestedRoute, features } = selectionResult;
    const baseTarget = engine.providerRegistry.buildTarget(selection.providerKey);
    // The vision force flag is only consulted when the vision route was actually used.
    const forceVision = selection.routeUsed === 'vision' && engine.routeHasForceFlag('vision');
    const target = {
        ...baseTarget,
        ...(engine.webSearchForce ? { forceWebSearch: true } : {}),
        ...(forceVision ? { forceVision: true } : {})
    };
    const instructionProcessMode = engine.resolveInstructionProcessModeForSelection(selection.providerKey, routingState);
    if (instructionProcessMode) {
        target.processMode = instructionProcessMode;
    }
    // Resolve the session scope first, then fetch the sticky stores once
    // (the stores were previously fetched twice for the same call).
    const sessionKey = engine.resolveSessionScope(features.metadata);
    const { aliasLeaseStore, sessionAliasStore } = engine.stickySessionManager.getAllStores();
    recordAntigravitySessionLease({
        metadata: features.metadata,
        providerKey: selection.providerKey,
        sessionKey,
        providerRegistry: engine.providerRegistry,
        leaseStore: aliasLeaseStore,
        sessionAliasStore,
        persistence: engine.antigravityLeasePersistence,
        aliasReuseCooldownMs: engine.stickySessionManager.getAliasReuseCooldownMs(),
        commitSessionBinding: false,
        debug: engine.debug
    });
    const routingMode = resolveRoutingMode([...metadataInstructions, ...instructions], routingState);
    const hitReason = buildHitReason(selection.routeUsed, selection.providerKey, classification, features, routingMode, { providerRegistry: engine.providerRegistry, contextRouting: engine.contextRouting });
    // A sticky scope is only attached when some routing mode is active.
    const stickyScope = routingMode !== 'none' ? engine.resolveSessionScope(metadata) : undefined;
    // Sticky routing is reported under the 'sticky' route name in the hit record.
    const routeForLog = routingMode === 'sticky' ? 'sticky' : selection.routeUsed;
    const hitRecord = createVirtualRouterHitRecord({
        requestId: metadata.requestId,
        routeName: routeForLog,
        poolId: selection.poolId,
        providerKey: selection.providerKey,
        modelId: target.modelId || undefined,
        hitReason,
        stickyScope,
        routingState,
        requestTokens: features.estimatedTokens,
        selectionPenalty: engine.resolveSelectionPenalty(selection.providerKey)
    });
    // Analytics are keyed by the route actually used, not by the logged route name.
    engine.routeAnalytics.incrementRouteStat(selection.routeUsed, selection.providerKey, hitRecord);
    try {
        engine.statsCenter.recordVirtualRouterHit(toVirtualRouterHitEvent(hitRecord, {
            requestId: metadata.requestId,
            entryEndpoint: metadata.entryEndpoint || '/v1/chat/completions'
        }));
    }
    catch {
        // stats must never break routing
    }
    // Both former branches logged the formatted hit (the else branch merely
    // re-formatted the same record), so a single call is sufficient.
    // NOTE(review): assumes formatVirtualRouterHit is deterministic for a given record.
    const formatted = formatVirtualRouterHit(hitRecord);
    engine.debug?.log?.(formatted);
    // A fallback happened when the route that served the request differs from the requested one.
    const didFallback = selection.routeUsed !== requestedRoute;
    return {
        target,
        decision: {
            routeName: selection.routeUsed,
            providerKey: selection.providerKey,
            pool: selection.pool,
            poolId: selection.poolId,
            confidence: classification.confidence,
            reasoning: classification.reasoning,
            fallback: didFallback
        },
        diagnostics: {
            routeName: selection.routeUsed,
            providerKey: selection.providerKey,
            pool: selection.pool,
            poolId: selection.poolId,
            reasoning: classification.reasoning,
            fallback: didFallback,
            confidence: classification.confidence
        }
    };
}
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
import type { ProcessedRequest, StandardizedRequest } from '../../../conversion/hub/types/standardized.js';
|
|
2
|
+
import type { ClassificationResult, RoutingFeatures, RouterMetadataInput } from '../types.js';
|
|
3
|
+
import type { RoutingInstructionState } from '../routing-instructions.js';
|
|
4
|
+
import type { VirtualRouterEngine } from '../engine-legacy.js';
|
|
5
|
+
/**
 * Result of the routing selection phase, as returned by `selectRoutingTarget`.
 */
export type RoutingSelectionResult = {
    /**
     * Routing-instruction state after selection. It can differ from the state
     * passed in: the selector clears `preferTarget` when it decides the
     * preference can no longer be honoured.
     */
    routingState: RoutingInstructionState;
    /**
     * Route that was asked for: `'direct'`, `'prefer'`, or the normalized route
     * name taken from the classification.
     */
    requestedRoute: string;
    /** Classification that led to `requestedRoute`. */
    classification: ClassificationResult;
    /** The provider that was picked and the pool it came from. */
    selection: {
        /** Key of the selected provider; used to build the routing target. */
        providerKey: string;
        /** Route that actually served the request; compared with `requestedRoute` to detect a fallback. */
        routeUsed: string;
        /** Pool reported alongside the decision. */
        pool: Array<string>;
        /** Optional pool identifier (for example `'prefer-primary'` for prefer selections). */
        poolId?: string;
    };
    /** Routing features computed from the request and its metadata. */
    features: RoutingFeatures;
};
|
|
17
|
+
/**
 * Selects the provider target for a request.
 *
 * Resolution order: an explicit direct provider model parsed from
 * `request.model`, then the `preferTarget` stored in `routingState`, then
 * `metadata.routeHint`, and finally the engine's classifier.
 *
 * @param engine Router engine providing the registry, classifier and selection hooks.
 * @param request Request whose `model` and content drive routing.
 * @param metadata Router metadata; `routeHint` is honoured when set and non-blank.
 * @param routingState Current routing-instruction state.
 * @param stateKey Key under which an updated routing state is stored and persisted.
 * @returns The selection together with the (possibly updated) routing state.
 * @throws VirtualRouterError when a direct model is unknown for its provider
 *   or no provider is available for it.
 */
export declare function selectRoutingTarget(engine: VirtualRouterEngine, request: StandardizedRequest | ProcessedRequest, metadata: RouterMetadataInput, routingState: RoutingInstructionState, stateKey: string): RoutingSelectionResult;
|
|
@@ -0,0 +1,205 @@
|
|
|
1
|
+
import { DEFAULT_ROUTE, VirtualRouterError, VirtualRouterErrorCode } from '../types.js';
|
|
2
|
+
import { buildRoutingFeatures } from '../features.js';
|
|
3
|
+
import { persistRoutingInstructionState } from '../engine/routing-state/store.js';
|
|
4
|
+
import { selectDirectProviderModel, selectFromStickyPool as selectFromStickyPoolImpl } from '../engine/routing-pools/index.js';
|
|
5
|
+
/**
 * Selects the provider target for a request.
 *
 * Resolution order:
 *  1. Direct provider model parsed from `request.model`. The model must exist
 *     for the provider; unless the engine requests a media fallback, the
 *     provider is selected directly with route `'direct'`.
 *  2. `routingState.preferTarget`, evaluated before routing classification.
 *     When the preference cannot be honoured for a non-temporary reason it is
 *     cleared from the stored routing state.
 *  3. `metadata.routeHint` when set and non-blank.
 *  4. The engine's classifier.
 *
 * @param engine Router engine providing the registry, classifier, health and selection hooks.
 * @param request Request being routed; only `model` is read directly here.
 * @param metadata Router metadata; `routeHint` is honoured when non-blank.
 * @param routingState Current routing-instruction state.
 * @param stateKey Key under which an updated routing state is stored and persisted.
 * @returns `{ routingState, requestedRoute, classification, selection, features }`.
 * @throws VirtualRouterError `CONFIG_ERROR` when the direct model is unknown for
 *   its provider; `PROVIDER_NOT_AVAILABLE` when no provider can serve it.
 */
export function selectRoutingTarget(engine, request, metadata, routingState, stateKey) {
    const features = buildRoutingFeatures(request, metadata);
    const directProviderModel = engine.parseDirectProviderModel(request?.model);
    let classification;
    let requestedRoute;
    let selection = null;
    const selectionDeps = {
        routing: engine.routing,
        providerRegistry: engine.providerRegistry,
        healthManager: engine.healthManager,
        contextAdvisor: engine.contextAdvisor,
        loadBalancer: engine.loadBalancer,
        isProviderCoolingDown: (key) => engine.isProviderCoolingDown(key),
        resolveStickyKey: (m) => engine.resolveStickyKey(m),
        quotaView: engine.quotaView
    };
    // Shared tail for every classification-driven path: adopt the classification,
    // normalize its route name and let the engine pick a provider for it.
    const selectByClassification = (nextClassification) => {
        classification = nextClassification;
        requestedRoute = engine.normalizeRouteAlias(classification.routeName || DEFAULT_ROUTE);
        selection = engine.selectProvider(requestedRoute, metadata, classification, features, routingState);
    };
    if (directProviderModel) {
        const forceMediaFallback = engine.shouldFallbackDirectModelForMedia(directProviderModel, features);
        const { providerId, modelId } = directProviderModel;
        if (!providerOffersModel(engine.providerRegistry, providerId, modelId)) {
            throw new VirtualRouterError(`Unknown model ${modelId} for provider ${providerId}`, VirtualRouterErrorCode.CONFIG_ERROR, { providerId, modelId });
        }
        if (forceMediaFallback) {
            // The direct model is bypassed; fall back to normal classification.
            selectByClassification(engine.classifier.classify(features));
        }
        else {
            const directSelection = selectDirectProviderModel(providerId, modelId, metadata, features, routingState, selectionDeps);
            if (!directSelection) {
                throw new VirtualRouterError(`All providers unavailable for model ${providerId}.${modelId}`, VirtualRouterErrorCode.PROVIDER_NOT_AVAILABLE, { providerId, modelId });
            }
            classification = {
                routeName: 'direct',
                confidence: 1,
                reasoning: `direct_model:${providerId}.${modelId}`,
                fallback: false,
                candidates: ['direct']
            };
            requestedRoute = 'direct';
            selection = directSelection;
        }
    }
    else {
        // Prefer target (from "<**!provider.model**>") is evaluated before routing classification.
        const preferTarget = routingState.preferTarget;
        if (preferTarget && typeof preferTarget.provider === 'string' && preferTarget.provider.trim()) {
            const providerId = preferTarget.provider.trim();
            const keyAlias = typeof preferTarget.keyAlias === 'string' ? preferTarget.keyAlias.trim() : '';
            const modelId = typeof preferTarget.model === 'string' ? preferTarget.model.trim() : '';
            const keyIndex = typeof preferTarget.keyIndex === 'number' && Number.isFinite(preferTarget.keyIndex)
                ? Math.floor(preferTarget.keyIndex)
                : undefined;
            // Only a positive index pins a runtime key; anything else falls back to model matching.
            const pinnedByKeyIndex = keyIndex !== undefined && keyIndex > 0;
            const candidateKeys = collectPreferCandidateKeys(engine.providerRegistry, providerId, pinnedByKeyIndex ? keyIndex : undefined, keyAlias, modelId);
            // Alias rotation is allowed only when the preference names neither an alias nor a key index.
            const allowAliasRotation = !keyAlias && keyIndex === undefined;
            const eligibleKeys = filterEligiblePreferKeys(engine, candidateKeys, selectionDeps.quotaView);
            const preferSelection = eligibleKeys.length > 0
                ? selectFromStickyPoolImpl(new Set(eligibleKeys), metadata, features, routingState, selectionDeps, {
                    allowAliasRotation
                })
                : null;
            if (preferSelection) {
                classification = {
                    routeName: 'prefer',
                    confidence: 1,
                    // Label reflects how the candidates were found: previously a non-positive
                    // keyIndex was reported as `prefer_key` although matching was done by model.
                    reasoning: pinnedByKeyIndex ? `prefer_key:${providerId}.${keyIndex}` : `prefer_model:${providerId}.${modelId}`,
                    fallback: false,
                    candidates: ['prefer']
                };
                requestedRoute = 'prefer';
                selection = {
                    ...preferSelection,
                    routeUsed: 'prefer',
                    poolId: 'prefer-primary'
                };
            }
            else if (routingState.preferTarget && shouldAutoClearPreferTarget(candidateKeys, eligibleKeys, selectionDeps)) {
                // Drop the preference from both the in-memory and the persisted state.
                routingState = {
                    ...routingState,
                    preferTarget: undefined
                };
                engine.routingInstructionState.set(stateKey, routingState);
                persistRoutingInstructionState(stateKey, routingState, engine.routingStateStore);
            }
        }
        if (!selection) {
            // An explicit, non-blank route hint overrides the classifier.
            const routeHint = metadata.routeHint && metadata.routeHint.trim();
            selectByClassification(routeHint
                ? {
                    routeName: routeHint,
                    confidence: 1,
                    reasoning: `route_hint:${routeHint}`,
                    fallback: false,
                    candidates: [routeHint]
                }
                : engine.classifier.classify(features));
        }
    }
    return {
        routingState,
        requestedRoute,
        classification: classification,
        selection: selection,
        features
    };
}
/** Reports whether any key of `providerId` resolves to a profile with `modelId`; lookup errors are skipped. */
function providerOffersModel(providerRegistry, providerId, modelId) {
    for (const key of providerRegistry.listProviderKeys(providerId)) {
        try {
            if (providerRegistry.get(key)?.modelId === modelId) {
                return true;
            }
        }
        catch {
            // A key whose profile cannot be read is ignored.
        }
    }
    return false;
}
/** Lists the provider keys matching a prefer target: the pinned runtime key, or every key serving `modelId` (optionally within `keyAlias`). */
function collectPreferCandidateKeys(providerRegistry, providerId, pinnedKeyIndex, keyAlias, modelId) {
    if (pinnedKeyIndex !== undefined) {
        const runtimeKey = providerRegistry.resolveRuntimeKeyByIndex(providerId, pinnedKeyIndex);
        return runtimeKey ? [runtimeKey] : [];
    }
    if (!modelId) {
        return [];
    }
    // Keys are restricted to "<provider>.<alias>." only when an alias was requested.
    const aliasPrefix = keyAlias ? `${providerId}.${keyAlias}.` : '';
    const matches = [];
    for (const key of providerRegistry.listProviderKeys(providerId)) {
        if (aliasPrefix && !key.startsWith(aliasPrefix)) {
            continue;
        }
        try {
            if (providerRegistry.get(key)?.modelId === modelId) {
                matches.push(key);
            }
        }
        catch {
            // A key whose profile cannot be read is ignored.
        }
    }
    return matches;
}
/** Keeps the candidate keys that are usable right now, judged by the quota view when present, otherwise by cooldown and health. */
function filterEligiblePreferKeys(engine, candidateKeys, quotaView) {
    if (candidateKeys.length === 0) {
        return [];
    }
    if (!quotaView) {
        return candidateKeys.filter((key) => !engine.isProviderCoolingDown(key) && engine.healthManager.isAvailable(key));
    }
    const now = Date.now();
    return candidateKeys.filter((key) => {
        const entry = quotaView(key);
        if (!entry) {
            // No quota record for the key: treated as eligible.
            return true;
        }
        if (!entry.inPool) {
            return false;
        }
        if (entry.cooldownUntil && entry.cooldownUntil > now) {
            return false;
        }
        if (entry.blacklistUntil && entry.blacklistUntil > now) {
            return false;
        }
        return true;
    });
}
/**
 * Decides whether a prefer target that produced no selection should be cleared.
 * Auto-clear only when the target becomes invalid or blocked by explicit routing instructions.
 * Do NOT clear for temporary unavailability (e.g. 429 cooldown, quota cooldown, transient health).
 */
function shouldAutoClearPreferTarget(candidateKeys, eligibleKeys, selectionDeps) {
    if (candidateKeys.length === 0) {
        return true;
    }
    // Prefer selection failed despite eligible keys existing: treat as a hard block (e.g. routing rules).
    if (eligibleKeys.length > 0) {
        return true;
    }
    if (!selectionDeps.quotaView) {
        return false;
    }
    // If quota explicitly marks the preferred target as out-of-pool, clear the prefer instruction so
    // the router can fall back to other targets without repeatedly retrying an impossible preference.
    return candidateKeys.some((key) => {
        const entry = selectionDeps.quotaView(key);
        return Boolean(entry && entry.inPool === false);
    });
}
|
|
@@ -0,0 +1,3 @@
|
|
|
1
|
+
import type { RoutingInstructionState } from '../routing-instructions.js';
|
|
2
|
+
import type { VirtualRouterEngine } from '../engine-legacy.js';
|
|
3
|
+
/**
 * Validates the provider allowlist in `routingState` against the providers
 * referenced by the engine's routing pools.
 *
 * When the allowlist is non-empty but shares no provider with the routing
 * pools, a copy of the state with an empty allowlist is stored under
 * `stateKey`, persisted, and returned; otherwise the given state is returned
 * unchanged.
 *
 * @param engine Router engine whose `routing` pools and state store are used.
 * @param routingState Current routing-instruction state.
 * @param stateKey Key under which a replaced state is stored and persisted.
 * @returns The state to use from here on.
 */
export declare function enforceAllowlistIntersection(engine: VirtualRouterEngine, routingState: RoutingInstructionState, stateKey: string): RoutingInstructionState;
|
|
@@ -0,0 +1,36 @@
|
|
|
1
|
+
import { extractProviderId } from '../engine/provider-key/parse.js';
|
|
2
|
+
import { persistRoutingInstructionState } from '../engine/routing-state/store.js';
|
|
3
|
+
/**
 * Drops a provider allowlist that cannot match anything in the routing table.
 *
 * An empty allowlist is left alone. Otherwise the provider ids behind every
 * target key in `engine.routing` are gathered; if none of them appears in the
 * allowlist, a copy of the state with an empty allowlist is stored under
 * `stateKey`, persisted, and returned. In all other cases the original state
 * object is returned untouched.
 *
 * @param engine Router engine; `routing`, `routingInstructionState` and
 *   `routingStateStore` are read.
 * @param routingState Current routing-instruction state.
 * @param stateKey Key used when storing and persisting a replaced state.
 * @returns Either `routingState` itself or the replacement with a cleared allowlist.
 */
export function enforceAllowlistIntersection(engine, routingState, stateKey) {
    const { allowedProviders } = routingState;
    if (allowedProviders.size === 0) {
        return routingState;
    }
    // Gather the provider id of every string target key found in any routing pool.
    const routedProviderIds = new Set();
    Object.values(engine.routing).forEach((routePools) => {
        if (!Array.isArray(routePools)) {
            return;
        }
        routePools.forEach((routePool) => {
            const targets = routePool ? routePool.targets : undefined;
            if (!Array.isArray(targets)) {
                return;
            }
            targets.forEach((targetKey) => {
                if (typeof targetKey === 'string' && targetKey) {
                    const routedId = extractProviderId(targetKey);
                    if (routedId) {
                        routedProviderIds.add(routedId);
                    }
                }
            });
        });
    });
    // Non-string allowlist entries never count as a match.
    const overlaps = Array.from(allowedProviders)
        .some((candidate) => typeof candidate === 'string' && routedProviderIds.has(candidate));
    if (overlaps) {
        return routingState;
    }
    // Nothing allowed is routable: replace the state with one whose allowlist is empty.
    const clearedState = {
        ...routingState,
        allowedProviders: new Set()
    };
    engine.routingInstructionState.set(stateKey, clearedState);
    persistRoutingInstructionState(stateKey, clearedState, engine.routingStateStore);
    return clearedState;
}
|
|
@@ -0,0 +1,12 @@
|
|
|
1
|
+
import type { ProcessedRequest, StandardizedRequest } from '../../../conversion/hub/types/standardized.js';
|
|
2
|
+
import type { RouterMetadataInput } from '../types.js';
|
|
3
|
+
import type { RoutingInstruction, RoutingInstructionState } from '../routing-instructions.js';
|
|
4
|
+
import type { VirtualRouterEngine } from '../engine-legacy.js';
|
|
5
|
+
/**
 * Result of `buildRoutingState`.
 *
 * NOTE(review): the producing implementation is not visible here; the field
 * notes below describe how consumers use the values and should be confirmed
 * against it.
 */
export type RoutingStateResult = {
    /** Routing-instruction state to use for the request. */
    routingState: RoutingInstructionState;
    /** Key identifying the stored routing state — presumably the key later used to store and persist updates. */
    stateKey: string;
    /** Optional scope for stop-message handling — semantics not visible here; TODO confirm. */
    stopMessageScope?: string;
    /** Routing instructions kept separately from `instructions` — presumably those derived from request metadata. */
    metadataInstructions: Array<RoutingInstruction>;
    /** Remaining routing instructions — presumably those parsed from the request itself. */
    instructions: Array<RoutingInstruction>;
};
|
|
12
|
+
/**
 * Builds the routing state for a request.
 *
 * NOTE(review): the implementation is not visible here — presumably it parses
 * routing instructions from the request and metadata and resolves the state
 * key; confirm against route-state.js.
 *
 * @param engine Router engine the state is built for.
 * @param request Standardized or processed request.
 * @param metadata Router metadata accompanying the request.
 * @returns The routing state, its state key and the parsed instruction lists.
 */
export declare function buildRoutingState(engine: VirtualRouterEngine, request: StandardizedRequest | ProcessedRequest, metadata: RouterMetadataInput): RoutingStateResult;
|