@jsonstudio/llms 0.6.2172 → 0.6.2979
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +2 -0
- package/dist/conversion/compat/antigravity-session-signature.js +35 -1
- package/dist/conversion/compat/profiles/chat-gemini-cli.json +0 -7
- package/dist/conversion/compat/profiles/chat-gemini.json +0 -6
- package/dist/conversion/hub/core/detour-registry.d.ts +2 -0
- package/dist/conversion/hub/core/hub-context.d.ts +3 -1
- package/dist/conversion/hub/core/index.d.ts +1 -0
- package/dist/conversion/hub/core/stage-driver.js +2 -0
- package/dist/conversion/hub/format-adapters/anthropic-format-adapter.js +15 -4
- package/dist/conversion/hub/format-adapters/chat-format-adapter.js +15 -4
- package/dist/conversion/hub/format-adapters/gemini-format-adapter.js +15 -4
- package/dist/conversion/hub/format-adapters/responses-format-adapter.js +15 -4
- package/dist/conversion/hub/hub-feature.js +3 -2
- package/dist/conversion/hub/node-support.js +9 -4
- package/dist/conversion/hub/operation-table/operation-table-runner.js +10 -6
- package/dist/conversion/hub/operation-table/semantic-mappers/anthropic-mapper.js +2 -2
- package/dist/conversion/hub/operation-table/semantic-mappers/chat-mapper.js +10 -10
- package/dist/conversion/hub/operation-table/semantic-mappers/gemini-mapper.js +4 -8
- package/dist/conversion/hub/operation-table/semantic-mappers/responses-mapper.js +19 -65
- package/dist/conversion/hub/ops/operations.js +2 -121
- package/dist/conversion/hub/pipeline/compat/compat-engine.js +6 -0
- package/dist/conversion/hub/pipeline/compat/compat-pipeline-executor.d.ts +1 -1
- package/dist/conversion/hub/pipeline/compat/compat-pipeline-executor.js +33 -1042
- package/dist/conversion/hub/pipeline/compat/compat-profile-resolver.js +2 -0
- package/dist/conversion/hub/pipeline/compat/compat-profile-store.js +2 -0
- package/dist/conversion/hub/pipeline/compat/compat-types.d.ts +14 -17
- package/dist/conversion/hub/pipeline/compat/native-adapter-context.d.ts +3 -0
- package/dist/conversion/hub/pipeline/compat/native-adapter-context.js +39 -0
- package/dist/conversion/hub/pipeline/hub-pipeline.js +115 -262
- package/dist/conversion/hub/pipeline/session-identifiers.js +6 -196
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage1_format_parse/index.d.ts +1 -2
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage1_format_parse/index.js +37 -1
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage2_semantic_map/index.js +12 -86
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage2_semantic_map/semantic-lift.d.ts +14 -0
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage2_semantic_map/semantic-lift.js +24 -0
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/archive/shell-like-tool-call-normalization-fallback.d.ts +2 -0
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/archive/shell-like-tool-call-normalization-fallback.js +157 -0
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/context-capture-orchestration.d.ts +16 -0
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/context-capture-orchestration.js +29 -0
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/context-factories.js +3 -1
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/index.d.ts +2 -15
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/index.js +8 -595
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/responses-context-snapshot.d.ts +8 -0
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/responses-context-snapshot.js +28 -0
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/tool-output-diagnostics.d.ts +2 -0
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/tool-output-diagnostics.js +4 -0
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/tool-output-snapshot.d.ts +10 -0
- package/dist/conversion/hub/pipeline/stages/req_inbound/req_inbound_stage3_context_capture/tool-output-snapshot.js +12 -0
- package/dist/conversion/hub/pipeline/stages/req_outbound/req_outbound_stage1_semantic_map/context-merge.d.ts +3 -0
- package/dist/conversion/hub/pipeline/stages/req_outbound/req_outbound_stage1_semantic_map/context-merge.js +30 -0
- package/dist/conversion/hub/pipeline/stages/req_outbound/req_outbound_stage1_semantic_map/index.js +9 -129
- package/dist/conversion/hub/pipeline/stages/req_outbound/req_outbound_stage2_format_build/index.d.ts +1 -4
- package/dist/conversion/hub/pipeline/stages/req_outbound/req_outbound_stage2_format_build/index.js +9 -26
- package/dist/conversion/hub/pipeline/stages/req_outbound/req_outbound_stage3_compat/index.js +32 -14
- package/dist/conversion/hub/pipeline/stages/req_process/req_process_stage1_tool_governance/index.d.ts +2 -2
- package/dist/conversion/hub/pipeline/stages/req_process/req_process_stage1_tool_governance/index.js +48 -8
- package/dist/conversion/hub/pipeline/stages/req_process/req_process_stage2_route_select/index.js +18 -3
- package/dist/conversion/hub/pipeline/stages/resp_inbound/resp_inbound_stage1_sse_decode/index.js +10 -198
- package/dist/conversion/hub/pipeline/stages/resp_inbound/resp_inbound_stage1_sse_decode/stream-json-sniffer.d.ts +3 -0
- package/dist/conversion/hub/pipeline/stages/resp_inbound/resp_inbound_stage1_sse_decode/stream-json-sniffer.js +81 -0
- package/dist/conversion/hub/pipeline/stages/resp_inbound/resp_inbound_stage2_format_parse/index.d.ts +1 -2
- package/dist/conversion/hub/pipeline/stages/resp_inbound/resp_inbound_stage2_format_parse/index.js +36 -1
- package/dist/conversion/hub/pipeline/stages/resp_inbound/resp_inbound_stage3_semantic_map/index.js +3 -1
- package/dist/conversion/hub/pipeline/stages/resp_outbound/resp_outbound_stage1_client_remap/chat-process-semantics-bridge.d.ts +6 -0
- package/dist/conversion/hub/pipeline/stages/resp_outbound/resp_outbound_stage1_client_remap/chat-process-semantics-bridge.js +17 -0
- package/dist/conversion/hub/pipeline/stages/resp_outbound/resp_outbound_stage1_client_remap/client-remap-protocol-switch.d.ts +9 -0
- package/dist/conversion/hub/pipeline/stages/resp_outbound/resp_outbound_stage1_client_remap/client-remap-protocol-switch.js +28 -0
- package/dist/conversion/hub/pipeline/stages/resp_outbound/resp_outbound_stage1_client_remap/index.d.ts +1 -2
- package/dist/conversion/hub/pipeline/stages/resp_outbound/resp_outbound_stage1_client_remap/index.js +14 -102
- package/dist/conversion/hub/pipeline/stages/resp_outbound/resp_outbound_stage2_sse_stream/index.js +3 -1
- package/dist/conversion/hub/pipeline/stages/resp_process/resp_process_stage1_tool_governance/index.js +12 -10
- package/dist/conversion/hub/pipeline/stages/resp_process/resp_process_stage2_finalize/index.js +6 -5
- package/dist/conversion/hub/pipeline/stages/resp_process/resp_process_stage3_servertool_orchestration/index.d.ts +11 -1
- package/dist/conversion/hub/pipeline/stages/resp_process/resp_process_stage3_servertool_orchestration/index.js +10 -32
- package/dist/conversion/hub/pipeline/stages/utils.js +17 -1
- package/dist/conversion/hub/pipeline/target-utils.js +14 -91
- package/dist/conversion/hub/pipelines/inbound.js +3 -1
- package/dist/conversion/hub/pipelines/outbound.js +2 -0
- package/dist/conversion/hub/policy/policy-engine.js +9 -3
- package/dist/conversion/hub/policy/protocol-spec.js +20 -148
- package/dist/conversion/hub/process/chat-process-anthropic-alias.d.ts +2 -0
- package/dist/conversion/hub/process/chat-process-anthropic-alias.js +36 -0
- package/dist/conversion/hub/process/chat-process-clock-directive-parser.d.ts +5 -0
- package/dist/conversion/hub/process/chat-process-clock-directive-parser.js +48 -0
- package/dist/conversion/hub/process/chat-process-clock-directives.d.ts +24 -0
- package/dist/conversion/hub/process/chat-process-clock-directives.js +98 -0
- package/dist/conversion/hub/process/chat-process-clock-reminder-directives.d.ts +8 -0
- package/dist/conversion/hub/process/chat-process-clock-reminder-directives.js +42 -0
- package/dist/conversion/hub/process/chat-process-clock-reminder-finalize.d.ts +14 -0
- package/dist/conversion/hub/process/chat-process-clock-reminder-finalize.js +10 -0
- package/dist/conversion/hub/process/chat-process-clock-reminder-messages.d.ts +5 -0
- package/dist/conversion/hub/process/chat-process-clock-reminder-messages.js +10 -0
- package/dist/conversion/hub/process/chat-process-clock-reminder-orchestration.d.ts +30 -0
- package/dist/conversion/hub/process/chat-process-clock-reminder-orchestration.js +68 -0
- package/dist/conversion/hub/process/chat-process-clock-reminder-time-tag.d.ts +9 -0
- package/dist/conversion/hub/process/chat-process-clock-reminder-time-tag.js +18 -0
- package/dist/conversion/hub/process/chat-process-clock-reminders.d.ts +2 -0
- package/dist/conversion/hub/process/chat-process-clock-reminders.js +104 -0
- package/dist/conversion/hub/process/chat-process-clock-tool-schemas.d.ts +3 -0
- package/dist/conversion/hub/process/chat-process-clock-tool-schemas.js +233 -0
- package/dist/conversion/hub/process/chat-process-clock-tools.d.ts +6 -0
- package/dist/conversion/hub/process/chat-process-clock-tools.js +41 -0
- package/dist/conversion/hub/process/chat-process-continue-execution.d.ts +11 -0
- package/dist/conversion/hub/process/chat-process-continue-execution.js +82 -0
- package/dist/conversion/hub/process/chat-process-governance-context.d.ts +15 -0
- package/dist/conversion/hub/process/chat-process-governance-context.js +7 -0
- package/dist/conversion/hub/process/chat-process-governance-finalize.d.ts +16 -0
- package/dist/conversion/hub/process/chat-process-governance-finalize.js +11 -0
- package/dist/conversion/hub/process/chat-process-governance-orchestration.d.ts +9 -0
- package/dist/conversion/hub/process/chat-process-governance-orchestration.js +47 -0
- package/dist/conversion/hub/process/chat-process-governed-control-ops.d.ts +8 -0
- package/dist/conversion/hub/process/chat-process-governed-control-ops.js +5 -0
- package/dist/conversion/hub/process/chat-process-governed-filter-call.d.ts +12 -0
- package/dist/conversion/hub/process/chat-process-governed-filter-call.js +18 -0
- package/dist/conversion/hub/process/chat-process-governed-merge.d.ts +8 -0
- package/dist/conversion/hub/process/chat-process-governed-merge.js +11 -0
- package/dist/conversion/hub/process/chat-process-media.d.ts +3 -0
- package/dist/conversion/hub/process/chat-process-media.js +18 -0
- package/dist/conversion/hub/process/chat-process-node-result.d.ts +23 -0
- package/dist/conversion/hub/process/chat-process-node-result.js +24 -0
- package/dist/conversion/hub/process/chat-process-pending-tool-sync.d.ts +14 -0
- package/dist/conversion/hub/process/chat-process-pending-tool-sync.js +52 -0
- package/dist/conversion/hub/process/chat-process-post-governed-normalization.d.ts +8 -0
- package/dist/conversion/hub/process/chat-process-post-governed-normalization.js +16 -0
- package/dist/conversion/hub/process/chat-process-review.d.ts +2 -0
- package/dist/conversion/hub/process/chat-process-review.js +8 -0
- package/dist/conversion/hub/process/chat-process-servertool-orchestration.d.ts +8 -0
- package/dist/conversion/hub/process/chat-process-servertool-orchestration.js +22 -0
- package/dist/conversion/hub/process/chat-process-tool-normalization.d.ts +2 -0
- package/dist/conversion/hub/process/chat-process-tool-normalization.js +4 -0
- package/dist/conversion/hub/process/chat-process-web-search-intent.d.ts +12 -0
- package/dist/conversion/hub/process/chat-process-web-search-intent.js +13 -0
- package/dist/conversion/hub/process/chat-process-web-search-tool-schema.d.ts +3 -0
- package/dist/conversion/hub/process/chat-process-web-search-tool-schema.js +4 -0
- package/dist/conversion/hub/process/chat-process-web-search.d.ts +8 -0
- package/dist/conversion/hub/process/chat-process-web-search.js +26 -0
- package/dist/conversion/hub/process/chat-process.d.ts +2 -19
- package/dist/conversion/hub/process/chat-process.js +12 -1701
- package/dist/conversion/hub/process/client-inject-readiness.d.ts +1 -0
- package/dist/conversion/hub/process/client-inject-readiness.js +4 -0
- package/dist/conversion/hub/registry.js +5 -2
- package/dist/conversion/hub/response/chat-response-utils.js +5 -86
- package/dist/conversion/hub/response/provider-response.d.ts +9 -0
- package/dist/conversion/hub/response/provider-response.js +6 -21
- package/dist/conversion/hub/response/response-mappers.js +2 -26
- package/dist/conversion/hub/response/response-runtime.js +2 -93
- package/dist/conversion/hub/semantic-mappers/anthropic-mapper.d.ts +1 -0
- package/dist/conversion/hub/semantic-mappers/anthropic-mapper.js +1 -0
- package/dist/conversion/hub/semantic-mappers/chat-mapper.d.ts +1 -0
- package/dist/conversion/hub/semantic-mappers/chat-mapper.js +1 -0
- package/dist/conversion/hub/semantic-mappers/gemini-mapper.d.ts +1 -0
- package/dist/conversion/hub/semantic-mappers/gemini-mapper.js +1 -0
- package/dist/conversion/hub/semantic-mappers/responses-mapper.d.ts +1 -0
- package/dist/conversion/hub/semantic-mappers/responses-mapper.js +1 -0
- package/dist/conversion/hub/snapshot-recorder.js +10 -3
- package/dist/conversion/hub/standardized-bridge.js +11 -288
- package/dist/conversion/hub/tool-governance/engine.js +5 -0
- package/dist/conversion/hub/tool-governance/rules.js +10 -10
- package/dist/conversion/hub/tool-session-compat.d.ts +2 -2
- package/dist/conversion/hub/tool-session-compat.js +17 -231
- package/dist/conversion/hub/tool-surface/tool-surface-engine.js +5 -3
- package/dist/conversion/responses/responses-host-policy.js +2 -12
- package/dist/conversion/responses/responses-openai-bridge/response-payload.js +6 -82
- package/dist/conversion/responses/responses-openai-bridge/types.d.ts +1 -0
- package/dist/conversion/responses/responses-openai-bridge.js +21 -54
- package/dist/conversion/shared/anthropic-message-utils.js +151 -13
- package/dist/conversion/shared/args-mapping.js +2 -146
- package/dist/conversion/shared/bridge-actions.js +203 -718
- package/dist/conversion/shared/bridge-id-utils.js +5 -71
- package/dist/conversion/shared/bridge-instructions.js +2 -1
- package/dist/conversion/shared/bridge-message-types.d.ts +2 -0
- package/dist/conversion/shared/bridge-message-utils.js +1 -2
- package/dist/conversion/shared/bridge-metadata.d.ts +1 -0
- package/dist/conversion/shared/bridge-metadata.js +4 -0
- package/dist/conversion/shared/bridge-policies.js +5 -189
- package/dist/conversion/shared/chat-envelope-validator.js +2 -126
- package/dist/conversion/shared/chat-output-normalizer.js +2 -54
- package/dist/conversion/shared/compaction-detect.js +2 -57
- package/dist/conversion/shared/gemini-tool-utils.js +9 -524
- package/dist/conversion/shared/jsonish.js +3 -160
- package/dist/conversion/shared/mcp-injection.js +3 -169
- package/dist/conversion/shared/media.js +2 -7
- package/dist/conversion/shared/metadata-passthrough.js +9 -46
- package/dist/conversion/shared/openai-finalizer.js +2 -1
- package/dist/conversion/shared/openai-message-normalize.js +11 -283
- package/dist/conversion/shared/output-content-normalizer.js +9 -112
- package/dist/conversion/shared/payload-budget.js +2 -85
- package/dist/conversion/shared/protocol-state.js +11 -7
- package/dist/conversion/shared/reasoning-mapping.js +2 -6
- package/dist/conversion/shared/reasoning-normalizer.js +4 -1
- package/dist/conversion/shared/reasoning-tool-normalizer.js +14 -126
- package/dist/conversion/shared/reasoning-tool-parser.js +4 -87
- package/dist/conversion/shared/reasoning-utils.js +2 -6
- package/dist/conversion/shared/responses-conversation-store.js +4 -82
- package/dist/conversion/shared/responses-output-builder.js +11 -47
- package/dist/conversion/shared/responses-reasoning-registry.js +7 -1
- package/dist/conversion/shared/responses-request-adapter.d.ts +7 -1
- package/dist/conversion/shared/responses-request-adapter.js +14 -1
- package/dist/conversion/shared/responses-response-utils.js +6 -7
- package/dist/conversion/shared/responses-tool-utils.d.ts +1 -0
- package/dist/conversion/shared/responses-tool-utils.js +90 -14
- package/dist/conversion/shared/runtime-metadata.js +13 -5
- package/dist/conversion/shared/streaming-text-extractor.js +2 -7
- package/dist/conversion/shared/text-markup-normalizer/normalize.d.ts +1 -1
- package/dist/conversion/shared/text-markup-normalizer/normalize.js +43 -17
- package/dist/conversion/shared/text-markup-normalizer.d.ts +1 -0
- package/dist/conversion/shared/text-markup-normalizer.js +1 -0
- package/dist/conversion/shared/thought-signature-validator.js +3 -2
- package/dist/conversion/shared/tool-argument-repairer.js +2 -2
- package/dist/conversion/shared/tool-call-id-manager.js +5 -7
- package/dist/conversion/shared/tool-call-utils.js +3 -45
- package/dist/conversion/shared/tool-canonicalizer.js +25 -29
- package/dist/conversion/shared/tool-filter-pipeline.js +4 -99
- package/dist/conversion/shared/tool-governor.d.ts +6 -0
- package/dist/conversion/shared/tool-governor.js +43 -125
- package/dist/conversion/shared/tool-harvester.js +2 -8
- package/dist/conversion/shared/tool-mapping.js +2 -5
- package/dist/conversion/shared/tooling.d.ts +0 -4
- package/dist/conversion/shared/tooling.js +18 -0
- package/dist/native/router_hotpath_napi.node +0 -0
- package/dist/router/virtual-router/engine/provider-key/parse.d.ts +1 -6
- package/dist/router/virtual-router/engine/provider-key/parse.js +1 -43
- package/dist/router/virtual-router/engine/routing-state/store.js +48 -12
- package/dist/router/virtual-router/engine-logging.js +4 -3
- package/dist/router/virtual-router/engine-selection/alias-selection.js +45 -83
- package/dist/router/virtual-router/engine-selection/key-parsing.js +9 -23
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-directive-parser.d.ts +20 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-directive-parser.js +163 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-reminder-directives.d.ts +7 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-reminder-directives.js +103 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-reminder-orchestration-semantics.d.ts +10 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-reminder-orchestration-semantics.js +110 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-reminder-semantics.d.ts +8 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-reminder-semantics.js +281 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-reminder-time-tag-semantics.d.ts +1 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-reminder-time-tag-semantics.js +25 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-reminders-semantics.d.ts +4 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-reminders-semantics.js +44 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-tool-schema-semantics.d.ts +2 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-clock-tool-schema-semantics.js +62 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-governance-semantics.d.ts +40 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-governance-semantics.js +484 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-governed-filter-semantics.d.ts +9 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-governed-filter-semantics.js +64 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-node-result-semantics.d.ts +5 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-node-result-semantics.js +163 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-post-governed-normalization-semantics.d.ts +1 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-post-governed-normalization-semantics.js +49 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-servertool-orchestration-semantics.d.ts +30 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-servertool-orchestration-semantics.js +446 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-web-search-intent-semantics.d.ts +1 -0
- package/dist/router/virtual-router/engine-selection/native-chat-process-web-search-intent-semantics.js +49 -0
- package/dist/router/virtual-router/engine-selection/native-hub-bridge-action-semantics.d.ts +134 -0
- package/dist/router/virtual-router/engine-selection/native-hub-bridge-action-semantics.js +729 -0
- package/dist/router/virtual-router/engine-selection/native-hub-bridge-policy-semantics.d.ts +62 -0
- package/dist/router/virtual-router/engine-selection/native-hub-bridge-policy-semantics.js +338 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-edge-stage-semantics.d.ts +18 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-edge-stage-semantics.js +317 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-inbound-outbound-semantics.d.ts +22 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-inbound-outbound-semantics.js +426 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-orchestration-semantics.d.ts +57 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-orchestration-semantics.js +705 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-req-inbound-semantics.d.ts +46 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-req-inbound-semantics.js +503 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-req-outbound-semantics.d.ts +146 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-req-outbound-semantics.js +570 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-req-process-semantics.d.ts +25 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-req-process-semantics.js +148 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-resp-semantics.d.ts +25 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-resp-semantics.js +637 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-session-identifiers-semantics.d.ts +11 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-session-identifiers-semantics.js +207 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-target-semantics.d.ts +3 -0
- package/dist/router/virtual-router/engine-selection/native-hub-pipeline-target-semantics.js +128 -0
- package/dist/router/virtual-router/engine-selection/native-router-hotpath-analysis.d.ts +57 -0
- package/dist/router/virtual-router/engine-selection/native-router-hotpath-analysis.js +217 -0
- package/dist/router/virtual-router/engine-selection/native-router-hotpath-loader.d.ts +5 -0
- package/dist/router/virtual-router/engine-selection/native-router-hotpath-loader.js +284 -0
- package/dist/router/virtual-router/engine-selection/native-router-hotpath-policy.d.ts +5 -0
- package/dist/router/virtual-router/engine-selection/native-router-hotpath-policy.js +18 -0
- package/dist/router/virtual-router/engine-selection/native-router-hotpath-quota-buckets.d.ts +25 -0
- package/dist/router/virtual-router/engine-selection/native-router-hotpath-quota-buckets.js +85 -0
- package/dist/router/virtual-router/engine-selection/native-router-hotpath.d.ts +59 -0
- package/dist/router/virtual-router/engine-selection/native-router-hotpath.js +117 -0
- package/dist/router/virtual-router/engine-selection/native-shared-conversion-semantics.d.ts +76 -0
- package/dist/router/virtual-router/engine-selection/native-shared-conversion-semantics.js +1166 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-alias-selection-semantics.d.ts +16 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-alias-selection-semantics.js +96 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-stop-message-actions-semantics.d.ts +6 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-stop-message-actions-semantics.js +85 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-stop-message-semantics.d.ts +9 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-stop-message-semantics.js +70 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-stop-message-state-semantics.d.ts +2 -0
- package/dist/router/virtual-router/engine-selection/native-virtual-router-stop-message-state-semantics.js +76 -0
- package/dist/router/virtual-router/engine-selection/route-utils.js +1 -1
- package/dist/router/virtual-router/engine-selection/tier-selection-antigravity-session-lease.d.ts +10 -0
- package/dist/router/virtual-router/engine-selection/tier-selection-antigravity-session-lease.js +231 -0
- package/dist/router/virtual-router/engine-selection/tier-selection-antigravity-target-split.d.ts +4 -0
- package/dist/router/virtual-router/engine-selection/tier-selection-antigravity-target-split.js +43 -0
- package/dist/router/virtual-router/engine-selection/tier-selection-quota-integration.d.ts +27 -0
- package/dist/router/virtual-router/engine-selection/tier-selection-quota-integration.js +116 -0
- package/dist/router/virtual-router/engine-selection/tier-selection-select.d.ts +1 -1
- package/dist/router/virtual-router/engine-selection/tier-selection-select.js +29 -129
- package/dist/router/virtual-router/engine-selection/tier-selection.js +2 -265
- package/dist/router/virtual-router/engine.js +258 -249
- package/dist/router/virtual-router/features.js +2 -2
- package/dist/router/virtual-router/routing-instructions.d.ts +5 -7
- package/dist/router/virtual-router/routing-instructions.js +93 -66
- package/dist/router/virtual-router/routing-stop-message-actions.js +91 -112
- package/dist/router/virtual-router/routing-stop-message-parser.js +9 -132
- package/dist/router/virtual-router/routing-stop-message-state-codec.d.ts +1 -0
- package/dist/router/virtual-router/routing-stop-message-state-codec.js +58 -71
- package/dist/router/virtual-router/sticky-session-store.js +4 -2
- package/dist/router/virtual-router/stop-message-file-resolver.d.ts +1 -0
- package/dist/router/virtual-router/stop-message-file-resolver.js +10 -0
- package/dist/router/virtual-router/stop-message-state-sync.d.ts +1 -1
- package/dist/router/virtual-router/stop-message-state-sync.js +3 -7
- package/dist/router/virtual-router/token-counter.js +0 -9
- package/dist/router/virtual-router/types.d.ts +9 -7
- package/dist/servertool/clock/config.js +23 -51
- package/dist/servertool/clock/io.js +1 -0
- package/dist/servertool/clock/session-scope.d.ts +2 -2
- package/dist/servertool/clock/session-scope.js +5 -47
- package/dist/servertool/engine.d.ts +9 -0
- package/dist/servertool/engine.js +196 -79
- package/dist/servertool/handlers/antigravity-thought-signature-bootstrap.js +2 -2
- package/dist/servertool/handlers/clock.js +1 -1
- package/dist/servertool/handlers/continue-execution.js +8 -4
- package/dist/servertool/handlers/followup-request-builder.js +18 -1
- package/dist/servertool/handlers/gemini-empty-reply-continue.js +7 -1
- package/dist/servertool/handlers/review.js +180 -0
- package/dist/servertool/handlers/stop-message-auto/blocked-report.js +59 -1
- package/dist/servertool/handlers/stop-message-auto/iflow-followup.d.ts +23 -2
- package/dist/servertool/handlers/stop-message-auto/iflow-followup.js +397 -89
- package/dist/servertool/handlers/stop-message-auto/routing-state.d.ts +5 -15
- package/dist/servertool/handlers/stop-message-auto/routing-state.js +29 -55
- package/dist/servertool/handlers/stop-message-auto/runtime-utils.d.ts +6 -0
- package/dist/servertool/handlers/stop-message-auto/runtime-utils.js +35 -61
- package/dist/servertool/handlers/stop-message-auto.js +392 -76
- package/dist/servertool/server-side-tools.d.ts +1 -0
- package/dist/servertool/server-side-tools.js +90 -52
- package/dist/servertool/types.d.ts +17 -0
- package/dist/tools/apply-patch/patch-text/normalize.js +11 -0
- package/dist/tools/exec-command/validator.d.ts +4 -1
- package/dist/tools/exec-command/validator.js +87 -3
- package/dist/tools/tool-registry.d.ts +7 -1
- package/dist/tools/tool-registry.js +3 -2
- package/package.json +115 -7
- package/dist/servertool/handlers/stop-message-stage-policy/bd-runtime.d.ts +0 -18
- package/dist/servertool/handlers/stop-message-stage-policy/bd-runtime.js +0 -398
- package/dist/servertool/handlers/stop-message-stage-policy/decision.d.ts +0 -9
- package/dist/servertool/handlers/stop-message-stage-policy/decision.js +0 -127
- package/dist/servertool/handlers/stop-message-stage-policy/observation.d.ts +0 -2
- package/dist/servertool/handlers/stop-message-stage-policy/observation.js +0 -179
- package/dist/servertool/handlers/stop-message-stage-policy/templates.d.ts +0 -4
- package/dist/servertool/handlers/stop-message-stage-policy/templates.js +0 -96
- package/dist/servertool/handlers/stop-message-stage-policy/text-utils.d.ts +0 -9
- package/dist/servertool/handlers/stop-message-stage-policy/text-utils.js +0 -89
- package/dist/servertool/handlers/stop-message-stage-policy/types.d.ts +0 -59
- package/dist/servertool/handlers/stop-message-stage-policy.d.ts +0 -3
- package/dist/servertool/handlers/stop-message-stage-policy.js +0 -2
- /package/dist/servertool/handlers/{stop-message-stage-policy/types.js → review.d.ts} +0 -0
|
@@ -0,0 +1,27 @@
|
|
|
1
|
+
import type { ContextAdvisorResult } from '../context-advisor.js';
|
|
2
|
+
import { type ResolvedContextWeightedConfig } from '../context-weighted.js';
|
|
3
|
+
import { type ResolvedHealthWeightedConfig } from '../health-weighted.js';
|
|
4
|
+
import type { RoutePoolTier } from '../types.js';
|
|
5
|
+
import type { SelectionDeps, TrySelectFromTierOptions } from './selection-deps.js';
|
|
6
|
+
export declare function selectProviderKeyWithQuotaBuckets(opts: {
|
|
7
|
+
routeName: string;
|
|
8
|
+
tier: RoutePoolTier;
|
|
9
|
+
stickyKey: string | undefined;
|
|
10
|
+
candidates: string[];
|
|
11
|
+
isSafePool: boolean;
|
|
12
|
+
deps: SelectionDeps;
|
|
13
|
+
options: TrySelectFromTierOptions;
|
|
14
|
+
contextResult: ContextAdvisorResult;
|
|
15
|
+
warnRatio: number;
|
|
16
|
+
excludedKeys: Set<string>;
|
|
17
|
+
isRecoveryAttempt: boolean;
|
|
18
|
+
now: number;
|
|
19
|
+
nowForWeights: number;
|
|
20
|
+
healthWeightedCfg: ResolvedHealthWeightedConfig;
|
|
21
|
+
contextWeightedCfg: ResolvedContextWeightedConfig;
|
|
22
|
+
quotaView: NonNullable<SelectionDeps['quotaView']>;
|
|
23
|
+
isAvailable: (key: string) => boolean;
|
|
24
|
+
selectFirstAvailable: (keys: string[]) => string | null;
|
|
25
|
+
applyAliasStickyQueuePinning: (candidates: string[]) => string[];
|
|
26
|
+
preferAntigravityAliasesOnRetry: (candidates: string[]) => string[];
|
|
27
|
+
}): string | null;
|
|
@@ -0,0 +1,116 @@
|
|
|
1
|
+
import { computeContextMultiplier } from '../context-weighted.js';
|
|
2
|
+
import { computeHealthWeight } from '../health-weighted.js';
|
|
3
|
+
import { buildQuotaBuckets } from './native-router-hotpath.js';
|
|
4
|
+
import { computeContextWeightMultipliers } from './context-weight-multipliers.js';
|
|
5
|
+
import { pickPriorityGroup } from './tier-priority.js';
|
|
6
|
+
export function selectProviderKeyWithQuotaBuckets(opts) {
|
|
7
|
+
const { routeName, tier, stickyKey, candidates, isSafePool, deps, options, contextResult, warnRatio, isRecoveryAttempt, now, nowForWeights, healthWeightedCfg, contextWeightedCfg, quotaView, isAvailable, selectFirstAvailable, applyAliasStickyQueuePinning, preferAntigravityAliasesOnRetry } = opts;
|
|
8
|
+
const bucketInputs = candidates.map((key, order) => {
|
|
9
|
+
const entry = quotaView(key);
|
|
10
|
+
const penaltyRaw = entry?.selectionPenalty;
|
|
11
|
+
return {
|
|
12
|
+
key,
|
|
13
|
+
order,
|
|
14
|
+
hasQuota: Boolean(entry),
|
|
15
|
+
inPool: entry ? entry.inPool !== false : true,
|
|
16
|
+
...(entry && typeof entry.cooldownUntil === 'number' ? { cooldownUntil: entry.cooldownUntil } : {}),
|
|
17
|
+
...(entry && typeof entry.blacklistUntil === 'number' ? { blacklistUntil: entry.blacklistUntil } : {}),
|
|
18
|
+
...(entry && typeof entry.priorityTier === 'number' ? { priorityTier: entry.priorityTier } : {}),
|
|
19
|
+
...(typeof penaltyRaw === 'number' ? { selectionPenalty: penaltyRaw } : {})
|
|
20
|
+
};
|
|
21
|
+
});
|
|
22
|
+
const { priorities: sortedPriorities, buckets } = buildQuotaBuckets(bucketInputs, now);
|
|
23
|
+
for (const priority of sortedPriorities) {
|
|
24
|
+
const bucket = buckets.get(priority) ?? [];
|
|
25
|
+
if (!bucket.length) {
|
|
26
|
+
continue;
|
|
27
|
+
}
|
|
28
|
+
bucket.sort((a, b) => a.order - b.order);
|
|
29
|
+
let bucketCandidates = bucket.map((item) => item.key);
|
|
30
|
+
if (bucketCandidates.length === 1) {
|
|
31
|
+
return bucketCandidates[0] ?? null;
|
|
32
|
+
}
|
|
33
|
+
if (isRecoveryAttempt) {
|
|
34
|
+
bucketCandidates = preferAntigravityAliasesOnRetry(bucketCandidates);
|
|
35
|
+
}
|
|
36
|
+
bucketCandidates = applyAliasStickyQueuePinning(bucketCandidates);
|
|
37
|
+
const bucketWeights = {};
|
|
38
|
+
for (const item of bucket) {
|
|
39
|
+
if (healthWeightedCfg.enabled) {
|
|
40
|
+
const entry = quotaView(item.key);
|
|
41
|
+
const { weight } = computeHealthWeight(entry, nowForWeights, healthWeightedCfg);
|
|
42
|
+
bucketWeights[item.key] = weight;
|
|
43
|
+
}
|
|
44
|
+
else {
|
|
45
|
+
bucketWeights[item.key] = Math.max(1, Math.floor(100 / (1 + Math.max(0, item.penalty))));
|
|
46
|
+
}
|
|
47
|
+
}
|
|
48
|
+
if (isSafePool && contextWeightedCfg.enabled) {
|
|
49
|
+
const ctx = computeContextWeightMultipliers({
|
|
50
|
+
candidates: bucketCandidates,
|
|
51
|
+
usage: contextResult.usage,
|
|
52
|
+
warnRatio,
|
|
53
|
+
cfg: contextWeightedCfg
|
|
54
|
+
});
|
|
55
|
+
if (ctx) {
|
|
56
|
+
for (const key of bucketCandidates) {
|
|
57
|
+
const m = computeContextMultiplier({
|
|
58
|
+
effectiveSafeRefTokens: ctx.ref,
|
|
59
|
+
effectiveSafeTokens: ctx.eff[key] ?? 1,
|
|
60
|
+
cfg: contextWeightedCfg
|
|
61
|
+
});
|
|
62
|
+
bucketWeights[key] = Math.max(1, Math.round((bucketWeights[key] ?? 1) * m));
|
|
63
|
+
}
|
|
64
|
+
}
|
|
65
|
+
}
|
|
66
|
+
if (tier.mode === 'priority') {
|
|
67
|
+
if (!isRecoveryAttempt) {
|
|
68
|
+
const group = pickPriorityGroup({
|
|
69
|
+
candidates: bucketCandidates,
|
|
70
|
+
orderedTargets: tier.targets,
|
|
71
|
+
providerRegistry: deps.providerRegistry,
|
|
72
|
+
availabilityCheck: isAvailable
|
|
73
|
+
});
|
|
74
|
+
if (!group) {
|
|
75
|
+
continue;
|
|
76
|
+
}
|
|
77
|
+
const groupWeights = {};
|
|
78
|
+
for (const key of group.groupCandidates) {
|
|
79
|
+
groupWeights[key] = bucketWeights[key] ?? 1;
|
|
80
|
+
}
|
|
81
|
+
const selected = deps.loadBalancer.select({
|
|
82
|
+
routeName: `${routeName}:${tier.id}:priority:${priority}:group:${group.groupId}`,
|
|
83
|
+
candidates: group.groupCandidates,
|
|
84
|
+
stickyKey: options.allowAliasRotation ? undefined : stickyKey,
|
|
85
|
+
weights: groupWeights,
|
|
86
|
+
availabilityCheck: isAvailable
|
|
87
|
+
}, 'round-robin');
|
|
88
|
+
if (selected) {
|
|
89
|
+
return selected;
|
|
90
|
+
}
|
|
91
|
+
continue;
|
|
92
|
+
}
|
|
93
|
+
const recovered = selectFirstAvailable(bucketCandidates);
|
|
94
|
+
if (recovered)
|
|
95
|
+
return recovered;
|
|
96
|
+
continue;
|
|
97
|
+
}
|
|
98
|
+
if (isRecoveryAttempt) {
|
|
99
|
+
const recovered = selectFirstAvailable(bucketCandidates);
|
|
100
|
+
if (recovered)
|
|
101
|
+
return recovered;
|
|
102
|
+
continue;
|
|
103
|
+
}
|
|
104
|
+
const selected = deps.loadBalancer.select({
|
|
105
|
+
routeName: `${routeName}:${tier.id}`,
|
|
106
|
+
candidates: bucketCandidates,
|
|
107
|
+
stickyKey: options.allowAliasRotation ? undefined : stickyKey,
|
|
108
|
+
weights: bucketWeights,
|
|
109
|
+
availabilityCheck: isAvailable
|
|
110
|
+
}, tier.mode === 'round-robin' ? 'round-robin' : undefined);
|
|
111
|
+
if (selected) {
|
|
112
|
+
return selected;
|
|
113
|
+
}
|
|
114
|
+
}
|
|
115
|
+
return null;
|
|
116
|
+
}
|
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
import type { ContextAdvisorResult } from '../context-advisor.js';
|
|
2
|
-
import {
|
|
2
|
+
import type { ResolvedHealthWeightedConfig } from '../health-weighted.js';
|
|
3
3
|
import type { RoutePoolTier } from '../types.js';
|
|
4
4
|
import type { ResolvedContextWeightedConfig } from '../context-weighted.js';
|
|
5
5
|
import type { SelectionDeps, TrySelectFromTierOptions } from './selection-deps.js';
|
|
@@ -1,9 +1,9 @@
|
|
|
1
1
|
import { computeContextMultiplier } from '../context-weighted.js';
|
|
2
|
-
import { computeHealthWeight } from '../health-weighted.js';
|
|
3
2
|
import { pinCandidatesByAliasQueue, resolveAliasSelectionStrategy } from './alias-selection.js';
|
|
4
3
|
import { computeContextWeightMultipliers } from './context-weight-multipliers.js';
|
|
5
4
|
import { extractKeyAlias, extractProviderId, getProviderModelId } from './key-parsing.js';
|
|
6
5
|
import { pickPriorityGroup } from './tier-priority.js';
|
|
6
|
+
import { selectProviderKeyWithQuotaBuckets } from './tier-selection-quota-integration.js';
|
|
7
7
|
function applyAliasStickyQueuePinning(opts) {
|
|
8
8
|
const { candidates, orderedTargets, deps, excludedKeys } = opts;
|
|
9
9
|
if (!Array.isArray(candidates) || candidates.length < 2) {
|
|
@@ -250,135 +250,35 @@ export function selectProviderKeyFromCandidatePool(opts) {
|
|
|
250
250
|
availabilityCheck: isAvailable
|
|
251
251
|
}, tier.mode === 'round-robin' ? 'round-robin' : undefined);
|
|
252
252
|
}
|
|
253
|
-
|
|
254
|
-
|
|
255
|
-
|
|
256
|
-
|
|
257
|
-
|
|
258
|
-
|
|
259
|
-
|
|
260
|
-
|
|
261
|
-
|
|
262
|
-
|
|
263
|
-
|
|
264
|
-
|
|
265
|
-
|
|
266
|
-
|
|
267
|
-
|
|
268
|
-
|
|
269
|
-
|
|
270
|
-
|
|
271
|
-
|
|
272
|
-
|
|
273
|
-
|
|
274
|
-
const penalty = typeof penaltyRaw === 'number' && Number.isFinite(penaltyRaw) && penaltyRaw > 0 ? Math.floor(penaltyRaw) : 0;
|
|
275
|
-
const list = buckets.get(tierPriority) ?? [];
|
|
276
|
-
list.push({ key, penalty, order: order++ });
|
|
277
|
-
buckets.set(tierPriority, list);
|
|
278
|
-
}
|
|
279
|
-
const sortedPriorities = Array.from(buckets.keys()).sort((a, b) => a - b);
|
|
280
|
-
for (const priority of sortedPriorities) {
|
|
281
|
-
const bucket = buckets.get(priority) ?? [];
|
|
282
|
-
if (!bucket.length) {
|
|
283
|
-
continue;
|
|
284
|
-
}
|
|
285
|
-
// Keep candidate ordering stable (config order). Availability/blacklist/cooldown still apply.
|
|
286
|
-
bucket.sort((a, b) => a.order - b.order);
|
|
287
|
-
let bucketCandidates = bucket.map((item) => item.key);
|
|
288
|
-
// Single-provider pool should never be "emptied" by health/cooldown.
|
|
289
|
-
if (bucketCandidates.length === 1) {
|
|
290
|
-
return bucketCandidates[0] ?? null;
|
|
291
|
-
}
|
|
292
|
-
if (isRecoveryAttempt) {
|
|
293
|
-
bucketCandidates = preferAntigravityAliasesOnRetry({ candidates: bucketCandidates, excludedKeys, deps });
|
|
294
|
-
}
|
|
295
|
-
// Alias-level selection strategy (config-driven).
|
|
296
|
-
// For configured providers, we stick to one alias globally and rotate only on error/unavailability.
|
|
297
|
-
bucketCandidates = applyAliasStickyQueuePinning({
|
|
298
|
-
candidates: bucketCandidates,
|
|
253
|
+
return selectProviderKeyWithQuotaBuckets({
|
|
254
|
+
routeName,
|
|
255
|
+
tier,
|
|
256
|
+
stickyKey,
|
|
257
|
+
candidates,
|
|
258
|
+
isSafePool,
|
|
259
|
+
deps,
|
|
260
|
+
options,
|
|
261
|
+
contextResult,
|
|
262
|
+
warnRatio,
|
|
263
|
+
excludedKeys,
|
|
264
|
+
isRecoveryAttempt,
|
|
265
|
+
now,
|
|
266
|
+
nowForWeights,
|
|
267
|
+
healthWeightedCfg,
|
|
268
|
+
contextWeightedCfg,
|
|
269
|
+
quotaView,
|
|
270
|
+
isAvailable,
|
|
271
|
+
selectFirstAvailable,
|
|
272
|
+
applyAliasStickyQueuePinning: (quotaCandidates) => applyAliasStickyQueuePinning({
|
|
273
|
+
candidates: quotaCandidates,
|
|
299
274
|
orderedTargets: tier.targets,
|
|
300
275
|
deps,
|
|
301
276
|
excludedKeys
|
|
302
|
-
})
|
|
303
|
-
|
|
304
|
-
|
|
305
|
-
|
|
306
|
-
|
|
307
|
-
|
|
308
|
-
|
|
309
|
-
bucketWeights[item.key] = weight;
|
|
310
|
-
bucketMultipliers[item.key] = multiplier;
|
|
311
|
-
}
|
|
312
|
-
else {
|
|
313
|
-
// Legacy: penalty => lower weight, but never zero (unhealthy should still get a chance).
|
|
314
|
-
bucketWeights[item.key] = Math.max(1, Math.floor(100 / (1 + Math.max(0, item.penalty))));
|
|
315
|
-
bucketMultipliers[item.key] = 1;
|
|
316
|
-
}
|
|
317
|
-
}
|
|
318
|
-
if (isSafePool && contextWeightedCfg.enabled) {
|
|
319
|
-
const ctx = computeContextWeightMultipliers({ candidates: bucketCandidates, usage: contextResult.usage, warnRatio, cfg: contextWeightedCfg });
|
|
320
|
-
if (ctx) {
|
|
321
|
-
for (const key of bucketCandidates) {
|
|
322
|
-
const m = computeContextMultiplier({
|
|
323
|
-
effectiveSafeRefTokens: ctx.ref,
|
|
324
|
-
effectiveSafeTokens: ctx.eff[key] ?? 1,
|
|
325
|
-
cfg: contextWeightedCfg
|
|
326
|
-
});
|
|
327
|
-
bucketWeights[key] = Math.max(1, Math.round((bucketWeights[key] ?? 1) * m));
|
|
328
|
-
}
|
|
329
|
-
}
|
|
330
|
-
}
|
|
331
|
-
if (tier.mode === 'priority') {
|
|
332
|
-
if (!isRecoveryAttempt) {
|
|
333
|
-
const group = pickPriorityGroup({
|
|
334
|
-
candidates: bucketCandidates,
|
|
335
|
-
orderedTargets: tier.targets,
|
|
336
|
-
providerRegistry: deps.providerRegistry,
|
|
337
|
-
availabilityCheck: isAvailable
|
|
338
|
-
});
|
|
339
|
-
if (!group) {
|
|
340
|
-
continue;
|
|
341
|
-
}
|
|
342
|
-
const groupWeights = {};
|
|
343
|
-
for (const key of group.groupCandidates) {
|
|
344
|
-
groupWeights[key] = bucketWeights[key] ?? 1;
|
|
345
|
-
}
|
|
346
|
-
const selected = deps.loadBalancer.select({
|
|
347
|
-
routeName: `${routeName}:${tier.id}:priority:${priority}:group:${group.groupId}`,
|
|
348
|
-
candidates: group.groupCandidates,
|
|
349
|
-
stickyKey: options.allowAliasRotation ? undefined : stickyKey,
|
|
350
|
-
weights: groupWeights,
|
|
351
|
-
availabilityCheck: isAvailable
|
|
352
|
-
}, 'round-robin');
|
|
353
|
-
if (selected) {
|
|
354
|
-
return selected;
|
|
355
|
-
}
|
|
356
|
-
continue;
|
|
357
|
-
}
|
|
358
|
-
const recovered = selectFirstAvailable(bucketCandidates);
|
|
359
|
-
if (recovered)
|
|
360
|
-
return recovered;
|
|
361
|
-
continue;
|
|
362
|
-
// (unreachable) recovery handled above
|
|
363
|
-
}
|
|
364
|
-
else {
|
|
365
|
-
if (isRecoveryAttempt) {
|
|
366
|
-
const recovered = selectFirstAvailable(bucketCandidates);
|
|
367
|
-
if (recovered)
|
|
368
|
-
return recovered;
|
|
369
|
-
continue;
|
|
370
|
-
}
|
|
371
|
-
const selected = deps.loadBalancer.select({
|
|
372
|
-
routeName: `${routeName}:${tier.id}`,
|
|
373
|
-
candidates: bucketCandidates,
|
|
374
|
-
stickyKey: options.allowAliasRotation ? undefined : stickyKey,
|
|
375
|
-
weights: bucketWeights,
|
|
376
|
-
availabilityCheck: isAvailable
|
|
377
|
-
}, tier.mode === 'round-robin' ? 'round-robin' : undefined);
|
|
378
|
-
if (selected) {
|
|
379
|
-
return selected;
|
|
380
|
-
}
|
|
381
|
-
}
|
|
382
|
-
}
|
|
383
|
-
return null;
|
|
277
|
+
}),
|
|
278
|
+
preferAntigravityAliasesOnRetry: (quotaCandidates) => preferAntigravityAliasesOnRetry({
|
|
279
|
+
candidates: quotaCandidates,
|
|
280
|
+
excludedKeys,
|
|
281
|
+
deps
|
|
282
|
+
})
|
|
283
|
+
});
|
|
384
284
|
}
|
|
@@ -5,271 +5,8 @@ import { pinCandidatesByAliasQueue, resolveAliasSelectionStrategy } from './alia
|
|
|
5
5
|
import { extractKeyAlias, extractKeyIndex, extractProviderId, getProviderModelId } from './key-parsing.js';
|
|
6
6
|
import { providerSupportsMultimodalRequest } from './multimodal-capability.js';
|
|
7
7
|
import { selectProviderKeyFromCandidatePool } from './tier-selection-select.js';
|
|
8
|
-
import {
|
|
9
|
-
|
|
10
|
-
function isAntigravityGeminiModelKey(providerKey, deps) {
|
|
11
|
-
if ((extractProviderId(providerKey) ?? '') !== 'antigravity') {
|
|
12
|
-
return false;
|
|
13
|
-
}
|
|
14
|
-
const modelId = getProviderModelId(providerKey, deps.providerRegistry) ?? '';
|
|
15
|
-
return modelId.trim().toLowerCase().startsWith('gemini-');
|
|
16
|
-
}
|
|
17
|
-
function extractAntigravityRuntimeBase(providerKey) {
|
|
18
|
-
const value = typeof providerKey === 'string' ? providerKey.trim() : '';
|
|
19
|
-
if (!value)
|
|
20
|
-
return null;
|
|
21
|
-
const firstDot = value.indexOf('.');
|
|
22
|
-
if (firstDot <= 0 || firstDot === value.length - 1)
|
|
23
|
-
return null;
|
|
24
|
-
const secondDot = value.indexOf('.', firstDot + 1);
|
|
25
|
-
if (secondDot <= firstDot + 1)
|
|
26
|
-
return null;
|
|
27
|
-
const providerId = value.slice(0, firstDot);
|
|
28
|
-
const alias = value.slice(firstDot + 1, secondDot);
|
|
29
|
-
if (!providerId || !alias)
|
|
30
|
-
return null;
|
|
31
|
-
return `${providerId}.${alias}`;
|
|
32
|
-
}
|
|
33
|
-
function buildAntigravityLeaseRuntimeKey(runtimeBase) {
|
|
34
|
-
return `${runtimeBase}::gemini`;
|
|
35
|
-
}
|
|
36
|
-
function shouldAvoidAllAntigravityOnRetry(metadata) {
|
|
37
|
-
if (!metadata || typeof metadata !== 'object') {
|
|
38
|
-
return false;
|
|
39
|
-
}
|
|
40
|
-
const rtRaw = metadata.__rt;
|
|
41
|
-
if (!rtRaw || typeof rtRaw !== 'object' || Array.isArray(rtRaw)) {
|
|
42
|
-
return false;
|
|
43
|
-
}
|
|
44
|
-
const rt = rtRaw;
|
|
45
|
-
return rt.antigravityAvoidAllOnRetry === true;
|
|
46
|
-
}
|
|
47
|
-
function isAntigravityGeminiSessionBindingDisabled(metadata) {
|
|
48
|
-
if (!metadata || typeof metadata !== 'object') {
|
|
49
|
-
return false;
|
|
50
|
-
}
|
|
51
|
-
const rtRaw = metadata.__rt;
|
|
52
|
-
if (!rtRaw || typeof rtRaw !== 'object' || Array.isArray(rtRaw)) {
|
|
53
|
-
return false;
|
|
54
|
-
}
|
|
55
|
-
const rt = rtRaw;
|
|
56
|
-
if (rt.disableAntigravitySessionBinding === true) {
|
|
57
|
-
return true;
|
|
58
|
-
}
|
|
59
|
-
const mode = rt.antigravitySessionBinding;
|
|
60
|
-
if (mode === false) {
|
|
61
|
-
return true;
|
|
62
|
-
}
|
|
63
|
-
if (typeof mode === 'string' && ['0', 'false', 'off', 'disabled', 'none'].includes(mode.trim().toLowerCase())) {
|
|
64
|
-
return true;
|
|
65
|
-
}
|
|
66
|
-
return false;
|
|
67
|
-
}
|
|
68
|
-
function shouldAvoidAntigravityAfterRepeatedError(metadata) {
|
|
69
|
-
if (!metadata || typeof metadata !== 'object') {
|
|
70
|
-
return false;
|
|
71
|
-
}
|
|
72
|
-
const rtRaw = metadata.__rt;
|
|
73
|
-
if (!rtRaw || typeof rtRaw !== 'object' || Array.isArray(rtRaw)) {
|
|
74
|
-
return false;
|
|
75
|
-
}
|
|
76
|
-
const rt = rtRaw;
|
|
77
|
-
if (rt.antigravityAvoidAllOnRetry === true) {
|
|
78
|
-
return true;
|
|
79
|
-
}
|
|
80
|
-
const signature = typeof rt.antigravityRetryErrorSignature === 'string' ? rt.antigravityRetryErrorSignature.trim() : '';
|
|
81
|
-
const consecutive = typeof rt.antigravityRetryErrorConsecutive === 'number' && Number.isFinite(rt.antigravityRetryErrorConsecutive)
|
|
82
|
-
? Math.max(0, Math.floor(rt.antigravityRetryErrorConsecutive))
|
|
83
|
-
: 0;
|
|
84
|
-
return signature.length > 0 && signature !== 'unknown' && consecutive >= 2;
|
|
85
|
-
}
|
|
86
|
-
function preferNonAntigravityWhenPossible(candidates) {
|
|
87
|
-
if (!Array.isArray(candidates) || candidates.length < 2) {
|
|
88
|
-
return candidates;
|
|
89
|
-
}
|
|
90
|
-
const nonAntigravity = candidates.filter((key) => (extractProviderId(key) ?? '') !== 'antigravity');
|
|
91
|
-
return nonAntigravity.length > 0 ? nonAntigravity : candidates;
|
|
92
|
-
}
|
|
93
|
-
function extractNonAntigravityTargets(targets) {
|
|
94
|
-
if (!Array.isArray(targets) || targets.length === 0) {
|
|
95
|
-
return [];
|
|
96
|
-
}
|
|
97
|
-
return targets.filter((key) => (extractProviderId(key) ?? '') !== 'antigravity');
|
|
98
|
-
}
|
|
99
|
-
function resolveSessionScopeKey(metadata) {
|
|
100
|
-
if (!metadata || typeof metadata !== 'object') {
|
|
101
|
-
return null;
|
|
102
|
-
}
|
|
103
|
-
const record = metadata;
|
|
104
|
-
const sessionId = typeof record.sessionId === 'string' ? record.sessionId.trim() : '';
|
|
105
|
-
if (sessionId) {
|
|
106
|
-
return `session:${sessionId}`;
|
|
107
|
-
}
|
|
108
|
-
const conversationId = typeof record.conversationId === 'string' ? record.conversationId.trim() : '';
|
|
109
|
-
if (conversationId) {
|
|
110
|
-
return `conversation:${conversationId}`;
|
|
111
|
-
}
|
|
112
|
-
// Antigravity-Manager alignment: when the client does not provide session_id/conversation_id,
|
|
113
|
-
// fall back to the derived antigravitySessionId so alias/session binding still works.
|
|
114
|
-
const antigravitySessionId = typeof record.antigravitySessionId === 'string'
|
|
115
|
-
? String(record.antigravitySessionId).trim()
|
|
116
|
-
: '';
|
|
117
|
-
if (antigravitySessionId) {
|
|
118
|
-
return `session:${antigravitySessionId}`;
|
|
119
|
-
}
|
|
120
|
-
return null;
|
|
121
|
-
}
|
|
122
|
-
function buildScopedSessionKey(sessionKey) {
|
|
123
|
-
// Policy: antigravity alias/session binding applies only to Gemini models.
|
|
124
|
-
return `${sessionKey}::gemini`;
|
|
125
|
-
}
|
|
126
|
-
function extractLeaseRuntimeKey(providerKey, deps) {
|
|
127
|
-
const base = extractAntigravityRuntimeBase(providerKey);
|
|
128
|
-
if (!base)
|
|
129
|
-
return null;
|
|
130
|
-
if ((extractProviderId(providerKey) ?? '') !== 'antigravity')
|
|
131
|
-
return base;
|
|
132
|
-
if (!isAntigravityGeminiModelKey(providerKey, deps)) {
|
|
133
|
-
return null;
|
|
134
|
-
}
|
|
135
|
-
return buildAntigravityLeaseRuntimeKey(base);
|
|
136
|
-
}
|
|
137
|
-
function applyAntigravityAliasSessionLeases(targets, deps, metadata) {
|
|
138
|
-
if (!Array.isArray(targets) || targets.length === 0) {
|
|
139
|
-
return { targets, blocked: 0, preferredPinned: false, pinnedStrict: false };
|
|
140
|
-
}
|
|
141
|
-
if (isAntigravityGeminiSessionBindingDisabled(metadata)) {
|
|
142
|
-
return { targets, blocked: 0, preferredPinned: false, pinnedStrict: false };
|
|
143
|
-
}
|
|
144
|
-
const leaseStore = deps.antigravityAliasLeaseStore;
|
|
145
|
-
const sessionAliasStore = deps.antigravitySessionAliasStore;
|
|
146
|
-
if (!leaseStore || !sessionAliasStore) {
|
|
147
|
-
return { targets, blocked: 0, preferredPinned: false, pinnedStrict: false };
|
|
148
|
-
}
|
|
149
|
-
const sessionKey = resolveSessionScopeKey(metadata);
|
|
150
|
-
if (!sessionKey) {
|
|
151
|
-
return { targets, blocked: 0, preferredPinned: false, pinnedStrict: false };
|
|
152
|
-
}
|
|
153
|
-
const cooldownMs = typeof deps.antigravityAliasReuseCooldownMs === 'number' && Number.isFinite(deps.antigravityAliasReuseCooldownMs)
|
|
154
|
-
? Math.max(0, Math.floor(deps.antigravityAliasReuseCooldownMs))
|
|
155
|
-
: DEFAULT_ANTIGRAVITY_ALIAS_SESSION_COOLDOWN_MS;
|
|
156
|
-
const now = Date.now();
|
|
157
|
-
const bindingModeRaw = deps.loadBalancer.getPolicy().aliasSelection
|
|
158
|
-
?.antigravitySessionBinding;
|
|
159
|
-
const strictRequested = typeof bindingModeRaw === 'string' && bindingModeRaw.trim().toLowerCase() === 'strict';
|
|
160
|
-
const agSessionId = metadata && typeof metadata === 'object' && typeof metadata.antigravitySessionId === 'string'
|
|
161
|
-
? String(metadata.antigravitySessionId).trim()
|
|
162
|
-
: '';
|
|
163
|
-
const hasAntigravityGeminiTargets = targets.some((key) => isAntigravityGeminiModelKey(key, deps));
|
|
164
|
-
let pinnedRuntimeKey = strictRequested && agSessionId && hasAntigravityGeminiTargets
|
|
165
|
-
? lookupAntigravityPinnedAliasForSessionId(agSessionId, { hydrate: true })
|
|
166
|
-
: undefined;
|
|
167
|
-
const pinnedLeaseKey = pinnedRuntimeKey ? buildAntigravityLeaseRuntimeKey(pinnedRuntimeKey) : undefined;
|
|
168
|
-
// If the pinned alias is completely out of pool (quota exhausted), release the pin so we can rotate.
|
|
169
|
-
if (pinnedRuntimeKey && deps.quotaView && agSessionId) {
|
|
170
|
-
const pinnedKeys = targets.filter((key) => isAntigravityGeminiModelKey(key, deps) && extractLeaseRuntimeKey(key, deps) === pinnedLeaseKey);
|
|
171
|
-
if (pinnedKeys.length > 0) {
|
|
172
|
-
const allOutOfPool = pinnedKeys.every((key) => deps.quotaView?.(key)?.inPool === false);
|
|
173
|
-
if (allOutOfPool) {
|
|
174
|
-
const releasedRuntimeKey = pinnedRuntimeKey;
|
|
175
|
-
unpinAntigravitySessionAliasForSessionId(agSessionId);
|
|
176
|
-
pinnedRuntimeKey = undefined;
|
|
177
|
-
sessionAliasStore.delete(buildScopedSessionKey(sessionKey));
|
|
178
|
-
try {
|
|
179
|
-
const raw = String(process.env.ROUTECODEX_STAGE_LOG || process.env.RCC_STAGE_LOG || '').trim().toLowerCase();
|
|
180
|
-
const enabled = raw !== '' && raw !== '0' && raw !== 'false' && raw !== 'no';
|
|
181
|
-
if (enabled) {
|
|
182
|
-
console.log('[virtual-router][antigravity-session-binding] unpin', JSON.stringify({ agSessionId, runtimeKey: releasedRuntimeKey }));
|
|
183
|
-
}
|
|
184
|
-
}
|
|
185
|
-
catch {
|
|
186
|
-
// ignore
|
|
187
|
-
}
|
|
188
|
-
}
|
|
189
|
-
}
|
|
190
|
-
}
|
|
191
|
-
const strictBinding = strictRequested && Boolean(pinnedLeaseKey);
|
|
192
|
-
const geminiSessionKey = buildScopedSessionKey(sessionKey);
|
|
193
|
-
let preferredGeminiRuntimeKey = pinnedLeaseKey || sessionAliasStore.get(geminiSessionKey);
|
|
194
|
-
if (preferredGeminiRuntimeKey && !preferredGeminiRuntimeKey.includes('::')) {
|
|
195
|
-
preferredGeminiRuntimeKey = buildAntigravityLeaseRuntimeKey(preferredGeminiRuntimeKey);
|
|
196
|
-
}
|
|
197
|
-
if (preferredGeminiRuntimeKey && !pinnedLeaseKey) {
|
|
198
|
-
const lease = leaseStore.get(preferredGeminiRuntimeKey);
|
|
199
|
-
if (lease && lease.sessionKey !== geminiSessionKey && now - lease.lastSeenAt < cooldownMs) {
|
|
200
|
-
preferredGeminiRuntimeKey = undefined;
|
|
201
|
-
}
|
|
202
|
-
}
|
|
203
|
-
// If a previously bound alias is completely out of pool (quota exhausted / blacklisted),
|
|
204
|
-
// release the binding so the session can rebind to a different alias on the next successful call.
|
|
205
|
-
if (deps.quotaView && !pinnedLeaseKey && preferredGeminiRuntimeKey) {
|
|
206
|
-
const pinnedKeys = targets.filter((key) => isAntigravityGeminiModelKey(key, deps) && extractLeaseRuntimeKey(key, deps) === preferredGeminiRuntimeKey);
|
|
207
|
-
if (pinnedKeys.length > 0) {
|
|
208
|
-
const allOutOfPool = pinnedKeys.every((key) => deps.quotaView?.(key)?.inPool === false);
|
|
209
|
-
if (allOutOfPool) {
|
|
210
|
-
const releasedRuntimeKey = preferredGeminiRuntimeKey;
|
|
211
|
-
sessionAliasStore.delete(geminiSessionKey);
|
|
212
|
-
preferredGeminiRuntimeKey = undefined;
|
|
213
|
-
try {
|
|
214
|
-
const raw = String(process.env.ROUTECODEX_STAGE_LOG || process.env.RCC_STAGE_LOG || '').trim().toLowerCase();
|
|
215
|
-
const enabled = raw !== '' && raw !== '0' && raw !== 'false' && raw !== 'no';
|
|
216
|
-
if (enabled) {
|
|
217
|
-
console.log('[virtual-router][antigravity-session-binding] release', JSON.stringify({ sessionKey: geminiSessionKey, runtimeKey: releasedRuntimeKey }));
|
|
218
|
-
}
|
|
219
|
-
}
|
|
220
|
-
catch {
|
|
221
|
-
// ignore
|
|
222
|
-
}
|
|
223
|
-
}
|
|
224
|
-
}
|
|
225
|
-
}
|
|
226
|
-
const pinnedGemini = preferredGeminiRuntimeKey
|
|
227
|
-
? targets.filter((key) => isAntigravityGeminiModelKey(key, deps) && extractLeaseRuntimeKey(key, deps) === preferredGeminiRuntimeKey)
|
|
228
|
-
: [];
|
|
229
|
-
const preferredPinned = pinnedGemini.length > 0;
|
|
230
|
-
const pinnedSet = preferredPinned ? new Set([...pinnedGemini]) : null;
|
|
231
|
-
const candidates = preferredPinned
|
|
232
|
-
? [...pinnedGemini, ...targets.filter((key) => !pinnedSet.has(key))]
|
|
233
|
-
: targets;
|
|
234
|
-
const pinnedStrict = strictBinding && Boolean(preferredGeminiRuntimeKey);
|
|
235
|
-
let blocked = 0;
|
|
236
|
-
const filtered = candidates.filter((key) => {
|
|
237
|
-
const providerId = extractProviderId(key);
|
|
238
|
-
if (providerId !== 'antigravity') {
|
|
239
|
-
return true;
|
|
240
|
-
}
|
|
241
|
-
// Policy: antigravity alias/session binding applies only to Gemini models.
|
|
242
|
-
if (!isAntigravityGeminiModelKey(key, deps)) {
|
|
243
|
-
return true;
|
|
244
|
-
}
|
|
245
|
-
const scopedSessionKey = geminiSessionKey;
|
|
246
|
-
const runtimeKey = extractLeaseRuntimeKey(key, deps);
|
|
247
|
-
if (!runtimeKey) {
|
|
248
|
-
return true;
|
|
249
|
-
}
|
|
250
|
-
if (pinnedStrict) {
|
|
251
|
-
if (!isAntigravityGeminiModelKey(key, deps)) {
|
|
252
|
-
return true;
|
|
253
|
-
}
|
|
254
|
-
if (preferredGeminiRuntimeKey && runtimeKey !== preferredGeminiRuntimeKey) {
|
|
255
|
-
return false;
|
|
256
|
-
}
|
|
257
|
-
}
|
|
258
|
-
const lease = leaseStore.get(runtimeKey);
|
|
259
|
-
if (!lease) {
|
|
260
|
-
return true;
|
|
261
|
-
}
|
|
262
|
-
if (lease.sessionKey === scopedSessionKey) {
|
|
263
|
-
return true;
|
|
264
|
-
}
|
|
265
|
-
if (now - lease.lastSeenAt >= cooldownMs) {
|
|
266
|
-
return true;
|
|
267
|
-
}
|
|
268
|
-
blocked += 1;
|
|
269
|
-
return false;
|
|
270
|
-
});
|
|
271
|
-
return { targets: filtered, blocked, preferredPinned, pinnedStrict, preferredRuntimeKey: preferredGeminiRuntimeKey };
|
|
272
|
-
}
|
|
8
|
+
import { applyAntigravityAliasSessionLeases, extractLeaseRuntimeKey, isAntigravityGeminiModelKey, } from './tier-selection-antigravity-session-lease.js';
|
|
9
|
+
import { extractNonAntigravityTargets, preferNonAntigravityWhenPossible, shouldAvoidAllAntigravityOnRetry, shouldAvoidAntigravityAfterRepeatedError } from './tier-selection-antigravity-target-split.js';
|
|
273
10
|
export function trySelectFromTier(routeName, tier, stickyKey, estimatedTokens, features, deps, options) {
|
|
274
11
|
const { disabledProviders, disabledKeysMap, allowedProviders, disabledModels, requiredProviderKeys } = options;
|
|
275
12
|
let targets = Array.isArray(tier.targets) ? tier.targets : [];
|