@juspay/neurolink 9.23.0 → 9.25.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +12 -0
- package/README.md +10 -13
- package/dist/adapters/tts/googleTTSHandler.js +26 -1
- package/dist/adapters/video/vertexVideoHandler.js +23 -17
- package/dist/cli/commands/config.d.ts +3 -3
- package/dist/cli/commands/observability.d.ts +53 -0
- package/dist/cli/commands/observability.js +453 -0
- package/dist/cli/commands/telemetry.d.ts +63 -0
- package/dist/cli/commands/telemetry.js +689 -0
- package/dist/cli/factories/commandFactory.d.ts +34 -0
- package/dist/cli/factories/commandFactory.js +321 -116
- package/dist/cli/parser.js +6 -9
- package/dist/cli/utils/formatters.d.ts +13 -0
- package/dist/cli/utils/formatters.js +23 -0
- package/dist/constants/contextWindows.js +6 -0
- package/dist/constants/enums.d.ts +6 -0
- package/dist/constants/enums.js +8 -2
- package/dist/context/budgetChecker.js +75 -48
- package/dist/context/contextCompactor.js +135 -127
- package/dist/core/baseProvider.d.ts +5 -0
- package/dist/core/baseProvider.js +158 -102
- package/dist/core/conversationMemoryInitializer.js +7 -4
- package/dist/core/conversationMemoryManager.d.ts +2 -0
- package/dist/core/conversationMemoryManager.js +6 -2
- package/dist/core/modules/GenerationHandler.d.ts +2 -2
- package/dist/core/modules/GenerationHandler.js +12 -12
- package/dist/evaluation/ragasEvaluator.js +39 -19
- package/dist/evaluation/scoring.js +46 -20
- package/dist/features/ppt/index.d.ts +1 -1
- package/dist/features/ppt/index.js +1 -1
- package/dist/features/ppt/presentationOrchestrator.js +23 -0
- package/dist/features/ppt/slideGenerator.js +13 -0
- package/dist/features/ppt/slideRenderers.d.ts +1 -1
- package/dist/features/ppt/slideRenderers.js +6 -4
- package/dist/features/ppt/slideTypeInference.d.ts +1 -1
- package/dist/features/ppt/slideTypeInference.js +75 -73
- package/dist/files/fileTools.d.ts +6 -6
- package/dist/index.d.ts +46 -12
- package/dist/index.js +79 -17
- package/dist/lib/adapters/tts/googleTTSHandler.js +26 -1
- package/dist/lib/adapters/video/vertexVideoHandler.js +23 -17
- package/dist/lib/constants/contextWindows.js +6 -0
- package/dist/lib/constants/enums.d.ts +6 -0
- package/dist/lib/constants/enums.js +8 -2
- package/dist/lib/context/budgetChecker.js +75 -48
- package/dist/lib/context/contextCompactor.js +135 -127
- package/dist/lib/core/baseProvider.d.ts +5 -0
- package/dist/lib/core/baseProvider.js +158 -102
- package/dist/lib/core/conversationMemoryInitializer.js +7 -4
- package/dist/lib/core/conversationMemoryManager.d.ts +2 -0
- package/dist/lib/core/conversationMemoryManager.js +6 -2
- package/dist/lib/core/modules/GenerationHandler.d.ts +2 -2
- package/dist/lib/core/modules/GenerationHandler.js +12 -12
- package/dist/lib/evaluation/ragasEvaluator.js +39 -19
- package/dist/lib/evaluation/scoring.js +46 -20
- package/dist/lib/features/ppt/index.d.ts +1 -1
- package/dist/lib/features/ppt/index.js +1 -1
- package/dist/lib/features/ppt/presentationOrchestrator.js +23 -0
- package/dist/lib/features/ppt/slideGenerator.js +13 -0
- package/dist/lib/features/ppt/slideRenderers.d.ts +1 -1
- package/dist/lib/features/ppt/slideRenderers.js +6 -4
- package/dist/lib/features/ppt/slideTypeInference.d.ts +1 -1
- package/dist/lib/features/ppt/slideTypeInference.js +75 -73
- package/dist/lib/files/fileTools.d.ts +6 -6
- package/dist/lib/index.d.ts +46 -12
- package/dist/lib/index.js +79 -17
- package/dist/lib/mcp/httpRateLimiter.js +39 -12
- package/dist/lib/mcp/httpRetryHandler.js +22 -1
- package/dist/lib/mcp/mcpClientFactory.js +13 -15
- package/dist/lib/memory/memoryRetrievalTools.js +22 -0
- package/dist/lib/neurolink.d.ts +64 -72
- package/dist/lib/neurolink.js +984 -566
- package/dist/lib/observability/exporterRegistry.d.ts +152 -0
- package/dist/lib/observability/exporterRegistry.js +414 -0
- package/dist/lib/observability/exporters/arizeExporter.d.ts +32 -0
- package/dist/lib/observability/exporters/arizeExporter.js +139 -0
- package/dist/lib/observability/exporters/baseExporter.d.ts +117 -0
- package/dist/lib/observability/exporters/baseExporter.js +191 -0
- package/dist/lib/observability/exporters/braintrustExporter.d.ts +30 -0
- package/dist/lib/observability/exporters/braintrustExporter.js +155 -0
- package/dist/lib/observability/exporters/datadogExporter.d.ts +37 -0
- package/dist/lib/observability/exporters/datadogExporter.js +197 -0
- package/dist/lib/observability/exporters/index.d.ts +13 -0
- package/dist/lib/observability/exporters/index.js +14 -0
- package/dist/lib/observability/exporters/laminarExporter.d.ts +48 -0
- package/dist/lib/observability/exporters/laminarExporter.js +303 -0
- package/dist/lib/observability/exporters/langfuseExporter.d.ts +47 -0
- package/dist/lib/observability/exporters/langfuseExporter.js +200 -0
- package/dist/lib/observability/exporters/langsmithExporter.d.ts +26 -0
- package/dist/lib/observability/exporters/langsmithExporter.js +124 -0
- package/dist/lib/observability/exporters/otelExporter.d.ts +39 -0
- package/dist/lib/observability/exporters/otelExporter.js +165 -0
- package/dist/lib/observability/exporters/posthogExporter.d.ts +48 -0
- package/dist/lib/observability/exporters/posthogExporter.js +288 -0
- package/dist/lib/observability/exporters/sentryExporter.d.ts +32 -0
- package/dist/lib/observability/exporters/sentryExporter.js +166 -0
- package/dist/lib/observability/index.d.ts +25 -0
- package/dist/lib/observability/index.js +32 -0
- package/dist/lib/observability/metricsAggregator.d.ts +260 -0
- package/dist/lib/observability/metricsAggregator.js +553 -0
- package/dist/lib/observability/otelBridge.d.ts +49 -0
- package/dist/lib/observability/otelBridge.js +132 -0
- package/dist/lib/observability/retryPolicy.d.ts +192 -0
- package/dist/lib/observability/retryPolicy.js +384 -0
- package/dist/lib/observability/sampling/index.d.ts +4 -0
- package/dist/lib/observability/sampling/index.js +5 -0
- package/dist/lib/observability/sampling/samplers.d.ts +116 -0
- package/dist/lib/observability/sampling/samplers.js +217 -0
- package/dist/lib/observability/spanProcessor.d.ts +129 -0
- package/dist/lib/observability/spanProcessor.js +288 -0
- package/dist/lib/observability/tokenTracker.d.ts +156 -0
- package/dist/lib/observability/tokenTracker.js +414 -0
- package/dist/lib/observability/types/exporterTypes.d.ts +250 -0
- package/dist/lib/observability/types/exporterTypes.js +6 -0
- package/dist/lib/observability/types/index.d.ts +6 -0
- package/dist/lib/observability/types/index.js +5 -0
- package/dist/lib/observability/types/spanTypes.d.ts +244 -0
- package/dist/lib/observability/types/spanTypes.js +93 -0
- package/dist/lib/observability/utils/index.d.ts +4 -0
- package/dist/lib/observability/utils/index.js +5 -0
- package/dist/lib/observability/utils/spanSerializer.d.ts +115 -0
- package/dist/lib/observability/utils/spanSerializer.js +287 -0
- package/dist/lib/providers/amazonSagemaker.d.ts +5 -4
- package/dist/lib/providers/amazonSagemaker.js +3 -4
- package/dist/lib/providers/googleVertex.d.ts +7 -0
- package/dist/lib/providers/googleVertex.js +80 -2
- package/dist/lib/rag/pipeline/RAGPipeline.d.ts +0 -5
- package/dist/lib/rag/pipeline/RAGPipeline.js +122 -87
- package/dist/lib/rag/ragIntegration.js +30 -0
- package/dist/lib/rag/retrieval/hybridSearch.js +22 -0
- package/dist/lib/server/abstract/baseServerAdapter.js +51 -19
- package/dist/lib/server/middleware/common.js +44 -12
- package/dist/lib/services/server/ai/observability/instrumentation.d.ts +2 -2
- package/dist/lib/services/server/ai/observability/instrumentation.js +10 -5
- package/dist/lib/types/cli.d.ts +18 -2
- package/dist/lib/types/conversationMemoryInterface.d.ts +2 -0
- package/dist/lib/types/generateTypes.d.ts +2 -2
- package/dist/lib/types/modelTypes.d.ts +18 -18
- package/dist/lib/types/providers.d.ts +5 -0
- package/dist/lib/utils/pricing.js +25 -1
- package/dist/lib/utils/ttsProcessor.js +74 -59
- package/dist/lib/workflow/config.d.ts +36 -36
- package/dist/lib/workflow/core/ensembleExecutor.js +10 -0
- package/dist/lib/workflow/core/judgeScorer.js +20 -2
- package/dist/lib/workflow/core/workflowRunner.js +34 -1
- package/dist/mcp/httpRateLimiter.js +39 -12
- package/dist/mcp/httpRetryHandler.js +22 -1
- package/dist/mcp/mcpClientFactory.js +13 -15
- package/dist/memory/memoryRetrievalTools.js +22 -0
- package/dist/neurolink.d.ts +64 -72
- package/dist/neurolink.js +984 -566
- package/dist/observability/FEATURE-STATUS.md +269 -0
- package/dist/observability/exporterRegistry.d.ts +152 -0
- package/dist/observability/exporterRegistry.js +413 -0
- package/dist/observability/exporters/arizeExporter.d.ts +32 -0
- package/dist/observability/exporters/arizeExporter.js +138 -0
- package/dist/observability/exporters/baseExporter.d.ts +117 -0
- package/dist/observability/exporters/baseExporter.js +190 -0
- package/dist/observability/exporters/braintrustExporter.d.ts +30 -0
- package/dist/observability/exporters/braintrustExporter.js +154 -0
- package/dist/observability/exporters/datadogExporter.d.ts +37 -0
- package/dist/observability/exporters/datadogExporter.js +196 -0
- package/dist/observability/exporters/index.d.ts +13 -0
- package/dist/observability/exporters/index.js +13 -0
- package/dist/observability/exporters/laminarExporter.d.ts +48 -0
- package/dist/observability/exporters/laminarExporter.js +302 -0
- package/dist/observability/exporters/langfuseExporter.d.ts +47 -0
- package/dist/observability/exporters/langfuseExporter.js +199 -0
- package/dist/observability/exporters/langsmithExporter.d.ts +26 -0
- package/dist/observability/exporters/langsmithExporter.js +123 -0
- package/dist/observability/exporters/otelExporter.d.ts +39 -0
- package/dist/observability/exporters/otelExporter.js +164 -0
- package/dist/observability/exporters/posthogExporter.d.ts +48 -0
- package/dist/observability/exporters/posthogExporter.js +287 -0
- package/dist/observability/exporters/sentryExporter.d.ts +32 -0
- package/dist/observability/exporters/sentryExporter.js +165 -0
- package/dist/observability/index.d.ts +25 -0
- package/dist/observability/index.js +31 -0
- package/dist/observability/metricsAggregator.d.ts +260 -0
- package/dist/observability/metricsAggregator.js +552 -0
- package/dist/observability/otelBridge.d.ts +49 -0
- package/dist/observability/otelBridge.js +131 -0
- package/dist/observability/retryPolicy.d.ts +192 -0
- package/dist/observability/retryPolicy.js +383 -0
- package/dist/observability/sampling/index.d.ts +4 -0
- package/dist/observability/sampling/index.js +4 -0
- package/dist/observability/sampling/samplers.d.ts +116 -0
- package/dist/observability/sampling/samplers.js +216 -0
- package/dist/observability/spanProcessor.d.ts +129 -0
- package/dist/observability/spanProcessor.js +287 -0
- package/dist/observability/tokenTracker.d.ts +156 -0
- package/dist/observability/tokenTracker.js +413 -0
- package/dist/observability/types/exporterTypes.d.ts +250 -0
- package/dist/observability/types/exporterTypes.js +5 -0
- package/dist/observability/types/index.d.ts +6 -0
- package/dist/observability/types/index.js +4 -0
- package/dist/observability/types/spanTypes.d.ts +244 -0
- package/dist/observability/types/spanTypes.js +92 -0
- package/dist/observability/utils/index.d.ts +4 -0
- package/dist/observability/utils/index.js +4 -0
- package/dist/observability/utils/spanSerializer.d.ts +115 -0
- package/dist/observability/utils/spanSerializer.js +286 -0
- package/dist/providers/amazonSagemaker.d.ts +5 -4
- package/dist/providers/amazonSagemaker.js +3 -4
- package/dist/providers/googleVertex.d.ts +7 -0
- package/dist/providers/googleVertex.js +80 -2
- package/dist/rag/pipeline/RAGPipeline.d.ts +0 -5
- package/dist/rag/pipeline/RAGPipeline.js +122 -87
- package/dist/rag/ragIntegration.js +30 -0
- package/dist/rag/retrieval/hybridSearch.js +22 -0
- package/dist/server/abstract/baseServerAdapter.js +51 -19
- package/dist/server/middleware/common.js +44 -12
- package/dist/services/server/ai/observability/instrumentation.d.ts +2 -2
- package/dist/services/server/ai/observability/instrumentation.js +10 -5
- package/dist/types/cli.d.ts +18 -2
- package/dist/types/conversationMemoryInterface.d.ts +2 -0
- package/dist/types/generateTypes.d.ts +2 -2
- package/dist/types/providers.d.ts +5 -0
- package/dist/utils/pricing.js +25 -1
- package/dist/utils/ttsProcessor.js +74 -59
- package/dist/workflow/config.d.ts +52 -52
- package/dist/workflow/core/ensembleExecutor.js +10 -0
- package/dist/workflow/core/judgeScorer.js +20 -2
- package/dist/workflow/core/workflowRunner.js +34 -1
- package/package.json +1 -1
|
@@ -8,9 +8,11 @@
|
|
|
8
8
|
* Stage 3: LLM Summarization (expensive -- requires LLM call)
|
|
9
9
|
* Stage 4: Sliding Window Truncation (fallback -- no LLM call)
|
|
10
10
|
*/
|
|
11
|
-
import { trace, SpanStatusCode } from "@opentelemetry/api";
|
|
12
11
|
import { estimateMessagesTokens } from "../utils/tokenEstimation.js";
|
|
13
12
|
import { logger } from "../utils/logger.js";
|
|
13
|
+
import { withTimeout } from "../utils/async/withTimeout.js";
|
|
14
|
+
import { SpanSerializer, SpanType, SpanStatus, } from "../observability/index.js";
|
|
15
|
+
import { getMetricsAggregator } from "../observability/index.js";
|
|
14
16
|
import { pruneToolOutputs } from "./stages/toolOutputPruner.js";
|
|
15
17
|
import { deduplicateFileReads } from "./stages/fileReadDeduplicator.js";
|
|
16
18
|
import { summarizeMessages } from "./stages/structuredSummarizer.js";
|
|
@@ -38,155 +40,161 @@ export class ContextCompactor {
|
|
|
38
40
|
* Run the multi-stage compaction pipeline until messages fit within budget.
|
|
39
41
|
*/
|
|
40
42
|
async compact(messages, targetTokens, memoryConfig, requestId) {
|
|
41
|
-
const
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
const stagesUsed = [];
|
|
45
|
-
let currentMessages = [...messages];
|
|
46
|
-
logger.info("[Compaction] Starting", {
|
|
47
|
-
requestId,
|
|
48
|
-
estimatedTokens: tokensBefore,
|
|
49
|
-
budgetTokens: targetTokens,
|
|
43
|
+
const span = SpanSerializer.createSpan(SpanType.CONTEXT_COMPACTION, "context.compact", {
|
|
44
|
+
"context.operation": "compact",
|
|
45
|
+
"context.targetTokens": targetTokens,
|
|
50
46
|
});
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
const
|
|
55
|
-
const
|
|
56
|
-
|
|
57
|
-
|
|
58
|
-
protectedTools: this.config.pruneProtectedTools,
|
|
59
|
-
provider,
|
|
60
|
-
});
|
|
61
|
-
if (pruneResult.pruned) {
|
|
62
|
-
currentMessages = pruneResult.messages;
|
|
63
|
-
stagesUsed.push("prune");
|
|
64
|
-
}
|
|
65
|
-
const stageTokensAfter = estimateMessagesTokens(currentMessages, provider);
|
|
66
|
-
logger.info("[Compaction] Stage 1 (prune)", {
|
|
47
|
+
const spanStartTime = Date.now();
|
|
48
|
+
try {
|
|
49
|
+
const provider = this.config.provider || undefined;
|
|
50
|
+
const tokensBefore = estimateMessagesTokens(messages, provider);
|
|
51
|
+
const stagesUsed = [];
|
|
52
|
+
let currentMessages = [...messages];
|
|
53
|
+
logger.info("[Compaction] Starting", {
|
|
67
54
|
requestId,
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
tokensAfter: stageTokensAfter,
|
|
71
|
-
saved: stageTokensBefore - stageTokensAfter,
|
|
55
|
+
estimatedTokens: tokensBefore,
|
|
56
|
+
budgetTokens: targetTokens,
|
|
72
57
|
});
|
|
73
|
-
|
|
74
|
-
|
|
75
|
-
|
|
76
|
-
|
|
77
|
-
|
|
78
|
-
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
|
|
82
|
-
}
|
|
83
|
-
const stageTokensAfter = estimateMessagesTokens(currentMessages, provider);
|
|
84
|
-
logger.info("[Compaction] Stage 2 (deduplicate)", {
|
|
85
|
-
requestId,
|
|
86
|
-
ran: dedupResult.deduplicated,
|
|
87
|
-
tokensBefore: stageTokensBefore,
|
|
88
|
-
tokensAfter: stageTokensAfter,
|
|
89
|
-
saved: stageTokensBefore - stageTokensAfter,
|
|
90
|
-
});
|
|
91
|
-
}
|
|
92
|
-
// Stage 3: LLM Summarization
|
|
93
|
-
if (this.config.enableSummarize &&
|
|
94
|
-
estimateMessagesTokens(currentMessages, provider) > targetTokens) {
|
|
95
|
-
const stageTokensBefore = estimateMessagesTokens(currentMessages, provider);
|
|
96
|
-
try {
|
|
97
|
-
const summarizeResult = await summarizeMessages(currentMessages, {
|
|
98
|
-
provider: this.config.summarizationProvider,
|
|
99
|
-
model: this.config.summarizationModel,
|
|
100
|
-
keepRecentRatio: this.config.keepRecentRatio,
|
|
101
|
-
memoryConfig,
|
|
58
|
+
// Stage 1: Tool Output Pruning
|
|
59
|
+
if (this.config.enablePrune &&
|
|
60
|
+
estimateMessagesTokens(currentMessages, provider) > targetTokens) {
|
|
61
|
+
const stageTokensBefore = estimateMessagesTokens(currentMessages, provider);
|
|
62
|
+
const pruneResult = pruneToolOutputs(currentMessages, {
|
|
63
|
+
protectTokens: this.config.pruneProtectTokens,
|
|
64
|
+
minimumSavings: this.config.pruneMinimumSavings,
|
|
65
|
+
protectedTools: this.config.pruneProtectedTools,
|
|
66
|
+
provider,
|
|
102
67
|
});
|
|
103
|
-
if (
|
|
104
|
-
currentMessages =
|
|
105
|
-
stagesUsed.push("
|
|
68
|
+
if (pruneResult.pruned) {
|
|
69
|
+
currentMessages = pruneResult.messages;
|
|
70
|
+
stagesUsed.push("prune");
|
|
106
71
|
}
|
|
107
72
|
const stageTokensAfter = estimateMessagesTokens(currentMessages, provider);
|
|
108
|
-
logger.info("[Compaction] Stage
|
|
73
|
+
logger.info("[Compaction] Stage 1 (prune)", {
|
|
109
74
|
requestId,
|
|
110
|
-
ran:
|
|
75
|
+
ran: pruneResult.pruned,
|
|
111
76
|
tokensBefore: stageTokensBefore,
|
|
112
77
|
tokensAfter: stageTokensAfter,
|
|
113
78
|
saved: stageTokensBefore - stageTokensAfter,
|
|
114
79
|
});
|
|
115
80
|
}
|
|
116
|
-
|
|
117
|
-
|
|
118
|
-
|
|
119
|
-
const
|
|
120
|
-
|
|
81
|
+
// Stage 2: File Read Deduplication
|
|
82
|
+
if (this.config.enableDeduplicate &&
|
|
83
|
+
estimateMessagesTokens(currentMessages, provider) > targetTokens) {
|
|
84
|
+
const stageTokensBefore = estimateMessagesTokens(currentMessages, provider);
|
|
85
|
+
const dedupResult = deduplicateFileReads(currentMessages);
|
|
86
|
+
if (dedupResult.deduplicated) {
|
|
87
|
+
currentMessages = dedupResult.messages;
|
|
88
|
+
stagesUsed.push("deduplicate");
|
|
89
|
+
}
|
|
90
|
+
const stageTokensAfter = estimateMessagesTokens(currentMessages, provider);
|
|
91
|
+
logger.info("[Compaction] Stage 2 (deduplicate)", {
|
|
121
92
|
requestId,
|
|
122
|
-
|
|
123
|
-
errorName,
|
|
93
|
+
ran: dedupResult.deduplicated,
|
|
124
94
|
tokensBefore: stageTokensBefore,
|
|
125
|
-
tokensAfter:
|
|
126
|
-
saved:
|
|
95
|
+
tokensAfter: stageTokensAfter,
|
|
96
|
+
saved: stageTokensBefore - stageTokensAfter,
|
|
127
97
|
});
|
|
128
|
-
|
|
129
|
-
|
|
130
|
-
|
|
131
|
-
|
|
132
|
-
|
|
133
|
-
|
|
134
|
-
|
|
135
|
-
|
|
136
|
-
|
|
137
|
-
|
|
98
|
+
}
|
|
99
|
+
// Stage 3: LLM Summarization
|
|
100
|
+
if (this.config.enableSummarize &&
|
|
101
|
+
estimateMessagesTokens(currentMessages, provider) > targetTokens) {
|
|
102
|
+
const stageTokensBefore = estimateMessagesTokens(currentMessages, provider);
|
|
103
|
+
try {
|
|
104
|
+
const summarizeResult = await withTimeout(summarizeMessages(currentMessages, {
|
|
105
|
+
provider: this.config.summarizationProvider,
|
|
106
|
+
model: this.config.summarizationModel,
|
|
107
|
+
keepRecentRatio: this.config.keepRecentRatio,
|
|
108
|
+
memoryConfig,
|
|
109
|
+
}), 120_000, "LLM summarization timed out after 120s");
|
|
110
|
+
if (summarizeResult.summarized) {
|
|
111
|
+
currentMessages = summarizeResult.messages;
|
|
112
|
+
stagesUsed.push("summarize");
|
|
138
113
|
}
|
|
139
|
-
|
|
140
|
-
|
|
141
|
-
|
|
142
|
-
|
|
114
|
+
const stageTokensAfter = estimateMessagesTokens(currentMessages, provider);
|
|
115
|
+
logger.info("[Compaction] Stage 3 (summarize)", {
|
|
116
|
+
requestId,
|
|
117
|
+
ran: summarizeResult.summarized,
|
|
118
|
+
tokensBefore: stageTokensBefore,
|
|
119
|
+
tokensAfter: stageTokensAfter,
|
|
120
|
+
saved: stageTokensBefore - stageTokensAfter,
|
|
121
|
+
});
|
|
122
|
+
}
|
|
123
|
+
catch (error) {
|
|
124
|
+
const err = error instanceof Error ? error : new Error(String(error));
|
|
125
|
+
logger.warn("[Compaction] Stage 3 (summarize) FAILED", {
|
|
126
|
+
requestId,
|
|
127
|
+
error: err.message,
|
|
128
|
+
errorName: err.name,
|
|
129
|
+
tokensBefore: stageTokensBefore,
|
|
130
|
+
tokensAfter: stageTokensBefore,
|
|
131
|
+
saved: 0,
|
|
132
|
+
});
|
|
133
|
+
// Record failure on the compaction span for trace visibility
|
|
134
|
+
SpanSerializer.updateAttributes(span, {
|
|
135
|
+
"compaction.stage3.error": err.message,
|
|
136
|
+
"compaction.stage3.errorName": err.name,
|
|
137
|
+
"compaction.stage3.tokensBefore": stageTokensBefore,
|
|
138
|
+
"compaction.stage3_failed": true,
|
|
143
139
|
});
|
|
140
|
+
// Fall through to Stage 4 truncation as before
|
|
144
141
|
}
|
|
145
|
-
// Fall through to Stage 4 truncation as before
|
|
146
142
|
}
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
|
|
154
|
-
|
|
155
|
-
|
|
156
|
-
|
|
157
|
-
|
|
158
|
-
|
|
159
|
-
|
|
160
|
-
|
|
161
|
-
|
|
162
|
-
|
|
143
|
+
// Stage 4: Sliding Window Truncation (fallback)
|
|
144
|
+
if (this.config.enableTruncate &&
|
|
145
|
+
estimateMessagesTokens(currentMessages, provider) > targetTokens) {
|
|
146
|
+
const stageTokensBefore = estimateMessagesTokens(currentMessages, provider);
|
|
147
|
+
const truncResult = truncateWithSlidingWindow(currentMessages, {
|
|
148
|
+
fraction: this.config.truncationFraction,
|
|
149
|
+
});
|
|
150
|
+
if (truncResult.truncated) {
|
|
151
|
+
currentMessages = truncResult.messages;
|
|
152
|
+
stagesUsed.push("truncate");
|
|
153
|
+
}
|
|
154
|
+
const stageTokensAfter = estimateMessagesTokens(currentMessages, provider);
|
|
155
|
+
logger.info("[Compaction] Stage 4 (truncate)", {
|
|
156
|
+
requestId,
|
|
157
|
+
ran: truncResult.truncated,
|
|
158
|
+
tokensBefore: stageTokensBefore,
|
|
159
|
+
tokensAfter: stageTokensAfter,
|
|
160
|
+
saved: stageTokensBefore - stageTokensAfter,
|
|
161
|
+
});
|
|
163
162
|
}
|
|
164
|
-
const
|
|
165
|
-
logger.info("[Compaction]
|
|
163
|
+
const tokensAfter = estimateMessagesTokens(currentMessages, provider);
|
|
164
|
+
logger.info("[Compaction] Complete", {
|
|
166
165
|
requestId,
|
|
167
|
-
|
|
168
|
-
|
|
169
|
-
|
|
170
|
-
|
|
166
|
+
tokensBefore,
|
|
167
|
+
tokensAfter,
|
|
168
|
+
totalSaved: tokensBefore - tokensAfter,
|
|
169
|
+
stagesUsed,
|
|
170
|
+
durationMs: Date.now() - spanStartTime,
|
|
171
171
|
});
|
|
172
|
+
const result = {
|
|
173
|
+
compacted: stagesUsed.length > 0,
|
|
174
|
+
stagesUsed,
|
|
175
|
+
tokensBefore,
|
|
176
|
+
tokensAfter,
|
|
177
|
+
tokensSaved: tokensBefore - tokensAfter,
|
|
178
|
+
messages: currentMessages,
|
|
179
|
+
};
|
|
180
|
+
span.durationMs = Date.now() - spanStartTime;
|
|
181
|
+
const endedSpan = SpanSerializer.endSpan(SpanSerializer.updateAttributes(span, {
|
|
182
|
+
"context.stage": stagesUsed.join(",") || "none",
|
|
183
|
+
"context.tokensBefore": tokensBefore,
|
|
184
|
+
"context.tokensAfter": tokensAfter,
|
|
185
|
+
"context.tokensSaved": tokensBefore - tokensAfter,
|
|
186
|
+
}), SpanStatus.OK);
|
|
187
|
+
getMetricsAggregator().recordSpan(endedSpan);
|
|
188
|
+
return result;
|
|
189
|
+
}
|
|
190
|
+
catch (error) {
|
|
191
|
+
span.durationMs = Date.now() - spanStartTime;
|
|
192
|
+
const endedSpan = SpanSerializer.endSpan(span, SpanStatus.ERROR);
|
|
193
|
+
endedSpan.statusMessage =
|
|
194
|
+
error instanceof Error ? error.message : String(error);
|
|
195
|
+
getMetricsAggregator().recordSpan(endedSpan);
|
|
196
|
+
throw error;
|
|
172
197
|
}
|
|
173
|
-
const tokensAfter = estimateMessagesTokens(currentMessages, provider);
|
|
174
|
-
logger.info("[Compaction] Complete", {
|
|
175
|
-
requestId,
|
|
176
|
-
tokensBefore,
|
|
177
|
-
tokensAfter,
|
|
178
|
-
totalSaved: tokensBefore - tokensAfter,
|
|
179
|
-
stagesUsed,
|
|
180
|
-
durationMs: Date.now() - compactionStartTime,
|
|
181
|
-
});
|
|
182
|
-
return {
|
|
183
|
-
compacted: stagesUsed.length > 0,
|
|
184
|
-
stagesUsed,
|
|
185
|
-
tokensBefore,
|
|
186
|
-
tokensAfter,
|
|
187
|
-
tokensSaved: tokensBefore - tokensAfter,
|
|
188
|
-
messages: currentMessages,
|
|
189
|
-
};
|
|
190
198
|
}
|
|
191
199
|
}
|
|
192
200
|
//# sourceMappingURL=contextCompactor.js.map
|
|
@@ -24,6 +24,11 @@ export declare abstract class BaseProvider implements AIProvider {
|
|
|
24
24
|
protected sessionId?: string;
|
|
25
25
|
protected userId?: string;
|
|
26
26
|
protected neurolink?: NeuroLink;
|
|
27
|
+
/** Trace context propagated from NeuroLink SDK for span hierarchy */
|
|
28
|
+
_traceContext: {
|
|
29
|
+
traceId: string;
|
|
30
|
+
parentSpanId: string;
|
|
31
|
+
} | null;
|
|
27
32
|
private readonly messageBuilder;
|
|
28
33
|
private readonly streamHandler;
|
|
29
34
|
private readonly generationHandler;
|