npm - lynkr - Versions diffs - 8.0.0 → 9.0.1 - Mend

lynkr 8.0.0 → 9.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (128) hide show

package/.lynkr/telemetry.db +0 -0
package/.lynkr/telemetry.db-shm +0 -0
package/.lynkr/telemetry.db-wal +0 -0
package/README.md +196 -322
package/lynkr-skill.tar.gz +0 -0
package/package.json +4 -3
package/src/api/openai-router.js +64 -13
package/src/api/providers-handler.js +171 -3
package/src/api/router.js +9 -2
package/src/clients/circuit-breaker.js +10 -247
package/src/clients/codex-process.js +342 -0
package/src/clients/codex-utils.js +143 -0
package/src/clients/databricks.js +210 -63
package/src/clients/resilience.js +540 -0
package/src/clients/retry.js +22 -167
package/src/clients/standard-tools.js +23 -0
package/src/config/index.js +77 -0
package/src/context/compression.js +42 -9
package/src/context/distill.js +492 -0
package/src/orchestrator/index.js +48 -8
package/src/routing/complexity-analyzer.js +258 -5
package/src/routing/index.js +12 -2
package/src/routing/latency-tracker.js +148 -0
package/src/routing/model-tiers.js +2 -0
package/src/routing/quality-scorer.js +113 -0
package/src/routing/telemetry.js +464 -0
package/src/server.js +13 -12
package/src/tools/code-graph.js +538 -0
package/src/tools/code-mode.js +304 -0
package/src/tools/index.js +4 -0
package/src/tools/lazy-loader.js +18 -0
package/src/tools/mcp-remote.js +7 -0
package/src/tools/smart-selection.js +11 -0
package/src/tools/tinyfish.js +358 -0
package/src/tools/truncate.js +1 -0
package/src/utils/payload.js +206 -0
package/src/utils/perf-timer.js +80 -0
package/.github/FUNDING.yml +0 -15
package/.github/workflows/README.md +0 -215
package/.github/workflows/ci.yml +0 -69
package/.github/workflows/index.yml +0 -62
package/.github/workflows/web-tools-tests.yml +0 -56
package/CITATIONS.bib +0 -6
package/DEPLOYMENT.md +0 -1001
package/LYNKR-TUI-PLAN.md +0 -984
package/PERFORMANCE-REPORT.md +0 -866
package/PLAN-per-client-model-routing.md +0 -252
package/docs/42642f749da6234f41b6b425c3bb07c9.txt +0 -1
package/docs/BingSiteAuth.xml +0 -4
package/docs/docs-style.css +0 -478
package/docs/docs.html +0 -198
package/docs/google5be250e608e6da39.html +0 -1
package/docs/index.html +0 -577
package/docs/index.md +0 -584
package/docs/robots.txt +0 -4
package/docs/sitemap.xml +0 -44
package/docs/style.css +0 -1223
package/docs/toon-integration-spec.md +0 -130
package/documentation/README.md +0 -101
package/documentation/api.md +0 -806
package/documentation/claude-code-cli.md +0 -679
package/documentation/codex-cli.md +0 -397
package/documentation/contributing.md +0 -571
package/documentation/cursor-integration.md +0 -734
package/documentation/docker.md +0 -874
package/documentation/embeddings.md +0 -762
package/documentation/faq.md +0 -713
package/documentation/features.md +0 -403
package/documentation/headroom.md +0 -519
package/documentation/installation.md +0 -758
package/documentation/memory-system.md +0 -476
package/documentation/production.md +0 -636
package/documentation/providers.md +0 -1009
package/documentation/routing.md +0 -476
package/documentation/testing.md +0 -629
package/documentation/token-optimization.md +0 -325
package/documentation/tools.md +0 -697
package/documentation/troubleshooting.md +0 -969
package/final-test.js +0 -33
package/headroom-sidecar/config.py +0 -93
package/headroom-sidecar/requirements.txt +0 -14
package/headroom-sidecar/server.py +0 -451
package/monitor-agents.sh +0 -31
package/scripts/audit-log-reader.js +0 -399
package/scripts/compact-dictionary.js +0 -204
package/scripts/test-deduplication.js +0 -448
package/src/db/database.sqlite +0 -0
package/te +0 -11622
package/test/README.md +0 -212
package/test/azure-openai-config.test.js +0 -213
package/test/azure-openai-error-resilience.test.js +0 -238
package/test/azure-openai-format-conversion.test.js +0 -354
package/test/azure-openai-integration.test.js +0 -287
package/test/azure-openai-routing.test.js +0 -175
package/test/azure-openai-streaming.test.js +0 -171
package/test/bedrock-integration.test.js +0 -457
package/test/comprehensive-test-suite.js +0 -928
package/test/config-validation.test.js +0 -207
package/test/cursor-integration.test.js +0 -484
package/test/format-conversion.test.js +0 -578
package/test/hybrid-routing-integration.test.js +0 -269
package/test/hybrid-routing-performance.test.js +0 -428
package/test/llamacpp-integration.test.js +0 -882
package/test/lmstudio-integration.test.js +0 -347
package/test/memory/extractor.test.js +0 -398
package/test/memory/retriever.test.js +0 -613
package/test/memory/retriever.test.js.bak +0 -585
package/test/memory/search.test.js +0 -537
package/test/memory/search.test.js.bak +0 -389
package/test/memory/store.test.js +0 -344
package/test/memory/store.test.js.bak +0 -312
package/test/memory/surprise.test.js +0 -300
package/test/memory-performance.test.js +0 -472
package/test/openai-integration.test.js +0 -683
package/test/openrouter-error-resilience.test.js +0 -418
package/test/passthrough-mode.test.js +0 -385
package/test/performance-benchmark.js +0 -351
package/test/performance-tests.js +0 -528
package/test/routing.test.js +0 -225
package/test/toon-compression.test.js +0 -131
package/test/web-tools.test.js +0 -329
package/test-agents-simple.js +0 -43
package/test-cli-connection.sh +0 -33
package/test-learning-unit.js +0 -126
package/test-learning.js +0 -112
package/test-parallel-agents.sh +0 -124
package/test-parallel-direct.js +0 -155
package/test-subagents.sh +0 -117

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "lynkr",
-  "version": "8.0.0",
+  "version": "9.0.1",
   "description": "Self-hosted Claude Code & Cursor proxy with Databricks,AWS BedRock,Azure  adapters, openrouter, Ollama,llamacpp,LM Studio, workspace tooling, and MCP integration.",
   "main": "index.js",
   "bin": {
@@ -8,13 +8,13 @@
     "lynkr-setup": "./scripts/setup.js"
   },
   "scripts": {
-    "prestart": "node -e \"if(process.env.HEADROOM_ENABLED==='true'&&process.env.HEADROOM_DOCKER_ENABLED!=='false'){process.exit(0)}else{process.exit(1)}\" && docker compose --profile headroom up -d headroom 2>/dev/null || echo 'Headroom skipped (disabled or Docker not running)'",
+    "prestart": "node -e \"if(process.env.HEADROOM_ENABLED==='true'&&process.env.HEADROOM_DOCKER_ENABLED!=='false'){process.exit(0)}else{process.exit(1)}\" && docker compose --profile headroom up -d --build headroom 2>/dev/null || echo 'Headroom skipped (disabled or Docker not running)'",
     "start": "node index.js 2>&1 | npx pino-pretty --sync",
     "stop": "node -e \"if(process.env.HEADROOM_ENABLED==='true'&&process.env.HEADROOM_DOCKER_ENABLED!=='false'){process.exit(0)}else{process.exit(1)}\" && docker compose --profile headroom down || echo 'Headroom skipped (disabled or Docker not running)'",
     "dev": "nodemon index.js",
     "lint": "eslint src index.js",
     "test": "npm run test:unit && npm run test:performance",
-    "test:unit": "DATABRICKS_API_KEY=test-key DATABRICKS_API_BASE=http://test.com node --test test/routing.test.js test/hybrid-routing-integration.test.js test/web-tools.test.js test/passthrough-mode.test.js test/openrouter-error-resilience.test.js test/format-conversion.test.js test/azure-openai-config.test.js test/azure-openai-format-conversion.test.js test/azure-openai-routing.test.js test/azure-openai-streaming.test.js test/azure-openai-error-resilience.test.js test/azure-openai-integration.test.js test/openai-integration.test.js test/toon-compression.test.js test/llamacpp-integration.test.js test/memory/store.test.js test/memory/surprise.test.js test/memory/extractor.test.js test/memory/search.test.js test/memory/retriever.test.js",
+    "test:unit": "DATABRICKS_API_KEY=test-key DATABRICKS_API_BASE=http://test.com node --test test/routing.test.js test/hybrid-routing-integration.test.js test/web-tools.test.js test/passthrough-mode.test.js test/openrouter-error-resilience.test.js test/format-conversion.test.js test/azure-openai-config.test.js test/azure-openai-format-conversion.test.js test/azure-openai-routing.test.js test/azure-openai-streaming.test.js test/azure-openai-error-resilience.test.js test/azure-openai-integration.test.js test/openai-integration.test.js test/toon-compression.test.js test/llamacpp-integration.test.js test/resilience.test.js test/telemetry-routing.test.js test/memory/store.test.js test/memory/surprise.test.js test/memory/extractor.test.js test/memory/search.test.js test/memory/retriever.test.js test/distill.test.js test/large-payload.test.js test/code-mode.test.js",
     "test:memory": "DATABRICKS_API_KEY=test-key DATABRICKS_API_BASE=http://test.com node --test test/memory/store.test.js test/memory/surprise.test.js test/memory/extractor.test.js test/memory/search.test.js test/memory/retriever.test.js",
     "test:new-features": "DATABRICKS_API_KEY=test-key DATABRICKS_API_BASE=http://test.com node --test test/passthrough-mode.test.js test/openrouter-error-resilience.test.js test/format-conversion.test.js",
     "test:performance": "DATABRICKS_API_KEY=test-key DATABRICKS_API_BASE=http://test.com node test/hybrid-routing-performance.test.js && DATABRICKS_API_KEY=test-key DATABRICKS_API_BASE=http://test.com node test/performance-tests.js",
@@ -48,6 +48,7 @@
     "@babel/parser": "^7.29.0",
     "@babel/traverse": "^7.29.0",
     "@toon-format/toon": "^2.1.0",
+    "cockatiel": "^3.2.1",
     "compression": "^1.7.4",
     "diff": "^5.2.0",
     "dotenv": "^16.4.5",

package/src/api/openai-router.js CHANGED Viewed

@@ -27,6 +27,23 @@ const { IDE_SAFE_TOOLS } = require("../clients/standard-tools");
 const router = express.Router();
+/**
+ * Resolve the model name for OpenAI responses.
+ * In OpenClaw mode, returns the actual provider/model from routing metadata.
+ */
+function resolveResponseModel(resultBody, requestModel) {
+  if (config.openclaw?.enabled && resultBody?._routingMeta) {
+    const meta = resultBody._routingMeta;
+    if (meta.provider && meta.model) {
+      return `${meta.provider}/${meta.model}`;
+    }
+    if (meta.provider) {
+      return meta.provider;
+    }
+  }
+  return requestModel;
+}
 /**
  * Client detection - identifies which AI coding tool is making the request
  * @param {Object} headers - Request headers
@@ -126,6 +143,13 @@ const CLIENT_TOOL_MAPPINGS = {
       mapArgs: (a) => ({
         query: a.query || ""
       })
+    },
+    "WebAgent": {
+      name: "web_agent",
+      mapArgs: (a) => ({
+        url: a.url || "",
+        goal: a.goal || ""
+      })
     }
   },
@@ -181,6 +205,13 @@ const CLIENT_TOOL_MAPPINGS = {
         path: a.path || a.directory || ".",
         recursive: false
       })
+    },
+    "WebAgent": {
+      name: "web_agent",
+      mapArgs: (a) => ({
+        url: a.url || "",
+        goal: a.goal || ""
+      })
     }
   },
@@ -237,6 +268,13 @@ const CLIENT_TOOL_MAPPINGS = {
         path: a.path || a.directory || ".",
         recursive: false
       })
+    },
+    "WebAgent": {
+      name: "web_agent",
+      mapArgs: (a) => ({
+        url: a.url || "",
+        goal: a.goal || ""
+      })
     }
   },
@@ -287,6 +325,13 @@ const CLIENT_TOOL_MAPPINGS = {
       mapArgs: (a) => ({
         filepath: a.path || a.directory || "."
       })
+    },
+    "WebAgent": {
+      name: "web_agent",
+      mapArgs: (a) => ({
+        url: a.url || "",
+        goal: a.goal || ""
+      })
     }
   }
 };
@@ -406,8 +451,10 @@ router.post("/chat/completions", async (req, res) => {
     //      that have a mapping in CLIENT_TOOL_MAPPINGS — this ensures clients like
     //      Codex don't see tools they can't handle (Task, WebFetch, NotebookEdit)
     //      while Claude Code (unknown client) gets the full IDE_SAFE_TOOLS set.
+    // Skip injection if client explicitly opted out (tool_choice: "none" or empty tools array).
     const clientType = detectClient(req.headers);
-    if (!anthropicRequest.tools || anthropicRequest.tools.length === 0) {
+    const clientExplicitlyDisabledTools = req.body.tool_choice === "none" || Array.isArray(req.body.tools);
+    if (!clientExplicitlyDisabledTools && (!anthropicRequest.tools || anthropicRequest.tools.length === 0)) {
       const clientMappings = CLIENT_TOOL_MAPPINGS[clientType];
       const clientTools = clientMappings
         ? IDE_SAFE_TOOLS.filter(t => clientMappings[t.name])
@@ -469,7 +516,8 @@ router.post("/chat/completions", async (req, res) => {
         }
         // Convert to OpenAI format
-        const openaiResponse = convertAnthropicToOpenAI(result.body, req.body.model);
+        const streamModel = resolveResponseModel(result.body, req.body.model);
+        const openaiResponse = convertAnthropicToOpenAI(result.body, streamModel);
         // Debug: Log what we're about to stream
         logger.debug({
@@ -509,7 +557,7 @@ router.post("/chat/completions", async (req, res) => {
           id: openaiResponse.id,
           object: "chat.completion.chunk",
           created: openaiResponse.created,
-          model: req.body.model,
+          model: streamModel,
           system_fingerprint: "fp_lynkr",
           choices: [{
             index: 0,
@@ -531,7 +579,7 @@ router.post("/chat/completions", async (req, res) => {
             id: openaiResponse.id,
             object: "chat.completion.chunk",
             created: openaiResponse.created,
-            model: req.body.model,
+            model: streamModel,
             system_fingerprint: "fp_lynkr",
             choices: [{
               index: 0,
@@ -551,7 +599,7 @@ router.post("/chat/completions", async (req, res) => {
               id: openaiResponse.id,
               object: "chat.completion.chunk",
               created: openaiResponse.created,
-              model: req.body.model,
+              model: streamModel,
               choices: [{
                 index: 0,
                 delta: {
@@ -578,7 +626,7 @@ router.post("/chat/completions", async (req, res) => {
           id: openaiResponse.id,
           object: "chat.completion.chunk",
           created: openaiResponse.created,
-          model: req.body.model,
+          model: streamModel,
           system_fingerprint: "fp_lynkr",
           choices: [{
             index: 0,
@@ -649,7 +697,7 @@ router.post("/chat/completions", async (req, res) => {
       }, "Orchestrator result structure");
       // Convert Anthropic response to OpenAI format
-      const openaiResponse = convertAnthropicToOpenAI(result.body, req.body.model);
+      const openaiResponse = convertAnthropicToOpenAI(result.body, resolveResponseModel(result.body, req.body.model));
       // Map tool names for known IDE clients
       if (clientType !== "unknown" && openaiResponse.choices?.[0]?.message?.tool_calls?.length > 0) {
@@ -1450,8 +1498,10 @@ router.post("/responses", async (req, res) => {
     }, "After Chat→Anthropic conversion");
     // Inject tools if client didn't send any (same two-layer filtering as chat/completions).
+    // Skip injection if client explicitly opted out (tool_choice: "none" or empty tools array).
     const clientType = detectClient(req.headers);
-    if (!anthropicRequest.tools || anthropicRequest.tools.length === 0) {
+    const clientExplicitlyDisabledTools = req.body.tool_choice === "none" || Array.isArray(req.body.tools);
+    if (!clientExplicitlyDisabledTools && (!anthropicRequest.tools || anthropicRequest.tools.length === 0)) {
       const clientMappings = CLIENT_TOOL_MAPPINGS[clientType];
       const clientTools = clientMappings
         ? IDE_SAFE_TOOLS.filter(t => clientMappings[t.name])
@@ -1503,7 +1553,8 @@ router.post("/responses", async (req, res) => {
         }, "=== ORCHESTRATOR RESULT FOR RESPONSES API ===");
         // Convert back: Anthropic → OpenAI → Responses
-        const chatResponse = convertAnthropicToOpenAI(result.body, req.body.model);
+        const responsesModel = resolveResponseModel(result.body, req.body.model);
+        const chatResponse = convertAnthropicToOpenAI(result.body, responsesModel);
         logger.debug({
           chatContent: chatResponse.choices?.[0]?.message?.content?.substring(0, 200),
@@ -1565,7 +1616,7 @@ router.post("/responses", async (req, res) => {
             object: "response",
             status: "in_progress",
             created_at: createdAt,
-            model: req.body.model,
+            model: responsesModel,
             output: [],
             usage: null
           },
@@ -1582,7 +1633,7 @@ router.post("/responses", async (req, res) => {
             object: "response",
             status: "in_progress",
             created_at: createdAt,
-            model: req.body.model,
+            model: responsesModel,
             output: [],
             usage: null
           },
@@ -1761,7 +1812,7 @@ router.post("/responses", async (req, res) => {
             object: "response",
             status: "completed",
             created_at: createdAt,
-            model: req.body.model,
+            model: responsesModel,
             output: outputItems,
             usage: {
               input_tokens: responsesResponse.usage?.prompt_tokens || 0,
@@ -1814,7 +1865,7 @@ router.post("/responses", async (req, res) => {
       });
       // Convert back: Anthropic → OpenAI → Responses
-      const chatResponse = convertAnthropicToOpenAI(result.body, req.body.model);
+      const chatResponse = convertAnthropicToOpenAI(result.body, resolveResponseModel(result.body, req.body.model));
       const responsesResponse = convertChatToResponses(chatResponse);
       logger.info({

package/src/api/providers-handler.js CHANGED Viewed

@@ -415,8 +415,8 @@ router.get("/health/providers", (req, res) => {
     // Get circuit breaker states
     const circuitBreakerStates = {};
     const allBreakers = registry.getAll();
-    for (const [name, breaker] of Object.entries(allBreakers)) {
-      circuitBreakerStates[name] = breaker.state;
+    for (const breaker of allBreakers) {
+      circuitBreakerStates[breaker.name] = breaker.state;
     }
     // Get all provider health
@@ -452,7 +452,8 @@ router.get("/health/providers/:name", (req, res) => {
     // Get circuit breaker state for this provider
     const allBreakers = registry.getAll();
-    const circuitState = allBreakers[providerName]?.state || "CLOSED";
+    const breakerState = allBreakers.find((b) => b.name === providerName);
+    const circuitState = breakerState?.state || "CLOSED";
     // Get detailed metrics
     const metrics = healthTracker.getProviderMetrics(providerName);
@@ -477,4 +478,171 @@ router.get("/health/providers/:name", (req, res) => {
   }
 });
+// ============================================================================
+// Routing Telemetry Endpoints
+// ============================================================================
+const telemetry = require("../routing/telemetry");
+const { getLatencyTracker } = require("../routing/latency-tracker");
+/**
+ * GET /v1/routing/stats
+ *
+ * Aggregated routing telemetry statistics.
+ */
+router.get("/routing/stats", (req, res) => {
+  try {
+    const since = req.query.since ? Number(req.query.since) : undefined;
+    const until = req.query.until ? Number(req.query.until) : undefined;
+    const stats = telemetry.getStats({ since, until });
+    if (!stats) {
+      return res.json({ object: "routing_stats", data: null, message: "No telemetry data available" });
+    }
+    // Merge latency tracker percentiles
+    const latencyTracker = getLatencyTracker();
+    const latencyStats = {};
+    for (const [provider, pStats] of latencyTracker.getAllStats()) {
+      latencyStats[provider] = pStats;
+    }
+    res.json({
+      object: "routing_stats",
+      data: { ...stats, latencyPercentiles: latencyStats },
+      timestamp: new Date().toISOString(),
+    });
+  } catch (error) {
+    logger.error({ error: error.message }, "Error getting routing stats");
+    res.status(500).json({ error: { type: "server_error", message: error.message } });
+  }
+});
+/**
+ * GET /v1/routing/stats/:provider
+ *
+ * Per-provider routing telemetry.
+ */
+router.get("/routing/stats/:provider", (req, res) => {
+  try {
+    const provider = req.params.provider.toLowerCase();
+    const since = req.query.since ? Number(req.query.since) : undefined;
+    const stats = telemetry.getProviderStats(provider, { since });
+    if (!stats) {
+      return res.json({ object: "provider_routing_stats", data: null, message: `No data for ${provider}` });
+    }
+    const latencyTracker = getLatencyTracker();
+    const latency = latencyTracker.getStats(provider);
+    res.json({
+      object: "provider_routing_stats",
+      provider,
+      data: { ...stats, latency },
+      timestamp: new Date().toISOString(),
+    });
+  } catch (error) {
+    logger.error({ error: error.message }, "Error getting provider routing stats");
+    res.status(500).json({ error: { type: "server_error", message: error.message } });
+  }
+});
+/**
+ * GET /v1/routing/telemetry
+ *
+ * Raw telemetry records (most recent first).
+ */
+router.get("/routing/telemetry", (req, res) => {
+  try {
+    const filters = {
+      provider: req.query.provider,
+      tier: req.query.tier,
+      since: req.query.since ? Number(req.query.since) : undefined,
+      limit: req.query.limit ? Number(req.query.limit) : 100,
+    };
+    const records = telemetry.query(filters);
+    res.json({ object: "telemetry_list", data: records, count: records.length });
+  } catch (error) {
+    logger.error({ error: error.message }, "Error querying telemetry");
+    res.status(500).json({ error: { type: "server_error", message: error.message } });
+  }
+});
+/**
+ * GET /v1/routing/accuracy
+ *
+ * Routing accuracy analysis (over/under-provisioned percentages).
+ */
+router.get("/routing/accuracy", (req, res) => {
+  try {
+    const since = req.query.since ? Number(req.query.since) : undefined;
+    const accuracy = telemetry.getRoutingAccuracy({ since });
+    res.json({
+      object: "routing_accuracy",
+      data: accuracy,
+      timestamp: new Date().toISOString(),
+    });
+  } catch (error) {
+    logger.error({ error: error.message }, "Error getting routing accuracy");
+    res.status(500).json({ error: { type: "server_error", message: error.message } });
+  }
+});
+// ── Admin: Hot Reload Config + Reset Circuit Breakers ─────────────────
+router.post("/admin/reload", (req, res) => {
+  try {
+    config.reloadConfig();
+    const registry = getCircuitBreakerRegistry();
+    const states = registry.getAll();
+    res.json({
+      object: "admin_reload",
+      status: "ok",
+      reloaded: [
+        "modelTiers",
+        "apiKeys",
+        "providerSettings",
+        "circuitBreakers",
+      ],
+      circuitBreakers: states.map(s => ({ name: s.name, state: s.state })),
+      timestamp: new Date().toISOString(),
+    });
+  } catch (error) {
+    logger.error({ error: error.message }, "Admin reload failed");
+    res.status(500).json({ error: { type: "server_error", message: error.message } });
+  }
+});
+router.post("/admin/circuit-breakers/reset", (req, res) => {
+  try {
+    const provider = req.query.provider || req.body?.provider;
+    const registry = getCircuitBreakerRegistry();
+    if (provider) {
+      const breaker = registry.breakers?.get(provider);
+      if (breaker) {
+        breaker.reset();
+        res.json({ object: "circuit_breaker_reset", provider, status: "reset" });
+      } else {
+        res.status(404).json({ error: { message: `No circuit breaker for provider: ${provider}` } });
+      }
+    } else {
+      registry.resetAll();
+      const states = registry.getAll();
+      res.json({
+        object: "circuit_breaker_reset",
+        provider: "all",
+        status: "reset",
+        breakers: states.map(s => ({ name: s.name, state: s.state })),
+      });
+    }
+  } catch (error) {
+    logger.error({ error: error.message }, "Circuit breaker reset failed");
+    res.status(500).json({ error: { type: "server_error", message: error.message } });
+  }
+});
 module.exports = router;

package/src/api/router.js CHANGED Viewed

@@ -136,7 +136,7 @@ router.post("/routing/analyze", async (req, res) => {
     const { getModelTierSelector } = require("../routing/model-tiers");
     const { getModelRegistry } = require("../routing/model-registry");
-    const analysis = analyzeComplexity(req.body, { weighted: req.query.weighted === "true" });
+    const analysis = await analyzeComplexity(req.body, { weighted: req.query.weighted === "true" });
     const agentic = getAgenticDetector().detect(req.body);
     const selector = getModelTierSelector();
     const tier = selector.getTier(analysis.score);
@@ -210,13 +210,17 @@ router.post("/api/event_logging/batch", (req, res) => {
 router.post("/v1/messages", rateLimiter, async (req, res, next) => {
   try {
+    const { createTimer } = require("../utils/perf-timer");
+    const timer = createTimer("POST /v1/messages");
     metrics.recordRequest();
     // Support both query parameter (?stream=true) and body parameter ({"stream": true})
     const wantsStream = Boolean(req.query?.stream === 'true' || req.body?.stream);
     const hasTools = Array.isArray(req.body?.tools) && req.body.tools.length > 0;
+    timer.mark("parseRequest");
     // Analyze complexity for routing headers (Phase 3)
-    const complexity = analyzeComplexity(req.body);
+    const complexity = await analyzeComplexity(req.body);
+    timer.mark("analyzeComplexity");
     let preRouteProvider = 'cloud';
     if (complexity.recommendation === 'local') {
       // Use tier config to determine actual provider instead of hardcoding 'ollama'
@@ -430,6 +434,7 @@ router.post("/v1/messages", rateLimiter, async (req, res, next) => {
     }
     // Non-streaming or tool-based requests (buffered path)
+    timer.mark("preProcessMessage");
     const result = await processMessage({
       payload: req.body,
       headers: req.headers,
@@ -440,6 +445,8 @@ router.post("/v1/messages", rateLimiter, async (req, res, next) => {
         maxDurationMs: req.body?.max_duration_ms,
       },
     });
+    timer.mark("processMessage");
+    timer.done();
     // Legacy streaming wrapper (for tool-based requests that requested streaming)
     if (wantsStream && hasTools) {