@agentlensai/server 0.11.0 → 0.13.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +21 -0
- package/dist/cloud/auth/rbac.d.ts +1 -1
- package/dist/cloud/auth/rbac.d.ts.map +1 -1
- package/dist/cloud/auth/rbac.js +2 -2
- package/dist/cloud/auth/rbac.js.map +1 -1
- package/dist/cloud/billing/stripe-client.d.ts.map +1 -1
- package/dist/cloud/billing/stripe-client.js +6 -1
- package/dist/cloud/billing/stripe-client.js.map +1 -1
- package/dist/cloud/ingestion/gateway.d.ts.map +1 -1
- package/dist/cloud/ingestion/gateway.js +0 -1
- package/dist/cloud/ingestion/gateway.js.map +1 -1
- package/dist/cloud/middleware/validate-org-access.d.ts +14 -0
- package/dist/cloud/middleware/validate-org-access.d.ts.map +1 -0
- package/dist/cloud/middleware/validate-org-access.js +38 -0
- package/dist/cloud/middleware/validate-org-access.js.map +1 -0
- package/dist/cloud/routes/index.d.ts +13 -0
- package/dist/cloud/routes/index.d.ts.map +1 -0
- package/dist/cloud/routes/index.js +98 -0
- package/dist/cloud/routes/index.js.map +1 -0
- package/dist/config.d.ts +33 -1
- package/dist/config.d.ts.map +1 -1
- package/dist/config.js +71 -1
- package/dist/config.js.map +1 -1
- package/dist/db/api-key-lookup.d.ts +25 -0
- package/dist/db/api-key-lookup.d.ts.map +1 -0
- package/dist/db/api-key-lookup.js +38 -0
- package/dist/db/api-key-lookup.js.map +1 -0
- package/dist/db/connection.postgres.d.ts +44 -0
- package/dist/db/connection.postgres.d.ts.map +1 -0
- package/dist/db/connection.postgres.js +79 -0
- package/dist/db/connection.postgres.js.map +1 -0
- package/dist/db/cost-budget-store.d.ts +30 -0
- package/dist/db/cost-budget-store.d.ts.map +1 -0
- package/dist/db/cost-budget-store.js +201 -0
- package/dist/db/cost-budget-store.js.map +1 -0
- package/dist/db/drizzle/0000_initial.sql +336 -0
- package/dist/db/drizzle/0001_indexes.sql +20 -0
- package/dist/db/drizzle/0002_pgvector.sql +19 -0
- package/dist/db/drizzle/drizzle/0000_initial.sql +336 -0
- package/dist/db/drizzle/drizzle/0001_indexes.sql +20 -0
- package/dist/db/drizzle/drizzle/0002_pgvector.sql +19 -0
- package/dist/db/drizzle/drizzle/meta/0000_snapshot.json +2593 -0
- package/dist/db/drizzle/drizzle/meta/_journal.json +27 -0
- package/dist/db/drizzle/meta/0000_snapshot.json +2593 -0
- package/dist/db/drizzle/meta/_journal.json +27 -0
- package/dist/db/embedding-store.d.ts +2 -1
- package/dist/db/embedding-store.d.ts.map +1 -1
- package/dist/db/embedding-store.interface.d.ts +19 -0
- package/dist/db/embedding-store.interface.d.ts.map +1 -0
- package/dist/db/embedding-store.interface.js +7 -0
- package/dist/db/embedding-store.interface.js.map +1 -0
- package/dist/db/embedding-store.js +3 -1
- package/dist/db/embedding-store.js.map +1 -1
- package/dist/db/eval-store.d.ts +88 -0
- package/dist/db/eval-store.d.ts.map +1 -0
- package/dist/db/eval-store.js +408 -0
- package/dist/db/eval-store.js.map +1 -0
- package/dist/db/guardrail-store.d.ts +9 -0
- package/dist/db/guardrail-store.d.ts.map +1 -1
- package/dist/db/guardrail-store.js +57 -3
- package/dist/db/guardrail-store.js.map +1 -1
- package/dist/db/index.d.ts +7 -0
- package/dist/db/index.d.ts.map +1 -1
- package/dist/db/index.js +4 -12
- package/dist/db/index.js.map +1 -1
- package/dist/db/migrate.d.ts +5 -22
- package/dist/db/migrate.d.ts.map +1 -1
- package/dist/db/migrate.js +7 -637
- package/dist/db/migrate.js.map +1 -1
- package/dist/db/migrate.postgres.d.ts +16 -0
- package/dist/db/migrate.postgres.d.ts.map +1 -0
- package/dist/db/migrate.postgres.js +23 -0
- package/dist/db/migrate.postgres.js.map +1 -0
- package/dist/db/migrate.sqlite.d.ts +26 -0
- package/dist/db/migrate.sqlite.d.ts.map +1 -0
- package/dist/db/migrate.sqlite.js +920 -0
- package/dist/db/migrate.sqlite.js.map +1 -0
- package/dist/db/postgres-embedding-store.d.ts +23 -0
- package/dist/db/postgres-embedding-store.d.ts.map +1 -0
- package/dist/db/postgres-embedding-store.js +218 -0
- package/dist/db/postgres-embedding-store.js.map +1 -0
- package/dist/db/postgres-store.d.ts +80 -0
- package/dist/db/postgres-store.d.ts.map +1 -0
- package/dist/db/postgres-store.js +910 -0
- package/dist/db/postgres-store.js.map +1 -0
- package/dist/db/prompt-store.d.ts +57 -0
- package/dist/db/prompt-store.d.ts.map +1 -0
- package/dist/db/prompt-store.js +300 -0
- package/dist/db/prompt-store.js.map +1 -0
- package/dist/db/repositories/agent-repository.d.ts +21 -0
- package/dist/db/repositories/agent-repository.d.ts.map +1 -0
- package/dist/db/repositories/agent-repository.js +142 -0
- package/dist/db/repositories/agent-repository.js.map +1 -0
- package/dist/db/repositories/alert-repository.d.ts +27 -0
- package/dist/db/repositories/alert-repository.d.ts.map +1 -0
- package/dist/db/repositories/alert-repository.js +164 -0
- package/dist/db/repositories/alert-repository.js.map +1 -0
- package/dist/db/repositories/analytics-repository.d.ts +24 -0
- package/dist/db/repositories/analytics-repository.d.ts.map +1 -0
- package/dist/db/repositories/analytics-repository.js +147 -0
- package/dist/db/repositories/analytics-repository.js.map +1 -0
- package/dist/db/repositories/event-repository.d.ts +81 -0
- package/dist/db/repositories/event-repository.d.ts.map +1 -0
- package/dist/db/repositories/event-repository.js +331 -0
- package/dist/db/repositories/event-repository.js.map +1 -0
- package/dist/db/repositories/notification-channel-repository.d.ts +28 -0
- package/dist/db/repositories/notification-channel-repository.d.ts.map +1 -0
- package/dist/db/repositories/notification-channel-repository.js +151 -0
- package/dist/db/repositories/notification-channel-repository.js.map +1 -0
- package/dist/db/repositories/session-repository.d.ts +26 -0
- package/dist/db/repositories/session-repository.d.ts.map +1 -0
- package/dist/db/repositories/session-repository.js +240 -0
- package/dist/db/repositories/session-repository.js.map +1 -0
- package/dist/db/schema.postgres.d.ts +4681 -0
- package/dist/db/schema.postgres.d.ts.map +1 -0
- package/dist/db/schema.postgres.js +458 -0
- package/dist/db/schema.postgres.js.map +1 -0
- package/dist/db/schema.sqlite.d.ts +2221 -671
- package/dist/db/schema.sqlite.d.ts.map +1 -1
- package/dist/db/schema.sqlite.js +137 -2
- package/dist/db/schema.sqlite.js.map +1 -1
- package/dist/db/services/retention-service.d.ts +13 -0
- package/dist/db/services/retention-service.d.ts.map +1 -0
- package/dist/db/services/retention-service.js +48 -0
- package/dist/db/services/retention-service.js.map +1 -0
- package/dist/db/shared/query-helpers.d.ts +32 -0
- package/dist/db/shared/query-helpers.d.ts.map +1 -0
- package/dist/db/shared/query-helpers.js +180 -0
- package/dist/db/shared/query-helpers.js.map +1 -0
- package/dist/db/sqlite-store.d.ts +48 -55
- package/dist/db/sqlite-store.d.ts.map +1 -1
- package/dist/db/sqlite-store.js +78 -945
- package/dist/db/sqlite-store.js.map +1 -1
- package/dist/db/tenant-scoped-store.d.ts +18 -1
- package/dist/db/tenant-scoped-store.d.ts.map +1 -1
- package/dist/db/tenant-scoped-store.js +6 -0
- package/dist/db/tenant-scoped-store.js.map +1 -1
- package/dist/index.d.ts +28 -14
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +432 -97
- package/dist/index.js.map +1 -1
- package/dist/lib/alert-engine.d.ts +10 -0
- package/dist/lib/alert-engine.d.ts.map +1 -1
- package/dist/lib/alert-engine.js +73 -20
- package/dist/lib/alert-engine.js.map +1 -1
- package/dist/lib/audit-verify.d.ts +40 -0
- package/dist/lib/audit-verify.d.ts.map +1 -0
- package/dist/lib/audit-verify.js +128 -0
- package/dist/lib/audit-verify.js.map +1 -0
- package/dist/lib/audit.d.ts +37 -0
- package/dist/lib/audit.d.ts.map +1 -0
- package/dist/lib/audit.js +59 -0
- package/dist/lib/audit.js.map +1 -0
- package/dist/lib/budget-engine.d.ts +26 -0
- package/dist/lib/budget-engine.d.ts.map +1 -0
- package/dist/lib/budget-engine.js +201 -0
- package/dist/lib/budget-engine.js.map +1 -0
- package/dist/lib/compliance-export.d.ts +41 -0
- package/dist/lib/compliance-export.d.ts.map +1 -0
- package/dist/lib/compliance-export.js +124 -0
- package/dist/lib/compliance-export.js.map +1 -0
- package/dist/lib/compliance-report.d.ts +87 -0
- package/dist/lib/compliance-report.d.ts.map +1 -0
- package/dist/lib/compliance-report.js +148 -0
- package/dist/lib/compliance-report.js.map +1 -0
- package/dist/lib/context/retrieval.d.ts +5 -3
- package/dist/lib/context/retrieval.d.ts.map +1 -1
- package/dist/lib/context/retrieval.js +5 -2
- package/dist/lib/context/retrieval.js.map +1 -1
- package/dist/lib/cost-anomaly-detector.d.ts +23 -0
- package/dist/lib/cost-anomaly-detector.d.ts.map +1 -0
- package/dist/lib/cost-anomaly-detector.js +108 -0
- package/dist/lib/cost-anomaly-detector.js.map +1 -0
- package/dist/lib/db-resilience.d.ts +15 -0
- package/dist/lib/db-resilience.d.ts.map +1 -0
- package/dist/lib/db-resilience.js +49 -0
- package/dist/lib/db-resilience.js.map +1 -0
- package/dist/lib/diagnostics/cache.d.ts +29 -0
- package/dist/lib/diagnostics/cache.d.ts.map +1 -0
- package/dist/lib/diagnostics/cache.js +88 -0
- package/dist/lib/diagnostics/cache.js.map +1 -0
- package/dist/lib/diagnostics/context-builder.d.ts +41 -0
- package/dist/lib/diagnostics/context-builder.d.ts.map +1 -0
- package/dist/lib/diagnostics/context-builder.js +135 -0
- package/dist/lib/diagnostics/context-builder.js.map +1 -0
- package/dist/lib/diagnostics/index.d.ts +34 -0
- package/dist/lib/diagnostics/index.d.ts.map +1 -0
- package/dist/lib/diagnostics/index.js +223 -0
- package/dist/lib/diagnostics/index.js.map +1 -0
- package/dist/lib/diagnostics/llm-client.d.ts +24 -0
- package/dist/lib/diagnostics/llm-client.d.ts.map +1 -0
- package/dist/lib/diagnostics/llm-client.js +42 -0
- package/dist/lib/diagnostics/llm-client.js.map +1 -0
- package/dist/lib/diagnostics/prompt-templates.d.ts +18 -0
- package/dist/lib/diagnostics/prompt-templates.d.ts.map +1 -0
- package/dist/lib/diagnostics/prompt-templates.js +144 -0
- package/dist/lib/diagnostics/prompt-templates.js.map +1 -0
- package/dist/lib/diagnostics/providers/anthropic.d.ts +8 -0
- package/dist/lib/diagnostics/providers/anthropic.d.ts.map +1 -0
- package/dist/lib/diagnostics/providers/anthropic.js +79 -0
- package/dist/lib/diagnostics/providers/anthropic.js.map +1 -0
- package/dist/lib/diagnostics/providers/openai.d.ts +8 -0
- package/dist/lib/diagnostics/providers/openai.d.ts.map +1 -0
- package/dist/lib/diagnostics/providers/openai.js +70 -0
- package/dist/lib/diagnostics/providers/openai.js.map +1 -0
- package/dist/lib/diagnostics/providers/types.d.ts +23 -0
- package/dist/lib/diagnostics/providers/types.d.ts.map +1 -0
- package/dist/lib/diagnostics/providers/types.js +5 -0
- package/dist/lib/diagnostics/providers/types.js.map +1 -0
- package/dist/lib/diagnostics/response-parser.d.ts +60 -0
- package/dist/lib/diagnostics/response-parser.d.ts.map +1 -0
- package/dist/lib/diagnostics/response-parser.js +55 -0
- package/dist/lib/diagnostics/response-parser.js.map +1 -0
- package/dist/lib/diagnostics/types.d.ts +60 -0
- package/dist/lib/diagnostics/types.d.ts.map +1 -0
- package/dist/lib/diagnostics/types.js +7 -0
- package/dist/lib/diagnostics/types.js.map +1 -0
- package/dist/lib/embeddings/index.d.ts +6 -3
- package/dist/lib/embeddings/index.d.ts.map +1 -1
- package/dist/lib/embeddings/index.js +7 -15
- package/dist/lib/embeddings/index.js.map +1 -1
- package/dist/lib/embeddings/worker.d.ts +2 -2
- package/dist/lib/embeddings/worker.d.ts.map +1 -1
- package/dist/lib/embeddings/worker.js +3 -1
- package/dist/lib/embeddings/worker.js.map +1 -1
- package/dist/lib/error-sanitizer.d.ts +28 -0
- package/dist/lib/error-sanitizer.d.ts.map +1 -0
- package/dist/lib/error-sanitizer.js +106 -0
- package/dist/lib/error-sanitizer.js.map +1 -0
- package/dist/lib/eval/index.d.ts +15 -0
- package/dist/lib/eval/index.d.ts.map +1 -0
- package/dist/lib/eval/index.js +24 -0
- package/dist/lib/eval/index.js.map +1 -0
- package/dist/lib/eval/runner.d.ts +28 -0
- package/dist/lib/eval/runner.d.ts.map +1 -0
- package/dist/lib/eval/runner.js +260 -0
- package/dist/lib/eval/runner.js.map +1 -0
- package/dist/lib/eval/scorers/contains.d.ts +10 -0
- package/dist/lib/eval/scorers/contains.d.ts.map +1 -0
- package/dist/lib/eval/scorers/contains.js +33 -0
- package/dist/lib/eval/scorers/contains.js.map +1 -0
- package/dist/lib/eval/scorers/exact-match.d.ts +10 -0
- package/dist/lib/eval/scorers/exact-match.d.ts.map +1 -0
- package/dist/lib/eval/scorers/exact-match.js +33 -0
- package/dist/lib/eval/scorers/exact-match.js.map +1 -0
- package/dist/lib/eval/scorers/index.d.ts +20 -0
- package/dist/lib/eval/scorers/index.d.ts.map +1 -0
- package/dist/lib/eval/scorers/index.js +19 -0
- package/dist/lib/eval/scorers/index.js.map +1 -0
- package/dist/lib/eval/scorers/llm-judge.d.ts +22 -0
- package/dist/lib/eval/scorers/llm-judge.d.ts.map +1 -0
- package/dist/lib/eval/scorers/llm-judge.js +79 -0
- package/dist/lib/eval/scorers/llm-judge.js.map +1 -0
- package/dist/lib/eval/scorers/regex.d.ts +10 -0
- package/dist/lib/eval/scorers/regex.d.ts.map +1 -0
- package/dist/lib/eval/scorers/regex.js +36 -0
- package/dist/lib/eval/scorers/regex.js.map +1 -0
- package/dist/lib/guardrails/actions.d.ts +6 -0
- package/dist/lib/guardrails/actions.d.ts.map +1 -1
- package/dist/lib/guardrails/actions.js +82 -0
- package/dist/lib/guardrails/actions.js.map +1 -1
- package/dist/lib/guardrails/conditions.d.ts +47 -0
- package/dist/lib/guardrails/conditions.d.ts.map +1 -1
- package/dist/lib/guardrails/conditions.js +55 -10
- package/dist/lib/guardrails/conditions.js.map +1 -1
- package/dist/lib/guardrails/content-engine.d.ts +19 -0
- package/dist/lib/guardrails/content-engine.d.ts.map +1 -0
- package/dist/lib/guardrails/content-engine.js +154 -0
- package/dist/lib/guardrails/content-engine.js.map +1 -0
- package/dist/lib/guardrails/engine.d.ts +33 -0
- package/dist/lib/guardrails/engine.d.ts.map +1 -1
- package/dist/lib/guardrails/engine.js +37 -2
- package/dist/lib/guardrails/engine.js.map +1 -1
- package/dist/lib/guardrails/scanners/base-scanner.d.ts +23 -0
- package/dist/lib/guardrails/scanners/base-scanner.d.ts.map +1 -0
- package/dist/lib/guardrails/scanners/base-scanner.js +7 -0
- package/dist/lib/guardrails/scanners/base-scanner.js.map +1 -0
- package/dist/lib/guardrails/scanners/patterns/pii-patterns.d.ts +13 -0
- package/dist/lib/guardrails/scanners/patterns/pii-patterns.d.ts.map +1 -0
- package/dist/lib/guardrails/scanners/patterns/pii-patterns.js +49 -0
- package/dist/lib/guardrails/scanners/patterns/pii-patterns.js.map +1 -0
- package/dist/lib/guardrails/scanners/patterns/secret-patterns.d.ts +6 -0
- package/dist/lib/guardrails/scanners/patterns/secret-patterns.d.ts.map +1 -0
- package/dist/lib/guardrails/scanners/patterns/secret-patterns.js +69 -0
- package/dist/lib/guardrails/scanners/patterns/secret-patterns.js.map +1 -0
- package/dist/lib/guardrails/scanners/pii-scanner.d.ts +10 -0
- package/dist/lib/guardrails/scanners/pii-scanner.d.ts.map +1 -0
- package/dist/lib/guardrails/scanners/pii-scanner.js +57 -0
- package/dist/lib/guardrails/scanners/pii-scanner.js.map +1 -0
- package/dist/lib/guardrails/scanners/scanner-registry.d.ts +14 -0
- package/dist/lib/guardrails/scanners/scanner-registry.d.ts.map +1 -0
- package/dist/lib/guardrails/scanners/scanner-registry.js +51 -0
- package/dist/lib/guardrails/scanners/scanner-registry.js.map +1 -0
- package/dist/lib/guardrails/scanners/secrets-scanner.d.ts +9 -0
- package/dist/lib/guardrails/scanners/secrets-scanner.d.ts.map +1 -0
- package/dist/lib/guardrails/scanners/secrets-scanner.js +47 -0
- package/dist/lib/guardrails/scanners/secrets-scanner.js.map +1 -0
- package/dist/lib/logger.d.ts +8 -0
- package/dist/lib/logger.d.ts.map +1 -0
- package/dist/lib/logger.js +31 -0
- package/dist/lib/logger.js.map +1 -0
- package/dist/lib/lore-client.d.ts +128 -0
- package/dist/lib/lore-client.d.ts.map +1 -0
- package/dist/lib/lore-client.js +188 -0
- package/dist/lib/lore-client.js.map +1 -0
- package/dist/lib/mesh-client.d.ts +31 -0
- package/dist/lib/mesh-client.d.ts.map +1 -0
- package/dist/lib/mesh-client.js +72 -0
- package/dist/lib/mesh-client.js.map +1 -0
- package/dist/lib/notifications/grouping-buffer.d.ts +25 -0
- package/dist/lib/notifications/grouping-buffer.d.ts.map +1 -0
- package/dist/lib/notifications/grouping-buffer.js +73 -0
- package/dist/lib/notifications/grouping-buffer.js.map +1 -0
- package/dist/lib/notifications/provider.d.ts +10 -0
- package/dist/lib/notifications/provider.d.ts.map +1 -0
- package/dist/lib/notifications/provider.js +5 -0
- package/dist/lib/notifications/provider.js.map +1 -0
- package/dist/lib/notifications/providers/email.d.ts +14 -0
- package/dist/lib/notifications/providers/email.d.ts.map +1 -0
- package/dist/lib/notifications/providers/email.js +88 -0
- package/dist/lib/notifications/providers/email.js.map +1 -0
- package/dist/lib/notifications/providers/pagerduty.d.ts +16 -0
- package/dist/lib/notifications/providers/pagerduty.d.ts.map +1 -0
- package/dist/lib/notifications/providers/pagerduty.js +94 -0
- package/dist/lib/notifications/providers/pagerduty.js.map +1 -0
- package/dist/lib/notifications/providers/slack.d.ts +14 -0
- package/dist/lib/notifications/providers/slack.d.ts.map +1 -0
- package/dist/lib/notifications/providers/slack.js +106 -0
- package/dist/lib/notifications/providers/slack.js.map +1 -0
- package/dist/lib/notifications/providers/webhook.d.ts +16 -0
- package/dist/lib/notifications/providers/webhook.d.ts.map +1 -0
- package/dist/lib/notifications/providers/webhook.js +78 -0
- package/dist/lib/notifications/providers/webhook.js.map +1 -0
- package/dist/lib/notifications/router.d.ts +30 -0
- package/dist/lib/notifications/router.d.ts.map +1 -0
- package/dist/lib/notifications/router.js +137 -0
- package/dist/lib/notifications/router.js.map +1 -0
- package/dist/lib/notifications/ssrf.d.ts +13 -0
- package/dist/lib/notifications/ssrf.d.ts.map +1 -0
- package/dist/lib/notifications/ssrf.js +37 -0
- package/dist/lib/notifications/ssrf.js.map +1 -0
- package/dist/lib/optimization/analyzers/model-downgrade.d.ts +15 -0
- package/dist/lib/optimization/analyzers/model-downgrade.d.ts.map +1 -0
- package/dist/lib/optimization/analyzers/model-downgrade.js +58 -0
- package/dist/lib/optimization/analyzers/model-downgrade.js.map +1 -0
- package/dist/lib/optimization/analyzers/prompt-optimization.d.ts +17 -0
- package/dist/lib/optimization/analyzers/prompt-optimization.d.ts.map +1 -0
- package/dist/lib/optimization/analyzers/prompt-optimization.js +160 -0
- package/dist/lib/optimization/analyzers/prompt-optimization.js.map +1 -0
- package/dist/lib/optimization/analyzers/types.d.ts +23 -0
- package/dist/lib/optimization/analyzers/types.d.ts.map +1 -0
- package/dist/lib/optimization/analyzers/types.js +5 -0
- package/dist/lib/optimization/analyzers/types.js.map +1 -0
- package/dist/lib/optimization/classifier.d.ts +4 -3
- package/dist/lib/optimization/classifier.d.ts.map +1 -1
- package/dist/lib/optimization/classifier.js +15 -9
- package/dist/lib/optimization/classifier.js.map +1 -1
- package/dist/lib/optimization/cost-optimizer.d.ts +21 -0
- package/dist/lib/optimization/cost-optimizer.d.ts.map +1 -0
- package/dist/lib/optimization/cost-optimizer.js +114 -0
- package/dist/lib/optimization/cost-optimizer.js.map +1 -0
- package/dist/lib/optimization/engine.d.ts.map +1 -1
- package/dist/lib/optimization/engine.js +45 -6
- package/dist/lib/optimization/engine.js.map +1 -1
- package/dist/lib/optimization/forecast.d.ts +39 -0
- package/dist/lib/optimization/forecast.d.ts.map +1 -0
- package/dist/lib/optimization/forecast.js +128 -0
- package/dist/lib/optimization/forecast.js.map +1 -0
- package/dist/lib/secrets.d.ts +30 -0
- package/dist/lib/secrets.d.ts.map +1 -0
- package/dist/lib/secrets.js +103 -0
- package/dist/lib/secrets.js.map +1 -0
- package/dist/lib/threshold-monitor.d.ts +53 -0
- package/dist/lib/threshold-monitor.d.ts.map +1 -0
- package/dist/lib/threshold-monitor.js +112 -0
- package/dist/lib/threshold-monitor.js.map +1 -0
- package/dist/middleware/audit.d.ts +16 -0
- package/dist/middleware/audit.d.ts.map +1 -0
- package/dist/middleware/audit.js +16 -0
- package/dist/middleware/audit.js.map +1 -0
- package/dist/middleware/auth-errors.d.ts +67 -0
- package/dist/middleware/auth-errors.d.ts.map +1 -0
- package/dist/middleware/auth-errors.js +84 -0
- package/dist/middleware/auth-errors.js.map +1 -0
- package/dist/middleware/auth.d.ts +5 -2
- package/dist/middleware/auth.d.ts.map +1 -1
- package/dist/middleware/auth.js +44 -17
- package/dist/middleware/auth.js.map +1 -1
- package/dist/middleware/body-limit.d.ts +9 -0
- package/dist/middleware/body-limit.d.ts.map +1 -0
- package/dist/middleware/body-limit.js +15 -0
- package/dist/middleware/body-limit.js.map +1 -0
- package/dist/middleware/cors-config.d.ts +30 -0
- package/dist/middleware/cors-config.d.ts.map +1 -0
- package/dist/middleware/cors-config.js +55 -0
- package/dist/middleware/cors-config.js.map +1 -0
- package/dist/middleware/rate-limit.d.ts +9 -0
- package/dist/middleware/rate-limit.d.ts.map +1 -0
- package/dist/middleware/rate-limit.js +56 -0
- package/dist/middleware/rate-limit.js.map +1 -0
- package/dist/middleware/rbac.d.ts +30 -0
- package/dist/middleware/rbac.d.ts.map +1 -0
- package/dist/middleware/rbac.js +87 -0
- package/dist/middleware/rbac.js.map +1 -0
- package/dist/middleware/security-headers.d.ts +12 -0
- package/dist/middleware/security-headers.d.ts.map +1 -0
- package/dist/middleware/security-headers.js +57 -0
- package/dist/middleware/security-headers.js.map +1 -0
- package/dist/middleware/unified-auth.d.ts +49 -0
- package/dist/middleware/unified-auth.d.ts.map +1 -0
- package/dist/middleware/unified-auth.js +246 -0
- package/dist/middleware/unified-auth.js.map +1 -0
- package/dist/middleware/validation.d.ts +31 -0
- package/dist/middleware/validation.d.ts.map +1 -0
- package/dist/middleware/validation.js +45 -0
- package/dist/middleware/validation.js.map +1 -0
- package/dist/routes/alerts.d.ts.map +1 -1
- package/dist/routes/alerts.js +4 -3
- package/dist/routes/alerts.js.map +1 -1
- package/dist/routes/analytics.d.ts +2 -1
- package/dist/routes/analytics.d.ts.map +1 -1
- package/dist/routes/analytics.js +175 -95
- package/dist/routes/analytics.js.map +1 -1
- package/dist/routes/api-keys.d.ts +5 -0
- package/dist/routes/api-keys.d.ts.map +1 -1
- package/dist/routes/api-keys.js +89 -8
- package/dist/routes/api-keys.js.map +1 -1
- package/dist/routes/audit-verify.d.ts +12 -0
- package/dist/routes/audit-verify.d.ts.map +1 -0
- package/dist/routes/audit-verify.js +73 -0
- package/dist/routes/audit-verify.js.map +1 -0
- package/dist/routes/audit.d.ts +4 -6
- package/dist/routes/audit.d.ts.map +1 -1
- package/dist/routes/audit.js +54 -157
- package/dist/routes/audit.js.map +1 -1
- package/dist/routes/auth.d.ts +21 -0
- package/dist/routes/auth.d.ts.map +1 -0
- package/dist/routes/auth.js +235 -0
- package/dist/routes/auth.js.map +1 -0
- package/dist/routes/benchmarks.d.ts.map +1 -1
- package/dist/routes/benchmarks.js +63 -11
- package/dist/routes/benchmarks.js.map +1 -1
- package/dist/routes/capabilities-top.d.ts.map +1 -1
- package/dist/routes/capabilities-top.js +1 -4
- package/dist/routes/capabilities-top.js.map +1 -1
- package/dist/routes/capabilities.d.ts.map +1 -1
- package/dist/routes/capabilities.js +1 -7
- package/dist/routes/capabilities.js.map +1 -1
- package/dist/routes/compliance.d.ts +17 -0
- package/dist/routes/compliance.d.ts.map +1 -0
- package/dist/routes/compliance.js +151 -0
- package/dist/routes/compliance.js.map +1 -0
- package/dist/routes/config.d.ts +1 -13
- package/dist/routes/config.d.ts.map +1 -1
- package/dist/routes/context.d.ts.map +1 -1
- package/dist/routes/context.js +6 -5
- package/dist/routes/context.js.map +1 -1
- package/dist/routes/cost-budgets.d.ts +20 -0
- package/dist/routes/cost-budgets.d.ts.map +1 -0
- package/dist/routes/cost-budgets.js +194 -0
- package/dist/routes/cost-budgets.js.map +1 -0
- package/dist/routes/delegation.d.ts.map +1 -1
- package/dist/routes/delegation.js +67 -41
- package/dist/routes/delegation.js.map +1 -1
- package/dist/routes/delegations-top.d.ts.map +1 -1
- package/dist/routes/delegations-top.js +1 -3
- package/dist/routes/delegations-top.js.map +1 -1
- package/dist/routes/diagnose.d.ts +16 -0
- package/dist/routes/diagnose.d.ts.map +1 -0
- package/dist/routes/diagnose.js +82 -0
- package/dist/routes/diagnose.js.map +1 -0
- package/dist/routes/discovery.d.ts.map +1 -1
- package/dist/routes/discovery.js +50 -38
- package/dist/routes/discovery.js.map +1 -1
- package/dist/routes/eval.d.ts +24 -0
- package/dist/routes/eval.d.ts.map +1 -0
- package/dist/routes/eval.js +281 -0
- package/dist/routes/eval.js.map +1 -0
- package/dist/routes/events.d.ts.map +1 -1
- package/dist/routes/events.js +11 -6
- package/dist/routes/events.js.map +1 -1
- package/dist/routes/guardrails.d.ts +2 -1
- package/dist/routes/guardrails.d.ts.map +1 -1
- package/dist/routes/guardrails.js +85 -14
- package/dist/routes/guardrails.js.map +1 -1
- package/dist/routes/health.d.ts +14 -11
- package/dist/routes/health.d.ts.map +1 -1
- package/dist/routes/health.js +181 -61
- package/dist/routes/health.js.map +1 -1
- package/dist/routes/lore-proxy.d.ts +13 -0
- package/dist/routes/lore-proxy.d.ts.map +1 -0
- package/dist/routes/lore-proxy.js +229 -0
- package/dist/routes/lore-proxy.js.map +1 -0
- package/dist/routes/mesh-proxy.d.ts +7 -0
- package/dist/routes/mesh-proxy.d.ts.map +1 -0
- package/dist/routes/mesh-proxy.js +94 -0
- package/dist/routes/mesh-proxy.js.map +1 -0
- package/dist/routes/notifications.d.ts +19 -0
- package/dist/routes/notifications.d.ts.map +1 -0
- package/dist/routes/notifications.js +129 -0
- package/dist/routes/notifications.js.map +1 -0
- package/dist/routes/optimize.d.ts.map +1 -1
- package/dist/routes/optimize.js +44 -0
- package/dist/routes/optimize.js.map +1 -1
- package/dist/routes/otlp.d.ts +17 -0
- package/dist/routes/otlp.d.ts.map +1 -0
- package/dist/routes/otlp.js +544 -0
- package/dist/routes/otlp.js.map +1 -0
- package/dist/routes/prompts.d.ts +21 -0
- package/dist/routes/prompts.d.ts.map +1 -0
- package/dist/routes/prompts.js +173 -0
- package/dist/routes/prompts.js.map +1 -0
- package/dist/routes/recall.d.ts.map +1 -1
- package/dist/routes/recall.js +6 -4
- package/dist/routes/recall.js.map +1 -1
- package/dist/routes/replay.d.ts.map +1 -1
- package/dist/routes/replay.js +2 -1
- package/dist/routes/replay.js.map +1 -1
- package/dist/routes/server-info.d.ts +9 -0
- package/dist/routes/server-info.d.ts.map +1 -0
- package/dist/routes/server-info.js +18 -0
- package/dist/routes/server-info.js.map +1 -0
- package/dist/routes/sessions.d.ts +7 -7
- package/dist/routes/sessions.d.ts.map +1 -1
- package/dist/routes/sessions.js +112 -35
- package/dist/routes/sessions.js.map +1 -1
- package/dist/routes/stats.d.ts.map +1 -1
- package/dist/routes/stats.js +40 -0
- package/dist/routes/stats.js.map +1 -1
- package/dist/routes/stream.d.ts +2 -2
- package/dist/routes/stream.d.ts.map +1 -1
- package/dist/routes/stream.js +7 -11
- package/dist/routes/stream.js.map +1 -1
- package/dist/routes/tenant-helper.d.ts +15 -10
- package/dist/routes/tenant-helper.d.ts.map +1 -1
- package/dist/routes/tenant-helper.js +36 -22
- package/dist/routes/tenant-helper.js.map +1 -1
- package/dist/routes/trust.d.ts.map +1 -1
- package/dist/routes/trust.js +1 -3
- package/dist/routes/trust.js.map +1 -1
- package/dist/schemas/api-keys.d.ts +11 -0
- package/dist/schemas/api-keys.d.ts.map +1 -0
- package/dist/schemas/api-keys.js +10 -0
- package/dist/schemas/api-keys.js.map +1 -0
- package/dist/schemas/common.d.ts +34 -0
- package/dist/schemas/common.d.ts.map +1 -0
- package/dist/schemas/common.js +43 -0
- package/dist/schemas/common.js.map +1 -0
- package/dist/schemas/delegation.d.ts +23 -0
- package/dist/schemas/delegation.d.ts.map +1 -0
- package/dist/schemas/delegation.js +22 -0
- package/dist/schemas/delegation.js.map +1 -0
- package/dist/schemas/discovery.d.ts +17 -0
- package/dist/schemas/discovery.d.ts.map +1 -0
- package/dist/schemas/discovery.js +15 -0
- package/dist/schemas/discovery.js.map +1 -0
- package/dist/schemas/health.d.ts +75 -0
- package/dist/schemas/health.d.ts.map +1 -0
- package/dist/schemas/health.js +55 -0
- package/dist/schemas/health.js.map +1 -0
- package/dist/schemas/index.d.ts +6 -0
- package/dist/schemas/index.d.ts.map +1 -0
- package/dist/schemas/index.js +6 -0
- package/dist/schemas/index.js.map +1 -0
- package/dist/schemas/sessions.d.ts +67 -0
- package/dist/schemas/sessions.d.ts.map +1 -0
- package/dist/schemas/sessions.js +58 -0
- package/dist/schemas/sessions.js.map +1 -0
- package/dist/services/delegation-service.d.ts +1 -4
- package/dist/services/delegation-service.d.ts.map +1 -1
- package/dist/services/delegation-service.js +5 -31
- package/dist/services/delegation-service.js.map +1 -1
- package/package.json +29 -19
- package/dist/db/lesson-store.d.ts +0 -57
- package/dist/db/lesson-store.d.ts.map +0 -1
- package/dist/db/lesson-store.js +0 -217
- package/dist/db/lesson-store.js.map +0 -1
- package/dist/lib/embeddings/local.d.ts +0 -15
- package/dist/lib/embeddings/local.d.ts.map +0 -1
- package/dist/lib/embeddings/local.js +0 -65
- package/dist/lib/embeddings/local.js.map +0 -1
- package/dist/lib/redaction/human-review-layer.d.ts +0 -37
- package/dist/lib/redaction/human-review-layer.d.ts.map +0 -1
- package/dist/lib/redaction/human-review-layer.js +0 -62
- package/dist/lib/redaction/human-review-layer.js.map +0 -1
- package/dist/lib/redaction/index.d.ts +0 -12
- package/dist/lib/redaction/index.d.ts.map +0 -1
- package/dist/lib/redaction/index.js +0 -12
- package/dist/lib/redaction/index.js.map +0 -1
- package/dist/lib/redaction/pii-detection-layer.d.ts +0 -30
- package/dist/lib/redaction/pii-detection-layer.d.ts.map +0 -1
- package/dist/lib/redaction/pii-detection-layer.js +0 -183
- package/dist/lib/redaction/pii-detection-layer.js.map +0 -1
- package/dist/lib/redaction/pipeline.d.ts +0 -26
- package/dist/lib/redaction/pipeline.d.ts.map +0 -1
- package/dist/lib/redaction/pipeline.js +0 -91
- package/dist/lib/redaction/pipeline.js.map +0 -1
- package/dist/lib/redaction/secret-detection-layer.d.ts +0 -10
- package/dist/lib/redaction/secret-detection-layer.d.ts.map +0 -1
- package/dist/lib/redaction/secret-detection-layer.js +0 -79
- package/dist/lib/redaction/secret-detection-layer.js.map +0 -1
- package/dist/lib/redaction/secret-patterns.d.ts +0 -29
- package/dist/lib/redaction/secret-patterns.d.ts.map +0 -1
- package/dist/lib/redaction/secret-patterns.js +0 -133
- package/dist/lib/redaction/secret-patterns.js.map +0 -1
- package/dist/lib/redaction/semantic-denylist-layer.d.ts +0 -10
- package/dist/lib/redaction/semantic-denylist-layer.d.ts.map +0 -1
- package/dist/lib/redaction/semantic-denylist-layer.js +0 -64
- package/dist/lib/redaction/semantic-denylist-layer.js.map +0 -1
- package/dist/lib/redaction/tenant-deidentification-layer.d.ts +0 -10
- package/dist/lib/redaction/tenant-deidentification-layer.d.ts.map +0 -1
- package/dist/lib/redaction/tenant-deidentification-layer.js +0 -64
- package/dist/lib/redaction/tenant-deidentification-layer.js.map +0 -1
- package/dist/lib/redaction/url-path-scrubbing-layer.d.ts +0 -14
- package/dist/lib/redaction/url-path-scrubbing-layer.d.ts.map +0 -1
- package/dist/lib/redaction/url-path-scrubbing-layer.js +0 -156
- package/dist/lib/redaction/url-path-scrubbing-layer.js.map +0 -1
- package/dist/routes/community.d.ts +0 -24
- package/dist/routes/community.d.ts.map +0 -1
- package/dist/routes/community.js +0 -272
- package/dist/routes/community.js.map +0 -1
- package/dist/routes/lessons.d.ts +0 -19
- package/dist/routes/lessons.d.ts.map +0 -1
- package/dist/routes/lessons.js +0 -164
- package/dist/routes/lessons.js.map +0 -1
- package/dist/routes/redaction-test.d.ts +0 -14
- package/dist/routes/redaction-test.d.ts.map +0 -1
- package/dist/routes/redaction-test.js +0 -33
- package/dist/routes/redaction-test.js.map +0 -1
- package/dist/services/community-service.d.ts +0 -283
- package/dist/services/community-service.d.ts.map +0 -1
- package/dist/services/community-service.js +0 -816
- package/dist/services/community-service.js.map +0 -1
|
@@ -0,0 +1,58 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* ModelDowngradeAnalyzer (Feature 17 — Story 17.2)
|
|
3
|
+
*
|
|
4
|
+
* Wraps the existing OptimizationEngine and maps its CostRecommendation
|
|
5
|
+
* output to EnhancedRecommendation with category 'model_downgrade'.
|
|
6
|
+
*/
|
|
7
|
+
import { DEFAULT_MODEL_COSTS } from '@agentlensai/core';
|
|
8
|
+
import { OptimizationEngine } from '../engine.js';
|
|
9
|
+
import { createHash } from 'node:crypto';
|
|
10
|
+
/**
 * Builds the stable 16-hex-character identifier for a model-downgrade
 * recommendation from the fields that make it unique.
 */
function modelDowngradeId({ agentId, currentModel, recommendedModel, complexityTier }) {
    const hasher = createHash('sha256');
    hasher.update(`model_downgrade:${agentId}:${currentModel}:${recommendedModel}:${complexityTier}`);
    return hasher.digest('hex').slice(0, 16);
}

/**
 * Analyzer that delegates to OptimizationEngine and reshapes each of the
 * engine's recommendations into the enhanced recommendation format with
 * category 'model_downgrade'.
 */
export class ModelDowngradeAnalyzer {
    name = 'model_downgrade';
    engine;

    /**
     * @param modelCosts - Pricing table forwarded to the wrapped OptimizationEngine.
     */
    constructor(modelCosts = DEFAULT_MODEL_COSTS) {
        this.engine = new OptimizationEngine(modelCosts);
    }

    /**
     * Runs the wrapped engine for the agent/period/limit in `ctx` and maps
     * every engine recommendation to an enhanced recommendation.
     *
     * @param ctx - Analyzer context; `store`, `agentId`, `period` and `limit` are read.
     * @returns Promise resolving to one enhanced recommendation per engine recommendation.
     */
    async analyze(ctx) {
        const query = {
            agentId: ctx.agentId,
            period: ctx.period,
            limit: ctx.limit,
        };
        const { recommendations: engineRecs } = await this.engine.getRecommendations(ctx.store, query);
        // One timestamp is shared by every recommendation produced in this run.
        const createdAt = new Date().toISOString();
        return engineRecs.map((rec) => {
            const { currentModel, recommendedModel, complexityTier, callVolume } = rec;
            return {
                id: modelDowngradeId(rec),
                category: 'model_downgrade',
                estimatedMonthlySavings: rec.monthlySavings,
                confidence: rec.confidence,
                difficulty: 'config_change',
                actionableSteps: [
                    `Change model from ${currentModel} to ${recommendedModel} for ${complexityTier} complexity calls`,
                    'Monitor success rate for 48h after switch',
                ],
                agentId: rec.agentId,
                evidence: {
                    callsAnalyzed: callVolume,
                    period: ctx.period,
                },
                createdAt,
                modelDowngrade: {
                    currentModel,
                    recommendedModel,
                    complexityTier,
                    currentCostPerCall: rec.currentCostPerCall,
                    recommendedCostPerCall: rec.recommendedCostPerCall,
                    callVolume,
                    currentSuccessRate: rec.currentSuccessRate,
                    recommendedSuccessRate: rec.recommendedSuccessRate,
                },
            };
        });
    }
}
|
|
58
|
+
//# sourceMappingURL=model-downgrade.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"model-downgrade.js","sourceRoot":"","sources":["../../../../src/lib/optimization/analyzers/model-downgrade.ts"],"names":[],"mappings":"AAAA;;;;;GAKG;AAGH,OAAO,EAAE,mBAAmB,EAAE,MAAM,mBAAmB,CAAC;AACxD,OAAO,EAAE,kBAAkB,EAAE,MAAM,cAAc,CAAC;AAElD,OAAO,EAAE,UAAU,EAAE,MAAM,aAAa,CAAC;AAEzC,MAAM,OAAO,sBAAsB;IACxB,IAAI,GAAG,iBAAiB,CAAC;IAC1B,MAAM,CAAqB;IAEnC,YAAY,aAAyB,mBAAmB;QACtD,IAAI,CAAC,MAAM,GAAG,IAAI,kBAAkB,CAAC,UAAU,CAAC,CAAC;IACnD,CAAC;IAED,KAAK,CAAC,OAAO,CAAC,GAAoB;QAChC,MAAM,MAAM,GAAG,MAAM,IAAI,CAAC,MAAM,CAAC,kBAAkB,CAAC,GAAG,CAAC,KAAK,EAAE;YAC7D,OAAO,EAAE,GAAG,CAAC,OAAO;YACpB,MAAM,EAAE,GAAG,CAAC,MAAM;YAClB,KAAK,EAAE,GAAG,CAAC,KAAK;SACjB,CAAC,CAAC;QAEH,MAAM,GAAG,GAAG,IAAI,IAAI,EAAE,CAAC,WAAW,EAAE,CAAC;QAErC,OAAO,MAAM,CAAC,eAAe,CAAC,GAAG,CAAC,CAAC,GAAG,EAAE,EAAE;YACxC,MAAM,EAAE,GAAG,UAAU,CAAC,QAAQ,CAAC;iBAC5B,MAAM,CAAC,mBAAmB,GAAG,CAAC,OAAO,IAAI,GAAG,CAAC,YAAY,IAAI,GAAG,CAAC,gBAAgB,IAAI,GAAG,CAAC,cAAc,EAAE,CAAC;iBAC1G,MAAM,CAAC,KAAK,CAAC;iBACb,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;YAEhB,OAAO;gBACL,EAAE;gBACF,QAAQ,EAAE,iBAA0B;gBACpC,uBAAuB,EAAE,GAAG,CAAC,cAAc;gBAC3C,UAAU,EAAE,GAAG,CAAC,UAAU;gBAC1B,UAAU,EAAE,eAAwB;gBACpC,eAAe,EAAE;oBACf,qBAAqB,GAAG,CAAC,YAAY,OAAO,GAAG,CAAC,gBAAgB,QAAQ,GAAG,CAAC,cAAc,mBAAmB;oBAC7G,2CAA2C;iBAC5C;gBACD,OAAO,EAAE,GAAG,CAAC,OAAO;gBACpB,QAAQ,EAAE;oBACR,aAAa,EAAE,GAAG,CAAC,UAAU;oBAC7B,MAAM,EAAE,GAAG,CAAC,MAAM;iBACnB;gBACD,SAAS,EAAE,GAAG;gBACd,cAAc,EAAE;oBACd,YAAY,EAAE,GAAG,CAAC,YAAY;oBAC9B,gBAAgB,EAAE,GAAG,CAAC,gBAAgB;oBACtC,cAAc,EAAE,GAAG,CAAC,cAAc;oBAClC,kBAAkB,EAAE,GAAG,CAAC,kBAAkB;oBAC1C,sBAAsB,EAAE,GAAG,CAAC,sBAAsB;oBAClD,UAAU,EAAE,GAAG,CAAC,UAAU;oBAC1B,kBAAkB,EAAE,GAAG,CAAC,kBAAkB;oBAC1C,sBAAsB,EAAE,GAAG,CAAC,sBAAsB;iBACnD;aACF,CAAC;QACJ,CAAC,CAAC,CAAC;IACL,CAAC;CACF"}
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* PromptOptimizationAnalyzer (Feature 17 — Story 17.3)
|
|
3
|
+
*
|
|
4
|
+
* Detects cost-saving opportunities in prompt construction:
|
|
5
|
+
* 1. System prompts exceeding 4,000 tokens (string length ÷ 4 estimation)
|
|
6
|
+
* 2. Repeated context patterns within sessions (>30% shared prefix)
|
|
7
|
+
*/
|
|
8
|
+
import type { ModelCosts, EnhancedRecommendation } from '@agentlensai/core';
|
|
9
|
+
import type { Analyzer, AnalyzerContext } from './types.js';
|
|
10
|
+
/**
 * Analyzer that reports prompt-related savings: oversized system prompts
 * and context that is repeated across calls within a session.
 */
export declare class PromptOptimizationAnalyzer implements Analyzer {
    /** Pricing table supplied at construction time. */
    private readonly modelCosts;
    /** Analyzer identifier. */
    readonly name = "prompt_optimization";
    /**
     * @param modelCosts Optional pricing table; a default table is used when omitted.
     */
    constructor(modelCosts?: ModelCosts);
    /**
     * Inspects the events in `ctx` and resolves to the recommendations found.
     */
    analyze(ctx: AnalyzerContext): Promise<EnhancedRecommendation[]>;
    /** Maps a number of analyzed calls to a confidence label. */
    private determineConfidence;
}
|
|
17
|
+
//# sourceMappingURL=prompt-optimization.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"prompt-optimization.d.ts","sourceRoot":"","sources":["../../../../src/lib/optimization/analyzers/prompt-optimization.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAEH,OAAO,KAAK,EACV,UAAU,EACV,sBAAsB,EAKvB,MAAM,mBAAmB,CAAC;AAE3B,OAAO,KAAK,EAAE,QAAQ,EAAE,eAAe,EAAE,MAAM,YAAY,CAAC;AAM5D,qBAAa,0BAA2B,YAAW,QAAQ;IAG7C,OAAO,CAAC,QAAQ,CAAC,UAAU;IAFvC,QAAQ,CAAC,IAAI,yBAAyB;gBAET,UAAU,GAAE,UAAgC;IAEnE,OAAO,CAAC,GAAG,EAAE,eAAe,GAAG,OAAO,CAAC,sBAAsB,EAAE,CAAC;IA8JtE,OAAO,CAAC,mBAAmB;CAK5B"}
|
|
@@ -0,0 +1,160 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* PromptOptimizationAnalyzer (Feature 17 — Story 17.3)
|
|
3
|
+
*
|
|
4
|
+
* Detects cost-saving opportunities in prompt construction:
|
|
5
|
+
* 1. System prompts exceeding 4,000 tokens (string length ÷ 4 estimation)
|
|
6
|
+
* 2. Repeated context patterns within sessions (>30% shared prefix)
|
|
7
|
+
*/
|
|
8
|
+
import { DEFAULT_MODEL_COSTS, lookupModelCost } from '@agentlensai/core';
|
|
9
|
+
import { createHash } from 'node:crypto';
|
|
10
|
+
/** Median estimated system-prompt size (in tokens) above which a reduction is suggested. */
const SYSTEM_PROMPT_TOKEN_THRESHOLD = 4000;
/** Share of a session's calls that must carry the same prefix to count as repeated context. */
const REPEATED_CONTEXT_RATIO = 0.3;

/**
 * Analyzer that looks for prompt-construction savings in llm_call events:
 *  1. system prompts whose estimated size (string length / 4) exceeds
 *     SYSTEM_PROMPT_TOKEN_THRESHOLD tokens, per (agentId, model) group;
 *  2. sessions in which more than REPEATED_CONTEXT_RATIO of the calls (and at
 *     least three of them) start with the same non-system message prefix.
 */
export class PromptOptimizationAnalyzer {
    modelCosts;
    name = 'prompt_optimization';

    /**
     * @param modelCosts - Pricing table passed to lookupModelCost; defaults to DEFAULT_MODEL_COSTS.
     */
    constructor(modelCosts = DEFAULT_MODEL_COSTS) {
        this.modelCosts = modelCosts;
    }

    /**
     * Scans `ctx.llmCallEvents` and returns prompt-optimization recommendations.
     *
     * Events without a model or without a `messages` array are ignored. When
     * `ctx.period` is not a positive finite number no monthly extrapolation is
     * possible, so an empty list is returned instead of Infinity/NaN savings.
     *
     * @param ctx - Analyzer context; `llmCallEvents` and `period` (days) are read.
     * @returns Promise resolving to the recommendations (possibly empty).
     */
    async analyze(ctx) {
        const recommendations = [];
        const periodDays = Number(ctx.period);
        if (!Number.isFinite(periodDays) || periodDays <= 0) {
            return recommendations;
        }
        // Scale savings observed over `periodDays` to a 30-day month.
        const monthlyFactor = 30 / periodDays;
        const now = new Date().toISOString();
        // Calls grouped by (agentId, model) for the system-prompt size check.
        const groupMap = new Map();
        // Calls grouped by (sessionId, model) for the repeated-context check.
        const sessionCalls = new Map();
        for (const evt of ctx.llmCallEvents) {
            const payload = evt.payload;
            const model = payload?.model;
            if (!model || !Array.isArray(payload.messages)) {
                continue;
            }
            const agentId = evt.agentId;
            const groupKey = `${agentId}::${model}`;
            let group = groupMap.get(groupKey);
            if (!group) {
                group = { agentId, model, systemTokenCounts: [], sessionIds: new Set(), callCount: 0 };
                groupMap.set(groupKey, group);
            }
            group.callCount++;
            if (evt.sessionId) {
                group.sessionIds.add(evt.sessionId);
            }
            const systemMsgs = payload.messages.filter((m) => m.role === 'system');
            if (systemMsgs.length > 0) {
                const totalLen = systemMsgs.reduce((sum, m) => sum + (m.content?.length ?? 0), 0);
                // Rough token estimate: four characters per token.
                group.systemTokenCounts.push(Math.ceil(totalLen / 4));
            }
            if (evt.sessionId) {
                const sessionKey = `${evt.sessionId}::${model}`;
                let sc = sessionCalls.get(sessionKey);
                if (!sc) {
                    // Keep the session id on the record: parsing it back out of the
                    // map key breaks for session ids that themselves contain '::'.
                    sc = { agentId, model, sessionId: evt.sessionId, prefixHashes: [] };
                    sessionCalls.set(sessionKey, sc);
                }
                const nonSystem = payload.messages.filter((m) => m.role !== 'system');
                if (nonSystem.length > 0) {
                    // Fingerprint the first 500 characters of the joined non-system messages.
                    const prefix = nonSystem.map((m) => m.content ?? '').join('|').slice(0, 500);
                    sc.prefixHashes.push(createHash('md5').update(prefix).digest('hex'));
                }
            }
        }
        // Detect large system prompts.
        for (const group of groupMap.values()) {
            if (group.systemTokenCounts.length === 0) {
                continue;
            }
            const sorted = [...group.systemTokenCounts].sort((a, b) => a - b);
            // Upper median for even-sized samples.
            const median = sorted[Math.floor(sorted.length / 2)];
            if (!(median > SYSTEM_PROMPT_TOKEN_THRESHOLD)) {
                continue;
            }
            // Assume half of the excess over the threshold can be trimmed.
            const reducible = Math.floor((median - SYSTEM_PROMPT_TOKEN_THRESHOLD) * 0.5);
            const modelCost = lookupModelCost(group.model, this.modelCosts);
            // Fallback input price when the model is not in the pricing table.
            const inputCostPer1M = modelCost?.input ?? 3;
            const savings = (reducible / 1_000_000) * inputCostPer1M * group.callCount * monthlyFactor;
            if (savings <= 0) {
                continue;
            }
            const id = createHash('sha256')
                .update(`prompt_optimization:system_prompt_size:${group.agentId}:${group.model}`)
                .digest('hex')
                .slice(0, 16);
            recommendations.push({
                id,
                category: 'prompt_optimization',
                estimatedMonthlySavings: Math.round(savings * 1_000_000) / 1_000_000,
                confidence: this.determineConfidence(group.callCount),
                difficulty: 'code_change',
                actionableSteps: [
                    `Reduce system prompt for ${group.model} — median is ~${median} tokens, ${SYSTEM_PROMPT_TOKEN_THRESHOLD} recommended`,
                    'Consider extracting static instructions into a reference doc or using prompt compression',
                ],
                agentId: group.agentId,
                evidence: { callsAnalyzed: group.callCount, period: ctx.period },
                createdAt: now,
                promptOptimization: {
                    targetType: 'system_prompt_size',
                    currentTokens: median,
                    estimatedReducibleTokens: reducible,
                    sampleSessionIds: Array.from(group.sessionIds).slice(0, 3),
                },
            });
        }
        // Detect repeated context within sessions.
        for (const sc of sessionCalls.values()) {
            if (sc.prefixHashes.length < 3) {
                continue;
            }
            // Count how often each prefix fingerprint occurs and keep the maximum.
            const freq = new Map();
            for (const h of sc.prefixHashes) {
                freq.set(h, (freq.get(h) ?? 0) + 1);
            }
            const maxFreq = Math.max(...freq.values());
            const ratio = maxFreq / sc.prefixHashes.length;
            if (!(ratio > REPEATED_CONTEXT_RATIO && maxFreq >= 3)) {
                continue;
            }
            // Fixed, conservative estimate of tokens saved per repeated call.
            const estimatedTokensSaved = 500;
            const modelCost = lookupModelCost(sc.model, this.modelCosts);
            const inputCostPer1M = modelCost?.input ?? 3;
            // The first occurrence is needed; only the repeats are redundant.
            const redundantCalls = maxFreq - 1;
            const savings = (estimatedTokensSaved / 1_000_000) * inputCostPer1M * redundantCalls * monthlyFactor;
            if (savings <= 0) {
                continue;
            }
            const sessionId = sc.sessionId;
            const id = createHash('sha256')
                .update(`prompt_optimization:repeated_context:${sc.agentId}:${sessionId}`)
                .digest('hex')
                .slice(0, 16);
            recommendations.push({
                id,
                category: 'prompt_optimization',
                estimatedMonthlySavings: Math.round(savings * 1_000_000) / 1_000_000,
                confidence: this.determineConfidence(sc.prefixHashes.length),
                difficulty: 'code_change',
                actionableSteps: [
                    `Session has ${maxFreq} calls with repeated context prefix — consider caching or summarizing context`,
                    'Use conversation summarization to reduce context window growth',
                ],
                agentId: sc.agentId,
                evidence: { callsAnalyzed: sc.prefixHashes.length, period: ctx.period },
                createdAt: now,
                promptOptimization: {
                    targetType: 'repeated_context',
                    currentTokens: estimatedTokensSaved * maxFreq,
                    estimatedReducibleTokens: estimatedTokensSaved * redundantCalls,
                    sampleSessionIds: [sessionId],
                },
            });
        }
        return recommendations;
    }

    /**
     * Maps the number of analyzed calls to a confidence label.
     *
     * @param callCount - Number of calls backing a recommendation.
     * @returns 'high' for 50 or more calls, 'medium' for 20 or more, otherwise 'low'.
     */
    determineConfidence(callCount) {
        if (callCount >= 50) {
            return 'high';
        }
        if (callCount >= 20) {
            return 'medium';
        }
        return 'low';
    }
}
|
|
160
|
+
//# sourceMappingURL=prompt-optimization.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"prompt-optimization.js","sourceRoot":"","sources":["../../../../src/lib/optimization/analyzers/prompt-optimization.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAUH,OAAO,EAAE,mBAAmB,EAAE,eAAe,EAAE,MAAM,mBAAmB,CAAC;AAEzE,OAAO,EAAE,UAAU,EAAE,MAAM,aAAa,CAAC;AAEzC,MAAM,6BAA6B,GAAG,IAAI,CAAC;AAC3C,MAAM,sBAAsB,GAAG,GAAG,CAAC;AAEnC,MAAM,OAAO,0BAA0B;IAGR;IAFpB,IAAI,GAAG,qBAAqB,CAAC;IAEtC,YAA6B,aAAyB,mBAAmB;QAA5C,eAAU,GAAV,UAAU,CAAkC;IAAG,CAAC;IAE7E,KAAK,CAAC,OAAO,CAAC,GAAoB;QAChC,MAAM,eAAe,GAA6B,EAAE,CAAC;QACrD,MAAM,GAAG,GAAG,IAAI,IAAI,EAAE,CAAC,WAAW,EAAE,CAAC;QAErC,kCAAkC;QAClC,MAAM,QAAQ,GAAG,IAAI,GAAG,EAMpB,CAAC;QAEL,wDAAwD;QACxD,MAAM,YAAY,GAAG,IAAI,GAAG,EAIxB,CAAC;QAEL,KAAK,MAAM,GAAG,IAAI,GAAG,CAAC,aAAa,EAAE,CAAC;YACpC,MAAM,OAAO,GAAG,GAAG,CAAC,OAAkC,CAAC;YACvD,MAAM,KAAK,GAAG,OAAO,CAAC,KAAK,CAAC;YAC5B,IAAI,CAAC,KAAK,IAAI,CAAC,OAAO,CAAC,QAAQ;gBAAE,SAAS;YAE1C,MAAM,OAAO,GAAG,GAAG,CAAC,OAAO,CAAC;YAC5B,MAAM,QAAQ,GAAG,GAAG,OAAO,KAAK,KAAK,EAAE,CAAC;YAExC,yBAAyB;YACzB,IAAI,KAAK,GAAG,QAAQ,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;YACnC,IAAI,CAAC,KAAK,EAAE,CAAC;gBACX,KAAK,GAAG,EAAE,OAAO,EAAE,KAAK,EAAE,iBAAiB,EAAE,EAAE,EAAE,UAAU,EAAE,IAAI,GAAG,EAAE,EAAE,SAAS,EAAE,CAAC,EAAE,CAAC;gBACvF,QAAQ,CAAC,GAAG,CAAC,QAAQ,EAAE,KAAK,CAAC,CAAC;YAChC,CAAC;YACD,KAAK,CAAC,SAAS,EAAE,CAAC;YAClB,IAAI,GAAG,CAAC,SAAS;gBAAE,KAAK,CAAC,UAAU,CAAC,GAAG,CAAC,GAAG,CAAC,SAAS,CAAC,CAAC;YAEvD,MAAM,UAAU,GAAG,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,KAAK,QAAQ,CAAC,CAAC;YACrE,IAAI,UAAU,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;gBAC1B,MAAM,QAAQ,GAAG,UAAU,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,CAAC,EAAE,EAAE,CAAC,GAAG,GAAG,CAAC,CAAC,CAAC,OAAO,EAAE,MAAM,IAAI,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC;gBAClF,MAAM,eAAe,GAAG,IAAI,CAAC,IAAI,CAAC,QAAQ,GAAG,CAAC,CAAC,CAAC;gBAChD,KAAK,CAAC,iBAAiB,CAAC,IAAI,CAAC,eAAe,CAAC,CAAC;YAChD,CAAC;YAED,oEAAoE;YACpE,IAAI,GAAG,CAAC,SAAS,EAAE,CAAC;gBAClB,MAAM,UAAU,GAAG,GAAG,GAAG,CAAC,SAAS,KAAK,KAAK,EAAE,CAAC;gBAChD,IAAI,EAAE,GAAG,YAAY,CAAC,GAAG,CAAC,UAAU,CAAC,CAAC;gBACtC,IAAI,CAAC,EAAE,EAAE,CAA
C;oBACR,EAAE,GAAG,EAAE,OAAO,EAAE,KAAK,EAAE,YAAY,EAAE,EAAE,EAAE,CAAC;oBAC1C,YAAY,CAAC,GAAG,CAAC,UAAU,EAAE,EAAE,CAAC,CAAC;gBACnC,CAAC;gBACD,MAAM,SAAS,GAAG,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,KAAK,QAAQ,CAAC,CAAC;gBACpE,IAAI,SAAS,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;oBACzB,MAAM,MAAM,GAAG,SAAS,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,OAAO,IAAI,EAAE,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,KAAK,CAAC,CAAC,EAAE,GAAG,CAAC,CAAC;oBAC3E,MAAM,IAAI,GAAG,UAAU,CAAC,KAAK,CAAC,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC;oBAC5D,EAAE,CAAC,YAAY,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;gBAC7B,CAAC;YACH,CAAC;QACH,CAAC;QAED,8BAA8B;QAC9B,KAAK,MAAM,CAAC,EAAE,KAAK,CAAC,IAAI,QAAQ,EAAE,CAAC;YACjC,IAAI,KAAK,CAAC,iBAAiB,CAAC,MAAM,KAAK,CAAC;gBAAE,SAAS;YACnD,MAAM,MAAM,GAAG,CAAC,GAAG,KAAK,CAAC,iBAAiB,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC;YAClE,MAAM,MAAM,GAAG,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,MAAM,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC;YAErD,IAAI,MAAM,GAAG,6BAA6B,EAAE,CAAC;gBAC3C,MAAM,SAAS,GAAG,IAAI,CAAC,KAAK,CAAC,CAAC,MAAM,GAAG,6BAA6B,CAAC,GAAG,GAAG,CAAC,CAAC;gBAC7E,MAAM,SAAS,GAAG,eAAe,CAAC,KAAK,CAAC,KAAK,EAAE,IAAI,CAAC,UAAU,CAAC,CAAC;gBAChE,MAAM,cAAc,GAAG,SAAS,EAAE,KAAK,IAAI,CAAC,CAAC;gBAC7C,MAAM,OAAO,GAAG,CAAC,SAAS,GAAG,SAAS,CAAC,GAAG,cAAc,GAAG,KAAK,CAAC,SAAS,GAAG,CAAC,EAAE,GAAG,GAAG,CAAC,MAAM,CAAC,CAAC;gBAE/F,IAAI,OAAO,IAAI,CAAC;oBAAE,SAAS;gBAE3B,MAAM,EAAE,GAAG,UAAU,CAAC,QAAQ,CAAC;qBAC5B,MAAM,CAAC,0CAA0C,KAAK,CAAC,OAAO,IAAI,KAAK,CAAC,KAAK,EAAE,CAAC;qBAChF,MAAM,CAAC,KAAK,CAAC;qBACb,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;gBAEhB,MAAM,UAAU,GAAG,KAAK,CAAC,IAAI,CAAC,KAAK,CAAC,UAAU,CAAC,CAAC;gBAChD,eAAe,CAAC,IAAI,CAAC;oBACnB,EAAE;oBACF,QAAQ,EAAE,qBAAqB;oBAC/B,uBAAuB,EAAE,IAAI,CAAC,KAAK,CAAC,OAAO,GAAG,SAAS,CAAC,GAAG,SAAS;oBACpE,UAAU,EAAE,IAAI,CAAC,mBAAmB,CAAC,KAAK,CAAC,SAAS,CAAC;oBACrD,UAAU,EAAE,aAAa;oBACzB,eAAe,EAAE;wBACf,4BAA4B,KAAK,CAAC,KAAK,iBAAiB,MAAM,YAAY,6BAA6B,cAAc;wBACrH,0FAA0F;qBAC3F;oBACD,OAAO,EAAE,KAAK,CAAC,OAAO;oBACtB,QAAQ,EAAE,EAAE,aAAa,EAAE
,KAAK,CAAC,SAAS,EAAE,MAAM,EAAE,GAAG,CAAC,MAAM,EAAE;oBAChE,SAAS,EAAE,GAAG;oBACd,kBAAkB,EAAE;wBAClB,UAAU,EAAE,oBAAoB;wBAChC,aAAa,EAAE,MAAM;wBACrB,wBAAwB,EAAE,SAAS;wBACnC,gBAAgB,EAAE,UAAU,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC;qBACzC;iBACF,CAAC,CAAC;YACL,CAAC;QACH,CAAC;QAED,0CAA0C;QAC1C,KAAK,MAAM,CAAC,UAAU,EAAE,EAAE,CAAC,IAAI,YAAY,EAAE,CAAC;YAC5C,IAAI,EAAE,CAAC,YAAY,CAAC,MAAM,GAAG,CAAC;gBAAE,SAAS;YAEzC,kCAAkC;YAClC,MAAM,IAAI,GAAG,IAAI,GAAG,EAAkB,CAAC;YACvC,KAAK,MAAM,CAAC,IAAI,EAAE,CAAC,YAAY,EAAE,CAAC;gBAChC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC;YACtC,CAAC;YACD,MAAM,OAAO,GAAG,IAAI,CAAC,GAAG,CAAC,GAAG,IAAI,CAAC,MAAM,EAAE,CAAC,CAAC;YAC3C,MAAM,KAAK,GAAG,OAAO,GAAG,EAAE,CAAC,YAAY,CAAC,MAAM,CAAC;YAE/C,IAAI,KAAK,GAAG,sBAAsB,IAAI,OAAO,IAAI,CAAC,EAAE,CAAC;gBACnD,oEAAoE;gBACpE,MAAM,oBAAoB,GAAG,GAAG,CAAC,CAAC,0CAA0C;gBAC5E,MAAM,SAAS,GAAG,eAAe,CAAC,EAAE,CAAC,KAAK,EAAE,IAAI,CAAC,UAAU,CAAC,CAAC;gBAC7D,MAAM,cAAc,GAAG,SAAS,EAAE,KAAK,IAAI,CAAC,CAAC;gBAC7C,MAAM,cAAc,GAAG,OAAO,GAAG,CAAC,CAAC;gBACnC,MAAM,OAAO,GAAG,CAAC,oBAAoB,GAAG,SAAS,CAAC,GAAG,cAAc,GAAG,cAAc,GAAG,CAAC,EAAE,GAAG,GAAG,CAAC,MAAM,CAAC,CAAC;gBAEzG,IAAI,OAAO,IAAI,CAAC;oBAAE,SAAS;gBAE3B,MAAM,SAAS,GAAG,UAAU,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,CAAC;gBAC5C,MAAM,EAAE,GAAG,UAAU,CAAC,QAAQ,CAAC;qBAC5B,MAAM,CAAC,wCAAwC,EAAE,CAAC,OAAO,IAAI,SAAS,EAAE,CAAC;qBACzE,MAAM,CAAC,KAAK,CAAC;qBACb,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;gBAEhB,eAAe,CAAC,IAAI,CAAC;oBACnB,EAAE;oBACF,QAAQ,EAAE,qBAAqB;oBAC/B,uBAAuB,EAAE,IAAI,CAAC,KAAK,CAAC,OAAO,GAAG,SAAS,CAAC,GAAG,SAAS;oBACpE,UAAU,EAAE,IAAI,CAAC,mBAAmB,CAAC,EAAE,CAAC,YAAY,CAAC,MAAM,CAAC;oBAC5D,UAAU,EAAE,aAAa;oBACzB,eAAe,EAAE;wBACf,eAAe,OAAO,+EAA+E;wBACrG,gEAAgE;qBACjE;oBACD,OAAO,EAAE,EAAE,CAAC,OAAO;oBACnB,QAAQ,EAAE,EAAE,aAAa,EAAE,EAAE,CAAC,YAAY,CAAC,MAAM,EAAE,MAAM,EAAE,GAAG,CAAC,MAAM,EAAE;oBACvE,SAAS,EAAE,GAAG;oBACd,kBAAkB,EAAE;wBAClB,UAAU,EAAE,kBAAkB;wBAC9B,aAAa,EAAE,oBAAoB,GAAG,OAAO;wBAC7C,wBAAwB,EAAE,oBAAoB,GAAG,cAAc;wBAC/D,gBAAgB,EAAE,CAAC,S
AAS,CAAC;qBAC9B;iBACF,CAAC,CAAC;YACL,CAAC;QACH,CAAC;QAED,OAAO,eAAe,CAAC;IACzB,CAAC;IAEO,mBAAmB,CAAC,SAAiB;QAC3C,IAAI,SAAS,IAAI,EAAE;YAAE,OAAO,MAAM,CAAC;QACnC,IAAI,SAAS,IAAI,EAAE;YAAE,OAAO,QAAQ,CAAC;QACrC,OAAO,KAAK,CAAC;IACf,CAAC;CACF"}
|
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Analyzer Plugin Interface (Feature 17 — Story 17.1)
|
|
3
|
+
*/
|
|
4
|
+
import type { IEventStore, AgentLensEvent, EnhancedRecommendation } from '@agentlensai/core';
|
|
5
|
+
/**
 * Shared input handed to every analyzer for one optimization run.
 */
export interface AnalyzerContext {
    /** Event store the run operates on. */
    store: IEventStore;
    /** Optional agent filter. */
    agentId?: string;
    /** Start of the analysis window. */
    from: string;
    /** End of the analysis window. */
    to: string;
    /** Length of the analysis window. */
    period: number;
    /** Maximum number of recommendations requested. */
    limit: number;
    /** Pre-fetched llm_call events (shared across analyzers) */
    llmCallEvents: AgentLensEvent[];
    /** Pre-fetched llm_response events (shared across analyzers) */
    llmResponseEvents: AgentLensEvent[];
    /** callId → llm_response event map */
    responseMap: Map<string, AgentLensEvent>;
}
|
|
19
|
+
/**
 * Contract implemented by every optimization analyzer plugin.
 */
export interface Analyzer {
    /** Analyzer identifier. */
    readonly name: string;
    /** Inspects the shared context and resolves to the recommendations found. */
    analyze(ctx: AnalyzerContext): Promise<EnhancedRecommendation[]>;
}
|
|
23
|
+
//# sourceMappingURL=types.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"types.d.ts","sourceRoot":"","sources":["../../../../src/lib/optimization/analyzers/types.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,OAAO,KAAK,EAAE,WAAW,EAAE,cAAc,EAAE,sBAAsB,EAAE,MAAM,mBAAmB,CAAC;AAE7F,MAAM,WAAW,eAAe;IAC9B,KAAK,EAAE,WAAW,CAAC;IACnB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,IAAI,EAAE,MAAM,CAAC;IACb,EAAE,EAAE,MAAM,CAAC;IACX,MAAM,EAAE,MAAM,CAAC;IACf,KAAK,EAAE,MAAM,CAAC;IACd,4DAA4D;IAC5D,aAAa,EAAE,cAAc,EAAE,CAAC;IAChC,gEAAgE;IAChE,iBAAiB,EAAE,cAAc,EAAE,CAAC;IACpC,sCAAsC;IACtC,WAAW,EAAE,GAAG,CAAC,MAAM,EAAE,cAAc,CAAC,CAAC;CAC1C;AAED,MAAM,WAAW,QAAQ;IACvB,QAAQ,CAAC,IAAI,EAAE,MAAM,CAAC;IACtB,OAAO,CAAC,GAAG,EAAE,eAAe,GAAG,OAAO,CAAC,sBAAsB,EAAE,CAAC,CAAC;CAClE"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"types.js","sourceRoot":"","sources":["../../../../src/lib/optimization/analyzers/types.ts"],"names":[],"mappings":"AAAA;;GAEG"}
|
|
@@ -19,9 +19,10 @@ export interface ClassificationResult {
|
|
|
19
19
|
* Classify an LLM call's complexity based on token usage and tool calls.
|
|
20
20
|
*
|
|
21
21
|
* Thresholds:
|
|
22
|
-
* Simple: <
|
|
23
|
-
* Moderate:
|
|
24
|
-
* Complex:
|
|
22
|
+
* Simple: <1000 input tokens AND 0 tool calls
|
|
23
|
+
* Moderate: 1000-10000 input tokens OR 1-5 tool calls
|
|
24
|
+
* Complex: 10000-50000 input tokens OR 6-15 tool calls
|
|
25
|
+
* Expert: >50000 input tokens OR 16+ tool calls
|
|
25
26
|
*
|
|
26
27
|
* When both input tokens and tool call count are unknown (null/undefined),
|
|
27
28
|
* the function defaults to 'moderate' as the safest assumption.
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"classifier.d.ts","sourceRoot":"","sources":["../../../src/lib/optimization/classifier.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAEH,OAAO,KAAK,EAAE,cAAc,EAAE,cAAc,EAAsC,MAAM,mBAAmB,CAAC;AAE5G,MAAM,WAAW,qBAAqB;IACpC,WAAW,EAAE,MAAM,CAAC;IACpB,YAAY,EAAE,MAAM,CAAC;IACrB,aAAa,EAAE,MAAM,CAAC;CACvB;AAED,MAAM,WAAW,oBAAoB;IACnC,IAAI,EAAE,cAAc,CAAC;IACrB,OAAO,EAAE,qBAAqB,CAAC;CAChC;AAED
|
|
1
|
+
{"version":3,"file":"classifier.d.ts","sourceRoot":"","sources":["../../../src/lib/optimization/classifier.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAEH,OAAO,KAAK,EAAE,cAAc,EAAE,cAAc,EAAsC,MAAM,mBAAmB,CAAC;AAE5G,MAAM,WAAW,qBAAqB;IACpC,WAAW,EAAE,MAAM,CAAC;IACpB,YAAY,EAAE,MAAM,CAAC;IACrB,aAAa,EAAE,MAAM,CAAC;CACvB;AAED,MAAM,WAAW,oBAAoB;IACnC,IAAI,EAAE,cAAc,CAAC;IACrB,OAAO,EAAE,qBAAqB,CAAC;CAChC;AAED;;;;;;;;;;;;;;;GAeG;AACH,wBAAgB,sBAAsB,CACpC,SAAS,EAAE,cAAc,EACzB,aAAa,CAAC,EAAE,cAAc,GAAG,IAAI,GACpC,oBAAoB,CAkBtB"}
|
|
@@ -9,9 +9,10 @@
|
|
|
9
9
|
* Classify an LLM call's complexity based on token usage and tool calls.
|
|
10
10
|
*
|
|
11
11
|
* Thresholds:
|
|
12
|
-
* Simple: <
|
|
13
|
-
* Moderate:
|
|
14
|
-
* Complex:
|
|
12
|
+
* Simple: <1000 input tokens AND 0 tool calls
|
|
13
|
+
* Moderate: 1000-10000 input tokens OR 1-5 tool calls
|
|
14
|
+
* Complex: 10000-50000 input tokens OR 6-15 tool calls
|
|
15
|
+
* Expert: >50000 input tokens OR 16+ tool calls
|
|
15
16
|
*
|
|
16
17
|
* When both input tokens and tool call count are unknown (null/undefined),
|
|
17
18
|
* the function defaults to 'moderate' as the safest assumption.
|
|
@@ -85,17 +86,22 @@ function determineTier(inputTokens, toolCallCount) {
|
|
|
85
86
|
if (!tokensKnown && !toolsKnown) {
|
|
86
87
|
return 'moderate';
|
|
87
88
|
}
|
|
88
|
-
// Check
|
|
89
|
-
if (tokensKnown && inputTokens >
|
|
89
|
+
// Check expert thresholds first (most restrictive)
|
|
90
|
+
if (tokensKnown && inputTokens > 50000)
|
|
91
|
+
return 'expert';
|
|
92
|
+
if (toolsKnown && toolCallCount >= 16)
|
|
93
|
+
return 'expert';
|
|
94
|
+
// Check complex thresholds
|
|
95
|
+
if (tokensKnown && inputTokens > 10000)
|
|
90
96
|
return 'complex';
|
|
91
|
-
if (toolsKnown && toolCallCount >=
|
|
97
|
+
if (toolsKnown && toolCallCount >= 6)
|
|
92
98
|
return 'complex';
|
|
93
99
|
// Check simple thresholds (requires BOTH conditions)
|
|
94
|
-
if (tokensKnown && inputTokens <
|
|
100
|
+
if (tokensKnown && inputTokens < 1000 && toolsKnown && toolCallCount === 0) {
|
|
95
101
|
return 'simple';
|
|
96
102
|
}
|
|
97
|
-
// If only tokens known and <
|
|
98
|
-
if (tokensKnown && inputTokens <
|
|
103
|
+
// If only tokens known and <1000 with no tool info → can't confirm simple
|
|
104
|
+
if (tokensKnown && inputTokens < 1000 && !toolsKnown) {
|
|
99
105
|
return 'moderate';
|
|
100
106
|
}
|
|
101
107
|
// If only tools known and 0 with no token info → can't confirm simple
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"classifier.js","sourceRoot":"","sources":["../../../src/lib/optimization/classifier.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAeH
|
|
1
|
+
{"version":3,"file":"classifier.js","sourceRoot":"","sources":["../../../src/lib/optimization/classifier.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAeH;;;;;;;;;;;;;;;GAeG;AACH,MAAM,UAAU,sBAAsB,CACpC,SAAyB,EACzB,aAAqC;IAErC,MAAM,WAAW,GAAG,SAAS,CAAC,OAAkC,CAAC;IACjE,MAAM,eAAe,GAAG,aAAa,EAAE,OAAkD,CAAC;IAE1F,qDAAqD;IACrD,MAAM,WAAW,GAAG,kBAAkB,CAAC,WAAW,EAAE,eAAe,CAAC,CAAC;IACrE,MAAM,YAAY,GAAG,mBAAmB,CAAC,eAAe,CAAC,CAAC;IAC1D,MAAM,aAAa,GAAG,oBAAoB,CAAC,WAAW,EAAE,eAAe,CAAC,CAAC;IAEzE,MAAM,OAAO,GAA0B;QACrC,WAAW,EAAE,WAAW,IAAI,CAAC;QAC7B,YAAY,EAAE,YAAY,IAAI,CAAC;QAC/B,aAAa,EAAE,aAAa,IAAI,CAAC;KAClC,CAAC;IAEF,MAAM,IAAI,GAAG,aAAa,CAAC,WAAW,EAAE,aAAa,CAAC,CAAC;IAEvD,OAAO,EAAE,IAAI,EAAE,OAAO,EAAE,CAAC;AAC3B,CAAC;AAED;;;GAGG;AACH,SAAS,kBAAkB,CACzB,WAAoC,EACpC,eAA6C;IAE7C,6DAA6D;IAC7D,MAAM,YAAY,GAAG,eAAe,EAAE,KAAK,EAAE,WAAW,CAAC;IACzD,IAAI,YAAY,IAAI,IAAI,IAAI,YAAY,IAAI,CAAC;QAAE,OAAO,YAAY,CAAC;IAEnE,iEAAiE;IACjE,MAAM,aAAa,GAAG,WAAsC,CAAC;IAC7D,MAAM,KAAK,GAAG,aAAa,CAAC,KAA6C,CAAC;IAC1E,IAAI,KAAK,EAAE,WAAW,IAAI,IAAI,IAAI,KAAK,CAAC,WAAW,IAAI,CAAC;QAAE,OAAO,KAAK,CAAC,WAAW,CAAC;IAEnF,OAAO,IAAI,CAAC;AACd,CAAC;AAED;;GAEG;AACH,SAAS,mBAAmB,CAC1B,eAA6C;IAE7C,MAAM,YAAY,GAAG,eAAe,EAAE,KAAK,EAAE,YAAY,CAAC;IAC1D,IAAI,YAAY,IAAI,IAAI,IAAI,YAAY,IAAI,CAAC;QAAE,OAAO,YAAY,CAAC;IACnE,OAAO,IAAI,CAAC;AACd,CAAC;AAED;;;;GAIG;AACH,SAAS,oBAAoB,CAC3B,WAAoC,EACpC,eAA6C;IAE7C,2DAA2D;IAC3D,IAAI,eAAe,EAAE,SAAS,IAAI,IAAI,EAAE,CAAC;QACvC,OAAO,eAAe,CAAC,SAAS,CAAC,MAAM,CAAC;IAC1C,CAAC;IAED,kDAAkD;IAClD,0FAA0F;IAC1F,OAAO,CAAC,CAAC;AACX,CAAC;AAED;;;GAGG;AACH,SAAS,aAAa,CACpB,WAA0B,EAC1B,aAA4B;IAE5B,MAAM,WAAW,GAAG,WAAW,IAAI,IAAI,CAAC;IACxC,MAAM,UAAU,GAAG,aAAa,IAAI,IAAI,CAAC;IAEzC,iDAAiD;IACjD,IAAI,CAAC,WAAW,IAAI,CAAC,UAAU,EAAE,CAAC;QAChC,OAAO,UAAU,CAAC;IACpB,CAAC;IAED,mDAAmD;IACnD,IAAI,WAAW,IAAI,WAAY,GAAG,KAAK;QAAE,OAAO,QAAQ,CAAC;IACzD,IAAI,UAAU,IAAI,aAAc,IAAI,EAAE;QAAE,OAAO,QAAQ,CAAC;IAExD,2BAA2B;IAC3B,IAAI,WAAW,IAAI,WAAY,GAAG,KAAK;QAAE,OAAO,SAAS,CAAC;IAC1D,IAAI,UAAU,IAAI,aAAc,IAAI,CAAC;QAAE,OAAO,SAAS,CAAC;IAExD,qDA
AqD;IACrD,IAAI,WAAW,IAAI,WAAY,GAAG,IAAI,IAAI,UAAU,IAAI,aAAc,KAAK,CAAC,EAAE,CAAC;QAC7E,OAAO,QAAQ,CAAC;IAClB,CAAC;IACD,0EAA0E;IAC1E,IAAI,WAAW,IAAI,WAAY,GAAG,IAAI,IAAI,CAAC,UAAU,EAAE,CAAC;QACtD,OAAO,UAAU,CAAC;IACpB,CAAC;IACD,sEAAsE;IACtE,IAAI,CAAC,WAAW,IAAI,UAAU,IAAI,aAAc,KAAK,CAAC,EAAE,CAAC;QACvD,OAAO,UAAU,CAAC;IACpB,CAAC;IAED,8BAA8B;IAC9B,OAAO,UAAU,CAAC;AACpB,CAAC"}
|
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* CostOptimizer Façade (Feature 17 — Story 17.4)
|
|
3
|
+
*
|
|
4
|
+
* Orchestrates multiple analyzers in parallel, deduplicates results,
|
|
5
|
+
* sorts by savings, and returns EnhancedOptimizationResult.
|
|
6
|
+
*/
|
|
7
|
+
import type { IEventStore, ModelCosts, EnhancedOptimizationResult } from '@agentlensai/core';
|
|
8
|
+
/**
 * Façade that runs the registered analyzers and merges their output into a
 * single optimization result.
 */
export declare class CostOptimizer {
    /** Event store queried for llm_call / llm_response events. */
    private readonly store;
    /** Pricing table handed to the analyzers. */
    private readonly modelCosts;
    /** Analyzers executed on every request. */
    private analyzers;
    /**
     * @param store Event store to read events from.
     * @param modelCosts Optional pricing table; a default table is used when omitted.
     */
    constructor(store: IEventStore, modelCosts?: ModelCosts);
    /**
     * Produces recommendations for the requested agent, period and limit.
     */
    getRecommendations(options: {
        agentId?: string;
        period: number;
        limit: number;
        includeCrossAgent?: boolean;
    }): Promise<EnhancedOptimizationResult>;
    /** Aggregates recommendation count and savings per category. */
    private computeCategorySummary;
}
|
|
21
|
+
//# sourceMappingURL=cost-optimizer.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"cost-optimizer.d.ts","sourceRoot":"","sources":["../../../src/lib/optimization/cost-optimizer.ts"],"names":[],"mappings":"AAAA;;;;;GAKG;AAEH,OAAO,KAAK,EACV,WAAW,EACX,UAAU,EACV,0BAA0B,EAK3B,MAAM,mBAAmB,CAAC;AAa3B,qBAAa,aAAa;IAItB,OAAO,CAAC,QAAQ,CAAC,KAAK;IACtB,OAAO,CAAC,QAAQ,CAAC,UAAU;IAJ7B,OAAO,CAAC,SAAS,CAAa;gBAGX,KAAK,EAAE,WAAW,EAClB,UAAU,GAAE,UAAgC;IAQzD,kBAAkB,CAAC,OAAO,EAAE;QAChC,OAAO,CAAC,EAAE,MAAM,CAAC;QACjB,MAAM,EAAE,MAAM,CAAC;QACf,KAAK,EAAE,MAAM,CAAC;QACd,iBAAiB,CAAC,EAAE,OAAO,CAAC;KAC7B,GAAG,OAAO,CAAC,0BAA0B,CAAC;IAiFvC,OAAO,CAAC,sBAAsB;CAoB/B"}
|
|
@@ -0,0 +1,114 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* CostOptimizer Façade (Feature 17 — Story 17.4)
|
|
3
|
+
*
|
|
4
|
+
* Orchestrates multiple analyzers in parallel, deduplicates results,
|
|
5
|
+
* sorts by savings, and returns EnhancedOptimizationResult.
|
|
6
|
+
*/
|
|
7
|
+
import { DEFAULT_MODEL_COSTS } from '@agentlensai/core';
|
|
8
|
+
import { ModelDowngradeAnalyzer } from './analyzers/model-downgrade.js';
|
|
9
|
+
import { PromptOptimizationAnalyzer } from './analyzers/prompt-optimization.js';
|
|
10
|
+
/** Every category reported in the per-category summary, even when it has no recommendations. */
const ALL_CATEGORIES = [
    'model_downgrade',
    'prompt_optimization',
    'caching',
    'tool_reduction',
];

/**
 * Façade over the optimization analyzers: fetches the events once, runs all
 * analyzers concurrently, then de-duplicates, ranks and summarizes the
 * recommendations they return.
 */
export class CostOptimizer {
    store;
    modelCosts;
    analyzers;

    /**
     * @param store - Event store exposing `queryEvents`.
     * @param modelCosts - Pricing table handed to each analyzer.
     */
    constructor(store, modelCosts = DEFAULT_MODEL_COSTS) {
        this.store = store;
        this.modelCosts = modelCosts;
        this.analyzers = [
            new ModelDowngradeAnalyzer(modelCosts),
            new PromptOptimizationAnalyzer(modelCosts),
        ];
    }

    /**
     * Collects recommendations for the last `options.period` days.
     *
     * @param options - `agentId` (optional filter), `period` (days) and `limit`
     *   (maximum number of recommendations returned).
     * @returns Promise resolving to the ranked recommendations, their total
     *   savings, the period, the number of llm_call events fetched and a
     *   per-category summary.
     */
    async getRecommendations(options) {
        const now = new Date();
        const to = now.toISOString();
        const from = new Date(now.getTime() - options.period * 24 * 60 * 60 * 1000).toISOString();
        // Both event types are fetched once, concurrently, with the same window.
        const fetchEvents = (eventType) => this.store.queryEvents({
            eventType,
            agentId: options.agentId,
            from,
            to,
            limit: 10_000,
            order: 'asc',
        });
        const [callResult, responseResult] = await Promise.all([
            fetchEvents('llm_call'),
            fetchEvents('llm_response'),
        ]);
        // Index responses by the call they answer; responses without callId are left out.
        const responseMap = new Map();
        for (const responseEvt of responseResult.events) {
            const { callId } = responseEvt.payload;
            if (callId) {
                responseMap.set(callId, responseEvt);
            }
        }
        const ctx = {
            store: this.store,
            agentId: options.agentId,
            from,
            to,
            period: options.period,
            limit: options.limit,
            llmCallEvents: callResult.events,
            llmResponseEvents: responseResult.events,
            responseMap,
        };
        const perAnalyzer = await Promise.all(this.analyzers.map((analyzer) => analyzer.analyze(ctx)));
        // First recommendation seen for an id wins; Map keeps insertion order.
        const uniqueById = new Map();
        for (const batch of perAnalyzer) {
            for (const rec of batch) {
                if (uniqueById.has(rec.id)) {
                    continue;
                }
                uniqueById.set(rec.id, rec);
            }
        }
        const ranked = [...uniqueById.values()];
        ranked.sort((a, b) => b.estimatedMonthlySavings - a.estimatedMonthlySavings);
        const recommendations = ranked.slice(0, options.limit);
        let totalPotentialSavings = 0;
        for (const rec of recommendations) {
            totalPotentialSavings += rec.estimatedMonthlySavings;
        }
        return {
            recommendations,
            totalPotentialSavings: Math.round(totalPotentialSavings * 1_000_000) / 1_000_000,
            period: options.period,
            analyzedCalls: callResult.events.length,
            byCategory: this.computeCategorySummary(recommendations),
        };
    }

    /**
     * Counts recommendations and sums their savings per category.
     *
     * @param recommendations - Recommendations to summarize.
     * @returns Object keyed by every entry of ALL_CATEGORIES with `count` and
     *   `totalSavings` (rounded to six decimals).
     */
    computeCategorySummary(recommendations) {
        const summary = Object.fromEntries(ALL_CATEGORIES.map((cat) => [cat, { count: 0, totalSavings: 0 }]));
        for (const rec of recommendations) {
            const bucket = summary[rec.category];
            if (!bucket) {
                continue;
            }
            bucket.count += 1;
            bucket.totalSavings += rec.estimatedMonthlySavings;
        }
        for (const cat of ALL_CATEGORIES) {
            const bucket = summary[cat];
            bucket.totalSavings = Math.round(bucket.totalSavings * 1_000_000) / 1_000_000;
        }
        return summary;
    }
}
|
|
114
|
+
//# sourceMappingURL=cost-optimizer.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"cost-optimizer.js","sourceRoot":"","sources":["../../../src/lib/optimization/cost-optimizer.ts"],"names":[],"mappings":"AAAA;;;;;GAKG;AAWH,OAAO,EAAE,mBAAmB,EAAE,MAAM,mBAAmB,CAAC;AAExD,OAAO,EAAE,sBAAsB,EAAE,MAAM,gCAAgC,CAAC;AACxE,OAAO,EAAE,0BAA0B,EAAE,MAAM,oCAAoC,CAAC;AAEhF,MAAM,cAAc,GAA2B;IAC7C,iBAAiB;IACjB,qBAAqB;IACrB,SAAS;IACT,gBAAgB;CACjB,CAAC;AAEF,MAAM,OAAO,aAAa;IAIL;IACA;IAJX,SAAS,CAAa;IAE9B,YACmB,KAAkB,EAClB,aAAyB,mBAAmB;QAD5C,UAAK,GAAL,KAAK,CAAa;QAClB,eAAU,GAAV,UAAU,CAAkC;QAE7D,IAAI,CAAC,SAAS,GAAG;YACf,IAAI,sBAAsB,CAAC,UAAU,CAAC;YACtC,IAAI,0BAA0B,CAAC,UAAU,CAAC;SAC3C,CAAC;IACJ,CAAC;IAED,KAAK,CAAC,kBAAkB,CAAC,OAKxB;QACC,MAAM,GAAG,GAAG,IAAI,IAAI,EAAE,CAAC;QACvB,MAAM,IAAI,GAAG,IAAI,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,GAAG,OAAO,CAAC,MAAM,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,IAAI,CAAC,CAAC,WAAW,EAAE,CAAC;QAC1F,MAAM,EAAE,GAAG,GAAG,CAAC,WAAW,EAAE,CAAC;QAE7B,wBAAwB;QACxB,MAAM,CAAC,UAAU,EAAE,cAAc,CAAC,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YACrD,IAAI,CAAC,KAAK,CAAC,WAAW,CAAC;gBACrB,SAAS,EAAE,UAAU;gBACrB,OAAO,EAAE,OAAO,CAAC,OAAO;gBACxB,IAAI;gBACJ,EAAE;gBACF,KAAK,EAAE,MAAM;gBACb,KAAK,EAAE,KAAK;aACb,CAAC;YACF,IAAI,CAAC,KAAK,CAAC,WAAW,CAAC;gBACrB,SAAS,EAAE,cAAc;gBACzB,OAAO,EAAE,OAAO,CAAC,OAAO;gBACxB,IAAI;gBACJ,EAAE;gBACF,KAAK,EAAE,MAAM;gBACb,KAAK,EAAE,KAAK;aACb,CAAC;SACH,CAAC,CAAC;QAEH,wBAAwB;QACxB,MAAM,WAAW,GAAG,IAAI,GAAG,EAA0B,CAAC;QACtD,KAAK,MAAM,GAAG,IAAI,cAAc,CAAC,MAAM,EAAE,CAAC;YACxC,MAAM,OAAO,GAAG,GAAG,CAAC,OAAsC,CAAC;YAC3D,IAAI,OAAO,CAAC,MAAM,EAAE,CAAC;gBACnB,WAAW,CAAC,GAAG,CAAC,OAAO,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;YACvC,CAAC;QACH,CAAC;QAED,MAAM,GAAG,GAAoB;YAC3B,KAAK,EAAE,IAAI,CAAC,KAAK;YACjB,OAAO,EAAE,OAAO,CAAC,OAAO;YACxB,IAAI;YACJ,EAAE;YACF,MAAM,EAAE,OAAO,CAAC,MAAM;YACtB,KAAK,EAAE,OAAO,CAAC,KAAK;YACpB,aAAa,EAAE,UAAU,CAAC,MAAM;YAChC,iBAAiB,EAAE,cAAc,CAAC,MAAM;YACxC,WAAW;SACZ,CAAC;QAEF,gCAAgC;QAChC,MAAM,OAAO,GAAG,MAAM,OAAO,CAAC,GAAG,CAC/B,IAAI,CAAC,SAAS,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC,CACxC,CAAC;QAEF,6BAA6B;QAC7B,MAAM,IAAI,
GAAG,IAAI,GAAG,EAAU,CAAC;QAC/B,IAAI,eAAe,GAA6B,EAAE,CAAC;QACnD,KAAK,MAAM,IAAI,IAAI,OAAO,EAAE,CAAC;YAC3B,KAAK,MAAM,GAAG,IAAI,IAAI,EAAE,CAAC;gBACvB,IAAI,CAAC,IAAI,CAAC,GAAG,CAAC,GAAG,CAAC,EAAE,CAAC,EAAE,CAAC;oBACtB,IAAI,CAAC,GAAG,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;oBACjB,eAAe,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;gBAC5B,CAAC;YACH,CAAC;QACH,CAAC;QAED,eAAe,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,uBAAuB,GAAG,CAAC,CAAC,uBAAuB,CAAC,CAAC;QACtF,eAAe,GAAG,eAAe,CAAC,KAAK,CAAC,CAAC,EAAE,OAAO,CAAC,KAAK,CAAC,CAAC;QAE1D,MAAM,qBAAqB,GAAG,eAAe,CAAC,MAAM,CAClD,CAAC,GAAG,EAAE,CAAC,EAAE,EAAE,CAAC,GAAG,GAAG,CAAC,CAAC,uBAAuB,EAAE,CAAC,CAC/C,CAAC;QAEF,MAAM,UAAU,GAAG,IAAI,CAAC,sBAAsB,CAAC,eAAe,CAAC,CAAC;QAEhE,OAAO;YACL,eAAe;YACf,qBAAqB,EAAE,IAAI,CAAC,KAAK,CAAC,qBAAqB,GAAG,SAAS,CAAC,GAAG,SAAS;YAChF,MAAM,EAAE,OAAO,CAAC,MAAM;YACtB,aAAa,EAAE,UAAU,CAAC,MAAM,CAAC,MAAM;YACvC,UAAU;SACX,CAAC;IACJ,CAAC;IAEO,sBAAsB,CAC5B,eAAyC;QAEzC,MAAM,OAAO,GAA0E,EAAS,CAAC;QACjG,KAAK,MAAM,GAAG,IAAI,cAAc,EAAE,CAAC;YACjC,OAAO,CAAC,GAAG,CAAC,GAAG,EAAE,KAAK,EAAE,CAAC,EAAE,YAAY,EAAE,CAAC,EAAE,CAAC;QAC/C,CAAC;QACD,KAAK,MAAM,GAAG,IAAI,eAAe,EAAE,CAAC;YAClC,MAAM,KAAK,GAAG,OAAO,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;YACpC,IAAI,KAAK,EAAE,CAAC;gBACV,KAAK,CAAC,KAAK,EAAE,CAAC;gBACd,KAAK,CAAC,YAAY,IAAI,GAAG,CAAC,uBAAuB,CAAC;YACpD,CAAC;QACH,CAAC;QACD,QAAQ;QACR,KAAK,MAAM,GAAG,IAAI,cAAc,EAAE,CAAC;YACjC,OAAO,CAAC,GAAG,CAAC,CAAC,YAAY,GAAG,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC,YAAY,GAAG,SAAS,CAAC,GAAG,SAAS,CAAC;QAC5F,CAAC;QACD,OAAO,OAAO,CAAC;IACjB,CAAC;CACF"}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"engine.d.ts","sourceRoot":"","sources":["../../../src/lib/optimization/engine.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAEH,OAAO,KAAK,EACV,WAAW,EAGX,kBAAkB,EAClB,UAAU,EAKX,MAAM,mBAAmB,CAAC;
|
|
1
|
+
{"version":3,"file":"engine.d.ts","sourceRoot":"","sources":["../../../src/lib/optimization/engine.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAEH,OAAO,KAAK,EACV,WAAW,EAGX,kBAAkB,EAClB,UAAU,EAKX,MAAM,mBAAmB,CAAC;AA8B3B,qBAAa,kBAAkB;IAE3B,OAAO,CAAC,QAAQ,CAAC,UAAU;gBAAV,UAAU,GAAE,UAAgC;IAGzD,kBAAkB,CACtB,KAAK,EAAE,WAAW,EAClB,OAAO,EAAE;QACP,OAAO,CAAC,EAAE,MAAM,CAAC;QACjB,MAAM,EAAE,MAAM,CAAC;QACf,KAAK,EAAE,MAAM,CAAC;KACf,GACA,OAAO,CAAC,kBAAkB,CAAC;IAyM9B;;;OAGG;IACH,OAAO,CAAC,gBAAgB;IAwBxB,OAAO,CAAC,mBAAmB;CAK5B"}
|
|
@@ -5,8 +5,20 @@
|
|
|
5
5
|
* each complexity tier where a cheaper alternative has proven
|
|
6
6
|
* reliable (≥98% success rate).
|
|
7
7
|
*/
|
|
8
|
-
import { DEFAULT_MODEL_COSTS } from '@agentlensai/core';
|
|
8
|
+
import { DEFAULT_MODEL_COSTS, lookupModelCost } from '@agentlensai/core';
|
|
9
9
|
import { classifyCallComplexity } from './classifier.js';
|
|
10
|
+
/**
 * Allowed downgrade paths — only recommend within these.
 *
 * Maps a model name to the cheaper models it may be swapped for. The table is
 * indexed with model names taken from event data, so it is built on a
 * null-prototype object: a model called "constructor" or "toString" then
 * yields `undefined` (no downgrade path) instead of an inherited function.
 */
const DOWNGRADE_PATHS = Object.assign(Object.create(null), {
    'claude-opus-4-6': ['claude-sonnet-4-6', 'claude-sonnet-4'],
    'claude-opus-4': ['claude-sonnet-4', 'claude-sonnet-4-6'],
    'claude-sonnet-4-6': ['claude-haiku-4-5-20251001'],
    'claude-sonnet-4': ['claude-haiku-4-5-20251001', 'claude-haiku-3.5'],
    'gpt-4o': ['gpt-4o-mini'],
    'gpt-4.1': ['gpt-4.1-mini', 'gpt-4.1-nano'],
    'gpt-4.1-mini': ['gpt-4.1-nano'],
});
/** Minimum calls required at a tier before making a recommendation */
const MIN_CALL_VOLUME = 20;
|
|
10
22
|
export class OptimizationEngine {
|
|
11
23
|
modelCosts;
|
|
12
24
|
constructor(modelCosts = DEFAULT_MODEL_COSTS) {
|
|
@@ -101,37 +113,64 @@ export class OptimizationEngine {
|
|
|
101
113
|
// 4. For each group, look for cheaper alternatives
|
|
102
114
|
const recommendations = [];
|
|
103
115
|
for (const [, group] of groups) {
|
|
116
|
+
// Never recommend downgrading expert tier
|
|
117
|
+
if (group.tier === 'expert')
|
|
118
|
+
continue;
|
|
119
|
+
// Require minimum call volume for the current model
|
|
120
|
+
if (group.callCount < MIN_CALL_VOLUME)
|
|
121
|
+
continue;
|
|
104
122
|
const currentCostPerCall = group.callCount > 0 ? group.totalCost / group.callCount : 0;
|
|
105
123
|
const currentSuccessRate = group.callCount > 0 ? group.successCount / group.callCount : 0;
|
|
106
124
|
// Get effective cost rate for this model
|
|
107
125
|
const currentModelCost = this.getModelCostRate(group);
|
|
108
126
|
if (currentModelCost === null)
|
|
109
127
|
continue;
|
|
128
|
+
// Get allowed downgrade targets for this model
|
|
129
|
+
const allowedTargets = DOWNGRADE_PATHS[group.model];
|
|
130
|
+
if (!allowedTargets || allowedTargets.length === 0)
|
|
131
|
+
continue;
|
|
110
132
|
// Find cheaper alternatives that have data at this tier
|
|
111
133
|
for (const [, candidateGroup] of groups) {
|
|
112
134
|
if (candidateGroup.model === group.model)
|
|
113
135
|
continue;
|
|
114
136
|
if (candidateGroup.tier !== group.tier)
|
|
115
137
|
continue;
|
|
138
|
+
// Only recommend within allowed downgrade paths
|
|
139
|
+
if (!allowedTargets.includes(candidateGroup.model))
|
|
140
|
+
continue;
|
|
141
|
+
// Require minimum call volume for the candidate at this tier
|
|
142
|
+
if (candidateGroup.callCount < MIN_CALL_VOLUME)
|
|
143
|
+
continue;
|
|
116
144
|
const candidateCostRate = this.getModelCostRate(candidateGroup);
|
|
117
145
|
if (candidateCostRate === null)
|
|
118
146
|
continue;
|
|
119
147
|
// Must be cheaper
|
|
120
148
|
if (candidateCostRate >= currentModelCost)
|
|
121
149
|
continue;
|
|
122
|
-
// Must have ≥
|
|
150
|
+
// Must have ≥98% success rate
|
|
123
151
|
const candidateSuccessRate = candidateGroup.callCount > 0
|
|
124
152
|
? candidateGroup.successCount / candidateGroup.callCount
|
|
125
153
|
: 0;
|
|
126
|
-
if (candidateSuccessRate < 0.
|
|
154
|
+
if (candidateSuccessRate < 0.98)
|
|
127
155
|
continue;
|
|
128
156
|
const recommendedCostPerCall = candidateGroup.callCount > 0
|
|
129
157
|
? candidateGroup.totalCost / candidateGroup.callCount
|
|
130
158
|
: 0;
|
|
131
|
-
|
|
159
|
+
// Don't extrapolate wildly for short periods
|
|
160
|
+
let monthlySavings;
|
|
161
|
+
let confidence;
|
|
162
|
+
const savingsPerPeriod = (currentCostPerCall - recommendedCostPerCall) * group.callCount;
|
|
163
|
+
if (period < 7) {
|
|
164
|
+
// Short period: don't extrapolate, use actual savings, lower confidence
|
|
165
|
+
monthlySavings = savingsPerPeriod;
|
|
166
|
+
confidence = 'low';
|
|
167
|
+
}
|
|
168
|
+
else {
|
|
169
|
+
monthlySavings = savingsPerPeriod * (30 / period);
|
|
170
|
+
confidence = this.determineConfidence(group.callCount);
|
|
171
|
+
}
|
|
132
172
|
if (monthlySavings <= 0)
|
|
133
173
|
continue;
|
|
134
|
-
const confidence = this.determineConfidence(group.callCount);
|
|
135
174
|
// Pick a representative agentId (first in set)
|
|
136
175
|
const agentId = group.agentIds.values().next().value ?? '';
|
|
137
176
|
recommendations.push({
|
|
@@ -165,7 +204,7 @@ export class OptimizationEngine {
|
|
|
165
204
|
* Uses known model costs table, or falls back to actual cost data from events.
|
|
166
205
|
*/
|
|
167
206
|
getModelCostRate(group) {
|
|
168
|
-
const knownCost = this.modelCosts
|
|
207
|
+
const knownCost = lookupModelCost(group.model, this.modelCosts);
|
|
169
208
|
if (knownCost) {
|
|
170
209
|
// Weighted average using actual input/output ratio when available
|
|
171
210
|
const totalTokens = group.totalInputTokens + group.totalOutputTokens;
|