@dipseth/opensearch-logs 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.env.example +14 -0
- package/alerts/langfuse-usage.yaml +142 -0
- package/alerts/production-incidents.yaml +280 -0
- package/alerts/service-health.yaml +98 -0
- package/dashboards/langfuse-usage.yaml +57 -0
- package/dist/create-dashboards.d.ts +10 -0
- package/dist/create-dashboards.js +38 -0
- package/dist/create-dashboards.js.map +1 -0
- package/dist/interfaces/alert.interfaces.d.ts +323 -0
- package/dist/interfaces/alert.interfaces.js +6 -0
- package/dist/interfaces/alert.interfaces.js.map +1 -0
- package/dist/interfaces/dashboard-gen.interfaces.d.ts +33 -0
- package/dist/interfaces/dashboard-gen.interfaces.js +3 -0
- package/dist/interfaces/dashboard-gen.interfaces.js.map +1 -0
- package/dist/interfaces/interfaces.d.ts +312 -0
- package/dist/interfaces/interfaces.js +3 -0
- package/dist/interfaces/interfaces.js.map +1 -0
- package/dist/interfaces/playbook.interfaces.d.ts +140 -0
- package/dist/interfaces/playbook.interfaces.js +3 -0
- package/dist/interfaces/playbook.interfaces.js.map +1 -0
- package/dist/os-alert.d.ts +17 -0
- package/dist/os-alert.js +245 -0
- package/dist/os-alert.js.map +1 -0
- package/dist/os-dash.d.ts +9 -0
- package/dist/os-dash.js +53 -0
- package/dist/os-dash.js.map +1 -0
- package/dist/os-monitor.d.ts +12 -0
- package/dist/os-monitor.js +59 -0
- package/dist/os-monitor.js.map +1 -0
- package/dist/os-playbook.d.ts +9 -0
- package/dist/os-playbook.js +71 -0
- package/dist/os-playbook.js.map +1 -0
- package/dist/os-search.d.ts +11 -0
- package/dist/os-search.js +84 -0
- package/dist/os-search.js.map +1 -0
- package/dist/repositories/index.d.ts +1 -0
- package/dist/repositories/index.js +2 -0
- package/dist/repositories/index.js.map +1 -0
- package/dist/repositories/opensearch.repository.d.ts +51 -0
- package/dist/repositories/opensearch.repository.js +167 -0
- package/dist/repositories/opensearch.repository.js.map +1 -0
- package/dist/services/alert.service.d.ts +73 -0
- package/dist/services/alert.service.js +503 -0
- package/dist/services/alert.service.js.map +1 -0
- package/dist/services/dashboard-gen.service.d.ts +36 -0
- package/dist/services/dashboard-gen.service.js +162 -0
- package/dist/services/dashboard-gen.service.js.map +1 -0
- package/dist/services/dashboard.service.d.ts +33 -0
- package/dist/services/dashboard.service.js +428 -0
- package/dist/services/dashboard.service.js.map +1 -0
- package/dist/services/gchat.service.d.ts +45 -0
- package/dist/services/gchat.service.js +228 -0
- package/dist/services/gchat.service.js.map +1 -0
- package/dist/services/index.d.ts +8 -0
- package/dist/services/index.js +9 -0
- package/dist/services/index.js.map +1 -0
- package/dist/services/monitor.service.d.ts +18 -0
- package/dist/services/monitor.service.js +342 -0
- package/dist/services/monitor.service.js.map +1 -0
- package/dist/services/panel-layout.d.ts +21 -0
- package/dist/services/panel-layout.js +33 -0
- package/dist/services/panel-layout.js.map +1 -0
- package/dist/services/playbook-dashboard.service.d.ts +19 -0
- package/dist/services/playbook-dashboard.service.js +434 -0
- package/dist/services/playbook-dashboard.service.js.map +1 -0
- package/dist/services/playbook.service.d.ts +13 -0
- package/dist/services/playbook.service.js +621 -0
- package/dist/services/playbook.service.js.map +1 -0
- package/dist/services/search.service.d.ts +30 -0
- package/dist/services/search.service.js +885 -0
- package/dist/services/search.service.js.map +1 -0
- package/dist/utils/cli.d.ts +14 -0
- package/dist/utils/cli.js +90 -0
- package/dist/utils/cli.js.map +1 -0
- package/dist/utils/config.d.ts +20 -0
- package/dist/utils/config.js +104 -0
- package/dist/utils/config.js.map +1 -0
- package/dist/utils/index.d.ts +5 -0
- package/dist/utils/index.js +5 -0
- package/dist/utils/index.js.map +1 -0
- package/dist/utils/service-registry.d.ts +15 -0
- package/dist/utils/service-registry.js +56 -0
- package/dist/utils/service-registry.js.map +1 -0
- package/dist/utils/template.d.ts +18 -0
- package/dist/utils/template.js +66 -0
- package/dist/utils/template.js.map +1 -0
- package/package.json +76 -0
- package/playbooks/error-investigation.yaml +45 -0
- package/playbooks/incident-triage.yaml +32 -0
- package/playbooks/post-deploy-validation.yaml +24 -0
- package/playbooks/service-deep-dive.yaml +42 -0
|
@@ -0,0 +1,45 @@
|
|
|
1
|
+
name: Error Investigation
|
|
2
|
+
description: Deep dive into error patterns — counts, breakdowns, timeline, and correlation with latency.
|
|
3
|
+
|
|
4
|
+
defaults:
|
|
5
|
+
env: production
|
|
6
|
+
hours: 4
|
|
7
|
+
limit: 20
|
|
8
|
+
|
|
9
|
+
steps:
|
|
10
|
+
pattern_scan:
|
|
11
|
+
type: pattern-count
|
|
12
|
+
description: Scan all known incident patterns
|
|
13
|
+
|
|
14
|
+
error_breakdown:
|
|
15
|
+
type: errors
|
|
16
|
+
description: Full error breakdown by status, service, endpoint
|
|
17
|
+
|
|
18
|
+
error_histogram:
|
|
19
|
+
type: histogram
|
|
20
|
+
description: Error volume over time
|
|
21
|
+
depends_on: [error_breakdown]
|
|
22
|
+
args:
|
|
23
|
+
level: ERROR
|
|
24
|
+
interval: 30m
|
|
25
|
+
|
|
26
|
+
latency:
|
|
27
|
+
type: latency
|
|
28
|
+
description: Check if latency correlates with errors
|
|
29
|
+
|
|
30
|
+
error_timeline:
|
|
31
|
+
type: timeline
|
|
32
|
+
description: Chronological error events
|
|
33
|
+
depends_on: [error_breakdown]
|
|
34
|
+
args:
|
|
35
|
+
level: ERROR
|
|
36
|
+
limit: 50
|
|
37
|
+
|
|
38
|
+
five_hundred_samples:
|
|
39
|
+
type: search
|
|
40
|
+
description: Recent 500 error samples
|
|
41
|
+
depends_on: [error_breakdown]
|
|
42
|
+
args:
|
|
43
|
+
status: "5xx"
|
|
44
|
+
limit: 15
|
|
45
|
+
optional: true
|
|
@@ -0,0 +1,32 @@
|
|
|
1
|
+
name: Incident Triage
|
|
2
|
+
description: Broad production investigation — error patterns, service health, latency, then sample errors from top offenders.
|
|
3
|
+
|
|
4
|
+
defaults:
|
|
5
|
+
env: production
|
|
6
|
+
hours: 1
|
|
7
|
+
limit: 20
|
|
8
|
+
|
|
9
|
+
steps:
|
|
10
|
+
patterns:
|
|
11
|
+
type: pattern-count
|
|
12
|
+
description: Scan all known incident patterns
|
|
13
|
+
|
|
14
|
+
errors:
|
|
15
|
+
type: errors
|
|
16
|
+
description: Error breakdown by status, service, and endpoint
|
|
17
|
+
|
|
18
|
+
services:
|
|
19
|
+
type: services
|
|
20
|
+
description: Per-service health table
|
|
21
|
+
|
|
22
|
+
latency:
|
|
23
|
+
type: latency
|
|
24
|
+
description: Overall and per-service latency percentiles
|
|
25
|
+
|
|
26
|
+
error_samples:
|
|
27
|
+
type: search
|
|
28
|
+
description: Recent error log samples
|
|
29
|
+
depends_on: [errors]
|
|
30
|
+
args:
|
|
31
|
+
level: ERROR
|
|
32
|
+
limit: 10
|
|
@@ -0,0 +1,24 @@
|
|
|
1
|
+
name: Post-Deploy Validation
|
|
2
|
+
description: Quick health check after a deployment — patterns, errors, and latency in a short window.
|
|
3
|
+
|
|
4
|
+
defaults:
|
|
5
|
+
env: production
|
|
6
|
+
hours: 0.5
|
|
7
|
+
limit: 10
|
|
8
|
+
|
|
9
|
+
steps:
|
|
10
|
+
patterns:
|
|
11
|
+
type: pattern-count
|
|
12
|
+
description: Check for known bad patterns
|
|
13
|
+
|
|
14
|
+
errors:
|
|
15
|
+
type: errors
|
|
16
|
+
description: Error summary
|
|
17
|
+
|
|
18
|
+
latency:
|
|
19
|
+
type: latency
|
|
20
|
+
description: Latency check
|
|
21
|
+
|
|
22
|
+
services:
|
|
23
|
+
type: services
|
|
24
|
+
description: Service health overview
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
name: Service Deep Dive
|
|
2
|
+
description: Focused investigation of a single service — requires --service flag.
|
|
3
|
+
|
|
4
|
+
defaults:
|
|
5
|
+
env: production
|
|
6
|
+
hours: 2
|
|
7
|
+
limit: 20
|
|
8
|
+
|
|
9
|
+
steps:
|
|
10
|
+
overview:
|
|
11
|
+
type: count
|
|
12
|
+
description: Total log volume for this service
|
|
13
|
+
|
|
14
|
+
errors:
|
|
15
|
+
type: errors
|
|
16
|
+
description: Error breakdown for this service
|
|
17
|
+
|
|
18
|
+
latency:
|
|
19
|
+
type: latency
|
|
20
|
+
description: Latency percentiles for this service
|
|
21
|
+
|
|
22
|
+
error_timeline:
|
|
23
|
+
type: timeline
|
|
24
|
+
description: Chronological error events
|
|
25
|
+
depends_on: [errors]
|
|
26
|
+
args:
|
|
27
|
+
level: ERROR
|
|
28
|
+
limit: 30
|
|
29
|
+
|
|
30
|
+
recent_500s:
|
|
31
|
+
type: search
|
|
32
|
+
description: Recent 500 errors
|
|
33
|
+
depends_on: [errors]
|
|
34
|
+
args:
|
|
35
|
+
status: "5xx"
|
|
36
|
+
limit: 10
|
|
37
|
+
|
|
38
|
+
histogram:
|
|
39
|
+
type: histogram
|
|
40
|
+
description: Request volume over time
|
|
41
|
+
args:
|
|
42
|
+
interval: 15m
|