claude-flow-novice 2.18.24 → 2.18.25
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/config/agent-whitelist.json +281 -0
- package/config/default.yml +180 -0
- package/config/feature-flags.json +315 -0
- package/config/fix-reports/config-manager-custom-keys.json +15 -0
- package/config/hooks/post-edit-pipeline.js +858 -0
- package/config/hooks/post-edit-pipeline.js.original +612 -0
- package/config/kong/grafana/datasources/prometheus.yml +24 -0
- package/config/kong/kong.yml +496 -0
- package/config/kong/prometheus.yml +49 -0
- package/config/logrotate.d/cfn-logs +221 -0
- package/config/loki/loki-config.yml +172 -0
- package/config/loki/retention.yml +107 -0
- package/config/mcp-servers.json +152 -0
- package/config/production.yml.example +72 -0
- package/config/prometheus.yml +85 -0
- package/config/promtail/promtail-config.yml +162 -0
- package/config/redis.conf +33 -0
- package/config/redis.config.js +115 -0
- package/config/skill-requirements.json +341 -0
- package/config/sla-definitions.test.yml +66 -0
- package/config/sla-definitions.yml +150 -0
- package/package.json +1 -1
|
@@ -0,0 +1,341 @@
|
|
|
1
|
+
{
|
|
2
|
+
"version": "1.0.0",
|
|
3
|
+
"description": "Skill requirements for MCP tools and servers",
|
|
4
|
+
"lastUpdated": "2025-11-05",
|
|
5
|
+
"tools": {
|
|
6
|
+
"take_screenshot": {
|
|
7
|
+
"displayName": "Take Screenshot",
|
|
8
|
+
"requiredSkills": [
|
|
9
|
+
"browser-automation",
|
|
10
|
+
"screenshot-capture"
|
|
11
|
+
],
|
|
12
|
+
"optionalSkills": [
|
|
13
|
+
"ui-development",
|
|
14
|
+
"accessibility-testing"
|
|
15
|
+
],
|
|
16
|
+
"allowedAgentTypes": [
|
|
17
|
+
"react-frontend-engineer",
|
|
18
|
+
"ui-designer",
|
|
19
|
+
"accessibility-validator",
|
|
20
|
+
"mobile-dev"
|
|
21
|
+
],
|
|
22
|
+
"resourceImpact": {
|
|
23
|
+
"memoryMB": 256,
|
|
24
|
+
"cpuUnits": 2,
|
|
25
|
+
"durationSeconds": 10
|
|
26
|
+
},
|
|
27
|
+
"description": "Capture webpage screenshots with Playwright"
|
|
28
|
+
},
|
|
29
|
+
"search_google": {
|
|
30
|
+
"displayName": "Search Google",
|
|
31
|
+
"requiredSkills": [
|
|
32
|
+
"browser-automation",
|
|
33
|
+
"web-search"
|
|
34
|
+
],
|
|
35
|
+
"optionalSkills": [
|
|
36
|
+
"seo-analysis",
|
|
37
|
+
"content-research"
|
|
38
|
+
],
|
|
39
|
+
"allowedAgentTypes": [
|
|
40
|
+
"react-frontend-engineer",
|
|
41
|
+
"ui-designer",
|
|
42
|
+
"mobile-dev"
|
|
43
|
+
],
|
|
44
|
+
"resourceImpact": {
|
|
45
|
+
"memoryMB": 512,
|
|
46
|
+
"cpuUnits": 3,
|
|
47
|
+
"durationSeconds": 15
|
|
48
|
+
},
|
|
49
|
+
"description": "Search Google and return results"
|
|
50
|
+
},
|
|
51
|
+
"navigate_and_interact": {
|
|
52
|
+
"displayName": "Navigate and Interact",
|
|
53
|
+
"requiredSkills": [
|
|
54
|
+
"browser-automation",
|
|
55
|
+
"web-interaction"
|
|
56
|
+
],
|
|
57
|
+
"optionalSkills": [
|
|
58
|
+
"form-testing",
|
|
59
|
+
"user-journey-testing"
|
|
60
|
+
],
|
|
61
|
+
"allowedAgentTypes": [
|
|
62
|
+
"react-frontend-engineer",
|
|
63
|
+
"ui-designer",
|
|
64
|
+
"accessibility-validator",
|
|
65
|
+
"mobile-dev"
|
|
66
|
+
],
|
|
67
|
+
"resourceImpact": {
|
|
68
|
+
"memoryMB": 384,
|
|
69
|
+
"cpuUnits": 3,
|
|
70
|
+
"durationSeconds": 20
|
|
71
|
+
},
|
|
72
|
+
"description": "Navigate web pages and interact with elements"
|
|
73
|
+
},
|
|
74
|
+
"redis_get": {
|
|
75
|
+
"displayName": "Redis Get Operation",
|
|
76
|
+
"requiredSkills": [
|
|
77
|
+
"redis-operations"
|
|
78
|
+
],
|
|
79
|
+
"optionalSkills": [
|
|
80
|
+
"cache-management",
|
|
81
|
+
"data-retrieval"
|
|
82
|
+
],
|
|
83
|
+
"allowedAgentTypes": [
|
|
84
|
+
"backend-developer",
|
|
85
|
+
"database-architect",
|
|
86
|
+
"api-gateway-specialist",
|
|
87
|
+
"devops-engineer"
|
|
88
|
+
],
|
|
89
|
+
"resourceImpact": {
|
|
90
|
+
"memoryMB": 64,
|
|
91
|
+
"cpuUnits": 1,
|
|
92
|
+
"durationSeconds": 2
|
|
93
|
+
},
|
|
94
|
+
"description": "Retrieve data from Redis cache"
|
|
95
|
+
},
|
|
96
|
+
"redis_set": {
|
|
97
|
+
"displayName": "Redis Set Operation",
|
|
98
|
+
"requiredSkills": [
|
|
99
|
+
"redis-operations"
|
|
100
|
+
],
|
|
101
|
+
"optionalSkills": [
|
|
102
|
+
"cache-management",
|
|
103
|
+
"data-storage"
|
|
104
|
+
],
|
|
105
|
+
"allowedAgentTypes": [
|
|
106
|
+
"backend-developer",
|
|
107
|
+
"database-architect",
|
|
108
|
+
"api-gateway-specialist",
|
|
109
|
+
"devops-engineer"
|
|
110
|
+
],
|
|
111
|
+
"resourceImpact": {
|
|
112
|
+
"memoryMB": 64,
|
|
113
|
+
"cpuUnits": 1,
|
|
114
|
+
"durationSeconds": 2
|
|
115
|
+
},
|
|
116
|
+
"description": "Store data in Redis cache"
|
|
117
|
+
},
|
|
118
|
+
"postgres_query": {
|
|
119
|
+
"displayName": "PostgreSQL Query",
|
|
120
|
+
"requiredSkills": [
|
|
121
|
+
"database-design",
|
|
122
|
+
"sql-operations"
|
|
123
|
+
],
|
|
124
|
+
"optionalSkills": [
|
|
125
|
+
"query-optimization",
|
|
126
|
+
"data-analysis"
|
|
127
|
+
],
|
|
128
|
+
"allowedAgentTypes": [
|
|
129
|
+
"backend-developer",
|
|
130
|
+
"database-architect",
|
|
131
|
+
"api-gateway-specialist"
|
|
132
|
+
],
|
|
133
|
+
"resourceImpact": {
|
|
134
|
+
"memoryMB": 128,
|
|
135
|
+
"cpuUnits": 2,
|
|
136
|
+
"durationSeconds": 5
|
|
137
|
+
},
|
|
138
|
+
"description": "Execute PostgreSQL queries"
|
|
139
|
+
},
|
|
140
|
+
"api_test_endpoint": {
|
|
141
|
+
"displayName": "API Endpoint Testing",
|
|
142
|
+
"requiredSkills": [
|
|
143
|
+
"api-development",
|
|
144
|
+
"api-testing"
|
|
145
|
+
],
|
|
146
|
+
"optionalSkills": [
|
|
147
|
+
"load-testing",
|
|
148
|
+
"security-testing"
|
|
149
|
+
],
|
|
150
|
+
"allowedAgentTypes": [
|
|
151
|
+
"backend-developer",
|
|
152
|
+
"api-gateway-specialist",
|
|
153
|
+
"security-specialist",
|
|
154
|
+
"performance-tester"
|
|
155
|
+
],
|
|
156
|
+
"resourceImpact": {
|
|
157
|
+
"memoryMB": 192,
|
|
158
|
+
"cpuUnits": 2,
|
|
159
|
+
"durationSeconds": 8
|
|
160
|
+
},
|
|
161
|
+
"description": "Test API endpoints for functionality and performance"
|
|
162
|
+
},
|
|
163
|
+
"security_scan": {
|
|
164
|
+
"displayName": "Security Vulnerability Scan",
|
|
165
|
+
"requiredSkills": [
|
|
166
|
+
"security-auditing",
|
|
167
|
+
"vulnerability-scanning"
|
|
168
|
+
],
|
|
169
|
+
"optionalSkills": [
|
|
170
|
+
"penetration-testing",
|
|
171
|
+
"compliance-checking"
|
|
172
|
+
],
|
|
173
|
+
"allowedAgentTypes": [
|
|
174
|
+
"security-specialist",
|
|
175
|
+
"backend-developer",
|
|
176
|
+
"devops-engineer"
|
|
177
|
+
],
|
|
178
|
+
"resourceImpact": {
|
|
179
|
+
"memoryMB": 512,
|
|
180
|
+
"cpuUnits": 4,
|
|
181
|
+
"durationSeconds": 30
|
|
182
|
+
},
|
|
183
|
+
"description": "Scan for security vulnerabilities"
|
|
184
|
+
},
|
|
185
|
+
"kubernetes_deploy": {
|
|
186
|
+
"displayName": "Kubernetes Deployment",
|
|
187
|
+
"requiredSkills": [
|
|
188
|
+
"kubernetes-management",
|
|
189
|
+
"container-orchestration"
|
|
190
|
+
],
|
|
191
|
+
"optionalSkills": [
|
|
192
|
+
"helm-charts",
|
|
193
|
+
"service-mesh"
|
|
194
|
+
],
|
|
195
|
+
"allowedAgentTypes": [
|
|
196
|
+
"kubernetes-specialist",
|
|
197
|
+
"devops-engineer"
|
|
198
|
+
],
|
|
199
|
+
"resourceImpact": {
|
|
200
|
+
"memoryMB": 256,
|
|
201
|
+
"cpuUnits": 2,
|
|
202
|
+
"durationSeconds": 45
|
|
203
|
+
},
|
|
204
|
+
"description": "Deploy applications to Kubernetes cluster"
|
|
205
|
+
},
|
|
206
|
+
"monitoring_metrics": {
|
|
207
|
+
"displayName": "Monitoring Metrics Collection",
|
|
208
|
+
"requiredSkills": [
|
|
209
|
+
"metrics-collection",
|
|
210
|
+
"performance-monitoring"
|
|
211
|
+
],
|
|
212
|
+
"optionalSkills": [
|
|
213
|
+
"alerting-systems",
|
|
214
|
+
"dashboard-creation"
|
|
215
|
+
],
|
|
216
|
+
"allowedAgentTypes": [
|
|
217
|
+
"monitoring-specialist",
|
|
218
|
+
"devops-engineer",
|
|
219
|
+
"performance-tester",
|
|
220
|
+
"kubernetes-specialist"
|
|
221
|
+
],
|
|
222
|
+
"resourceImpact": {
|
|
223
|
+
"memoryMB": 192,
|
|
224
|
+
"cpuUnits": 2,
|
|
225
|
+
"durationSeconds": 10
|
|
226
|
+
},
|
|
227
|
+
"description": "Collect and analyze monitoring metrics"
|
|
228
|
+
},
|
|
229
|
+
"log_analysis": {
|
|
230
|
+
"displayName": "Log Analysis",
|
|
231
|
+
"requiredSkills": [
|
|
232
|
+
"log-analysis",
|
|
233
|
+
"troubleshooting"
|
|
234
|
+
],
|
|
235
|
+
"optionalSkills": [
|
|
236
|
+
"incident-response",
|
|
237
|
+
"pattern-matching"
|
|
238
|
+
],
|
|
239
|
+
"allowedAgentTypes": [
|
|
240
|
+
"monitoring-specialist",
|
|
241
|
+
"devops-engineer",
|
|
242
|
+
"backend-developer",
|
|
243
|
+
"security-specialist"
|
|
244
|
+
],
|
|
245
|
+
"resourceImpact": {
|
|
246
|
+
"memoryMB": 384,
|
|
247
|
+
"cpuUnits": 3,
|
|
248
|
+
"durationSeconds": 15
|
|
249
|
+
},
|
|
250
|
+
"description": "Analyze application and system logs"
|
|
251
|
+
},
|
|
252
|
+
"load_test": {
|
|
253
|
+
"displayName": "Load Testing",
|
|
254
|
+
"requiredSkills": [
|
|
255
|
+
"load-testing",
|
|
256
|
+
"performance-monitoring"
|
|
257
|
+
],
|
|
258
|
+
"optionalSkills": [
|
|
259
|
+
"stress-testing",
|
|
260
|
+
"benchmarking"
|
|
261
|
+
],
|
|
262
|
+
"allowedAgentTypes": [
|
|
263
|
+
"performance-tester",
|
|
264
|
+
"backend-developer",
|
|
265
|
+
"devops-engineer"
|
|
266
|
+
],
|
|
267
|
+
"resourceImpact": {
|
|
268
|
+
"memoryMB": 1024,
|
|
269
|
+
"cpuUnits": 6,
|
|
270
|
+
"durationSeconds": 120
|
|
271
|
+
},
|
|
272
|
+
"description": "Perform load testing on applications"
|
|
273
|
+
},
|
|
274
|
+
"accessibility_audit": {
|
|
275
|
+
"displayName": "Accessibility Audit",
|
|
276
|
+
"requiredSkills": [
|
|
277
|
+
"accessibility-testing",
|
|
278
|
+
"wcag-compliance"
|
|
279
|
+
],
|
|
280
|
+
"optionalSkills": [
|
|
281
|
+
"screen-reader-testing",
|
|
282
|
+
"color-contrast-analysis"
|
|
283
|
+
],
|
|
284
|
+
"allowedAgentTypes": [
|
|
285
|
+
"accessibility-validator",
|
|
286
|
+
"ui-designer",
|
|
287
|
+
"react-frontend-engineer"
|
|
288
|
+
],
|
|
289
|
+
"resourceImpact": {
|
|
290
|
+
"memoryMB": 384,
|
|
291
|
+
"cpuUnits": 3,
|
|
292
|
+
"durationSeconds": 25
|
|
293
|
+
},
|
|
294
|
+
"description": "Audit applications for accessibility compliance"
|
|
295
|
+
},
|
|
296
|
+
"responsive_test": {
|
|
297
|
+
"displayName": "Responsive Design Testing",
|
|
298
|
+
"requiredSkills": [
|
|
299
|
+
"responsive-testing",
|
|
300
|
+
"device-testing"
|
|
301
|
+
],
|
|
302
|
+
"optionalSkills": [
|
|
303
|
+
"mobile-development",
|
|
304
|
+
"css-testing"
|
|
305
|
+
],
|
|
306
|
+
"allowedAgentTypes": [
|
|
307
|
+
"mobile-dev",
|
|
308
|
+
"ui-designer",
|
|
309
|
+
"react-frontend-engineer"
|
|
310
|
+
],
|
|
311
|
+
"resourceImpact": {
|
|
312
|
+
"memoryMB": 512,
|
|
313
|
+
"cpuUnits": 3,
|
|
314
|
+
"durationSeconds": 20
|
|
315
|
+
},
|
|
316
|
+
"description": "Test responsive design across different screen sizes"
|
|
317
|
+
},
|
|
318
|
+
"screenshot_analysis": {
|
|
319
|
+
"displayName": "Screenshot Analysis",
|
|
320
|
+
"requiredSkills": [
|
|
321
|
+
"screenshot-capture",
|
|
322
|
+
"visual-analysis"
|
|
323
|
+
],
|
|
324
|
+
"optionalSkills": [
|
|
325
|
+
"ui-testing",
|
|
326
|
+
"regression-testing"
|
|
327
|
+
],
|
|
328
|
+
"allowedAgentTypes": [
|
|
329
|
+
"ui-designer",
|
|
330
|
+
"react-frontend-engineer",
|
|
331
|
+
"accessibility-validator"
|
|
332
|
+
],
|
|
333
|
+
"resourceImpact": {
|
|
334
|
+
"memoryMB": 768,
|
|
335
|
+
"cpuUnits": 4,
|
|
336
|
+
"durationSeconds": 15
|
|
337
|
+
},
|
|
338
|
+
"description": "Analyze screenshots for visual differences and issues"
|
|
339
|
+
}
|
|
340
|
+
}
|
|
341
|
+
}
|
|
@@ -0,0 +1,66 @@
|
|
|
1
|
+
# SLA Definitions for Performance Monitoring
|
|
2
|
+
# Test Configuration - Used for unit tests
|
|
3
|
+
#
|
|
4
|
+
# Each SLA definition specifies performance targets and baseline percentiles
|
|
5
|
+
# Used to track and alert on performance degradation
|
|
6
|
+
#
|
|
7
|
+
# SLA Target: <X>ms = P50 should be below X ms
|
|
8
|
+
# Baseline P95: Performance threshold for 95th percentile
|
|
9
|
+
# Baseline P99: Performance threshold for 99th percentile
|
|
10
|
+
#
|
|
11
|
+
# See docs/PERFORMANCE_MONITORING_GUIDE.md for detailed configuration
|
|
12
|
+
|
|
13
|
+
slas:
|
|
14
|
+
# Agent Startup SLA
|
|
15
|
+
# Target: Initialize new agent in <2s
|
|
16
|
+
agent_startup:
|
|
17
|
+
target: 2000 # ms - median response time target
|
|
18
|
+
p95: 2000 # 95th percentile
|
|
19
|
+
p99: 5000 # 99th percentile
|
|
20
|
+
enabled: true
|
|
21
|
+
alert_threshold: 1.2 # Alert if performance degrades >20%
|
|
22
|
+
|
|
23
|
+
# Query Execution SLA
|
|
24
|
+
# Target: Execute database queries in <5s
|
|
25
|
+
query_execution:
|
|
26
|
+
target: 5000 # ms - median response time target
|
|
27
|
+
p95: 5000 # 95th percentile
|
|
28
|
+
p99: 10000 # 99th percentile
|
|
29
|
+
enabled: true
|
|
30
|
+
alert_threshold: 1.2 # Alert if performance degrades >20%
|
|
31
|
+
|
|
32
|
+
# Skill Execution SLA
|
|
33
|
+
# Target: Complete skill execution in <30s
|
|
34
|
+
skill_execution:
|
|
35
|
+
target: 30000 # ms - median response time target
|
|
36
|
+
p95: 30000 # 95th percentile
|
|
37
|
+
p99: 60000 # 99th percentile
|
|
38
|
+
enabled: true
|
|
39
|
+
alert_threshold: 1.2 # Alert if performance degrades >20%
|
|
40
|
+
|
|
41
|
+
# Transaction Commit SLA
|
|
42
|
+
# Target: Commit database transaction in <5s
|
|
43
|
+
transaction_commit:
|
|
44
|
+
target: 5000 # ms - median response time target
|
|
45
|
+
p95: 5000 # 95th percentile
|
|
46
|
+
p99: 10000 # 99th percentile
|
|
47
|
+
enabled: true
|
|
48
|
+
alert_threshold: 1.2 # Alert if performance degrades >20%
|
|
49
|
+
|
|
50
|
+
# Global SLA Configuration
|
|
51
|
+
global:
|
|
52
|
+
# Monthly SLA violation threshold (target <5%)
|
|
53
|
+
monthly_violation_target: 0.05
|
|
54
|
+
|
|
55
|
+
# Degradation detection parameters
|
|
56
|
+
degradation_window_minutes: 5 # Evaluate last 5 minutes
|
|
57
|
+
degradation_threshold_percent: 20 # Alert if >20% degradation
|
|
58
|
+
degradation_consecutive_samples: 5 # Require 5+ samples
|
|
59
|
+
|
|
60
|
+
# Alert configuration
|
|
61
|
+
alert_resolution_hours: 24 # Auto-resolve alerts after 24h
|
|
62
|
+
|
|
63
|
+
# Retention policy
|
|
64
|
+
metrics_retention_days: 90 # Keep metrics for 90 days
|
|
65
|
+
alerts_retention_days: 365 # Keep alert history for 1 year
|
|
66
|
+
baseline_calculation_days: 30 # Default baseline window
|
|
@@ -0,0 +1,150 @@
|
|
|
1
|
+
# SLA Definitions for Performance Monitoring
|
|
2
|
+
# Production Configuration
|
|
3
|
+
#
|
|
4
|
+
# Each SLA definition specifies performance targets and baseline percentiles
|
|
5
|
+
# Used to track and alert on performance degradation
|
|
6
|
+
#
|
|
7
|
+
# SLA Target: <X>ms = P50 should be below X ms
|
|
8
|
+
# Baseline P95: Performance threshold for 95th percentile
|
|
9
|
+
# Baseline P99: Performance threshold for 99th percentile
|
|
10
|
+
#
|
|
11
|
+
# See docs/PERFORMANCE_MONITORING_GUIDE.md for detailed configuration
|
|
12
|
+
|
|
13
|
+
slas:
|
|
14
|
+
# Agent Startup SLA
|
|
15
|
+
# Target: Initialize new agent in <2s
|
|
16
|
+
# Used for: Agent spawning, initialization
|
|
17
|
+
agent_startup:
|
|
18
|
+
target: 2000 # ms - median response time target
|
|
19
|
+
p95: 2000 # 95th percentile - 95% of startups should be <2s
|
|
20
|
+
p99: 5000 # 99th percentile - 99% of startups should be <5s
|
|
21
|
+
enabled: true
|
|
22
|
+
alert_threshold: 1.2 # Alert if performance degrades >20%
|
|
23
|
+
|
|
24
|
+
# Query Execution SLA
|
|
25
|
+
# Target: Execute database queries in <5s
|
|
26
|
+
# Used for: Database queries, API calls
|
|
27
|
+
query_execution:
|
|
28
|
+
target: 5000 # ms - median response time target
|
|
29
|
+
p95: 5000 # 95th percentile - 95% of queries should be <5s
|
|
30
|
+
p99: 10000 # 99th percentile - 99% of queries should be <10s
|
|
31
|
+
enabled: true
|
|
32
|
+
alert_threshold: 1.2 # Alert if performance degrades >20%
|
|
33
|
+
|
|
34
|
+
# Skill Execution SLA
|
|
35
|
+
# Target: Complete skill execution in <30s
|
|
36
|
+
# Used for: Skill runs, custom operations
|
|
37
|
+
skill_execution:
|
|
38
|
+
target: 30000 # ms - median response time target
|
|
39
|
+
p95: 30000 # 95th percentile - 95% of skills should complete in <30s
|
|
40
|
+
p99: 60000 # 99th percentile - 99% of skills should complete in <60s
|
|
41
|
+
enabled: true
|
|
42
|
+
alert_threshold: 1.2 # Alert if performance degrades >20%
|
|
43
|
+
|
|
44
|
+
# Transaction Commit SLA
|
|
45
|
+
# Target: Commit database transaction in <5s
|
|
46
|
+
# Used for: Database transactions, writes
|
|
47
|
+
transaction_commit:
|
|
48
|
+
target: 5000 # ms - median response time target
|
|
49
|
+
p95: 5000 # 95th percentile - 95% of commits should be <5s
|
|
50
|
+
p99: 10000 # 99th percentile - 99% of commits should be <10s
|
|
51
|
+
enabled: true
|
|
52
|
+
alert_threshold: 1.2 # Alert if performance degrades >20%
|
|
53
|
+
|
|
54
|
+
# Log Shipment SLA
|
|
55
|
+
# Target: Ship logs in <1s
|
|
56
|
+
# Used for: Log aggregation, metrics export
|
|
57
|
+
log_shipment:
|
|
58
|
+
target: 1000 # ms - median shipment time
|
|
59
|
+
p95: 1000 # 95th percentile
|
|
60
|
+
p99: 2000 # 99th percentile
|
|
61
|
+
enabled: true
|
|
62
|
+
alert_threshold: 1.2 # Alert if performance degrades >20%
|
|
63
|
+
|
|
64
|
+
# Checkpoint Save SLA
|
|
65
|
+
# Target: Save checkpoint in <5s
|
|
66
|
+
# Used for: State management, distributed coordination
|
|
67
|
+
checkpoint_save:
|
|
68
|
+
target: 5000 # ms - median save time
|
|
69
|
+
p95: 5000 # 95th percentile
|
|
70
|
+
p99: 10000 # 99th percentile
|
|
71
|
+
enabled: true
|
|
72
|
+
alert_threshold: 1.2 # Alert if performance degrades >20%
|
|
73
|
+
|
|
74
|
+
# Cache Lookup SLA
|
|
75
|
+
# Target: Cache lookup in <100ms
|
|
76
|
+
# Used for: In-memory cache, rapid access patterns
|
|
77
|
+
cache_lookup:
|
|
78
|
+
target: 100 # ms - median lookup time
|
|
79
|
+
p95: 100 # 95th percentile
|
|
80
|
+
p99: 500 # 99th percentile
|
|
81
|
+
enabled: true
|
|
82
|
+
alert_threshold: 1.2 # Alert if performance degrades >20%
|
|
83
|
+
|
|
84
|
+
# Global SLA Configuration
|
|
85
|
+
global:
|
|
86
|
+
# Monthly SLA violation threshold (target <5%)
|
|
87
|
+
# This means we aim for >95% compliance monthly
|
|
88
|
+
monthly_violation_target: 0.05
|
|
89
|
+
|
|
90
|
+
# Degradation detection parameters
|
|
91
|
+
degradation_window_minutes: 5 # Evaluate last 5 minutes of data
|
|
92
|
+
degradation_threshold_percent: 20 # Alert if >20% degradation from baseline
|
|
93
|
+
degradation_consecutive_samples: 5 # Require 5+ samples to declare degradation
|
|
94
|
+
|
|
95
|
+
# Alert configuration
|
|
96
|
+
alert_resolution_hours: 24 # Auto-resolve alerts after 24h if not re-triggered
|
|
97
|
+
alert_batch_window_minutes: 5 # Batch similar alerts within 5 minute window
|
|
98
|
+
alert_max_frequency_per_hour: 10 # Max 10 alerts per operation per hour
|
|
99
|
+
|
|
100
|
+
# Retention policy
|
|
101
|
+
metrics_retention_days: 90 # Keep detailed metrics for 90 days
|
|
102
|
+
alerts_retention_days: 365 # Keep alert history for 1 year
|
|
103
|
+
baseline_calculation_days: 30 # Default baseline window (30 days of history)
|
|
104
|
+
baseline_cache_ttl_minutes: 5 # Cache baseline calculations for 5 minutes
|
|
105
|
+
|
|
106
|
+
# Performance targets for monitoring service itself
|
|
107
|
+
metric_recording_overhead_ms: 10 # Recording should add <10ms overhead
|
|
108
|
+
baseline_calculation_target_ms: 5000 # Calculation should complete in <5s
|
|
109
|
+
sla_check_target_ms: 50 # SLA checks should complete in <50ms
|
|
110
|
+
|
|
111
|
+
# Alerting thresholds
|
|
112
|
+
alerting:
|
|
113
|
+
# SLA violation alert conditions
|
|
114
|
+
violation_alert:
|
|
115
|
+
enabled: true
|
|
116
|
+
level: warning # Alert level for SLA violations
|
|
117
|
+
threshold: 1 # Alert on every violation
|
|
118
|
+
|
|
119
|
+
# Degradation alert conditions
|
|
120
|
+
degradation_alert:
|
|
121
|
+
enabled: true
|
|
122
|
+
level: warning # Alert level for degradation
|
|
123
|
+
threshold: 1.2 # Alert if >20% degradation
|
|
124
|
+
|
|
125
|
+
# Critical threshold alerts
|
|
126
|
+
critical_alert:
|
|
127
|
+
enabled: true
|
|
128
|
+
level: critical # Alert level for critical threshold
|
|
129
|
+
threshold: 1.5 # Alert if >50% degradation
|
|
130
|
+
|
|
131
|
+
# Notification channels
|
|
132
|
+
notifications:
|
|
133
|
+
# Email notifications for critical alerts
|
|
134
|
+
email:
|
|
135
|
+
enabled: true
|
|
136
|
+
critical_only: false
|
|
137
|
+
recipients: [] # Configure in environment or secrets
|
|
138
|
+
|
|
139
|
+
# Slack notifications for performance issues
|
|
140
|
+
slack:
|
|
141
|
+
enabled: true
|
|
142
|
+
critical_only: true
|
|
143
|
+
channel: '#performance-alerts'
|
|
144
|
+
webhook_url: "${SLACK_WEBHOOK_PERFORMANCE}" # Set via environment variable
|
|
145
|
+
|
|
146
|
+
# PagerDuty for critical incidents
|
|
147
|
+
pagerduty:
|
|
148
|
+
enabled: false
|
|
149
|
+
critical_only: true
|
|
150
|
+
api_key: "${PAGERDUTY_API_KEY}" # Set via environment variable
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "claude-flow-novice",
|
|
3
|
-
"version": "2.18.24",
|
|
3
|
+
"version": "2.18.25",
|
|
4
4
|
"description": "Claude Flow Novice - Advanced orchestration platform for multi-agent AI workflows with CFN Loop architecture\n\nIncludes Local RuVector Accelerator and all CFN skills for complete functionality.",
|
|
5
5
|
"main": "index.js",
|
|
6
6
|
"type": "module",
|