npm - @unrdf/observability - Versions diffs - 26.4.2 - Mend

@unrdf/observability 26.4.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31) hide show

package/.eslintrc.cjs +10 -0
package/IMPLEMENTATION-SUMMARY.md +478 -0
package/LICENSE +21 -0
package/README.md +482 -0
package/capability-map.md +90 -0
package/config/alert-rules.yml +269 -0
package/config/prometheus.yml +136 -0
package/dashboards/grafana-unrdf.json +798 -0
package/dashboards/unrdf-workflow-dashboard.json +295 -0
package/docs/OBSERVABILITY-PATTERNS.md +681 -0
package/docs/OBSERVABILITY-RUNBOOK.md +554 -0
package/examples/observability-demo.mjs +334 -0
package/package.json +46 -0
package/src/advanced-metrics.mjs +413 -0
package/src/alerts/alert-manager.mjs +436 -0
package/src/custom-events.mjs +558 -0
package/src/distributed-tracing.mjs +352 -0
package/src/exporters/grafana-exporter.mjs +415 -0
package/src/index.mjs +61 -0
package/src/metrics/workflow-metrics.mjs +346 -0
package/src/receipts/anchor.mjs +155 -0
package/src/receipts/index.mjs +62 -0
package/src/receipts/merkle-tree.mjs +188 -0
package/src/receipts/receipt-chain.mjs +209 -0
package/src/receipts/receipt-schema.mjs +128 -0
package/src/receipts/tamper-detection.mjs +219 -0
package/test/advanced-metrics.test.mjs +302 -0
package/test/custom-events.test.mjs +387 -0
package/test/distributed-tracing.test.mjs +314 -0
package/validation/observability-validation.mjs +366 -0
package/vitest.config.mjs +25 -0

package/src/metrics/workflow-metrics.mjs ADDED Viewed

@@ -0,0 +1,346 @@
+/**
+ * @unrdf/observability - Workflow Metrics Module
+ *
+ * Prometheus metrics collection for distributed workflow execution.
+ * Provides real-time metrics for workflow executions, task completions,
+ * resource utilization, and custom business metrics.
+ *
+ * @module @unrdf/observability/metrics
+ */
+import { register, Counter, Histogram, Gauge, Summary } from 'prom-client';
+import { z } from 'zod';
+/**
+ * Workflow execution status enum
+ */
+export const WorkflowStatus = {
+  PENDING: 'pending',
+  RUNNING: 'running',
+  COMPLETED: 'completed',
+  FAILED: 'failed',
+  CANCELLED: 'cancelled',
+};
+/**
+ * Metric configuration schema
+ * @type {z.ZodObject}
+ */
+const MetricConfigSchema = z.object({
+  enableDefaultMetrics: z.boolean().default(true),
+  prefix: z.string().default('unrdf_workflow_'),
+  labels: z.record(z.string()).optional(),
+  collectInterval: z.number().min(1000).default(10000), // 10s default
+});
+/**
+ * WorkflowMetrics - Comprehensive Prometheus metrics for workflows
+ *
+ * Collects and exposes metrics for:
+ * - Workflow executions (total, active, completed, failed)
+ * - Task performance (duration, success rate)
+ * - Resource utilization (CPU, memory, queue depth)
+ * - Custom business metrics
+ *
+ * @class
+ */
+export class WorkflowMetrics {
+  /**
+   * @param {object} config - Metric configuration
+   * @param {boolean} [config.enableDefaultMetrics=true] - Enable Node.js default metrics
+   * @param {string} [config.prefix='unrdf_workflow_'] - Metric name prefix
+   * @param {Record<string, string>} [config.labels] - Global labels for all metrics
+   * @param {number} [config.collectInterval=10000] - Collection interval in ms
+   */
+  constructor(config = {}) {
+    const validated = MetricConfigSchema.parse(config);
+    this.config = validated;
+    this.registry = register;
+    // Enable default Node.js metrics (heap, CPU, event loop, etc.)
+    if (validated.enableDefaultMetrics) {
+      register.setDefaultLabels(validated.labels || {});
+    }
+    this._initializeMetrics();
+  }
+  /**
+   * Initialize all Prometheus metrics
+   * @private
+   */
+  _initializeMetrics() {
+    const { prefix } = this.config;
+    // Workflow Execution Metrics
+    this.workflowExecutionsTotal = new Counter({
+      name: `${prefix}executions_total`,
+      help: 'Total number of workflow executions',
+      labelNames: ['workflow_id', 'status', 'pattern'],
+    });
+    this.workflowExecutionDuration = new Histogram({
+      name: `${prefix}execution_duration_seconds`,
+      help: 'Workflow execution duration in seconds',
+      labelNames: ['workflow_id', 'status', 'pattern'],
+      buckets: [0.1, 0.5, 1, 2, 5, 10, 30, 60, 120, 300], // 100ms to 5min
+    });
+    this.workflowActiveGauge = new Gauge({
+      name: `${prefix}active_workflows`,
+      help: 'Number of currently active workflows',
+      labelNames: ['workflow_id', 'pattern'],
+    });
+    // Task Execution Metrics
+    this.taskExecutionsTotal = new Counter({
+      name: `${prefix}task_executions_total`,
+      help: 'Total number of task executions',
+      labelNames: ['workflow_id', 'task_id', 'task_type', 'status'],
+    });
+    this.taskExecutionDuration = new Histogram({
+      name: `${prefix}task_duration_seconds`,
+      help: 'Task execution duration in seconds',
+      labelNames: ['workflow_id', 'task_id', 'task_type'],
+      buckets: [0.01, 0.05, 0.1, 0.5, 1, 2, 5, 10, 30], // 10ms to 30s
+    });
+    this.taskQueueDepth = new Gauge({
+      name: `${prefix}task_queue_depth`,
+      help: 'Number of tasks waiting in queue',
+      labelNames: ['workflow_id', 'queue_name'],
+    });
+    // Resource Utilization Metrics
+    this.resourceUtilization = new Gauge({
+      name: `${prefix}resource_utilization`,
+      help: 'Resource utilization percentage (0-100)',
+      labelNames: ['resource_type', 'resource_id'],
+    });
+    this.resourceAllocations = new Counter({
+      name: `${prefix}resource_allocations_total`,
+      help: 'Total resource allocation events',
+      labelNames: ['resource_type', 'status'],
+    });
+    // Event Sourcing Metrics
+    this.eventsAppended = new Counter({
+      name: `${prefix}events_appended_total`,
+      help: 'Total events appended to event store',
+      labelNames: ['event_type', 'workflow_id'],
+    });
+    this.eventStoreSize = new Gauge({
+      name: `${prefix}event_store_size_bytes`,
+      help: 'Size of event store in bytes',
+      labelNames: ['workflow_id'],
+    });
+    // Business Metrics
+    this.policyEvaluations = new Counter({
+      name: `${prefix}policy_evaluations_total`,
+      help: 'Total policy evaluations',
+      labelNames: ['policy_name', 'result'],
+    });
+    this.cryptoReceiptGenerations = new Counter({
+      name: `${prefix}crypto_receipts_total`,
+      help: 'Total cryptographic receipts generated',
+      labelNames: ['workflow_id', 'algorithm'],
+    });
+    // Performance Metrics
+    this.latencyPercentiles = new Summary({
+      name: `${prefix}latency_percentiles`,
+      help: 'Latency percentiles for workflow operations',
+      labelNames: ['operation'],
+      percentiles: [0.5, 0.9, 0.95, 0.99],
+    });
+    // Error Metrics
+    this.errors = new Counter({
+      name: `${prefix}errors_total`,
+      help: 'Total errors encountered',
+      labelNames: ['error_type', 'workflow_id', 'severity'],
+    });
+  }
+  /**
+   * Record workflow execution start
+   * @param {string} workflowId - Workflow identifier
+   * @param {string} pattern - YAWL pattern type
+   */
+  recordWorkflowStart(workflowId, pattern = 'unknown') {
+    this.workflowActiveGauge.inc({ workflow_id: workflowId, pattern });
+    this.workflowExecutionsTotal.inc({ workflow_id: workflowId, status: 'started', pattern });
+  }
+  /**
+   * Record workflow execution completion
+   * @param {string} workflowId - Workflow identifier
+   * @param {string} status - Completion status
+   * @param {number} durationSeconds - Execution duration in seconds
+   * @param {string} pattern - YAWL pattern type
+   */
+  recordWorkflowComplete(workflowId, status, durationSeconds, pattern = 'unknown') {
+    this.workflowActiveGauge.dec({ workflow_id: workflowId, pattern });
+    this.workflowExecutionsTotal.inc({ workflow_id: workflowId, status, pattern });
+    this.workflowExecutionDuration.observe(
+      { workflow_id: workflowId, status, pattern },
+      durationSeconds
+    );
+  }
+  /**
+   * Record task execution
+   * @param {string} workflowId - Workflow identifier
+   * @param {string} taskId - Task identifier
+   * @param {string} taskType - Task type
+   * @param {string} status - Execution status
+   * @param {number} durationSeconds - Execution duration in seconds
+   */
+  recordTaskExecution(workflowId, taskId, taskType, status, durationSeconds) {
+    this.taskExecutionsTotal.inc({
+      workflow_id: workflowId,
+      task_id: taskId,
+      task_type: taskType,
+      status,
+    });
+    this.taskExecutionDuration.observe(
+      { workflow_id: workflowId, task_id: taskId, task_type: taskType },
+      durationSeconds
+    );
+  }
+  /**
+   * Update task queue depth
+   * @param {string} workflowId - Workflow identifier
+   * @param {string} queueName - Queue name
+   * @param {number} depth - Current queue depth
+   */
+  updateTaskQueueDepth(workflowId, queueName, depth) {
+    this.taskQueueDepth.set({ workflow_id: workflowId, queue_name: queueName }, depth);
+  }
+  /**
+   * Record resource utilization
+   * @param {string} resourceType - Type of resource (cpu, memory, disk, etc.)
+   * @param {string} resourceId - Resource identifier
+   * @param {number} utilizationPercent - Utilization percentage (0-100)
+   */
+  recordResourceUtilization(resourceType, resourceId, utilizationPercent) {
+    this.resourceUtilization.set(
+      { resource_type: resourceType, resource_id: resourceId },
+      utilizationPercent
+    );
+  }
+  /**
+   * Record resource allocation event
+   * @param {string} resourceType - Type of resource
+   * @param {string} status - Allocation status (allocated, deallocated, failed)
+   */
+  recordResourceAllocation(resourceType, status) {
+    this.resourceAllocations.inc({ resource_type: resourceType, status });
+  }
+  /**
+   * Record event appended to event store
+   * @param {string} eventType - Type of event
+   * @param {string} workflowId - Workflow identifier
+   */
+  recordEventAppended(eventType, workflowId) {
+    this.eventsAppended.inc({ event_type: eventType, workflow_id: workflowId });
+  }
+  /**
+   * Update event store size
+   * @param {string} workflowId - Workflow identifier
+   * @param {number} sizeBytes - Size in bytes
+   */
+  updateEventStoreSize(workflowId, sizeBytes) {
+    this.eventStoreSize.set({ workflow_id: workflowId }, sizeBytes);
+  }
+  /**
+   * Record policy evaluation
+   * @param {string} policyName - Policy name
+   * @param {string} result - Evaluation result (allow, deny, error)
+   */
+  recordPolicyEvaluation(policyName, result) {
+    this.policyEvaluations.inc({ policy_name: policyName, result });
+  }
+  /**
+   * Record cryptographic receipt generation
+   * @param {string} workflowId - Workflow identifier
+   * @param {string} algorithm - Hash algorithm (BLAKE3, SHA256, etc.)
+   */
+  recordCryptoReceipt(workflowId, algorithm = 'BLAKE3') {
+    this.cryptoReceiptGenerations.inc({ workflow_id: workflowId, algorithm });
+  }
+  /**
+   * Record operation latency for percentile calculation
+   * @param {string} operation - Operation name
+   * @param {number} latencyMs - Latency in milliseconds
+   */
+  recordLatency(operation, latencyMs) {
+    this.latencyPercentiles.observe({ operation }, latencyMs / 1000);
+  }
+  /**
+   * Record error
+   * @param {string} errorType - Error type
+   * @param {string} workflowId - Workflow identifier
+   * @param {string} severity - Error severity (low, medium, high, critical)
+   */
+  recordError(errorType, workflowId, severity = 'medium') {
+    this.errors.inc({ error_type: errorType, workflow_id: workflowId, severity });
+  }
+  /**
+   * Get all metrics in Prometheus format
+   * @returns {Promise<string>} Prometheus metrics text format
+   */
+  async getMetrics() {
+    return this.registry.metrics();
+  }
+  /**
+   * Get metrics as JSON
+   * @returns {Promise<object[]>} Metrics in JSON format
+   */
+  async getMetricsJSON() {
+    return this.registry.getMetricsAsJSON();
+  }
+  /**
+   * Clear all metrics (useful for testing)
+   */
+  clearMetrics() {
+    this.registry.clear();
+    this._initializeMetrics();
+  }
+  /**
+   * Get metric registry
+   * @returns {object} Prometheus registry
+   */
+  getRegistry() {
+    return this.registry;
+  }
+}
+/**
+ * Create a workflow metrics instance
+ * @param {object} config - Metric configuration
+ * @returns {WorkflowMetrics} Metrics instance
+ */
+export function createWorkflowMetrics(config = {}) {
+  return new WorkflowMetrics(config);
+}
+export default WorkflowMetrics;

package/src/receipts/anchor.mjs ADDED Viewed

@@ -0,0 +1,155 @@
+/**
+ * Receipt Anchoring - External timestamping and verification
+ *
+ * Provides anchoring to external systems:
+ * - Blockchain (Ethereum, Bitcoin, etc.)
+ * - Git repositories (commit SHA)
+ * - Timestamp authorities (RFC 3161)
+ *
+ * @module @unrdf/observability/receipts/anchor
+ */
+import { AnchorSchema } from './receipt-schema.mjs';
+/**
+ * ReceiptAnchorer - Anchor Merkle roots to external systems
+ *
+ * @example
+ * const anchorer = new ReceiptAnchorer();
+ * const anchor = await anchorer.anchorToGit(merkleRoot, commitSha, repo);
+ */
+export class ReceiptAnchorer {
+  /**
+   * Anchor Merkle root to Git repository
+   *
+   * @param {string} merkleRoot - Merkle root hash to anchor
+   * @param {string} commitSha - Git commit SHA
+   * @param {string} repository - Repository identifier
+   * @returns {Promise<Object>} Anchor proof
+   */
+  async anchorToGit(merkleRoot, commitSha, repository) {
+    const anchor = {
+      merkleRoot,
+      anchorType: 'git',
+      anchorData: {
+        commitSha,
+        repository,
+      },
+      timestamp: new Date().toISOString(),
+    };
+    return AnchorSchema.parse(anchor);
+  }
+  /**
+   * Anchor Merkle root to blockchain
+   *
+   * @param {string} merkleRoot - Merkle root hash to anchor
+   * @param {string} txHash - Transaction hash
+   * @param {number} blockNumber - Block number
+   * @param {string} network - Network name (e.g., 'ethereum', 'bitcoin')
+   * @returns {Promise<Object>} Anchor proof
+   */
+  async anchorToBlockchain(merkleRoot, txHash, blockNumber, network) {
+    const anchor = {
+      merkleRoot,
+      anchorType: 'blockchain',
+      anchorData: {
+        txHash,
+        blockNumber,
+        network,
+      },
+      timestamp: new Date().toISOString(),
+    };
+    return AnchorSchema.parse(anchor);
+  }
+  /**
+   * Anchor Merkle root to timestamp authority
+   *
+   * @param {string} merkleRoot - Merkle root hash to anchor
+   * @param {string} timestampToken - RFC 3161 timestamp token
+   * @param {string} authority - Timestamp authority identifier
+   * @returns {Promise<Object>} Anchor proof
+   */
+  async anchorToTimestampService(merkleRoot, timestampToken, authority) {
+    const anchor = {
+      merkleRoot,
+      anchorType: 'timestamp-service',
+      anchorData: {
+        timestampToken,
+        authority,
+      },
+      timestamp: new Date().toISOString(),
+    };
+    return AnchorSchema.parse(anchor);
+  }
+  /**
+   * Verify an anchor proof
+   *
+   * @param {Object} anchor - Anchor to verify
+   * @returns {Promise<Object>} Verification result
+   */
+  async verifyAnchor(anchor) {
+    try {
+      AnchorSchema.parse(anchor);
+      // Basic validation - actual verification would query external systems
+      const errors = [];
+      if (anchor.anchorType === 'git') {
+        if (!anchor.anchorData.commitSha || !anchor.anchorData.repository) {
+          errors.push('Git anchor missing commitSha or repository');
+        }
+      } else if (anchor.anchorType === 'blockchain') {
+        if (!anchor.anchorData.txHash || !anchor.anchorData.network) {
+          errors.push('Blockchain anchor missing txHash or network');
+        }
+      } else if (anchor.anchorType === 'timestamp-service') {
+        if (!anchor.anchorData.timestampToken || !anchor.anchorData.authority) {
+          errors.push('Timestamp anchor missing token or authority');
+        }
+      }
+      return {
+        valid: errors.length === 0,
+        errors,
+        anchorType: anchor.anchorType,
+        timestamp: anchor.timestamp,
+      };
+    } catch (err) {
+      return {
+        valid: false,
+        errors: ['Anchor validation failed: ' + err.message],
+      };
+    }
+  }
+  /**
+   * Export anchor for external verification
+   *
+   * @param {Object} anchor - Anchor to export
+   * @returns {string} Base64-encoded anchor
+   */
+  exportAnchor(anchor) {
+    const json = JSON.stringify(anchor);
+    return Buffer.from(json, 'utf8').toString('base64');
+  }
+  /**
+   * Import anchor from external source
+   *
+   * @param {string} base64Anchor - Base64-encoded anchor
+   * @returns {Object} Anchor object
+   */
+  importAnchor(base64Anchor) {
+    const json = Buffer.from(base64Anchor, 'base64').toString('utf8');
+    const anchor = JSON.parse(json);
+    return AnchorSchema.parse(anchor);
+  }
+}
+export default ReceiptAnchorer;

package/src/receipts/index.mjs ADDED Viewed

@@ -0,0 +1,62 @@
+/**
+ * Receipts System - Unified API
+ *
+ * Tamper-evident audit trails with:
+ * - Hash-chained receipts
+ * - Merkle tree batching
+ * - Tamper detection
+ * - External anchoring
+ *
+ * @module @unrdf/observability/receipts
+ */
+import { ReceiptChain as Chain } from './receipt-chain.mjs';
+import { MerkleTree as Tree } from './merkle-tree.mjs';
+import { TamperDetector as Detector } from './tamper-detection.mjs';
+import { ReceiptAnchorer as Anchorer } from './anchor.mjs';
+import {
+  ReceiptSchema,
+  MerkleProofSchema,
+  AnchorSchema,
+  VerificationResultSchema,
+  ChainExportSchema,
+} from './receipt-schema.mjs';
+export const ReceiptChain = Chain;
+export const MerkleTree = Tree;
+export const TamperDetector = Detector;
+export const ReceiptAnchorer = Anchorer;
+export {
+  ReceiptSchema,
+  MerkleProofSchema,
+  AnchorSchema,
+  VerificationResultSchema,
+  ChainExportSchema,
+};
+/**
+ * Quick start: Create receipt chain with tamper detection
+ *
+ * @example
+ * import { ReceiptChain, TamperDetector } from '@unrdf/observability/receipts';
+ *
+ * const chain = new ReceiptChain('audit-1');
+ * await chain.append({
+ *   operation: 'admit',
+ *   payload: { delta: 'delta_001' },
+ *   actor: 'system'
+ * });
+ *
+ * const detector = new TamperDetector();
+ * const result = await detector.verifyChain(chain.getAllReceipts());
+ * console.log(result.valid); // true
+ */
+export default {
+  ReceiptChain,
+  MerkleTree,
+  TamperDetector,
+  ReceiptAnchorer,
+};