npm - autotel - Versions diffs - 3.0.0 → 3.0.4 - Mend

autotel 3.0.0 → 3.0.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (114) hide show

package/README.md +21 -4
package/dist/attribute-redacting-processor.cjs +8 -8
package/dist/attribute-redacting-processor.d.cts +10 -1
package/dist/attribute-redacting-processor.d.ts +10 -1
package/dist/attribute-redacting-processor.js +1 -1
package/dist/attributes.cjs +21 -21
package/dist/attributes.js +2 -2
package/dist/auto.cjs +3 -3
package/dist/auto.js +2 -2
package/dist/{chunk-IUDXKLS4.js → chunk-34X3TKHA.js} +3 -3
package/dist/{chunk-IUDXKLS4.js.map → chunk-34X3TKHA.js.map} +1 -1
package/dist/{chunk-3QMFLJHJ.js → chunk-4LF6FV2V.js} +3 -3
package/dist/{chunk-3QMFLJHJ.js.map → chunk-4LF6FV2V.js.map} +1 -1
package/dist/{chunk-L7JDUDJD.cjs → chunk-AAYCDHH6.cjs} +7 -7
package/dist/{chunk-L7JDUDJD.cjs.map → chunk-AAYCDHH6.cjs.map} +1 -1
package/dist/{chunk-DWOBIBLY.cjs → chunk-AY2SY3MO.cjs} +5 -5
package/dist/{chunk-DWOBIBLY.cjs.map → chunk-AY2SY3MO.cjs.map} +1 -1
package/dist/{chunk-563EL6O6.cjs → chunk-BPO2PQ3T.cjs} +12 -8
package/dist/chunk-BPO2PQ3T.cjs.map +1 -0
package/dist/{chunk-ZSABTI3C.cjs → chunk-DAZ7EGR4.cjs} +17 -17
package/dist/{chunk-ZSABTI3C.cjs.map → chunk-DAZ7EGR4.cjs.map} +1 -1
package/dist/{chunk-ER43K7ES.js → chunk-DDXIUZEG.js} +3 -3
package/dist/{chunk-ER43K7ES.js.map → chunk-DDXIUZEG.js.map} +1 -1
package/dist/{chunk-JKIMEPI2.cjs → chunk-DQ2SUROF.cjs} +4 -4
package/dist/{chunk-JKIMEPI2.cjs.map → chunk-DQ2SUROF.cjs.map} +1 -1
package/dist/{chunk-DAAJLUTO.js → chunk-F3TNRW2P.js} +6 -5
package/dist/chunk-F3TNRW2P.js.map +1 -0
package/dist/{chunk-7HNQYHK4.js → chunk-HBLWOI6P.js} +3 -3
package/dist/{chunk-7HNQYHK4.js.map → chunk-HBLWOI6P.js.map} +1 -1
package/dist/{chunk-TDNKIHKT.js → chunk-JVWJDHDB.js} +13 -4
package/dist/chunk-JVWJDHDB.js.map +1 -0
package/dist/{chunk-CJ4PD2TZ.cjs → chunk-KKGM42RQ.cjs} +13 -13
package/dist/{chunk-CJ4PD2TZ.cjs.map → chunk-KKGM42RQ.cjs.map} +1 -1
package/dist/{chunk-KHGA4OST.cjs → chunk-LMFPZHI4.cjs} +5 -5
package/dist/{chunk-KHGA4OST.cjs.map → chunk-LMFPZHI4.cjs.map} +1 -1
package/dist/{chunk-CMNGGTQL.cjs → chunk-NXLRY2CE.cjs} +13 -4
package/dist/chunk-NXLRY2CE.cjs.map +1 -0
package/dist/{chunk-4DAG3RFS.js → chunk-OM4OSBOP.js} +4 -4
package/dist/{chunk-4DAG3RFS.js.map → chunk-OM4OSBOP.js.map} +1 -1
package/dist/{chunk-MOK3E54E.cjs → chunk-WSGAHSZQ.cjs} +34 -33
package/dist/chunk-WSGAHSZQ.cjs.map +1 -0
package/dist/{chunk-QG3U5ONP.js → chunk-Z7VAOK5X.js} +3 -3
package/dist/{chunk-QG3U5ONP.js.map → chunk-Z7VAOK5X.js.map} +1 -1
package/dist/{chunk-W35FVJBC.js → chunk-ZDPIWKWD.js} +9 -5
package/dist/chunk-ZDPIWKWD.js.map +1 -0
package/dist/correlation-id.cjs +11 -11
package/dist/correlation-id.js +3 -3
package/dist/decorators.cjs +5 -5
package/dist/decorators.js +4 -4
package/dist/event.cjs +7 -7
package/dist/event.js +4 -4
package/dist/functional.cjs +11 -11
package/dist/functional.d.cts +20 -17
package/dist/functional.d.ts +20 -17
package/dist/functional.js +4 -4
package/dist/http.cjs +4 -4
package/dist/http.js +3 -3
package/dist/index.cjs +226 -92
package/dist/index.cjs.map +1 -1
package/dist/index.d.cts +67 -3
package/dist/index.d.ts +67 -3
package/dist/index.js +138 -15
package/dist/index.js.map +1 -1
package/dist/instrumentation.cjs +9 -9
package/dist/instrumentation.js +2 -2
package/dist/messaging.cjs +8 -8
package/dist/messaging.js +5 -5
package/dist/semantic-helpers.cjs +9 -9
package/dist/semantic-helpers.js +5 -5
package/dist/webhook.cjs +6 -6
package/dist/webhook.js +4 -4
package/dist/workflow-distributed.cjs +6 -6
package/dist/workflow-distributed.js +4 -4
package/dist/workflow.cjs +9 -9
package/dist/workflow.js +5 -5
package/package.json +43 -45
package/skills/analyze-traces/SKILL.md +178 -0
package/skills/autotel-core/SKILL.md +0 -7
package/skills/autotel-events/SKILL.md +0 -6
package/skills/autotel-frameworks/SKILL.md +0 -9
package/skills/autotel-instrumentation/SKILL.md +0 -7
package/skills/autotel-request-logging/SKILL.md +0 -8
package/skills/autotel-structured-errors/SKILL.md +0 -7
package/skills/build-audit-trails/SKILL.md +302 -0
package/skills/debug-missing-spans/SKILL.md +248 -0
package/skills/migrate-to-autotel/SKILL.md +268 -0
package/skills/review-otel-patterns/SKILL.md +488 -0
package/skills/review-otel-patterns/references/code-review.md +75 -0
package/skills/review-otel-patterns/references/processor-pipeline.md +205 -0
package/skills/review-otel-patterns/references/structured-errors.md +102 -0
package/skills/review-otel-patterns/references/wide-spans.md +85 -0
package/skills/tune-sampling/SKILL.md +210 -0
package/src/attribute-redacting-processor.test.ts +6 -4
package/src/attribute-redacting-processor.ts +11 -2
package/src/drain-toolkit.test.ts +113 -0
package/src/drain-toolkit.ts +129 -0
package/src/enricher-toolkit.test.ts +67 -0
package/src/enricher-toolkit.ts +79 -0
package/src/functional.test.ts +18 -0
package/src/functional.ts +32 -20
package/src/index.ts +19 -0
package/src/redact-values.test.ts +24 -10
package/src/redact-values.ts +9 -2
package/src/request-logger.test.ts +91 -0
package/src/request-logger.ts +36 -2
package/src/structured-error.test.ts +4 -1
package/bin/intent.js +0 -6
package/dist/chunk-563EL6O6.cjs.map +0 -1
package/dist/chunk-CMNGGTQL.cjs.map +0 -1
package/dist/chunk-DAAJLUTO.js.map +0 -1
package/dist/chunk-MOK3E54E.cjs.map +0 -1
package/dist/chunk-TDNKIHKT.js.map +0 -1
package/dist/chunk-W35FVJBC.js.map +0 -1
package/src/package-manifest.test.ts +0 -24

package/skills/review-otel-patterns/references/processor-pipeline.md ADDED Viewed

@@ -0,0 +1,205 @@
+# Processor pipeline cookbook
+Composable building blocks for the autotel pipeline. Each helper is small enough to reason about in isolation and isolates errors so a single bad processor cannot break the others.
+## Primitives
+| Helper                       | Type              | Purpose                                                      |
+| ---------------------------- | ----------------- | ------------------------------------------------------------ |
+| `defineConfig(config)`       | identity          | Authoring helper for typed config                            |
+| `composeSpanProcessors([…])` | `SpanProcessor`   | Fan span lifecycle to multiple processors                    |
+| `composePostProcessors([…])` | `PostProcessorFn` | Chain post-processors (each sees the output of the previous) |
+| `composeSubscribers([…])`    | `EdgeSubscriber`  | Fire in-process side effects in order                        |
+All of these helpers are exported from `autotel-edge`.
+## Multi-backend export
+```typescript
+import { BatchSpanProcessor } from 'autotel/processors';
+import { OTLPHttpJsonExporter } from 'autotel/exporters';
+import { composeSpanProcessors, defineConfig } from 'autotel-edge';
+const honeycomb = new BatchSpanProcessor(
+  new OTLPHttpJsonExporter({
+    url: 'https://api.honeycomb.io/v1/traces',
+    headers: { 'x-honeycomb-team': process.env.HONEYCOMB_KEY! },
+  }),
+);
+const grafana = new BatchSpanProcessor(
+  new OTLPHttpJsonExporter({
+    url: process.env.GRAFANA_OTLP_URL!,
+    headers: { authorization: `Basic ${process.env.GRAFANA_AUTH!}` },
+  }),
+);
+export const config = defineConfig({
+  service: { name: 'checkout' },
+  spanProcessors: composeSpanProcessors([honeycomb, grafana]),
+});
+```
+## Tail sampling: keep errors + slow + 10% otherwise
+```typescript
+import { TailSamplingProcessor } from 'autotel/processors';
+import { composeSpanProcessors } from 'autotel-edge';
+const tail = new TailSamplingProcessor({
+  keep: (trace) => {
+    if (trace.localRootSpan.status?.code === SpanStatusCode.ERROR) return true;
+    if (trace.localRootSpan.duration[0] > 1) return true; // > 1s
+    return Math.random() < 0.1;
+  },
+});
+spanProcessors: composeSpanProcessors([new BatchSpanProcessor(otlp), tail]);
+```
+## Drop noisy spans before they reach the batcher
+```typescript
+import { FilteringSpanProcessor } from 'autotel/processors';
+const dropHealth = new FilteringSpanProcessor({
+  exclude: (span) => /^GET \/(healthz|ready)$/.test(span.name),
+});
+spanProcessors: composeSpanProcessors([
+  dropHealth,
+  new BatchSpanProcessor(otlp),
+]);
+```
+## Bound URL cardinality
+```typescript
+import { SpanNameNormalizingProcessor } from 'autotel/processors';
+const normalise = new SpanNameNormalizingProcessor({
+  // Replace UUIDs and 24-char hex ids with placeholders
+  replacements: [
+    {
+      match: /[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}/g,
+      with: ':id',
+    },
+    { match: /[0-9a-f]{24}/g, with: ':id' },
+  ],
+});
+```
+Now `GET /users/123e4567-e89b-12d3-a456-426614174000/orders` becomes `GET /users/:id/orders` in your traces — fewer unique span names, dramatically faster queries.
+## Lift baggage onto every span
+```typescript
+import { BaggageSpanProcessor } from 'autotel/processors';
+// Anything placed in baggage upstream becomes an attribute on every child span
+const baggage = new BaggageSpanProcessor({ keys: ['tenant', 'feature_flags'] });
+spanProcessors: composeSpanProcessors([baggage, new BatchSpanProcessor(otlp)]);
+```
+## Subscribers for in-process side effects
+Subscribers run synchronously in the parent context — ideal for metrics, audit, and cost calculation that you want recorded **before** the span goes to the batcher.
+```typescript
+import type { EdgeSubscriber } from 'autotel-edge';
+import { composeSubscribers } from 'autotel-edge';
+const metricsSubscriber: EdgeSubscriber = (event) => {
+  if (
+    event.kind === 'span.end' &&
+    event.span.attributes['http.response.status_code'] >= 500
+  ) {
+    metrics.errorCounter.add(1, { route: event.span.name });
+  }
+};
+const auditSubscriber: EdgeSubscriber = (event) => {
+  if (event.kind === 'span.end' && event.span.name.startsWith('admin.')) {
+    audit.write({
+      kind: event.span.name,
+      actor: event.span.attributes['user.id'],
+    });
+  }
+};
+subscribers: [composeSubscribers([metricsSubscriber, auditSubscriber])];
+```
+## Post-processors for last-mile rewrites
+Post-processors mutate the array of spans **after** sampling, just before export. Use them for redacting stack traces, dropping fields, or annotating spans with deployment info.
+```typescript
+import type { PostProcessorFn } from 'autotel-edge';
+import { composePostProcessors } from 'autotel-edge';
+import { createStringRedactor } from 'autotel';
+const redactStacks = createStringRedactor('strict');
+const cleanStacks: PostProcessorFn = (spans) =>
+  spans.map((s) => {
+    if (typeof s.attributes['exception.stacktrace'] === 'string') {
+      s.attributes['exception.stacktrace'] = redactStacks(
+        s.attributes['exception.stacktrace'],
+      );
+    }
+    return s;
+  });
+const tagDeploy: PostProcessorFn = (spans) =>
+  spans.map((s) => ({
+    ...s,
+    attributes: { ...s.attributes, 'deploy.id': process.env.RELEASE! },
+  }));
+postProcessor: composePostProcessors([cleanStacks, tagDeploy]);
+```
+## Putting it all together
+```typescript
+import {
+  defineConfig,
+  composeSpanProcessors,
+  composeSubscribers,
+  composePostProcessors,
+} from 'autotel-edge';
+export const otelConfig = defineConfig({
+  service: { name: 'checkout' },
+  attributeRedactor: 'strict',
+  spanProcessors: composeSpanProcessors([
+    dropHealth, // 1. drop spans we never want
+    normaliseUrls, // 2. bound cardinality
+    new BatchSpanProcessor(honeycomb),
+    new BatchSpanProcessor(grafana),
+    tailSampler, // 3. keep errors + slow + 10%
+  ]),
+  subscribers: [
+    composeSubscribers([metricsSubscriber, auditSubscriber, aiCostSubscriber]),
+  ],
+  postProcessor: composePostProcessors([cleanStacks, tagDeploy]),
+});
+```
+## Error isolation
+Every compose helper catches errors per item and logs to `console.error` with the helper name. A single bad processor cannot break the others — important when one of your subscribers is a third-party integration (Datadog, PagerDuty, …) that can rate-limit or 502.
+## Choosing between subscribers and post-processors
+| You want…                                 | Use                                                        |
+| ----------------------------------------- | ---------------------------------------------------------- |
+| Mutate exported span attributes           | `postProcessor`                                            |
+| Drop spans entirely                       | `FilteringSpanProcessor` (early) or tail sampler           |
+| Update an in-process metric on every span | `subscribers`                                              |
+| Send an audit log to a DB                 | `subscribers` (use `log.fork('audit')` if writes are slow) |
+| Re-emit spans to a second backend         | second `BatchSpanProcessor` in `composeSpanProcessors`     |

package/skills/review-otel-patterns/references/structured-errors.md ADDED Viewed

@@ -0,0 +1,102 @@
+# Structured errors
+`createStructuredError` produces an `Error` carrying enough context to be:
+- **Recorded onto the active span** (`exception.type`, `exception.message`, `exception.stacktrace`, `span.status = ERROR`).
+- **Returned to clients safely** (`internal` and `cause` are stripped by `parseError`).
+- **Self-documenting** (`why` explains the cause, `fix` tells the caller what to do, `link` points at runbook docs).
+## Field reference
+| Field      | Audience    | Purpose                                                    |
+| ---------- | ----------- | ---------------------------------------------------------- |
+| `message`  | Both        | Short, stable summary                                      |
+| `status`   | Both        | HTTP status (drives client behaviour and span status code) |
+| `why`      | Both        | Human-readable cause (`"Card declined by issuer"`)         |
+| `fix`      | Client      | Remediation hint (`"Use a different payment method"`)      |
+| `link`     | Client      | URL to docs / runbook                                      |
+| `code`     | Both        | Machine-readable code (`"PAYMENT_DECLINED"`)               |
+| `cause`    | Server only | The underlying error                                       |
+| `internal` | Server only | Diagnostic metadata (`{ correlationId, resourceId }`)      |
+| `details`  | Both        | Structured payload (e.g. validation errors per field)      |
+## Templates
+### Validation (400)
+```typescript
+throw createStructuredError({
+  status: 400,
+  code: 'VALIDATION_ERROR',
+  message: 'Invalid request body',
+  why: 'One or more fields failed validation',
+  fix: 'Check the `details` field for per-field errors',
+  details: { email: 'must be a valid email', age: 'must be ≥ 18' },
+});
+```
+### Auth (401 / 403)
+```typescript
+throw createStructuredError({
+  status: 403,
+  code: 'FORBIDDEN',
+  message: 'Not allowed',
+  why: 'You do not have access to this resource',
+  fix: 'Ask the workspace owner for access',
+  link: 'https://docs.example.com/permissions',
+  internal: { resourceId: 'proj_123', userRole: 'member' },
+});
+```
+### Payment (402)
+```typescript
+throw createStructuredError({
+  status: 402,
+  code: 'PAYMENT_DECLINED',
+  message: 'Payment declined',
+  why: 'Card declined by issuer — insufficient funds',
+  fix: 'Use a different payment method or contact your bank',
+  link: 'https://docs.example.com/payments/declined',
+  cause: stripeError,
+  internal: { stripeChargeId: 'ch_…', riskScore: stripeError.risk_level },
+});
+```
+### Upstream failure (502 / 503 / 504)
+```typescript
+throw createStructuredError({
+  status: 502,
+  code: 'UPSTREAM_FAILED',
+  message: 'Inventory service is unavailable',
+  why: 'Could not reach the inventory service',
+  fix: 'Retry in a few minutes',
+  cause: fetchError,
+  internal: { upstream: 'inventory-svc', retryAttempt: 3 },
+});
+```
+## At HTTP boundaries
+```typescript
+import { parseError } from 'autotel';
+app.onError((error, c) => {
+  // span.status is already ERROR with exception fields recorded
+  const parsed = parseError(error);
+  // `internal` and `cause` are stripped here — never leak them to clients
+  return c.json(parsed, parsed.status);
+});
+```
+## Anti-patterns
+| Anti-pattern                                                 | Fix                                                                                    |
+| ------------------------------------------------------------ | -------------------------------------------------------------------------------------- |
+| `throw new Error('something went wrong')`                    | `createStructuredError({ message, status, why, fix })`                                 |
+| Putting support IDs in `message` (`"Failed for user 42"`)    | Use `internal: { userId: 42 }`                                                         |
+| Returning `details: { error: stack }` to clients             | Stack traces stay in `cause` / span; never serialise them out                          |
+| `console.error(e); throw e`                                  | Just throw — autotel's span will pick up the exception                                 |
+| Two callers throwing different shapes for the same condition | Centralise: `function declined(reason: string) { throw createStructuredError({ … }) }` |

package/skills/review-otel-patterns/references/wide-spans.md ADDED Viewed

@@ -0,0 +1,85 @@
+# Designing wide spans
+A wide span is a single span per logical unit of work (request, job, message, fork) carrying _all_ the fields you'd ever want to filter or group by. autotel lets you build them with `useLogger().set({ … })` — fields are flattened to OTel attributes with stable dotted keys.
+## Anatomy
+```typescript
+import { useLogger } from 'autotel';
+export const POST = withAutotel(async (request) => {
+  const log = useLogger();
+  // Identity
+  log.set({ user: { id: 'usr_123', plan: 'enterprise', role: 'admin' } });
+  // Inputs
+  log.set({ cart: { items: 3, total: 14_999, currency: 'USD' } });
+  // Decisions / branches
+  log.set({ promo: { applied: 'SUMMER10', discount: 1_500 } });
+  // Outputs
+  log.set({
+    payment: { provider: 'stripe', method: 'card', authCode: 'auth_x' },
+  });
+  return Response.json({ ok: true });
+});
+```
+OTel attributes recorded:
+```
+user.id=usr_123
+user.plan=enterprise
+user.role=admin
+cart.items=3
+cart.total=14999
+cart.currency=USD
+promo.applied=SUMMER10
+promo.discount=1500
+payment.provider=stripe
+payment.method=card
+payment.authCode=auth_x
+```
+## Rules of thumb
+1. **One wide span per logical unit of work.** Many tiny spans hurt query speed; deep call trees can be opt-in (`autotel-drizzle`, `autotel-mongoose`).
+2. **Group with objects.** `{ user: { id, plan } }` not `userId` / `userPlan`. The flatten step keeps the key shape stable.
+3. **Capture decisions, not just inputs.** Which branch ran, which promo applied, which fallback fired.
+4. **Keep cardinality bounded.** Don't put per-request UUIDs in `span.name`; use `SpanNameNormalizingProcessor`. Free-text labels go in attributes.
+5. **Avoid raw bodies.** Pick the shape: `{ user: { id, plan } }` — never `log.set({ user: requestBody })`.
+6. **Trust the redactor.** PII you forgot to think about (emails, JWTs, cards) gets masked in production. See `attributeRedactor: 'default'`.
+## When you need correlated child spans
+Use `trace()` to wrap discrete sub-operations whose duration matters:
+```typescript
+import { trace } from 'autotel';
+const fetchInventory = trace(async (sku: string) => {
+  /* … */
+});
+const reserveStock = trace(async (sku: string, qty: number) => {
+  /* … */
+});
+await fetchInventory(sku);
+await reserveStock(sku, qty);
+```
+Each gets its own span with the function name; both are children of the active request span.
+## When you need background work
+`log.fork('label', fn)` spawns a child span that emits its own wide event with `_parentCorrelationId` set, even after the parent response has been returned. Pass `lifecycle.onChildEnter / onChildExit` if your framework tracks active loggers (Elysia, etc.).
+```typescript
+log.fork('audit-write', async () => {
+  await audit.write({ kind: 'order.created', orderId });
+});
+return Response.json({ ok: true }); // parent returns immediately
+```

package/skills/tune-sampling/SKILL.md ADDED Viewed

@@ -0,0 +1,210 @@
+---
+name: tune-sampling
+description: >
+  Choose a sampling strategy for an autotel-instrumented service. Covers
+  head sampling (per-span-kind rates, parent-based, ratio), tail sampling
+  (keep errors, slow, AI-aware, debug-headers), cost vs cardinality
+  tradeoffs, and the math for picking rates that hit a target spans/second
+  budget. Includes recipes for low-volume admin services, high-volume APIs,
+  AI agents, and Cloudflare Workers.
+license: MIT
+---
+# Tune sampling
+Untuned tracing is either expensive (100 % at scale costs money + drowns dashboards) or unhelpful (1 % loses the failure modes you need to see). The right answer is almost always **head sample most of the boring traffic, tail keep all the interesting traffic**, with explicit overrides for AI calls and customer escalations.
+## When to use
+- Hitting your observability budget
+- Dashboards too sparse to spot anomalies
+- "We have the trace IDs but the spans are gone" complaints
+- New service launching at scale
+- Long-running AI agents producing 50+ spans per request
+## The mental model
+```
+Total cost = (spans/sec × $/span) + (storage_GB × $/GB-month)
+                   ↑
+Head sampling reduces this directly.
+```
+Head sampling makes a decision **at span start** — fast, but coarse (it doesn't know if the span will fail).
+Tail sampling makes the decision **at trace end**, once the full trace (root span + children) can be inspected — slower, more storage upfront, but precise.
+The right mix:
+- **Head sample at the entry point** to keep volume tractable.
+- **Tail keep** the high-value subset (errors, slow, AI, debug-headered).
+- **Don't sample audit spans** — separate processor, see [`build-audit-trails`](../build-audit-trails/SKILL.md).
+## Head sampling recipes
+### Default for a typical web service
+```typescript
+init({
+  service: 'my-app',
+  sampling: {
+    rates: {
+      server: 25, // server entry spans — sample ¼
+      client: 5, // outbound HTTP — sample 1/20
+      internal: 5, // internal sub-spans — sample 1/20
+    },
+  },
+});
+```
+Children of a sampled root are **all** kept (parent-based propagation is the default). So `server: 25` means 25 % of _user requests_, complete trace each.
+### High-volume API (>1 k req/s)
+```typescript
+sampling: {
+  rates: { server: 5, client: 1, internal: 1 }, // 5 % → tail keeps errors anyway
+  tail: keepInterestingTraces,
+},
+```
+### Low-volume admin / internal service (<10 req/s)
+100 % is fine. Don't penalise yourself for a service that produces 1 GB of traces a week.
+### Cloudflare Workers (per-colo budget)
+Workers run distributed — head sampling is your friend because there's no central queue:
+```typescript
+defineWorkerFetch(
+  {
+    service: { name: 'edge' },
+    sampling: { rates: { server: 10 } }, // 10 % per colo, scales naturally
+  },
+  handler,
+);
+```
+## Tail sampling — keep interesting traces
+Tail sampling looks at the full trace (root span + children) before deciding. autotel ships `TailSamplingProcessor`:
+```typescript
+import { TailSamplingProcessor } from 'autotel/processors';
+import { SpanStatusCode } from '@opentelemetry/api';
+const tail = new TailSamplingProcessor({
+  keep: (trace) => {
+    // 1. Always keep errors
+    if (trace.localRootSpan.status?.code === SpanStatusCode.ERROR) return true;
+    if (trace.spans.some((s) => s.status?.code === SpanStatusCode.ERROR))
+      return true;
+    // 2. Always keep slow traces (configurable threshold)
+    if (durationMs(trace.localRootSpan) > 1_000) return true;
+    // 3. Always keep customer-marked traces
+    if (trace.localRootSpan.attributes['debug.trace'] === true) return true;
+    // 4. Always keep AI traces (rare + expensive — full visibility helps)
+    if (
+      trace.spans.some((s) => typeof s.attributes['gen_ai.system'] === 'string')
+    )
+      return true;
+    // 5. Otherwise: respect head sampling decision
+    return false;
+  },
+});
+```
+### Combining with multi-backend
+```typescript
+spanProcessors: composeSpanProcessors([
+  // Drop nothing here — we want the tail processor to see the full trace
+  new BatchSpanProcessor(localExporter),
+  tail, // filters before remote export
+  new BatchSpanProcessor(expensiveRemoteExporter),
+]);
+```
+## AI / LLM-aware sampling
+LLM calls produce 5–50 spans per request and are 100× more expensive than a typical handler call. Tradeoffs:
+- **Don't head-sample AI handlers below 50 %** — debugging "why did the model loop" requires the full chain.
+- **Always tail-keep AI traces** — the `gen_ai.*` attributes flag them.
+- **Cost-aware sampling** — keep all calls above a $ threshold:
+```typescript
+keep: (trace) => {
+  const cost = trace.spans.reduce(
+    (acc, s) =>
+      acc +
+      (typeof s.attributes['gen_ai.cost.usd'] === 'number'
+        ? (s.attributes['gen_ai.cost.usd'] as number)
+        : 0),
+    0,
+  );
+  if (cost > 0.1) return true; // any trace > $0.10 → keep
+  if (cost > 0.01) return Math.random() < 0.5; // > $0.01 → 50 %
+  return Math.random() < 0.1; // < $0.01 → 10 %
+};
+```
+## Customer-driven sampling (debug header)
+Let support flip on full tracing per request:
+```typescript
+const tail = new TailSamplingProcessor({
+  keep: (trace) => trace.localRootSpan.attributes['x-debug-trace'] === '1' || /* … */,
+})
+```
+In your middleware:
+```typescript
+if (request.headers.get('x-debug-trace') === '1') {
+  useLogger().set({ 'x-debug-trace': '1' });
+}
+```
+Now any user can mark a request as "trace this fully" by sending the header — invaluable for reproducing customer reports.
+## Sizing the rate
+Target volume:
+```
+spans/sec ≈ requests/sec × spans_per_request × head_rate × tail_keep_rate
+```
+Worked example for a 100 req/s API with 8 spans/req:
+| Head rate | Tail keep                        | Result                                       |
+| --------- | -------------------------------- | -------------------------------------------- |
+| 100 %     | 100 %                            | 800 spans/sec — expensive                    |
+| 10 %      | 100 % (errors + slow + AI ≈ 5 %) | ≈ 110 spans/sec — sweet spot                 |
+| 1 %       | 100 %                            | ≈ 18 spans/sec — too sparse for p99 alerting |
+For per-vendor pricing:
+- **Honeycomb**: $0.000005 / event for paid plans. 110 spans/sec × 86 400 s = 9.5 M events/day = $48/day.
+- **Datadog APM**: ~$1.27/M spans ingested (varies by region). Same volume → ~$12/day.
+- **Grafana Cloud**: 100 GB free tier; 110 spans/sec ≈ 5 GB/day.
+## Anti-patterns
+| Anti-pattern                                 | Fix                                                           |
+| -------------------------------------------- | ------------------------------------------------------------- |
+| 100 % sampling at scale "to be safe"         | You're paying 10–100× without proportional value              |
+| 1 % sampling with no tail keep               | You'll miss every interesting failure                         |
+| Forgetting to tail-keep errors               | Errored traces get sampled out → silent customer pain         |
+| Same rate for `server` and `internal`        | Internal sub-spans are 5–20× more numerous; sample harder     |
+| Ratio-based sampling on service entry point  | Use parent-based — children of a sampled trace stay together  |
+| Head-sampling AI calls below 50 %            | Debugging tool loops requires the full chain                  |
+| Audit spans subject to sampling              | Route them to a separate processor (see `build-audit-trails`) |
+| Tail processor before exporter (loses spans) | Tail processor goes between head sampler and remote exporter  |
+| Rate-by-route hand-coded in handlers         | Use head sampler + tail keep — declarative, one place         |

package/src/attribute-redacting-processor.test.ts CHANGED Viewed

@@ -184,8 +184,9 @@ describe('AttributeRedactingProcessor', () => {
         });
         processor.onEnd(span);
+        // SSN has no smart mask; falls back to the default replacement.
         expect(mockProcessor.endedSpans[0]!.attributes['user.ssn']).toBe(
-          '*******89',
+          '[REDACTED]',
         );
       });
@@ -199,8 +200,9 @@ describe('AttributeRedactingProcessor', () => {
         });
         processor.onEnd(span);
+        // PCI-DSS compliant: last 4 digits preserved.
         expect(mockProcessor.endedSpans[0]!.attributes['payment.card']).toBe(
-          '**************11',
+          '****1111',
         );
       });
@@ -710,12 +712,12 @@ describe('edge cases', () => {
     });
     const span = createMockReadableSpan({
-      contacts: 'Email: john@example.com, Phone: 555-123-4567',
+      contacts: 'Email: john@example.com, Phone: +1 555-123-4567',
     });
     processor.onEnd(span);
     expect(mockProcessor.endedSpans[0]!.attributes.contacts).toBe(
-      'Email: j***@***.com, Phone: ********67',
+      'Email: j***@***.com, Phone: +1******67',
     );
   });
 });

package/src/attribute-redacting-processor.ts CHANGED Viewed

@@ -147,10 +147,19 @@ export const builtinPatterns = {
       /\b(?!0\.0\.0\.0\b)(?!127\.0\.0\.1\b)\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3}\b/g,
     mask: (m: string) => `***.***.***.${m.split('.').pop()}`,
   },
-  /** International phone numbers → +33******78 (country code + last 2 digits) */
+  /**
+   * International / formatted phone numbers.
+   *
+   * Matches:
+   * - `+33 1 23 45 67 89` -> `+33******89`
+   * - `(415) 555-1234` -> `********34`
+   * - `555-123-4567` / `555.123.4567` / `5551234567` -> `********67`
+   *
+   * Bare short digit runs like `12345678` are intentionally not matched.
+   */
   phone: {
     pattern:
-      /(?:\+\d{1,3}[\s.-]?)?\(?\d{1,4}\)?[\s.-]?\d{2,4}[\s.-]?\d{2,4}[\s.-]?\d{2,4}\b/g,
+      /(?:\+\d{1,3}[\s.-]?\(?\d{1,4}\)?(?:[\s.-]?\d{2,4}){2,4}|\(\d{1,4}\)(?:[\s.-]?\d{2,4}){2,4}|\b\d{3}[-.]?\d{3}[-.]?\d{4}\b)/g,
     mask: (m: string) => {
       const digits = m.replace(/[^\d]/g, '');
       const hasPlus = m.startsWith('+');