@heystack/otel 0.7.0 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/README.md CHANGED
@@ -90,7 +90,7 @@ export default instrument(
90
90
  getUser: (req) => ({
91
91
  id: req.headers.get("x-user-id") ?? undefined,
92
92
  }),
93
- instrumentBindings: true, // auto-trace D1/KV/R2/Vectorize
93
+ instrumentBindings: true, // auto-trace D1/KV/R2/Vectorize/AI/Queues/Service bindings
94
94
  },
95
95
  );
96
96
  ```
@@ -116,7 +116,7 @@ Set the key as a secret: `wrangler secret put HEYSTACK_API_KEY`.
116
116
  | `service` | `string` | **Required.** Service name that appears in the Heystack console. |
117
117
  | `apiKey` | `string?` | Defaults to `env.HEYSTACK_API_KEY`. |
118
118
  | `getUser` | `(req: Request) => { id?, session?, requestId? } \| undefined` | Called per request. `id` → `enduser.id`, `session` → `session.id`, `requestId` → `http.request.id` (falls back to the `cf-ray` header). |
119
- | `instrumentBindings` | `boolean \| string[]` | `true` = auto child spans for all detected D1/KV/R2/Vectorize bindings; `string[]` = only the named bindings. Default `false`. |
119
+ | `instrumentBindings` | `boolean \| string[]` | `true` = auto child spans for all detected D1 / KV / R2 / Vectorize / Workers AI / Queue producer / Service bindings; `string[]` = only the named bindings. Default `false`. |
120
120
  | `sampling` | `{ rate?: number } \| { remote: true }` | Head-sampling configuration. `{ rate }`: keep a deterministic fraction of fresh root traces (0–1; default `1` = keep all). `{ remote: true }`: fetch the rate from the Heystack config endpoint instead — lets you change it centrally without redeploying. Cold isolates keep all traffic until the first config fetch resolves; fails open if the config can't be reached. Parent-respecting in both modes: a request arriving with a sampled `traceparent` is always recorded. See [Head sampling](#head-sampling) below. |
121
121
  | `waitUntil` | `(p: Promise<unknown>) => void` | Override the isolate keep-alive hook; defaults to the auto-detected `ctx.waitUntil`. |
122
122
  | `endpoint` | `string?` | Override the ingest endpoint (advanced). |
@@ -159,7 +159,7 @@ On startup the worker fetches its configured rate from the Heystack config endpo
159
159
  - **Outbound `fetch`** — each outbound subrequest while a request span is active gets a CLIENT child span (`http.request.method`, `url.full`, `server.address`, `http.response.status_code`). A W3C `traceparent` header is injected into the subrequest so a downstream Heystack-instrumented service continues the same trace (distributed tracing across services). The exporter's own ingest POST is never traced.
160
160
  - **Queue consumers (`queue`)** — a CONSUMER span per batch, with `messaging.destination.name` (queue name) and `messaging.batch.message_count`.
161
161
  - **Scheduled handlers (`scheduled`)** — an INTERNAL span per invocation, with `controller.cron`.
162
- - **Binding calls** (when `instrumentBindings` is set) — a child span for every D1 query (`db.statement`), KV read/write, R2 operation, and Vectorize query.
162
+ - **Binding calls** (when `instrumentBindings` is set) — a child span for every D1 query (`db.statement`), KV read/write, R2 operation, Vectorize query, Workers AI inference (`gen_ai.*` attributes including model name and token usage), Queue `.send`/`.sendBatch` (PRODUCER spans with `messaging.*` attributes), and Service binding `.fetch` calls (CLIENT spans with `traceparent` injected so calls to other Workers stitch into the same distributed trace).
163
163
 
164
164
  ### Client enrichment
165
165
 
@@ -305,6 +305,7 @@ As belt-and-suspenders the exporter also drops any span whose HTTP target points
305
305
 
306
306
  ## Migration / versioning
307
307
 
308
+ - **`0.8.0`** — **`/workers`: Workers AI, Queue producer, and Service binding instrumentation.** `instrumentBindings: true` now auto-wraps three additional binding types: `env.AI.run()` emits CLIENT spans with `gen_ai.system`, `gen_ai.request.model`, and `gen_ai.usage.input_tokens`/`output_tokens` (streaming results are never consumed); Queue `.send`/`.sendBatch` emit PRODUCER spans with `messaging.*` attributes including batch size; Service binding `.fetch` emits a CLIENT span and injects a W3C `traceparent` header into the outgoing request so calls to other Workers appear in the same distributed trace. `startSpan` factory now accepts an optional `SpanKind` for correct CLIENT/PRODUCER categorisation. No breaking changes.
308
309
  - **`0.7.0`** — **`/workers`: remote sampling (`sampling: { remote: true }`).** New `sampling` variant that fetches the head-sampling rate from the Heystack config endpoint at runtime, so you can change it from the console without redeploying. Cold isolates keep all traffic until the first config fetch resolves (fails open). If the config endpoint is unreachable, the worker keeps everything. Same parent-respecting rule as `sampling: { rate }`. No breaking changes; existing `sampling: { rate }` configs are unchanged.
309
310
  - **`0.6.0`** — **`/workers`: head sampling (`sampling: { rate }`).** New optional `WorkersConfig` field: `sampling.rate` (0–1, default `1`). Keeps a deterministic fraction of fresh root traces — the drop decision is made in the worker before export (no egress, no ingest cost). Parent-respecting: requests arriving with a sampled `traceparent` are always recorded. Consistent with server-side sampling (same trace-ID hash). No breaking changes; all new options are optional. See [Head sampling](#head-sampling).
310
311
  - **`0.5.0`** — **`/workers`: identity enrichment, binding tracing, outbound-fetch tracing, manual span helpers.** New `WorkersConfig` options: `getUser` (attach `enduser.id`/`session.id`/`http.request.id` per request from a synchronous callback), `instrumentBindings` (auto child spans for D1/KV/R2/Vectorize — `true` = all detected, or a `string[]` to select). Outbound `fetch` calls made inside a traced handler automatically get CLIENT child spans with `traceparent` injection (distributed tracing across services). New ergonomic exports from `/workers`: `withSpan(name, attrs?, fn)` runs a function inside a named child span (auto-parented, exceptions recorded, `span.end()` in `finally`); `addEvent(name, attrs?)` adds an event to the active span. No breaking changes; all new options are optional.
@@ -1,33 +1,51 @@
1
- import { type Span } from "@opentelemetry/api";
1
+ import { SpanKind, type Span } from "@opentelemetry/api";
2
2
  export interface InstrumentBindingsOpts {
3
3
  /**
4
4
  * Factory that creates and starts a new child span. Called at binding method
5
5
  * invocation time (inside the traced handler scope), so `context.active()`
6
6
  * at that moment correctly parents to the root span.
7
7
  *
8
- * For integration: pass `(name, attrs) => tracer.startSpan(name, { attributes: attrs }, context.active())`.
8
+ * For integration: pass `(name, attrs, kind) => tracer.startSpan(name, { attributes: attrs, kind }, context.active())`.
9
9
  * For unit tests: inject a fake so no global provider is required.
10
10
  */
11
- startSpan: (name: string, attrs: Record<string, unknown>) => Span;
11
+ startSpan: (name: string, attrs: Record<string, unknown>, kind?: SpanKind) => Span;
12
12
  /**
13
- * `true` → auto-detect and wrap all D1/KV/R2/Vectorize bindings.
13
+ * `true` → auto-detect and wrap all D1/KV/R2/Vectorize/AI/Queue/Service bindings.
14
14
  * `string[]` → only wrap bindings whose env key is listed.
15
15
  */
16
16
  select: boolean | string[];
17
17
  }
18
+ /**
19
+ * Build a new args array for `fetch(input, init?)` with a `traceparent` header
20
+ * injected WITHOUT mutating the caller's original Request or init object.
21
+ *
22
+ * - `Request` first arg → rebuilt as `new Request(original, { headers })`.
23
+ * - String/URL first arg → spread a new init object with an augmented Headers.
24
+ */
25
+ export declare function injectTraceparentArgs(args: any[], traceparent: string): any[];
18
26
  /**
19
27
  * Wrap an env object's Cloudflare bindings so that each binding operation
20
28
  * emits a child span under the currently-active OTel context.
21
29
  *
22
- * Detects binding type by duck-typing (D1: `prepare`; KV: `get`+`put`+`list`;
23
- * R2: `get`+`put`+`head`; Vectorize: `query`+`upsert`). Unrecognised bindings
24
- * are passed through unchanged.
30
+ * Detects binding type by duck-typing:
31
+ * - D1: `prepare`
32
+ * - R2: `get`+`put`+`head`
33
+ * - KV: `get`+`put`+`list`
34
+ * - Vectorize: `query`+`upsert`
35
+ * - Workers AI: `run` (without `prepare`)
36
+ * - Queue producer: `send`+`sendBatch`
37
+ * - Service binding / Fetcher: `fetch` (last branch; most generic)
38
+ *
39
+ * Unrecognised bindings are passed through unchanged.
25
40
  *
26
41
  * Each wrapped binding is a `Proxy` over the original — non-wrapped prototype
27
42
  * methods fall through to the real binding so no functionality is lost.
28
43
  *
44
+ * Service-binding spans inject a W3C `traceparent` header into outgoing
45
+ * requests so calls to other Workers stitch into one distributed trace.
46
+ *
29
47
  * @param env - The Worker env / binding bag.
30
- * @param opts - `startSpan` factory + `select` filter.
48
+ * @param opts - `startSpan` factory (now accepts optional `SpanKind`) + `select` filter.
31
49
  * @returns A shallow copy of `env` with selected bindings replaced by proxies.
32
50
  */
33
51
  export declare function instrumentEnv<E extends Record<string, unknown>>(env: E, opts: InstrumentBindingsOpts): E;
@@ -1,13 +1,14 @@
1
1
  // ---------------------------------------------------------------------------
2
2
  // Cloudflare binding instrumentation for @heystack/otel/workers.
3
3
  //
4
- // Wraps D1, KV, R2, and Vectorize bindings with OTel child spans so that
5
- // every binding operation is visible as a child of the active request span.
4
+ // Wraps D1, KV, R2, Vectorize, Workers AI, Queue producers, and Service
5
+ // bindings with OTel child spans so that every binding operation is visible
6
+ // as a child of the active request span.
6
7
  //
7
8
  // WinterCG-safe: no `node:*` imports. Span factory is injected so the logic
8
9
  // is pure and unit-testable without a global provider.
9
10
  // ---------------------------------------------------------------------------
10
- import { context, SpanStatusCode } from "@opentelemetry/api";
11
+ import { context, SpanKind, SpanStatusCode } from "@opentelemetry/api";
11
12
  import { isTracingSuppressed } from "@opentelemetry/core";
12
13
  // ---------------------------------------------------------------------------
13
14
  // Duck-type detectors — conservative; require the distinctive method set
@@ -31,6 +32,24 @@ function isVectorizeLike(b) {
31
32
  return (typeof b?.query === "function" &&
32
33
  typeof b?.upsert === "function");
33
34
  }
35
/**
 * Duck-type check for a Workers AI binding.
 *
 * A candidate qualifies when it exposes a callable `run` and does NOT expose
 * a callable `prepare`. The `prepare` exclusion keeps a D1-shaped object from
 * ever being classified as Workers AI.
 *
 * @param b - Any value; `null`/`undefined` are tolerated and yield `false`.
 * @returns `true` when `b` looks like a Workers AI binding.
 */
function isWorkersAILike(b) {
    if (typeof b?.run !== "function") {
        return false;
    }
    return typeof b?.prepare !== "function";
}
43
/**
 * Duck-type check for a Queue producer binding.
 *
 * @param b - Any value; `null`/`undefined` are tolerated and yield `false`.
 * @returns `true` only when both `send` and `sendBatch` are callable on `b`.
 */
function isQueueLike(b) {
    for (const method of ["send", "sendBatch"]) {
        if (typeof b?.[method] !== "function") {
            return false;
        }
    }
    return true;
}
48
/**
 * Duck-type check for a Service binding / Fetcher.
 *
 * This is the most generic detector: any value with a callable `fetch`
 * matches. It carries no exclusions of its own, so callers must test the
 * more specific binding shapes before falling back to this one.
 *
 * @param b - Any value; `null`/`undefined` are tolerated and yield `false`.
 * @returns `true` when `b.fetch` is a function.
 */
function isServiceLike(b) {
    const candidate = b?.fetch;
    return typeof candidate === "function";
}
34
53
  // ---------------------------------------------------------------------------
35
54
  // Span lifecycle helper
36
55
  // ---------------------------------------------------------------------------
@@ -161,21 +180,153 @@ function wrapVectorize(binding, opts, indexName) {
161
180
  });
162
181
  }
163
182
  // ---------------------------------------------------------------------------
183
+ // Workers AI wrapper
184
+ // ---------------------------------------------------------------------------
185
/**
 * Wrap a Workers AI binding so that every `run(...)` call emits a CLIENT span.
 *
 * The span is named "AI run" and always carries `gen_ai.system`; when the
 * first argument is a string it is recorded as `gen_ai.request.model`. Token
 * usage is copied from `result.usage` on a best-effort basis. Errors thrown by
 * `run` are recorded on the span and re-thrown unchanged. The span is ended
 * as soon as `run` settles.
 *
 * @param binding - The original Workers AI binding.
 * @param opts - Instrumentation options; only `opts.startSpan` is used here.
 * @param _name - Env key of the binding (unused).
 * @returns The value produced by `makeProxy` for `binding` with `run` overridden.
 */
function wrapWorkersAI(binding, opts, _name) {
    // Copies token counts onto the span when the result carries a `usage`
    // object. Streams are skipped without being read. Any failure in here is
    // swallowed: an unexpected result shape must never break the caller.
    const recordUsage = (span, result) => {
        try {
            if (!result || typeof result !== "object") {
                return;
            }
            if (result instanceof ReadableStream) {
                return;
            }
            if (typeof result.usage !== "object") {
                return;
            }
            const usage = result.usage;
            if (typeof usage.prompt_tokens === "number") {
                span.setAttribute("gen_ai.usage.input_tokens", usage.prompt_tokens);
            }
            if (typeof usage.completion_tokens === "number") {
                span.setAttribute("gen_ai.usage.output_tokens", usage.completion_tokens);
            }
        }
        catch {
            // Intentionally ignored — see note above.
        }
    };
    const run = async (...args) => {
        // Suppressed context: call straight through without creating a span.
        if (isTracingSuppressed(context.active())) {
            return binding.run(...args);
        }
        const attrs = { "gen_ai.system": "cloudflare.workers_ai" };
        const model = args[0];
        if (typeof model === "string") {
            attrs["gen_ai.request.model"] = model;
        }
        const span = opts.startSpan("AI run", attrs, SpanKind.CLIENT);
        try {
            const result = await binding.run(...args);
            recordUsage(span, result);
            return result;
        }
        catch (err) {
            const isError = err instanceof Error;
            span.recordException(isError ? err : new Error(String(err)));
            span.setStatus({
                code: SpanStatusCode.ERROR,
                message: isError ? err.message : String(err),
            });
            throw err;
        }
        finally {
            span.end();
        }
    };
    return makeProxy(binding, { run });
}
234
+ // ---------------------------------------------------------------------------
235
+ // Queue producer wrapper
236
+ // ---------------------------------------------------------------------------
237
/**
 * Wrap a Queue producer binding so `send` and `sendBatch` emit PRODUCER spans.
 *
 * Both spans carry `messaging.system`, `messaging.destination.name` (set to
 * the `name` argument) and `messaging.operation`. `sendBatch` additionally
 * records `messaging.batch.message_count` when its first argument is an array.
 * When tracing is suppressed in the active context the call is forwarded
 * untouched.
 *
 * @param binding - The original Queue producer binding.
 * @param opts - Instrumentation options; only `opts.startSpan` is used here.
 * @param name - Value recorded as `messaging.destination.name`.
 * @returns The value produced by `makeProxy` for `binding` with both methods overridden.
 */
function wrapQueue(binding, opts, name) {
    // Fresh attribute bag per call so spans never share a mutable object.
    const attrsFor = (operation) => ({
        "messaging.system": "cloudflare_queues",
        "messaging.destination.name": name,
        "messaging.operation": operation,
    });
    const suppressed = () => isTracingSuppressed(context.active());
    const send = async (...args) => {
        if (suppressed()) {
            return binding.send(...args);
        }
        const span = opts.startSpan("Queue send", attrsFor("send"), SpanKind.PRODUCER);
        return runWithSpan(span, () => binding.send(...args));
    };
    const sendBatch = async (...args) => {
        if (suppressed()) {
            return binding.sendBatch(...args);
        }
        const attrs = attrsFor("sendBatch");
        const messages = args[0];
        if (Array.isArray(messages)) {
            attrs["messaging.batch.message_count"] = messages.length;
        }
        const span = opts.startSpan("Queue sendBatch", attrs, SpanKind.PRODUCER);
        return runWithSpan(span, () => binding.sendBatch(...args));
    };
    return makeProxy(binding, { send, sendBatch });
}
266
+ // ---------------------------------------------------------------------------
267
+ // Service binding / Fetcher wrapper + traceparent injection
268
+ // ---------------------------------------------------------------------------
269
/**
 * Build a new args array for `fetch(input, init?)` with a `traceparent` header
 * injected WITHOUT mutating the caller's original Request or init object.
 *
 * Where the header is placed depends on which header list the call will
 * actually use:
 *
 * - `Request` input and no `init.headers` → the request is rebuilt as
 *   `new Request(original, { headers })`; any `init` is forwarded unchanged.
 * - Any input WITH `init.headers` → the header goes into a copy of
 *   `init.headers`. Per the Fetch standard, `init.headers` replaces the
 *   Request's own headers, so a header injected only into the Request would
 *   be dropped.
 * - String/URL input without `init.headers` → a new init object is created
 *   (or the given one is shallow-copied) with a fresh `Headers`.
 *
 * Arguments after `init` are forwarded untouched.
 *
 * @param args - The positional arguments originally passed to `fetch`.
 * @param traceparent - The W3C `traceparent` header value to set.
 * @returns A new args array; `args` and its elements are not modified.
 */
export function injectTraceparentArgs(args, traceparent) {
    const [input, init, ...extra] = args;
    const initHeaders = init?.headers;
    if (input instanceof Request && initHeaders == null) {
        // The Request's own headers are the effective ones: clone and augment.
        const headers = new Headers(input.headers);
        headers.set("traceparent", traceparent);
        return [new Request(input, { headers }), ...args.slice(1)];
    }
    // Either a string/URL input, or a Request whose headers are overridden by
    // `init.headers` — in both cases the init header list is what gets sent.
    const headers = new Headers(initHeaders ?? undefined);
    headers.set("traceparent", traceparent);
    return [input, { ...(init ?? {}), headers }, ...extra];
}
290
/**
 * Wrap a Service binding / Fetcher so that `fetch` emits a CLIENT span and
 * propagates the trace to the callee through a W3C `traceparent` header.
 *
 * The span is named `Service <name> fetch` and carries `peer.service`. When
 * tracing is suppressed in the active context the call is forwarded untouched.
 *
 * Header injection is best-effort and never changes the outcome of the call:
 * - the header is only sent when the span context has well-formed, non-zero
 *   trace and span ids (an all-zero id is invalid per W3C Trace Context);
 * - the trace-flags byte reflects the span's real `traceFlags`, so an
 *   unsampled span is not advertised downstream as sampled;
 * - if building the injected arguments throws, the original arguments are
 *   used, so the started span is still handed to `runWithSpan` and any real
 *   error surfaces from `binding.fetch` itself.
 *
 * @param binding - The original service binding.
 * @param opts - Instrumentation options; only `opts.startSpan` is used here.
 * @param name - Env key of the binding; used in the span name and `peer.service`.
 * @returns The value produced by `makeProxy` for `binding` with `fetch` overridden.
 */
function wrapService(binding, opts, name) {
    return makeProxy(binding, {
        fetch: async (...args) => {
            if (isTracingSuppressed(context.active())) {
                return binding.fetch(...args);
            }
            const span = opts.startSpan(`Service ${name} fetch`, { "peer.service": name }, SpanKind.CLIENT);
            let outgoing = args;
            try {
                const sc = span.spanContext();
                const idsValid = /^(?!0{32})[0-9a-f]{32}$/.test(sc.traceId) &&
                    /^(?!0{16})[0-9a-f]{16}$/.test(sc.spanId);
                if (idsValid) {
                    // trace-flags is a single byte rendered as two hex digits.
                    const flags = ((sc.traceFlags ?? 0) & 0xff).toString(16).padStart(2, "0");
                    outgoing = injectTraceparentArgs(args, `00-${sc.traceId}-${sc.spanId}-${flags}`);
                }
            }
            catch {
                // Propagation is best-effort: fall back to the caller's args.
                outgoing = args;
            }
            return runWithSpan(span, () => binding.fetch(...outgoing));
        },
    });
}
304
+ // ---------------------------------------------------------------------------
164
305
  // Main export
165
306
  // ---------------------------------------------------------------------------
166
307
  /**
167
308
  * Wrap an env object's Cloudflare bindings so that each binding operation
168
309
  * emits a child span under the currently-active OTel context.
169
310
  *
170
- * Detects binding type by duck-typing (D1: `prepare`; KV: `get`+`put`+`list`;
171
- * R2: `get`+`put`+`head`; Vectorize: `query`+`upsert`). Unrecognised bindings
172
- * are passed through unchanged.
311
+ * Detects binding type by duck-typing:
312
+ * - D1: `prepare`
313
+ * - R2: `get`+`put`+`head`
314
+ * - KV: `get`+`put`+`list`
315
+ * - Vectorize: `query`+`upsert`
316
+ * - Workers AI: `run` (without `prepare`)
317
+ * - Queue producer: `send`+`sendBatch`
318
+ * - Service binding / Fetcher: `fetch` (last branch; most generic)
319
+ *
320
+ * Unrecognised bindings are passed through unchanged.
173
321
  *
174
322
  * Each wrapped binding is a `Proxy` over the original — non-wrapped prototype
175
323
  * methods fall through to the real binding so no functionality is lost.
176
324
  *
325
+ * Service-binding spans inject a W3C `traceparent` header into outgoing
326
+ * requests so calls to other Workers stitch into one distributed trace.
327
+ *
177
328
  * @param env - The Worker env / binding bag.
178
- * @param opts - `startSpan` factory + `select` filter.
329
+ * @param opts - `startSpan` factory (now accepts optional `SpanKind`) + `select` filter.
179
330
  * @returns A shallow copy of `env` with selected bindings replaced by proxies.
180
331
  */
181
332
  export function instrumentEnv(env, opts) {
@@ -199,6 +350,15 @@ export function instrumentEnv(env, opts) {
199
350
  else if (isVectorizeLike(binding)) {
200
351
  result[key] = wrapVectorize(binding, opts, key);
201
352
  }
353
+ else if (isWorkersAILike(binding)) {
354
+ result[key] = wrapWorkersAI(binding, opts, key);
355
+ }
356
+ else if (isQueueLike(binding)) {
357
+ result[key] = wrapQueue(binding, opts, key);
358
+ }
359
+ else if (isServiceLike(binding)) {
360
+ result[key] = wrapService(binding, opts, key);
361
+ }
202
362
  // Unrecognised bindings are left as-is.
203
363
  }
204
364
  return result;
package/dist/workers.js CHANGED
@@ -838,7 +838,7 @@ export function instrument(handler, config) {
838
838
  if (config.instrumentBindings) {
839
839
  const binTracer = trace.getTracer("heystack");
840
840
  handlerEnv = instrumentEnv(env, {
841
- startSpan: (name, attrs) => binTracer.startSpan(name, { attributes: attrs }, context.active()),
841
+ startSpan: (name, attrs, kind) => binTracer.startSpan(name, { attributes: attrs, kind }, context.active()),
842
842
  select: config.instrumentBindings,
843
843
  });
844
844
  }
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@heystack/otel",
3
- "version": "0.7.0",
3
+ "version": "0.8.0",
4
4
  "description": "Runtime-aware OpenTelemetry tracing that exports to Heystack (Node, Next.js, Workers).",
5
5
  "license": "MIT",
6
6
  "type": "module",