npm - @axiom-lattice/gateway - Versions diffs - 1.0.11 → 1.0.13 - Mend

@axiom-lattice/gateway 1.0.11 → 1.0.13

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

package/.turbo/turbo-build.log +10 -10
package/RESUME_STREAM_CONTENT_BASED.md +325 -0
package/RESUME_STREAM_README.md +388 -0
package/dist/index.d.mts +47 -1
package/dist/index.d.ts +47 -1
package/dist/index.js +324 -10
package/dist/index.js.map +1 -1
package/dist/index.mjs +331 -11
package/dist/index.mjs.map +1 -1
package/package.json +5 -3
package/src/controllers/run.ts +62 -1
package/src/index.ts +4 -4
package/src/routes/index.ts +36 -3
package/src/schemas/index.ts +194 -0
package/src/services/agent_service.ts +129 -15
package/src/swagger.ts +77 -0

package/RESUME_STREAM_README.md ADDED Viewed

@@ -0,0 +1,388 @@
+# Resume Stream Feature
+## Overview
+The `resume_stream` feature allows you to continue receiving streaming chunks from a known position. This is particularly useful for scenarios where the client connection is interrupted (e.g., page refresh, network issues) and you want to seamlessly continue from where you left off.
+## Architecture
+### ChunkBuffer Integration
+The feature leverages the `ChunkBuffer` module from `@axiom-lattice/core` to:
+- Store streaming chunks in memory
+- Track thread status (active/completed/aborted)
+- Provide TTL-based automatic cleanup
+- Calculate and return only new chunks since a known position
+### How It Works
+```
+┌─────────────────┐
+│  Original       │
+│  Streaming      │ ──► Chunks stored in ChunkBuffer
+│  (agent_stream) │     (thread_id, message_id, content)
+└─────────────────┘
+         │
+         │ Connection lost / Page refresh
+         │
+         ▼
+┌─────────────────┐
+│  Resume Stream  │
+│  (from known    │ ──► Polls for new chunks
+│  position)      │     Returns only new content
+└─────────────────┘     Ends when thread completes
+```
+## API Reference
+### `resume_stream(options)`
+Creates an async iterator that yields new chunks as they arrive.
+#### Parameters
+```typescript
+{
+  thread_id: string;        // Thread identifier
+  message_id: string;       // Message identifier (usually run_id)
+  known_content: string;    // Content already received (used to find resume position)
+  poll_interval?: number;   // Polling interval in ms (default: 100)
+}
+```
+#### Returns
+An async iterable object (it implements `Symbol.asyncIterator`). Each yielded chunk has the following shape:
+```typescript
+{
+  content: string; // Chunk content
+  timestamp: number; // When chunk was added
+  messageId: string; // Message identifier
+}
+```
+#### Behavior
+- **Polling**: Checks for new chunks every `poll_interval` milliseconds
+- **Status Check**: Monitors thread status (active/completed/aborted)
+- **Timeout**: Automatically stops after 30 seconds without new data
+- **Completion**: Exits when thread is no longer active
+## Usage Examples
+### Example 1: Basic Resume After Page Refresh
+```typescript
+import {
+  resume_stream,
+  get_accumulated_content,
+} from "./services/agent_service";
+// Client already received content before refresh (e.g., from localStorage or state)
+const knownContent = "Hello world! This is content I already received...";
+const stream = await resume_stream({
+  thread_id: "thread-123",
+  message_id: "msg-abc-456",
+  known_content: knownContent,
+});
+// Consume new chunks
+for await (const chunk of stream) {
+  console.log("New content:", chunk.content);
+  displayInUI(chunk.content); // Update your UI
+}
+console.log("Stream completed!");
+```
+### Example 2: Check Status Before Resuming
+```typescript
+import { get_accumulated_content, get_thread_status, resume_stream } from "./services/agent_service";
+// Check thread status first
+const status = await get_thread_status("thread-123");
+if (!status.exists) {
+  console.log("Thread not found or expired");
+} else if (status.status === "completed") {
+  // Thread already finished, get full content
+  const content = await get_accumulated_content("thread-123");
+  displayFullContent(content);
+} else if (status.status === "active") {
+  // Thread still streaming, resume from current position
+  const currentContent = await get_accumulated_content("thread-123");
+  const stream = await resume_stream({
+    thread_id: "thread-123",
+    message_id: "msg-123",
+    known_content: currentContent,
+  });
+  for await (const chunk of stream) {
+    appendToUI(chunk.content);
+  }
+}
+```
+### Example 3: Express/Fastify Endpoint (SSE)
+```typescript
+import express from "express";
+import { resume_stream } from "./services/agent_service";
+const app = express();
+app.post("/api/resume-stream", async (req, res) => {
+  const { thread_id, message_id, known_content } = req.body;
+  // Set up Server-Sent Events
+  res.setHeader("Content-Type", "text/event-stream");
+  res.setHeader("Cache-Control", "no-cache");
+  res.setHeader("Connection", "keep-alive");
+  try {
+    const stream = await resume_stream({
+      thread_id,
+      message_id,
+      known_content,
+    });
+    for await (const chunk of stream) {
+      res.write(`data: ${JSON.stringify(chunk)}\n\n`);
+    }
+    res.write("event: complete\ndata: {}\n\n");
+    res.end();
+  } catch (error) {
+    res.write(
+      `event: error\ndata: ${JSON.stringify({ error: error.message })}\n\n`
+    );
+    res.end();
+  }
+});
+```
+### Example 4: React Hook
+```typescript
+import { useState, useEffect } from 'react';
+function useResumeStream(threadId: string, messageId: string, knownContent: string) {
+  const [content, setContent] = useState('');
+  const [isStreaming, setIsStreaming] = useState(false);
+  const [error, setError] = useState<Error | null>(null);
+  useEffect(() => {
+    let isCancelled = false;
+    async function startStream() {
+      setIsStreaming(true);
+      try {
+        const stream = await resume_stream({
+          thread_id: threadId,
+          message_id: messageId,
+          known_content: knownContent,
+        });
+        for await (const chunk of stream) {
+          if (isCancelled) break;
+          setContent(prev => prev + chunk.content);
+        }
+      } catch (err) {
+        if (!isCancelled) {
+          setError(err as Error);
+        }
+      } finally {
+        if (!isCancelled) {
+          setIsStreaming(false);
+        }
+      }
+    }
+    startStream();
+    return () => {
+      isCancelled = true;
+    };
+  }, [threadId, messageId, knownContent]);
+  return { content, isStreaming, error };
+}
+// Usage in component
+function ChatMessage({ threadId, messageId, initialContent }) {
+  const { content, isStreaming } = useResumeStream(
+    threadId,
+    messageId,
+    initialContent
+  );
+  return (
+    <div>
+      {initialContent + content}
+      {isStreaming && <span className="cursor">▋</span>}
+    </div>
+  );
+}
+```
+## Related Functions
+### `get_accumulated_content(thread_id)`
+Get all accumulated content for a thread.
+```typescript
+const content = await get_accumulated_content("thread-123");
+```
+### `get_thread_status(thread_id)`
+Get thread status and metadata.
+```typescript
+const status = await get_thread_status("thread-123");
+// {
+//   exists: true,
+//   status: 'active' | 'completed' | 'aborted',
+//   chunkCount: 42,
+//   createdAt: 1234567890,
+//   updatedAt: 1234567900
+// }
+```
+### `get_active_threads()`
+Get all currently active threads.
+```typescript
+const activeThreads = await get_active_threads();
+// ['thread-1', 'thread-2', 'thread-3']
+```
+### `clear_thread_buffer(thread_id)`
+Manually clear a thread's buffer.
+```typescript
+await clear_thread_buffer("thread-123");
+```
+## Configuration
+### TTL (Time-To-Live)
+Threads are automatically cleaned up after 1 hour of inactivity:
+```typescript
+// In agent_service.ts
+const buffer = new InMemoryChunkBuffer({
+  ttl: 60 * 60 * 1000, // 1 hour
+  cleanupInterval: 5 * 60 * 1000, // Clean every 5 minutes
+});
+```
+### Polling Interval
+Adjust polling frequency based on your needs:
+```typescript
+// Fast polling for real-time updates
+const stream = await resume_stream({
+  thread_id: "thread-123",
+  message_id: "msg-123",
+  known_content: knownContent,
+  poll_interval: 50, // Check every 50ms
+});
+// Slower polling to reduce server load
+const stream = await resume_stream({
+  thread_id: "thread-123",
+  message_id: "msg-123",
+  known_content: knownContent,
+  poll_interval: 500, // Check every 500ms
+});
+```
+### Timeout
+The resume stream automatically times out after 30 seconds without new data:
+```typescript
+// In agent_service.ts - resume_stream function
+const maxIdleTime = 30000; // 30 seconds
+```
+## Error Handling
+### Thread Not Found
+```typescript
+const stream = await resume_stream({
+  thread_id: "non-existent",
+  message_id: "msg-123",
+  known_content: "",
+});
+// Stream will exit immediately if thread doesn't exist
+for await (const chunk of stream) {
+  // Won't execute
+}
+```
+### Network Errors
+```typescript
+try {
+  const stream = await resume_stream({
+    thread_id: "thread-123",
+    message_id: "msg-123",
+    known_content: previousContent,
+  });
+  for await (const chunk of stream) {
+    displayChunk(chunk);
+  }
+} catch (error) {
+  console.error("Stream error:", error);
+  showErrorToUser("Failed to resume stream");
+}
+```
+## Best Practices
+1. **Always Check Status First**: Check thread status before attempting to resume
+2. **Store Message ID**: Keep track of the `message_id` (usually `run_id`) with your content
+3. **Preserve Content Exactly**: Store the exact content as received (no formatting/processing)
+4. **Handle Completion**: Be prepared for the stream to end at any time
+5. **Implement Retry Logic**: Add retry mechanism for transient failures
+6. **Set Appropriate Poll Interval**: Balance between responsiveness and server load
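+7. **Content Matching**: The resume position is found by matching `known_content` against the buffered content (exact match, prefix, or suffix), so the stored text must match what was streamed character-for-character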
+## Performance Considerations
+- **Memory Usage**: Chunks are stored in memory (consider TTL for long-running applications)
+- **Polling Overhead**: Lower `poll_interval` increases server load but improves responsiveness
+- **Concurrent Streams**: Multiple resume streams can run concurrently
+- **Cleanup**: Old threads are automatically cleaned up based on TTL
+## Limitations
+- **In-Memory Only**: Current implementation stores chunks in memory (lost on server restart)
+- **Single Message Per Thread**: Designed for one active message per thread
+- **Content Matching**: Relies on exact content matching (whitespace, encoding must match)
+- **No Persistence**: Chunks are not persisted to disk or database
+- **Performance**: Content matching is O(n), where n is the number of chunks
+## Future Enhancements
+- **Persistent Storage**: Add Redis or database backend for persistence across restarts
+- **WebSocket Support**: Direct WebSocket integration for lower latency
+- **Event-Based Notifications**: Use event emitters instead of polling
+- **Compression**: Compress stored chunks to reduce memory usage
+- **Multi-Message Support**: Handle multiple concurrent messages per thread

package/dist/index.d.mts CHANGED Viewed

@@ -1,10 +1,56 @@
-import * as fastify from 'fastify';
 import * as http from 'http';
+import * as fastify from 'fastify';
+declare const defaultSwaggerConfig: {
+    openapi: {
+        openapi: string;
+        info: {
+            title: string;
+            description: string;
+            version: string;
+            contact: {
+                name: string;
+                email: string;
+            };
+        };
+        servers: {
+            url: string;
+            description: string;
+        }[];
+        components: {
+            securitySchemes: {
+                bearerAuth: {
+                    type: "http";
+                    scheme: "bearer";
+                    bearerFormat: string;
+                };
+            };
+        };
+        security: {
+            bearerAuth: never[];
+        }[];
+        tags: {
+            name: string;
+            description: string;
+        }[];
+    };
+};
+declare const defaultSwaggerUiConfig: {
+    routePrefix: string;
+    uiConfig: {
+        docExpansion: "full";
+        deepLinking: boolean;
+    };
+    staticCSP: boolean;
+    transformStaticCSP: (header: string) => string;
+};
 declare const LatticeGateway: {
     startAsHttpEndpoint: ({ port }: {
         port: number;
     }) => Promise<void>;
+    configureSwagger: (app: fastify.FastifyInstance, customSwaggerConfig?: Partial<typeof defaultSwaggerConfig>, customSwaggerUiConfig?: Partial<typeof defaultSwaggerUiConfig>) => Promise<void>;
+    registerLatticeRoutes: (app: fastify.FastifyInstance) => void;
     app: fastify.FastifyInstance<http.Server<typeof http.IncomingMessage, typeof http.ServerResponse>, http.IncomingMessage, http.ServerResponse<http.IncomingMessage>, fastify.FastifyBaseLogger, fastify.FastifyTypeProviderDefault> & PromiseLike<fastify.FastifyInstance<http.Server<typeof http.IncomingMessage, typeof http.ServerResponse>, http.IncomingMessage, http.ServerResponse<http.IncomingMessage>, fastify.FastifyBaseLogger, fastify.FastifyTypeProviderDefault>> & {
         __linterBrands: "SafePromiseLike";
     };

package/dist/index.d.ts CHANGED Viewed

@@ -1,10 +1,56 @@
-import * as fastify from 'fastify';
 import * as http from 'http';
+import * as fastify from 'fastify';
+declare const defaultSwaggerConfig: {
+    openapi: {
+        openapi: string;
+        info: {
+            title: string;
+            description: string;
+            version: string;
+            contact: {
+                name: string;
+                email: string;
+            };
+        };
+        servers: {
+            url: string;
+            description: string;
+        }[];
+        components: {
+            securitySchemes: {
+                bearerAuth: {
+                    type: "http";
+                    scheme: "bearer";
+                    bearerFormat: string;
+                };
+            };
+        };
+        security: {
+            bearerAuth: never[];
+        }[];
+        tags: {
+            name: string;
+            description: string;
+        }[];
+    };
+};
+declare const defaultSwaggerUiConfig: {
+    routePrefix: string;
+    uiConfig: {
+        docExpansion: "full";
+        deepLinking: boolean;
+    };
+    staticCSP: boolean;
+    transformStaticCSP: (header: string) => string;
+};
 declare const LatticeGateway: {
     startAsHttpEndpoint: ({ port }: {
         port: number;
     }) => Promise<void>;
+    configureSwagger: (app: fastify.FastifyInstance, customSwaggerConfig?: Partial<typeof defaultSwaggerConfig>, customSwaggerUiConfig?: Partial<typeof defaultSwaggerUiConfig>) => Promise<void>;
+    registerLatticeRoutes: (app: fastify.FastifyInstance) => void;
     app: fastify.FastifyInstance<http.Server<typeof http.IncomingMessage, typeof http.ServerResponse>, http.IncomingMessage, http.ServerResponse<http.IncomingMessage>, fastify.FastifyBaseLogger, fastify.FastifyTypeProviderDefault> & PromiseLike<fastify.FastifyInstance<http.Server<typeof http.IncomingMessage, typeof http.ServerResponse>, http.IncomingMessage, http.ServerResponse<http.IncomingMessage>, fastify.FastifyBaseLogger, fastify.FastifyTypeProviderDefault>> & {
         __linterBrands: "SafePromiseLike";
     };