npm - groundswell - Versions diffs - 0.0.1 - Mend

groundswell 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (120) hide show

package/.claude/settings.local.json +9 -0
package/.claude/system_prompts/task-breakdown.md +100 -0
package/PRPs/001-hierarchical-workflow-engine.md +2438 -0
package/PRPs/PRDs/001-hierarchical-workflow-engine.md +543 -0
package/PRPs/PRDs/002-agent-prompt.md +390 -0
package/PRPs/PRDs/003-agent-prompt.md +943 -0
package/PRPs/PRDs/004-agent-prompt.md +1136 -0
package/PRPs/PRDs/tasks-001.json +492 -0
package/PRPs/README.md +83 -0
package/PRPs/templates/prp_base.md +222 -0
package/README.md +218 -0
package/docs/agent.md +422 -0
package/docs/prompt.md +419 -0
package/docs/workflow.md +600 -0
package/examples/README.md +244 -0
package/examples/examples/01-basic-workflow.ts +100 -0
package/examples/examples/02-decorator-options.ts +217 -0
package/examples/examples/03-parent-child.ts +241 -0
package/examples/examples/04-observers-debugger.ts +340 -0
package/examples/examples/05-error-handling.ts +387 -0
package/examples/examples/06-concurrent-tasks.ts +352 -0
package/examples/examples/07-agent-loops.ts +432 -0
package/examples/examples/08-sdk-features.ts +667 -0
package/examples/examples/09-reflection.ts +573 -0
package/examples/examples/10-introspection.ts +550 -0
package/examples/index.ts +143 -0
package/examples/utils/helpers.ts +57 -0
package/llms_full.txt +5890 -0
package/package.json +63 -0
package/plan/P1P2/PRP.md +527 -0
package/plan/P1P2/research/LRU_CACHE_BEST_PRACTICES.md +1929 -0
package/plan/P1P2/research/LRU_CACHE_CODE_PATTERNS.md +857 -0
package/plan/P1P2/research/LRU_CACHE_INTEGRATION_GUIDE.md +738 -0
package/plan/P1P2/research/LRU_CACHE_RESEARCH_INDEX.md +424 -0
package/plan/P1P2/research/REFLECTION_INDEX.md +291 -0
package/plan/P1P2/research/REFLECTION_RESEARCH_REPORT.md +1342 -0
package/plan/P1P2/research/RESEARCH_SUMMARY.md +342 -0
package/plan/P1P2/research/anthropic-sdk.md +174 -0
package/plan/P1P2/research/async-local-storage.md +200 -0
package/plan/P1P2/research/reflection-code-patterns.md +1205 -0
package/plan/P1P2/research/reflection-decision-matrix.md +421 -0
package/plan/P1P2/research/reflection-implementation-guide.md +1341 -0
package/plan/P1P2/research/reflection-integration-guide.md +834 -0
package/plan/P1P2/research/reflection-patterns.md +1468 -0
package/plan/P1P2/research/reflection-quick-reference.md +558 -0
package/plan/P1P2/research/zod-schema.md +152 -0
package/plan/P3P4/PRP.md +1388 -0
package/plan/P3P4/research/caching-lru.md +116 -0
package/plan/P3P4/research/introspection-tools.md +177 -0
package/plan/P3P4/research/reflection-patterns.md +117 -0
package/plan/P4P5/PRP.md +1136 -0
package/plan/P4P5/research/RESEARCH_SUMMARY.md +151 -0
package/plan/architecture/external_deps.md +358 -0
package/plan/architecture/system_context.md +242 -0
package/plan/backlog.json +867 -0
package/plan/research/INTROSPECTION_RESEARCH_SUMMARY.md +378 -0
package/plan/research/README-INTROSPECTION.md +352 -0
package/plan/research/agent-introspection-patterns.md +1085 -0
package/plan/research/introspection-security-guide.md +928 -0
package/plan/research/introspection-tool-examples.md +875 -0
package/scripts/generate-llms-full.ts +206 -0
package/src/__tests__/integration/agent-workflow.test.ts +256 -0
package/src/__tests__/integration/tree-mirroring.test.ts +114 -0
package/src/__tests__/unit/agent.test.ts +169 -0
package/src/__tests__/unit/cache-key.test.ts +182 -0
package/src/__tests__/unit/cache.test.ts +172 -0
package/src/__tests__/unit/context.test.ts +138 -0
package/src/__tests__/unit/decorators.test.ts +100 -0
package/src/__tests__/unit/introspection-tools.test.ts +277 -0
package/src/__tests__/unit/prompt.test.ts +135 -0
package/src/__tests__/unit/reflection.test.ts +210 -0
package/src/__tests__/unit/tree-debugger.test.ts +85 -0
package/src/__tests__/unit/workflow.test.ts +81 -0
package/src/cache/cache-key.ts +244 -0
package/src/cache/cache.ts +236 -0
package/src/cache/index.ts +8 -0
package/src/core/agent.ts +573 -0
package/src/core/context.ts +119 -0
package/src/core/event-tree.ts +260 -0
package/src/core/factory.ts +123 -0
package/src/core/index.ts +17 -0
package/src/core/logger.ts +87 -0
package/src/core/mcp-handler.ts +184 -0
package/src/core/prompt.ts +150 -0
package/src/core/workflow-context.ts +349 -0
package/src/core/workflow.ts +302 -0
package/src/debugger/index.ts +1 -0
package/src/debugger/tree-debugger.ts +210 -0
package/src/decorators/index.ts +3 -0
package/src/decorators/observed-state.ts +95 -0
package/src/decorators/step.ts +139 -0
package/src/decorators/task.ts +96 -0
package/src/examples/index.ts +2 -0
package/src/examples/tdd-orchestrator.ts +65 -0
package/src/examples/test-cycle-workflow.ts +64 -0
package/src/index.ts +140 -0
package/src/reflection/index.ts +5 -0
package/src/reflection/reflection.ts +407 -0
package/src/tools/index.ts +36 -0
package/src/tools/introspection.ts +464 -0
package/src/types/agent.ts +90 -0
package/src/types/decorators.ts +25 -0
package/src/types/error-strategy.ts +13 -0
package/src/types/error.ts +20 -0
package/src/types/events.ts +74 -0
package/src/types/index.ts +55 -0
package/src/types/logging.ts +24 -0
package/src/types/observer.ts +18 -0
package/src/types/prompt.ts +40 -0
package/src/types/reflection.ts +117 -0
package/src/types/sdk-primitives.ts +128 -0
package/src/types/snapshot.ts +14 -0
package/src/types/workflow-context.ts +163 -0
package/src/types/workflow.ts +37 -0
package/src/utils/id.ts +11 -0
package/src/utils/index.ts +3 -0
package/src/utils/observable.ts +77 -0
package/tasks.json +0 -0
package/tsconfig.json +22 -0
package/vitest.config.ts +16 -0

package/docs/agent.md ADDED Viewed

@@ -0,0 +1,422 @@
+# Agents
+Agents are lightweight wrappers around the Anthropic SDK that execute prompts, manage tool invocation cycles, and integrate with caching and reflection systems.
+## Table of Contents
+- [Basic Usage](#basic-usage)
+- [Configuration](#configuration)
+- [Executing Prompts](#executing-prompts)
+- [Reflection](#reflection)
+- [Tools and MCP](#tools-and-mcp)
+- [Hooks](#hooks)
+- [Caching](#caching)
+- [API Reference](#api-reference)
+## Basic Usage
+```typescript
+import { createAgent, createPrompt } from 'groundswell';
+import { z } from 'zod';
+const agent = createAgent({
+  name: 'AnalysisAgent',
+  model: 'claude-sonnet-4-20250514',
+  enableCache: true,
+});
+const prompt = createPrompt({
+  user: 'Analyze this code for bugs',
+  data: { code: 'function foo() { return 42; }' },
+  responseFormat: z.object({
+    bugs: z.array(z.string()),
+    severity: z.enum(['low', 'medium', 'high']),
+  }),
+});
+const result = await agent.prompt(prompt);
+// result is typed: { bugs: string[], severity: 'low' | 'medium' | 'high' }
+```
+## Configuration
+### AgentConfig
+```typescript
+interface AgentConfig {
+  name?: string;                    // Human-readable name
+  system?: string;                  // System prompt
+  tools?: Tool[];                   // Available tools
+  mcps?: MCPServer[];               // MCP servers to connect
+  skills?: Skill[];                 // Skills to load
+  hooks?: AgentHooks;               // Lifecycle hooks
+  env?: Record<string, string>;     // Environment variables
+  enableReflection?: boolean;       // Enable reflection capability
+  enableCache?: boolean;            // Enable response caching
+  model?: string;                   // Model to use
+  maxTokens?: number;               // Max tokens for responses
+  temperature?: number;             // Response temperature
+}
+```
+### Configuration Priority
+Configuration follows a three-level override hierarchy:
+1. **Prompt-level** (highest priority)
+2. **Execution-level** (via `PromptOverrides`)
+3. **Agent-level** (lowest priority)
+```typescript
+const agent = createAgent({
+  system: 'Default system prompt',  // Agent-level
+  model: 'claude-sonnet-4-20250514',
+});
+const prompt = createPrompt({
+  user: 'Hello',
+  system: 'Override system prompt',  // Prompt-level (wins)
+  responseFormat: z.object({ response: z.string() }),
+});
+// Or override at execution time
+const result = await agent.prompt(prompt, {
+  model: 'claude-opus-4-5-20251101',  // Execution-level override
+});
+```
+## Executing Prompts
+### prompt()
+Returns validated response data:
+```typescript
+const result = await agent.prompt(prompt);
+// result is T (the response type)
+```
+### promptWithMetadata()
+Returns full execution metadata:
+```typescript
+const result = await agent.promptWithMetadata(prompt);
+console.log(result.data);       // Validated response
+console.log(result.usage);      // { input_tokens, output_tokens }
+console.log(result.duration);   // Total time in ms
+console.log(result.toolCalls);  // Number of tool invocations
+```
+### PromptResult
+```typescript
+interface PromptResult<T> {
+  data: T;                  // Validated response
+  usage: TokenUsage;        // Token usage stats
+  duration: number;         // Duration in milliseconds
+  toolCalls: number;        // Number of tool calls
+}
+interface TokenUsage {
+  input_tokens: number;
+  output_tokens: number;
+}
+```
+## Reflection
+Enable self-correction with the `reflect()` method:
+```typescript
+const agent = createAgent({
+  name: 'ReflectiveAgent',
+  enableReflection: true,
+});
+const result = await agent.reflect(prompt);
+```
+The reflection system prepends a reflection prefix to the system prompt:
+```
+Before answering, reflect on your reasoning step by step.
+Consider alternative approaches and potential errors.
+Then provide your final answer.
+```
+### Reflection Configuration
+```typescript
+// Agent-level
+const agent = createAgent({
+  enableReflection: true,
+});
+// Prompt-level
+const prompt = createPrompt({
+  user: 'Complex question',
+  enableReflection: true,
+  responseFormat: schema,
+});
+// Execution-level
+const result = await agent.prompt(prompt, {
+  enableReflection: true,
+});
+```
+## Tools and MCP
+### Tool Definition
+```typescript
+import type { Tool } from 'groundswell';
+const calculatorTool: Tool = {
+  name: 'calculate',
+  description: 'Performs arithmetic operations',
+  input_schema: {
+    type: 'object',
+    properties: {
+      operation: { type: 'string', enum: ['add', 'subtract', 'multiply', 'divide'] },
+      a: { type: 'number' },
+      b: { type: 'number' },
+    },
+    required: ['operation', 'a', 'b'],
+  },
+};
+```
+### MCP Handler
+Register tools with an MCP handler:
+```typescript
+import { MCPHandler } from 'groundswell';
+const mcpHandler = new MCPHandler();
+mcpHandler.registerServer({
+  name: 'demo',
+  transport: 'inprocess',
+  tools: [calculatorTool],
+});
+mcpHandler.registerToolExecutor('demo', 'calculate', async (input) => {
+  const { operation, a, b } = input;
+  switch (operation) {
+    case 'add': return { result: a + b };
+    case 'subtract': return { result: a - b };
+    case 'multiply': return { result: a * b };
+    case 'divide': return { result: a / b };
+  }
+});
+const agent = createAgent({
+  tools: mcpHandler.getTools(),
+});
+```
+### Tool Execution Flow
+1. Agent sends prompt to API
+2. API requests tool use
+3. Agent executes tool via MCP handler
+4. Result sent back to API
+5. Loop continues until no more tool calls
+6. Final response validated and returned
+## Hooks
+Lifecycle hooks enable logging, monitoring, and custom processing:
+```typescript
+import type { AgentHooks, PreToolUseContext, PostToolUseContext } from 'groundswell';
+const hooks: AgentHooks = {
+  preToolUse: [
+    async (ctx: PreToolUseContext) => {
+      console.log(`[PRE] Tool: ${ctx.toolName}`);
+      console.log(`Input:`, ctx.input);
+    }
+  ],
+  postToolUse: [
+    async (ctx: PostToolUseContext) => {
+      console.log(`[POST] Tool: ${ctx.toolName}`);
+      console.log(`Output:`, ctx.output);
+      console.log(`Duration: ${ctx.duration}ms`);
+    }
+  ],
+  sessionStart: [
+    async (ctx) => {
+      console.log(`Session started: ${ctx.agentName}`);
+    }
+  ],
+  sessionEnd: [
+    async (ctx) => {
+      console.log(`Session ended: ${ctx.totalDuration}ms`);
+    }
+  ],
+};
+const agent = createAgent({
+  hooks,
+});
+```
+### Hook Types
+| Hook | Trigger | Context |
+|------|---------|---------|
+| `preToolUse` | Before tool execution | `toolName`, `input` |
+| `postToolUse` | After tool execution | `toolName`, `input`, `output`, `duration` |
+| `sessionStart` | Before prompt execution | `agentName`, `promptId` |
+| `sessionEnd` | After prompt execution | `agentName`, `totalDuration` |
+## Caching
+### Enable Caching
+```typescript
+const agent = createAgent({
+  enableCache: true,
+});
+// First call: API request made, result cached
+const result1 = await agent.prompt(prompt);
+// Second call: cached result returned
+const result2 = await agent.prompt(prompt);
+```
+### Cache Metrics
+```typescript
+import { defaultCache } from 'groundswell';
+const metrics = defaultCache.metrics();
+console.log(`Hits: ${metrics.hits}`);
+console.log(`Misses: ${metrics.misses}`);
+console.log(`Hit rate: ${metrics.hitRate}%`);
+console.log(`Size: ${metrics.size} items`);
+console.log(`Size bytes: ${metrics.sizeBytes}`);
+```
+### Cache Key Generation
+Cache keys are deterministic SHA-256 hashes of:
+- User message
+- Data
+- System prompt
+- Model
+- Temperature
+- Max tokens
+- Tools
+- MCP servers
+- Skills
+- Response format schema
+Identical inputs always produce identical keys.
+### Disable Cache for Specific Call
+```typescript
+const result = await agent.prompt(prompt, {
+  disableCache: true,
+});
+```
+### Clear Cache
+```typescript
+import { defaultCache } from 'groundswell';
+await defaultCache.clear();
+// Or bust by prefix (agent ID)
+await defaultCache.bustPrefix(agent.id);
+```
+### Cache Configuration
+```typescript
+import { LLMCache } from 'groundswell';
+const customCache = new LLMCache({
+  maxItems: 500,            // Default: 1000
+  maxSizeBytes: 25_000_000, // 25 MB (default: 50 MB)
+  defaultTTLMs: 7_200_000,  // 2 hours (default: 1 hour)
+});
+```
+## API Reference
+### Agent Class
+```typescript
+class Agent {
+  readonly id: string;
+  readonly name: string;
+  constructor(config?: AgentConfig);
+  prompt<T>(prompt: Prompt<T>, overrides?: PromptOverrides): Promise<T>;
+  promptWithMetadata<T>(prompt: Prompt<T>, overrides?: PromptOverrides): Promise<PromptResult<T>>;
+  reflect<T>(prompt: Prompt<T>, overrides?: PromptOverrides): Promise<T>;
+}
+```
+### Factory Function
+```typescript
+function createAgent(config?: AgentConfig): Agent;
+```
+### PromptOverrides
+```typescript
+interface PromptOverrides {
+  system?: string;
+  model?: string;
+  temperature?: number;
+  maxTokens?: number;
+  enableReflection?: boolean;
+  disableCache?: boolean;
+}
+```
+### Types
+```typescript
+interface Tool {
+  name: string;
+  description: string;
+  input_schema: {
+    type: 'object';
+    properties: Record<string, unknown>;
+    required?: string[];
+  };
+}
+interface MCPServer {
+  name: string;
+  transport: 'inprocess' | 'stdio' | 'http';
+  tools?: Tool[];
+}
+interface Skill {
+  name: string;
+  path: string;
+}
+interface AgentHooks {
+  preToolUse?: Array<(ctx: PreToolUseContext) => Promise<void>>;
+  postToolUse?: Array<(ctx: PostToolUseContext) => Promise<void>>;
+  sessionStart?: Array<(ctx: SessionStartContext) => Promise<void>>;
+  sessionEnd?: Array<(ctx: SessionEndContext) => Promise<void>>;
+}
+```
+See [examples/examples/08-sdk-features.ts](../examples/examples/08-sdk-features.ts) for tools and hooks usage.