npm - stagent - Versions diffs - 0.1.9 → 0.1.11 - Mend

stagent 0.1.9 → 0.1.11

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (81) hide show

package/README.md +144 -62
package/package.json +1 -2
package/public/readme/cost-usage-list.png +0 -0
package/public/readme/dashboard-bulk-select.png +0 -0
package/public/readme/dashboard-card-edit.png +0 -0
package/public/readme/dashboard-create-form-ai-applied.png +0 -0
package/public/readme/dashboard-create-form-ai-assist.png +0 -0
package/public/readme/dashboard-create-form-empty.png +0 -0
package/public/readme/dashboard-create-form-filled.png +0 -0
package/public/readme/dashboard-filtered.png +0 -0
package/public/readme/dashboard-list.png +0 -0
package/public/readme/dashboard-sorted.png +0 -0
package/public/readme/dashboard-workflow-confirm.png +0 -0
package/public/readme/documents-grid.png +0 -0
package/public/readme/documents-list.png +0 -0
package/public/readme/home-below-fold.png +0 -0
package/public/readme/home-list.png +0 -0
package/public/readme/inbox-list.png +0 -0
package/public/readme/monitor-list.png +0 -0
package/public/readme/profiles-list.png +0 -0
package/public/readme/projects-detail.png +0 -0
package/public/readme/projects-list.png +0 -0
package/public/readme/schedules-list.png +0 -0
package/public/readme/settings-list.png +0 -0
package/public/readme/workflows-list.png +0 -0
package/src/app/api/profiles/route.ts +0 -1
package/src/app/api/workflows/from-assist/route.ts +143 -0
package/src/app/dashboard/page.tsx +24 -2
package/src/app/globals.css +0 -5
package/src/app/tasks/page.tsx +5 -0
package/src/app/workflows/from-assist/page.tsx +35 -0
package/src/components/profiles/profile-detail-view.tsx +1 -16
package/src/components/profiles/profile-form-view.tsx +0 -22
package/src/components/projects/project-card.tsx +47 -35
package/src/components/tasks/ai-assist-panel.tsx +31 -10
package/src/components/tasks/task-card.tsx +16 -1
package/src/components/tasks/task-create-panel.tsx +39 -0
package/src/components/workflows/workflow-confirmation-view.tsx +447 -0
package/src/lib/agents/__tests__/claude-agent.test.ts +7 -2
package/src/lib/agents/__tests__/learned-context.test.ts +500 -0
package/src/lib/agents/__tests__/pattern-extractor.test.ts +243 -0
package/src/lib/agents/__tests__/sweep.test.ts +202 -0
package/src/lib/agents/claude-agent.ts +104 -78
package/src/lib/agents/learned-context.ts +5 -13
package/src/lib/agents/pattern-extractor.ts +15 -64
package/src/lib/agents/profiles/__tests__/suggest.test.ts +67 -0
package/src/lib/agents/profiles/builtins/code-reviewer/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/data-analyst/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/devops-engineer/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/document-writer/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/general/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/health-fitness-coach/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/learning-coach/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/project-manager/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/researcher/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/shopping-assistant/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/sweep/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/technical-writer/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/travel-planner/profile.yaml +0 -1
package/src/lib/agents/profiles/builtins/wealth-manager/profile.yaml +0 -1
package/src/lib/agents/profiles/registry.ts +0 -1
package/src/lib/agents/profiles/suggest.ts +36 -0
package/src/lib/agents/profiles/types.ts +0 -1
package/src/lib/agents/runtime/catalog.ts +1 -1
package/src/lib/agents/runtime/claude.ts +102 -6
package/src/lib/agents/runtime/task-assist-types.ts +12 -2
package/src/lib/constants/task-status.ts +6 -0
package/src/lib/data/__tests__/clear.test.ts +42 -0
package/src/lib/data/clear.ts +3 -0
package/src/lib/data/seed-data/profiles.ts +0 -3
package/src/lib/notifications/permissions.ts +6 -2
package/src/lib/usage/__tests__/ledger.test.ts +29 -5
package/src/lib/usage/ledger.ts +3 -1
package/src/lib/usage/pricing.ts +61 -7
package/src/lib/validators/__tests__/profile.test.ts +0 -15
package/src/lib/validators/profile.ts +0 -1
package/src/lib/workflows/__tests__/assist-builder.test.ts +255 -0
package/src/lib/workflows/__tests__/engine.test.ts +2 -0
package/src/lib/workflows/assist-builder.ts +248 -0
package/src/lib/workflows/assist-session.ts +78 -0
package/src/lib/workflows/engine.ts +47 -1

package/README.md CHANGED Viewed

@@ -14,7 +14,7 @@ Open [localhost:3000](http://localhost:3000).
 **Profiles & Policies** · **Blueprints & Schedules** · **Open Source**
-<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/home-workspace.png" alt="Stagent home workspace" width="1200" />
+<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/home-list.png" alt="Stagent home workspace" width="1200" />
 | Home Workspace | Reusable Profiles | Workflow Blueprints | Governed Execution |
 |:-:|:-:|:-:|:-:|
@@ -53,6 +53,9 @@ Stagent ships a shared runtime registry that routes tasks, schedules, and workfl
 | 💸 | **[Cost & Usage](#cost--usage)** | Provider-aware metering, budgets, and spend visibility for governed runs |
 | 🚨 | **[Ambient Approvals](#ambient-approvals)** | Shell-level approval prompts that keep Inbox as the durable supervision queue |
 | 🔒 | **[Tool Permissions](#tool-permission-persistence)** | Trusted-tool policies with explicit "Always Allow" rules |
+| 📋 | **[Kanban Board](#kanban-board-operations)** | Inline editing, bulk operations, and persistent board state |
+| 🤖 | **[AI Assist → Workflows](#ai-assist--workflow-creation)** | Bridge task assist recommendations into governed workflow execution |
+| 🧬 | **[Agent Self-Improvement](#agent-self-improvement)** | Agents learn patterns from execution history with human-approved context evolution |
 ---
@@ -69,6 +72,7 @@ Stagent ships a shared runtime registry that routes tasks, schedules, and workfl
 - **Provider runtime abstraction** — Tasks, schedules, workflows, task assist, and health checks route through shared runtime adapters instead of provider-specific entry points
 - **Reusable agent profiles** — Profiles define instructions, allowed tools, runtime tuning, and MCP configs for repeated use
 - **Permission pre-check** — Saved "Always Allow" patterns bypass the notification loop for trusted tools
+- **Learned context loop** — Pattern extraction → human approval → versioned context injection creates a supervised self-improvement cycle
 ---
@@ -82,9 +86,19 @@ Workspace-level briefing with active work, pending review, failed items, project
 #### Task Execution
 Status-driven execution board with five columns: Planned → Queued → Running → Completed → Failed. Filter across projects, create tasks inline, and open task detail to inspect status, description, and runtime state without leaving the board.
+<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/dashboard-list.png" alt="Stagent kanban board" width="1200" />
+| Filtered by Project | Inline Card Editing | Bulk Select Mode |
+|:-:|:-:|:-:|
+| <img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/dashboard-filtered.png" alt="Dashboard filtered by project" width="380" /> | <img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/dashboard-card-edit.png" alt="Inline task editing dialog" width="380" /> | <img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/dashboard-bulk-select.png" alt="Bulk select mode with actions" width="380" /> |
 #### Projects
 Create and organize projects as containers for related tasks. Each project can specify a working directory — agent tasks resolve `cwd` from the project's path, enabling agents to operate on external codebases. Server-rendered project cards with task counts, status badges, and a detail view at `/projects/[id]`.
+| Project Cards | Project Detail |
+|:-:|:-:|
+| <img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/projects-list.png" alt="Project cards overview" width="580" /> | <img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/projects-detail.png" alt="Project detail view" width="580" /> |
 ### Agent
 #### Provider Runtimes
@@ -101,13 +115,18 @@ Claude Agent SDK integration with the `canUseTool` polling pattern remains the d
 OpenAI Codex App Server is integrated as Stagent's second governed runtime. Codex-backed tasks preserve project working directories, document context, resumable thread IDs, inbox approval requests, user questions, and provider-labeled logs. The same runtime can also power task assist, scheduled firings, and workflow child tasks.
 #### Agent Profiles
-Profile-backed execution with specialist definitions for different job types. Each profile packages instructions, allowed tools, runtime tuning, and MCP server configuration so teams can reuse behavior intentionally instead of relying on ad hoc prompts. Workflow steps and schedules can reference profiles directly, and runtimes can be selected independently when provider support differs.
+Profile-backed execution with specialist definitions for different job types. Each profile packages instructions, allowed tools, max turns, and output format so teams can reuse behavior intentionally instead of relying on ad hoc prompts. Workflow steps and schedules can reference profiles directly, and runtimes can be selected independently when provider support differs.
+<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/profiles-list.png" alt="Stagent agent profiles" width="1200" />
 #### Workflows
-Multi-step task orchestration with three patterns:
+Multi-step task orchestration with six patterns:
 - **Sequence** — Steps execute in order
 - **Planner→Executor** — One agent plans, another executes each step
 - **Human-in-the-Loop Checkpoint** — Pauses for human approval between steps
+- **Parallel** — Concurrent branch execution with fork/join synthesis
+- **Loop** — Iterative agent execution with configurable stop conditions
+- **Swarm** — Mayor/workers/refinery multi-agent orchestration
 State machine engine with step-level retry, project association, and real-time status visualization.
@@ -121,6 +140,18 @@ Both patterns preserve the same governed task model, runtime selection, monitori
 #### AI Task Assist
 AI-powered task creation: generate improved descriptions, break tasks into sub-tasks, recommend workflow patterns, and estimate complexity through the shared runtime task-assist layer. Claude and OpenAI task assist now both route through the provider runtime abstraction.
+| Task Creation Form | AI Suggestions | AI Applied |
+|:-:|:-:|:-:|
+| <img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/dashboard-create-form-empty.png" alt="Empty task creation form" width="380" /> | <img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/dashboard-create-form-ai-assist.png" alt="AI Assist suggestions panel" width="380" /> | <img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/dashboard-create-form-ai-applied.png" alt="AI suggestions applied to form" width="380" /> |
+#### AI Assist → Workflow Creation
+Bridge from AI task assist to workflow engine: when task assist recommends a multi-step plan, a "Create as Workflow" button converts the recommendation into a validated workflow definition with per-step profile assignments, dependency ordering, and pattern selection across all six workflow types. The `WorkflowConfirmationSheet` lets operators review and edit steps, profiles, and configuration before creating the workflow. A keyword-based profile suggestion fallback ensures steps get reasonable profile assignments even without the AI classifier.
+<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/dashboard-workflow-confirm.png" alt="Workflow creation from AI Assist" width="1200" />
+#### Agent Self-Improvement
+Agents learn from execution history through a human-approved instruction evolution loop. After each task completion, the pattern extractor analyzes logs and proposes context updates — concise behavioral rules the agent should follow in future runs. Operators approve, reject, or edit proposals before they take effect. Learned context is versioned with rollback support and size-limited summarization to prevent unbounded growth. A sweep agent can audit the codebase for improvement opportunities and create prioritized tasks from its findings.
 #### Session Management
 Resume failed or cancelled agent tasks with one click. Tracks retry counts (limit: 3), detects expired sessions, and provides an atomic claim to prevent duplicate runs.
@@ -133,13 +164,17 @@ Curated agent profiles across work and personal domains, built as portable Claud
 #### Workflow Blueprints
 Pre-configured workflow templates across work and personal domains. Browse blueprints in a gallery with filtering and search, preview steps and required variables, fill in a dynamic form, and create draft workflows with resolved prompts and profile assignments. Create custom blueprints via YAML or import from GitHub URLs. Lineage tracking connects workflows back to their source blueprint.
-<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/workflow-blueprints.png" alt="Stagent workflow blueprint gallery" width="1200" />
+<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/workflows-list.png" alt="Stagent workflow management" width="1200" />
 ### Documents
 #### Document Management
 Full document browser at `/documents` with table and grid views. Upload files with drag-and-drop, preview images/PDFs/markdown/code inline, search by filename and extracted text, and filter by processing status or project. Bulk delete, link/unlink to projects and tasks.
+| Table View | Grid View |
+|:-:|:-:|
+| <img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/documents-list.png" alt="Documents table view" width="580" /> | <img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/documents-grid.png" alt="Documents grid view" width="580" /> |
 #### Document Preprocessing
 Automatic text extraction on upload for five file types: text, PDF (pdf-parse), images (image-size), Office documents (mammoth/jszip), and spreadsheets (xlsx). Extracted text, processed paths, and processing errors are tracked per document.
@@ -157,22 +192,28 @@ Pending permission requests now surface through a shell-level approval presenter
 #### Schedules
 Time-based scheduling for agent tasks with human-friendly intervals (`5m`, `2h`, `1d`) and raw 5-field cron expressions. One-shot and recurring modes with pause/resume lifecycle, expiry limits, and max firings. Each firing creates a child task through the shared execution pipeline, and schedules can now target a runtime explicitly. Scheduler runs as a poll-based engine started via Next.js instrumentation hook.
+<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/schedules-list.png" alt="Stagent schedules" width="1200" />
 #### Micro-Visualizations
 Pure SVG chart primitives (Sparkline, MiniBar, DonutRing) with zero charting dependencies. Integrated into: homepage stats cards (7-day trends), activity feed (24h bar chart), project cards (completion donuts), monitor overview (success rate), and project detail (stacked status + 14-day sparkline). Full accessibility with `role="img"` and `aria-label`.
 #### Cost & Usage
 Provider-normalized metering tracks token and spend activity across tasks, resumes, workflow child tasks, schedules, task assist, and profile tests. The dedicated `Cost & Usage` surface adds summary cards, trend views, provider/model breakdowns, and budget-aware audit visibility on top of the usage ledger.
+<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/cost-usage-list.png" alt="Stagent cost and usage dashboard" width="1200" />
 ### UI & DevEx
 #### Inbox & Human-in-the-Loop
 When an agent needs approval or input, a notification appears in your inbox. Review tool permission requests with "Allow Once" / "Always Allow" / "Deny" buttons, answer agent questions, and see task completion summaries. Supports bulk dismiss and 10s polling.
-<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/inbox-approvals.png" alt="Stagent inbox approval flow" width="1200" />
+<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/inbox-list.png" alt="Stagent inbox approval flow" width="1200" />
 #### Monitoring
 Real-time agent log streaming via Server-Sent Events. Filter by task or event type, click entries to jump to task details, and auto-pause polling when the tab is hidden (Page Visibility API).
+<img src="https://raw.githubusercontent.com/navam-io/stagent/main/public/readme/monitor-list.png" alt="Stagent monitoring dashboard" width="1200" />
 #### Content Handling
 File upload with drag-and-drop in task creation. Type-aware content preview for text, markdown (via react-markdown), code, and JSON. Copy-to-clipboard and download-as-file for task outputs.
@@ -183,7 +224,7 @@ Configuration hub with provider-aware sections: Claude authentication (API key o
 The `npx stagent` entry point boots a Next.js server from the published npm package. It is built from `bin/cli.ts` into `dist/cli.js` using tsup, and serves as the primary distribution channel — no clone required.
 #### Database
-SQLite with WAL mode via better-sqlite3 + Drizzle ORM. Eight tables: `projects`, `tasks`, `workflows`, `agent_logs`, `notifications`, `documents`, `schedules`, `settings`. Self-healing bootstrap — tables are created on startup if missing.
+SQLite with WAL mode via better-sqlite3 + Drizzle ORM. Ten tables: `projects`, `tasks`, `workflows`, `agent_logs`, `notifications`, `documents`, `schedules`, `settings`, `learned_context`, `usage_ledger`. Self-healing bootstrap — tables are created on startup if missing.
 #### App Shell
 Responsive sidebar with collapsible icon-only mode, custom Stagent logo, tooltip navigation, dark/light/system theme, and OKLCH hue 250 blue-indigo color palette. Built on shadcn/ui (New York style) with PWA manifest and app icons. Routes: Home, Dashboard, Projects, Documents, Workflows, Profiles, Schedules, Inbox, Monitor, Settings.
@@ -222,66 +263,96 @@ npm run test:coverage  # Coverage report
 ```
 src/
 ├── app/                  # Next.js App Router pages
-│   ├── dashboard/        # Project overview
+│   ├── dashboard/        # Task kanban board
 │   ├── projects/[id]/    # Project detail
+│   ├── tasks/            # Task detail + creation (redirects to dashboard)
+│   ├── profiles/         # Agent profile gallery + detail + creation
 │   ├── documents/        # Document browser
-│   ├── workflows/        # Workflow management
+│   ├── workflows/        # Workflow management + blueprints
 │   ├── schedules/        # Schedule management
+│   ├── costs/            # Cost & usage dashboard
 │   ├── inbox/            # Notifications
 │   ├── monitor/          # Log streaming
 │   └── settings/         # Configuration
 ├── components/
 │   ├── dashboard/        # Homepage widgets + charts
 │   ├── tasks/            # Board, cards, panels
-│   ├── workflows/        # Workflow UI
+│   ├── profiles/         # Profile gallery, detail, form, learned context
+│   ├── workflows/        # Workflow UI + blueprints + swarm
 │   ├── documents/        # Document browser + upload
+│   ├── costs/            # Cost dashboard + filters
 │   ├── schedules/        # Schedule management
 │   ├── monitoring/       # Log viewer
 │   ├── notifications/    # Inbox + permission actions
-│   ├── settings/         # Auth, permissions, data mgmt
+│   ├── settings/         # Auth, permissions, budgets, data mgmt
 │   ├── shared/           # App shell, sidebar
 │   └── ui/               # shadcn/ui primitives
 └── lib/
-    ├── agents/           # Runtime adapters, provider integrations, profiles
+    ├── agents/           # Runtime adapters, profiles, learned context, pattern extraction
     ├── db/               # Schema, migrations
     ├── documents/        # Preprocessing + context builder
     ├── workflows/        # Engine + types + blueprints
     ├── schedules/        # Scheduler engine + interval parser
     ├── settings/         # Auth, permissions, helpers
+    ├── usage/            # Metering ledger + pricing registry
     ├── constants/        # Status transitions, colors
     ├── queries/          # Chart data aggregation
     ├── validators/       # Zod schemas
     └── utils/            # Shared helpers
 ```
-### API Endpoints
-| Endpoint | Method | Purpose |
-|----------|--------|---------|
-| `/api/projects/[id]` | GET/PUT/DELETE | Project CRUD |
-| `/api/tasks/[id]/execute` | POST | Fire-and-forget task dispatch (202) |
-| `/api/tasks/[id]/resume` | POST | Resume failed/cancelled task |
-| `/api/tasks/[id]/respond` | POST | Human response to agent prompt |
-| `/api/tasks/[id]/logs` | GET | Task log history |
-| `/api/logs/stream` | GET | SSE agent log stream |
-| `/api/notifications` | GET/POST | Notification management |
-| `/api/workflows` | POST | Create workflow |
-| `/api/workflows/[id]/execute` | POST | Execute workflow |
-| `/api/documents` | GET | List documents with joins |
-| `/api/documents/[id]` | PATCH/DELETE | Document metadata + deletion |
-| `/api/uploads` | POST | File upload |
-| `/api/schedules` | GET/POST | Schedule CRUD |
-| `/api/schedules/[id]` | GET/PATCH/DELETE | Schedule detail + updates |
-| `/api/permissions` | GET/POST/DELETE | Tool permission patterns |
-| `/api/settings/openai` | GET/POST | OpenAI Codex runtime settings |
-| `/api/settings/test` | POST | Provider-aware runtime connectivity test |
-| `/api/profiles` | GET | List agent profiles |
-| `/api/profiles/[id]/test` | POST | Run behavioral tests on a profile |
-| `/api/profiles/import` | POST | Import profile from GitHub URL |
-| `/api/blueprints` | GET/POST | List and create blueprints |
-| `/api/blueprints/[id]` | GET/DELETE | Blueprint detail and deletion |
-| `/api/blueprints/[id]/instantiate` | POST | Create workflow from blueprint |
-| `/api/blueprints/import` | POST | Import blueprint from GitHub URL |
+### API Endpoints (48 routes)
+| Domain | Endpoint | Method | Purpose |
+|--------|----------|--------|---------|
+| **Projects** | `/api/projects` | GET/POST | List and create projects |
+| | `/api/projects/[id]` | GET/PUT/DELETE | Project CRUD |
+| **Tasks** | `/api/tasks` | GET/POST | List and create tasks |
+| | `/api/tasks/[id]` | GET/PATCH/DELETE | Task detail, update, delete |
+| | `/api/tasks/[id]/execute` | POST | Fire-and-forget task dispatch (202) |
+| | `/api/tasks/[id]/resume` | POST | Resume failed/cancelled task |
+| | `/api/tasks/[id]/cancel` | POST | Cancel running task |
+| | `/api/tasks/[id]/respond` | POST | Human response to agent prompt |
+| | `/api/tasks/[id]/output` | GET | Task execution output |
+| | `/api/tasks/[id]/logs` | GET | Task log history |
+| | `/api/tasks/assist` | POST | AI task assist (description, subtasks, workflow recommendation) |
+| **Workflows** | `/api/workflows` | GET/POST | List and create workflows |
+| | `/api/workflows/[id]` | GET/PATCH/DELETE | Workflow detail, update, delete |
+| | `/api/workflows/[id]/execute` | POST | Execute workflow |
+| | `/api/workflows/[id]/status` | GET | Workflow execution status |
+| | `/api/workflows/[id]/steps/[stepId]/retry` | POST | Retry failed workflow step |
+| | `/api/workflows/from-assist` | POST | Create workflow from AI assist recommendation |
+| **Blueprints** | `/api/blueprints` | GET/POST | List and create blueprints |
+| | `/api/blueprints/[id]` | GET/DELETE | Blueprint detail and deletion |
+| | `/api/blueprints/[id]/instantiate` | POST | Create workflow from blueprint |
+| | `/api/blueprints/import` | POST | Import blueprint from GitHub URL |
+| **Documents** | `/api/documents` | GET | List documents with joins |
+| | `/api/documents/[id]` | GET/PATCH/DELETE | Document detail, metadata, deletion |
+| | `/api/documents/[id]/file` | GET | Download document file |
+| **Uploads** | `/api/uploads` | POST | File upload |
+| | `/api/uploads/[id]` | GET/DELETE | Upload detail and deletion |
+| | `/api/uploads/cleanup` | POST | Clean up orphaned uploads |
+| **Profiles** | `/api/profiles` | GET | List agent profiles |
+| | `/api/profiles/[id]` | GET/PUT/DELETE | Profile CRUD |
+| | `/api/profiles/[id]/test` | POST | Run behavioral tests on a profile |
+| | `/api/profiles/[id]/context` | GET/POST/PATCH | Learned context: version history, manual add, approve/reject/rollback |
+| | `/api/profiles/import` | POST | Import profile from GitHub URL |
+| **Notifications** | `/api/notifications` | GET/POST | List and create notifications |
+| | `/api/notifications/[id]` | PATCH/DELETE | Update and delete notification |
+| | `/api/notifications/mark-all-read` | POST | Mark all notifications as read |
+| | `/api/notifications/pending-approvals` | GET | Pending approval notifications |
+| | `/api/notifications/pending-approvals/stream` | GET | SSE stream for pending approvals |
+| **Schedules** | `/api/schedules` | GET/POST | Schedule CRUD |
+| | `/api/schedules/[id]` | GET/PATCH/DELETE | Schedule detail + updates |
+| **Settings** | `/api/settings` | GET/POST | General settings |
+| | `/api/settings/openai` | GET/POST | OpenAI Codex runtime settings |
+| | `/api/settings/test` | POST | Provider-aware runtime connectivity test |
+| | `/api/settings/budgets` | GET/POST | Budget configuration |
+| | `/api/permissions` | GET/POST/DELETE | Tool permission patterns |
+| **Monitoring** | `/api/logs/stream` | GET | SSE agent log stream |
+| **Platform** | `/api/command-palette/recent` | GET | Recent command palette items |
+| | `/api/data/clear` | POST | Clear all data |
+| | `/api/data/seed` | POST | Seed sample data |
 ---
@@ -297,29 +368,40 @@ All 14 features shipped across three layers:
 | **Core** | Project management, task board, agent integration, inbox notifications, monitoring dashboard |
 | **Polish** | Homepage dashboard, UX fixes, workflow engine, AI task assist, content handling, session management |
-### Post-MVP — Complete
-| Feature | What shipped |
-|---------|-------------|
-| **Document Management** | File attachments, preprocessing (5 formats), agent document context, document browser UI |
-| **Multi-Agent Routing** | Profile registry (4 profiles), task classifier, per-step profile assignment |
-| **Agent Profile Catalog** | 13 domain-specific profiles, GitHub import, behavioral testing, MCP server passthrough |
-| **Micro-Visualizations** | Sparklines, mini bars, donut rings — zero-dependency SVG charts |
-| **Tool Permission Persistence** | "Always Allow" patterns, pre-check bypass, Settings management |
-| **Scheduled Prompt Loops** | Cron + human-friendly intervals, one-shot/recurring, pause/resume lifecycle |
-| **Provider Runtimes** | Shared runtime registry with Claude Code and OpenAI Codex App Server adapters |
-| **Autonomous Loop Execution** | 4 stop conditions, iteration context chaining, pause/resume, loop status view |
-| **Workflow Blueprints** | 8 templates, gallery, YAML editor, dynamic forms, GitHub import, lineage tracking |
-| **Command Palette** | ⌘K palette with navigation, create actions, recent items, theme toggle |
-### Planned
-| Feature | Description |
-|---------|-------------|
-| **Multi-Agent Swarm** | Multi-agent orchestration with Mayor/Workers/Refinery roles |
-| **Agent Self-Improvement** | Agents learn patterns and update context with human approval |
-| **Document Output Generation** | Agent-generated documents as deliverables |
-| **Parallel Workflows** | Concurrent step execution within workflows |
+### Post-MVP — Complete (30 features)
+| Category | Feature | What shipped |
+|----------|---------|-------------|
+| **Documents** | File Attachments | Upload data layer with project/task linking |
+| | Document Preprocessing | Text extraction for 5 formats (text, PDF, images, Office, spreadsheets) |
+| | Agent Document Context | Automatic document injection into agent prompts |
+| | Document Browser | Table/grid views, search, filters, bulk operations at `/documents` |
+| | Document Output Generation | Agent-generated documents as deliverables |
+| **Agent Intelligence** | Multi-Agent Routing | Profile registry (4 profiles), task classifier, per-step profile assignment |
+| | Autonomous Loop Execution | 4 stop conditions, iteration context chaining, pause/resume, loop status view |
+| | Multi-Agent Swarm | Mayor → worker pool → refinery orchestration with retryable stages |
+| | AI Assist → Workflows | Bridge task assist into workflow engine with profile assignment and pattern selection |
+| | Agent Self-Improvement | Pattern extraction from logs, human-approved context evolution, versioned rollback |
+| **Agent Profiles** | Agent Profile Catalog | 13 domain-specific profiles, GitHub import, behavioral testing, MCP passthrough |
+| | Workflow Blueprints | 8 templates, gallery, YAML editor, dynamic forms, GitHub import, lineage tracking |
+| **UI Enhancement** | Ambient Approvals | Shell-level approval presenter on any route for fast supervision |
+| | Micro-Visualizations | Sparklines, mini bars, donut rings — zero-dependency SVG charts |
+| | Command Palette | ⌘K palette with navigation, create actions, recent items, theme toggle |
+| | Operational Surface | Cross-route composition with consistent layout, density, and interaction patterns |
+| | Profile Surface | Profile gallery stability, detail views, and behavioral testing UI |
+| | Accessibility | ARIA labels, keyboard navigation, focus management, screen reader support |
+| | UI Density Refinement | Tightened spacing, typography, and visual hierarchy across all routes |
+| | Kanban Board Operations | Inline editing, bulk operations, card animations, edit dialog |
+| | Board Context Persistence | Persisted filters, sort order, and project selection across sessions |
+| **Platform** | Scheduled Prompt Loops | Cron + human-friendly intervals, one-shot/recurring, pause/resume lifecycle |
+| | Tool Permission Persistence | "Always Allow" patterns, pre-check bypass, Settings management |
+| | Provider Runtimes | Shared runtime registry with Claude Code and OpenAI Codex App Server adapters |
+| | OpenAI Codex Runtime | Codex App Server integration with inbox approvals, logs, and thread resumption |
+| | Cross-Provider Profiles | Profile compatibility layer ensuring profiles work across Claude and Codex runtimes |
+| | Parallel Fork/Join | 2-5 concurrent research branches with synthesis step |
+| **Governance** | Usage Metering Ledger | Provider-normalized token and spend tracking across all execution paths |
+| | Spend Budget Guardrails | Per-project and global budgets with enforcement and alerts |
+| | Cost & Usage Dashboard | Summary cards, trend views, provider/model breakdowns, budget audit visibility |
 ---

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "stagent",
-  "version": "0.1.9",
+  "version": "0.1.11",
   "description": "Governed AI agent workspace for supervised local execution, workflows, documents, and provider runtimes.",
   "keywords": [
     "ai",
@@ -51,7 +51,6 @@
   },
   "dependencies": {
     "@anthropic-ai/claude-agent-sdk": "^0.2.71",
-    "@anthropic-ai/sdk": "^0.78.0",
     "@dnd-kit/core": "^6.3.1",
     "@dnd-kit/sortable": "^10.0.0",
     "@dnd-kit/utilities": "^3.2.2",

package/public/readme/cost-usage-list.png ADDED Viewed

Binary file

package/public/readme/dashboard-bulk-select.png ADDED Viewed

Binary file

package/public/readme/dashboard-card-edit.png ADDED Viewed

Binary file

package/public/readme/dashboard-create-form-ai-applied.png ADDED Viewed

Binary file

package/public/readme/dashboard-create-form-ai-assist.png ADDED Viewed

Binary file

package/public/readme/dashboard-create-form-empty.png ADDED Viewed

Binary file

package/public/readme/dashboard-create-form-filled.png ADDED Viewed

Binary file

package/public/readme/dashboard-filtered.png ADDED Viewed

Binary file

package/public/readme/dashboard-list.png ADDED Viewed

Binary file

package/public/readme/dashboard-sorted.png ADDED Viewed

Binary file

package/public/readme/dashboard-workflow-confirm.png ADDED Viewed

Binary file

package/public/readme/documents-grid.png ADDED Viewed

Binary file

package/public/readme/documents-list.png ADDED Viewed

Binary file

package/public/readme/home-below-fold.png ADDED Viewed

Binary file

package/public/readme/home-list.png ADDED Viewed

Binary file

package/public/readme/inbox-list.png ADDED Viewed

Binary file

package/public/readme/monitor-list.png ADDED Viewed

Binary file

package/public/readme/profiles-list.png ADDED Viewed

Binary file

package/public/readme/projects-detail.png ADDED Viewed

Binary file

package/public/readme/projects-list.png ADDED Viewed

Binary file

package/public/readme/schedules-list.png ADDED Viewed

Binary file

package/public/readme/settings-list.png ADDED Viewed

Binary file

package/public/readme/workflows-list.png ADDED Viewed

Binary file

package/src/app/api/profiles/route.ts CHANGED Viewed

@@ -13,7 +13,6 @@ export async function GET() {
     allowedTools: p.allowedTools,
     mcpServers: p.mcpServers,
     canUseToolPolicy: p.canUseToolPolicy,
-    temperature: p.temperature,
     maxTurns: p.maxTurns,
     outputFormat: p.outputFormat,
     version: p.version,

package/src/app/api/workflows/from-assist/route.ts ADDED Viewed

@@ -0,0 +1,143 @@
+import { NextRequest, NextResponse } from "next/server";
+import { db } from "@/lib/db";
+import { workflows, tasks } from "@/lib/db/schema";
+import { eq } from "drizzle-orm";
+import type { WorkflowDefinition } from "@/lib/workflows/types";
+import { validateWorkflowDefinition } from "@/lib/workflows/definition-validation";
+import { validateWorkflowDefinitionAssignments } from "@/lib/agents/profiles/assignment-validation";
+import { executeWorkflow } from "@/lib/workflows/engine";
+/** Shape of the optional parent task that is created alongside the workflow. */
+interface FromAssistParentTask {
+  title: string;
+  description: string;
+  agentProfile?: string;
+}
+/**
+ * JSON payload read by the POST handler below. Every field is optional at the
+ * type level; the handler rejects requests that lack `name` or `definition`.
+ */
+interface FromAssistBody {
+  /** Workflow name; the handler trims it before storing. */
+  name?: string;
+  /** Workflow definition; its `steps` become one task each. */
+  definition?: WorkflowDefinition;
+  /** Project to attach the workflow and tasks to; stored as null when absent. */
+  projectId?: string;
+  /** Agent used for the parent task and as fallback for steps without their own. */
+  assignedAgent?: string;
+  /** Task priority; the handler falls back to 2 when omitted. */
+  priority?: number;
+  /** When true, the handler kicks off workflow execution right after creation. */
+  executeImmediately?: boolean;
+  /** When present with a title, a task without a workflowId is created too. */
+  parentTask?: FromAssistParentTask;
+}
+/**
+ * Creates a workflow from an AI-assist proposal.
+ *
+ * Validates the payload, then inserts (in one transaction) an optional parent
+ * task, the workflow row, and one task per definition step. When
+ * `executeImmediately` is set, workflow execution is started without awaiting it.
+ *
+ * Responses:
+ * - 400 when the body is not a JSON object, `name` is missing/blank, `definition`
+ *   is missing, or either validator reports an error.
+ * - 500 when the transaction throws.
+ * - 201 with `{ workflow, taskIds, parentTaskId, status }` on success.
+ */
+export async function POST(req: NextRequest) {
+  // Malformed or non-object JSON is a client error; without this guard the
+  // rejection from req.json() (or destructuring `null`) would surface as a 500.
+  let body: FromAssistBody;
+  try {
+    const parsed: unknown = await req.json();
+    if (typeof parsed !== "object" || parsed === null || Array.isArray(parsed)) {
+      return NextResponse.json(
+        { error: "Request body must be a JSON object" },
+        { status: 400 }
+      );
+    }
+    body = parsed as FromAssistBody;
+  } catch {
+    return NextResponse.json({ error: "Invalid JSON body" }, { status: 400 });
+  }
+  const { name, projectId, definition, priority, assignedAgent, executeImmediately, parentTask } = body;
+  // The body is untrusted: a non-string name (e.g. a number) must not reach .trim()
+  const trimmedName = typeof name === "string" ? name.trim() : "";
+  if (!trimmedName) {
+    return NextResponse.json({ error: "Name is required" }, { status: 400 });
+  }
+  if (!definition) {
+    return NextResponse.json(
+      { error: "Definition must include pattern and at least one step" },
+      { status: 400 }
+    );
+  }
+  const definitionError = validateWorkflowDefinition(definition);
+  if (definitionError) {
+    return NextResponse.json({ error: definitionError }, { status: 400 });
+  }
+  const compatibilityError = validateWorkflowDefinitionAssignments(definition);
+  if (compatibilityError) {
+    return NextResponse.json({ error: compatibilityError }, { status: 400 });
+  }
+  // Transaction: create workflow + tasks + optional parent task atomically
+  const workflowId = crypto.randomUUID();
+  const now = new Date();
+  const taskIds: string[] = [];
+  let parentTaskId: string | null = null;
+  try {
+    db.transaction((tx) => {
+      // Create parent task (no workflowId — visible on dashboard)
+      if (parentTask?.title) {
+        parentTaskId = crypto.randomUUID();
+        tx.insert(tasks)
+          .values({
+            id: parentTaskId,
+            title: parentTask.title,
+            description: parentTask.description || null,
+            projectId: projectId || null,
+            workflowId: null,
+            status: executeImmediately ? "running" : "planned",
+            assignedAgent: assignedAgent ?? null,
+            agentProfile: parentTask.agentProfile ?? null,
+            priority: priority ?? 2,
+            createdAt: now,
+            updatedAt: now,
+          })
+          .run();
+      }
+      // Store sourceTaskId in definition for parent↔workflow linkage
+      const defToStore = parentTaskId
+        ? { ...definition, sourceTaskId: parentTaskId }
+        : definition;
+      // Create workflow
+      tx.insert(workflows)
+        .values({
+          id: workflowId,
+          name: trimmedName,
+          projectId: projectId || null,
+          definition: JSON.stringify(defToStore),
+          status: executeImmediately ? "active" : "draft",
+          createdAt: now,
+          updatedAt: now,
+        })
+        .run();
+      // Create tasks for each step (with workflowId — hidden from dashboard)
+      for (const step of definition.steps) {
+        const taskId = crypto.randomUUID();
+        taskIds.push(taskId);
+        tx.insert(tasks)
+          .values({
+            id: taskId,
+            title: step.name,
+            description: step.prompt,
+            projectId: projectId || null,
+            workflowId,
+            status: "planned",
+            assignedAgent: step.assignedAgent ?? assignedAgent ?? null,
+            agentProfile: step.agentProfile ?? null,
+            priority: priority ?? 2,
+            createdAt: now,
+            updatedAt: now,
+          })
+          .run();
+      }
+    });
+  } catch (error) {
+    console.error("Failed to create workflow from assist:", error);
+    return NextResponse.json(
+      { error: "Failed to create workflow and tasks" },
+      { status: 500 }
+    );
+  }
+  // Fire-and-forget execution if requested; `void` marks the promise as
+  // intentionally not awaited, and failures are only logged.
+  if (executeImmediately) {
+    void executeWorkflow(workflowId).catch((error) => {
+      console.error(`Workflow ${workflowId} execution failed:`, error);
+    });
+  }
+  const [created] = await db.select().from(workflows).where(eq(workflows.id, workflowId));
+  return NextResponse.json(
+    {
+      workflow: created,
+      taskIds,
+      parentTaskId,
+      status: executeImmediately ? "started" : "created",
+    },
+    { status: 201 }
+  );
+}

package/src/app/dashboard/page.tsx CHANGED Viewed

@@ -1,7 +1,7 @@
 import { Suspense } from "react";
 import { db } from "@/lib/db";
-import { tasks, projects } from "@/lib/db/schema";
-import { desc } from "drizzle-orm";
+import { tasks, projects, workflows } from "@/lib/db/schema";
+import { desc, isNull } from "drizzle-orm";
 import { KanbanBoard } from "@/components/tasks/kanban-board";
 import { SkeletonBoard } from "@/components/tasks/skeleton-board";
 import type { TaskItem } from "@/components/tasks/task-card";
@@ -9,9 +9,11 @@ import type { TaskItem } from "@/components/tasks/task-card";
 export const dynamic = "force-dynamic";
 async function BoardContent() {
+  // Only show parent/standalone tasks — hide workflow step tasks
   const allTasks = await db
     .select()
     .from(tasks)
+    .where(isNull(tasks.workflowId))
     .orderBy(tasks.priority, desc(tasks.createdAt));
   const allProjects = await db
@@ -22,10 +24,30 @@ async function BoardContent() {
   // Build project name lookup for task cards
   const projectMap = new Map(allProjects.map((p) => [p.id, p.name]));
+  // Look up linked workflows for parent tasks (via sourceTaskId in definition JSON)
+  const allWorkflows = await db
+    .select({ id: workflows.id, definition: workflows.definition, status: workflows.status })
+    .from(workflows);
+  const linkedWorkflowMap = new Map<string, { workflowId: string; workflowStatus: string }>();
+  for (const w of allWorkflows) {
+    try {
+      const def = JSON.parse(w.definition);
+      if (def.sourceTaskId) {
+        linkedWorkflowMap.set(def.sourceTaskId, {
+          workflowId: w.id,
+          workflowStatus: w.status,
+        });
+      }
+    } catch { /* skip invalid JSON */ }
+  }
   // Serialize Date objects for client component consumption
   const serializedTasks: TaskItem[] = allTasks.map((t) => ({
     ...t,
     projectName: t.projectId ? projectMap.get(t.projectId) ?? undefined : undefined,
+    linkedWorkflowId: linkedWorkflowMap.get(t.id)?.workflowId,
+    linkedWorkflowStatus: linkedWorkflowMap.get(t.id)?.workflowStatus,
     createdAt: t.createdAt.toISOString(),
     updatedAt: t.updatedAt.toISOString(),
   }));