npm - agda-mcp-server - Versions diffs - 0.4.0 - Mend

agda-mcp-server 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (39) hide show

package/LICENSE +23 -0
package/README.md +472 -0
package/dist/agda/advanced-queries.d.ts +52 -0
package/dist/agda/advanced-queries.js +249 -0
package/dist/agda/advanced-queries.js.map +1 -0
package/dist/agda/batch.d.ts +6 -0
package/dist/agda/batch.js +59 -0
package/dist/agda/batch.js.map +1 -0
package/dist/agda/expression-operations.d.ts +17 -0
package/dist/agda/expression-operations.js +86 -0
package/dist/agda/expression-operations.js.map +1 -0
package/dist/agda/goal-operations.d.ts +29 -0
package/dist/agda/goal-operations.js +156 -0
package/dist/agda/goal-operations.js.map +1 -0
package/dist/agda/response-parsing.d.ts +4 -0
package/dist/agda/response-parsing.js +44 -0
package/dist/agda/response-parsing.js.map +1 -0
package/dist/agda/session.d.ts +88 -0
package/dist/agda/session.js +340 -0
package/dist/agda/session.js.map +1 -0
package/dist/agda/types.d.ts +99 -0
package/dist/agda/types.js +5 -0
package/dist/agda/types.js.map +1 -0
package/dist/agda-process.d.ts +4 -0
package/dist/agda-process.js +14 -0
package/dist/agda-process.js.map +1 -0
package/dist/index.d.ts +11 -0
package/dist/index.js +91 -0
package/dist/index.js.map +1 -0
package/dist/tools/navigation.d.ts +3 -0
package/dist/tools/navigation.js +192 -0
package/dist/tools/navigation.js.map +1 -0
package/dist/tools/proof.d.ts +3 -0
package/dist/tools/proof.js +250 -0
package/dist/tools/proof.js.map +1 -0
package/dist/tools/session.d.ts +3 -0
package/dist/tools/session.js +108 -0
package/dist/tools/session.js.map +1 -0
package/package.json +65 -0

package/LICENSE ADDED Viewed

@@ -0,0 +1,23 @@
+<!-- markdownlint-disable-file MD041 -->
+MIT License
+Copyright (c) 2026 Invariant Holdings, LLC
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

package/README.md ADDED Viewed

@@ -0,0 +1,472 @@
+# agda-mcp-server
+[![npm version](https://img.shields.io/npm/v/agda-mcp-server)](https://www.npmjs.com/package/agda-mcp-server)
+[![CI](https://github.com/LionOfJewdah/agda-mcp-server/actions/workflows/ci.yml/badge.svg)](https://github.com/LionOfJewdah/agda-mcp-server/actions/workflows/ci.yml)
+[![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](LICENSE)
+[![Node >=24](https://img.shields.io/badge/node-%3E%3D24-339933?logo=node.js&logoColor=white)](package.json)
+`agda-mcp-server` is a stateful [Model Context Protocol](https://modelcontextprotocol.io)
+server for interactive [Agda](https://agda.readthedocs.io/) proof development.
+It keeps a long-running Agda process alive in `--interaction-json` mode so MCP
+clients can use Agda the way a human does in an editor: load a file, inspect
+goals, split on variables, refine holes, infer types, normalize expressions,
+search the local environment, and iterate on proofs without restarting Agda for
+every request.
+## What this server provides
+- Persistent interactive Agda sessions.
+- Goal-aware proof actions over MCP.
+- Stateless batch type-checking when you only want a quick validation pass.
+- Navigation and scope-inspection helpers for large Agda codebases.
+- A small extension system for project-specific or domain-specific tools.
+## How it works
+The server launches Agda in `--interaction-json` mode and communicates through
+Agda's IOTCM protocol over standard input and output.
+In practice, the workflow is:
+1. Load an Agda file with `agda_load`.
+2. Agda assigns interaction point IDs to all open goals.
+3. Use those goal IDs with proof-oriented tools such as `agda_goal_type`,
+   `agda_case_split`, `agda_refine`, or `agda_give`.
+4. Reload the file after applying source edits so Agda can refresh its goals.
+This statefulness is the main difference between `agda_load` and the stateless
+`agda_typecheck` command.
+## Requirements
+Before using the server, make sure you have:
+- Node.js `>= 24`
+- Either an Agda installation available as `agda` on your `PATH`, or
+  a repo-local pinned runner at `tooling/scripts/run-pinned-agda.sh`
+If both are available, the pinned runner is preferred.
+## Installation
+### From source
+```bash
+npm install
+npm run build
+```
+This produces the distributable server in `dist/`.
+### Local CLI entry point
+After building, the executable entry point is:
+```bash
+node dist/index.js
+```
+The published package also exposes the `agda-mcp-server` binary through the
+`bin` field in `package.json`.
+## Quick start
+Start the server on stdio with a project root:
+```bash
+AGDA_MCP_ROOT=/path/to/agda/project node dist/index.js
+```
+If `AGDA_MCP_ROOT` is omitted, the current working directory is used.
+## Examples
+### Example: load a file and inspect goals
+```text
+1. agda_load file="Nat/Properties.agda"
+  → reports load status and goal IDs
+2. agda_session_status
+  → shows the loaded file and active goals
+3. agda_goal_type goalId=0
+  → returns the local context and expected type for `?0`
+```
+### Example: refine a proof hole
+```text
+1. agda_goal_type goalId=0
+  → inspect the goal before editing
+2. agda_refine goalId=0 expr="suc"
+  → apply a constructor or function
+3. agda_metas
+  → inspect any new subgoals created by the refinement
+```
+### Example: check an expression before committing to it
+```text
+1. agda_elaborate goalId=0 expr="map f xs"
+  → see Agda's elaborated form
+2. agda_infer goalId=0 expr="map f xs"
+  → confirm the inferred type
+3. agda_give goalId=0 expr="map f xs"
+  → fill the goal once the expression looks correct
+```
+### Example: stateless validation in CI or editor automation
+```text
+agda_typecheck file="MyModule.agda"
+```
+Use this when you want errors and warnings without creating a persistent session.
+## MCP client configuration
+### Claude Code
+Add a server entry similar to this in your Claude Code settings:
+```json
+{
+  "mcpServers": {
+    "agda": {
+      "command": "node",
+      "args": ["mcp/agda-mcp-server/dist/index.js"],
+      "env": {
+        "AGDA_MCP_ROOT": "."
+      }
+    }
+  }
+}
+```
+### Other MCP clients
+Any MCP client that can spawn a stdio server can run this package. Use the same
+pattern:
+- command: `node`
+- args: path to `dist/index.js`
+- environment: set `AGDA_MCP_ROOT` to the Agda project root
+## Session model
+This server is intentionally stateful.
+- One shared Agda session is kept alive.
+- The session tracks the currently loaded file.
+- Goal IDs are meaningful only for the currently loaded file and current Agda state.
+- If the file changes on disk, reload it with `agda_load` before continuing.
+If you only want a quick compile check and do not need goals, use
+`agda_typecheck` instead of creating a session.
+## Tool reference
+### Session management
+| Tool | Description |
+| --- | --- |
+| `agda_load` | Load and type-check a file, establish the active interactive session, and return current goal IDs |
+| `agda_session_status` | Show the currently loaded file and available goal IDs |
+| `agda_typecheck` | Run a stateless batch type-check without creating or updating the interactive session |
+### Goal inspection and proof interaction
+These tools require a file to be loaded first via `agda_load`.
+| Tool | Description |
+| --- | --- |
+| `agda_goal_type` | Show the goal type and local context for one interaction point |
+| `agda_metas` | List unsolved goals in the loaded file |
+| `agda_case_split` | Case-split on a variable in a goal and return the generated clauses |
+| `agda_give` | Fill a goal with a proposed expression |
+| `agda_refine` | Refine a goal by applying a function or constructor |
+| `agda_auto` | Attempt proof search for a single goal |
+| `agda_auto_all` | Attempt proof search across all goals |
+| `agda_solve_all` | Solve goals that have unique solutions |
+| `agda_compute` | Normalize an expression, either in goal context or at top level |
+| `agda_infer` | Infer the type of an expression, either in goal context or at top level |
+| `agda_constraints` | Show Agda's current constraint set |
+| `agda_elaborate` | Elaborate an expression in a goal context |
+| `agda_helper_function` | Generate a helper function type from a goal-local expression |
+### Navigation and environment inspection
+| Tool | Description |
+| --- | --- |
+| `agda_read_module` | Read a module from disk with line numbers |
+| `agda_list_modules` | List Agda modules under a tier or directory segment |
+| `agda_check_postulates` | Check a file for `postulate` declarations |
+| `agda_search_definitions` | Search source files for matching identifiers or text |
+| `agda_why_in_scope` | Explain why a name is in scope, either at top level or in a goal |
+| `agda_show_module` | Show what a module exports |
+| `agda_search_about` | Search the loaded environment for names whose types mention the query |
+## Typical interactive workflow
+```text
+1. agda_load file="MyModule.agda"
+     → Status: OK, 3 unsolved goals (?0, ?1, ?2)
+2. agda_goal_type goalId=0
+     → Context: (x : Nat), (p : x ≡ zero)
+     → Goal: x + zero ≡ x
+3. agda_auto goalId=0
+     → No automatic solution found.
+4. agda_elaborate goalId=0 expr="+-identityʳ x"
+     → Elaborated: +-identityʳ x : x + zero ≡ x
+5. agda_give goalId=0 expr="+-identityʳ x"
+     → Goal solved.
+6. Apply edits to the source file if needed.
+7. agda_load file="MyModule.agda"
+     → Reload to refresh remaining goals.
+```
+## Stateless vs stateful operations
+Use `agda_typecheck` when you want:
+- a quick yes or no answer about whether a file checks,
+- error and warning output only,
+- no interactive goal information,
+- no persistent Agda session.
+Use `agda_load` when you want:
+- stable goal IDs,
+- interactive commands against holes,
+- proof search, refinement, elaboration, and local type information,
+- a persistent Agda subprocess.
+## Environment variables
+| Variable | Default | Description |
+| --- | --- | --- |
+| `AGDA_MCP_ROOT` | `cwd` | Root directory used to resolve Agda files and relative extension paths |
+| `AGDA_MCP_EXTENSION_MODULES` | unset | Colon-separated list of extension module paths or package specifiers |
+## Extension modules
+The core server is intentionally generic. Project-specific workflows can be added
+through external extension modules loaded at startup.
+Values in `AGDA_MCP_EXTENSION_MODULES` are resolved as follows:
+- absolute filesystem paths are used directly,
+- relative filesystem paths are resolved relative to `AGDA_MCP_ROOT`,
+- `file://` specifiers are used as-is,
+- anything else is treated as a normal module specifier.
+An extension can export a single `register` function, or several functions
+whose names begin with `register`. Each such function receives the MCP server
+instance, the shared `AgdaSession`, and the resolved repo root.
+### Example extension
+```typescript
+import { McpServer } from "@modelcontextprotocol/sdk/server/mcp.js";
+import { z } from "zod";
+import type { AgdaSession } from "agda-mcp-server";
+export function register(
+  server: McpServer,
+  session: AgdaSession,
+  repoRoot: string,
+): void {
+  server.tool(
+    "my_custom_tool",
+    "Example custom Agda tool",
+    {
+      expr: z.string(),
+    },
+    async ({ expr }) => {
+      const loadedFile = session.getLoadedFile();
+      return {
+        content: [
+          {
+            type: "text",
+            text: `repoRoot=${repoRoot}\nloadedFile=${loadedFile ?? "(none)"}\nexpr=${expr}`,
+          },
+        ],
+      };
+    },
+  );
+}
+```
+Then start the server with something like:
+```bash
+AGDA_MCP_ROOT=. AGDA_MCP_EXTENSION_MODULES=dist/my-extension.js node dist/index.js
+```
+## Development
+### Scripts
+| Script | Purpose |
+| --- | --- |
+| `npm run build` | Compile TypeScript into `dist/` |
+| `npm run dev` | Run the TypeScript entry point directly with `tsx` |
+| `npm test` | Build first, then run the Node test suite |
+| `npm run test:integration` | Run the Agda-backed integration test scaffold |
+| `npm run verify` | Run tests and verify package contents with `npm pack --dry-run` |
+### Local development flow
+```bash
+npm install
+npm run build
+npm test
+npm run verify
+```
+### Tests
+The test suite currently focuses on lightweight, deterministic behavior such as:
+- response parsing,
+- Agda command string escaping,
+- Agda binary discovery,
+- session cleanup behavior.
+The tests intentionally avoid depending on a live Agda installation so they can
+run reliably in normal CI environments.
+An integration scaffold is also available for environments where Agda is
+installed:
+```bash
+RUN_AGDA_INTEGRATION=1 npm run test:integration
+```
+## Publishing
+The package is configured for public npm publishing.
+Before publishing:
+1. Update the version in `package.json`.
+2. Run `npm run verify`.
+3. Publish with npm using your normal release process.
+The `prepublishOnly` script runs verification automatically before publish.
+Only the following files are published (in addition to `package.json`, which npm always includes):
+- `dist/`
+- `README.md`
+- `LICENSE`
+## Continuous integration
+This repository includes a GitHub Actions workflow at
+[.github/workflows/ci.yml](.github/workflows/ci.yml) that:
+- installs dependencies with `npm ci`,
+- runs on pushes and pull requests,
+- verifies the package on Node.js 24.
+## Community and maintenance files
+This repository also includes:
+- [CONTRIBUTING.md](CONTRIBUTING.md) for contributor setup and workflow guidance
+- [SECURITY.md](SECURITY.md) for vulnerability reporting guidance
+- [CHANGELOG.md](CHANGELOG.md) for release history
+- [.github/ISSUE_TEMPLATE/config.yml](.github/ISSUE_TEMPLATE/config.yml) and issue forms for structured reports
+- [.github/pull_request_template.md](.github/pull_request_template.md) for consistent pull requests
+- [.nvmrc](.nvmrc) and the `packageManager` field in [package.json](package.json) for local toolchain alignment
+## Architecture overview
+```text
+src/
+  index.ts
+    Bootstraps the MCP server, registers core tools, and loads extensions.
+  agda-process.ts
+    Public barrel for the Agda integration layer.
+  agda/
+    session.ts
+      Owns the Agda subprocess, transport, buffering, and session state.
+    batch.ts
+      Stateless batch type-checking.
+    goal-operations.ts
+      Goal-centric interactive commands.
+    expression-operations.ts
+      Expression normalization and type inference.
+    advanced-queries.ts
+      Constraints, scope, elaboration, module inspection, and search.
+    response-parsing.ts
+      Helpers for extracting user-facing messages from Agda responses.
+    types.ts
+      Shared types for the Agda integration layer.
+  tools/
+    session.ts
+      MCP tool registration for loading and status operations.
+    proof.ts
+      MCP tool registration for goal-oriented proof actions.
+    navigation.ts
+      MCP tool registration for source and environment navigation.
+```
+## Protocol notes
+The server communicates with Agda using the
+[IOTCM protocol](https://hackage.haskell.org/package/Agda-2.7.0.1/docs/Agda-Interaction-Base.html)
+over `--interaction-json` mode.
+At a high level:
+- commands are written to Agda on stdin as IOTCM strings,
+- Agda emits newline-delimited JSON responses on stdout,
+- stderr output is captured for diagnostics,
+- session completion is inferred from status and running-info messages.
+## Troubleshooting
+### `agda` cannot be found
+Make sure either:
+- `agda` is installed and on your `PATH`, or
+- `tooling/scripts/run-pinned-agda.sh` exists in the repo root.
+### Goal IDs stop working
+Goal IDs are tied to the current loaded file and the current Agda state. If the
+source changed or you applied a case split, reload the file with `agda_load`.
+### Top-level commands fail with "No file loaded"
+Most interactive commands require an active loaded file because they need the
+Agda session context. Start with `agda_load`.
+### Proof search or elaboration returns unexpected output
+Agda response formatting varies across commands. When in doubt, inspect the goal
+again with `agda_goal_type` and retry with a simpler expression.
+## License
+This project is licensed under the MIT License. External extension modules may
+use different licenses.

package/dist/agda/advanced-queries.d.ts ADDED Viewed

@@ -0,0 +1,52 @@
+import type { AgdaSessionContext, AgdaResponse, WhyInScopeResult, ElaborateResult, HelperFunctionResult, ModuleContentsResult, SearchAboutResult, AutoResult, GoalTypeContextInferResult } from "./types.js";
+/**
+ * Show current constraints.
+ *
+ * @param ctx - The Agda session context to query.
+ * @returns A promise resolving to an object with a `text` string and a `raw`
+ *   array of `AgdaResponse` values. NOTE(review): `text` is presumably the
+ *   rendered constraint set and `raw` the unprocessed responses — confirm
+ *   against the implementation.
+ */
+export declare function constraints(ctx: AgdaSessionContext): Promise<{
+    text: string;
+    raw: AgdaResponse[];
+}>;
+/**
+ * Solve all goals that have unique solutions.
+ *
+ * @param ctx - The Agda session context to operate on.
+ * @returns A promise resolving to an object with a `solutions` string array
+ *   and a `raw` array of `AgdaResponse` values. NOTE(review): the format of
+ *   each `solutions` entry is not visible from this declaration — confirm
+ *   against the implementation.
+ */
+export declare function solveAll(ctx: AgdaSessionContext): Promise<{
+    solutions: string[];
+    raw: AgdaResponse[];
+}>;
+/**
+ * Explain why a name is in scope at a given goal.
+ *
+ * @param ctx - The Agda session context to query.
+ * @param goalId - Numeric ID of the goal in whose context the name is looked up.
+ * @param name - The name to explain.
+ * @returns A promise resolving to a `WhyInScopeResult`.
+ */
+export declare function whyInScope(ctx: AgdaSessionContext, goalId: number, name: string): Promise<WhyInScopeResult>;
+/**
+ * Explain why a name is in scope at the top level.
+ *
+ * Counterpart of `whyInScope` that takes no goal ID.
+ *
+ * @param ctx - The Agda session context to query.
+ * @param name - The name to explain.
+ * @returns A promise resolving to a `WhyInScopeResult`.
+ */
+export declare function whyInScopeTopLevel(ctx: AgdaSessionContext, name: string): Promise<WhyInScopeResult>;
+/**
+ * Elaborate an expression in a goal context (normalize and show full form).
+ *
+ * @param ctx - The Agda session context to query.
+ * @param goalId - Numeric ID of the goal whose context is used.
+ * @param expr - The expression to elaborate.
+ * @returns A promise resolving to an `ElaborateResult`.
+ */
+export declare function elaborate(ctx: AgdaSessionContext, goalId: number, expr: string): Promise<ElaborateResult>;
+/**
+ * Generate a helper function type for an expression in a goal context.
+ *
+ * @param ctx - The Agda session context to query.
+ * @param goalId - Numeric ID of the goal whose context is used.
+ * @param expr - The expression to generate a helper function type for.
+ * @returns A promise resolving to a `HelperFunctionResult`.
+ */
+export declare function helperFunction(ctx: AgdaSessionContext, goalId: number, expr: string): Promise<HelperFunctionResult>;
+/**
+ * Show the contents of a module in a goal context.
+ *
+ * @param ctx - The Agda session context to query.
+ * @param goalId - Numeric ID of the goal whose context is used.
+ * @param moduleName - Name of the module to inspect.
+ * @returns A promise resolving to a `ModuleContentsResult`.
+ */
+export declare function showModuleContents(ctx: AgdaSessionContext, goalId: number, moduleName: string): Promise<ModuleContentsResult>;
+/**
+ * Show the contents of a module at the top level.
+ *
+ * Counterpart of `showModuleContents` that takes no goal ID.
+ *
+ * @param ctx - The Agda session context to query.
+ * @param moduleName - Name of the module to inspect.
+ * @returns A promise resolving to a `ModuleContentsResult`.
+ */
+export declare function showModuleContentsTopLevel(ctx: AgdaSessionContext, moduleName: string): Promise<ModuleContentsResult>;
+/**
+ * Search for definitions matching a query string.
+ *
+ * NOTE(review): presumably backs the `agda_search_about` tool, which the
+ * README describes as searching the loaded environment for names whose types
+ * mention the query — confirm against the implementation.
+ *
+ * @param ctx - The Agda session context to query.
+ * @param query - The search query string.
+ * @returns A promise resolving to a `SearchAboutResult`.
+ */
+export declare function searchAbout(ctx: AgdaSessionContext, query: string): Promise<SearchAboutResult>;
+/**
+ * Auto-solve all goals.
+ *
+ * @param ctx - The Agda session context to operate on.
+ * @returns A promise resolving to an `AutoResult`.
+ */
+export declare function autoAll(ctx: AgdaSessionContext): Promise<AutoResult>;
+/**
+ * Get the goal type, context, and inferred type of an expression
+ * in a goal context (combined query).
+ *
+ * @param ctx - The Agda session context to query.
+ * @param goalId - Numeric ID of the goal whose type and context are requested.
+ * @param expr - The expression whose type is inferred in that goal's context.
+ * @returns A promise resolving to a `GoalTypeContextInferResult`.
+ */
+export declare function goalTypeContextInfer(ctx: AgdaSessionContext, goalId: number, expr: string): Promise<GoalTypeContextInferResult>;