npm - @dedesfr/prompter - Versions diffs - 0.8.23 → 1.0.0 - Mend

@dedesfr/prompter 0.8.23 → 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (247)

package/CHANGELOG.md +70 -0
package/README.md +105 -77
package/dist/cli/index.js +25 -1
package/dist/cli/index.js.map +1 -1
package/dist/commands/init.d.ts +1 -7
package/dist/commands/init.d.ts.map +1 -1
package/dist/commands/init.js +60 -299
package/dist/commands/init.js.map +1 -1
package/dist/commands/login.d.ts +4 -0
package/dist/commands/login.d.ts.map +1 -0
package/dist/commands/login.js +56 -0
package/dist/commands/login.js.map +1 -0
package/dist/commands/logout.d.ts +4 -0
package/dist/commands/logout.d.ts.map +1 -0
package/dist/commands/logout.js +14 -0
package/dist/commands/logout.js.map +1 -0
package/dist/commands/update.d.ts.map +1 -1
package/dist/commands/update.js +31 -41
package/dist/commands/update.js.map +1 -1
package/dist/commands/whoami.d.ts +4 -0
package/dist/commands/whoami.d.ts.map +1 -0
package/dist/commands/whoami.js +42 -0
package/dist/commands/whoami.js.map +1 -0
package/dist/core/auth-store.d.ts +10 -0
package/dist/core/auth-store.d.ts.map +1 -0
package/dist/core/auth-store.js +39 -0
package/dist/core/auth-store.js.map +1 -0
package/dist/core/configurators/slash/antigravity.d.ts +2 -5
package/dist/core/configurators/slash/antigravity.d.ts.map +1 -1
package/dist/core/configurators/slash/antigravity.js +2 -57
package/dist/core/configurators/slash/antigravity.js.map +1 -1
package/dist/core/configurators/slash/base.d.ts +6 -18
package/dist/core/configurators/slash/base.d.ts.map +1 -1
package/dist/core/configurators/slash/base.js +8 -77
package/dist/core/configurators/slash/base.js.map +1 -1
package/dist/core/configurators/slash/claude.d.ts +2 -5
package/dist/core/configurators/slash/claude.d.ts.map +1 -1
package/dist/core/configurators/slash/claude.js +2 -57
package/dist/core/configurators/slash/claude.js.map +1 -1
package/dist/core/configurators/slash/codex.d.ts +2 -5
package/dist/core/configurators/slash/codex.d.ts.map +1 -1
package/dist/core/configurators/slash/codex.js +2 -57
package/dist/core/configurators/slash/codex.js.map +1 -1
package/dist/core/configurators/slash/droid.d.ts +2 -5
package/dist/core/configurators/slash/droid.d.ts.map +1 -1
package/dist/core/configurators/slash/droid.js +2 -32
package/dist/core/configurators/slash/droid.js.map +1 -1
package/dist/core/configurators/slash/forge.d.ts +2 -5
package/dist/core/configurators/slash/forge.d.ts.map +1 -1
package/dist/core/configurators/slash/forge.js +2 -32
package/dist/core/configurators/slash/forge.js.map +1 -1
package/dist/core/configurators/slash/github-copilot.d.ts +2 -7
package/dist/core/configurators/slash/github-copilot.d.ts.map +1 -1
package/dist/core/configurators/slash/github-copilot.js +2 -96
package/dist/core/configurators/slash/github-copilot.js.map +1 -1
package/dist/core/configurators/slash/index.d.ts +1 -1
package/dist/core/configurators/slash/index.d.ts.map +1 -1
package/dist/core/configurators/slash/index.js +1 -1
package/dist/core/configurators/slash/index.js.map +1 -1
package/dist/core/configurators/slash/kilocode.d.ts +2 -5
package/dist/core/configurators/slash/kilocode.d.ts.map +1 -1
package/dist/core/configurators/slash/kilocode.js +2 -57
package/dist/core/configurators/slash/kilocode.js.map +1 -1
package/dist/core/configurators/slash/opencode.d.ts +2 -5
package/dist/core/configurators/slash/opencode.d.ts.map +1 -1
package/dist/core/configurators/slash/opencode.js +2 -57
package/dist/core/configurators/slash/opencode.js.map +1 -1
package/dist/core/configurators/slash/registry.d.ts +4 -4
package/dist/core/configurators/slash/registry.d.ts.map +1 -1
package/dist/core/configurators/slash/registry.js.map +1 -1
package/dist/core/registry.d.ts +18 -0
package/dist/core/registry.d.ts.map +1 -0
package/dist/core/registry.js +94 -0
package/dist/core/registry.js.map +1 -0
package/dist/core/templates/index.d.ts +0 -1
package/dist/core/templates/index.d.ts.map +1 -1
package/dist/core/templates/index.js +0 -1
package/dist/core/templates/index.js.map +1 -1
package/package.json +7 -1
package/AGENTS.md +0 -123
package/CLAUDE.md +0 -17
package/build.js +0 -20
package/convex-setup.md +0 -403
package/dist/core/templates/slash-command-templates.d.ts +0 -7
package/dist/core/templates/slash-command-templates.d.ts.map +0 -1
package/dist/core/templates/slash-command-templates.js +0 -1041
package/dist/core/templates/slash-command-templates.js.map +0 -1
package/prompt/ai-humanizer.md +0 -45
package/prompt/api-contract-generator.md +0 -234
package/prompt/apply.md +0 -17
package/prompt/archive.md +0 -21
package/prompt/design-system.md +0 -210
package/prompt/document-explainer.md +0 -149
package/prompt/epic-generator.md +0 -198
package/prompt/epic-single.md +0 -47
package/prompt/erd-generator.md +0 -130
package/prompt/fsd-generator.md +0 -157
package/prompt/prd-agent-generator.md +0 -147
package/prompt/prd-generator.md +0 -195
package/prompt/product-brief.md +0 -289
package/prompt/proposal.md +0 -22
package/prompt/qa-test-scenario.md +0 -133
package/prompt/skill-creator.md +0 -350
package/prompt/story-generator.md +0 -278
package/prompt/story-single.md +0 -70
package/prompt/tdd-generator.md +0 -294
package/prompt/tdd-lite-generator.md +0 -224
package/prompt/wireframe-generator.md +0 -219
package/skills/ai-context-generator/SKILL.md +0 -54
package/skills/ai-context-generator/references/AGENTS.template.md +0 -83
package/skills/ai-context-generator/references/CLAUDE.template.md +0 -39
package/skills/ai-context-generator/references/behavioral-guidelines.md +0 -71
package/skills/ai-context-generator/references/discovery-checklist.md +0 -40
package/skills/ai-context-generator/references/examples/AGENTS.good.md +0 -103
package/skills/ai-context-generator/references/extraction-checklist.md +0 -23
package/skills/ai-context-generator/references/overlays/laravel.md +0 -44
package/skills/cerebro/SKILL.md +0 -187
package/skills/cerebro/references/agents.md +0 -213
package/skills/code-review/SKILL.md +0 -373
package/skills/code-review/assets/report-template-agent.md +0 -212
package/skills/code-review/assets/report-template-compact.md +0 -81
package/skills/code-review/assets/report-template-full.md +0 -264
package/skills/code-review/assets/report-template-human.md +0 -168
package/skills/code-review/references/universal-patterns.md +0 -495
package/skills/design-md/README.md +0 -34
package/skills/design-md/SKILL.md +0 -172
package/skills/design-md/examples/DESIGN.md +0 -154
package/skills/design-system-generator/SKILL.md +0 -324
package/skills/design-system-generator/assets/design-system-template.md +0 -348
package/skills/design-system-generator/references/extraction-patterns.md +0 -321
package/skills/doc-builder/SKILL.md +0 -115
package/skills/doc-builder/references/ui-patterns.md +0 -394
package/skills/document-translator/SKILL.md +0 -58
package/skills/enhance-prompt/README.md +0 -34
package/skills/enhance-prompt/SKILL.md +0 -204
package/skills/enhance-prompt/references/KEYWORDS.md +0 -114
package/skills/feature-planner/SKILL.md +0 -305
package/skills/feature-planner/assets/implementation-plan-template.md +0 -85
package/skills/frontend-design/LICENSE.txt +0 -177
package/skills/frontend-design/SKILL.md +0 -42
package/skills/gamma-builder/SKILL.md +0 -134
package/skills/laravel-code-review/SKILL.md +0 -383
package/skills/laravel-code-review/assets/report-template-agent.md +0 -195
package/skills/laravel-code-review/assets/report-template-compact.md +0 -79
package/skills/laravel-code-review/assets/report-template-full.md +0 -253
package/skills/laravel-code-review/assets/report-template-human.md +0 -159
package/skills/laravel-code-review/references/laravel-patterns.md +0 -571
package/skills/laravel-code-review/references/php84-features.md +0 -442
package/skills/mcp-builder/LICENSE.txt +0 -202
package/skills/mcp-builder/SKILL.md +0 -236
package/skills/mcp-builder/reference/evaluation.md +0 -602
package/skills/mcp-builder/reference/mcp_best_practices.md +0 -249
package/skills/mcp-builder/reference/node_mcp_server.md +0 -970
package/skills/mcp-builder/reference/python_mcp_server.md +0 -719
package/skills/mcp-builder/scripts/connections.py +0 -151
package/skills/mcp-builder/scripts/evaluation.py +0 -373
package/skills/mcp-builder/scripts/example_evaluation.xml +0 -22
package/skills/mcp-builder/scripts/requirements.txt +0 -2
package/skills/meeting-notes/SKILL.md +0 -159
package/skills/meeting-notes/evals/evals.json +0 -23
package/skills/project-orchestrator/SKILL.md +0 -487
package/skills/project-orchestrator/assets/caddy-vps-setup.md +0 -180
package/skills/project-orchestrator/assets/plan-summary-template.md +0 -159
package/skills/prompter-specs/SKILL.md +0 -115
package/skills/prompter-workflow/SKILL.md +0 -166
package/skills/prompter-workflow/evals/evals.json +0 -89
package/skills/sph-generator/SKILL.md +0 -488
package/skills/ui-ux-pro/SKILL.md +0 -199
package/skills/ui-ux-pro/assets/design-spec-template.md +0 -173
package/skills/ui-ux-pro/references/component-patterns.md +0 -255
package/skills/ui-ux-pro/references/design-principles.md +0 -167
package/src/cli/index.ts +0 -223
package/src/commands/archive.ts +0 -302
package/src/commands/change.ts +0 -292
package/src/commands/config.ts +0 -233
package/src/commands/guide.ts +0 -50
package/src/commands/init.ts +0 -899
package/src/commands/list.ts +0 -194
package/src/commands/show.ts +0 -138
package/src/commands/spec.ts +0 -251
package/src/commands/update.ts +0 -156
package/src/commands/upgrade.ts +0 -30
package/src/commands/validate.ts +0 -326
package/src/core/artifact-graph/graph.ts +0 -167
package/src/core/artifact-graph/index.ts +0 -44
package/src/core/artifact-graph/instruction-loader.ts +0 -302
package/src/core/artifact-graph/resolver.ts +0 -226
package/src/core/artifact-graph/schema.ts +0 -124
package/src/core/artifact-graph/state.ts +0 -64
package/src/core/artifact-graph/types.ts +0 -65
package/src/core/completions/command-registry.ts +0 -382
package/src/core/completions/completion-provider.ts +0 -128
package/src/core/completions/generators/bash-generator.ts +0 -191
package/src/core/completions/generators/fish-generator.ts +0 -188
package/src/core/completions/generators/powershell-generator.ts +0 -223
package/src/core/completions/generators/zsh-generator.ts +0 -281
package/src/core/completions/templates/bash-templates.ts +0 -24
package/src/core/completions/templates/fish-templates.ts +0 -40
package/src/core/completions/templates/powershell-templates.ts +0 -25
package/src/core/completions/templates/zsh-templates.ts +0 -36
package/src/core/completions/types.ts +0 -90
package/src/core/config-schema.ts +0 -230
package/src/core/config.ts +0 -181
package/src/core/configurators/slash/antigravity.ts +0 -70
package/src/core/configurators/slash/base.ts +0 -203
package/src/core/configurators/slash/claude.ts +0 -70
package/src/core/configurators/slash/codex.ts +0 -70
package/src/core/configurators/slash/droid.ts +0 -44
package/src/core/configurators/slash/forge.ts +0 -44
package/src/core/configurators/slash/github-copilot.ts +0 -114
package/src/core/configurators/slash/index.ts +0 -10
package/src/core/configurators/slash/kilocode.ts +0 -70
package/src/core/configurators/slash/opencode.ts +0 -70
package/src/core/configurators/slash/registry.ts +0 -51
package/src/core/converters/json-converter.ts +0 -62
package/src/core/global-config.ts +0 -136
package/src/core/parsers/change-parser.ts +0 -234
package/src/core/parsers/markdown-parser.ts +0 -237
package/src/core/parsers/requirement-blocks.ts +0 -234
package/src/core/prompt-templates.ts +0 -3504
package/src/core/schemas/base.schema.ts +0 -20
package/src/core/schemas/change.schema.ts +0 -42
package/src/core/schemas/index.ts +0 -20
package/src/core/schemas/spec.schema.ts +0 -17
package/src/core/skill-discovery.ts +0 -68
package/src/core/specs-apply.ts +0 -483
package/src/core/styles/palette.ts +0 -8
package/src/core/templates/agents-template.ts +0 -459
package/src/core/templates/claude-template.ts +0 -2
package/src/core/templates/index.ts +0 -4
package/src/core/templates/project-template.ts +0 -32
package/src/core/templates/slash-command-templates.ts +0 -1068
package/src/core/validation/constants.ts +0 -48
package/src/core/validation/types.ts +0 -19
package/src/core/validation/validator.ts +0 -449
package/src/core/view.ts +0 -219
package/src/index.ts +0 -1
package/src/utils/change-metadata.ts +0 -171
package/src/utils/change-utils.ts +0 -131
package/src/utils/file-system.ts +0 -252
package/src/utils/index.ts +0 -12
package/src/utils/interactive.ts +0 -29
package/src/utils/item-discovery.ts +0 -66
package/src/utils/match.ts +0 -26
package/src/utils/shell-detection.ts +0 -62
package/src/utils/task-progress.ts +0 -43
package/tsconfig.json +0 -28

package/skills/mcp-builder/scripts/connections.py DELETED Viewed

@@ -1,151 +0,0 @@
-"""Lightweight connection handling for MCP servers."""
-from abc import ABC, abstractmethod
-from contextlib import AsyncExitStack
-from typing import Any
-from mcp import ClientSession, StdioServerParameters
-from mcp.client.sse import sse_client
-from mcp.client.stdio import stdio_client
-from mcp.client.streamable_http import streamablehttp_client
-class MCPConnection(ABC):
-    """Base class for MCP server connections."""
-    def __init__(self):
-        self.session = None
-        self._stack = None
-    @abstractmethod
-    def _create_context(self):
-        """Create the connection context based on connection type."""
-    async def __aenter__(self):
-        """Initialize MCP server connection."""
-        self._stack = AsyncExitStack()
-        await self._stack.__aenter__()
-        try:
-            ctx = self._create_context()
-            result = await self._stack.enter_async_context(ctx)
-            if len(result) == 2:
-                read, write = result
-            elif len(result) == 3:
-                read, write, _ = result
-            else:
-                raise ValueError(f"Unexpected context result: {result}")
-            session_ctx = ClientSession(read, write)
-            self.session = await self._stack.enter_async_context(session_ctx)
-            await self.session.initialize()
-            return self
-        except BaseException:
-            await self._stack.__aexit__(None, None, None)
-            raise
-    async def __aexit__(self, exc_type, exc_val, exc_tb):
-        """Clean up MCP server connection resources."""
-        if self._stack:
-            await self._stack.__aexit__(exc_type, exc_val, exc_tb)
-        self.session = None
-        self._stack = None
-    async def list_tools(self) -> list[dict[str, Any]]:
-        """Retrieve available tools from the MCP server."""
-        response = await self.session.list_tools()
-        return [
-            {
-                "name": tool.name,
-                "description": tool.description,
-                "input_schema": tool.inputSchema,
-            }
-            for tool in response.tools
-        ]
-    async def call_tool(self, tool_name: str, arguments: dict[str, Any]) -> Any:
-        """Call a tool on the MCP server with provided arguments."""
-        result = await self.session.call_tool(tool_name, arguments=arguments)
-        return result.content
-class MCPConnectionStdio(MCPConnection):
-    """MCP connection using standard input/output."""
-    def __init__(self, command: str, args: list[str] = None, env: dict[str, str] = None):
-        super().__init__()
-        self.command = command
-        self.args = args or []
-        self.env = env
-    def _create_context(self):
-        return stdio_client(
-            StdioServerParameters(command=self.command, args=self.args, env=self.env)
-        )
-class MCPConnectionSSE(MCPConnection):
-    """MCP connection using Server-Sent Events."""
-    def __init__(self, url: str, headers: dict[str, str] = None):
-        super().__init__()
-        self.url = url
-        self.headers = headers or {}
-    def _create_context(self):
-        return sse_client(url=self.url, headers=self.headers)
-class MCPConnectionHTTP(MCPConnection):
-    """MCP connection using Streamable HTTP."""
-    def __init__(self, url: str, headers: dict[str, str] = None):
-        super().__init__()
-        self.url = url
-        self.headers = headers or {}
-    def _create_context(self):
-        return streamablehttp_client(url=self.url, headers=self.headers)
-def create_connection(
-    transport: str,
-    command: str = None,
-    args: list[str] = None,
-    env: dict[str, str] = None,
-    url: str = None,
-    headers: dict[str, str] = None,
-) -> MCPConnection:
-    """Factory function to create the appropriate MCP connection.
-    Args:
-        transport: Connection type ("stdio", "sse", or "http")
-        command: Command to run (stdio only)
-        args: Command arguments (stdio only)
-        env: Environment variables (stdio only)
-        url: Server URL (sse and http only)
-        headers: HTTP headers (sse and http only)
-    Returns:
-        MCPConnection instance
-    """
-    transport = transport.lower()
-    if transport == "stdio":
-        if not command:
-            raise ValueError("Command is required for stdio transport")
-        return MCPConnectionStdio(command=command, args=args, env=env)
-    elif transport == "sse":
-        if not url:
-            raise ValueError("URL is required for sse transport")
-        return MCPConnectionSSE(url=url, headers=headers)
-    elif transport in ["http", "streamable_http", "streamable-http"]:
-        if not url:
-            raise ValueError("URL is required for http transport")
-        return MCPConnectionHTTP(url=url, headers=headers)
-    else:
-        raise ValueError(f"Unsupported transport type: {transport}. Use 'stdio', 'sse', or 'http'")

package/skills/mcp-builder/scripts/evaluation.py DELETED Viewed

@@ -1,373 +0,0 @@
-"""MCP Server Evaluation Harness
-This script evaluates MCP servers by running test questions against them using Claude.
-"""
-import argparse
-import asyncio
-import json
-import re
-import sys
-import time
-import traceback
-import xml.etree.ElementTree as ET
-from pathlib import Path
-from typing import Any
-from anthropic import Anthropic
-from connections import create_connection
-EVALUATION_PROMPT = """You are an AI assistant with access to tools.
-When given a task, you MUST:
-1. Use the available tools to complete the task
-2. Provide summary of each step in your approach, wrapped in <summary> tags
-3. Provide feedback on the tools provided, wrapped in <feedback> tags
-4. Provide your final response, wrapped in <response> tags
-Summary Requirements:
-- In your <summary> tags, you must explain:
-  - The steps you took to complete the task
-  - Which tools you used, in what order, and why
-  - The inputs you provided to each tool
-  - The outputs you received from each tool
-  - A summary for how you arrived at the response
-Feedback Requirements:
-- In your <feedback> tags, provide constructive feedback on the tools:
-  - Comment on tool names: Are they clear and descriptive?
-  - Comment on input parameters: Are they well-documented? Are required vs optional parameters clear?
-  - Comment on descriptions: Do they accurately describe what the tool does?
-  - Comment on any errors encountered during tool usage: Did the tool fail to execute? Did the tool return too many tokens?
-  - Identify specific areas for improvement and explain WHY they would help
-  - Be specific and actionable in your suggestions
-Response Requirements:
-- Your response should be concise and directly address what was asked
-- Always wrap your final response in <response> tags
-- If you cannot solve the task return <response>NOT_FOUND</response>
-- For numeric responses, provide just the number
-- For IDs, provide just the ID
-- For names or text, provide the exact text requested
-- Your response should go last"""
-def parse_evaluation_file(file_path: Path) -> list[dict[str, Any]]:
-    """Parse XML evaluation file with qa_pair elements."""
-    try:
-        tree = ET.parse(file_path)
-        root = tree.getroot()
-        evaluations = []
-        for qa_pair in root.findall(".//qa_pair"):
-            question_elem = qa_pair.find("question")
-            answer_elem = qa_pair.find("answer")
-            if question_elem is not None and answer_elem is not None:
-                evaluations.append({
-                    "question": (question_elem.text or "").strip(),
-                    "answer": (answer_elem.text or "").strip(),
-                })
-        return evaluations
-    except Exception as e:
-        print(f"Error parsing evaluation file {file_path}: {e}")
-        return []
-def extract_xml_content(text: str, tag: str) -> str | None:
-    """Extract content from XML tags."""
-    pattern = rf"<{tag}>(.*?)</{tag}>"
-    matches = re.findall(pattern, text, re.DOTALL)
-    return matches[-1].strip() if matches else None
-async def agent_loop(
-    client: Anthropic,
-    model: str,
-    question: str,
-    tools: list[dict[str, Any]],
-    connection: Any,
-) -> tuple[str, dict[str, Any]]:
-    """Run the agent loop with MCP tools."""
-    messages = [{"role": "user", "content": question}]
-    response = await asyncio.to_thread(
-        client.messages.create,
-        model=model,
-        max_tokens=4096,
-        system=EVALUATION_PROMPT,
-        messages=messages,
-        tools=tools,
-    )
-    messages.append({"role": "assistant", "content": response.content})
-    tool_metrics = {}
-    while response.stop_reason == "tool_use":
-        tool_use = next(block for block in response.content if block.type == "tool_use")
-        tool_name = tool_use.name
-        tool_input = tool_use.input
-        tool_start_ts = time.time()
-        try:
-            tool_result = await connection.call_tool(tool_name, tool_input)
-            tool_response = json.dumps(tool_result) if isinstance(tool_result, (dict, list)) else str(tool_result)
-        except Exception as e:
-            tool_response = f"Error executing tool {tool_name}: {str(e)}\n"
-            tool_response += traceback.format_exc()
-        tool_duration = time.time() - tool_start_ts
-        if tool_name not in tool_metrics:
-            tool_metrics[tool_name] = {"count": 0, "durations": []}
-        tool_metrics[tool_name]["count"] += 1
-        tool_metrics[tool_name]["durations"].append(tool_duration)
-        messages.append({
-            "role": "user",
-            "content": [{
-                "type": "tool_result",
-                "tool_use_id": tool_use.id,
-                "content": tool_response,
-            }]
-        })
-        response = await asyncio.to_thread(
-            client.messages.create,
-            model=model,
-            max_tokens=4096,
-            system=EVALUATION_PROMPT,
-            messages=messages,
-            tools=tools,
-        )
-        messages.append({"role": "assistant", "content": response.content})
-    response_text = next(
-        (block.text for block in response.content if hasattr(block, "text")),
-        None,
-    )
-    return response_text, tool_metrics
-async def evaluate_single_task(
-    client: Anthropic,
-    model: str,
-    qa_pair: dict[str, Any],
-    tools: list[dict[str, Any]],
-    connection: Any,
-    task_index: int,
-) -> dict[str, Any]:
-    """Evaluate a single QA pair with the given tools."""
-    start_time = time.time()
-    print(f"Task {task_index + 1}: Running task with question: {qa_pair['question']}")
-    response, tool_metrics = await agent_loop(client, model, qa_pair["question"], tools, connection)
-    response_value = extract_xml_content(response, "response")
-    summary = extract_xml_content(response, "summary")
-    feedback = extract_xml_content(response, "feedback")
-    duration_seconds = time.time() - start_time
-    return {
-        "question": qa_pair["question"],
-        "expected": qa_pair["answer"],
-        "actual": response_value,
-        "score": int(response_value == qa_pair["answer"]) if response_value else 0,
-        "total_duration": duration_seconds,
-        "tool_calls": tool_metrics,
-        "num_tool_calls": sum(len(metrics["durations"]) for metrics in tool_metrics.values()),
-        "summary": summary,
-        "feedback": feedback,
-    }
-REPORT_HEADER = """
-# Evaluation Report
-## Summary
-- **Accuracy**: {correct}/{total} ({accuracy:.1f}%)
-- **Average Task Duration**: {average_duration_s:.2f}s
-- **Average Tool Calls per Task**: {average_tool_calls:.2f}
-- **Total Tool Calls**: {total_tool_calls}
----
-"""
-TASK_TEMPLATE = """
-### Task {task_num}
-**Question**: {question}
-**Ground Truth Answer**: `{expected_answer}`
-**Actual Answer**: `{actual_answer}`
-**Correct**: {correct_indicator}
-**Duration**: {total_duration:.2f}s
-**Tool Calls**: {tool_calls}
-**Summary**
-{summary}
-**Feedback**
-{feedback}
----
-"""
-async def run_evaluation(
-    eval_path: Path,
-    connection: Any,
-    model: str = "claude-3-7-sonnet-20250219",
-) -> str:
-    """Run evaluation with MCP server tools."""
-    print("🚀 Starting Evaluation")
-    client = Anthropic()
-    tools = await connection.list_tools()
-    print(f"📋 Loaded {len(tools)} tools from MCP server")
-    qa_pairs = parse_evaluation_file(eval_path)
-    print(f"📋 Loaded {len(qa_pairs)} evaluation tasks")
-    results = []
-    for i, qa_pair in enumerate(qa_pairs):
-        print(f"Processing task {i + 1}/{len(qa_pairs)}")
-        result = await evaluate_single_task(client, model, qa_pair, tools, connection, i)
-        results.append(result)
-    correct = sum(r["score"] for r in results)
-    accuracy = (correct / len(results)) * 100 if results else 0
-    average_duration_s = sum(r["total_duration"] for r in results) / len(results) if results else 0
-    average_tool_calls = sum(r["num_tool_calls"] for r in results) / len(results) if results else 0
-    total_tool_calls = sum(r["num_tool_calls"] for r in results)
-    report = REPORT_HEADER.format(
-        correct=correct,
-        total=len(results),
-        accuracy=accuracy,
-        average_duration_s=average_duration_s,
-        average_tool_calls=average_tool_calls,
-        total_tool_calls=total_tool_calls,
-    )
-    report += "".join([
-        TASK_TEMPLATE.format(
-            task_num=i + 1,
-            question=qa_pair["question"],
-            expected_answer=qa_pair["answer"],
-            actual_answer=result["actual"] or "N/A",
-            correct_indicator="✅" if result["score"] else "❌",
-            total_duration=result["total_duration"],
-            tool_calls=json.dumps(result["tool_calls"], indent=2),
-            summary=result["summary"] or "N/A",
-            feedback=result["feedback"] or "N/A",
-        )
-        for i, (qa_pair, result) in enumerate(zip(qa_pairs, results))
-    ])
-    return report
-def parse_headers(header_list: list[str]) -> dict[str, str]:
-    """Parse header strings in format 'Key: Value' into a dictionary."""
-    headers = {}
-    if not header_list:
-        return headers
-    for header in header_list:
-        if ":" in header:
-            key, value = header.split(":", 1)
-            headers[key.strip()] = value.strip()
-        else:
-            print(f"Warning: Ignoring malformed header: {header}")
-    return headers
-def parse_env_vars(env_list: list[str]) -> dict[str, str]:
-    """Parse environment variable strings in format 'KEY=VALUE' into a dictionary."""
-    env = {}
-    if not env_list:
-        return env
-    for env_var in env_list:
-        if "=" in env_var:
-            key, value = env_var.split("=", 1)
-            env[key.strip()] = value.strip()
-        else:
-            print(f"Warning: Ignoring malformed environment variable: {env_var}")
-    return env
-async def main():
-    parser = argparse.ArgumentParser(
-        description="Evaluate MCP servers using test questions",
-        formatter_class=argparse.RawDescriptionHelpFormatter,
-        epilog="""
-Examples:
-  # Evaluate a local stdio MCP server
-  python evaluation.py -t stdio -c python -a my_server.py eval.xml
-  # Evaluate an SSE MCP server
-  python evaluation.py -t sse -u https://example.com/mcp -H "Authorization: Bearer token" eval.xml
-  # Evaluate an HTTP MCP server with custom model
-  python evaluation.py -t http -u https://example.com/mcp -m claude-3-5-sonnet-20241022 eval.xml
-        """,
-    )
-    parser.add_argument("eval_file", type=Path, help="Path to evaluation XML file")
-    parser.add_argument("-t", "--transport", choices=["stdio", "sse", "http"], default="stdio", help="Transport type (default: stdio)")
-    parser.add_argument("-m", "--model", default="claude-3-7-sonnet-20250219", help="Claude model to use (default: claude-3-7-sonnet-20250219)")
-    stdio_group = parser.add_argument_group("stdio options")
-    stdio_group.add_argument("-c", "--command", help="Command to run MCP server (stdio only)")
-    stdio_group.add_argument("-a", "--args", nargs="+", help="Arguments for the command (stdio only)")
-    stdio_group.add_argument("-e", "--env", nargs="+", help="Environment variables in KEY=VALUE format (stdio only)")
-    remote_group = parser.add_argument_group("sse/http options")
-    remote_group.add_argument("-u", "--url", help="MCP server URL (sse/http only)")
-    remote_group.add_argument("-H", "--header", nargs="+", dest="headers", help="HTTP headers in 'Key: Value' format (sse/http only)")
-    parser.add_argument("-o", "--output", type=Path, help="Output file for evaluation report (default: stdout)")
-    args = parser.parse_args()
-    if not args.eval_file.exists():
-        print(f"Error: Evaluation file not found: {args.eval_file}")
-        sys.exit(1)
-    headers = parse_headers(args.headers) if args.headers else None
-    env_vars = parse_env_vars(args.env) if args.env else None
-    try:
-        connection = create_connection(
-            transport=args.transport,
-            command=args.command,
-            args=args.args,
-            env=env_vars,
-            url=args.url,
-            headers=headers,
-        )
-    except ValueError as e:
-        print(f"Error: {e}")
-        sys.exit(1)
-    print(f"🔗 Connecting to MCP server via {args.transport}...")
-    async with connection:
-        print("✅ Connected successfully")
-        report = await run_evaluation(args.eval_file, connection, args.model)
-        if args.output:
-            args.output.write_text(report)
-            print(f"\n✅ Report saved to {args.output}")
-        else:
-            print("\n" + report)
-if __name__ == "__main__":
-    asyncio.run(main())

package/skills/mcp-builder/scripts/example_evaluation.xml DELETED Viewed

@@ -1,22 +0,0 @@
-<evaluation>
-   <qa_pair>
-      <question>Calculate the compound interest on $10,000 invested at 5% annual interest rate, compounded monthly for 3 years. What is the final amount in dollars (rounded to 2 decimal places)?</question>
-      <answer>11614.72</answer>
-   </qa_pair>
-   <qa_pair>
-      <question>A projectile is launched at a 45-degree angle with an initial velocity of 50 m/s. Calculate the total distance (in meters) it has traveled from the launch point after 2 seconds, assuming g=9.8 m/s². Round to 2 decimal places.</question>
-      <answer>87.25</answer>
-   </qa_pair>
-   <qa_pair>
-      <question>A sphere has a volume of 500 cubic meters. Calculate its surface area in square meters. Round to 2 decimal places.</question>
-      <answer>304.65</answer>
-   </qa_pair>
-   <qa_pair>
-      <question>Calculate the population standard deviation of this dataset: [12, 15, 18, 22, 25, 30, 35]. Round to 2 decimal places.</question>
-      <answer>7.61</answer>
-   </qa_pair>
-   <qa_pair>
-      <question>Calculate the pH of a solution with a hydrogen ion concentration of 3.5 × 10^-5 M. Round to 2 decimal places.</question>
-      <answer>4.46</answer>
-   </qa_pair>
-</evaluation>

package/skills/mcp-builder/scripts/requirements.txt DELETED Viewed

@@ -1,2 +0,0 @@
-anthropic>=0.39.0
-mcp>=1.1.0