PyPI - skilllite - Versions diffs - 0.1.0__py3-none-any.whl → 0.1.2__py3-none-any.whl - Mend

skilllite 0.1.0__py3-none-any.whl → 0.1.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31) hide show

skilllite/__init__.py +1 -1
skilllite/cli/__init__.py +19 -0
skilllite/cli/__main__.py +10 -0
skilllite/cli/binary.py +93 -0
skilllite/cli/integrations/__init__.py +8 -0
skilllite/cli/integrations/opencode.py +316 -0
skilllite/cli/main.py +142 -0
skilllite/cli/mcp.py +29 -0
skilllite/core/__init__.py +2 -0
skilllite/core/adapters/__init__.py +74 -0
skilllite/core/adapters/langchain.py +362 -0
skilllite/core/adapters/llamaindex.py +264 -0
skilllite/core/handler.py +179 -4
skilllite/core/loops.py +180 -15
skilllite/core/manager.py +82 -15
skilllite/core/metadata.py +14 -7
skilllite/core/security.py +420 -0
skilllite/mcp/server.py +537 -49
skilllite/quick.py +14 -4
skilllite/sandbox/context.py +155 -0
skilllite/sandbox/execution_service.py +254 -0
skilllite/sandbox/skillbox/executor.py +124 -19
skilllite/sandbox/unified_executor.py +359 -0
{skilllite-0.1.0.dist-info → skilllite-0.1.2.dist-info}/METADATA +151 -1
skilllite-0.1.2.dist-info/RECORD +45 -0
skilllite/cli.py +0 -217
skilllite-0.1.0.dist-info/RECORD +0 -32
{skilllite-0.1.0.dist-info → skilllite-0.1.2.dist-info}/WHEEL +0 -0
{skilllite-0.1.0.dist-info → skilllite-0.1.2.dist-info}/entry_points.txt +0 -0
{skilllite-0.1.0.dist-info → skilllite-0.1.2.dist-info}/licenses/LICENSE +0 -0
{skilllite-0.1.0.dist-info → skilllite-0.1.2.dist-info}/top_level.txt +0 -0

skilllite/core/handler.py CHANGED Viewed

@@ -5,16 +5,22 @@ This module handles:
 - Parsing tool calls from LLM responses
 - Executing tool calls
 - Formatting tool results
+Updated to support UnifiedExecutionService for consistent sandbox level handling.
 """
 import json
-from typing import Any, Dict, List, Optional, TYPE_CHECKING
+from typing import Any, Callable, Dict, List, Optional, TYPE_CHECKING
 from .executor import ExecutionResult, SkillExecutor
 from .tools import ToolResult, ToolUseRequest
 if TYPE_CHECKING:
     from .registry import SkillRegistry
+    from ..sandbox.execution_service import UnifiedExecutionService
+# Type alias for confirmation callback
+ConfirmationCallback = Callable[[str, str], bool]
 class ToolCallHandler:
@@ -95,7 +101,71 @@ class ToolCallHandler:
             allow_network=allow_network,
             timeout=timeout
         )
+    def execute_with_unified_service(
+        self,
+        skill_name: str,
+        input_data: Dict[str, Any],
+        confirmation_callback: Optional[ConfirmationCallback] = None,
+        allow_network: Optional[bool] = None,
+        timeout: Optional[int] = None
+    ) -> ExecutionResult:
+        """
+        Execute a skill using the UnifiedExecutionService.
+        This method uses the unified execution layer which:
+        1. Reads sandbox level at runtime (not from instance variables)
+        2. Handles security scanning and confirmation
+        3. Properly downgrades sandbox level after confirmation
+        Args:
+            skill_name: Name of the skill or multi-script tool
+            input_data: Input data for the skill
+            confirmation_callback: Callback for security confirmation
+            allow_network: Whether to allow network access
+            timeout: Execution timeout in seconds
+        Returns:
+            ExecutionResult with output or error
+        """
+        from ..sandbox.execution_service import UnifiedExecutionService
+        service = UnifiedExecutionService.get_instance()
+        # Check if it's a multi-script tool
+        tool_info = self._registry.get_multi_script_tool_info(skill_name)
+        if tool_info:
+            parent_skill = self._registry.get_skill(tool_info["skill_name"])
+            if not parent_skill:
+                return ExecutionResult(
+                    success=False,
+                    error=f"Parent skill not found: {tool_info['skill_name']}"
+                )
+            return service.execute_skill(
+                skill_info=parent_skill,
+                input_data=input_data,
+                entry_point=tool_info["script_path"],
+                confirmation_callback=confirmation_callback,
+                allow_network=allow_network,
+                timeout=timeout,
+            )
+        # Regular skill execution
+        info = self._registry.get_skill(skill_name)
+        if not info:
+            return ExecutionResult(
+                success=False,
+                error=f"Skill not found: {skill_name}"
+            )
+        return service.execute_skill(
+            skill_info=info,
+            input_data=input_data,
+            confirmation_callback=confirmation_callback,
+            allow_network=allow_network,
+            timeout=timeout,
+        )
     def execute_tool_call(
         self,
         request: ToolUseRequest,
@@ -130,7 +200,45 @@ class ToolCallHandler:
                 tool_use_id=request.id,
                 error=result.error or "Unknown error"
             )
+    def execute_tool_call_with_unified_service(
+        self,
+        request: ToolUseRequest,
+        confirmation_callback: Optional[ConfirmationCallback] = None,
+        allow_network: Optional[bool] = None,
+        timeout: Optional[int] = None
+    ) -> ToolResult:
+        """
+        Execute a tool call using the UnifiedExecutionService.
+        Args:
+            request: Tool use request from LLM
+            confirmation_callback: Callback for security confirmation
+            allow_network: Whether to allow network access
+            timeout: Execution timeout in seconds
+        Returns:
+            ToolResult with success or error
+        """
+        result = self.execute_with_unified_service(
+            skill_name=request.name,
+            input_data=request.input,
+            confirmation_callback=confirmation_callback,
+            allow_network=allow_network,
+            timeout=timeout
+        )
+        if result.success:
+            return ToolResult.success(
+                tool_use_id=request.id,
+                content=result.output
+            )
+        else:
+            return ToolResult.error(
+                tool_use_id=request.id,
+                error=result.error or "Unknown error"
+            )
     # ==================== LLM Response Parsing ====================
     def parse_tool_calls(self, response: Any) -> List[ToolUseRequest]:
@@ -186,7 +294,74 @@ class ToolCallHandler:
             )
             results.append(result)
         return results
+    def handle_tool_calls_with_unified_service(
+        self,
+        response: Any,
+        confirmation_callback: Optional[ConfirmationCallback] = None,
+        allow_network: Optional[bool] = None,
+        timeout: Optional[int] = None
+    ) -> List[ToolResult]:
+        """
+        Parse and execute all tool calls using UnifiedExecutionService.
+        This method uses the unified execution layer which:
+        1. Reads sandbox level at runtime
+        2. Handles security scanning and confirmation per-skill
+        3. Properly downgrades sandbox level after confirmation
+        Args:
+            response: Response from OpenAI-compatible API
+            confirmation_callback: Callback for security confirmation
+            allow_network: Whether to allow network access
+            timeout: Execution timeout in seconds
+        Returns:
+            List of ToolResult objects
+        """
+        requests = self.parse_tool_calls(response)
+        results = []
+        for request in requests:
+            result = self.execute_tool_call_with_unified_service(
+                request,
+                confirmation_callback=confirmation_callback,
+                allow_network=allow_network,
+                timeout=timeout
+            )
+            results.append(result)
+        return results
+    def handle_tool_calls_claude_native_with_unified_service(
+        self,
+        response: Any,
+        confirmation_callback: Optional[ConfirmationCallback] = None,
+        allow_network: Optional[bool] = None,
+        timeout: Optional[int] = None
+    ) -> List[ToolResult]:
+        """
+        Parse and execute all Claude tool calls using UnifiedExecutionService.
+        Args:
+            response: Response from Claude's native API
+            confirmation_callback: Callback for security confirmation
+            allow_network: Whether to allow network access
+            timeout: Execution timeout in seconds
+        Returns:
+            List of ToolResult objects
+        """
+        requests = self.parse_tool_calls_claude_native(response)
+        results = []
+        for request in requests:
+            result = self.execute_tool_call_with_unified_service(
+                request,
+                confirmation_callback=confirmation_callback,
+                allow_network=allow_network,
+                timeout=timeout
+            )
+            results.append(result)
+        return results
     def handle_tool_calls_claude_native(
         self,
         response: Any,

skilllite/core/loops.py CHANGED Viewed

@@ -56,11 +56,12 @@ class AgenticLoop:
         custom_tool_handler: Optional[Callable] = None,
         enable_task_planning: bool = True,
         verbose: bool = True,
+        confirmation_callback: Optional[Callable[[str, str], bool]] = None,
         **kwargs
     ):
         """
         Initialize the agentic loop.
         Args:
             manager: SkillManager instance
             client: LLM client (OpenAI or Anthropic)
@@ -71,6 +72,9 @@ class AgenticLoop:
             custom_tool_handler: Optional custom tool handler function
             enable_task_planning: Whether to generate task list before execution
             verbose: Whether to print detailed logs
+            confirmation_callback: Callback for security confirmation (sandbox_level=3).
+                Signature: (security_report: str, scan_id: str) -> bool
+                If None and sandbox_level=3, will use interactive terminal confirmation.
             **kwargs: Additional arguments passed to the LLM
         """
         self.manager = manager
@@ -82,14 +86,157 @@ class AgenticLoop:
         self.custom_tool_handler = custom_tool_handler
         self.enable_task_planning = enable_task_planning
         self.verbose = verbose
+        self.confirmation_callback = confirmation_callback
         self.extra_kwargs = kwargs
         self.task_list: List[Dict] = []
+        # Initialize security scanner for sandbox_level=3
+        self._security_scanner = None
+        self._pending_confirmation = False  # Track if confirmation is pending
     def _log(self, message: str) -> None:
         """Print log message if verbose mode is enabled."""
         if self.verbose:
             print(message)
+    def _get_security_scanner(self):
+        """Get or lazily initialize the security scanner."""
+        if self._security_scanner is None:
+            from .security import SecurityScanner
+            self._security_scanner = SecurityScanner()
+        return self._security_scanner
+    def _should_perform_security_scan(self) -> bool:
+        """Check if security scanning should be performed."""
+        import os
+        sandbox_level = os.environ.get("SKILLBOX_SANDBOX_LEVEL", "3")
+        return sandbox_level == "3" and self.confirmation_callback is not None
+    def _interactive_confirmation(self, report: str, scan_id: str) -> bool:
+        """Default interactive terminal confirmation."""
+        self._log(f"\n{report}")
+        self._log("\n" + "=" * 60)
+        while True:
+            response = input("⚠️  Allow execution? (y/n): ").strip().lower()
+            if response in ['y', 'yes']:
+                return True
+            elif response in ['n', 'no']:
+                return False
+            self._log("Please enter 'y' or 'n'")
+    def _perform_security_confirmation_for_tools(
+        self,
+        tool_calls: List[Any]
+    ) -> bool:
+        """
+        Perform security scan and confirmation for tool calls.
+        Returns True if execution should proceed, False if denied.
+        Also handles skills that require elevated permissions.
+        """
+        import os
+        from .security import SecurityScanResult
+        sandbox_level = os.environ.get("SKILLBOX_SANDBOX_LEVEL", "3")
+        if sandbox_level != "3":
+            return True  # No confirmation needed for levels 1-2
+        # Get skill tool names
+        skill_tool_names = set(self.manager.skill_names())
+        skill_tool_names.update(self.manager._registry.list_multi_script_tools())
+        # Scan each skill tool call
+        combined_issues = []
+        scanned_skills = set()
+        requires_elevated = False  # Track if any skill requires elevated permissions
+        for tc in tool_calls:
+            tool_name = tc.function.name if hasattr(tc, 'function') else tc.get('name', '')
+            # Only scan skill tools, not custom tools
+            if tool_name not in skill_tool_names:
+                continue
+            # Get skill info
+            skill_name = tool_name.split('__')[0] if '__' in tool_name else tool_name
+            if skill_name in scanned_skills:
+                continue
+            scanned_skills.add(skill_name)
+            skill_info = self.manager.get_skill(skill_name)
+            if not skill_info:
+                continue
+            # Check if skill requires elevated permissions
+            if skill_info.metadata and getattr(skill_info.metadata, 'requires_elevated_permissions', False):
+                requires_elevated = True
+                self._log(f"🔓 Skill '{skill_name}' requires elevated permissions")
+            # Parse input data
+            try:
+                import json
+                input_data = json.loads(tc.function.arguments) if hasattr(tc, 'function') else {}
+            except (json.JSONDecodeError, AttributeError):
+                input_data = {}
+            # Perform security scan
+            scanner = self._get_security_scanner()
+            result = scanner.scan_skill(skill_info, input_data)
+            combined_issues.extend(result.issues)
+        # If skill requires elevated permissions, downgrade sandbox level
+        if requires_elevated and not combined_issues:
+            self._log("✅ Skill requires elevated permissions, downgrading to sandbox level 1...")
+            os.environ["SKILLBOX_SANDBOX_LEVEL"] = "1"
+            self._pending_confirmation = True
+            return True
+        if not combined_issues:
+            return True  # No issues found
+        # Create combined scan result
+        high_count = sum(1 for i in combined_issues if i.get("severity") in ["Critical", "High"])
+        medium_count = sum(1 for i in combined_issues if i.get("severity") == "Medium")
+        low_count = sum(1 for i in combined_issues if i.get("severity") == "Low")
+        combined_result = SecurityScanResult(
+            is_safe=high_count == 0,
+            issues=combined_issues,
+            scan_id=f"batch-{len(scanned_skills)}",
+            high_severity_count=high_count,
+            medium_severity_count=medium_count,
+            low_severity_count=low_count,
+        )
+        if not combined_result.requires_confirmation:
+            return True  # Only low/medium issues, proceed
+        # Ask for confirmation
+        report = combined_result.format_report()
+        self._log(f"\n🔒 Security scan detected potential issues:")
+        if self.confirmation_callback:
+            confirmed = self.confirmation_callback(report, combined_result.scan_id)
+        else:
+            confirmed = self._interactive_confirmation(report, combined_result.scan_id)
+        if confirmed:
+            # Temporarily downgrade sandbox level to allow execution
+            self._log("✅ User confirmed. Executing with sandbox level 1...")
+            os.environ["SKILLBOX_SANDBOX_LEVEL"] = "1"
+            self._pending_confirmation = True
+            return True
+        else:
+            self._log("❌ User denied execution.")
+            return False
+    def _restore_sandbox_level(self, original_level: str) -> None:
+        """Restore original sandbox level after execution."""
+        import os
+        if self._pending_confirmation:
+            os.environ["SKILLBOX_SANDBOX_LEVEL"] = original_level
+            self._pending_confirmation = False
     def _get_execution_system_prompt(self) -> str:
         """
         Generate the main execution system prompt for skill selection and file operations.
@@ -534,15 +681,18 @@ Based on the documentation, call the tools with correct parameters.
             # No tool calls
             if not message.tool_calls:
                 self._log("📝 LLM did not call any tools")
                 if self.enable_task_planning:
                     completed_id = self._check_task_completion_in_content(message.content)
                     if completed_id:
                         self._update_task_list(completed_id)
                     if self._check_all_tasks_completed():
                         self._log("🎯 All tasks completed, ending iteration")
                         return response
+                    else:
+                        # Tasks not complete and no tool calls - continue to next iteration
+                        continue
                 else:
                     return response
@@ -570,17 +720,25 @@ Based on the documentation, call the tools with correct parameters.
                 continue
             messages.append(message)
+            # Execute tools using unified execution service
             self._log(f"\n⚙️  Executing tools...")
             if self.custom_tool_handler:
+                # Custom tool handler takes precedence
                 tool_results = self.custom_tool_handler(
                     response, self.manager, allow_network, timeout
                 )
             else:
-                tool_results = self.manager.handle_tool_calls(
-                    response, allow_network=allow_network, timeout=timeout
+                # Use unified execution service with confirmation callback
+                # This handles security scanning, confirmation, and sandbox level management
+                tool_results = self.manager.handle_tool_calls_with_unified_service(
+                    response,
+                    confirmation_callback=self.confirmation_callback or self._interactive_confirmation,
+                    allow_network=allow_network,
+                    timeout=timeout
                 )
             self._log(f"\n📊 Tool execution results:")
             for idx, (result, tc) in enumerate(zip(tool_results, message.tool_calls), 1):
                 output = result.content
@@ -588,7 +746,7 @@ Based on the documentation, call the tools with correct parameters.
                     output = output[:500] + "... (truncated)"
                 self._log(f"   {idx}. {tc.function.name}")
                 self._log(f"      Result: {output}")
             for result in tool_results:
                 messages.append(result.to_openai_format())
@@ -690,19 +848,26 @@ Based on the documentation, call the tools with correct parameters.
                 self._log(f"      Arguments: {json.dumps(block.input, ensure_ascii=False)}")
             messages.append({"role": "assistant", "content": response.content})
+            # Execute tools using unified execution service
             self._log(f"\n⚙️  Executing tools...")
-            tool_results = self.manager.handle_tool_calls_claude_native(
-                response, allow_network=allow_network, timeout=timeout
+            # Use unified execution service with confirmation callback
+            # This handles security scanning, confirmation, and sandbox level management
+            tool_results = self.manager.handle_tool_calls_claude_native_with_unified_service(
+                response,
+                confirmation_callback=self.confirmation_callback or self._interactive_confirmation,
+                allow_network=allow_network,
+                timeout=timeout
             )
             self._log(f"\n📊 Tool execution results:")
             for idx, result in enumerate(tool_results, 1):
                 output = result.content
                 if len(output) > 500:
                     output = output[:500] + "... (truncated)"
                 self._log(f"   {idx}. Result: {output}")
             formatted_results = self.manager.format_tool_results_claude_native(tool_results)
             messages.append({"role": "user", "content": formatted_results})

skilllite/core/manager.py CHANGED Viewed

@@ -304,7 +304,64 @@ class SkillManager:
     ) -> List[ToolResult]:
         """Parse and execute all tool calls from Claude's native API response."""
         return self._handler.handle_tool_calls_claude_native(response, allow_network, timeout)
+    def handle_tool_calls_with_unified_service(
+        self,
+        response: Any,
+        confirmation_callback: Optional[Callable[[str, str], bool]] = None,
+        allow_network: Optional[bool] = None,
+        timeout: Optional[int] = None
+    ) -> List[ToolResult]:
+        """
+        Parse and execute all tool calls using UnifiedExecutionService.
+        This method uses the unified execution layer which:
+        1. Reads sandbox level at runtime
+        2. Handles security scanning and confirmation per-skill
+        3. Properly downgrades sandbox level after confirmation
+        Args:
+            response: Response from OpenAI-compatible API
+            confirmation_callback: Callback for security confirmation
+            allow_network: Whether to allow network access
+            timeout: Execution timeout in seconds
+        Returns:
+            List of ToolResult objects
+        """
+        return self._handler.handle_tool_calls_with_unified_service(
+            response,
+            confirmation_callback=confirmation_callback,
+            allow_network=allow_network,
+            timeout=timeout
+        )
+    def handle_tool_calls_claude_native_with_unified_service(
+        self,
+        response: Any,
+        confirmation_callback: Optional[Callable[[str, str], bool]] = None,
+        allow_network: Optional[bool] = None,
+        timeout: Optional[int] = None
+    ) -> List[ToolResult]:
+        """
+        Parse and execute all Claude tool calls using UnifiedExecutionService.
+        Args:
+            response: Response from Claude's native API
+            confirmation_callback: Callback for security confirmation
+            allow_network: Whether to allow network access
+            timeout: Execution timeout in seconds
+        Returns:
+            List of ToolResult objects
+        """
+        return self._handler.handle_tool_calls_claude_native_with_unified_service(
+            response,
+            confirmation_callback=confirmation_callback,
+            allow_network=allow_network,
+            timeout=timeout
+        )
     def format_tool_results_claude_native(self, results: List[ToolResult]) -> List[Dict[str, Any]]:
         """Format tool results for Claude's native API."""
         return self._handler.format_tool_results_claude_native(results)
@@ -335,6 +392,7 @@ class SkillManager:
         custom_tool_handler: Optional[Callable] = None,
         enable_task_planning: bool = True,
         verbose: bool = True,
+        confirmation_callback: Optional[Callable[[str, str], bool]] = None,
         **kwargs
     ) -> AgenticLoop:
         """
@@ -351,15 +409,16 @@ class SkillManager:
             custom_tool_handler: Optional custom tool handler
             enable_task_planning: Whether to generate task list before execution
             verbose: Whether to print detailed logs
+            confirmation_callback: Callback for security confirmation (sandbox_level=3)
             **kwargs: Additional arguments passed to the LLM
         Returns:
             AgenticLoop instance
         Example:
             # OpenAI-compatible (default)
             loop = manager.create_agentic_loop(client, "gpt-4")
             # Claude native API
             loop = manager.create_agentic_loop(client, "claude-3-opus",
                                                api_format="claude_native")
@@ -375,6 +434,7 @@ class SkillManager:
             custom_tool_handler=custom_tool_handler,
             enable_task_planning=enable_task_planning,
             verbose=verbose,
+            confirmation_callback=confirmation_callback,
             **kwargs
         )
@@ -421,14 +481,15 @@ class SkillManager:
         custom_tool_executor: Optional[Callable] = None,
         enable_task_planning: bool = True,
         verbose: bool = True,
+        confirmation_callback: Optional[Callable[[str, str], bool]] = None,
         **kwargs
     ) -> AgenticLoop:
         """
         Create an enhanced agentic loop with custom tools support.
         This method creates an AgenticLoop that can handle both skill tools
         and custom tools (like file operations).
         Args:
             client: LLM client (OpenAI-compatible)
             model: Model name to use
@@ -438,27 +499,32 @@ class SkillManager:
             custom_tool_executor: Executor function for custom tools
             enable_task_planning: Whether to generate task list before execution
             verbose: Whether to print detailed logs
+            confirmation_callback: Callback for security confirmation (sandbox_level=3)
             **kwargs: Additional arguments passed to the LLM
         Returns:
             AgenticLoop instance with enhanced capabilities
         """
         # Create custom tool handler that combines skill tools and custom tools
         def combined_tool_handler(response, manager, allow_network, timeout):
             from .tools import ToolUseRequest, ToolResult
             requests = ToolUseRequest.parse_from_openai_response(response)
             results = []
             # Get skill tool names
             skill_tool_names = set(self.skill_names())
             skill_tool_names.update(self._registry.list_multi_script_tools())
             for request in requests:
                 if request.name in skill_tool_names:
-                    # Execute as skill tool
-                    result = self._handler.execute_tool_call(
-                        request, allow_network=allow_network, timeout=timeout
+                    # Execute as skill tool using UnifiedExecutionService
+                    # This handles security scanning, confirmation, and proper sandbox level
+                    result = self._handler.execute_tool_call_with_unified_service(
+                        request,
+                        confirmation_callback=confirmation_callback,
+                        allow_network=allow_network,
+                        timeout=timeout
                     )
                     results.append(result)
                 elif custom_tool_executor:
@@ -473,9 +539,9 @@ class SkillManager:
                     results.append(ToolResult.error(
                         request.id, f"No executor found for tool: {request.name}"
                     ))
             return results
         return AgenticLoop(
             manager=self,
             client=client,
@@ -486,6 +552,7 @@ class SkillManager:
             custom_tool_handler=combined_tool_handler if custom_tool_executor else None,
             enable_task_planning=enable_task_planning,
             verbose=verbose,
+            confirmation_callback=confirmation_callback,
             **kwargs
         )

skilllite 0.1.0__py3-none-any.whl → 0.1.2__py3-none-any.whl

skilllite 0.1.0__py3-none-any.whl → 0.1.2__py3-none-any.whl