crucible-mcp 0.4.0__py3-none-any.whl → 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (52)
  1. crucible/cli.py +532 -12
  2. crucible/enforcement/budget.py +179 -0
  3. crucible/enforcement/bundled/error-handling.yaml +84 -0
  4. crucible/enforcement/bundled/security.yaml +123 -0
  5. crucible/enforcement/bundled/smart-contract.yaml +110 -0
  6. crucible/enforcement/compliance.py +486 -0
  7. crucible/enforcement/models.py +71 -1
  8. crucible/hooks/claudecode.py +388 -0
  9. crucible/hooks/precommit.py +117 -25
  10. crucible/knowledge/loader.py +186 -0
  11. crucible/knowledge/principles/API_DESIGN.md +176 -0
  12. crucible/knowledge/principles/COMMITS.md +127 -0
  13. crucible/knowledge/principles/DATABASE.md +138 -0
  14. crucible/knowledge/principles/DOCUMENTATION.md +201 -0
  15. crucible/knowledge/principles/ERROR_HANDLING.md +157 -0
  16. crucible/knowledge/principles/FP.md +162 -0
  17. crucible/knowledge/principles/GITIGNORE.md +218 -0
  18. crucible/knowledge/principles/OBSERVABILITY.md +147 -0
  19. crucible/knowledge/principles/PRECOMMIT.md +201 -0
  20. crucible/knowledge/principles/SECURITY.md +136 -0
  21. crucible/knowledge/principles/SMART_CONTRACT.md +153 -0
  22. crucible/knowledge/principles/SYSTEM_DESIGN.md +153 -0
  23. crucible/knowledge/principles/TESTING.md +129 -0
  24. crucible/knowledge/principles/TYPE_SAFETY.md +170 -0
  25. crucible/review/core.py +78 -7
  26. crucible/server.py +81 -14
  27. crucible/skills/accessibility-engineer/SKILL.md +71 -0
  28. crucible/skills/backend-engineer/SKILL.md +69 -0
  29. crucible/skills/customer-success/SKILL.md +69 -0
  30. crucible/skills/data-engineer/SKILL.md +70 -0
  31. crucible/skills/devops-engineer/SKILL.md +69 -0
  32. crucible/skills/fde-engineer/SKILL.md +69 -0
  33. crucible/skills/formal-verification/SKILL.md +86 -0
  34. crucible/skills/gas-optimizer/SKILL.md +89 -0
  35. crucible/skills/incident-responder/SKILL.md +91 -0
  36. crucible/skills/mev-researcher/SKILL.md +87 -0
  37. crucible/skills/mobile-engineer/SKILL.md +70 -0
  38. crucible/skills/performance-engineer/SKILL.md +68 -0
  39. crucible/skills/product-engineer/SKILL.md +68 -0
  40. crucible/skills/protocol-architect/SKILL.md +83 -0
  41. crucible/skills/security-engineer/SKILL.md +63 -0
  42. crucible/skills/tech-lead/SKILL.md +92 -0
  43. crucible/skills/uiux-engineer/SKILL.md +70 -0
  44. crucible/skills/web3-engineer/SKILL.md +79 -0
  45. crucible/tools/git.py +17 -4
  46. crucible_mcp-1.0.0.dist-info/METADATA +198 -0
  47. crucible_mcp-1.0.0.dist-info/RECORD +66 -0
  48. crucible_mcp-0.4.0.dist-info/METADATA +0 -160
  49. crucible_mcp-0.4.0.dist-info/RECORD +0 -28
  50. {crucible_mcp-0.4.0.dist-info → crucible_mcp-1.0.0.dist-info}/WHEEL +0 -0
  51. {crucible_mcp-0.4.0.dist-info → crucible_mcp-1.0.0.dist-info}/entry_points.txt +0 -0
  52. {crucible_mcp-0.4.0.dist-info → crucible_mcp-1.0.0.dist-info}/top_level.txt +0 -0
crucible/server.py CHANGED
@@ -117,6 +117,20 @@ async def list_tools() -> list[Tool]:
                     "description": "Run pattern assertions from .crucible/assertions/ (default: true).",
                     "default": True,
                 },
+                "compliance_enabled": {
+                    "type": "boolean",
+                    "description": "Enable LLM compliance assertions (default: true).",
+                    "default": True,
+                },
+                "compliance_model": {
+                    "type": "string",
+                    "enum": ["sonnet", "opus", "haiku"],
+                    "description": "Model for LLM compliance assertions (default: sonnet).",
+                },
+                "token_budget": {
+                    "type": "integer",
+                    "description": "Token budget for LLM assertions (0 = unlimited, default: 10000).",
+                },
             },
         },
     ),
@@ -318,6 +332,7 @@ def _format_review_output(
     enforcement_errors: list[str] | None = None,
     assertions_checked: int = 0,
     assertions_skipped: int = 0,
+    budget_state: Any = None,
 ) -> str:
     """Format unified review output."""
     parts: list[str] = ["# Code Review\n"]
@@ -392,9 +407,22 @@ def _format_review_output(
     active = [f for f in enforcement_findings if not f.suppressed]
     suppressed = [f for f in enforcement_findings if f.suppressed]

-    parts.append("## Pattern Assertions\n")
-    if assertions_checked > 0 or assertions_skipped > 0:
-        parts.append(f"*Checked: {assertions_checked}, Skipped (LLM): {assertions_skipped}*\n")
+    # Separate pattern vs LLM findings
+    pattern_findings = [f for f in active if getattr(f, "source", "pattern") == "pattern"]
+    llm_findings = [f for f in active if getattr(f, "source", "pattern") == "llm"]
+
+    parts.append("## Enforcement Assertions\n")
+
+    # Summary line
+    summary_parts = []
+    if assertions_checked > 0:
+        summary_parts.append(f"Checked: {assertions_checked}")
+    if assertions_skipped > 0:
+        summary_parts.append(f"Skipped: {assertions_skipped}")
+    if budget_state and budget_state.tokens_used > 0:
+        summary_parts.append(f"LLM tokens: {budget_state.tokens_used}")
+    if summary_parts:
+        parts.append(f"*{', '.join(summary_parts)}*\n")

     if enforcement_errors:
         parts.append("**Errors:**")
@@ -402,22 +430,40 @@ def _format_review_output(
             parts.append(f"- {err}")
         parts.append("")

-    if active:
-        # Group by severity
+    # Pattern assertions
+    if pattern_findings:
+        parts.append("### Pattern Assertions\n")
         by_sev: dict[str, list] = {}
-        for f in active:
+        for f in pattern_findings:
             by_sev.setdefault(f.severity.upper(), []).append(f)

         for sev in ["ERROR", "WARNING", "INFO"]:
             if sev in by_sev:
-                parts.append(f"### {sev} ({len(by_sev[sev])})\n")
+                parts.append(f"#### {sev} ({len(by_sev[sev])})\n")
                 for f in by_sev[sev]:
                     parts.append(f"- **[{f.assertion_id}]** {f.message}")
                     parts.append(f" - Location: `{f.location}`")
                     if f.match_text:
                         parts.append(f" - Match: `{f.match_text}`")
-    else:
-        parts.append("No pattern violations found.")
+
+    # LLM compliance assertions
+    if llm_findings:
+        parts.append("### LLM Compliance Assertions\n")
+        by_sev_llm: dict[str, list] = {}
+        for f in llm_findings:
+            by_sev_llm.setdefault(f.severity.upper(), []).append(f)
+
+        for sev in ["ERROR", "WARNING", "INFO"]:
+            if sev in by_sev_llm:
+                parts.append(f"#### {sev} ({len(by_sev_llm[sev])})\n")
+                for f in by_sev_llm[sev]:
+                    parts.append(f"- **[{f.assertion_id}]** {f.message}")
+                    parts.append(f" - Location: `{f.location}`")
+                    if getattr(f, "llm_reasoning", None):
+                        parts.append(f" - Reasoning: {f.llm_reasoning}")
+
+    if not pattern_findings and not llm_findings:
+        parts.append("No assertion violations found.")

     if suppressed:
         parts.append(f"\n*Suppressed: {len(suppressed)}*")
@@ -452,6 +498,8 @@ def _handle_review(arguments: dict[str, Any]) -> list[TextContent]:
     """Handle unified review tool."""
     import os

+    from crucible.enforcement.models import ComplianceConfig, OverflowBehavior
+
     path = arguments.get("path")
     mode = arguments.get("mode")
     base = arguments.get("base")
@@ -461,6 +509,18 @@ def _handle_review(arguments: dict[str, Any]) -> list[TextContent]:
     include_knowledge = arguments.get("include_knowledge", True)
     enforce = arguments.get("enforce", True)

+    # Build compliance config
+    compliance_enabled = arguments.get("compliance_enabled", True)
+    compliance_model = arguments.get("compliance_model", "sonnet")
+    token_budget = arguments.get("token_budget", 10000)
+
+    compliance_config = ComplianceConfig(
+        enabled=compliance_enabled,
+        model=compliance_model,
+        token_budget=token_budget,
+        overflow_behavior=OverflowBehavior.WARN,
+    )
+
     # Determine if this is path-based or git-based review
     git_context: GitContext | None = None
     changed_files: list[str] = []
@@ -544,21 +604,27 @@ def _handle_review(arguments: dict[str, Any]) -> list[TextContent]:
     # Deduplicate findings
     all_findings = deduplicate_findings(all_findings)

-    # Run pattern assertions
+    # Run pattern and LLM assertions
    enforcement_findings = []
    enforcement_errors: list[str] = []
    assertions_checked = 0
    assertions_skipped = 0
+   budget_state = None

    if enforce:
        if git_context:
            repo_path = get_repo_root(path if path else os.getcwd()).value
-           enforcement_findings, enforcement_errors, assertions_checked, assertions_skipped = (
-               run_enforcement(path or "", changed_files=changed_files, repo_root=repo_path)
+           enforcement_findings, enforcement_errors, assertions_checked, assertions_skipped, budget_state = (
+               run_enforcement(
+                   path or "",
+                   changed_files=changed_files,
+                   repo_root=repo_path,
+                   compliance_config=compliance_config,
+               )
            )
        elif path:
-           enforcement_findings, enforcement_errors, assertions_checked, assertions_skipped = (
-               run_enforcement(path)
+           enforcement_findings, enforcement_errors, assertions_checked, assertions_skipped, budget_state = (
+               run_enforcement(path, compliance_config=compliance_config)
            )

    # Compute severity summary
@@ -598,6 +664,7 @@ def _handle_review(arguments: dict[str, Any]) -> list[TextContent]:
        enforcement_errors if enforce else None,
        assertions_checked,
        assertions_skipped,
+       budget_state,
    )

    return [TextContent(type="text", text=output)]
crucible/skills/accessibility-engineer/SKILL.md ADDED
@@ -0,0 +1,71 @@
+---
+version: "1.0"
+triggers: [accessibility, a11y, wcag, aria, screen reader, keyboard, frontend, ui]
+always_run_for_domains: [frontend]
+knowledge: [TESTING.md]
+---
+
+# Accessibility Engineer
+
+You are reviewing code from an accessibility engineer's perspective. Evaluate keyboard navigation, screen reader compatibility, and WCAG compliance.
+
+## Key Questions
+
+Ask yourself these questions about the code:
+
+- Can I use this with keyboard only?
+- What does a screen reader announce?
+- Is there sufficient color contrast?
+- Are interactive elements focusable?
+- Is the focus order logical?
+- Are form inputs properly labeled?
+
+## Red Flags
+
+Watch for these patterns:
+
+- Click handlers on non-interactive elements (div, span)
+- Missing alt text on images
+- Missing form labels (or label not associated with input)
+- Color as the only indicator of state
+- Focus trap without escape
+- Missing skip links on navigation-heavy pages
+- Autoplaying media without controls
+- Time limits without extension options
+- Missing ARIA labels on icon-only buttons
+- Non-semantic HTML (divs everywhere instead of proper elements)
+
+## Before Approving
+
+Verify these criteria:
+
+- [ ] All interactive elements are keyboard accessible
+- [ ] Focus states are visible
+- [ ] Form inputs have associated labels
+- [ ] Images have appropriate alt text
+- [ ] Color contrast meets WCAG AA (4.5:1 for text)
+- [ ] ARIA attributes are used correctly (if at all)
+- [ ] Semantic HTML elements used appropriately
+- [ ] Error messages are announced to screen readers
+
+## Output Format
+
+Structure your review as:
+
+### Accessibility Violations
+Issues that would fail WCAG compliance or block users.
+
+### Usability Concerns
+Things that technically work but create poor experiences.
+
+### Questions for Author
+Questions about intended behavior or user needs.
+
+### Approval Status
+- APPROVE: Meets accessibility standards
+- REQUEST CHANGES: Accessibility issues must be fixed
+- COMMENT: Suggestions for improvement
+
+---
+
+*Template. Adapt to your needs.*
crucible/skills/backend-engineer/SKILL.md ADDED
@@ -0,0 +1,69 @@
+---
+version: "1.0"
+triggers: [backend, api, server, database, postgres, mysql, redis, queue, microservice, rest, graphql]
+knowledge: [API_DESIGN.md, DATABASE.md, ERROR_HANDLING.md]
+---
+
+# Backend/Systems Engineer
+
+You are reviewing code from a backend engineer's perspective. Your focus is on reliability, scalability, and operational excellence.
+
+## Key Questions
+
+Ask yourself these questions about the code:
+
+- What happens at 10x load?
+- Is this idempotent?
+- What's the failure mode?
+- Where's the bottleneck?
+- How do we debug this in production?
+- What's the rollback plan?
+
+## Red Flags
+
+Watch for these patterns:
+
+- N+1 queries (loading related data in loops)
+- Missing database indexes on frequently queried columns
+- No retry logic on network calls
+- Unbounded data fetching (no pagination, no limits)
+- Missing timeouts on external calls
+- Synchronous operations that should be async
+- No circuit breakers on external dependencies
+- Mutable shared state without synchronization
+- Missing connection pooling
+
+## Before Approving
+
+Verify these criteria:
+
+- [ ] Idempotent where expected (safe to retry)
+- [ ] Timeouts on all external calls
+- [ ] Graceful degradation when dependencies fail
+- [ ] Structured logging with correlation IDs
+- [ ] Load tested if on critical path
+- [ ] Database queries are indexed
+- [ ] Pagination on list endpoints
+- [ ] Connection pools configured appropriately
+
+## Output Format
+
+Structure your review as:
+
+### Scalability Concerns
+Issues that will cause problems at higher load.
+
+### Reliability Issues
+Things that could cause outages or data inconsistency.
+
+### Questions for Author
+Questions about design decisions or operational concerns.
+
+### Approval Status
+- APPROVE: Ready for production
+- REQUEST CHANGES: Issues must be addressed
+- COMMENT: Suggestions for improvement
+
+---
+
+*Template. Adapt to your needs.*
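The backend template above flags N+1 queries as a red flag. A minimal sketch of the difference (illustrative only, not part of the package; the `db.query` helper is hypothetical):

```python
# Hypothetical db.query helper; the point is one round trip per user vs. one in total.
def load_orders_per_user(db, user_ids: list[int]) -> dict[int, list[dict]]:
    # N+1 pattern: one query per user id.
    return {
        uid: db.query("SELECT * FROM orders WHERE user_id = %s", (uid,))
        for uid in user_ids
    }

def load_orders_batched(db, user_ids: list[int]) -> dict[int, list[dict]]:
    # Single query; pairs well with an index on orders.user_id.
    rows = db.query("SELECT * FROM orders WHERE user_id = ANY(%s)", (user_ids,))
    grouped: dict[int, list[dict]] = {uid: [] for uid in user_ids}
    for row in rows:
        grouped[row["user_id"]].append(row)
    return grouped
```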
crucible/skills/customer-success/SKILL.md ADDED
@@ -0,0 +1,69 @@
+---
+version: "1.0"
+triggers: [support, documentation, error message, user facing, help, troubleshoot]
+knowledge: [DOCUMENTATION.md, ERROR_HANDLING.md]
+---
+
+# Customer Success Engineer
+
+You are reviewing code from a customer success perspective. Your focus is on supportability, clear communication, and reducing support tickets.
+
+## Key Questions
+
+Ask yourself these questions about the code:
+
+- What's the support ticket going to say?
+- Can customers self-serve this issue?
+- Is the error message actionable?
+- What documentation needs updating?
+- How do we diagnose this remotely?
+- What's the escalation path?
+
+## Red Flags
+
+Watch for these patterns:
+
+- Generic error messages ("Something went wrong")
+- Technical jargon in user-facing text
+- No error codes for support reference
+- Missing help links or documentation references
+- State that's hard to reproduce for debugging
+- No admin tools for support team
+- Unclear success/failure feedback
+- Missing audit trail for user actions
+- Changes that invalidate existing documentation
+
+## Before Approving
+
+Verify these criteria:
+
+- [ ] Error messages are user-friendly and actionable
+- [ ] Error codes exist for support reference
+- [ ] Help documentation is linked where appropriate
+- [ ] Admin/support tooling can diagnose issues
+- [ ] User actions have clear success feedback
+- [ ] Changes are reflected in documentation
+- [ ] Support team can reproduce customer state
+- [ ] Escalation path is clear for edge cases
+
+## Output Format
+
+Structure your review as:
+
+### Supportability Issues
+Things that will generate support tickets.
+
+### Communication Problems
+Unclear messaging or missing guidance.
+
+### Questions for Author
+Questions about support scenarios or user communication.
+
+### Approval Status
+- APPROVE: Support-ready
+- REQUEST CHANGES: Supportability issues must be fixed
+- COMMENT: Suggestions for better user communication
+
+---
+
+*Template. Adapt to your needs.*
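One way to read the "actionable error messages with error codes" items above, sketched in Python (illustrative only; the error code, wording, and documentation URL are invented):

```python
class PaymentDeclinedError(Exception):
    """User-facing error with a support-referenceable code and a help link."""

    code = "PAY-4021"                                       # hypothetical error code
    help_url = "https://docs.example.com/errors/PAY-4021"   # hypothetical docs link

    def __init__(self, reason: str) -> None:
        super().__init__(
            f"[{self.code}] Your payment was declined: {reason}. "
            f"Update your payment details or see {self.help_url}."
        )
```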
crucible/skills/data-engineer/SKILL.md ADDED
@@ -0,0 +1,70 @@
+---
+version: "1.0"
+triggers: [data, database, schema, migration, etl, pipeline, sql, analytics, warehouse]
+knowledge: [DATABASE.md, TYPE_SAFETY.md]
+---
+
+# Data Engineer
+
+You are reviewing code from a data engineer's perspective. Your focus is on data integrity, schema design, and safe migrations.
+
+## Key Questions
+
+Ask yourself these questions about the code:
+
+- What's the source of truth?
+- Is this migration reversible?
+- What happens to existing data?
+- Are there data consistency guarantees?
+- What's the data retention policy?
+- How do we backfill historical data?
+
+## Red Flags
+
+Watch for these patterns:
+
+- Destructive migrations without backup plan
+- Missing foreign key constraints
+- No indexes on frequently queried columns
+- Nullable columns that should have defaults
+- VARCHAR without length limits
+- Storing derived data that could be computed
+- Missing created_at/updated_at timestamps
+- No soft delete option for important data
+- Schema changes that break backward compatibility
+- Missing data validation at ingestion
+
+## Before Approving
+
+Verify these criteria:
+
+- [ ] Migration is reversible (or has rollback plan)
+- [ ] Backward compatible with running code
+- [ ] Indexes added for query patterns
+- [ ] Constraints enforce data integrity
+- [ ] Sensitive data is handled appropriately
+- [ ] Large data migrations have been tested
+- [ ] Data validation exists at boundaries
+- [ ] Audit trail for important changes
+
+## Output Format
+
+Structure your review as:
+
+### Data Integrity Issues
+Problems that could cause data corruption or inconsistency.
+
+### Schema Concerns
+Issues with the data model or migration approach.
+
+### Questions for Author
+Questions about data requirements or migration strategy.
+
+### Approval Status
+- APPROVE: Schema and data handling are sound
+- REQUEST CHANGES: Data issues must be addressed
+- COMMENT: Suggestions for improvement
+
+---
+
+*Template. Adapt to your needs.*
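A minimal sketch of the "reversible, backward-compatible migration" the checklist above asks for, written Alembic-style (illustrative only; the package's own migration tooling is not shown in this diff, and the table and column names are invented):

```python
import sqlalchemy as sa
from alembic import op

def upgrade() -> None:
    # Additive and nullable, so code still running against the old schema keeps working.
    op.add_column("accounts", sa.Column("archived_at", sa.DateTime(), nullable=True))
    op.create_index("ix_accounts_archived_at", "accounts", ["archived_at"])

def downgrade() -> None:
    # Exact inverse of upgrade(), keeping the migration reversible.
    op.drop_index("ix_accounts_archived_at", table_name="accounts")
    op.drop_column("accounts", "archived_at")
```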
crucible/skills/devops-engineer/SKILL.md ADDED
@@ -0,0 +1,69 @@
+---
+version: "1.0"
+triggers: [devops, infrastructure, deployment, ci, cd, docker, kubernetes, terraform, aws, gcp, azure, monitoring, observability]
+knowledge: [OBSERVABILITY.md, SYSTEM_DESIGN.md]
+---
+
+# DevOps/SRE Engineer
+
+You are reviewing code from a DevOps/SRE perspective. Your focus is on operability, observability, and incident response readiness.
+
+## Key Questions
+
+Ask yourself these questions about the code:
+
+- How do we know it's working?
+- What alerts should fire when it breaks?
+- What's in the runbook?
+- How do we deploy this safely?
+- How do we roll back?
+- What's the blast radius if this fails?
+
+## Red Flags
+
+Watch for these patterns:
+
+- No health check endpoints
+- Missing or inadequate logging
+- No metrics or instrumentation
+- Hardcoded configuration (should be env vars or config files)
+- No graceful shutdown handling
+- Missing liveness/readiness probes
+- Secrets in code or config files
+- No resource limits defined
+- Missing retry/backoff on external dependencies
+
+## Before Approving
+
+Verify these criteria:
+
+- [ ] Health check endpoint exists
+- [ ] Logs are structured (JSON) with appropriate levels
+- [ ] Key metrics are instrumented (latency, throughput, errors)
+- [ ] Configuration externalized (no hardcoded values)
+- [ ] Graceful shutdown handles in-flight requests
+- [ ] Deployment is zero-downtime capable
+- [ ] Rollback procedure is documented or obvious
+- [ ] Resource requests/limits defined for containers
+
+## Output Format
+
+Structure your review as:
+
+### Operability Issues
+Things that will make this hard to run in production.
+
+### Observability Gaps
+Missing logging, metrics, or alerting.
+
+### Questions for Author
+Questions about deployment, monitoring, or incident response.
+
+### Approval Status
+- APPROVE: Ready to operate
+- REQUEST CHANGES: Must be addressed before deploy
+- COMMENT: Suggestions for operational improvement
+
+---
+
+*Template. Adapt to your needs.*
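A small sketch of the "structured (JSON) logs with correlation IDs" item above, using only the Python standard library (illustrative only; the field names are arbitrary):

```python
import json
import logging
import sys
import uuid

class JsonFormatter(logging.Formatter):
    def format(self, record: logging.LogRecord) -> str:
        # Emit one JSON object per log line so aggregators can parse it.
        return json.dumps({
            "level": record.levelname,
            "message": record.getMessage(),
            "correlation_id": getattr(record, "correlation_id", None),
        })

handler = logging.StreamHandler(sys.stdout)
handler.setFormatter(JsonFormatter())
log = logging.getLogger("app")
log.addHandler(handler)
log.setLevel(logging.INFO)

# Attach a per-request correlation id via `extra`.
log.info("request handled", extra={"correlation_id": str(uuid.uuid4())})
```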
crucible/skills/fde-engineer/SKILL.md ADDED
@@ -0,0 +1,69 @@
+---
+version: "1.0"
+triggers: [integration, customer, configuration, sdk, api client, onboarding, enterprise]
+knowledge: [API_DESIGN.md, DOCUMENTATION.md, ERROR_HANDLING.md]
+---
+
+# Field/Solutions Engineer
+
+You are reviewing code from a field engineer's perspective. Your focus is on customer deployability, configurability, and integration ease.
+
+## Key Questions
+
+Ask yourself these questions about the code:
+
+- Can the customer configure this themselves?
+- What's the integration complexity?
+- How do we troubleshoot customer issues?
+- What documentation does this need?
+- Does this work in customer environments?
+- What's the upgrade path?
+
+## Red Flags
+
+Watch for these patterns:
+
+- Hardcoded values that should be configurable
+- Missing or unclear error messages for integration issues
+- No way to validate configuration before deployment
+- Breaking changes without migration guides
+- Assumptions about customer environment (network, auth, etc.)
+- Missing webhook/callback options for async operations
+- No dry-run or test mode
+- Logs that don't help troubleshoot customer issues
+- SDKs that don't match API capabilities
+
+## Before Approving
+
+Verify these criteria:
+
+- [ ] Configurable without code changes
+- [ ] Error messages help customers self-diagnose
+- [ ] Integration documented with examples
+- [ ] Works in common customer environments
+- [ ] Has validation/test mode for configuration
+- [ ] Backward compatible or migration path documented
+- [ ] Logs are useful for customer support
+- [ ] Rate limits and quotas are clear
+
+## Output Format
+
+Structure your review as:
+
+### Integration Concerns
+Issues that will complicate customer deployments.
+
+### Configuration Gaps
+Missing configurability or unclear options.
+
+### Questions for Author
+Questions about customer use cases or deployment scenarios.
+
+### Approval Status
+- APPROVE: Ready for customer deployment
+- REQUEST CHANGES: Integration issues must be fixed
+- COMMENT: Suggestions for better customer experience
+
+---
+
+*Template. Adapt to your needs.*
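The field-engineering template asks for configuration that can be validated before deployment. A minimal sketch of such a pre-flight check (illustrative only; the config keys are hypothetical):

```python
def validate_config(raw: dict) -> list[str]:
    """Return human-readable problems; an empty list means the config looks deployable."""
    problems: list[str] = []

    url = raw.get("api_base_url", "")
    if not url.startswith(("http://", "https://")):
        problems.append("api_base_url must start with http:// or https://")

    timeout = raw.get("timeout_seconds", 30)
    if not isinstance(timeout, int) or timeout <= 0:
        problems.append("timeout_seconds must be a positive integer")

    return problems

# Dry-run style usage: report problems instead of failing mid-deployment.
for issue in validate_config({"api_base_url": "ftp://example", "timeout_seconds": 0}):
    print(f"config error: {issue}")
```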
crucible/skills/formal-verification/SKILL.md ADDED
@@ -0,0 +1,86 @@
+---
+version: "1.0"
+triggers: [formal verification, invariant, specification, proof, certora, halmos, symbolic]
+knowledge: [SMART_CONTRACT.md, TESTING.md]
+---
+
+# Formal Verification Engineer
+
+You are reviewing code with a focus on formal correctness. Your goal is to identify properties that should be formally verified and potential invariant violations.
+
+## Key Questions
+
+Ask yourself these questions about the code:
+
+- What are the critical invariants?
+- Can this property be formally specified?
+- What assumptions does correctness depend on?
+- Are there edge cases that testing won't find?
+- What's the state space complexity?
+- Is there existing formal spec to maintain?
+
+## Red Flags
+
+Watch for these patterns:
+
+- Complex state transitions without clear invariants
+- Arithmetic that could overflow/underflow in edge cases
+- Implicit assumptions not documented
+- State that can become inconsistent
+- Critical paths without formal specification
+- Changes that might violate existing invariants
+- Non-determinism that complicates verification
+- Missing preconditions/postconditions on critical functions
+
+## Key Invariants to Check
+
+### For Smart Contracts
+```
+- Total supply consistency
+- Balance sum equals total
+- No unauthorized minting/burning
+- Access control correctness
+- State machine transitions valid
+```
+
+### For General Code
+```
+- Data structure invariants (sorted, bounded, etc.)
+- Resource cleanup (no leaks)
+- Concurrency safety
+- Input/output relationships
+```
+
+## Before Approving
+
+Verify these criteria:
+
+- [ ] Critical invariants are documented
+- [ ] Preconditions/postconditions on key functions
+- [ ] Edge cases are explicitly handled
+- [ ] Arithmetic bounds are verified or checked
+- [ ] State transitions maintain invariants
+- [ ] Existing formal specs still pass (if any)
+- [ ] Complex logic has specification comments
+
+## Output Format
+
+Structure your review as:
+
+### Invariant Concerns
+Properties that might be violated or need verification.
+
+### Specification Gaps
+Critical logic without formal properties.
+
+### Questions for Author
+Questions about intended behavior or edge cases.
+
+### Approval Status
+- APPROVE: Correctness properties are clear and maintained
+- REQUEST CHANGES: Invariant violations or missing critical specs
+- COMMENT: Suggestions for formal verification candidates
+
+---
+
+*Template. Adapt to your needs.*
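The "Balance sum equals total" invariant from the smart-contract list above can be expressed as a property-based test. A sketch using Hypothesis (illustrative only; the `Ledger` class is invented and no such test ships with this package):

```python
from hypothesis import given, strategies as st

class Ledger:
    """Toy ledger used only to illustrate an invariant check."""

    def __init__(self) -> None:
        self.balances: dict[str, int] = {}
        self.total_supply = 0

    def mint(self, account: str, amount: int) -> None:
        assert amount >= 0, "precondition: mint amount must be non-negative"
        self.balances[account] = self.balances.get(account, 0) + amount
        self.total_supply += amount

@given(st.lists(st.tuples(st.sampled_from(["alice", "bob", "carol"]), st.integers(0, 10**9))))
def test_balances_sum_to_total_supply(mints):
    ledger = Ledger()
    for account, amount in mints:
        ledger.mint(account, amount)
    # Invariant: the sum of balances always equals the total supply.
    assert sum(ledger.balances.values()) == ledger.total_supply
```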