npm - @hustle-together/api-dev-tools - Versions diffs - 1.7.0 → 1.7.1 - Mend

@hustle-together/api-dev-tools 1.7.0 → 1.7.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2)

package/hooks/enforce-external-research.py +195 -185
package/package.json +1 -1

package/hooks/enforce-external-research.py CHANGED

@@ -1,13 +1,20 @@
 #!/usr/bin/env python3
 """
 Hook: UserPromptSubmit
-Purpose: Enforce research before answering external API/SDK questions
+Purpose: ALWAYS enforce research before answering technical questions
-This hook runs BEFORE Claude processes the user's prompt. It detects
-questions about external APIs, SDKs, or services and injects context
-requiring Claude to research first before answering.
+This hook runs BEFORE Claude processes the user's prompt. It aggressively
+detects ANY technical question and requires comprehensive research using
+BOTH Context7 AND multiple WebSearches before answering.
-Philosophy: "When in doubt, research. Training data is ALWAYS potentially outdated."
+Philosophy: "ALWAYS research. Training data is NEVER trustworthy for technical info."
+The hook triggers on:
+- ANY mention of APIs, SDKs, libraries, packages, frameworks
+- ANY technical "how to" or capability questions
+- ANY code-related questions (functions, methods, parameters, types)
+- ANY questions about tools, services, or platforms
+- ANY request for implementation, editing, or changes
 Returns:
   - Prints context to stdout (injected into conversation)
@@ -23,134 +30,172 @@ from datetime import datetime
 STATE_FILE = Path(__file__).parent.parent / "api-dev-state.json"
 # ============================================================================
-# PATTERN-BASED DETECTION
+# AGGRESSIVE DETECTION PATTERNS
 # ============================================================================
-# Patterns that indicate external service/API mentions
-EXTERNAL_SERVICE_PATTERNS = [
-    # Package names
-    r"@[\w-]+/[\w-]+",                    # @scope/package
-    r"\b[\w-]+-(?:sdk|api|js|ts|py)\b",   # something-sdk, something-api, something-js
-    # API/SDK keywords
-    r"\b(?:api|sdk|library|package|module|framework)\b",
-    # Technical implementation terms
-    r"\b(?:endpoint|route|webhook|oauth|auth|token)\b",
-    # Version references
-    r"\bv?\d+\.\d+(?:\.\d+)?\b",           # version numbers like v1.2.3, 2.0
-    # Import/require patterns
-    r"(?:import|require|from)\s+['\"][\w@/-]+['\"]",
+# Technical terms that ALWAYS trigger research
+TECHNICAL_TERMS = [
+    # Code/Development
+    r"\b(?:function|method|class|interface|type|schema|model)\b",
+    r"\b(?:parameter|argument|option|config|setting|property)\b",
+    r"\b(?:import|export|require|module|package|library|dependency)\b",
+    r"\b(?:api|sdk|framework|runtime|engine|platform)\b",
+    r"\b(?:endpoint|route|url|path|request|response|header)\b",
+    r"\b(?:database|query|table|collection|document|record)\b",
+    r"\b(?:authentication|authorization|token|key|secret|credential)\b",
+    r"\b(?:error|exception|bug|issue|problem|fix)\b",
+    r"\b(?:test|spec|coverage|mock|stub|fixture)\b",
+    r"\b(?:deploy|build|compile|bundle|publish|release)\b",
+    r"\b(?:install|setup|configure|initialize|migrate)\b",
+    r"\b(?:provider|service|client|server|handler|middleware)\b",
+    r"\b(?:stream|async|await|promise|callback|event)\b",
+    r"\b(?:component|widget|element|view|layout|template)\b",
+    r"\b(?:state|store|reducer|action|context|hook)\b",
+    r"\b(?:validate|parse|serialize|transform|convert)\b",
+    # Package patterns
+    r"@[\w-]+/[\w-]+",                      # @scope/package
+    r"\b[\w-]+-(?:sdk|api|js|ts|py|go|rs)\b",  # something-sdk, something-api
+    # Version patterns
+    r"\bv?\d+\.\d+(?:\.\d+)?(?:-[\w.]+)?\b",  # v1.2.3, 2.0.0-beta
+    # File patterns
+    r"\b[\w-]+\.(?:ts|js|tsx|jsx|py|go|rs|json|yaml|yml|toml|env)\b",
 ]
-# Patterns that indicate asking about features/capabilities
-CAPABILITY_QUESTION_PATTERNS = [
-    # "What does X support/have/do"
-    r"what\s+(?:does|can|are|is)\s+\w+",
-    r"what\s+\w+\s+(?:support|have|provide|offer)",
-    # "Does X support/have"
-    r"(?:does|can|will)\s+\w+\s+(?:support|have|handle|do|work)",
-    # "How to/do" questions
-    r"how\s+(?:to|do|does|can|should)\s+",
-    # Lists and availability
-    r"(?:list|show)\s+(?:of|all|available)",
-    r"which\s+\w+\s+(?:are|is)\s+(?:available|supported)",
-    r"all\s+(?:available|supported)\s+\w+",
-    # Examples and implementation
-    r"example\s+(?:of|for|using|with)",
-    r"how\s+to\s+(?:use|implement|integrate|connect|setup|configure)",
+# Question patterns that indicate asking about functionality
+QUESTION_PATTERNS = [
+    # Direct questions
+    r"\b(?:what|which|where|when|why|how)\b",
+    r"\b(?:can|could|would|should|will|does|do|is|are)\b.*\?",
+    # Requests
+    r"\b(?:show|tell|explain|describe|list|find|get|give)\b",
+    r"\b(?:help|need|want|looking for|trying to)\b",
+    # Actions
+    r"\b(?:create|make|build|add|implement|write|generate)\b",
+    r"\b(?:update|change|modify|edit|fix|refactor|improve)\b",
+    r"\b(?:delete|remove|drop|clear|reset)\b",
+    r"\b(?:connect|integrate|link|sync|merge)\b",
+    r"\b(?:debug|trace|log|monitor|track)\b",
+    # Comparisons
+    r"\b(?:difference|compare|versus|vs|between|or)\b",
+    r"\b(?:better|best|recommended|preferred|alternative)\b",
 ]
-# Common external service/company names (partial list - patterns catch the rest)
-KNOWN_SERVICES = [
-    # AI/ML
-    "openai", "anthropic", "google", "gemini", "gpt", "claude", "llama",
-    "groq", "perplexity", "mistral", "cohere", "huggingface", "replicate",
-    # Cloud/Infrastructure
-    "aws", "azure", "gcp", "vercel", "netlify", "cloudflare", "supabase",
-    "firebase", "mongodb", "postgres", "redis", "elasticsearch",
-    # APIs/Services
-    "stripe", "twilio", "sendgrid", "mailchimp", "slack", "discord",
-    "github", "gitlab", "bitbucket", "jira", "notion", "airtable",
-    "shopify", "salesforce", "hubspot", "zendesk",
-    # Data/Analytics
-    "segment", "mixpanel", "amplitude", "datadog", "sentry", "grafana",
-    # Media/Content
-    "cloudinary", "imgix", "mux", "brandfetch", "unsplash", "pexels",
-    # Auth
-    "auth0", "okta", "clerk", "nextauth", "passport",
+# Phrases that ALWAYS require research (no exceptions)
+ALWAYS_RESEARCH_PHRASES = [
+    r"how (?:to|do|does|can|should|would)",
+    r"what (?:is|are|does|can|should)",
+    r"(?:does|can|will|should) .+ (?:support|have|handle|work|do)",
+    r"(?:list|show|get|find) (?:all|available|supported)",
+    r"example (?:of|for|using|with|code)",
+    r"(?:implement|add|create|build|write|generate) .+",
+    r"(?:update|change|modify|edit|fix) .+",
+    r"(?:configure|setup|install|deploy) .+",
+    r"(?:error|issue|problem|bug|not working)",
+    r"(?:api|sdk|library|package|module|framework)",
+    r"(?:documentation|docs|reference|guide)",
+]
-    # Payments
-    "paypal", "square", "braintree", "adyen",
+# Exclusion patterns - things that DON'T need research
+EXCLUDE_PATTERNS = [
+    r"^(?:hi|hello|hey|thanks|thank you|ok|okay|yes|no|sure)[\s!?.]*$",
+    r"^(?:good morning|good afternoon|good evening|goodbye|bye)[\s!?.]*$",
+    r"^(?:please|sorry|excuse me)[\s!?.]*$",
+    r"^(?:\d+[\s+\-*/]\d+|calculate|math).*$",  # Simple math
 ]
 # ============================================================================
 # DETECTION LOGIC
 # ============================================================================
-def detect_external_api_question(prompt: str) -> dict:
+def is_excluded(prompt: str) -> bool:
+    """Check if prompt is a simple greeting or non-technical."""
+    prompt_clean = prompt.strip().lower()
+    # Very short prompts that are just greetings
+    if len(prompt_clean) < 20:
+        for pattern in EXCLUDE_PATTERNS:
+            if re.match(pattern, prompt_clean, re.IGNORECASE):
+                return True
+    return False
+def detect_technical_question(prompt: str) -> dict:
     """
-    Detect if the prompt is asking about external APIs/SDKs.
+    Aggressively detect if the prompt is technical and requires research.
     Returns:
         {
             "detected": bool,
             "terms": list of detected terms,
-            "patterns_matched": list of pattern types matched,
-            "confidence": "high" | "medium" | "low"
+            "patterns_matched": list of pattern types,
+            "confidence": "critical" | "high" | "medium" | "low" | "none"
         }
     """
+    if is_excluded(prompt):
+        return {
+            "detected": False,
+            "terms": [],
+            "patterns_matched": [],
+            "confidence": "none",
+        }
     prompt_lower = prompt.lower()
     detected_terms = []
     patterns_matched = []
-    # Check for known services
-    for service in KNOWN_SERVICES:
-        if service in prompt_lower:
-            detected_terms.append(service)
-            patterns_matched.append("known_service")
-    # Check external service patterns
-    for pattern in EXTERNAL_SERVICE_PATTERNS:
+    # Check for ALWAYS_RESEARCH_PHRASES first (highest priority)
+    for pattern in ALWAYS_RESEARCH_PHRASES:
+        if re.search(pattern, prompt_lower, re.IGNORECASE):
+            patterns_matched.append("always_research")
+            # Extract the matched phrase
+            match = re.search(pattern, prompt_lower, re.IGNORECASE)
+            if match:
+                detected_terms.append(match.group(0)[:50])
+    # Check technical terms
+    for pattern in TECHNICAL_TERMS:
         matches = re.findall(pattern, prompt_lower, re.IGNORECASE)
         if matches:
-            detected_terms.extend(matches)
-            patterns_matched.append("external_service_pattern")
+            detected_terms.extend(matches[:3])  # Limit per pattern
+            patterns_matched.append("technical_term")
-    # Check capability question patterns
-    for pattern in CAPABILITY_QUESTION_PATTERNS:
+    # Check question patterns
+    for pattern in QUESTION_PATTERNS:
         if re.search(pattern, prompt_lower, re.IGNORECASE):
-            patterns_matched.append("capability_question")
+            patterns_matched.append("question_pattern")
             break
     # Deduplicate
-    detected_terms = list(set(detected_terms))
+    detected_terms = list(dict.fromkeys(detected_terms))[:10]
     patterns_matched = list(set(patterns_matched))
-    # Determine confidence
-    if "known_service" in patterns_matched and "capability_question" in patterns_matched:
+    # Determine confidence - MUCH more aggressive
+    if "always_research" in patterns_matched:
+        confidence = "critical"
+    elif "technical_term" in patterns_matched and "question_pattern" in patterns_matched:
         confidence = "high"
-    elif "known_service" in patterns_matched or len(detected_terms) >= 2:
-        confidence = "medium"
-    elif patterns_matched:
-        confidence = "low"
+    elif "technical_term" in patterns_matched:
+        confidence = "high"  # Technical terms alone = high
+    elif "question_pattern" in patterns_matched and len(prompt) > 30:
+        confidence = "medium"  # Questions longer than 30 chars
+    elif len(prompt) > 50:
+        confidence = "low"  # Longer prompts default to low (still triggers)
     else:
         confidence = "none"
+    # AGGRESSIVE: Trigger on anything except "none"
+    detected = confidence != "none"
     return {
-        "detected": confidence in ["high", "medium"],
-        "terms": detected_terms[:10],  # Limit to 10 terms
+        "detected": detected,
+        "terms": detected_terms,
         "patterns_matched": patterns_matched,
         "confidence": confidence,
     }
@@ -165,11 +210,11 @@ def check_active_workflow() -> bool:
         state = json.loads(STATE_FILE.read_text())
         phases = state.get("phases", {})
-        # Check if any phase is in progress
         for phase_key, phase_data in phases.items():
             if isinstance(phase_data, dict):
                 status = phase_data.get("status", "")
-                if status in ["in_progress", "pending"]:
+                if status in ["in_progress", "pending", "complete"]:
+                    # If ANY phase has been touched, we're in a workflow
                     return True
         return False
@@ -177,50 +222,13 @@ def check_active_workflow() -> bool:
         return False
-def check_already_researched(terms: list) -> list:
-    """Check which terms have already been researched."""
-    if not STATE_FILE.exists():
-        return []
-    try:
-        state = json.loads(STATE_FILE.read_text())
-        research_queries = state.get("research_queries", [])
-        # Also check sources in phases
-        phases = state.get("phases", {})
-        all_sources = []
-        for phase_data in phases.values():
-            if isinstance(phase_data, dict):
-                sources = phase_data.get("sources", [])
-                all_sources.extend(sources)
-        # Combine all research text
-        all_research_text = " ".join(str(s) for s in all_sources)
-        all_research_text += " ".join(
-            str(q.get("query", "")) + " " + str(q.get("term", ""))
-            for q in research_queries
-            if isinstance(q, dict)
-        )
-        all_research_text = all_research_text.lower()
-        # Find which terms were already researched
-        already_researched = []
-        for term in terms:
-            if term.lower() in all_research_text:
-                already_researched.append(term)
-        return already_researched
-    except (json.JSONDecodeError, Exception):
-        return []
-def log_detection(prompt: str, detection: dict) -> None:
+def log_detection(prompt: str, detection: dict, injected: bool) -> None:
     """Log this detection for debugging/auditing."""
-    if not STATE_FILE.exists():
-        return
     try:
-        state = json.loads(STATE_FILE.read_text())
+        if STATE_FILE.exists():
+            state = json.loads(STATE_FILE.read_text())
+        else:
+            state = {"prompt_detections": []}
         if "prompt_detections" not in state:
             state["prompt_detections"] = []
@@ -229,11 +237,13 @@ def log_detection(prompt: str, detection: dict) -> None:
             "timestamp": datetime.now().isoformat(),
             "prompt_preview": prompt[:100] + "..." if len(prompt) > 100 else prompt,
             "detection": detection,
+            "injected": injected,
         })
-        # Keep only last 20 detections
-        state["prompt_detections"] = state["prompt_detections"][-20:]
+        # Keep only last 50 detections
+        state["prompt_detections"] = state["prompt_detections"][-50:]
+        STATE_FILE.parent.mkdir(parents=True, exist_ok=True)
         STATE_FILE.write_text(json.dumps(state, indent=2))
     except Exception:
         pass  # Don't fail the hook on logging errors
@@ -248,69 +258,69 @@ def main():
     try:
         input_data = json.load(sys.stdin)
     except json.JSONDecodeError:
-        # If we can't parse input, allow without injection
         sys.exit(0)
     prompt = input_data.get("prompt", "")
-    if not prompt:
+    if not prompt or len(prompt.strip()) < 5:
         sys.exit(0)
-    # Check if in active workflow mode (stricter enforcement)
+    # Check if in active workflow mode
     active_workflow = check_active_workflow()
-    # Detect external API questions
-    detection = detect_external_api_question(prompt)
-    # Log for debugging
-    if detection["detected"] or active_workflow:
-        log_detection(prompt, detection)
+    # Detect technical questions
+    detection = detect_technical_question(prompt)
-    # Determine if we should inject research requirement
-    should_inject = False
-    inject_reason = ""
+    # In active workflow, ALWAYS inject (even for low confidence)
+    if active_workflow and detection["confidence"] != "none":
+        detection["detected"] = True
-    if active_workflow:
-        # In active workflow, ALWAYS inject for technical questions
-        if detection["confidence"] in ["high", "medium", "low"]:
-            should_inject = True
-            inject_reason = "active_workflow"
-    elif detection["detected"]:
-        # Check if already researched
-        already_researched = check_already_researched(detection["terms"])
-        unresearched_terms = [t for t in detection["terms"] if t not in already_researched]
+    # Log all detections
+    log_detection(prompt, detection, detection["detected"])
-        if unresearched_terms:
-            should_inject = True
-            inject_reason = "unresearched_terms"
-            detection["unresearched"] = unresearched_terms
-    # Inject context if needed
-    if should_inject:
-        terms_str = ", ".join(detection.get("unresearched", detection["terms"])[:5])
+    # Inject context if detected
+    if detection["detected"]:
+        terms_str = ", ".join(detection["terms"][:5]) if detection["terms"] else "technical question"
+        confidence = detection["confidence"]
+        # Build the injection message
         injection = f"""
 <user-prompt-submit-hook>
-EXTERNAL API/SDK DETECTED: {terms_str}
-Confidence: {detection["confidence"]}
-{"Mode: Active API Development Workflow" if active_workflow else ""}
-MANDATORY RESEARCH REQUIREMENT:
-Before answering this question, you MUST:
-1. Use Context7 (mcp__context7__resolve-library-id + get-library-docs) to look up current documentation
-2. Use WebSearch to find official documentation and recent updates
-3. NEVER answer from training data alone - it may be outdated
-Training data can be months or years old. APIs change constantly.
-Research first. Then answer with verified, current information.
-After researching, cite your sources in your response.
+RESEARCH REQUIRED - {confidence.upper()} CONFIDENCE
+Detected: {terms_str}
+{"MODE: Active API Development Workflow - STRICT ENFORCEMENT" if active_workflow else ""}
+MANDATORY BEFORE ANSWERING:
+1. USE CONTEXT7 FIRST:
+   - Call mcp__context7__resolve-library-id to find the library
+   - Call mcp__context7__get-library-docs to get CURRENT documentation
+   - This gives you the ACTUAL source of truth
+2. USE WEBSEARCH (2-3 SEARCHES MINIMUM):
+   - Search for official documentation
+   - Search with different phrasings to get comprehensive coverage
+   - Search for recent updates, changes, or known issues
+   - Example searches:
+     * "[topic] official documentation"
+     * "[topic] API reference guide"
+     * "[topic] latest updates 2024 2025"
+3. NEVER TRUST TRAINING DATA:
+   - Training data can be months or years outdated
+   - APIs change constantly
+   - Features get added, deprecated, or modified
+   - Parameter names and types change
+4. CITE YOUR SOURCES:
+   - After researching, mention where the information came from
+   - Include links when available
+RESEARCH FIRST. ANSWER SECOND.
 </user-prompt-submit-hook>
 """
         print(injection)
-    # Always allow the prompt to proceed
     sys.exit(0)

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@hustle-together/api-dev-tools",
-  "version": "1.7.0",
+  "version": "1.7.1",
   "description": "Interview-driven API development workflow for Claude Code - Automates research, testing, and documentation",
   "main": "bin/cli.js",
   "bin": {