npm - entroplain - Versions diffs - 0.1.1 → 0.2.0 - Mend

entroplain 0.1.1 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (19) hide show

package/26.0.1 +0 -0
package/CONTRIBUTING.md +103 -103
package/README.md +209 -122
package/dist/entroplain-0.2.0-py3-none-any.whl +0 -0
package/dist/entroplain-0.2.0.tar.gz +0 -0
package/entroplain/__init__.py +30 -33
package/entroplain/cost_tracker.py +231 -0
package/entroplain/dashboard.py +368 -0
package/entroplain/monitor.py +178 -60
package/entroplain/proxy.py +92 -21
package/entroplain-proxy +0 -0
package/package.json +4 -2
package/paper.md +299 -0
package/pip +0 -0
package/pyproject.toml +96 -89
package/test_nvidia.py +56 -0
package/test_proxy.py +16 -0
package/dist/entroplain-0.1.1-py3-none-any.whl +0 -0
package/dist/entroplain-0.1.1.tar.gz +0 -0

package/entroplain/monitor.py CHANGED Viewed

@@ -1,11 +1,20 @@
 """
 Entropy Monitor — Core entropy tracking and early exit logic.
+Supports multiple exit strategies:
+- Valleys plateau: Exit when reasoning milestones stabilize
+- Entropy drop: Exit when model confidence is high
+- Velocity zero: Exit when entropy stops changing
+- Combined: Multiple conditions with AND/OR logic
+- Repetition: Exit when model starts repeating
+- Confidence: Exit when top token probability > threshold for N tokens
 """
 import math
 from typing import List, Tuple, Optional, Dict, Any, Callable
 from dataclasses import dataclass, field
 from enum import Enum
+from collections import Counter
 class ExitCondition(Enum):
@@ -13,6 +22,10 @@ class ExitCondition(Enum):
     ENTROPY_DROP = "entropy_drop"
     VELOCITY_ZERO = "velocity_zero"
     COMBINED = "combined"
+    # New strategies
+    REPETITION = "repetition"
+    CONFIDENCE = "confidence"
+    SEMANTIC = "semantic"
 @dataclass
@@ -23,6 +36,7 @@ class EntropyPoint:
     entropy: float
     is_valley: bool = False
     velocity: float = 0.0
+    confidence: float = 0.0  # Top token probability
 @dataclass
@@ -35,21 +49,25 @@ class MonitorConfig:
     valley_window: int = 5
     plateau_threshold: int = 3
     exit_condition: ExitCondition = ExitCondition.COMBINED
+    # New config options
+    repetition_window: int = 20  # Window to check for repetition
+    repetition_threshold: float = 0.3  # 30% repetition = exit
+    confidence_threshold: float = 0.95  # 95% confidence = exit
+    confidence_min_tokens: int = 5  # Min tokens at high confidence
 class EntropyMonitor:
     """
     Monitor entropy trajectory and detect reasoning convergence.
     Usage:
         monitor = EntropyMonitor()
         for token, entropy in stream:
             monitor.track(token, entropy)
             if monitor.should_exit():
                 break
     """
     def __init__(
         self,
         entropy_threshold: float = 0.15,
@@ -58,7 +76,12 @@ class EntropyMonitor:
         min_tokens: int = 50,
         valley_window: int = 5,
         plateau_threshold: int = 3,
-        exit_condition: str = "combined"
+        exit_condition: str = "combined",
+        # New parameters
+        repetition_window: int = 20,
+        repetition_threshold: float = 0.3,
+        confidence_threshold: float = 0.95,
+        confidence_min_tokens: int = 5,
     ):
         self.config = MonitorConfig(
             entropy_threshold=entropy_threshold,
@@ -67,60 +90,66 @@ class EntropyMonitor:
             min_tokens=min_tokens,
             valley_window=valley_window,
             plateau_threshold=plateau_threshold,
-            exit_condition=ExitCondition(exit_condition)
+            exit_condition=ExitCondition(exit_condition),
+            repetition_window=repetition_window,
+            repetition_threshold=repetition_threshold,
+            confidence_threshold=confidence_threshold,
+            confidence_min_tokens=confidence_min_tokens,
         )
         self._trajectory: List[EntropyPoint] = []
         self._valleys: List[EntropyPoint] = []
         self._index = 0
+        self._high_confidence_count = 0  # Track consecutive high confidence
     def calculate_entropy(self, logprobs: List[float], from_probs: bool = False) -> float:
         """
         Calculate Shannon entropy from log probabilities or probabilities.
         Zero-probability entries contribute nothing (p * log2(p) tends to 0
         as p tends to 0), so no epsilon is added inside the logarithm. This
         keeps the result exact and never negative: a certain outcome (p = 1)
         yields exactly 0.0.
         Args:
             logprobs: List of log probabilities (natural log) or probabilities
             from_probs: If True, treat input as probabilities (used as-is)
         Returns:
             Shannon entropy in bits (0.0 for empty input)
         """
         if not logprobs:
             return 0.0
         probs = logprobs if from_probs else [math.exp(lp) for lp in logprobs]
         entropy = 0.0
         for prob in probs:
             # Skipping non-positive values also keeps log2 inside its domain.
             if prob > 0:
                 entropy -= prob * math.log2(prob)
         return entropy
-    def track(self, token: str, entropy: float) -> EntropyPoint:
+    def track(self, token: str, entropy: float, confidence: float = 0.0) -> EntropyPoint:
         """
         Track a token and its entropy value.
         Args:
             token: The generated token
             entropy: Calculated entropy for this token
+            confidence: Top token probability (optional, for confidence strategy)
         Returns:
             EntropyPoint with valley detection
         """
         point = EntropyPoint(
             index=self._index,
             token=token,
-            entropy=entropy
+            entropy=entropy,
+            confidence=confidence
         )
         # Calculate velocity
         if len(self._trajectory) > 0:
             prev = self._trajectory[-1]
             point.velocity = abs(entropy - prev.entropy)
         # Detect valley (local minimum)
         if len(self._trajectory) >= 2:
             prev2 = self._trajectory[-2]
@@ -128,117 +157,174 @@ class EntropyMonitor:
             if prev1.entropy < prev2.entropy and prev1.entropy < entropy:
                 prev1.is_valley = True
                 self._valleys.append(prev1)
         self._trajectory.append(point)
         self._index += 1
+        # Track high confidence
+        if confidence >= self.config.confidence_threshold:
+            self._high_confidence_count += 1
+        else:
+            self._high_confidence_count = 0
         return point
     def get_valleys(self) -> List[Tuple[int, float]]:
         """Return every detected entropy valley (local minimum) as an (index, entropy) pair."""
         pairs: List[Tuple[int, float]] = []
         for valley in self._valleys:
             pairs.append((valley.index, valley.entropy))
         return pairs
     def get_velocity(self) -> float:
         """Return the velocity stored on the latest tracked point, or 0.0 with fewer than two points."""
         has_history = len(self._trajectory) >= 2
         return self._trajectory[-1].velocity if has_history else 0.0
     def get_mean_entropy(self) -> float:
         """Return the arithmetic mean of all tracked entropies (0.0 when nothing is tracked)."""
         count = len(self._trajectory)
         if count == 0:
             return 0.0
         total = sum(point.entropy for point in self._trajectory)
         return total / count
     def get_valley_count(self) -> int:
         """Return how many valleys have been detected so far."""
         valley_total = len(self._valleys)
         return valley_total
     def is_valleys_plateau(self) -> bool:
         """
         Check if the most recent valleys are evenly spaced.
         Takes the last ``plateau_threshold`` valleys and computes the
         population variance of the index gaps between consecutive ones.
         Returns:
             True if that variance is below 10. False if fewer than
             ``min_valleys`` or ``plateau_threshold`` valleys exist, or if
             there is no gap to measure.
         """
         if len(self._valleys) < self.config.min_valleys:
             return False
         # Check if last N valleys have similar spacing
         recent = self._valleys[-self.config.plateau_threshold:]
         if len(recent) < self.config.plateau_threshold:
             return False
         # Calculate spacing between recent valleys
-        spacings = [recent[i+1].index - recent[i].index for i in range(len(recent)-1)]
+        spacings = [
+            recent[i + 1].index - recent[i].index
+            for i in range(len(recent) - 1)
+        ]
         # A single recent valley produces no gaps, so nothing can be compared
         if not spacings:
             return False
         mean_spacing = sum(spacings) / len(spacings)
-        variance = sum((s - mean_spacing)**2 for s in spacings) / len(spacings)
+        variance = sum((s - mean_spacing) ** 2 for s in spacings) / len(spacings)
         # Low variance in spacing = plateau
         return variance < 10  # Threshold tuned empirically
     def is_entropy_low(self) -> bool:
         """Report whether the latest entropy is strictly below ``entropy_threshold`` (False when nothing is tracked)."""
         if self._trajectory:
             latest = self._trajectory[-1]
             return latest.entropy < self.config.entropy_threshold
         return False
     def is_velocity_stable(self) -> bool:
         """Report whether the current velocity is strictly below ``velocity_threshold``."""
         current = self.get_velocity()
         limit = self.config.velocity_threshold
         return current < limit
+    def is_repeating(self) -> bool:
+        """
+        Check if the model is repeating itself.
+        The repetition ratio is the share of duplicate tokens among the
+        last ``repetition_window`` tracked tokens (1 - unique / total).
+        Returns:
+            True if that ratio is at or above ``repetition_threshold``.
+            False while fewer than ``repetition_window`` tokens have been
+            tracked, or when the window is not positive.
+        """
+        window = self.config.repetition_window
+        # A non-positive window is a misconfiguration: ``[-0:]`` would select
+        # the whole trajectory, and an empty selection would divide by zero.
+        if window <= 0 or len(self._trajectory) < window:
+            return False
+        recent_tokens = [p.token for p in self._trajectory[-window:]]
+        # Only the number of distinct tokens matters, so a set is enough.
+        unique_count = len(set(recent_tokens))
+        repetition_ratio = 1.0 - (unique_count / len(recent_tokens))
+        return repetition_ratio >= self.config.repetition_threshold
+    def is_confident(self) -> bool:
+        """
+        Report whether the current streak of high-confidence tokens is long enough.
+        Returns True once the consecutive high-confidence count reaches
+        ``confidence_min_tokens``.
+        """
+        required_streak = self.config.confidence_min_tokens
+        return self._high_confidence_count >= required_streak
     def should_exit(self) -> bool:
         """
         Determine if reasoning has converged and we should exit.
         Uses the configured exit condition:
         - valleys_plateau: Exit when valley count plateaus
         - entropy_drop: Exit when entropy drops below threshold
         - velocity_zero: Exit when velocity stabilizes
         - combined: (entropy low OR valleys plateau) AND velocity stable
+        - repetition: Exit when model starts repeating
+        - confidence: Exit when confidence is high for N tokens
+        - semantic: Placeholder, currently never exits
         """
         # Always require minimum tokens
         if len(self._trajectory) < self.config.min_tokens:
             return False
-        # Always require minimum valleys
+        # Repetition and confidence are decided before the minimum-valleys check
+        condition = self.config.exit_condition
+        if condition == ExitCondition.REPETITION:
+            # Repetition doesn't require valleys
+            return self.is_repeating()
+        if condition == ExitCondition.CONFIDENCE:
+            # Confidence doesn't require valleys
+            return self.is_confident()
+        # For other strategies, require minimum valleys
         if len(self._valleys) < self.config.min_valleys:
             return False
-        condition = self.config.exit_condition
         if condition == ExitCondition.VALLEYS_PLATEAU:
             return self.is_valleys_plateau()
         if condition == ExitCondition.ENTROPY_DROP:
             return self.is_entropy_low()
         if condition == ExitCondition.VELOCITY_ZERO:
             return self.is_velocity_stable()
         if condition == ExitCondition.COMBINED:
             # Combined: require entropy low OR valleys plateau, AND velocity stable
             return (self.is_entropy_low() or self.is_valleys_plateau()) and self.is_velocity_stable()
+        if condition == ExitCondition.SEMANTIC:
+            # Placeholder for future semantic convergence detection
+            # Would use embeddings to detect when output stabilizes semantically
+            return False
         return False
     def is_converged(self) -> bool:
         """Return the same verdict as should_exit(); kept as an alternative name."""
         converged = self.should_exit()
         return converged
     def get_trajectory(self) -> List[float]:
         """Return the entropy of every tracked point, in tracking order."""
         entropies: List[float] = []
         for point in self._trajectory:
             entropies.append(point.entropy)
         return entropies
     def get_tokens(self) -> List[str]:
         """Return the token of every tracked point, in tracking order."""
         tokens: List[str] = []
         for point in self._trajectory:
             tokens.append(point.token)
         return tokens
     def get_stats(self) -> Dict[str, Any]:
         """Get summary statistics."""
         if not self._trajectory:
             return {}
         entropies = [p.entropy for p in self._trajectory]
         return {
             "token_count": len(self._trajectory),
             "valley_count": len(self._valleys),
@@ -247,26 +333,58 @@ class EntropyMonitor:
             "max_entropy": max(entropies),
             "current_entropy": entropies[-1],
             "current_velocity": self.get_velocity(),
-            "is_converged": self.should_exit()
+            "is_converged": self.should_exit(),
+            "exit_reason": self._get_exit_reason(),
         }
+    def _get_exit_reason(self) -> Optional[str]:
+        """
+        Describe why the monitor would exit early.
+        Returns:
+            None when should_exit() is False; otherwise a short label for
+            the configured exit condition. For the combined strategy the
+            label names the sub-condition that holds together with stable
+            velocity, falling back to "combined".
+        """
+        if not self.should_exit():
+            return None
+        condition = self.config.exit_condition
+        # Strategies with exactly one possible label
+        single_reason = {
+            ExitCondition.REPETITION: "repetition_detected",
+            ExitCondition.CONFIDENCE: "high_confidence",
+            ExitCondition.ENTROPY_DROP: "entropy_below_threshold",
+            ExitCondition.VELOCITY_ZERO: "velocity_stable",
+            ExitCondition.VALLEYS_PLATEAU: "valleys_plateau",
+        }
+        if condition in single_reason:
+            return single_reason[condition]
+        if condition != ExitCondition.COMBINED:
+            return "unknown"
+        velocity_stable = self.is_velocity_stable()
+        if velocity_stable and self.is_entropy_low():
+            return "entropy_low_velocity_stable"
+        if velocity_stable and self.is_valleys_plateau():
+            return "valleys_plateau_velocity_stable"
+        return "combined"
     def reset(self) -> None:
         """Clear the trajectory and valleys and zero the token index and high-confidence streak."""
         # Lists are emptied in place; self.config is left untouched
         self._trajectory.clear()
         self._valleys.clear()
         self._index = 0
+        self._high_confidence_count = 0
-def calculate_entropy(logprobs: List[float], from_probs: bool = False) -> float:
+# Convenience function for one-shot entropy calculation
+def calculate_entropy_from_logprobs(logprobs: List[float]) -> float:
     """
-    Standalone function to calculate Shannon entropy.
+    Calculate Shannon entropy from log probabilities.
     Args:
-        logprobs: List of log probabilities or probabilities
-        from_probs: If True, treat input as probabilities
+        logprobs: List of log probabilities (natural log)
     Returns:
         Shannon entropy in bits
     """
-    monitor = EntropyMonitor()
-    return monitor.calculate_entropy(logprobs, from_probs)
+    entropy = 0.0
+    for lp in logprobs:
+        prob = math.exp(lp)
+        if prob > 0:
+            entropy -= prob * math.log2(prob + 1e-10)
+    return entropy

package/entroplain/proxy.py CHANGED Viewed

@@ -23,6 +23,7 @@ from fastapi.responses import StreamingResponse
 import uvicorn
 from .monitor import EntropyMonitor
+from .cost_tracker import CostTracker, format_cost_report
 logger = logging.getLogger(__name__)
@@ -33,12 +34,14 @@ class ProxyConfig:
     port: int = 8765
     provider: str = "openai"  # openai, anthropic, nvidia
     api_base: str = "https://api.openai.com/v1"
+    model: str = "default"  # For cost tracking
     entropy_threshold: float = 0.15
     min_valleys: int = 2
     min_tokens: int = 50
     velocity_threshold: float = 0.05
     enable_early_exit: bool = True
     log_entropy: bool = True
+    track_cost: bool = True
 class EntropyProxy:
@@ -57,6 +60,7 @@ class EntropyProxy:
             min_tokens=config.min_tokens,
             velocity_threshold=config.velocity_threshold
         )
+        self.cost_tracker = CostTracker(model=config.model) if config.track_cost else None
         self.app = FastAPI(title="Entroplain Proxy")
         self._setup_routes()
@@ -67,17 +71,32 @@ class EntropyProxy:
         @self.app.get("/health")
         async def health():
-            return {"status": "ok", "monitor": self.monitor.get_stats()}
+            stats = self.monitor.get_stats()
+            if self.cost_tracker and self.cost_tracker.output_tokens > 0:
+                stats["cost"] = self.cost_tracker.get_stats()
+            return {"status": "ok", "monitor": stats}
         @self.app.post("/reset")
         async def reset():
             self.monitor.reset()
+            if self.cost_tracker:
+                self.cost_tracker.reset()
             return {"status": "reset"}
     async def _handle_chat(self, request: Request):
         """Handle chat completion requests with entropy monitoring."""
         body = await request.json()
+        # Extract model for cost tracking
+        model = body.get("model", "default")
+        if self.cost_tracker:
+            self.cost_tracker = CostTracker(model=model)
+        # Estimate input tokens
+        input_tokens = self._estimate_tokens(body.get("messages", []))
+        if self.cost_tracker:
+            self.cost_tracker.track_input(input_tokens)
         # Ensure logprobs are enabled for entropy calculation
         if "logprobs" not in body:
             body["logprobs"] = True
@@ -113,6 +132,20 @@ class EntropyProxy:
             media_type="text/event-stream"
         )
+    def _estimate_tokens(self, messages: list) -> int:
+        """
+        Rough estimate of input tokens from chat messages.
+        Applies a ~4 characters per token heuristic to string content and to
+        the ``text`` of ``{"type": "text"}`` parts in list content.
+        Malformed entries (non-dict messages or parts, missing or non-string
+        text) are skipped instead of raising, because the messages are taken
+        directly from the parsed request body.
+        Args:
+            messages: Chat messages from the request body (may be empty or None)
+        Returns:
+            Estimated token count, never less than 10
+        """
+        total = 0
+        for msg in messages or []:
+            if not isinstance(msg, dict):
+                continue
+            content = msg.get("content", "")
+            if isinstance(content, str):
+                # Rough estimate: ~4 chars per token
+                total += len(content) // 4
+            elif isinstance(content, list):
+                for part in content:
+                    if not isinstance(part, dict) or part.get("type") != "text":
+                        continue
+                    text = part.get("text", "")
+                    # ``"text": null`` would otherwise crash len()
+                    if isinstance(text, str):
+                        total += len(text) // 4
+        return max(total, 10)  # Minimum 10 tokens
     async def _stream_with_entropy(
         self, response: httpx.Response
     ) -> AsyncIterator[str]:
@@ -144,17 +177,29 @@ class EntropyProxy:
                 if choice.get("delta", {}).get("content"):
                     token = choice["delta"]["content"]
                     full_content += token
+                    # Track output token for cost
+                    if self.cost_tracker:
+                        self.cost_tracker.track_output(1)
-                # Calculate entropy from logprobs
-                if choice.get("logprobs", {}).get("content"):
-                    logprobs_data = choice["logprobs"]["content"]
+                # Calculate entropy from logprobs (handle null)
+                logprobs = choice.get("logprobs")
+                if logprobs and logprobs.get("content"):
+                    logprobs_data = logprobs["content"]
                     if logprobs_data:
                         entropy = self._calculate_entropy(logprobs_data[0])
-                        self.monitor.track(token, entropy)
+                        # Get confidence (top token probability)
+                        confidence = 0.0
+                        if logprobs_data[0].get("top_logprobs"):
+                            confidence = math.exp(logprobs_data[0]["top_logprobs"][0]["logprob"])
+                        self.monitor.track(token, entropy, confidence)
                         if self.config.log_entropy:
                             logger.info(
                                 f"Token: {repr(token)}, Entropy: {entropy:.4f}, "
+                                f"Confidence: {confidence:.2%}, "
                                 f"Valleys: {len(self.monitor.get_valleys())}"
                             )
@@ -163,11 +208,23 @@ class EntropyProxy:
                             self.config.enable_early_exit
                             and self.monitor.should_exit()
                         ):
+                            exit_reason = self.monitor._get_exit_reason()
                             logger.info(
                                 f"Early exit triggered! "
+                                f"Reason: {exit_reason}, "
                                 f"Tokens: {len(full_content)}, "
                                 f"Valleys: {len(self.monitor.get_valleys())}"
                             )
+                            # Log cost savings
+                            if self.cost_tracker:
+                                # Estimate what full output would have been
+                                # Typically 2-3x for reasoning tasks
+                                estimated_full = len(full_content) * 2.5
+                                self.cost_tracker.set_full_estimate(int(estimated_full))
+                                estimate = self.cost_tracker.get_estimate()
+                                logger.info(f"Cost savings: ${estimate.cost_saved_usd:.4f} ({estimate.savings_percent:.1f}%)")
                             exited_early = True
                             yield "data: [DONE]\n\n"
                             break
@@ -204,6 +261,7 @@ class EntropyProxy:
 def main():
     """CLI entry point for running the proxy."""
     import argparse
+    import math  # Needed for entropy calculation
     parser = argparse.ArgumentParser(description="Entropy Monitoring Proxy")
     parser.add_argument("--port", type=int, default=8765, help="Proxy port")
@@ -218,6 +276,11 @@ def main():
         default="https://api.openai.com/v1",
         help="API base URL"
     )
+    parser.add_argument(
+        "--model",
+        default="default",
+        help="Model name for cost tracking"
+    )
     parser.add_argument(
         "--entropy-threshold",
         type=float,
@@ -240,6 +303,11 @@ def main():
         action="store_true",
         help="Log entropy values to console"
     )
+    parser.add_argument(
+        "--no-cost-tracking",
+        action="store_true",
+        help="Disable cost tracking"
+    )
     args = parser.parse_args()
@@ -247,29 +315,32 @@ def main():
         port=args.port,
         provider=args.provider,
         api_base=args.api_base,
+        model=args.model,
         entropy_threshold=args.entropy_threshold,
         min_valleys=args.min_valleys,
         enable_early_exit=not args.no_early_exit,
-        log_entropy=args.log_entropy
+        log_entropy=args.log_entropy,
+        track_cost=not args.no_cost_tracking
     )
     proxy = EntropyProxy(config)
-    print(f"""
-╔═══════════════════════════════════════════════════════════╗
-║           ENTROPPLAIN ENTROPY MONITORING PROXY            ║
-╠═══════════════════════════════════════════════════════════╣
-║  Proxy running on: http://localhost:{args.port}                ║
-║  Provider: {args.provider:<10}                                ║
-║  API Base: {args.api_base:<30}     ║
-║  Early Exit: {'DISABLED' if args.no_early_exit else 'ENABLED'}                               ║
-╠═══════════════════════════════════════════════════════════╣
-║  Set your agent's API endpoint to:                        ║
-║    export OPENAI_BASE_URL=http://localhost:{args.port}          ║
-║    # or for NVIDIA:                                        ║
-║    export NVIDIA_BASE_URL=http://localhost:{args.port}         ║
-╚═══════════════════════════════════════════════════════════╝
-    """)
+    # Clean banner with fixed formatting
+    print("\n" + "="*62)
+    print("  ENTROPPLAIN ENTROPY MONITORING PROXY")
+    print("="*62)
+    print(f"  Proxy:      http://localhost:{args.port}")
+    print(f"  Provider:   {args.provider}")
+    print(f"  API Base:   {args.api_base}")
+    print(f"  Model:      {args.model}")
+    print(f"  Early Exit: {'ENABLED' if not args.no_early_exit else 'DISABLED'}")
+    print(f"  Cost Track: {'DISABLED' if args.no_cost_tracking else 'ENABLED'}")
+    print("="*62)
+    print("  Usage:")
+    print(f"    export OPENAI_BASE_URL=http://localhost:{args.port}")
+    print("    # or for NVIDIA:")
+    print(f"    export NVIDIA_BASE_URL=http://localhost:{args.port}")
+    print("="*62 + "\n")
     proxy.run()

package/entroplain-proxy ADDED Viewed

File without changes

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "entroplain",
-  "version": "0.1.1",
+  "version": "0.2.0",
   "description": "Entropy-based early exit for efficient agent reasoning",
   "main": "dist/index.js",
   "types": "dist/index.d.ts",
@@ -16,7 +16,9 @@
     "entropy",
     "early-exit",
     "reasoning",
-    "efficiency"
+    "efficiency",
+    "cost-tracking",
+    "dashboard"
   ],
   "author": "Entroplain Contributors",
   "license": "MIT",