PyPI - entropic-engine - Versions diffs - 1.0.0__tar.gz - Mend

entropic-engine 1.0.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (120) hide show

entropic_engine-1.0.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,220 @@
+Metadata-Version: 2.4
+Name: entropic-engine
+Version: 1.0.0
+Summary: Local-first agentic inference engine with tier-based model routing
+Author: Tristan VanFossen
+License: Apache-2.0
+Keywords: ai,coding,assistant,llm,local
+Classifier: Development Status :: 3 - Alpha
+Classifier: Environment :: Console
+Classifier: Intended Audience :: Developers
+Classifier: License :: OSI Approved :: Apache Software License
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Topic :: Software Development
+Requires-Python: >=3.11
+Description-Content-Type: text/markdown
+Requires-Dist: llama-cpp-python>=0.2.0
+Requires-Dist: mcp>=1.0.0
+Requires-Dist: pydantic>=2.0.0
+Requires-Dist: pydantic-settings>=2.0.0
+Requires-Dist: pyyaml>=6.0.0
+Provides-Extra: tui
+Requires-Dist: textual>=0.47.0; extra == "tui"
+Requires-Dist: rich>=13.0.0; extra == "tui"
+Requires-Dist: click>=8.0.0; extra == "tui"
+Requires-Dist: pylspclient>=0.0.7; extra == "tui"
+Provides-Extra: app
+Requires-Dist: entropic-engine[tui]; extra == "app"
+Requires-Dist: aiosqlite>=0.19.0; extra == "app"
+Requires-Dist: httpx>=0.25.0; extra == "app"
+Provides-Extra: all
+Requires-Dist: entropic-engine[app,voice]; extra == "all"
+Provides-Extra: dev
+Requires-Dist: pytest>=7.0.0; extra == "dev"
+Requires-Dist: pytest-asyncio>=0.21.0; extra == "dev"
+Requires-Dist: pytest-bdd>=7.0.0; extra == "dev"
+Requires-Dist: pytest-cov>=4.0.0; extra == "dev"
+Requires-Dist: mypy>=1.0.0; extra == "dev"
+Requires-Dist: black>=23.0.0; extra == "dev"
+Requires-Dist: ruff>=0.1.0; extra == "dev"
+Requires-Dist: pre-commit>=3.0.0; extra == "dev"
+Requires-Dist: types-pyyaml>=6.0.0; extra == "dev"
+Provides-Extra: voice
+Requires-Dist: numpy<2.2,>=1.26; extra == "voice"
+Requires-Dist: safetensors<0.5,>=0.4.0; extra == "voice"
+Requires-Dist: huggingface-hub<0.28,>=0.24; extra == "voice"
+Requires-Dist: einops==0.7; extra == "voice"
+Requires-Dist: sentencepiece==0.2; extra == "voice"
+Requires-Dist: sounddevice==0.5; extra == "voice"
+Requires-Dist: sphn<0.2,>=0.1.4; extra == "voice"
+Requires-Dist: torch>=2.2.0; extra == "voice"
+Requires-Dist: aiohttp<3.12,>=3.10.5; extra == "voice"
+Requires-Dist: websockets<14.0,>=12.0; extra == "voice"
+Requires-Dist: accelerate>=0.30.0; extra == "voice"
+Requires-Dist: torchao>=0.4.0; extra == "voice"
+# Entropic
+> Local-first agentic inference engine with tier-based model routing
+This started as "I want to build a local-first Claude Code" — which turned out
+to be quite the undertaking. The initial build was a tightly coupled TUI, but it
+became clear pretty quickly that I was duplicating the same core inference engine
+across other local projects wrapping llama-cpp-python. So it evolved into a
+library: the inference engine, model orchestration, agentic loop, and tool
+framework are all importable and reusable without dragging in a UI. The TUI ships
+alongside it as one consumer, and doubles as a testbed for new ideas. There's also
+a very broken voice interface via PersonaPlex that I'll get to eventually.
+The name is a nod to how this actually works. Every handoff — human intent to
+prompt, prompt to model, model to model across tiers — is a lossy translation.
+Information decays at each boundary. That's the entropic process this engine tries
+to manage: structured routing, context management, and tool-augmented reasoning to
+lose as little as possible along the way. A bit of a nihilistic naming convention,
+but the tier routing and model management do earn their keep in practice. There's
+optimization work ahead, but the foundation is solid and I'm always open to new
+directions.
+## Architecture
+Entropic is a **library first, application second**. The inference engine
+(orchestrator, agentic loop, adapters, tool providers) is fully separable from
+any UI. The bundled TUI is one consumer; headless automation, CI/CD agents, and
+custom applications are equally supported.
+```
+pip install entropic-engine          # Core library (inference, engine, tools)
+pip install entropic-engine[app]     # TUI application (includes tui + storage deps)
+pip install entropic-engine[voice]   # Voice interface (PersonaPlex)
+pip install entropic-engine[all]     # Everything
+```
+```
++-----------------------------------------------------+
+|  Application Layer (TUI / Headless / Custom)        |
++-----------------------------------------------------+
+|  Engine          |  Orchestrator    |  Tools         |
+|  - Agentic loop  |  - Tier routing  |  - Filesystem  |
+|  - Directives    |  - Model swap    |  - Bash        |
+|  - Compaction    |  - VRAM mgmt     |  - Diagnostics |
+|  - Context mgmt  |  - Adapters      |  - Git / Todo  |
++-----------------------------------------------------+
+|  Inference Backend (llama-cpp-python)                |
+|  - GGUF models, single-GPU, in-process              |
++-----------------------------------------------------+
+```
+### Tier-Based Routing
+A lightweight router model classifies each prompt and routes to the appropriate
+tier. Only one main model is loaded at a time (VRAM constraint) — the
+orchestrator handles dynamic swapping with lock-protected state transitions.
+| Tier | Purpose | Typical Model |
+|------|---------|---------------|
+| **Thinking** | Complex reasoning, architecture, multi-step analysis | Qwen3-14B Q4_K_M |
+| **Normal** | General conversation and tasks | Falcon-H1R-7B Q8_0 |
+| **Code** | Code generation, editing, refactoring | Falcon-H1R-7B Q8_0 |
+| **Simple** | Greetings, acknowledgments, short responses | (shares normal model) |
+| **Router** | Prompt classification only | Qwen3-0.6B Q8_0 |
+### Agentic Loop
+The engine runs an autonomous tool-calling loop: generate -> parse tool calls ->
+execute tools -> feed results back -> generate again. The loop continues until
+the model produces a complete response or hits the iteration limit.
+Tools communicate back to the engine via **directives** — structured signals
+embedded in tool results that can trigger tier handoffs, context anchoring, and
+state management without the model needing to orchestrate these concerns.
+## Features
+- **Fully Local** — All inference on your hardware via llama-cpp-python. No API keys.
+- **Library API** — Embed the engine in your own application with `LibraryConfig`
+- **Intelligent Routing** — Sub-second prompt classification routes to the right model tier
+- **Single-GPU Orchestration** — Dynamic model swapping with VRAM-aware loading
+- **Per-Model Adapters** — Model-specific chat templates, tool parsing, thinking block handling
+- **Auto-Compaction** — Context summarization for long conversations
+- **MCP Tools** — Filesystem, bash, diagnostics, git, and extensible tool servers
+- **Headless Mode** — Full engine without TUI for automation and testing
+- **TUI** — Terminal interface built on Textual with streaming, tool approval, voice input
+## Requirements
+- Linux (tested on Ubuntu 24.04)
+- NVIDIA GPU with 16GB+ VRAM
+- CUDA 12.4+
+- Python 3.11+
+## Quick Start
+```bash
+git clone https://github.com/tvanfossen/entropic.git
+cd entropic
+./install.sh app
+```
+The install script creates a virtual environment, detects CUDA, and installs
+with the `[app]` extras (TUI + storage dependencies).
+```bash
+# Place GGUF models in ~/models/gguf/ (or configure paths in .entropic/config.local.yaml)
+# Run interactive TUI
+.venv/bin/entropic
+# Or headless
+.venv/bin/entropic --headless
+```
+## CLI
+```bash
+entropic                    # Interactive TUI
+entropic --headless         # Headless mode (automation/testing)
+entropic status             # Show model and system status
+entropic ask "question"     # Single-shot question
+entropic init               # Initialize .entropic/ in current directory
+entropic download <model>   # Download model files
+```
+## Configuration
+Configuration sources are applied in the order below, from lowest to highest
+priority (later sources override earlier ones):
+1. Built-in defaults
+2. Global config (`~/.entropic/config.yaml`)
+3. Project config (`.entropic/config.local.yaml`)
+4. CLI arguments
+Project context is provided via `.entropic/ENTROPIC.md` — a markdown file
+describing the project that gets included in the system prompt.
+## Library Usage
+```python
+from pathlib import Path
+from entropic import AgentEngine, LibraryConfig, ModelOrchestrator, ServerManager
+config = LibraryConfig(
+    config_dir=Path("~/.myapp").expanduser(),
+    tiers={"normal": {"path": "model.gguf", "adapter": "qwen3"}},
+)
+orchestrator = ModelOrchestrator(config.to_app_config())
+await orchestrator.initialize()
+server_manager = ServerManager(config.to_app_config())
+await server_manager.initialize()
+engine = AgentEngine(orchestrator=orchestrator, server_manager=server_manager)
+async for message in engine.run("Hello"):
+    print(message.content)
+```
+See `examples/hello-world/` and `examples/pychess/` for complete integrations.
+## License
+Apache-2.0

entropic_engine-1.0.0/README.md ADDED Viewed

@@ -0,0 +1,164 @@
+# Entropic
+> Local-first agentic inference engine with tier-based model routing
+This started as "I want to build a local-first Claude Code" — which turned out
+to be quite the undertaking. The initial build was a tightly coupled TUI, but it
+became clear pretty quickly that I was duplicating the same core inference engine
+across other local projects wrapping llama-cpp-python. So it evolved into a
+library: the inference engine, model orchestration, agentic loop, and tool
+framework are all importable and reusable without dragging in a UI. The TUI ships
+alongside it as one consumer, and doubles as a testbed for new ideas. There's also
+a very broken voice interface via PersonaPlex that I'll get to eventually.
+The name is a nod to how this actually works. Every handoff — human intent to
+prompt, prompt to model, model to model across tiers — is a lossy translation.
+Information decays at each boundary. That's the entropic process this engine tries
+to manage: structured routing, context management, and tool-augmented reasoning to
+lose as little as possible along the way. A bit of a nihilistic naming convention,
+but the tier routing and model management do earn their keep in practice. There's
+optimization work ahead, but the foundation is solid and I'm always open to new
+directions.
+## Architecture
+Entropic is a **library first, application second**. The inference engine
+(orchestrator, agentic loop, adapters, tool providers) is fully separable from
+any UI. The bundled TUI is one consumer; headless automation, CI/CD agents, and
+custom applications are equally supported.
+```
+pip install entropic-engine          # Core library (inference, engine, tools)
+pip install entropic-engine[app]     # TUI application (includes tui + storage deps)
+pip install entropic-engine[voice]   # Voice interface (PersonaPlex)
+pip install entropic-engine[all]     # Everything
+```
+```
++-----------------------------------------------------+
+|  Application Layer (TUI / Headless / Custom)        |
++-----------------------------------------------------+
+|  Engine          |  Orchestrator    |  Tools         |
+|  - Agentic loop  |  - Tier routing  |  - Filesystem  |
+|  - Directives    |  - Model swap    |  - Bash        |
+|  - Compaction    |  - VRAM mgmt     |  - Diagnostics |
+|  - Context mgmt  |  - Adapters      |  - Git / Todo  |
++-----------------------------------------------------+
+|  Inference Backend (llama-cpp-python)                |
+|  - GGUF models, single-GPU, in-process              |
++-----------------------------------------------------+
+```
+### Tier-Based Routing
+A lightweight router model classifies each prompt and routes to the appropriate
+tier. Only one main model is loaded at a time (VRAM constraint) — the
+orchestrator handles dynamic swapping with lock-protected state transitions.
+| Tier | Purpose | Typical Model |
+|------|---------|---------------|
+| **Thinking** | Complex reasoning, architecture, multi-step analysis | Qwen3-14B Q4_K_M |
+| **Normal** | General conversation and tasks | Falcon-H1R-7B Q8_0 |
+| **Code** | Code generation, editing, refactoring | Falcon-H1R-7B Q8_0 |
+| **Simple** | Greetings, acknowledgments, short responses | (shares normal model) |
+| **Router** | Prompt classification only | Qwen3-0.6B Q8_0 |
+### Agentic Loop
+The engine runs an autonomous tool-calling loop: generate -> parse tool calls ->
+execute tools -> feed results back -> generate again. The loop continues until
+the model produces a complete response or hits the iteration limit.
+Tools communicate back to the engine via **directives** — structured signals
+embedded in tool results that can trigger tier handoffs, context anchoring, and
+state management without the model needing to orchestrate these concerns.
+## Features
+- **Fully Local** — All inference on your hardware via llama-cpp-python. No API keys.
+- **Library API** — Embed the engine in your own application with `LibraryConfig`
+- **Intelligent Routing** — Sub-second prompt classification routes to the right model tier
+- **Single-GPU Orchestration** — Dynamic model swapping with VRAM-aware loading
+- **Per-Model Adapters** — Model-specific chat templates, tool parsing, thinking block handling
+- **Auto-Compaction** — Context summarization for long conversations
+- **MCP Tools** — Filesystem, bash, diagnostics, git, and extensible tool servers
+- **Headless Mode** — Full engine without TUI for automation and testing
+- **TUI** — Terminal interface built on Textual with streaming, tool approval, voice input
+## Requirements
+- Linux (tested on Ubuntu 24.04)
+- NVIDIA GPU with 16GB+ VRAM
+- CUDA 12.4+
+- Python 3.11+
+## Quick Start
+```bash
+git clone https://github.com/tvanfossen/entropic.git
+cd entropic
+./install.sh app
+```
+The install script creates a virtual environment, detects CUDA, and installs
+with the `[app]` extras (TUI + storage dependencies).
+```bash
+# Place GGUF models in ~/models/gguf/ (or configure paths in .entropic/config.local.yaml)
+# Run interactive TUI
+.venv/bin/entropic
+# Or headless
+.venv/bin/entropic --headless
+```
+## CLI
+```bash
+entropic                    # Interactive TUI
+entropic --headless         # Headless mode (automation/testing)
+entropic status             # Show model and system status
+entropic ask "question"     # Single-shot question
+entropic init               # Initialize .entropic/ in current directory
+entropic download <model>   # Download model files
+```
+## Configuration
+Configuration sources are applied in the order below, from lowest to highest
+priority (later sources override earlier ones):
+1. Built-in defaults
+2. Global config (`~/.entropic/config.yaml`)
+3. Project config (`.entropic/config.local.yaml`)
+4. CLI arguments
+Project context is provided via `.entropic/ENTROPIC.md` — a markdown file
+describing the project that gets included in the system prompt.
+## Library Usage
+```python
+from pathlib import Path
+from entropic import AgentEngine, LibraryConfig, ModelOrchestrator, ServerManager
+config = LibraryConfig(
+    config_dir=Path("~/.myapp").expanduser(),
+    tiers={"normal": {"path": "model.gguf", "adapter": "qwen3"}},
+)
+orchestrator = ModelOrchestrator(config.to_app_config())
+await orchestrator.initialize()
+server_manager = ServerManager(config.to_app_config())
+await server_manager.initialize()
+engine = AgentEngine(orchestrator=orchestrator, server_manager=server_manager)
+async for message in engine.run("Hello"):
+    print(message.content)
+```
+See `examples/hello-world/` and `examples/pychess/` for complete integrations.
+## License
+Apache-2.0

entropic_engine-1.0.0/pyproject.toml ADDED Viewed

@@ -0,0 +1,135 @@
+[project]
+name = "entropic-engine"
+version = "1.0.0"
+description = "Local-first agentic inference engine with tier-based model routing"
+readme = "README.md"
+license = {text = "Apache-2.0"}
+requires-python = ">=3.11"
+authors = [
+    {name = "Tristan VanFossen"}
+]
+keywords = ["ai", "coding", "assistant", "llm", "local"]
+classifiers = [
+    "Development Status :: 3 - Alpha",
+    "Environment :: Console",
+    "Intended Audience :: Developers",
+    "License :: OSI Approved :: Apache Software License",
+    "Programming Language :: Python :: 3.11",
+    "Programming Language :: Python :: 3.12",
+    "Topic :: Software Development",
+]
+dependencies = [
+    "llama-cpp-python>=0.2.0",
+    "mcp>=1.0.0",
+    "pydantic>=2.0.0",
+    "pydantic-settings>=2.0.0",
+    "pyyaml>=6.0.0",
+]
+[project.optional-dependencies]
+tui = [
+    "textual>=0.47.0",
+    "rich>=13.0.0",
+    "click>=8.0.0",
+    "pylspclient>=0.0.7",
+]
+app = [
+    "entropic-engine[tui]",
+    "aiosqlite>=0.19.0",
+    "httpx>=0.25.0",
+]
+all = ["entropic-engine[app,voice]"]
+dev = [
+    "pytest>=7.0.0",
+    "pytest-asyncio>=0.21.0",
+    "pytest-bdd>=7.0.0",
+    "pytest-cov>=4.0.0",
+    "mypy>=1.0.0",
+    "black>=23.0.0",
+    "ruff>=0.1.0",
+    "pre-commit>=3.0.0",
+    "types-pyyaml>=6.0.0",
+]
+voice = [
+    # From PersonaPlex requirements
+    "numpy>=1.26,<2.2",
+    "safetensors>=0.4.0,<0.5",
+    "huggingface-hub>=0.24,<0.28",
+    "einops==0.7",
+    "sentencepiece==0.2",
+    "sounddevice==0.5",
+    "sphn>=0.1.4,<0.2",
+    "torch>=2.2.0",
+    "aiohttp>=3.10.5,<3.12",
+    "websockets>=12.0,<14.0",
+    # Optional for INT8 quantization
+    "accelerate>=0.30.0",
+    "torchao>=0.4.0",
+]
+[project.scripts]
+entropic = "entropic.cli:main"
+entropic-voice-server = "entropic.voice.server:main"
+[build-system]
+requires = ["setuptools>=61.0", "wheel"]
+build-backend = "setuptools.build_meta"
+[tool.setuptools.packages.find]
+where = ["src"]
+[tool.setuptools.package-data]
+entropic = ["data/*.yaml", "data/prompts/*.md", "data/grammars/*.gbnf", "data/tools/**/*.json", "ui/*.tcss"]
+[tool.black]
+line-length = 100
+target-version = ["py311", "py312"]
+[tool.ruff]
+line-length = 100
+extend-exclude = ["vendor"]
+[tool.ruff.lint]
+select = ["E", "F", "W", "I", "N", "UP", "B", "C4"]
+ignore = ["E501"]
+[tool.mypy]
+python_version = "3.12"
+strict = true
+ignore_missing_imports = true
+[[tool.mypy.overrides]]
+module = "tests.*"
+strict = false
+disallow_untyped_defs = false
+disallow_untyped_calls = false
+disallow_incomplete_defs = false
+[[tool.mypy.overrides]]
+module = ["entropic.cli", "entropic.cli_download"]
+disallow_untyped_decorators = false
+[[tool.mypy.overrides]]
+module = "entropic.mcp.servers.base"
+disallow_untyped_decorators = false
+[[tool.mypy.overrides]]
+module = "entropic.ui.tui"
+disallow_untyped_decorators = false
+[tool.pytest.ini_options]
+asyncio_mode = "auto"
+testpaths = ["tests"]
+python_files = ["test_*.py"]
+python_functions = ["test_*"]
+# Markers for categorizing tests
+markers = [
+    "unit: Fast tests without external dependencies",
+    "integration: Tests requiring external services (docker, etc)",
+    "model: Tests requiring actual model inference (GPU recommended)",
+    "slow: Tests that take a long time to run",
+]
+# Run all tests by default including model tests
+# Skip model tests with: pytest -m "not model"
+# Run only model tests: pytest -m model

entropic_engine-1.0.0/setup.cfg ADDED Viewed

@@ -0,0 +1,4 @@
+[egg_info]
+tag_build =
+tag_date = 0

entropic_engine-1.0.0/src/entropic/__init__.py ADDED Viewed

@@ -0,0 +1,93 @@
+"""
+Entropic - Local AI inference engine with multi-tier model orchestration.
+Public API for library consumers. Install extras for additional features:
+  pip install entropic-engine          # Core inference engine
+  pip install entropic-engine[tui]     # Terminal UI application
+  pip install entropic-engine[voice]   # Voice interface
+"""
+from entropic.config.loader import ConfigLoader, save_permission, validate_config
+from entropic.config.schema import (
+    CompactionConfig,
+    EntropyConfig,
+    GenerationConfig,
+    LibraryConfig,
+    ModelConfig,
+    ModelsConfig,
+    RoutingConfig,
+    TierConfig,
+)
+from entropic.core.base import (
+    GenerationResult,
+    Message,
+    ModelBackend,
+    ModelTier,
+    ToolCall,
+    ToolProvider,
+    ToolResult,
+)
+from entropic.core.engine import AgentEngine, AgentState, EngineCallbacks, LoopConfig
+from entropic.core.logging import setup_logging, setup_model_logger
+from entropic.core.tool_validation import ToolValidationError
+from entropic.inference.adapters import ChatAdapter, get_adapter, register_adapter
+from entropic.inference.orchestrator import BackendFactory, ModelOrchestrator, RoutingResult
+from entropic.mcp.manager import ServerManager
+from entropic.mcp.provider import InProcessProvider
+from entropic.mcp.servers.base import BaseMCPServer, ServerResponse, load_tool_definition
+from entropic.mcp.tools import BaseTool, ToolRegistry
+from entropic.prompts import TierIdentity, load_tier_identity
+__version__ = "1.0.0"
+__author__ = "Tristan VanFossen"
+__all__ = [
+    # Core types
+    "GenerationResult",
+    "Message",
+    "ModelBackend",
+    "ModelTier",
+    "ToolCall",
+    "ToolProvider",
+    "ToolResult",
+    # Engine
+    "AgentEngine",
+    "AgentState",
+    "EngineCallbacks",
+    "LoopConfig",
+    # Logging
+    "setup_logging",
+    "setup_model_logger",
+    # Config
+    "ConfigLoader",
+    "save_permission",
+    "validate_config",
+    "CompactionConfig",
+    "EntropyConfig",
+    "GenerationConfig",
+    "LibraryConfig",
+    "ModelConfig",
+    "ModelsConfig",
+    "RoutingConfig",
+    "TierConfig",
+    # Orchestrator
+    "BackendFactory",
+    "ModelOrchestrator",
+    "RoutingResult",
+    # Adapters
+    "ChatAdapter",
+    "get_adapter",
+    "register_adapter",
+    # MCP
+    "BaseMCPServer",
+    "BaseTool",
+    "InProcessProvider",
+    "ServerManager",
+    "ServerResponse",
+    "ToolRegistry",
+    "ToolValidationError",
+    "load_tool_definition",
+    # Prompts
+    "TierIdentity",
+    "load_tier_identity",
+]

entropic_engine-1.0.0/src/entropic/__main__.py ADDED Viewed

@@ -0,0 +1,8 @@
+"""
+Allow running as `python -m entropic`.
+"""
+from entropic.cli import main
+if __name__ == "__main__":
+    main()