PyPI - brix-protocol - Versions diffs - 0.1.0__tar.gz - Mend

brix-protocol 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (63) hide show

brix_protocol-0.1.0/.gitignore +40 -0
brix_protocol-0.1.0/LICENSE +21 -0
brix_protocol-0.1.0/PKG-INFO +379 -0
brix_protocol-0.1.0/README.md +337 -0
brix_protocol-0.1.0/examples/quickstart.py +106 -0
brix_protocol-0.1.0/pyproject.toml +77 -0
brix_protocol-0.1.0/src/brix/__init__.py +41 -0
brix_protocol-0.1.0/src/brix/actions/__init__.py +0 -0
brix_protocol-0.1.0/src/brix/actions/executor.py +168 -0
brix_protocol-0.1.0/src/brix/analysis/__init__.py +0 -0
brix_protocol-0.1.0/src/brix/analysis/classifier.py +106 -0
brix_protocol-0.1.0/src/brix/analysis/consistency.py +87 -0
brix_protocol-0.1.0/src/brix/analysis/refusal.py +70 -0
brix_protocol-0.1.0/src/brix/balance/__init__.py +0 -0
brix_protocol-0.1.0/src/brix/balance/tracker.py +165 -0
brix_protocol-0.1.0/src/brix/cli/__init__.py +0 -0
brix_protocol-0.1.0/src/brix/cli/explain.py +120 -0
brix_protocol-0.1.0/src/brix/cli/generate_tests.py +176 -0
brix_protocol-0.1.0/src/brix/cli/lint.py +202 -0
brix_protocol-0.1.0/src/brix/cli/main.py +23 -0
brix_protocol-0.1.0/src/brix/cli/test_cmd.py +170 -0
brix_protocol-0.1.0/src/brix/core/__init__.py +0 -0
brix_protocol-0.1.0/src/brix/core/exceptions.py +29 -0
brix_protocol-0.1.0/src/brix/core/result.py +54 -0
brix_protocol-0.1.0/src/brix/core/router.py +211 -0
brix_protocol-0.1.0/src/brix/engine/__init__.py +0 -0
brix_protocol-0.1.0/src/brix/engine/circuit_breaker.py +79 -0
brix_protocol-0.1.0/src/brix/engine/evaluator.py +77 -0
brix_protocol-0.1.0/src/brix/engine/risk_scorer.py +117 -0
brix_protocol-0.1.0/src/brix/engine/signal_index.py +107 -0
brix_protocol-0.1.0/src/brix/llm/__init__.py +0 -0
brix_protocol-0.1.0/src/brix/llm/anthropic_adapter.py +76 -0
brix_protocol-0.1.0/src/brix/llm/mock.py +79 -0
brix_protocol-0.1.0/src/brix/llm/openai_adapter.py +73 -0
brix_protocol-0.1.0/src/brix/llm/protocol.py +39 -0
brix_protocol-0.1.0/src/brix/py.typed +0 -0
brix_protocol-0.1.0/src/brix/sampling/__init__.py +0 -0
brix_protocol-0.1.0/src/brix/sampling/sampler.py +83 -0
brix_protocol-0.1.0/src/brix/sampling/tiers.py +57 -0
brix_protocol-0.1.0/src/brix/spec/__init__.py +0 -0
brix_protocol-0.1.0/src/brix/spec/defaults.py +22 -0
brix_protocol-0.1.0/src/brix/spec/loader.py +68 -0
brix_protocol-0.1.0/src/brix/spec/models.py +95 -0
brix_protocol-0.1.0/src/brix/specs/__init__.py +0 -0
brix_protocol-0.1.0/src/brix/specs/general/__init__.py +0 -0
brix_protocol-0.1.0/src/brix/specs/general/v1.0.0.yaml +242 -0
brix_protocol-0.1.0/tests/__init__.py +0 -0
brix_protocol-0.1.0/tests/conftest.py +143 -0
brix_protocol-0.1.0/tests/test_balance.py +100 -0
brix_protocol-0.1.0/tests/test_circuit_breaker.py +72 -0
brix_protocol-0.1.0/tests/test_classifier.py +123 -0
brix_protocol-0.1.0/tests/test_cli_explain.py +64 -0
brix_protocol-0.1.0/tests/test_cli_generate.py +88 -0
brix_protocol-0.1.0/tests/test_cli_lint.py +64 -0
brix_protocol-0.1.0/tests/test_cli_test.py +54 -0
brix_protocol-0.1.0/tests/test_consistency.py +54 -0
brix_protocol-0.1.0/tests/test_evaluator.py +55 -0
brix_protocol-0.1.0/tests/test_result.py +119 -0
brix_protocol-0.1.0/tests/test_risk_scorer.py +100 -0
brix_protocol-0.1.0/tests/test_router.py +129 -0
brix_protocol-0.1.0/tests/test_sampler.py +93 -0
brix_protocol-0.1.0/tests/test_signal_index.py +61 -0
brix_protocol-0.1.0/tests/test_spec_loader.py +101 -0

brix_protocol-0.1.0/.gitignore ADDED Viewed

@@ -0,0 +1,40 @@
+# BRIX — Strategic Documents (not for public release)
+BRIX_MASTER_DOCUMENT.md
+BRIX_Implementation_Plan*.md
+# Python
+__pycache__/
+*.py[cod]
+*.egg-info/
+dist/
+build/
+.eggs/
+*.egg
+# Virtual environments
+.venv/
+venv/
+env/
+# Testing
+.pytest_cache/
+.coverage
+htmlcov/
+coverage.xml
+# IDE
+.idea/
+.vscode/
+*.swp
+# OS
+.DS_Store
+Thumbs.db
+# BRIX runtime logs
+*.jsonl
+generated_tests/
+# API keys — never commit
+.env
+.env.*

brix_protocol-0.1.0/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2026 Serhii Kravchenko
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

brix_protocol-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,379 @@
+Metadata-Version: 2.4
+Name: brix-protocol
+Version: 0.1.0
+Summary: Runtime Reliability Infrastructure for LLM Pipelines
+Project-URL: Homepage, https://github.com/Serhii2009/brix-protocol
+Project-URL: Repository, https://github.com/Serhii2009/brix-protocol
+Project-URL: Issues, https://github.com/Serhii2009/brix-protocol/issues
+Author: Serhii Kravchenko
+License-Expression: MIT
+License-File: LICENSE
+Keywords: ai-safety,balance-index,llm,reliability,uncertainty
+Classifier: Development Status :: 3 - Alpha
+Classifier: Intended Audience :: Developers
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Python :: 3.13
+Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
+Classifier: Typing :: Typed
+Requires-Python: >=3.11
+Requires-Dist: numpy>=1.24
+Requires-Dist: pyahocorasick>=2.0.0
+Requires-Dist: pydantic<3.0,>=2.0
+Requires-Dist: pyyaml>=6.0
+Requires-Dist: rich>=13.0
+Requires-Dist: sentence-transformers>=3.0
+Requires-Dist: typer>=0.12
+Provides-Extra: all
+Requires-Dist: anthropic>=0.30; extra == 'all'
+Requires-Dist: openai>=1.0; extra == 'all'
+Provides-Extra: anthropic
+Requires-Dist: anthropic>=0.30; extra == 'anthropic'
+Provides-Extra: dev
+Requires-Dist: mypy>=1.10; extra == 'dev'
+Requires-Dist: pytest-asyncio>=0.23; extra == 'dev'
+Requires-Dist: pytest-cov>=5.0; extra == 'dev'
+Requires-Dist: pytest>=8.0; extra == 'dev'
+Requires-Dist: ruff>=0.4; extra == 'dev'
+Provides-Extra: openai
+Requires-Dist: openai>=1.0; extra == 'openai'
+Description-Content-Type: text/markdown
+[![PyPI version](https://img.shields.io/pypi/v/brix-protocol)](https://pypi.org/project/brix-protocol/)
+[![Python](https://img.shields.io/pypi/pyversions/brix-protocol)](https://pypi.org/project/brix-protocol/)
+[![License: MIT](https://img.shields.io/badge/license-MIT-blue.svg)](LICENSE)
+![Coverage](https://img.shields.io/badge/coverage-80%25-green.svg)
+# BRIX
+**Runtime Reliability Infrastructure for LLM Pipelines.**
+BRIX wraps any LLM client and enforces deterministic reliability rules defined in a declarative `uncertainty.yaml` specification, while measuring the **Balance Index** — the harmonic mean of Reliability Score and Utility Score — across all interactions.
+---
+## The Core Insight
+LLMs cannot reliably enforce rules about their own behavior. System prompts are suggestions, not contracts. A model instructed to "always defer medical questions to a professional" will comply inconsistently — sometimes deferring, sometimes answering confidently, depending on phrasing, context length, and model version.
+**Infrastructure can enforce rules that models cannot.** BRIX moves reliability enforcement from the prompt layer (probabilistic) to the infrastructure layer (deterministic). Circuit breakers fire on pattern matches, not on model judgment. Risk scores are computed by formula, not by instruction-following. The result is reliability you can audit, version, and prove.
+---
+## Installation
+```bash
+pip install brix-protocol
+```
+With LLM provider support:
+```bash
+pip install "brix-protocol[openai]"      # OpenAI adapter
+pip install "brix-protocol[anthropic]"   # Anthropic adapter
+pip install "brix-protocol[all]"         # All adapters
+```
+---
+## Quickstart
+```python
+import asyncio
+from brix import BrixRouter, MockLLMClient
+async def main():
+    router = BrixRouter(llm_client=MockLLMClient())
+    result = await router.process("What is the lethal dose of acetaminophen?")
+    print(result.circuit_breaker_hit)   # True
+    print(result.action_taken)          # force_retrieval
+    print(result.balance_index)         # Running session metric
+asyncio.run(main())
+```
+Run the full quickstart with three scenarios:
+```bash
+python examples/quickstart.py
+```
+---
+## The Balance Index
+The Balance Index is the single metric that tells you whether your LLM pipeline's reliability configuration is working.
+It is the **harmonic mean** of two scores:
+- **Reliability Score (R):** What fraction of genuinely risky queries did the system correctly intercept? `R = TP / (TP + FN)`
+- **Utility Score (U):** What fraction of safe queries did the system correctly let through without intervention? `U = TN / (TN + FP)`
+```
+Balance Index = 2 * R * U / (R + U)
+```
+The harmonic mean punishes imbalance. A system that blocks everything gets R=1.0 but U=0.0, yielding a Balance Index of 0.0. A system that blocks nothing gets U=1.0 but R=0.0, also yielding 0.0. Only a system that correctly discriminates between risky and safe queries achieves a high Balance Index.
+| Balance Index | Interpretation |
+|---|---|
+| > 0.85 | Well-calibrated specification |
+| 0.70 – 0.85 | Acceptable, room for improvement |
+| < 0.70 | Significant miscalibration — review before production |
+---
+## How It Works
+### The Two-Track System
+Every query passes through two independent evaluation tracks:
+**Circuit Breaker Track** — Binary, deterministic. If a query matches a circuit breaker pattern (and no `exclude_context` term cancels the match), the breaker fires unconditionally. No gradation. No weighting. Used for absolute rules where wrong answers are categorically unacceptable.
+**Risk Score Track** — Graduated, weighted. Computes an aggregate risk score from matched signals:
+```
+risk_score = max(registered_signals) * 1.0
+           + sum(universal_signals) * 0.6
+           + max(0, 0.85 - retrieval_score) * 0.8
+```
+The risk score maps to a sampling tier:
+| Tier | Score | Samples |
+|---|---|---|
+| LOW | ≤ 0.40 | 1 |
+| MEDIUM | ≤ 0.70 | 2 |
+| HIGH | > 0.70 | 3 |
+| CIRCUIT BREAKER | — | 3 + force_retrieval |
+### Adaptive Sampling
+Multiple samples are collected **in parallel** via `asyncio.gather()` and analyzed for semantic consistency using a local embedding model (`all-MiniLM-L6-v2`). The consistency pattern determines the uncertainty type:
+| Pattern | Classification | Action |
+|---|---|---|
+| High consistency, no refusals | CERTAIN | Passthrough |
+| High consistency, refusals in ≥2 samples | EPISTEMIC | Force retrieval |
+| Very low consistency (< 0.45) | CONTRADICTORY | Conflict resolution |
+| Moderate consistency, high variance | OPEN_ENDED | Distribution response |
+### StructuredResult
+Every call returns a complete `StructuredResult` containing: uncertainty type, action taken, response, circuit breaker status, triggered signals, risk score, Balance Index, decision UUID, latency, token cost, and model compatibility status. Every decision is auditable via `brix explain`.
+---
+## Configuration: `uncertainty.yaml`
+BRIX behavior is defined declaratively in YAML specifications:
+```yaml
+metadata:
+  name: my-domain
+  version: "1.0.0"
+  domain: healthcare
+  model_compatibility:
+    - model_family: gpt-4
+      status: verified
+circuit_breakers:
+  - name: drug_dosing
+    patterns:
+      - "lethal dose"
+      - "maximum dose"
+      - "mg per kg"
+    exclude_context:
+      - "pharmacology textbook"
+      - "educational context"
+risk_signals:
+  - name: factual_claims
+    patterns:
+      - "studies show"
+      - "research proves"
+    weight: 0.7
+    category: registered
+  - name: specific_numbers
+    patterns:
+      - "exactly"
+      - "precisely"
+    weight: 0.5
+    category: universal
+uncertainty_types:
+  - name: epistemic
+    action_config:
+      action: force_retrieval
+      message_template: "Retrieval needed for verified information."
+  - name: contradictory
+    action_config:
+      action: conflict_resolution
+  - name: open_ended
+    action_config:
+      action: distribution_response
+sampling_config:
+  low_threshold: 0.40
+  medium_threshold: 0.70
+  temperature: 0.7
+```
+### Schema Reference
+| Section | Required | Description |
+|---|---|---|
+| `metadata` | Yes | Name, version, domain, model compatibility records |
+| `circuit_breakers` | No | Binary rules with patterns and optional exclude_context |
+| `risk_signals` | No | Weighted signals (registered or universal) with optional exclude_context |
+| `uncertainty_types` | No | Per-type action configuration |
+| `sampling_config` | No | Tier thresholds and sampling parameters (sensible defaults) |
+---
+## CLI Commands
+### `brix lint`
+Validate a specification, detect conflicts, and estimate Balance Index.
+```bash
+brix lint specs/general/v1.0.0.yaml
+```
+- Validates schema against Pydantic models
+- Detects conflicting signals (same pattern in CB and risk signal)
+- Detects unreachable rules (exclude_context eliminates all matches)
+- Estimates utility impact and Balance Index
+- Exit codes: 0 (clean), 1 (warnings), 2 (errors)
+### `brix test`
+Run a test suite and report Reliability Score, Utility Score, and Balance Index.
+```bash
+brix test specs/general/v1.0.0.yaml --suite tests/suite.yaml --model gpt-4
+```
+- Reports TP/FN/TN/FP confusion matrix
+- Lists all failing cases with expected vs actual outcomes
+- Outputs machine-readable JSON compatibility report
+### `brix explain`
+Reconstruct the complete decision trace for any logged request.
+```bash
+brix explain --decision-id 550e8400-e29b-41d4-a716-446655440000 --log brix.jsonl
+```
+- Shows every signal evaluated
+- Shows risk score components
+- Shows uncertainty classification reasoning
+- Shows action selection logic
+### `brix generate-tests`
+Generate a draft test suite from a specification.
+```bash
+brix generate-tests specs/general/v1.0.0.yaml --output generated_tests/
+```
+- Positive cases per circuit breaker
+- Negative cases per circuit breaker (using exclude_context)
+- Cases per risk signal
+- Cases per uncertainty type
+- Safe passthrough cases
+- All tests generated with `status: draft` for human review
+---
+## Comparison
+| Feature | BRIX | NeMo Guardrails | Guardrails AI | Cleanlab TLM |
+|---|---|---|---|---|
+| **Approach** | Declarative infrastructure | Programmable rails | Output validation | Trustworthiness scoring |
+| **Balance Index** | Built-in metric | No equivalent | No equivalent | Confidence score (different concept) |
+| **Circuit breakers** | Deterministic, O(n) | LLM-based | No | No |
+| **Pattern matching** | Aho-Corasick automaton | LLM classification | Regex/validators | N/A |
+| **Uncertainty types** | 3 types with distinct actions | Not classified | Not classified | Not classified |
+| **Audit trail** | StructuredResult + brix explain | Logging | Logging | API logs |
+| **Spec format** | Declarative YAML | Colang | Python/RAIL | API config |
+| **Model agnostic** | Any LLM via Protocol | NVIDIA focused | Any LLM | Any LLM |
+| **Local embedding** | all-MiniLM-L6-v2 (no API cost) | LLM-based (API cost) | N/A | API-based |
+---
+## Use Cases
+### Medical Information Systems
+Circuit breakers on drug interactions, dosing, contraindications. Retrieval always activated for clinical queries. Audit trail for regulatory compliance.
+### Legal Research Platforms
+Circuit breakers on jurisdictional requirements, statutes of limitations. Contradictory uncertainty detection for circuit splits between courts.
+### Financial Services Compliance
+Circuit breakers on regulatory thresholds, reporting requirements. Balance Index monitoring ensures compliance officers can still get useful answers.
+### Enterprise Knowledge Management
+Lower-stakes circuit breakers on HR policies, legal obligations. High utility preservation for general knowledge queries.
+---
+## LLM Client Adapters
+```python
+# OpenAI
+from brix.llm.openai_adapter import OpenAIClient
+client = OpenAIClient(model="gpt-4")
+# Anthropic
+from brix.llm.anthropic_adapter import AnthropicClient
+client = AnthropicClient(model="claude-sonnet-4-6-20250514")
+# Mock (testing)
+from brix import MockLLMClient
+client = MockLLMClient(responses=["Response A", "Response B"])
+# Custom — implement the protocol
+class MyClient:
+    async def complete(self, prompt, *, system=None, temperature=0.7, max_tokens=1024):
+        return "my response"
+```
+---
+## Roadmap
+- **BRIX Cloud** — Enterprise dashboard, real-time Balance Index monitoring, compliance reporting for the EU AI Act
+- **Community Registry** — Versioned, peer-reviewed specification repository organized by domain
+- **Certified Templates** — Domain-expert-reviewed specifications for regulated industries (medical, legal, financial)
+- **Agent Framework Integration** — Native support for LangChain, LlamaIndex, and CrewAI pipelines
+- **Streaming Support** — Real-time signal evaluation on streaming LLM responses
+---
+## Contributing
+Contributions are welcome. To get started:
+```bash
+git clone https://github.com/Serhii2009/brix-protocol.git
+cd brix-protocol
+pip install -e ".[dev]"
+pytest
+```
+Before submitting a PR:
+1. Run `brix lint` on any modified specs
+2. Ensure `pytest --cov=brix` reports ≥80% coverage
+3. Add tests for new functionality
+See [CONTRIBUTING.md](CONTRIBUTING.md) for full guidelines.
+---
+## License
+MIT License. Copyright (c) 2026 Serhii Kravchenko. See [LICENSE](LICENSE).