crca 1.4.0__py3-none-any.whl → 1.5.0__py3-none-any.whl

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (306)
  1. CRCA.py +172 -7
  2. MODEL_CARD.md +53 -0
  3. PKG-INFO +8 -2
  4. RELEASE_NOTES.md +17 -0
  5. STABILITY.md +19 -0
  6. architecture/hybrid/consistency_engine.py +362 -0
  7. architecture/hybrid/conversation_manager.py +421 -0
  8. architecture/hybrid/explanation_generator.py +452 -0
  9. architecture/hybrid/few_shot_learner.py +533 -0
  10. architecture/hybrid/graph_compressor.py +286 -0
  11. architecture/hybrid/hybrid_agent.py +4398 -0
  12. architecture/hybrid/language_compiler.py +623 -0
  13. architecture/hybrid/main,py +0 -0
  14. architecture/hybrid/reasoning_tracker.py +322 -0
  15. architecture/hybrid/self_verifier.py +524 -0
  16. architecture/hybrid/task_decomposer.py +567 -0
  17. architecture/hybrid/text_corrector.py +341 -0
  18. benchmark_results/crca_core_benchmarks.json +178 -0
  19. branches/crca_sd/crca_sd_realtime.py +6 -2
  20. branches/general_agent/__init__.py +102 -0
  21. branches/general_agent/general_agent.py +1400 -0
  22. branches/general_agent/personality.py +169 -0
  23. branches/general_agent/utils/__init__.py +19 -0
  24. branches/general_agent/utils/prompt_builder.py +170 -0
  25. {crca-1.4.0.dist-info → crca-1.5.0.dist-info}/METADATA +8 -2
  26. {crca-1.4.0.dist-info → crca-1.5.0.dist-info}/RECORD +303 -20
  27. crca_core/__init__.py +35 -0
  28. crca_core/benchmarks/__init__.py +14 -0
  29. crca_core/benchmarks/synthetic_scm.py +103 -0
  30. crca_core/core/__init__.py +23 -0
  31. crca_core/core/api.py +120 -0
  32. crca_core/core/estimate.py +208 -0
  33. crca_core/core/godclass.py +72 -0
  34. crca_core/core/intervention_design.py +174 -0
  35. crca_core/core/lifecycle.py +48 -0
  36. crca_core/discovery/__init__.py +9 -0
  37. crca_core/discovery/tabular.py +193 -0
  38. crca_core/identify/__init__.py +171 -0
  39. crca_core/identify/backdoor.py +39 -0
  40. crca_core/identify/frontdoor.py +48 -0
  41. crca_core/identify/graph.py +106 -0
  42. crca_core/identify/id_algorithm.py +43 -0
  43. crca_core/identify/iv.py +48 -0
  44. crca_core/models/__init__.py +67 -0
  45. crca_core/models/provenance.py +56 -0
  46. crca_core/models/refusal.py +39 -0
  47. crca_core/models/result.py +83 -0
  48. crca_core/models/spec.py +151 -0
  49. crca_core/models/validation.py +68 -0
  50. crca_core/scm/__init__.py +9 -0
  51. crca_core/scm/linear_gaussian.py +198 -0
  52. crca_core/timeseries/__init__.py +6 -0
  53. crca_core/timeseries/pcmci.py +181 -0
  54. crca_llm/__init__.py +12 -0
  55. crca_llm/client.py +85 -0
  56. crca_llm/coauthor.py +118 -0
  57. crca_llm/orchestrator.py +289 -0
  58. crca_llm/types.py +21 -0
  59. crca_reasoning/__init__.py +16 -0
  60. crca_reasoning/critique.py +54 -0
  61. crca_reasoning/godclass.py +206 -0
  62. crca_reasoning/memory.py +24 -0
  63. crca_reasoning/rationale.py +10 -0
  64. crca_reasoning/react_controller.py +81 -0
  65. crca_reasoning/tool_router.py +97 -0
  66. crca_reasoning/types.py +40 -0
  67. crca_sd/__init__.py +15 -0
  68. crca_sd/crca_sd_core.py +2 -0
  69. crca_sd/crca_sd_governance.py +2 -0
  70. crca_sd/crca_sd_mpc.py +2 -0
  71. crca_sd/crca_sd_realtime.py +2 -0
  72. crca_sd/crca_sd_tui.py +2 -0
  73. cuda-keyring_1.1-1_all.deb +0 -0
  74. cuda-keyring_1.1-1_all.deb.1 +0 -0
  75. docs/IMAGE_ANNOTATION_USAGE.md +539 -0
  76. docs/INSTALL_DEEPSPEED.md +125 -0
  77. docs/api/branches/crca-cg.md +19 -0
  78. docs/api/branches/crca-q.md +27 -0
  79. docs/api/branches/crca-sd.md +37 -0
  80. docs/api/branches/general-agent.md +24 -0
  81. docs/api/branches/overview.md +19 -0
  82. docs/api/crca/agent-methods.md +62 -0
  83. docs/api/crca/operations.md +79 -0
  84. docs/api/crca/overview.md +32 -0
  85. docs/api/image-annotation/engine.md +52 -0
  86. docs/api/image-annotation/overview.md +17 -0
  87. docs/api/schemas/annotation.md +34 -0
  88. docs/api/schemas/core-schemas.md +82 -0
  89. docs/api/schemas/overview.md +32 -0
  90. docs/api/schemas/policy.md +30 -0
  91. docs/api/utils/conversation.md +22 -0
  92. docs/api/utils/graph-reasoner.md +32 -0
  93. docs/api/utils/overview.md +21 -0
  94. docs/api/utils/router.md +19 -0
  95. docs/api/utils/utilities.md +97 -0
  96. docs/architecture/causal-graphs.md +41 -0
  97. docs/architecture/data-flow.md +29 -0
  98. docs/architecture/design-principles.md +33 -0
  99. docs/architecture/hybrid-agent/components.md +38 -0
  100. docs/architecture/hybrid-agent/consistency.md +26 -0
  101. docs/architecture/hybrid-agent/overview.md +44 -0
  102. docs/architecture/hybrid-agent/reasoning.md +22 -0
  103. docs/architecture/llm-integration.md +26 -0
  104. docs/architecture/modular-structure.md +37 -0
  105. docs/architecture/overview.md +69 -0
  106. docs/architecture/policy-engine-arch.md +29 -0
  107. docs/branches/crca-cg/corposwarm.md +39 -0
  108. docs/branches/crca-cg/esg-scoring.md +30 -0
  109. docs/branches/crca-cg/multi-agent.md +35 -0
  110. docs/branches/crca-cg/overview.md +40 -0
  111. docs/branches/crca-q/alternative-data.md +55 -0
  112. docs/branches/crca-q/architecture.md +71 -0
  113. docs/branches/crca-q/backtesting.md +45 -0
  114. docs/branches/crca-q/causal-engine.md +33 -0
  115. docs/branches/crca-q/execution.md +39 -0
  116. docs/branches/crca-q/market-data.md +60 -0
  117. docs/branches/crca-q/overview.md +58 -0
  118. docs/branches/crca-q/philosophy.md +60 -0
  119. docs/branches/crca-q/portfolio-optimization.md +66 -0
  120. docs/branches/crca-q/risk-management.md +102 -0
  121. docs/branches/crca-q/setup.md +65 -0
  122. docs/branches/crca-q/signal-generation.md +61 -0
  123. docs/branches/crca-q/signal-validation.md +43 -0
  124. docs/branches/crca-sd/core.md +84 -0
  125. docs/branches/crca-sd/governance.md +53 -0
  126. docs/branches/crca-sd/mpc-solver.md +65 -0
  127. docs/branches/crca-sd/overview.md +59 -0
  128. docs/branches/crca-sd/realtime.md +28 -0
  129. docs/branches/crca-sd/tui.md +20 -0
  130. docs/branches/general-agent/overview.md +37 -0
  131. docs/branches/general-agent/personality.md +36 -0
  132. docs/branches/general-agent/prompt-builder.md +30 -0
  133. docs/changelog/index.md +79 -0
  134. docs/contributing/code-style.md +69 -0
  135. docs/contributing/documentation.md +43 -0
  136. docs/contributing/overview.md +29 -0
  137. docs/contributing/testing.md +29 -0
  138. docs/core/crcagent/async-operations.md +65 -0
  139. docs/core/crcagent/automatic-extraction.md +107 -0
  140. docs/core/crcagent/batch-prediction.md +80 -0
  141. docs/core/crcagent/bayesian-inference.md +60 -0
  142. docs/core/crcagent/causal-graph.md +92 -0
  143. docs/core/crcagent/counterfactuals.md +96 -0
  144. docs/core/crcagent/deterministic-simulation.md +78 -0
  145. docs/core/crcagent/dual-mode-operation.md +82 -0
  146. docs/core/crcagent/initialization.md +88 -0
  147. docs/core/crcagent/optimization.md +65 -0
  148. docs/core/crcagent/overview.md +63 -0
  149. docs/core/crcagent/time-series.md +57 -0
  150. docs/core/schemas/annotation.md +30 -0
  151. docs/core/schemas/core-schemas.md +82 -0
  152. docs/core/schemas/overview.md +30 -0
  153. docs/core/schemas/policy.md +41 -0
  154. docs/core/templates/base-agent.md +31 -0
  155. docs/core/templates/feature-mixins.md +31 -0
  156. docs/core/templates/overview.md +29 -0
  157. docs/core/templates/templates-guide.md +75 -0
  158. docs/core/tools/mcp-client.md +34 -0
  159. docs/core/tools/overview.md +24 -0
  160. docs/core/utils/conversation.md +27 -0
  161. docs/core/utils/graph-reasoner.md +29 -0
  162. docs/core/utils/overview.md +27 -0
  163. docs/core/utils/router.md +27 -0
  164. docs/core/utils/utilities.md +97 -0
  165. docs/css/custom.css +84 -0
  166. docs/examples/basic-usage.md +57 -0
  167. docs/examples/general-agent/general-agent-examples.md +50 -0
  168. docs/examples/hybrid-agent/hybrid-agent-examples.md +56 -0
  169. docs/examples/image-annotation/image-annotation-examples.md +54 -0
  170. docs/examples/integration/integration-examples.md +58 -0
  171. docs/examples/overview.md +37 -0
  172. docs/examples/trading/trading-examples.md +46 -0
  173. docs/features/causal-reasoning/advanced-topics.md +101 -0
  174. docs/features/causal-reasoning/counterfactuals.md +43 -0
  175. docs/features/causal-reasoning/do-calculus.md +50 -0
  176. docs/features/causal-reasoning/overview.md +47 -0
  177. docs/features/causal-reasoning/structural-models.md +52 -0
  178. docs/features/hybrid-agent/advanced-components.md +55 -0
  179. docs/features/hybrid-agent/core-components.md +64 -0
  180. docs/features/hybrid-agent/overview.md +34 -0
  181. docs/features/image-annotation/engine.md +82 -0
  182. docs/features/image-annotation/features.md +113 -0
  183. docs/features/image-annotation/integration.md +75 -0
  184. docs/features/image-annotation/overview.md +53 -0
  185. docs/features/image-annotation/quickstart.md +73 -0
  186. docs/features/policy-engine/doctrine-ledger.md +105 -0
  187. docs/features/policy-engine/monitoring.md +44 -0
  188. docs/features/policy-engine/mpc-control.md +89 -0
  189. docs/features/policy-engine/overview.md +46 -0
  190. docs/getting-started/configuration.md +225 -0
  191. docs/getting-started/first-agent.md +164 -0
  192. docs/getting-started/installation.md +144 -0
  193. docs/getting-started/quickstart.md +137 -0
  194. docs/index.md +118 -0
  195. docs/js/mathjax.js +13 -0
  196. docs/lrm/discovery_proof_notes.md +25 -0
  197. docs/lrm/finetune_full.md +83 -0
  198. docs/lrm/math_appendix.md +120 -0
  199. docs/lrm/overview.md +32 -0
  200. docs/mkdocs.yml +238 -0
  201. docs/stylesheets/extra.css +21 -0
  202. docs_generated/crca_core/CounterfactualResult.md +12 -0
  203. docs_generated/crca_core/DiscoveryHypothesisResult.md +13 -0
  204. docs_generated/crca_core/DraftSpec.md +13 -0
  205. docs_generated/crca_core/EstimateResult.md +13 -0
  206. docs_generated/crca_core/IdentificationResult.md +17 -0
  207. docs_generated/crca_core/InterventionDesignResult.md +12 -0
  208. docs_generated/crca_core/LockedSpec.md +15 -0
  209. docs_generated/crca_core/RefusalResult.md +12 -0
  210. docs_generated/crca_core/ValidationReport.md +9 -0
  211. docs_generated/crca_core/index.md +13 -0
  212. examples/general_agent_example.py +277 -0
  213. examples/general_agent_quickstart.py +202 -0
  214. examples/general_agent_simple.py +92 -0
  215. examples/hybrid_agent_auto_extraction.py +84 -0
  216. examples/hybrid_agent_dictionary_demo.py +104 -0
  217. examples/hybrid_agent_enhanced.py +179 -0
  218. examples/hybrid_agent_general_knowledge.py +107 -0
  219. examples/image_annotation_quickstart.py +328 -0
  220. examples/test_hybrid_fixes.py +77 -0
  221. image_annotation/__init__.py +27 -0
  222. image_annotation/annotation_engine.py +2593 -0
  223. install_cuda_wsl2.sh +59 -0
  224. install_deepspeed.sh +56 -0
  225. install_deepspeed_simple.sh +87 -0
  226. mkdocs.yml +252 -0
  227. ollama/Modelfile +8 -0
  228. prompts/__init__.py +2 -1
  229. prompts/default_crca.py +9 -1
  230. prompts/general_agent.py +227 -0
  231. prompts/image_annotation.py +56 -0
  232. pyproject.toml +17 -2
  233. requirements-docs.txt +10 -0
  234. requirements.txt +21 -2
  235. schemas/__init__.py +26 -1
  236. schemas/annotation.py +222 -0
  237. schemas/conversation.py +193 -0
  238. schemas/hybrid.py +211 -0
  239. schemas/reasoning.py +276 -0
  240. schemas_export/crca_core/CounterfactualResult.schema.json +108 -0
  241. schemas_export/crca_core/DiscoveryHypothesisResult.schema.json +113 -0
  242. schemas_export/crca_core/DraftSpec.schema.json +635 -0
  243. schemas_export/crca_core/EstimateResult.schema.json +113 -0
  244. schemas_export/crca_core/IdentificationResult.schema.json +145 -0
  245. schemas_export/crca_core/InterventionDesignResult.schema.json +111 -0
  246. schemas_export/crca_core/LockedSpec.schema.json +646 -0
  247. schemas_export/crca_core/RefusalResult.schema.json +90 -0
  248. schemas_export/crca_core/ValidationReport.schema.json +62 -0
  249. scripts/build_lrm_dataset.py +80 -0
  250. scripts/export_crca_core_schemas.py +54 -0
  251. scripts/export_hf_lrm.py +37 -0
  252. scripts/export_ollama_gguf.py +45 -0
  253. scripts/generate_changelog.py +157 -0
  254. scripts/generate_crca_core_docs_from_schemas.py +86 -0
  255. scripts/run_crca_core_benchmarks.py +163 -0
  256. scripts/run_full_finetune.py +198 -0
  257. scripts/run_lrm_eval.py +31 -0
  258. templates/graph_management.py +29 -0
  259. tests/conftest.py +9 -0
  260. tests/test_core.py +2 -3
  261. tests/test_crca_core_discovery_tabular.py +15 -0
  262. tests/test_crca_core_estimate_dowhy.py +36 -0
  263. tests/test_crca_core_identify.py +18 -0
  264. tests/test_crca_core_intervention_design.py +36 -0
  265. tests/test_crca_core_linear_gaussian_scm.py +69 -0
  266. tests/test_crca_core_spec.py +25 -0
  267. tests/test_crca_core_timeseries_pcmci.py +15 -0
  268. tests/test_crca_llm_coauthor.py +12 -0
  269. tests/test_crca_llm_orchestrator.py +80 -0
  270. tests/test_hybrid_agent_llm_enhanced.py +556 -0
  271. tests/test_image_annotation_demo.py +376 -0
  272. tests/test_image_annotation_operational.py +408 -0
  273. tests/test_image_annotation_unit.py +551 -0
  274. tests/test_training_moe.py +13 -0
  275. training/__init__.py +42 -0
  276. training/datasets.py +140 -0
  277. training/deepspeed_zero2_0_5b.json +22 -0
  278. training/deepspeed_zero2_1_5b.json +22 -0
  279. training/deepspeed_zero3_0_5b.json +28 -0
  280. training/deepspeed_zero3_14b.json +28 -0
  281. training/deepspeed_zero3_h100_3gpu.json +20 -0
  282. training/deepspeed_zero3_offload.json +28 -0
  283. training/eval.py +92 -0
  284. training/finetune.py +516 -0
  285. training/public_datasets.py +89 -0
  286. training_data/react_train.jsonl +7473 -0
  287. utils/agent_discovery.py +311 -0
  288. utils/batch_processor.py +317 -0
  289. utils/conversation.py +78 -0
  290. utils/edit_distance.py +118 -0
  291. utils/formatter.py +33 -0
  292. utils/graph_reasoner.py +530 -0
  293. utils/rate_limiter.py +283 -0
  294. utils/router.py +2 -2
  295. utils/tool_discovery.py +307 -0
  296. webui/__init__.py +10 -0
  297. webui/app.py +229 -0
  298. webui/config.py +104 -0
  299. webui/static/css/style.css +332 -0
  300. webui/static/js/main.js +284 -0
  301. webui/templates/index.html +42 -0
  302. tests/test_crca_excel.py +0 -166
  303. tests/test_data_broker.py +0 -424
  304. tests/test_palantir.py +0 -349
  305. {crca-1.4.0.dist-info → crca-1.5.0.dist-info}/WHEEL +0 -0
  306. {crca-1.4.0.dist-info → crca-1.5.0.dist-info}/licenses/LICENSE +0 -0
tests/test_image_annotation_unit.py ADDED
@@ -0,0 +1,551 @@
+ """
+ Unit tests for image annotation engine - testing every feature individually.
+ """
+
+ import os
+ import sys
+ import numpy as np
+ import pytest
+ from pathlib import Path
+ from PIL import Image
+ import tempfile
+ import json
+ import cv2
+
+ # Add parent directory to path
+ sys.path.insert(0, os.path.dirname(os.path.dirname(__file__)))
+
+ # Image annotation unit tests can be slow and may require LLM access depending on configuration.
+ if os.environ.get("CRCA_RUN_IMAGE_ANNOTATION_TESTS") != "1":
+     pytest.skip("Set CRCA_RUN_IMAGE_ANNOTATION_TESTS=1 to run image annotation tests", allow_module_level=True)
+
+ try:
+     from image_annotation.annotation_engine import ImageAnnotationEngine, AnnotationConfig
+     from image_annotation import AnnotationResult, AnnotationGraph, PrimitiveEntity, SemanticLabel
+     IMAGE_ANNOTATION_AVAILABLE = True
+ except ImportError:
+     IMAGE_ANNOTATION_AVAILABLE = False
+     pytest.skip("Image annotation not available", allow_module_level=True)
+
+
+ class TestImageAnnotationConfig:
+     """Test configuration system."""
+
+     def test_default_config(self):
+         """Test default configuration creation."""
+         config = AnnotationConfig()
+         assert config.gpt_model == "gpt-4o-mini"
+         assert config.cache_enabled is True
+         assert config.auto_retry is True
+         assert config.output_format == "overlay"
+
+     def test_config_from_env(self):
+         """Test loading configuration from environment variables."""
+         import os
+         os.environ["ANNOTATION_GPT_MODEL"] = "gpt-4"
+         os.environ["ANNOTATION_CACHE_ENABLED"] = "false"
+
+         config = AnnotationConfig.from_env()
+         assert config.gpt_model == "gpt-4"
+         assert config.cache_enabled is False
+
+         # Cleanup
+         del os.environ["ANNOTATION_GPT_MODEL"]
+         del os.environ["ANNOTATION_CACHE_ENABLED"]
+
+     def test_config_override(self):
+         """Test configuration parameter override."""
+         config = AnnotationConfig(gpt_model="gpt-4o", cache_enabled=False)
+         assert config.gpt_model == "gpt-4o"
+         assert config.cache_enabled is False
+
+
+ class TestInputHandling:
+     """Test smart input handling features."""
+
+     def test_detect_input_type_file_path(self):
+         """Test file path detection."""
+         engine = ImageAnnotationEngine()
+         assert engine._detect_input_type("image.png") == "file_path"
+         assert engine._detect_input_type(Path("image.png")) == "file_path"
+
+     def test_detect_input_type_url(self):
+         """Test URL detection."""
+         engine = ImageAnnotationEngine()
+         assert engine._detect_input_type("https://example.com/image.png") == "url"
+         assert engine._detect_input_type("http://example.com/image.png") == "url"
+
+     def test_detect_input_type_numpy(self):
+         """Test numpy array detection."""
+         engine = ImageAnnotationEngine()
+         arr = np.zeros((100, 100, 3), dtype=np.uint8)
+         assert engine._detect_input_type(arr) == "numpy_array"
+
+     def test_detect_input_type_pil(self):
+         """Test PIL Image detection."""
+         engine = ImageAnnotationEngine()
+         img = Image.new("RGB", (100, 100))
+         assert engine._detect_input_type(img) == "pil_image"
+
+     def test_detect_input_type_batch(self):
+         """Test batch detection."""
+         engine = ImageAnnotationEngine()
+         assert engine._detect_input_type(["img1.png", "img2.png"]) == "batch"
+
+     def test_auto_load_numpy(self):
+         """Test loading numpy array."""
+         engine = ImageAnnotationEngine()
+         arr = np.zeros((100, 100, 3), dtype=np.uint8)
+         loaded = engine._auto_load_input(arr)
+         assert isinstance(loaded, np.ndarray)
+         assert loaded.shape == (100, 100, 3)
+
+     def test_auto_load_pil(self):
+         """Test loading PIL Image."""
+         engine = ImageAnnotationEngine()
+         img = Image.new("RGB", (100, 100), color=(255, 0, 0))
+         loaded = engine._auto_load_input(img)
+         assert isinstance(loaded, np.ndarray)
+         assert len(loaded.shape) == 3  # BGR format
+
+     def test_auto_load_file(self):
+         """Test loading from file path."""
+         engine = ImageAnnotationEngine()
+         # Create temporary image file
+         with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as f:
+             img = Image.new("RGB", (100, 100), color=(0, 255, 0))
+             img.save(f.name, "PNG")
+             temp_path = f.name
+
+         try:
+             loaded = engine._auto_load_input(temp_path)
+             assert isinstance(loaded, np.ndarray)
+             assert loaded.shape[0] > 0 and loaded.shape[1] > 0
+         finally:
+             os.unlink(temp_path)
+
+
+ class TestImageTypeDetection:
+     """Test image type detection."""
+
+     def test_detect_circuit(self):
+         """Test circuit diagram detection."""
+         engine = ImageAnnotationEngine()
+         # Create synthetic circuit-like image (high line density, circles)
+         img = np.zeros((500, 500, 3), dtype=np.uint8)
+         # Add lines
+         for i in range(0, 500, 20):
+             cv2.line(img, (i, 0), (i, 500), (255, 255, 255), 2)
+         # Add circles
+         for i in range(50, 450, 50):
+             cv2.circle(img, (i, i), 20, (255, 255, 255), 2)
+
+         img_type = engine._detect_image_type(img)
+         # Should detect as circuit or general
+         assert img_type in ["circuit", "general", "technical"]
+
+     def test_detect_architectural(self):
+         """Test architectural drawing detection."""
+         engine = ImageAnnotationEngine()
+         # Create synthetic architectural drawing (many parallel lines)
+         img = np.zeros((800, 800, 3), dtype=np.uint8)
+         # Add many parallel lines
+         for i in range(0, 800, 10):
+             cv2.line(img, (0, i), (800, i), (255, 255, 255), 1)
+             cv2.line(img, (i, 0), (i, 800), (255, 255, 255), 1)
+
+         img_type = engine._detect_image_type(img)
+         # Should detect as architectural or general
+         assert img_type in ["architectural", "general", "technical"]
+
+     def test_get_type_specific_params(self):
+         """Test getting type-specific parameters."""
+         engine = ImageAnnotationEngine()
+         params = engine._get_type_specific_params("circuit")
+         assert "hough_line_threshold" in params
+         assert "hough_circle_threshold" in params
+         assert "preprocessing_strength" in params
+
+
+ class TestParameterTuning:
+     """Test automatic parameter tuning."""
+
+     def test_auto_tune_params(self):
+         """Test automatic parameter tuning."""
+         engine = ImageAnnotationEngine()
+         img = np.zeros((500, 500), dtype=np.uint8)
+         # Add some edges
+         cv2.rectangle(img, (100, 100), (400, 400), 255, 2)
+
+         params = engine._auto_tune_params(img)
+         assert isinstance(params, dict)
+         assert "hough_line_threshold" in params
+         assert "canny_low" in params
+         assert "canny_high" in params
+
+     def test_heuristic_tune(self):
+         """Test heuristic-based tuning."""
+         engine = ImageAnnotationEngine()
+         img = np.zeros((200, 200), dtype=np.uint8)
+         cv2.circle(img, (100, 100), 50, 255, 2)
+
+         params = engine._heuristic_tune(img, "circuit")
+         assert isinstance(params, dict)
+         assert params["hough_line_threshold"] > 0
+
+     def test_adaptive_refine(self):
+         """Test adaptive parameter refinement."""
+         engine = ImageAnnotationEngine()
+         img = np.zeros((500, 500), dtype=np.uint8)
+
+         # Create empty result (no primitives)
+         from schemas.annotation import AnnotationGraph, AnnotationResult
+         empty_result = AnnotationResult(
+             annotation_graph=AnnotationGraph(),
+             overlay_image=None,
+             formal_report="",
+             json_output={},
+             processing_time=0.0
+         )
+
+         base_params = {"hough_line_threshold": 100, "hough_circle_threshold": 30}
+         refined = engine._adaptive_refine(img, empty_result, base_params)
+         # Should relax thresholds
+         assert refined["hough_line_threshold"] <= base_params["hough_line_threshold"]
+
+
+ class TestRetryLogic:
+     """Test retry logic."""
+
+     def test_should_retry_no_primitives(self):
+         """Test retry decision for no primitives."""
+         engine = ImageAnnotationEngine()
+         from schemas.annotation import AnnotationGraph, AnnotationResult
+         result = AnnotationResult(
+             annotation_graph=AnnotationGraph(),  # Empty
+             overlay_image=None,
+             formal_report="",
+             json_output={},
+             processing_time=0.0
+         )
+
+         assert engine._should_retry(result, attempt=0) is True
+
+     def test_should_retry_low_confidence(self):
+         """Test retry decision for low confidence."""
+         engine = ImageAnnotationEngine()
+         from schemas.annotation import AnnotationGraph, AnnotationResult, SemanticLabel, PrimitiveEntity
+
+         entity = PrimitiveEntity(id="test", pixel_coords=[(0, 0)], primitive_type="line")
+         label = SemanticLabel(entity_id="test", label="test", uncertainty=0.9)  # High uncertainty
+
+         graph = AnnotationGraph(entities=[entity], labels=[label])
+         result = AnnotationResult(
+             annotation_graph=graph,
+             overlay_image=None,
+             formal_report="",
+             json_output={},
+             processing_time=0.0
+         )
+
+         assert engine._should_retry(result, attempt=0) is True
+
+     def test_should_retry_max_attempts(self):
+         """Test retry decision when max attempts reached."""
+         engine = ImageAnnotationEngine()
+         engine.config.max_retries = 3
+
+         from schemas.annotation import AnnotationGraph, AnnotationResult
+         result = AnnotationResult(
+             annotation_graph=AnnotationGraph(),
+             overlay_image=None,
+             formal_report="",
+             json_output={},
+             processing_time=0.0
+         )
+
+         assert engine._should_retry(result, attempt=3) is False
+
+     def test_get_retry_params(self):
+         """Test getting retry parameters."""
+         engine = ImageAnnotationEngine()
+         base_params = {"hough_line_threshold": 100, "canny_low": 50}
+
+         retry_params = engine._get_retry_params(attempt=1, previous_result=None, base_params=base_params)
+         # Should relax thresholds
+         assert retry_params["hough_line_threshold"] < base_params["hough_line_threshold"]
+
+
+ class TestCaching:
+     """Test smart caching."""
+
+     def test_get_cache_key(self):
+         """Test cache key generation."""
+         engine = ImageAnnotationEngine()
+         # Create actually different images
+         img1 = np.zeros((100, 100, 3), dtype=np.uint8)
+         img1[50, 50] = [255, 255, 255]  # Add a white pixel
+         img2 = np.zeros((100, 100, 3), dtype=np.uint8)
+         img2[50, 50] = [128, 128, 128]  # Add a gray pixel (different)
+         params = {"test": "value"}
+
+         key1 = engine._get_cache_key(img1, params)
+         key2 = engine._get_cache_key(img2, params)
+         key3 = engine._get_cache_key(img1, params)
+
+         # Same image + params should give same key
+         assert key1 == key3
+         # Different images should give different keys (even if same shape)
+         assert key1 != key2
+
+     def test_cache_primitives(self):
+         """Test caching primitives."""
+         engine = ImageAnnotationEngine()
+         engine.config.cache_enabled = True
+
+         from schemas.annotation import PrimitiveEntity
+         primitives = [
+             PrimitiveEntity(id="1", pixel_coords=[(0, 0), (10, 10)], primitive_type="line")
+         ]
+
+         cache_key = "test_key"
+         engine._cache_primitives(cache_key, primitives)
+
+         # Check cache file exists
+         cache_file = engine._cache_dir / f"{cache_key}_primitives.json"
+         assert cache_file.exists()
+
+         # Cleanup
+         if cache_file.exists():
+             cache_file.unlink()
+
+     def test_get_cached_primitives(self):
+         """Test retrieving cached primitives."""
+         engine = ImageAnnotationEngine()
+         engine.config.cache_enabled = True
+
+         from schemas.annotation import PrimitiveEntity
+         primitives = [
+             PrimitiveEntity(id="1", pixel_coords=[(0, 0), (10, 10)], primitive_type="line")
+         ]
+
+         cache_key = "test_key_2"
+         engine._cache_primitives(cache_key, primitives)
+
+         cached = engine._get_cached_primitives(cache_key)
+         assert cached is not None
+         assert len(cached) == 1
+         assert cached[0].id == "1"
+
+         # Cleanup
+         cache_file = engine._cache_dir / f"{cache_key}_primitives.json"
+         if cache_file.exists():
+             cache_file.unlink()
+
+
+ class TestPrimitiveExtraction:
+     """Test primitive extraction methods."""
+
+     def test_extract_lines(self):
+         """Test line extraction."""
+         engine = ImageAnnotationEngine()
+         img = np.zeros((500, 500), dtype=np.uint8)
+         cv2.line(img, (0, 0), (500, 500), 255, 2)
+         cv2.line(img, (0, 500), (500, 0), 255, 2)
+
+         params = {"hough_line_threshold": 50, "hough_line_min_length": 10}
+         lines = engine._extract_lines(img, params)
+         assert len(lines) > 0
+
+     def test_extract_circles(self):
+         """Test circle extraction."""
+         engine = ImageAnnotationEngine()
+         img = np.zeros((500, 500), dtype=np.uint8)
+         cv2.circle(img, (250, 250), 50, 255, 2)
+
+         params = {"hough_circle_threshold": 30, "hough_circle_min_radius": 10}
+         circles = engine._extract_circles(img, params)
+         assert len(circles) > 0
+
+     def test_extract_contours(self):
+         """Test contour extraction."""
+         engine = ImageAnnotationEngine()
+         img = np.zeros((500, 500), dtype=np.uint8)
+         cv2.rectangle(img, (100, 100), (400, 400), 255, 2)
+
+         params = {"canny_low": 50, "canny_high": 150}
+         contours = engine._extract_contours(img, params)
+         assert len(contours) > 0
+
+     def test_compute_intersections(self):
+         """Test intersection computation."""
+         engine = ImageAnnotationEngine()
+         from schemas.annotation import PrimitiveEntity
+
+         # Create two lines that intersect
+         line1 = PrimitiveEntity(
+             id="line1",
+             pixel_coords=[(0, 0), (100, 100)],
+             primitive_type="line"
+         )
+         line2 = PrimitiveEntity(
+             id="line2",
+             pixel_coords=[(0, 100), (100, 0)],
+             primitive_type="line"
+         )
+
+         intersections = engine._compute_intersections([line1, line2])
+         assert len(intersections) > 0
+
+
+ class TestPreprocessing:
+     """Test image preprocessing."""
+
+     def test_preprocess_image(self):
+         """Test main preprocessing pipeline."""
+         engine = ImageAnnotationEngine()
+         img = np.random.randint(0, 255, (500, 500, 3), dtype=np.uint8)
+
+         processed = engine._preprocess_image(img)
+         assert processed.shape[0] > 0
+         assert processed.shape[1] > 0
+         assert len(processed.shape) == 2  # Grayscale
+
+     def test_adaptive_histogram_equalization(self):
+         """Test adaptive histogram equalization."""
+         engine = ImageAnnotationEngine()
+         img = np.random.randint(0, 255, (500, 500), dtype=np.uint8)
+
+         equalized = engine._adaptive_histogram_equalization(img)
+         assert equalized.shape == img.shape
+
+     def test_edge_amplification(self):
+         """Test edge amplification."""
+         engine = ImageAnnotationEngine()
+         img = np.random.randint(0, 255, (500, 500), dtype=np.uint8)
+
+         amplified = engine._edge_amplification(img, strength=0.7)
+         assert amplified.shape == img.shape
+
+
+ class TestQueryInterface:
+     """Test query/task-based interface."""
+
+     def test_extract_relevant_entities(self):
+         """Test extracting relevant entities from query."""
+         engine = ImageAnnotationEngine()
+         from schemas.annotation import AnnotationGraph, PrimitiveEntity, SemanticLabel
+
+         entity1 = PrimitiveEntity(id="1", pixel_coords=[(0, 0)], primitive_type="circle")
+         entity2 = PrimitiveEntity(id="2", pixel_coords=[(10, 10), (20, 20)], primitive_type="line")
+         label = SemanticLabel(entity_id="1", label="building", uncertainty=0.3)
+
+         graph = AnnotationGraph(entities=[entity1, entity2], labels=[label])
+
+         relevant = engine._extract_relevant_entities("find the largest building", graph)
+         assert len(relevant) > 0
+
+     def test_get_entity_size(self):
+         """Test entity size calculation."""
+         engine = ImageAnnotationEngine()
+         from schemas.annotation import PrimitiveEntity
+
+         # Circle
+         circle = PrimitiveEntity(
+             id="circle1",
+             pixel_coords=[(50, 50)],
+             primitive_type="circle",
+             metadata={"radius": 10}
+         )
+         size = engine._get_entity_size(circle)
+         assert size > 0
+
+         # Line
+         line = PrimitiveEntity(
+             id="line1",
+             pixel_coords=[(0, 0), (10, 10)],
+             primitive_type="line"
+         )
+         size = engine._get_entity_size(line)
+         assert size > 0
+
+     def test_perform_query_measurements(self):
+         """Test performing measurements for queries."""
+         engine = ImageAnnotationEngine()
+         from schemas.annotation import PrimitiveEntity, AnnotationGraph
+
+         circle = PrimitiveEntity(
+             id="circle1",
+             pixel_coords=[(50, 50)],
+             primitive_type="circle",
+             metadata={"radius": 10}
+         )
+         graph = AnnotationGraph(entities=[circle])
+
+         measurements = engine._perform_query_measurements("measure the circle", [circle], graph)
+         assert "circle1" in measurements
+         assert "radius" in measurements["circle1"]
+         assert "area" in measurements["circle1"]
+
+
+ class TestOutputFormatting:
+     """Test output formatting."""
+
+     def test_format_output_overlay(self):
+         """Test formatting output as overlay."""
+         engine = ImageAnnotationEngine()
+         from schemas.annotation import AnnotationGraph, AnnotationResult
+         import cv2
+
+         overlay_img = np.zeros((100, 100, 3), dtype=np.uint8)
+         _, buffer = cv2.imencode('.jpg', overlay_img)
+         overlay_bytes = buffer.tobytes()
+
+         result = AnnotationResult(
+             annotation_graph=AnnotationGraph(),
+             overlay_image=overlay_bytes,
+             formal_report="Test report",
+             json_output={"test": "data"},
+             processing_time=1.0
+         )
+
+         formatted = engine._format_output(result, "overlay")
+         assert isinstance(formatted, np.ndarray)
+
+     def test_format_output_json(self):
+         """Test formatting output as JSON."""
+         engine = ImageAnnotationEngine()
+         from schemas.annotation import AnnotationGraph, AnnotationResult
+
+         result = AnnotationResult(
+             annotation_graph=AnnotationGraph(),
+             overlay_image=None,
+             formal_report="Test report",
+             json_output={"test": "data"},
+             processing_time=1.0
+         )
+
+         formatted = engine._format_output(result, "json")
+         assert isinstance(formatted, dict)
+         assert "test" in formatted
+
+     def test_format_output_report(self):
+         """Test formatting output as report."""
+         engine = ImageAnnotationEngine()
+         from schemas.annotation import AnnotationGraph, AnnotationResult
+
+         result = AnnotationResult(
+             annotation_graph=AnnotationGraph(),
+             overlay_image=None,
+             formal_report="Test report content",
+             json_output={},
+             processing_time=1.0
+         )
+
+         formatted = engine._format_output(result, "report")
+         assert isinstance(formatted, str)
+         assert "Test report" in formatted
+
+
+ if __name__ == "__main__":
+     pytest.main([__file__, "-v"])
tests/test_training_moe.py ADDED
@@ -0,0 +1,13 @@
+ from training.finetune import _resolve_model_info
+
+
+ def test_resolve_model_info_switch_is_seq2seq() -> None:
+     info = _resolve_model_info("google/switch-base-8")
+     assert info["arch"] == "seq2seq"
+     assert info["moe"] is True
+
+
+ def test_resolve_model_info_qwen_is_causal() -> None:
+     info = _resolve_model_info("Qwen/Qwen2.5-1.5B-Instruct")
+     assert info["arch"] == "causal"
+     assert info["moe"] is False
training/__init__.py ADDED
@@ -0,0 +1,42 @@
+ """Training utilities for LRM finetuning."""
+
+ from training.datasets import (
+     ReActExample,
+     examples_from_traces,
+     filter_examples,
+     merge_examples,
+     plan_result_to_examples,
+     save_jsonl,
+ )
+ from training.finetune import (
+     FinetuneConfig,
+     full_finetune_qwen25_0_5b_config,
+     full_finetune_qwen25_0_5b_config_cloud,
+     full_finetune_qwen25_1_5b_config,
+     full_finetune_qwen25_7b_config,
+     full_finetune_qwen25_14b_config,
+     full_finetune_switch_base_8_config,
+     full_finetune_switch_large_16_config,
+     run_finetune,
+ )
+ from training.eval import EvalConfig, run_eval
+
+ __all__ = [
+     "ReActExample",
+     "examples_from_traces",
+     "filter_examples",
+     "merge_examples",
+     "plan_result_to_examples",
+     "save_jsonl",
+     "FinetuneConfig",
+     "full_finetune_qwen25_0_5b_config",
+     "full_finetune_qwen25_0_5b_config_cloud",
+     "full_finetune_qwen25_1_5b_config",
+     "full_finetune_qwen25_7b_config",
+     "full_finetune_qwen25_14b_config",
+     "full_finetune_switch_base_8_config",
+     "full_finetune_switch_large_16_config",
+     "run_finetune",
+     "EvalConfig",
+     "run_eval",
+ ]
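
Note: as the hunk for tests/test_image_annotation_unit.py above shows, that module skips itself at import time unless CRCA_RUN_IMAGE_ANNOTATION_TESTS is set to "1". The following is a minimal sketch (not part of the package) of opting in from Python; it mirrors the module's own pytest.main([__file__, "-v"]) entry point and assumes a local checkout with the optional image dependencies (e.g. opencv-python for cv2, Pillow for PIL) installed:

    # Sketch: opt in to the gated image-annotation unit tests added in 1.5.0.
    import os
    import pytest

    # The gate is checked at module import time, so set it before pytest collects the file.
    os.environ["CRCA_RUN_IMAGE_ANNOTATION_TESTS"] = "1"
    raise SystemExit(pytest.main(["tests/test_image_annotation_unit.py", "-v"]))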