PyPI - kiln-ai - Versions diffs - 0.20.1__py3-none-any.whl → 0.22.0__py3-none-any.whl - Mend

kiln-ai 0.20.1__py3-none-any.whl → 0.22.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of kiln-ai might be problematic. Click here for more details.

Files changed (133) hide show

kiln_ai/adapters/__init__.py +6 -0
kiln_ai/adapters/adapter_registry.py +43 -226
kiln_ai/adapters/chunkers/__init__.py +13 -0
kiln_ai/adapters/chunkers/base_chunker.py +42 -0
kiln_ai/adapters/chunkers/chunker_registry.py +16 -0
kiln_ai/adapters/chunkers/fixed_window_chunker.py +39 -0
kiln_ai/adapters/chunkers/helpers.py +23 -0
kiln_ai/adapters/chunkers/test_base_chunker.py +63 -0
kiln_ai/adapters/chunkers/test_chunker_registry.py +28 -0
kiln_ai/adapters/chunkers/test_fixed_window_chunker.py +346 -0
kiln_ai/adapters/chunkers/test_helpers.py +75 -0
kiln_ai/adapters/data_gen/test_data_gen_task.py +9 -3
kiln_ai/adapters/embedding/__init__.py +0 -0
kiln_ai/adapters/embedding/base_embedding_adapter.py +44 -0
kiln_ai/adapters/embedding/embedding_registry.py +32 -0
kiln_ai/adapters/embedding/litellm_embedding_adapter.py +199 -0
kiln_ai/adapters/embedding/test_base_embedding_adapter.py +283 -0
kiln_ai/adapters/embedding/test_embedding_registry.py +166 -0
kiln_ai/adapters/embedding/test_litellm_embedding_adapter.py +1149 -0
kiln_ai/adapters/eval/eval_runner.py +6 -2
kiln_ai/adapters/eval/test_base_eval.py +1 -3
kiln_ai/adapters/eval/test_g_eval.py +1 -1
kiln_ai/adapters/extractors/__init__.py +18 -0
kiln_ai/adapters/extractors/base_extractor.py +72 -0
kiln_ai/adapters/extractors/encoding.py +20 -0
kiln_ai/adapters/extractors/extractor_registry.py +44 -0
kiln_ai/adapters/extractors/extractor_runner.py +112 -0
kiln_ai/adapters/extractors/litellm_extractor.py +406 -0
kiln_ai/adapters/extractors/test_base_extractor.py +244 -0
kiln_ai/adapters/extractors/test_encoding.py +54 -0
kiln_ai/adapters/extractors/test_extractor_registry.py +181 -0
kiln_ai/adapters/extractors/test_extractor_runner.py +181 -0
kiln_ai/adapters/extractors/test_litellm_extractor.py +1290 -0
kiln_ai/adapters/fine_tune/test_dataset_formatter.py +2 -2
kiln_ai/adapters/fine_tune/test_fireworks_tinetune.py +2 -6
kiln_ai/adapters/fine_tune/test_together_finetune.py +2 -6
kiln_ai/adapters/ml_embedding_model_list.py +494 -0
kiln_ai/adapters/ml_model_list.py +876 -18
kiln_ai/adapters/model_adapters/litellm_adapter.py +40 -75
kiln_ai/adapters/model_adapters/test_litellm_adapter.py +79 -1
kiln_ai/adapters/model_adapters/test_litellm_adapter_tools.py +119 -5
kiln_ai/adapters/model_adapters/test_saving_adapter_results.py +9 -3
kiln_ai/adapters/model_adapters/test_structured_output.py +9 -10
kiln_ai/adapters/ollama_tools.py +69 -12
kiln_ai/adapters/provider_tools.py +190 -46
kiln_ai/adapters/rag/deduplication.py +49 -0
kiln_ai/adapters/rag/progress.py +252 -0
kiln_ai/adapters/rag/rag_runners.py +844 -0
kiln_ai/adapters/rag/test_deduplication.py +195 -0
kiln_ai/adapters/rag/test_progress.py +785 -0
kiln_ai/adapters/rag/test_rag_runners.py +2376 -0
kiln_ai/adapters/remote_config.py +80 -8
kiln_ai/adapters/test_adapter_registry.py +579 -86
kiln_ai/adapters/test_ml_embedding_model_list.py +239 -0
kiln_ai/adapters/test_ml_model_list.py +202 -0
kiln_ai/adapters/test_ollama_tools.py +340 -1
kiln_ai/adapters/test_prompt_builders.py +1 -1
kiln_ai/adapters/test_provider_tools.py +199 -8
kiln_ai/adapters/test_remote_config.py +551 -56
kiln_ai/adapters/vector_store/__init__.py +1 -0
kiln_ai/adapters/vector_store/base_vector_store_adapter.py +83 -0
kiln_ai/adapters/vector_store/lancedb_adapter.py +389 -0
kiln_ai/adapters/vector_store/test_base_vector_store.py +160 -0
kiln_ai/adapters/vector_store/test_lancedb_adapter.py +1841 -0
kiln_ai/adapters/vector_store/test_vector_store_registry.py +199 -0
kiln_ai/adapters/vector_store/vector_store_registry.py +33 -0
kiln_ai/datamodel/__init__.py +16 -13
kiln_ai/datamodel/basemodel.py +201 -4
kiln_ai/datamodel/chunk.py +158 -0
kiln_ai/datamodel/datamodel_enums.py +27 -0
kiln_ai/datamodel/embedding.py +64 -0
kiln_ai/datamodel/external_tool_server.py +206 -54
kiln_ai/datamodel/extraction.py +317 -0
kiln_ai/datamodel/project.py +33 -1
kiln_ai/datamodel/rag.py +79 -0
kiln_ai/datamodel/task.py +5 -0
kiln_ai/datamodel/task_output.py +41 -11
kiln_ai/datamodel/test_attachment.py +649 -0
kiln_ai/datamodel/test_basemodel.py +270 -14
kiln_ai/datamodel/test_chunk_models.py +317 -0
kiln_ai/datamodel/test_dataset_split.py +1 -1
kiln_ai/datamodel/test_datasource.py +50 -0
kiln_ai/datamodel/test_embedding_models.py +448 -0
kiln_ai/datamodel/test_eval_model.py +6 -6
kiln_ai/datamodel/test_external_tool_server.py +534 -152
kiln_ai/datamodel/test_extraction_chunk.py +206 -0
kiln_ai/datamodel/test_extraction_model.py +501 -0
kiln_ai/datamodel/test_rag.py +641 -0
kiln_ai/datamodel/test_task.py +35 -1
kiln_ai/datamodel/test_tool_id.py +187 -1
kiln_ai/datamodel/test_vector_store.py +320 -0
kiln_ai/datamodel/tool_id.py +58 -0
kiln_ai/datamodel/vector_store.py +141 -0
kiln_ai/tools/base_tool.py +12 -3
kiln_ai/tools/built_in_tools/math_tools.py +12 -4
kiln_ai/tools/kiln_task_tool.py +158 -0
kiln_ai/tools/mcp_server_tool.py +2 -2
kiln_ai/tools/mcp_session_manager.py +51 -22
kiln_ai/tools/rag_tools.py +164 -0
kiln_ai/tools/test_kiln_task_tool.py +527 -0
kiln_ai/tools/test_mcp_server_tool.py +4 -15
kiln_ai/tools/test_mcp_session_manager.py +187 -227
kiln_ai/tools/test_rag_tools.py +929 -0
kiln_ai/tools/test_tool_registry.py +290 -7
kiln_ai/tools/tool_registry.py +69 -16
kiln_ai/utils/__init__.py +3 -0
kiln_ai/utils/async_job_runner.py +62 -17
kiln_ai/utils/config.py +2 -2
kiln_ai/utils/env.py +15 -0
kiln_ai/utils/filesystem.py +14 -0
kiln_ai/utils/filesystem_cache.py +60 -0
kiln_ai/utils/litellm.py +94 -0
kiln_ai/utils/lock.py +100 -0
kiln_ai/utils/mime_type.py +38 -0
kiln_ai/utils/open_ai_types.py +19 -2
kiln_ai/utils/pdf_utils.py +59 -0
kiln_ai/utils/test_async_job_runner.py +151 -35
kiln_ai/utils/test_env.py +142 -0
kiln_ai/utils/test_filesystem_cache.py +316 -0
kiln_ai/utils/test_litellm.py +206 -0
kiln_ai/utils/test_lock.py +185 -0
kiln_ai/utils/test_mime_type.py +66 -0
kiln_ai/utils/test_open_ai_types.py +88 -12
kiln_ai/utils/test_pdf_utils.py +86 -0
kiln_ai/utils/test_uuid.py +111 -0
kiln_ai/utils/test_validation.py +524 -0
kiln_ai/utils/uuid.py +9 -0
kiln_ai/utils/validation.py +90 -0
{kiln_ai-0.20.1.dist-info → kiln_ai-0.22.0.dist-info}/METADATA +9 -1
kiln_ai-0.22.0.dist-info/RECORD +213 -0
kiln_ai-0.20.1.dist-info/RECORD +0 -138
{kiln_ai-0.20.1.dist-info → kiln_ai-0.22.0.dist-info}/WHEEL +0 -0
{kiln_ai-0.20.1.dist-info → kiln_ai-0.22.0.dist-info}/licenses/LICENSE.txt +0 -0

kiln_ai/utils/test_validation.py ADDED Viewed

@@ -0,0 +1,524 @@
+import pytest
+from kiln_ai.utils.validation import (
+    tool_name_validator,
+    validate_return_dict_prop,
+    validate_return_dict_prop_optional,
+)
+class TestValidateReturnDictProp:
+    """Checks for validate_return_dict_prop, the validator for required keys."""
+    def test_valid_string_property(self):
+        """A str stored under the key is handed back unchanged."""
+        payload = {"name": "test_value"}
+        assert validate_return_dict_prop(payload, "name", str, "prefix") == "test_value"
+    def test_valid_int_property(self):
+        """An int stored under the key is handed back unchanged."""
+        payload = {"count": 42}
+        assert validate_return_dict_prop(payload, "count", int, "prefix") == 42
+    def test_valid_bool_property(self):
+        """A bool stored under the key is handed back as the same object."""
+        payload = {"enabled": True}
+        assert validate_return_dict_prop(payload, "enabled", bool, "prefix") is True
+    def test_valid_list_property(self):
+        """A list stored under the key is handed back unchanged."""
+        payload = {"items": [1, 2, 3]}
+        assert validate_return_dict_prop(payload, "items", list, "prefix") == [1, 2, 3]
+    def test_valid_dict_property(self):
+        """A nested dict stored under the key is handed back unchanged."""
+        payload = {"config": {"key": "value"}}
+        returned = validate_return_dict_prop(payload, "config", dict, "prefix")
+        assert returned == {"key": "value"}
+    def test_missing_key_raises_error(self):
+        """An absent key is reported as a missing required property."""
+        payload = {"other_key": "value"}
+        with pytest.raises(ValueError) as caught:
+            validate_return_dict_prop(payload, "missing_key", str, "prefix")
+        assert str(caught.value) == "prefix missing_key is a required property"
+    def test_wrong_type_raises_error(self):
+        """A value of the wrong type is reported together with the expected type."""
+        payload = {"count": "not_a_number"}
+        with pytest.raises(ValueError) as caught:
+            validate_return_dict_prop(payload, "count", int, "prefix")
+        assert str(caught.value) == "prefix count must be of type <class 'int'>"
+    def test_none_value_with_none_type(self):
+        """None passes validation when NoneType is the requested type."""
+        payload = {"value": None}
+        returned = validate_return_dict_prop(payload, "value", type(None), "prefix")
+        assert returned is None
+    def test_none_value_with_string_type_raises_error(self):
+        """None is rejected when a str is requested."""
+        payload = {"value": None}
+        with pytest.raises(ValueError) as caught:
+            validate_return_dict_prop(payload, "value", str, "prefix")
+        assert str(caught.value) == "prefix value must be of type <class 'str'>"
+    @pytest.mark.parametrize(
+        "value,kind",
+        [
+            ("string", str),
+            (123, int),
+            (3.14, float),
+            (True, bool),
+            ([1, 2, 3], list),
+            ({"k": "v"}, dict),
+            ((1, 2), tuple),
+            ({1, 2, 3}, set),
+        ],
+    )
+    def test_various_types_succeed(self, value, kind):
+        """Each value validates against its own type and is returned intact."""
+        returned = validate_return_dict_prop({"value": value}, "value", kind, "prefix")
+        assert returned == value
+        assert isinstance(returned, kind)
+    @pytest.mark.parametrize(
+        "value,mismatched_kind",
+        [
+            ("string", int),
+            (123, str),
+            (3.14, int),
+            (True, str),
+            ([1, 2, 3], dict),
+            ({"k": "v"}, list),
+            ((1, 2), list),
+            ({1, 2, 3}, list),
+        ],
+    )
+    def test_various_types_fail(self, value, mismatched_kind):
+        """Each value is rejected when validated against an unrelated type."""
+        with pytest.raises(ValueError):
+            validate_return_dict_prop(
+                {"value": value}, "value", mismatched_kind, "prefix"
+            )
+    def test_empty_dict_raises_error(self):
+        """Looking up any key in an empty dict reports it as missing."""
+        with pytest.raises(ValueError) as caught:
+            validate_return_dict_prop({}, "any_key", str, "prefix")
+        assert str(caught.value) == "prefix any_key is a required property"
+    def test_empty_string_key(self):
+        """The empty string is accepted as a key like any other."""
+        payload = {"": "empty_key_value"}
+        assert validate_return_dict_prop(payload, "", str, "prefix") == "empty_key_value"
+    def test_numeric_values_and_inheritance(self):
+        """A bool satisfies an int check because the validator uses isinstance."""
+        # bool subclasses int in Python, so True is accepted where an int is required
+        returned = validate_return_dict_prop({"flag": True}, "flag", int, "prefix")
+        assert returned is True
+        assert isinstance(returned, int)
+class TestValidateReturnDictPropOptional:
+    """Checks for validate_return_dict_prop_optional, the validator for optional keys."""
+    def test_valid_string_property(self):
+        """A str stored under the key is handed back unchanged."""
+        payload = {"name": "test_value"}
+        returned = validate_return_dict_prop_optional(payload, "name", str, "prefix")
+        assert returned == "test_value"
+    def test_valid_int_property(self):
+        """An int stored under the key is handed back unchanged."""
+        payload = {"count": 42}
+        returned = validate_return_dict_prop_optional(payload, "count", int, "prefix")
+        assert returned == 42
+    def test_missing_key_returns_none(self):
+        """An absent key yields None rather than an error."""
+        payload = {"other_key": "value"}
+        returned = validate_return_dict_prop_optional(
+            payload, "missing_key", str, "prefix"
+        )
+        assert returned is None
+    def test_none_value_returns_none(self):
+        """A key explicitly set to None yields None."""
+        payload = {"value": None}
+        returned = validate_return_dict_prop_optional(payload, "value", str, "prefix")
+        assert returned is None
+    def test_empty_dict_returns_none(self):
+        """Any key looked up in an empty dict yields None."""
+        returned = validate_return_dict_prop_optional({}, "any_key", str, "prefix")
+        assert returned is None
+    def test_wrong_type_raises_error(self):
+        """A present value of the wrong type still raises ValueError."""
+        payload = {"count": "not_a_number"}
+        with pytest.raises(ValueError) as caught:
+            validate_return_dict_prop_optional(payload, "count", int, "prefix")
+        assert str(caught.value) == "prefix count must be of type <class 'int'>"
+    def test_explicit_none_vs_missing_key(self):
+        """A missing key and an explicit None are indistinguishable: both give None."""
+        # Key absent from the dict
+        without_key = {"other": "value"}
+        assert (
+            validate_return_dict_prop_optional(without_key, "target", str, "prefix")
+            is None
+        )
+        # Key present but set to None
+        with_none = {"target": None}
+        assert (
+            validate_return_dict_prop_optional(with_none, "target", str, "prefix")
+            is None
+        )
+    @pytest.mark.parametrize(
+        "value,kind",
+        [
+            ("string", str),
+            (123, int),
+            (3.14, float),
+            (True, bool),
+            ([1, 2, 3], list),
+            ({"k": "v"}, dict),
+            ((1, 2), tuple),
+            ({1, 2, 3}, set),
+        ],
+    )
+    def test_various_types_succeed(self, value, kind):
+        """Each value validates against its own type and is returned intact."""
+        returned = validate_return_dict_prop_optional(
+            {"value": value}, "value", kind, "prefix"
+        )
+        assert returned == value
+        assert isinstance(returned, kind)
+    @pytest.mark.parametrize(
+        "value,mismatched_kind",
+        [
+            ("string", int),
+            (123, str),
+            (3.14, int),
+            (True, str),
+            ([1, 2, 3], dict),
+            ({"k": "v"}, list),
+            ((1, 2), list),
+            ({1, 2, 3}, list),
+        ],
+    )
+    def test_various_types_fail(self, value, mismatched_kind):
+        """Each present value is rejected when validated against an unrelated type."""
+        with pytest.raises(ValueError):
+            validate_return_dict_prop_optional(
+                {"value": value}, "value", mismatched_kind, "prefix"
+            )
+    def test_empty_string_key_with_value(self):
+        """The empty string works as a key when a value is stored under it."""
+        payload = {"": "empty_key_value"}
+        returned = validate_return_dict_prop_optional(payload, "", str, "prefix")
+        assert returned == "empty_key_value"
+    def test_empty_string_key_missing(self):
+        """The empty string as a key yields None when it is not in the dict."""
+        payload = {"other": "value"}
+        returned = validate_return_dict_prop_optional(payload, "", str, "prefix")
+        assert returned is None
+    def test_numeric_inheritance_behavior(self):
+        """A bool satisfies an int check because validation relies on isinstance."""
+        # bool subclasses int in Python, so True is accepted where an int is required
+        returned = validate_return_dict_prop_optional(
+            {"flag": True}, "flag", int, "prefix"
+        )
+        assert returned is True
+        assert isinstance(returned, int)
+    @pytest.mark.parametrize(
+        "payload,key,kind,expected",
+        [
+            ({"count": 0}, "count", int, 0),
+            ({"flag": False}, "flag", bool, False),
+            ({"items": []}, "items", list, []),
+            ({"config": {}}, "config", dict, {}),
+            ({"text": ""}, "text", str, ""),
+        ],
+    )
+    def test_optional_with_zero_values(self, payload, key, kind, expected):
+        """Falsy values (0, False, [], {}, "") are returned, not collapsed to None."""
+        returned = validate_return_dict_prop_optional(payload, key, kind, "prefix")
+        assert returned == expected
+        assert returned is not None
+class TestToolNameValidator:
+    """Checks for tool_name_validator: accepted names and each rejection message."""
+    @pytest.mark.parametrize(
+        "name",
+        [
+            "tool",
+            "my_tool",
+            "data_processor",
+            "test123",
+            "a",
+            "tool_v2",
+            "get_weather",
+        ],
+    )
+    def test_valid_simple_name(self, name):
+        """Plain snake_case names are returned unchanged."""
+        assert tool_name_validator(name) == name
+    @pytest.mark.parametrize(
+        "name",
+        [
+            "tool1",
+            "my_tool_v2",
+            "data_processor_3000",
+            "test_123_abc",
+            "version2",
+        ],
+    )
+    def test_valid_name_with_numbers(self, name):
+        """Names containing digits after the first character are returned unchanged."""
+        assert tool_name_validator(name) == name
+    def test_none_name_raises_error(self):
+        """None is reported as an empty name."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(None)
+        assert str(caught.value) == "Tool name cannot be empty"
+    def test_empty_string_raises_error(self):
+        """The empty string is reported as an empty name."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator("")
+        assert str(caught.value) == "Tool name cannot be empty"
+    @pytest.mark.parametrize("name", [" ", "  ", "\t", "\n", "   \t  "])
+    def test_whitespace_only_raises_error(self, name):
+        """Strings made only of whitespace are reported as an empty name."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(name)
+        assert str(caught.value) == "Tool name cannot be empty"
+    @pytest.mark.parametrize("candidate", [123, [], {}, True, 3.14])
+    def test_non_string_raises_error(self, candidate):
+        """Values that are not strings are rejected as such."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(candidate)
+        assert str(caught.value) == "Tool name must be a string"
+    @pytest.mark.parametrize(
+        "name",
+        [
+            "Tool",
+            "MY_TOOL",
+            "myTool",
+            "tool_Name",
+            "TOOL",
+            "Test123",
+        ],
+    )
+    def test_uppercase_letters_raise_error(self, name):
+        """Any uppercase letter triggers the snake_case error."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(name)
+        assert "Tool name must be in snake_case" in str(caught.value)
+    @pytest.mark.parametrize(
+        "name",
+        [
+            "tool-name",
+            "tool.name",
+            "tool@name",
+            "tool#name",
+            "tool$name",
+            "tool%name",
+            "tool&name",
+            "tool*name",
+            "tool+name",
+            "tool=name",
+            "tool!name",
+            "tool?name",
+            "tool name",  # space
+            "tool,name",
+            "tool;name",
+            "tool:name",
+            "tool'name",
+            'tool"name',
+            "tool(name)",
+            "tool[name]",
+            "tool{name}",
+            "tool/name",
+            "tool\\name",
+        ],
+    )
+    def test_special_characters_raise_error(self, name):
+        """Punctuation, spaces and slashes trigger the snake_case error."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(name)
+        assert "Tool name must be in snake_case" in str(caught.value)
+    @pytest.mark.parametrize("name", ["_tool", "_my_tool", "_", "_123"])
+    def test_starts_with_underscore_raises_error(self, name):
+        """A leading underscore is rejected with the edge-underscore message."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(name)
+        message = str(caught.value)
+        assert message == "Tool name cannot start or end with an underscore"
+    @pytest.mark.parametrize("name", ["tool_", "my_tool_", "test_"])
+    def test_ends_with_underscore_raises_error(self, name):
+        """A trailing underscore is rejected with the edge-underscore message."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(name)
+        message = str(caught.value)
+        assert message == "Tool name cannot start or end with an underscore"
+    @pytest.mark.parametrize(
+        "name",
+        [
+            "tool__name",
+            "my__tool",
+            "test___name",
+            "a__b__c",
+            "tool____name",
+        ],
+    )
+    def test_consecutive_underscores_raise_error(self, name):
+        """Two or more underscores in a row are rejected."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(name)
+        message = str(caught.value)
+        assert message == "Tool name cannot contain consecutive underscores"
+    @pytest.mark.parametrize("name", ["1tool", "2_tool", "123abc", "9test"])
+    def test_starts_with_number_raises_error(self, name):
+        """A leading digit is rejected with the leading-letter message."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(name)
+        assert str(caught.value) == "Tool name must start with a lowercase letter"
+    @pytest.mark.parametrize("name", ["_1tool", "_2tool"])
+    def test_starts_with_underscore_number_raises_error(self, name):
+        """Underscore-then-digit names fail on the underscore rule, which runs first."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(name)
+        # The edge-underscore check is evaluated before the leading-letter check
+        message = str(caught.value)
+        assert message == "Tool name cannot start or end with an underscore"
+    def test_long_name_raises_error(self):
+        """A 65-character name is rejected with the length message."""
+        too_long = "a" * 65
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(too_long)
+        assert str(caught.value) == "Tool name must be less than 64 characters long"
+    def test_exactly_64_characters_succeeds(self):
+        """A name of exactly 64 characters is accepted."""
+        at_limit = "a" * 64
+        assert tool_name_validator(at_limit) == at_limit
+    @pytest.mark.parametrize(
+        "name,expected_length",
+        [
+            ("a", 1),  # minimum valid length
+            ("ab", 2),
+            ("a" * 63, 63),  # just under limit
+            ("a" * 64, 64),  # exactly at limit
+        ],
+    )
+    def test_boundary_length_cases(self, name, expected_length):
+        """Names at the shortest and longest accepted lengths pass unchanged."""
+        returned = tool_name_validator(name)
+        assert returned == name
+        assert len(returned) == expected_length
+    @pytest.mark.parametrize(
+        "name",
+        [
+            "get_user_data",
+            "process_payment_info",
+            "validate_email_address",
+            "send_notification_v2",
+            "calculate_tax_amount",
+            "fetch_weather_data_for_city",
+            "convert_currency_usd_to_eur",
+            "a1b2c3d4e5f6g7h8i9j0",
+            "tool_with_many_underscores_and_numbers_123",
+        ],
+    )
+    def test_complex_valid_names(self, name):
+        """Longer multi-word names mixing letters, digits and underscores are accepted."""
+        assert tool_name_validator(name) == name
+    @pytest.mark.parametrize(
+        "invalid_name,expected_error",
+        [
+            (None, "Tool name cannot be empty"),
+            ("", "Tool name cannot be empty"),
+            ("   ", "Tool name cannot be empty"),
+            (123, "Tool name must be a string"),
+            ("Tool", "Tool name must be in snake_case"),
+            ("tool-name", "Tool name must be in snake_case"),
+            ("_tool", "Tool name cannot start or end with an underscore"),
+            ("tool_", "Tool name cannot start or end with an underscore"),
+            ("tool__name", "Tool name cannot contain consecutive underscores"),
+            ("1tool", "Tool name must start with a lowercase letter"),
+            ("a" * 65, "Tool name must be less than 64 characters long"),
+        ],
+    )
+    def test_parametrized_invalid_cases(self, invalid_name, expected_error):
+        """One representative input per rule produces that rule's message."""
+        with pytest.raises(ValueError) as caught:
+            tool_name_validator(invalid_name)
+        assert expected_error in str(caught.value)
+    def test_edge_case_single_character_names(self):
+        """Every lowercase letter is a valid name; other single characters are not."""
+        # Each lowercase ASCII letter on its own is accepted
+        for letter in "abcdefghijklmnopqrstuvwxyz":
+            assert tool_name_validator(letter) == letter
+        # Uppercase letters, digits, underscore and symbols on their own are rejected
+        for symbol in "ABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789_-+=":
+            with pytest.raises(ValueError):
+                tool_name_validator(symbol)

kiln_ai/utils/uuid.py ADDED Viewed

@@ -0,0 +1,9 @@
+import uuid
+# Namespace under which string_to_uuid derives its UUIDs.
+# Do not change this: it would break backwards compatibility with existing UUIDs.
+KILN_UUID_NAMESPACE = uuid.uuid5(uuid.NAMESPACE_DNS, "kiln.tech")
+def string_to_uuid(s: str) -> uuid.UUID:
+    """Derive the UUIDv5 of `s` under KILN_UUID_NAMESPACE; equal strings give equal UUIDs."""
+    derived = uuid.uuid5(KILN_UUID_NAMESPACE, s)
+    return derived

kiln_ai/utils/validation.py ADDED Viewed

@@ -0,0 +1,90 @@
+import re
+from typing import Annotated, Any, TypeVar, Union
+from pydantic import BeforeValidator
+# Links the `type` argument of the validators below to the type they return.
+T = TypeVar("T")
+def validate_return_dict_prop(
+    dict: dict[str, Any], key: str, type: type[T], error_msg_prefix: str
+) -> T:
+    """
+    Fetch a required property from a dictionary, checking its type on the way out.
+    Args:
+        dict: The dictionary holding the property.
+        key: The key the property is stored under.
+        type: The type the value must be an instance of. The check uses
+            isinstance, so subclasses are accepted (a bool passes an int check).
+        error_msg_prefix: Text placed, followed by a space, at the start of any
+            error message.
+    Returns:
+        The value stored under key.
+    Raises:
+        ValueError: If key is absent from the dictionary, or if the stored value
+            is not an instance of type.
+    Example:
+        >>> validate_return_dict_prop({"key": "value"}, "key", str, "LanceDB vector store configs properties:")
+        'value'
+    """
+    # `dict` and `type` are parameters here and shadow the builtins inside this body
+    if key not in dict:
+        raise ValueError(f"{error_msg_prefix} {key} is a required property")
+    value = dict[key]
+    if isinstance(value, type):
+        return value
+    raise ValueError(f"{error_msg_prefix} {key} must be of type {type}")
+def validate_return_dict_prop_optional(
+    dict: dict[str, Any], key: str, type: type[T], error_msg_prefix: str
+) -> Union[T, None]:
+    """
+    Fetch an optional property from a dictionary, type-checking it when present.
+    Args:
+        dict: The dictionary that may hold the property.
+        key: The key the property is stored under.
+        type: The type a present, non-None value must be an instance of.
+        error_msg_prefix: The prefix of the error message.
+    Returns:
+        None when key is absent or its value is None; otherwise the stored value.
+    Raises:
+        ValueError: If a non-None value is present but is not an instance of type
+            (raised by validate_return_dict_prop).
+    """
+    # .get() gives None both for an absent key and for an explicit None value
+    if dict.get(key) is None:
+        return None
+    return validate_return_dict_prop(dict, key, type, error_msg_prefix)
+def tool_name_validator(name: str) -> str:
+    """
+    Validate a tool name and return it unchanged.
+    A valid name is a non-blank string made only of lowercase letters (a-z),
+    digits (0-9) and single underscores; it starts with a letter, does not end
+    with an underscore and is at most 64 characters long.
+    Args:
+        name: The candidate tool name. Annotated as str, but None and non-string
+            values are checked for explicitly and rejected with a ValueError.
+    Returns:
+        The validated name, exactly as passed in.
+    Raises:
+        ValueError: If a rule is violated. Rules are checked in a fixed order
+            (empty, non-string, character set, edge underscores, consecutive
+            underscores, leading letter, length); the first failure is reported.
+    """
+    # None, "" and whitespace-only strings are all reported as empty
+    if name is None or (isinstance(name, str) and not name.strip()):
+        raise ValueError("Tool name cannot be empty")
+    if not isinstance(name, str):
+        raise ValueError("Tool name must be a string")
+    # Only lowercase letters, numbers and underscores are allowed. Use fullmatch
+    # rather than match with "$": "$" also matches just before a trailing newline,
+    # which would let a name such as "tool\n" pass every check below.
+    if not re.fullmatch(r"[a-z0-9_]+", name):
+        raise ValueError(
+            "Tool name must be in snake_case: containing only lowercase letters (a-z), numbers (0-9), and underscores"
+        )
+    # Check that it doesn't start or end with underscore
+    if name.startswith("_") or name.endswith("_"):
+        raise ValueError("Tool name cannot start or end with an underscore")
+    # Check that it doesn't have consecutive underscores
+    if "__" in name:
+        raise ValueError("Tool name cannot contain consecutive underscores")
+    # Only a digit can still be in first position here; require a letter instead
+    if not re.match(r"[a-z]", name):
+        raise ValueError("Tool name must start with a lowercase letter")
+    # Names of exactly 64 characters are accepted; the message wording is kept
+    # as-is because callers and tests compare against it verbatim
+    if len(name) > 64:
+        raise ValueError("Tool name must be less than 64 characters long")
+    return name
+# str annotated with tool_name_validator as a pydantic BeforeValidator, for use
+# as the declared type of tool-name fields.
+ToolNameString = Annotated[str, BeforeValidator(tool_name_validator)]

{kiln_ai-0.20.1.dist-info → kiln_ai-0.22.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: kiln-ai
-Version: 0.20.1
+Version: 0.22.0
 Summary: Kiln AI
 Project-URL: Homepage, https://kiln.tech
 Project-URL: Repository, https://github.com/Kiln-AI/kiln
@@ -15,15 +15,23 @@ Classifier: Programming Language :: Python :: 3.11
 Classifier: Programming Language :: Python :: 3.12
 Classifier: Programming Language :: Python :: 3.13
 Requires-Python: >=3.10
+Requires-Dist: anyio>=4.10.0
 Requires-Dist: boto3>=1.37.10
 Requires-Dist: coverage>=7.6.4
 Requires-Dist: exceptiongroup>=1.0.0; python_version < '3.11'
 Requires-Dist: google-cloud-aiplatform>=1.84.0
+Requires-Dist: google-genai>=1.21.1
 Requires-Dist: jsonschema>=4.23.0
+Requires-Dist: lancedb>=0.24.2
 Requires-Dist: litellm>=1.72.6
+Requires-Dist: llama-index-vector-stores-lancedb>=0.3.3
+Requires-Dist: llama-index>=0.13.3
 Requires-Dist: openai>=1.53.0
 Requires-Dist: pdoc>=15.0.0
+Requires-Dist: pillow>=11.1.0
 Requires-Dist: pydantic>=2.9.2
+Requires-Dist: pypdf>=6.0.0
+Requires-Dist: pypdfium2>=4.30.0
 Requires-Dist: pytest-benchmark>=5.1.0
 Requires-Dist: pytest-cov>=6.0.0
 Requires-Dist: pyyaml>=6.0.2

kiln-ai 0.20.1__py3-none-any.whl → 0.22.0__py3-none-any.whl

Potentially problematic release.

kiln-ai 0.20.1__py3-none-any.whl → 0.22.0__py3-none-any.whl