kiln-ai 0.19.0__py3-none-any.whl → 0.21.0__py3-none-any.whl

This diff compares publicly released versions of the package as they appear in their respective public registries, and is provided for informational purposes only.

Potentially problematic release: this version of kiln-ai might be problematic.

Files changed (158)
  1. kiln_ai/adapters/__init__.py +8 -2
  2. kiln_ai/adapters/adapter_registry.py +43 -208
  3. kiln_ai/adapters/chat/chat_formatter.py +8 -12
  4. kiln_ai/adapters/chat/test_chat_formatter.py +6 -2
  5. kiln_ai/adapters/chunkers/__init__.py +13 -0
  6. kiln_ai/adapters/chunkers/base_chunker.py +42 -0
  7. kiln_ai/adapters/chunkers/chunker_registry.py +16 -0
  8. kiln_ai/adapters/chunkers/fixed_window_chunker.py +39 -0
  9. kiln_ai/adapters/chunkers/helpers.py +23 -0
  10. kiln_ai/adapters/chunkers/test_base_chunker.py +63 -0
  11. kiln_ai/adapters/chunkers/test_chunker_registry.py +28 -0
  12. kiln_ai/adapters/chunkers/test_fixed_window_chunker.py +346 -0
  13. kiln_ai/adapters/chunkers/test_helpers.py +75 -0
  14. kiln_ai/adapters/data_gen/test_data_gen_task.py +9 -3
  15. kiln_ai/adapters/docker_model_runner_tools.py +119 -0
  16. kiln_ai/adapters/embedding/__init__.py +0 -0
  17. kiln_ai/adapters/embedding/base_embedding_adapter.py +44 -0
  18. kiln_ai/adapters/embedding/embedding_registry.py +32 -0
  19. kiln_ai/adapters/embedding/litellm_embedding_adapter.py +199 -0
  20. kiln_ai/adapters/embedding/test_base_embedding_adapter.py +283 -0
  21. kiln_ai/adapters/embedding/test_embedding_registry.py +166 -0
  22. kiln_ai/adapters/embedding/test_litellm_embedding_adapter.py +1149 -0
  23. kiln_ai/adapters/eval/base_eval.py +2 -2
  24. kiln_ai/adapters/eval/eval_runner.py +9 -3
  25. kiln_ai/adapters/eval/g_eval.py +2 -2
  26. kiln_ai/adapters/eval/test_base_eval.py +2 -4
  27. kiln_ai/adapters/eval/test_g_eval.py +4 -5
  28. kiln_ai/adapters/extractors/__init__.py +18 -0
  29. kiln_ai/adapters/extractors/base_extractor.py +72 -0
  30. kiln_ai/adapters/extractors/encoding.py +20 -0
  31. kiln_ai/adapters/extractors/extractor_registry.py +44 -0
  32. kiln_ai/adapters/extractors/extractor_runner.py +112 -0
  33. kiln_ai/adapters/extractors/litellm_extractor.py +386 -0
  34. kiln_ai/adapters/extractors/test_base_extractor.py +244 -0
  35. kiln_ai/adapters/extractors/test_encoding.py +54 -0
  36. kiln_ai/adapters/extractors/test_extractor_registry.py +181 -0
  37. kiln_ai/adapters/extractors/test_extractor_runner.py +181 -0
  38. kiln_ai/adapters/extractors/test_litellm_extractor.py +1192 -0
  39. kiln_ai/adapters/fine_tune/__init__.py +1 -1
  40. kiln_ai/adapters/fine_tune/openai_finetune.py +14 -4
  41. kiln_ai/adapters/fine_tune/test_dataset_formatter.py +2 -2
  42. kiln_ai/adapters/fine_tune/test_fireworks_finetune.py +2 -6
  43. kiln_ai/adapters/fine_tune/test_openai_finetune.py +108 -111
  44. kiln_ai/adapters/fine_tune/test_together_finetune.py +2 -6
  45. kiln_ai/adapters/ml_embedding_model_list.py +192 -0
  46. kiln_ai/adapters/ml_model_list.py +761 -37
  47. kiln_ai/adapters/model_adapters/base_adapter.py +51 -21
  48. kiln_ai/adapters/model_adapters/litellm_adapter.py +380 -138
  49. kiln_ai/adapters/model_adapters/test_base_adapter.py +193 -17
  50. kiln_ai/adapters/model_adapters/test_litellm_adapter.py +407 -2
  51. kiln_ai/adapters/model_adapters/test_litellm_adapter_tools.py +1103 -0
  52. kiln_ai/adapters/model_adapters/test_saving_adapter_results.py +5 -5
  53. kiln_ai/adapters/model_adapters/test_structured_output.py +113 -5
  54. kiln_ai/adapters/ollama_tools.py +69 -12
  55. kiln_ai/adapters/parsers/__init__.py +1 -1
  56. kiln_ai/adapters/provider_tools.py +205 -47
  57. kiln_ai/adapters/rag/deduplication.py +49 -0
  58. kiln_ai/adapters/rag/progress.py +252 -0
  59. kiln_ai/adapters/rag/rag_runners.py +844 -0
  60. kiln_ai/adapters/rag/test_deduplication.py +195 -0
  61. kiln_ai/adapters/rag/test_progress.py +785 -0
  62. kiln_ai/adapters/rag/test_rag_runners.py +2376 -0
  63. kiln_ai/adapters/remote_config.py +80 -8
  64. kiln_ai/adapters/repair/test_repair_task.py +12 -9
  65. kiln_ai/adapters/run_output.py +3 -0
  66. kiln_ai/adapters/test_adapter_registry.py +657 -85
  67. kiln_ai/adapters/test_docker_model_runner_tools.py +305 -0
  68. kiln_ai/adapters/test_ml_embedding_model_list.py +429 -0
  69. kiln_ai/adapters/test_ml_model_list.py +251 -1
  70. kiln_ai/adapters/test_ollama_tools.py +340 -1
  71. kiln_ai/adapters/test_prompt_adaptors.py +13 -6
  72. kiln_ai/adapters/test_prompt_builders.py +1 -1
  73. kiln_ai/adapters/test_provider_tools.py +254 -8
  74. kiln_ai/adapters/test_remote_config.py +651 -58
  75. kiln_ai/adapters/vector_store/__init__.py +1 -0
  76. kiln_ai/adapters/vector_store/base_vector_store_adapter.py +83 -0
  77. kiln_ai/adapters/vector_store/lancedb_adapter.py +389 -0
  78. kiln_ai/adapters/vector_store/test_base_vector_store.py +160 -0
  79. kiln_ai/adapters/vector_store/test_lancedb_adapter.py +1841 -0
  80. kiln_ai/adapters/vector_store/test_vector_store_registry.py +199 -0
  81. kiln_ai/adapters/vector_store/vector_store_registry.py +33 -0
  82. kiln_ai/datamodel/__init__.py +39 -34
  83. kiln_ai/datamodel/basemodel.py +170 -1
  84. kiln_ai/datamodel/chunk.py +158 -0
  85. kiln_ai/datamodel/datamodel_enums.py +28 -0
  86. kiln_ai/datamodel/embedding.py +64 -0
  87. kiln_ai/datamodel/eval.py +1 -1
  88. kiln_ai/datamodel/external_tool_server.py +298 -0
  89. kiln_ai/datamodel/extraction.py +303 -0
  90. kiln_ai/datamodel/json_schema.py +25 -10
  91. kiln_ai/datamodel/project.py +40 -1
  92. kiln_ai/datamodel/rag.py +79 -0
  93. kiln_ai/datamodel/registry.py +0 -15
  94. kiln_ai/datamodel/run_config.py +62 -0
  95. kiln_ai/datamodel/task.py +2 -77
  96. kiln_ai/datamodel/task_output.py +6 -1
  97. kiln_ai/datamodel/task_run.py +41 -0
  98. kiln_ai/datamodel/test_attachment.py +649 -0
  99. kiln_ai/datamodel/test_basemodel.py +4 -4
  100. kiln_ai/datamodel/test_chunk_models.py +317 -0
  101. kiln_ai/datamodel/test_dataset_split.py +1 -1
  102. kiln_ai/datamodel/test_embedding_models.py +448 -0
  103. kiln_ai/datamodel/test_eval_model.py +6 -6
  104. kiln_ai/datamodel/test_example_models.py +175 -0
  105. kiln_ai/datamodel/test_external_tool_server.py +691 -0
  106. kiln_ai/datamodel/test_extraction_chunk.py +206 -0
  107. kiln_ai/datamodel/test_extraction_model.py +470 -0
  108. kiln_ai/datamodel/test_rag.py +641 -0
  109. kiln_ai/datamodel/test_registry.py +8 -3
  110. kiln_ai/datamodel/test_task.py +15 -47
  111. kiln_ai/datamodel/test_tool_id.py +320 -0
  112. kiln_ai/datamodel/test_vector_store.py +320 -0
  113. kiln_ai/datamodel/tool_id.py +105 -0
  114. kiln_ai/datamodel/vector_store.py +141 -0
  115. kiln_ai/tools/__init__.py +8 -0
  116. kiln_ai/tools/base_tool.py +82 -0
  117. kiln_ai/tools/built_in_tools/__init__.py +13 -0
  118. kiln_ai/tools/built_in_tools/math_tools.py +124 -0
  119. kiln_ai/tools/built_in_tools/test_math_tools.py +204 -0
  120. kiln_ai/tools/mcp_server_tool.py +95 -0
  121. kiln_ai/tools/mcp_session_manager.py +246 -0
  122. kiln_ai/tools/rag_tools.py +157 -0
  123. kiln_ai/tools/test_base_tools.py +199 -0
  124. kiln_ai/tools/test_mcp_server_tool.py +457 -0
  125. kiln_ai/tools/test_mcp_session_manager.py +1585 -0
  126. kiln_ai/tools/test_rag_tools.py +848 -0
  127. kiln_ai/tools/test_tool_registry.py +562 -0
  128. kiln_ai/tools/tool_registry.py +85 -0
  129. kiln_ai/utils/__init__.py +3 -0
  130. kiln_ai/utils/async_job_runner.py +62 -17
  131. kiln_ai/utils/config.py +24 -2
  132. kiln_ai/utils/env.py +15 -0
  133. kiln_ai/utils/filesystem.py +14 -0
  134. kiln_ai/utils/filesystem_cache.py +60 -0
  135. kiln_ai/utils/litellm.py +94 -0
  136. kiln_ai/utils/lock.py +100 -0
  137. kiln_ai/utils/mime_type.py +38 -0
  138. kiln_ai/utils/open_ai_types.py +94 -0
  139. kiln_ai/utils/pdf_utils.py +38 -0
  140. kiln_ai/utils/project_utils.py +17 -0
  141. kiln_ai/utils/test_async_job_runner.py +151 -35
  142. kiln_ai/utils/test_config.py +138 -1
  143. kiln_ai/utils/test_env.py +142 -0
  144. kiln_ai/utils/test_filesystem_cache.py +316 -0
  145. kiln_ai/utils/test_litellm.py +206 -0
  146. kiln_ai/utils/test_lock.py +185 -0
  147. kiln_ai/utils/test_mime_type.py +66 -0
  148. kiln_ai/utils/test_open_ai_types.py +131 -0
  149. kiln_ai/utils/test_pdf_utils.py +73 -0
  150. kiln_ai/utils/test_uuid.py +111 -0
  151. kiln_ai/utils/test_validation.py +524 -0
  152. kiln_ai/utils/uuid.py +9 -0
  153. kiln_ai/utils/validation.py +90 -0
  154. {kiln_ai-0.19.0.dist-info → kiln_ai-0.21.0.dist-info}/METADATA +12 -5
  155. kiln_ai-0.21.0.dist-info/RECORD +211 -0
  156. kiln_ai-0.19.0.dist-info/RECORD +0 -115
  157. {kiln_ai-0.19.0.dist-info → kiln_ai-0.21.0.dist-info}/WHEEL +0 -0
  158. {kiln_ai-0.19.0.dist-info → kiln_ai-0.21.0.dist-info}/licenses/LICENSE.txt +0 -0
--- kiln_ai/utils/test_async_job_runner.py
+++ kiln_ai/utils/test_async_job_runner.py
@@ -3,30 +3,51 @@ from unittest.mock import AsyncMock, patch

 import pytest

-from kiln_ai.utils.async_job_runner import AsyncJobRunner, Progress
+from kiln_ai.utils.async_job_runner import (
+    AsyncJobRunner,
+    AsyncJobRunnerObserver,
+    Progress,
+)
+
+
+@pytest.fixture
+def mock_async_run_job_fn_success():
+    return AsyncMock(return_value=True)
+
+
+@pytest.fixture
+def mock_async_run_job_fn_failure():
+    return AsyncMock(return_value=False)


 @pytest.mark.parametrize("concurrency", [0, -1, -25])
-def test_invalid_concurrency_raises(concurrency):
+def test_invalid_concurrency_raises(concurrency, mock_async_run_job_fn_success):
     with pytest.raises(ValueError):
-        AsyncJobRunner(concurrency=concurrency)
+        AsyncJobRunner(
+            concurrency=concurrency,
+            jobs=[],
+            run_job_fn=mock_async_run_job_fn_success,
+        )


 # Test with and without concurrency
 @pytest.mark.parametrize("concurrency", [1, 25])
 @pytest.mark.asyncio
-async def test_async_job_runner_status_updates(concurrency):
+async def test_async_job_runner_status_updates(
+    concurrency, mock_async_run_job_fn_success
+):
     job_count = 50
     jobs = [{"id": i} for i in range(job_count)]

-    runner = AsyncJobRunner(concurrency=concurrency)
-
-    # fake run_job that succeeds
-    mock_run_job_success = AsyncMock(return_value=True)
+    runner = AsyncJobRunner(
+        concurrency=concurrency,
+        jobs=jobs,
+        run_job_fn=mock_async_run_job_fn_success,
+    )

     # Expect the status updates in order, and 1 for each job
     expected_completed_count = 0
-    async for progress in runner.run(jobs, mock_run_job_success):
+    async for progress in runner.run():
         assert progress.complete == expected_completed_count
         expected_completed_count += 1
         assert progress.errors == 0
@@ -36,26 +57,29 @@ async def test_async_job_runner_status_updates(concurrency):
     assert expected_completed_count == job_count + 1

     # Verify run_job was called for each job
-    assert mock_run_job_success.call_count == job_count
+    assert mock_async_run_job_fn_success.call_count == job_count

     # Verify run_job was called with the correct arguments
     for i in range(job_count):
-        mock_run_job_success.assert_any_await(jobs[i])
+        mock_async_run_job_fn_success.assert_any_await(jobs[i])


 # Test with and without concurrency
 @pytest.mark.parametrize("concurrency", [1, 25])
 @pytest.mark.asyncio
-async def test_async_job_runner_status_updates_empty_job_list(concurrency):
+async def test_async_job_runner_status_updates_empty_job_list(
+    concurrency, mock_async_run_job_fn_success
+):
     empty_job_list = []

-    runner = AsyncJobRunner(concurrency=concurrency)
-
-    # fake run_job that succeeds
-    mock_run_job_success = AsyncMock(return_value=True)
+    runner = AsyncJobRunner(
+        concurrency=concurrency,
+        jobs=empty_job_list,
+        run_job_fn=mock_async_run_job_fn_success,
+    )

     updates: List[Progress] = []
-    async for progress in runner.run(empty_job_list, mock_run_job_success):
+    async for progress in runner.run():
         updates.append(progress)

     # Verify last status update was complete
@@ -66,23 +90,26 @@ async def test_async_job_runner_status_updates_empty_job_list(concurrency):
     assert updates[0].total == 0

     # Verify run_job was called for each job
-    assert mock_run_job_success.call_count == 0
+    assert mock_async_run_job_fn_success.call_count == 0


 @pytest.mark.parametrize("concurrency", [1, 25])
 @pytest.mark.asyncio
-async def test_async_job_runner_all_failures(concurrency):
+async def test_async_job_runner_all_failures(
+    concurrency, mock_async_run_job_fn_failure
+):
     job_count = 50
     jobs = [{"id": i} for i in range(job_count)]

-    runner = AsyncJobRunner(concurrency=concurrency)
-
-    # fake run_job that fails
-    mock_run_job_failure = AsyncMock(return_value=False)
+    runner = AsyncJobRunner(
+        concurrency=concurrency,
+        jobs=jobs,
+        run_job_fn=mock_async_run_job_fn_failure,
+    )

     # Expect the status updates in order, and 1 for each job
     expected_error_count = 0
-    async for progress in runner.run(jobs, mock_run_job_failure):
+    async for progress in runner.run():
         assert progress.complete == 0
         assert progress.errors == expected_error_count
         expected_error_count += 1
@@ -92,11 +119,11 @@ async def test_async_job_runner_all_failures(concurrency):
     assert expected_error_count == job_count + 1

     # Verify run_job was called for each job
-    assert mock_run_job_failure.call_count == job_count
+    assert mock_async_run_job_fn_failure.call_count == job_count

     # Verify run_job was called with the correct arguments
     for i in range(job_count):
-        mock_run_job_failure.assert_any_await(jobs[i])
+        mock_async_run_job_fn_failure.assert_any_await(jobs[i])


 @pytest.mark.parametrize("concurrency", [1, 25])
@@ -108,16 +135,20 @@ async def test_async_job_runner_partial_failures(concurrency):
     # we want to fail on some jobs and succeed on others
     jobs_to_fail = set([0, 2, 4, 6, 8, 20, 25])

-    runner = AsyncJobRunner(concurrency=concurrency)
-
     # fake run_job that fails
     mock_run_job_partial_success = AsyncMock(
         # return True for jobs that should succeed
         side_effect=lambda job: job["id"] not in jobs_to_fail
     )

+    runner = AsyncJobRunner(
+        concurrency=concurrency,
+        jobs=jobs,
+        run_job_fn=mock_run_job_partial_success,
+    )
+
     # Expect the status updates in order, and 1 for each job
-    async for progress in runner.run(jobs, mock_run_job_partial_success):
+    async for progress in runner.run():
         assert progress.total == job_count

     # Verify last status update was complete
@@ -140,8 +171,6 @@ async def test_async_job_runner_partial_raises(concurrency):
     job_count = 50
     jobs = [{"id": i} for i in range(job_count)]

-    runner = AsyncJobRunner(concurrency=concurrency)
-
     ids_to_fail = set([10, 25])

     def failure_fn(job):
@@ -152,6 +181,12 @@ async def test_async_job_runner_partial_raises(concurrency):
     # fake run_job that fails
     mock_run_job_partial_success = AsyncMock(side_effect=failure_fn)

+    runner = AsyncJobRunner(
+        concurrency=concurrency,
+        jobs=jobs,
+        run_job_fn=mock_run_job_partial_success,
+    )
+
     # generate all the values we expect to see in progress updates
     complete_values_expected = set([i for i in range(job_count - len(ids_to_fail) + 1)])
     errors_values_expected = set([i for i in range(len(ids_to_fail) + 1)])
@@ -164,7 +199,7 @@ async def test_async_job_runner_partial_raises(concurrency):
     errors_values_actual = set()

     # Expect the status updates in order, and 1 for each job
-    async for progress in runner.run(jobs, mock_run_job_partial_success):
+    async for progress in runner.run():
         updates.append(progress)
         complete_values_actual.add(progress.complete)
         errors_values_actual.add(progress.errors)
@@ -184,9 +219,13 @@ async def test_async_job_runner_partial_raises(concurrency):

 @pytest.mark.parametrize("concurrency", [1, 25])
 @pytest.mark.asyncio
-async def test_async_job_runner_cancelled(concurrency):
-    runner = AsyncJobRunner(concurrency=concurrency)
+async def test_async_job_runner_cancelled(concurrency, mock_async_run_job_fn_success):
     jobs = [{"id": i} for i in range(10)]
+    runner = AsyncJobRunner(
+        concurrency=concurrency,
+        jobs=jobs,
+        run_job_fn=mock_async_run_job_fn_success,
+    )

     with patch.object(
         runner,
@@ -195,5 +234,82 @@ async def test_async_job_runner_cancelled(concurrency):
     ):
         # if an exception is raised in the task, we should see it bubble up
         with pytest.raises(Exception, match="run_worker raised an exception"):
-            async for _ in runner.run(jobs, AsyncMock(return_value=True)):
+            async for _ in runner.run():
                 pass
+
+
+@pytest.mark.parametrize("concurrency", [1, 25])
+@pytest.mark.asyncio
+async def test_async_job_runner_observers(concurrency):
+    class MockAsyncJobRunnerObserver(AsyncJobRunnerObserver[dict[str, int]]):
+        def __init__(self):
+            self.on_error_calls = []
+            self.on_success_calls = []
+
+        async def on_error(self, job: dict[str, int], error: Exception):
+            self.on_error_calls.append((job, error))
+
+        async def on_success(self, job: dict[str, int]):
+            self.on_success_calls.append(job)
+
+    mock_observer_a = MockAsyncJobRunnerObserver()
+    mock_observer_b = MockAsyncJobRunnerObserver()
+
+    jobs = [{"id": i} for i in range(10)]
+
+    async def run_job_fn(job: dict[str, int]) -> bool:
+        # we simulate the job 5 and 6 crashing, which should trigger the observers on_error handlers
+        if job["id"] == 5 or job["id"] == 6:
+            raise ValueError(f"job failed unexpectedly {job['id']}")
+        return True
+
+    runner = AsyncJobRunner(
+        concurrency=concurrency,
+        jobs=jobs,
+        run_job_fn=run_job_fn,
+        observers=[mock_observer_a, mock_observer_b],
+    )
+
+    async for _ in runner.run():
+        pass
+
+    assert len(mock_observer_a.on_error_calls) == 2
+    assert len(mock_observer_b.on_error_calls) == 2
+
+    # not necessarily in order, but we should have seen both 5 and 6
+    assert len(mock_observer_a.on_success_calls) == 8
+    assert len(mock_observer_b.on_success_calls) == 8
+
+    # check that 5 and 6 are in the error calls
+    for job_idx in [5, 6]:
+        # check that 5 and 6 are in the error calls for both observers
+        assert any(call[0] == jobs[job_idx] for call in mock_observer_a.on_error_calls)
+        assert any(call[0] == jobs[job_idx] for call in mock_observer_b.on_error_calls)
+
+        # check that the error is the correct exception
+        assert (
+            str(mock_observer_a.on_error_calls[0][1]) == "job failed unexpectedly 5"
+            or str(mock_observer_a.on_error_calls[1][1]) == "job failed unexpectedly 6"
+        )
+        assert (
+            str(mock_observer_b.on_error_calls[0][1]) == "job failed unexpectedly 5"
+            or str(mock_observer_b.on_error_calls[1][1]) == "job failed unexpectedly 6"
+        )
+
+        # check that 5 and 6 are not in the success calls for both observers
+        assert not any(
+            call == jobs[job_idx] for call in mock_observer_a.on_success_calls
+        )
+        assert not any(
+            call == jobs[job_idx] for call in mock_observer_b.on_success_calls
+        )
+
+    # check that the other jobs are in the success calls for both observers
+    for job_idx in range(10):
+        if job_idx not in [5, 6]:
+            assert any(
+                call == jobs[job_idx] for call in mock_observer_a.on_success_calls
+            )
+            assert any(
+                call == jobs[job_idx] for call in mock_observer_b.on_success_calls
+            )
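
For readers tracking the API change above: AsyncJobRunner now receives its job list and worker function at construction time, run() takes no arguments, and optional observers get async on_success/on_error callbacks. A minimal usage sketch inferred only from these test changes (the LoggingObserver and run_job names are illustrative, not from the package):

    import asyncio

    from kiln_ai.utils.async_job_runner import AsyncJobRunner, AsyncJobRunnerObserver


    class LoggingObserver(AsyncJobRunnerObserver[dict[str, int]]):
        # Hypothetical observer; the hook signatures match the mock observer in the test.
        async def on_success(self, job: dict[str, int]):
            print(f"job {job['id']} succeeded")

        async def on_error(self, job: dict[str, int], error: Exception):
            print(f"job {job['id']} failed: {error}")


    async def run_job(job: dict[str, int]) -> bool:
        # Per the tests: returning False counts toward progress.errors,
        # and raising routes the job to the observers' on_error hooks.
        return job["id"] % 2 == 0


    async def main():
        runner = AsyncJobRunner(
            concurrency=25,
            jobs=[{"id": i} for i in range(100)],
            run_job_fn=run_job,
            observers=[LoggingObserver()],
        )
        # run() now takes no arguments and yields Progress updates.
        async for progress in runner.run():
            print(f"{progress.complete}/{progress.total} done, {progress.errors} errors")


    asyncio.run(main())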
--- kiln_ai/utils/test_config.py
+++ kiln_ai/utils/test_config.py
@@ -6,7 +6,7 @@ from unittest.mock import patch
 import pytest
 import yaml

-from kiln_ai.utils.config import Config, ConfigProperty, _get_user_id
+from kiln_ai.utils.config import MCP_SECRETS_KEY, Config, ConfigProperty, _get_user_id


 @pytest.fixture
@@ -322,3 +322,140 @@ def test_update_settings_thread_safety(config_with_yaml):

     assert not exceptions
     assert config.int_property in range(5)
+
+
+def test_mcp_secrets_property():
+    """Test mcp_secrets configuration property"""
+    config = Config.shared()
+
+    # Initially should be None/empty
+    assert config.mcp_secrets is None
+
+    # Set some secrets
+    secrets = {
+        "server1::Authorization": "Bearer token123",
+        "server1::X-API-Key": "api-key-456",
+        "server2::Token": "secret-token",
+    }
+    config.mcp_secrets = secrets
+
+    # Verify they are stored correctly
+    assert config.mcp_secrets == secrets
+    assert config.mcp_secrets["server1::Authorization"] == "Bearer token123"
+    assert config.mcp_secrets["server1::X-API-Key"] == "api-key-456"
+    assert config.mcp_secrets["server2::Token"] == "secret-token"
+
+
+def test_mcp_secrets_sensitive_hiding():
+    """Test that mcp_secrets are hidden when hide_sensitive=True"""
+    config = Config.shared()
+
+    # Set some secrets
+    secrets = {
+        "server1::Authorization": "Bearer secret123",
+        "server2::X-API-Key": "secret-key",
+    }
+    config.mcp_secrets = secrets
+
+    # Test without hiding sensitive data
+    visible_settings = config.settings(hide_sensitive=False)
+    assert MCP_SECRETS_KEY in visible_settings
+    assert visible_settings[MCP_SECRETS_KEY] == secrets
+
+    # Test with hiding sensitive data
+    hidden_settings = config.settings(hide_sensitive=True)
+    assert MCP_SECRETS_KEY in hidden_settings
+    assert hidden_settings[MCP_SECRETS_KEY] == "[hidden]"
+
+
+def test_mcp_secrets_persistence(mock_yaml_file):
+    """Test that mcp_secrets are persisted to YAML correctly"""
+    with patch(
+        "kiln_ai.utils.config.Config.settings_path",
+        return_value=mock_yaml_file,
+    ):
+        config = Config()
+
+        # Set some secrets
+        secrets = {
+            "server1::Authorization": "Bearer persist123",
+            "server2::Token": "persist-token",
+        }
+        config.mcp_secrets = secrets
+
+        # Check that the value was saved to the YAML file
+        with open(mock_yaml_file, "r") as f:
+            saved_settings = yaml.safe_load(f)
+            assert saved_settings[MCP_SECRETS_KEY] == secrets
+
+        # Create a new config instance to test loading from YAML
+        new_config = Config()
+
+        # Check that the value is loaded from YAML
+        assert new_config.mcp_secrets == secrets
+
+
+def test_mcp_secrets_get_value():
+    """Test that mcp_secrets can be retrieved using get_value method"""
+    config = Config.shared()
+
+    # Initially should be None
+    assert config.get_value(MCP_SECRETS_KEY) is None
+
+    # Set some secrets
+    secrets = {"server::key": "value"}
+    config.mcp_secrets = secrets
+
+    # Should be retrievable via get_value
+    assert config.get_value(MCP_SECRETS_KEY) == secrets
+
+
+def test_mcp_secrets_update_settings():
+    """Test updating mcp_secrets using update_settings method"""
+    config = Config.shared()
+
+    # Set initial secrets
+    initial_secrets = {"server1::key1": "value1"}
+    config.update_settings({MCP_SECRETS_KEY: initial_secrets})
+    assert config.mcp_secrets == initial_secrets
+
+    # Update with new secrets (should replace, not merge)
+    new_secrets = {
+        "server1::key1": "updated_value1",
+        "server2::key2": "value2",
+    }
+    config.update_settings({MCP_SECRETS_KEY: new_secrets})
+    assert config.mcp_secrets == new_secrets
+    assert config.mcp_secrets["server1::key1"] == "updated_value1"
+    assert config.mcp_secrets["server2::key2"] == "value2"
+
+
+def test_mcp_secrets_empty_dict():
+    """Test mcp_secrets with empty dict"""
+    config = Config.shared()
+
+    # Set empty dict
+    config.mcp_secrets = {}
+    assert config.mcp_secrets == {}
+
+    # Should still be dict type, not None
+    assert isinstance(config.mcp_secrets, dict)
+
+
+def test_mcp_secrets_type_validation():
+    """Test that mcp_secrets enforces dict[str, str] type"""
+    config = Config.shared()
+
+    # Valid dict[str, str]
+    valid_secrets = {"server::key": "value"}
+    config.mcp_secrets = valid_secrets
+    assert config.mcp_secrets == valid_secrets
+
+    # The config system applies type conversion when retrieving values
+    mixed_types = {"server::key": 123}  # int value
+    config.mcp_secrets = mixed_types
+    # The type conversion happens when the value is retrieved, not when set
+    # So the underlying storage may preserve the original type
+    assert config.mcp_secrets == mixed_types or config.mcp_secrets == {
+        "server::key": "123"
+    }
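
The new mcp_secrets surface stores per-server header secrets under namespaced "server::header" keys. A short sketch of the configuration surface these tests exercise (the key and token values are illustrative):

    from kiln_ai.utils.config import MCP_SECRETS_KEY, Config

    config = Config.shared()

    # Keys are namespaced "<server>::<header>"; values are the secret strings.
    config.mcp_secrets = {"server1::Authorization": "Bearer token123"}

    # The same mapping is reachable through the generic accessor...
    assert config.get_value(MCP_SECRETS_KEY) == config.mcp_secrets

    # ...and is redacted when settings are read with hide_sensitive=True.
    assert config.settings(hide_sensitive=True)[MCP_SECRETS_KEY] == "[hidden]"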
--- /dev/null
+++ kiln_ai/utils/test_env.py
@@ -0,0 +1,142 @@
+import os
+
+import pytest
+
+from kiln_ai.utils.env import temporary_env
+
+
+class TestTemporaryEnv:
+    def test_set_new_env_var(self):
+        """Test setting a new environment variable that doesn't exist."""
+        var_name = "TEST_NEW_VAR"
+        test_value = "test_value"
+
+        # Ensure the variable doesn't exist initially
+        assert var_name not in os.environ
+
+        with temporary_env(var_name, test_value):
+            assert os.environ[var_name] == test_value
+
+        # Verify it's removed after context
+        assert var_name not in os.environ
+
+    def test_modify_existing_env_var(self):
+        """Test modifying an existing environment variable."""
+        var_name = "TEST_EXISTING_VAR"
+        original_value = "original_value"
+        new_value = "new_value"
+
+        # Set up initial state
+        os.environ[var_name] = original_value
+
+        with temporary_env(var_name, new_value):
+            assert os.environ[var_name] == new_value
+
+        # Verify original value is restored
+        assert os.environ[var_name] == original_value
+
+    def test_restore_nonexistent_var(self):
+        """Test that a variable that didn't exist is properly removed."""
+        var_name = "TEST_NONEXISTENT_VAR"
+        test_value = "test_value"
+
+        # Ensure the variable doesn't exist initially
+        if var_name in os.environ:
+            del os.environ[var_name]
+
+        with temporary_env(var_name, test_value):
+            assert os.environ[var_name] == test_value
+
+        # Verify it's removed after context
+        assert var_name not in os.environ
+
+    def test_exception_handling(self):
+        """Test that environment is restored even when an exception occurs."""
+        var_name = "TEST_EXCEPTION_VAR"
+        original_value = "original_value"
+        new_value = "new_value"
+
+        # Set up initial state
+        os.environ[var_name] = original_value
+
+        with pytest.raises(ValueError):
+            with temporary_env(var_name, new_value):
+                assert os.environ[var_name] == new_value
+                raise ValueError("Test exception")
+
+        # Verify original value is restored even after exception
+        assert os.environ[var_name] == original_value
+
+    def test_exception_handling_new_var(self):
+        """Test that new variable is removed even when an exception occurs."""
+        var_name = "TEST_EXCEPTION_NEW_VAR"
+        test_value = "test_value"
+
+        # Ensure the variable doesn't exist initially
+        if var_name in os.environ:
+            del os.environ[var_name]
+
+        with pytest.raises(RuntimeError):
+            with temporary_env(var_name, test_value):
+                assert os.environ[var_name] == test_value
+                raise RuntimeError("Test exception")
+
+        # Verify variable is removed even after exception
+        assert var_name not in os.environ
+
+    def test_nested_context_managers(self):
+        """Test using multiple temporary_env context managers."""
+        var1 = "TEST_NESTED_VAR1"
+        var2 = "TEST_NESTED_VAR2"
+        value1 = "value1"
+        value2 = "value2"
+
+        # Set up initial state
+        os.environ[var1] = "original1"
+        if var2 in os.environ:
+            del os.environ[var2]
+
+        with temporary_env(var1, value1):
+            assert os.environ[var1] == value1
+
+            with temporary_env(var2, value2):
+                assert os.environ[var1] == value1
+                assert os.environ[var2] == value2
+
+            # Inner context should be cleaned up
+            assert var2 not in os.environ
+            assert os.environ[var1] == value1
+
+        # Both contexts should be cleaned up
+        assert os.environ[var1] == "original1"
+        assert var2 not in os.environ
+
+    def test_empty_string_value(self):
+        """Test setting an empty string value."""
+        var_name = "TEST_EMPTY_VAR"
+        test_value = ""
+
+        with temporary_env(var_name, test_value):
+            assert os.environ[var_name] == test_value
+
+        assert var_name not in os.environ
+
+    def test_none_value_handling(self):
+        """Test that None values are handled properly."""
+        var_name = "TEST_NONE_VAR"
+        test_value = "test_value"
+
+        with temporary_env(var_name, test_value):
+            assert os.environ[var_name] == test_value
+
+        assert var_name not in os.environ
+
+    def test_unicode_value(self):
+        """Test setting unicode values."""
+        var_name = "TEST_UNICODE_VAR"
+        test_value = "测试值 🚀"
+
+        with temporary_env(var_name, test_value):
+            assert os.environ[var_name] == test_value
+
+        assert var_name not in os.environ
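
kiln_ai/utils/env.py itself is only 15 lines (file 132 in the list above). A plausible implementation consistent with these tests, not the package's actual source:

    import os
    from contextlib import contextmanager
    from typing import Iterator


    @contextmanager
    def temporary_env(name: str, value: str) -> Iterator[None]:
        previous = os.environ.get(name)  # None means the variable was unset
        os.environ[name] = value
        try:
            yield
        finally:
            # Runs on normal exit and when the body raises, restoring or
            # removing the variable exactly as the tests above expect.
            if previous is None:
                os.environ.pop(name, None)
            else:
                os.environ[name] = previous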