PyPI - opik - Versions diffs - 1.9.41__py3-none-any.whl → 1.9.86__py3-none-any.whl - Mend

opik 1.9.41 (py3-none-any.whl) → 1.9.86 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (192)

opik/api_objects/attachment/attachment_context.py +36 -0
opik/api_objects/attachment/attachments_extractor.py +153 -0
opik/api_objects/attachment/client.py +1 -0
opik/api_objects/attachment/converters.py +2 -0
opik/api_objects/attachment/decoder.py +18 -0
opik/api_objects/attachment/decoder_base64.py +83 -0
opik/api_objects/attachment/decoder_helpers.py +137 -0
opik/api_objects/constants.py +2 -0
opik/api_objects/dataset/dataset.py +133 -40
opik/api_objects/dataset/rest_operations.py +2 -0
opik/api_objects/experiment/experiment.py +6 -0
opik/api_objects/helpers.py +8 -4
opik/api_objects/local_recording.py +6 -5
opik/api_objects/observation_data.py +101 -0
opik/api_objects/opik_client.py +78 -45
opik/api_objects/opik_query_language.py +9 -3
opik/api_objects/prompt/chat/chat_prompt.py +18 -1
opik/api_objects/prompt/client.py +8 -1
opik/api_objects/span/span_data.py +3 -88
opik/api_objects/threads/threads_client.py +7 -4
opik/api_objects/trace/trace_data.py +3 -74
opik/api_objects/validation_helpers.py +3 -3
opik/cli/exports/__init__.py +131 -0
opik/cli/exports/dataset.py +278 -0
opik/cli/exports/experiment.py +784 -0
opik/cli/exports/project.py +685 -0
opik/cli/exports/prompt.py +578 -0
opik/cli/exports/utils.py +406 -0
opik/cli/harbor.py +39 -0
opik/cli/imports/__init__.py +439 -0
opik/cli/imports/dataset.py +143 -0
opik/cli/imports/experiment.py +1192 -0
opik/cli/imports/project.py +262 -0
opik/cli/imports/prompt.py +177 -0
opik/cli/imports/utils.py +280 -0
opik/cli/main.py +14 -12
opik/config.py +12 -1
opik/datetime_helpers.py +12 -0
opik/decorator/arguments_helpers.py +4 -1
opik/decorator/base_track_decorator.py +111 -37
opik/decorator/context_manager/span_context_manager.py +5 -1
opik/decorator/generator_wrappers.py +5 -4
opik/decorator/span_creation_handler.py +13 -4
opik/evaluation/engine/engine.py +111 -28
opik/evaluation/engine/evaluation_tasks_executor.py +71 -19
opik/evaluation/evaluator.py +12 -0
opik/evaluation/metrics/conversation/llm_judges/conversational_coherence/metric.py +3 -1
opik/evaluation/metrics/conversation/llm_judges/session_completeness/metric.py +3 -1
opik/evaluation/metrics/conversation/llm_judges/user_frustration/metric.py +3 -1
opik/evaluation/metrics/heuristics/equals.py +11 -7
opik/evaluation/metrics/llm_judges/answer_relevance/metric.py +3 -1
opik/evaluation/metrics/llm_judges/context_precision/metric.py +3 -1
opik/evaluation/metrics/llm_judges/context_recall/metric.py +3 -1
opik/evaluation/metrics/llm_judges/factuality/metric.py +1 -1
opik/evaluation/metrics/llm_judges/g_eval/metric.py +3 -1
opik/evaluation/metrics/llm_judges/hallucination/metric.py +3 -1
opik/evaluation/metrics/llm_judges/moderation/metric.py +3 -1
opik/evaluation/metrics/llm_judges/structure_output_compliance/metric.py +3 -1
opik/evaluation/metrics/llm_judges/syc_eval/metric.py +4 -2
opik/evaluation/metrics/llm_judges/trajectory_accuracy/metric.py +3 -1
opik/evaluation/metrics/llm_judges/usefulness/metric.py +3 -1
opik/evaluation/metrics/ragas_metric.py +43 -23
opik/evaluation/models/litellm/litellm_chat_model.py +7 -2
opik/evaluation/models/litellm/util.py +4 -20
opik/evaluation/models/models_factory.py +19 -5
opik/evaluation/rest_operations.py +3 -3
opik/evaluation/threads/helpers.py +3 -2
opik/file_upload/file_uploader.py +13 -0
opik/file_upload/upload_options.py +2 -0
opik/integrations/adk/legacy_opik_tracer.py +9 -11
opik/integrations/adk/opik_tracer.py +2 -2
opik/integrations/adk/patchers/adk_otel_tracer/opik_adk_otel_tracer.py +2 -2
opik/integrations/dspy/callback.py +100 -14
opik/integrations/dspy/parsers.py +168 -0
opik/integrations/harbor/__init__.py +17 -0
opik/integrations/harbor/experiment_service.py +269 -0
opik/integrations/harbor/opik_tracker.py +528 -0
opik/integrations/haystack/opik_tracer.py +2 -2
opik/integrations/langchain/__init__.py +15 -2
opik/integrations/langchain/langgraph_tracer_injector.py +88 -0
opik/integrations/langchain/opik_tracer.py +258 -160
opik/integrations/langchain/provider_usage_extractors/langchain_run_helpers/helpers.py +7 -4
opik/integrations/llama_index/callback.py +43 -6
opik/integrations/openai/agents/opik_tracing_processor.py +8 -10
opik/integrations/openai/opik_tracker.py +99 -4
opik/integrations/openai/videos/__init__.py +9 -0
opik/integrations/openai/videos/binary_response_write_to_file_decorator.py +88 -0
opik/integrations/openai/videos/videos_create_decorator.py +159 -0
opik/integrations/openai/videos/videos_download_decorator.py +110 -0
opik/message_processing/batching/base_batcher.py +14 -21
opik/message_processing/batching/batch_manager.py +22 -10
opik/message_processing/batching/batchers.py +32 -40
opik/message_processing/batching/flushing_thread.py +0 -3
opik/message_processing/emulation/emulator_message_processor.py +36 -1
opik/message_processing/emulation/models.py +21 -0
opik/message_processing/messages.py +9 -0
opik/message_processing/preprocessing/__init__.py +0 -0
opik/message_processing/preprocessing/attachments_preprocessor.py +70 -0
opik/message_processing/preprocessing/batching_preprocessor.py +53 -0
opik/message_processing/preprocessing/constants.py +1 -0
opik/message_processing/preprocessing/file_upload_preprocessor.py +38 -0
opik/message_processing/preprocessing/preprocessor.py +36 -0
opik/message_processing/processors/__init__.py +0 -0
opik/message_processing/processors/attachments_extraction_processor.py +146 -0
opik/message_processing/{message_processors.py → processors/message_processors.py} +15 -1
opik/message_processing/{message_processors_chain.py → processors/message_processors_chain.py} +3 -2
opik/message_processing/{online_message_processor.py → processors/online_message_processor.py} +11 -9
opik/message_processing/queue_consumer.py +4 -2
opik/message_processing/streamer.py +71 -33
opik/message_processing/streamer_constructors.py +36 -8
opik/plugins/pytest/experiment_runner.py +1 -1
opik/plugins/pytest/hooks.py +5 -3
opik/rest_api/__init__.py +38 -0
opik/rest_api/datasets/client.py +249 -148
opik/rest_api/datasets/raw_client.py +356 -217
opik/rest_api/experiments/client.py +26 -0
opik/rest_api/experiments/raw_client.py +26 -0
opik/rest_api/llm_provider_key/client.py +4 -4
opik/rest_api/llm_provider_key/raw_client.py +4 -4
opik/rest_api/llm_provider_key/types/provider_api_key_write_provider.py +2 -1
opik/rest_api/manual_evaluation/client.py +101 -0
opik/rest_api/manual_evaluation/raw_client.py +172 -0
opik/rest_api/optimizations/client.py +0 -166
opik/rest_api/optimizations/raw_client.py +0 -248
opik/rest_api/projects/client.py +9 -0
opik/rest_api/projects/raw_client.py +13 -0
opik/rest_api/projects/types/project_metric_request_public_metric_type.py +4 -0
opik/rest_api/prompts/client.py +130 -2
opik/rest_api/prompts/raw_client.py +175 -0
opik/rest_api/traces/client.py +101 -0
opik/rest_api/traces/raw_client.py +120 -0
opik/rest_api/types/__init__.py +46 -0
opik/rest_api/types/audio_url.py +19 -0
opik/rest_api/types/audio_url_public.py +19 -0
opik/rest_api/types/audio_url_write.py +19 -0
opik/rest_api/types/automation_rule_evaluator.py +38 -2
opik/rest_api/types/automation_rule_evaluator_object_object_public.py +33 -2
opik/rest_api/types/automation_rule_evaluator_public.py +33 -2
opik/rest_api/types/automation_rule_evaluator_span_user_defined_metric_python.py +22 -0
opik/rest_api/types/automation_rule_evaluator_span_user_defined_metric_python_public.py +22 -0
opik/rest_api/types/automation_rule_evaluator_span_user_defined_metric_python_write.py +22 -0
opik/rest_api/types/automation_rule_evaluator_update.py +27 -1
opik/rest_api/types/automation_rule_evaluator_update_span_user_defined_metric_python.py +22 -0
opik/rest_api/types/automation_rule_evaluator_write.py +27 -1
opik/rest_api/types/dataset_item.py +1 -1
opik/rest_api/types/dataset_item_batch.py +4 -0
opik/rest_api/types/dataset_item_changes_public.py +5 -0
opik/rest_api/types/dataset_item_compare.py +1 -1
opik/rest_api/types/dataset_item_filter.py +4 -0
opik/rest_api/types/dataset_item_page_compare.py +0 -1
opik/rest_api/types/dataset_item_page_public.py +0 -1
opik/rest_api/types/dataset_item_public.py +1 -1
opik/rest_api/types/dataset_version_public.py +5 -0
opik/rest_api/types/dataset_version_summary.py +5 -0
opik/rest_api/types/dataset_version_summary_public.py +5 -0
opik/rest_api/types/experiment.py +9 -0
opik/rest_api/types/experiment_public.py +9 -0
opik/rest_api/types/llm_as_judge_message_content.py +2 -0
opik/rest_api/types/llm_as_judge_message_content_public.py +2 -0
opik/rest_api/types/llm_as_judge_message_content_write.py +2 -0
opik/rest_api/types/manual_evaluation_request_entity_type.py +1 -1
opik/rest_api/types/project.py +1 -0
opik/rest_api/types/project_detailed.py +1 -0
opik/rest_api/types/project_metric_response_public_metric_type.py +4 -0
opik/rest_api/types/project_reference.py +31 -0
opik/rest_api/types/project_reference_public.py +31 -0
opik/rest_api/types/project_stats_summary_item.py +1 -0
opik/rest_api/types/prompt_version.py +1 -0
opik/rest_api/types/prompt_version_detail.py +1 -0
opik/rest_api/types/prompt_version_page_public.py +5 -0
opik/rest_api/types/prompt_version_public.py +1 -0
opik/rest_api/types/prompt_version_update.py +33 -0
opik/rest_api/types/provider_api_key.py +5 -1
opik/rest_api/types/provider_api_key_provider.py +2 -1
opik/rest_api/types/provider_api_key_public.py +5 -1
opik/rest_api/types/provider_api_key_public_provider.py +2 -1
opik/rest_api/types/service_toggles_config.py +11 -1
opik/rest_api/types/span_user_defined_metric_python_code.py +20 -0
opik/rest_api/types/span_user_defined_metric_python_code_public.py +20 -0
opik/rest_api/types/span_user_defined_metric_python_code_write.py +20 -0
opik/types.py +36 -0
opik/validation/chat_prompt_messages.py +241 -0
opik/validation/feedback_score.py +3 -3
opik/validation/validator.py +28 -0
{opik-1.9.41.dist-info → opik-1.9.86.dist-info}/METADATA +5 -5
{opik-1.9.41.dist-info → opik-1.9.86.dist-info}/RECORD +190 -141
opik/cli/export.py +0 -791
opik/cli/import_command.py +0 -575
{opik-1.9.41.dist-info → opik-1.9.86.dist-info}/WHEEL +0 -0
{opik-1.9.41.dist-info → opik-1.9.86.dist-info}/entry_points.txt +0 -0
{opik-1.9.41.dist-info → opik-1.9.86.dist-info}/licenses/LICENSE +0 -0
{opik-1.9.41.dist-info → opik-1.9.86.dist-info}/top_level.txt +0 -0

opik/rest_api/experiments/client.py CHANGED Viewed

@@ -119,12 +119,14 @@ class ExperimentsClient:
         id: typing.Optional[str] = OMIT,
         name: typing.Optional[str] = OMIT,
         metadata: typing.Optional[JsonListStringWrite] = OMIT,
+        tags: typing.Optional[typing.Sequence[str]] = OMIT,
         type: typing.Optional[ExperimentWriteType] = OMIT,
         optimization_id: typing.Optional[str] = OMIT,
         status: typing.Optional[ExperimentWriteStatus] = OMIT,
         experiment_scores: typing.Optional[typing.Sequence[ExperimentScoreWrite]] = OMIT,
         prompt_version: typing.Optional[PromptVersionLinkWrite] = OMIT,
         prompt_versions: typing.Optional[typing.Sequence[PromptVersionLinkWrite]] = OMIT,
+        dataset_version_id: typing.Optional[str] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> None:
         """
@@ -140,6 +142,8 @@ class ExperimentsClient:
         metadata : typing.Optional[JsonListStringWrite]
+        tags : typing.Optional[typing.Sequence[str]]
         type : typing.Optional[ExperimentWriteType]
         optimization_id : typing.Optional[str]
@@ -152,6 +156,9 @@ class ExperimentsClient:
         prompt_versions : typing.Optional[typing.Sequence[PromptVersionLinkWrite]]
+        dataset_version_id : typing.Optional[str]
+            ID of the dataset version this experiment is linked to. If not provided at creation, experiment will be automatically linked to the latest version.
         request_options : typing.Optional[RequestOptions]
             Request-specific configuration.
@@ -170,12 +177,14 @@ class ExperimentsClient:
             id=id,
             name=name,
             metadata=metadata,
+            tags=tags,
             type=type,
             optimization_id=optimization_id,
             status=status,
             experiment_scores=experiment_scores,
             prompt_version=prompt_version,
             prompt_versions=prompt_versions,
+            dataset_version_id=dataset_version_id,
             request_options=request_options,
         )
         return _response.data
@@ -480,6 +489,7 @@ class ExperimentsClient:
         *,
         name: typing.Optional[str] = OMIT,
         metadata: typing.Optional[JsonNode] = OMIT,
+        tags: typing.Optional[typing.Sequence[str]] = OMIT,
         type: typing.Optional[ExperimentUpdateType] = OMIT,
         status: typing.Optional[ExperimentUpdateStatus] = OMIT,
         experiment_scores: typing.Optional[typing.Sequence[ExperimentScore]] = OMIT,
@@ -496,6 +506,8 @@ class ExperimentsClient:
         metadata : typing.Optional[JsonNode]
+        tags : typing.Optional[typing.Sequence[str]]
         type : typing.Optional[ExperimentUpdateType]
         status : typing.Optional[ExperimentUpdateStatus]
@@ -520,6 +532,7 @@ class ExperimentsClient:
             id,
             name=name,
             metadata=metadata,
+            tags=tags,
             type=type,
             status=status,
             experiment_scores=experiment_scores,
@@ -721,12 +734,14 @@ class AsyncExperimentsClient:
         id: typing.Optional[str] = OMIT,
         name: typing.Optional[str] = OMIT,
         metadata: typing.Optional[JsonListStringWrite] = OMIT,
+        tags: typing.Optional[typing.Sequence[str]] = OMIT,
         type: typing.Optional[ExperimentWriteType] = OMIT,
         optimization_id: typing.Optional[str] = OMIT,
         status: typing.Optional[ExperimentWriteStatus] = OMIT,
         experiment_scores: typing.Optional[typing.Sequence[ExperimentScoreWrite]] = OMIT,
         prompt_version: typing.Optional[PromptVersionLinkWrite] = OMIT,
         prompt_versions: typing.Optional[typing.Sequence[PromptVersionLinkWrite]] = OMIT,
+        dataset_version_id: typing.Optional[str] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> None:
         """
@@ -742,6 +757,8 @@ class AsyncExperimentsClient:
         metadata : typing.Optional[JsonListStringWrite]
+        tags : typing.Optional[typing.Sequence[str]]
         type : typing.Optional[ExperimentWriteType]
         optimization_id : typing.Optional[str]
@@ -754,6 +771,9 @@ class AsyncExperimentsClient:
         prompt_versions : typing.Optional[typing.Sequence[PromptVersionLinkWrite]]
+        dataset_version_id : typing.Optional[str]
+            ID of the dataset version this experiment is linked to. If not provided at creation, experiment will be automatically linked to the latest version.
         request_options : typing.Optional[RequestOptions]
             Request-specific configuration.
@@ -775,12 +795,14 @@ class AsyncExperimentsClient:
             id=id,
             name=name,
             metadata=metadata,
+            tags=tags,
             type=type,
             optimization_id=optimization_id,
             status=status,
             experiment_scores=experiment_scores,
             prompt_version=prompt_version,
             prompt_versions=prompt_versions,
+            dataset_version_id=dataset_version_id,
             request_options=request_options,
         )
         return _response.data
@@ -1112,6 +1134,7 @@ class AsyncExperimentsClient:
         *,
         name: typing.Optional[str] = OMIT,
         metadata: typing.Optional[JsonNode] = OMIT,
+        tags: typing.Optional[typing.Sequence[str]] = OMIT,
         type: typing.Optional[ExperimentUpdateType] = OMIT,
         status: typing.Optional[ExperimentUpdateStatus] = OMIT,
         experiment_scores: typing.Optional[typing.Sequence[ExperimentScore]] = OMIT,
@@ -1128,6 +1151,8 @@ class AsyncExperimentsClient:
         metadata : typing.Optional[JsonNode]
+        tags : typing.Optional[typing.Sequence[str]]
         type : typing.Optional[ExperimentUpdateType]
         status : typing.Optional[ExperimentUpdateStatus]
@@ -1155,6 +1180,7 @@ class AsyncExperimentsClient:
             id,
             name=name,
             metadata=metadata,
+            tags=tags,
             type=type,
             status=status,
             experiment_scores=experiment_scores,

opik/rest_api/experiments/raw_client.py CHANGED Viewed

@@ -140,12 +140,14 @@ class RawExperimentsClient:
         id: typing.Optional[str] = OMIT,
         name: typing.Optional[str] = OMIT,
         metadata: typing.Optional[JsonListStringWrite] = OMIT,
+        tags: typing.Optional[typing.Sequence[str]] = OMIT,
         type: typing.Optional[ExperimentWriteType] = OMIT,
         optimization_id: typing.Optional[str] = OMIT,
         status: typing.Optional[ExperimentWriteStatus] = OMIT,
         experiment_scores: typing.Optional[typing.Sequence[ExperimentScoreWrite]] = OMIT,
         prompt_version: typing.Optional[PromptVersionLinkWrite] = OMIT,
         prompt_versions: typing.Optional[typing.Sequence[PromptVersionLinkWrite]] = OMIT,
+        dataset_version_id: typing.Optional[str] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> HttpResponse[None]:
         """
@@ -161,6 +163,8 @@ class RawExperimentsClient:
         metadata : typing.Optional[JsonListStringWrite]
+        tags : typing.Optional[typing.Sequence[str]]
         type : typing.Optional[ExperimentWriteType]
         optimization_id : typing.Optional[str]
@@ -173,6 +177,9 @@ class RawExperimentsClient:
         prompt_versions : typing.Optional[typing.Sequence[PromptVersionLinkWrite]]
+        dataset_version_id : typing.Optional[str]
+            ID of the dataset version this experiment is linked to. If not provided at creation, experiment will be automatically linked to the latest version.
         request_options : typing.Optional[RequestOptions]
             Request-specific configuration.
@@ -190,6 +197,7 @@ class RawExperimentsClient:
                 "metadata": convert_and_respect_annotation_metadata(
                     object_=metadata, annotation=JsonListStringWrite, direction="write"
                 ),
+                "tags": tags,
                 "type": type,
                 "optimization_id": optimization_id,
                 "status": status,
@@ -202,6 +210,7 @@ class RawExperimentsClient:
                 "prompt_versions": convert_and_respect_annotation_metadata(
                     object_=prompt_versions, annotation=typing.Sequence[PromptVersionLinkWrite], direction="write"
                 ),
+                "dataset_version_id": dataset_version_id,
             },
             headers={
                 "content-type": "application/json",
@@ -701,6 +710,7 @@ class RawExperimentsClient:
         *,
         name: typing.Optional[str] = OMIT,
         metadata: typing.Optional[JsonNode] = OMIT,
+        tags: typing.Optional[typing.Sequence[str]] = OMIT,
         type: typing.Optional[ExperimentUpdateType] = OMIT,
         status: typing.Optional[ExperimentUpdateStatus] = OMIT,
         experiment_scores: typing.Optional[typing.Sequence[ExperimentScore]] = OMIT,
@@ -717,6 +727,8 @@ class RawExperimentsClient:
         metadata : typing.Optional[JsonNode]
+        tags : typing.Optional[typing.Sequence[str]]
         type : typing.Optional[ExperimentUpdateType]
         status : typing.Optional[ExperimentUpdateStatus]
@@ -737,6 +749,7 @@ class RawExperimentsClient:
             json={
                 "name": name,
                 "metadata": metadata,
+                "tags": tags,
                 "type": type,
                 "status": status,
                 "experiment_scores": convert_and_respect_annotation_metadata(
@@ -1056,12 +1069,14 @@ class AsyncRawExperimentsClient:
         id: typing.Optional[str] = OMIT,
         name: typing.Optional[str] = OMIT,
         metadata: typing.Optional[JsonListStringWrite] = OMIT,
+        tags: typing.Optional[typing.Sequence[str]] = OMIT,
         type: typing.Optional[ExperimentWriteType] = OMIT,
         optimization_id: typing.Optional[str] = OMIT,
         status: typing.Optional[ExperimentWriteStatus] = OMIT,
         experiment_scores: typing.Optional[typing.Sequence[ExperimentScoreWrite]] = OMIT,
         prompt_version: typing.Optional[PromptVersionLinkWrite] = OMIT,
         prompt_versions: typing.Optional[typing.Sequence[PromptVersionLinkWrite]] = OMIT,
+        dataset_version_id: typing.Optional[str] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> AsyncHttpResponse[None]:
         """
@@ -1077,6 +1092,8 @@ class AsyncRawExperimentsClient:
         metadata : typing.Optional[JsonListStringWrite]
+        tags : typing.Optional[typing.Sequence[str]]
         type : typing.Optional[ExperimentWriteType]
         optimization_id : typing.Optional[str]
@@ -1089,6 +1106,9 @@ class AsyncRawExperimentsClient:
         prompt_versions : typing.Optional[typing.Sequence[PromptVersionLinkWrite]]
+        dataset_version_id : typing.Optional[str]
+            ID of the dataset version this experiment is linked to. If not provided at creation, experiment will be automatically linked to the latest version.
         request_options : typing.Optional[RequestOptions]
             Request-specific configuration.
@@ -1106,6 +1126,7 @@ class AsyncRawExperimentsClient:
                 "metadata": convert_and_respect_annotation_metadata(
                     object_=metadata, annotation=JsonListStringWrite, direction="write"
                 ),
+                "tags": tags,
                 "type": type,
                 "optimization_id": optimization_id,
                 "status": status,
@@ -1118,6 +1139,7 @@ class AsyncRawExperimentsClient:
                 "prompt_versions": convert_and_respect_annotation_metadata(
                     object_=prompt_versions, annotation=typing.Sequence[PromptVersionLinkWrite], direction="write"
                 ),
+                "dataset_version_id": dataset_version_id,
             },
             headers={
                 "content-type": "application/json",
@@ -1617,6 +1639,7 @@ class AsyncRawExperimentsClient:
         *,
         name: typing.Optional[str] = OMIT,
         metadata: typing.Optional[JsonNode] = OMIT,
+        tags: typing.Optional[typing.Sequence[str]] = OMIT,
         type: typing.Optional[ExperimentUpdateType] = OMIT,
         status: typing.Optional[ExperimentUpdateStatus] = OMIT,
         experiment_scores: typing.Optional[typing.Sequence[ExperimentScore]] = OMIT,
@@ -1633,6 +1656,8 @@ class AsyncRawExperimentsClient:
         metadata : typing.Optional[JsonNode]
+        tags : typing.Optional[typing.Sequence[str]]
         type : typing.Optional[ExperimentUpdateType]
         status : typing.Optional[ExperimentUpdateStatus]
@@ -1653,6 +1678,7 @@ class AsyncRawExperimentsClient:
             json={
                 "name": name,
                 "metadata": metadata,
+                "tags": tags,
                 "type": type,
                 "status": status,
                 "experiment_scores": convert_and_respect_annotation_metadata(

opik/rest_api/llm_provider_key/client.py CHANGED Viewed

@@ -103,7 +103,7 @@ class LlmProviderKeyClient:
         name : typing.Optional[str]
         provider_name : typing.Optional[str]
-            Provider name - required for custom LLM providers to uniquely identify them (e.g., 'ollama', 'vllm'). Must not be blank for custom providers. Should not be set for standard providers (OpenAI, Anthropic, etc.). This requirement is conditional and validation is enforced programmatically.
+            Provider name - required for custom LLM and Bedrock providers to uniquely identify them (e.g., 'ollama', 'vllm', 'Bedrock us-east-1'). Must not be blank for custom and Bedrock providers. Should not be set for standard providers (OpenAI, Anthropic, etc.). This requirement is conditional and validation is enforced programmatically.
         headers : typing.Optional[typing.Dict[str, str]]
@@ -187,7 +187,7 @@ class LlmProviderKeyClient:
         name : typing.Optional[str]
         provider_name : typing.Optional[str]
-            Provider name - can be set to migrate legacy custom LLM providers to the new multi-provider format. Once set, it cannot be changed. Should only be set for custom LLM providers.
+            Provider name - can be set to migrate legacy custom LLM or Bedrock providers to the new multi-provider format. Once set, it cannot be changed. Should only be set for custom LLM and Bedrock providers.
         headers : typing.Optional[typing.Dict[str, str]]
@@ -317,7 +317,7 @@ class AsyncLlmProviderKeyClient:
         name : typing.Optional[str]
         provider_name : typing.Optional[str]
-            Provider name - required for custom LLM providers to uniquely identify them (e.g., 'ollama', 'vllm'). Must not be blank for custom providers. Should not be set for standard providers (OpenAI, Anthropic, etc.). This requirement is conditional and validation is enforced programmatically.
+            Provider name - required for custom LLM and Bedrock providers to uniquely identify them (e.g., 'ollama', 'vllm', 'Bedrock us-east-1'). Must not be blank for custom and Bedrock providers. Should not be set for standard providers (OpenAI, Anthropic, etc.). This requirement is conditional and validation is enforced programmatically.
         headers : typing.Optional[typing.Dict[str, str]]
@@ -407,7 +407,7 @@ class AsyncLlmProviderKeyClient:
         name : typing.Optional[str]
         provider_name : typing.Optional[str]
-            Provider name - can be set to migrate legacy custom LLM providers to the new multi-provider format. Once set, it cannot be changed. Should only be set for custom LLM providers.
+            Provider name - can be set to migrate legacy custom LLM or Bedrock providers to the new multi-provider format. Once set, it cannot be changed. Should only be set for custom LLM and Bedrock providers.
         headers : typing.Optional[typing.Dict[str, str]]

opik/rest_api/llm_provider_key/raw_client.py CHANGED Viewed

@@ -122,7 +122,7 @@ class RawLlmProviderKeyClient:
         name : typing.Optional[str]
         provider_name : typing.Optional[str]
-            Provider name - required for custom LLM providers to uniquely identify them (e.g., 'ollama', 'vllm'). Must not be blank for custom providers. Should not be set for standard providers (OpenAI, Anthropic, etc.). This requirement is conditional and validation is enforced programmatically.
+            Provider name - required for custom LLM and Bedrock providers to uniquely identify them (e.g., 'ollama', 'vllm', 'Bedrock us-east-1'). Must not be blank for custom and Bedrock providers. Should not be set for standard providers (OpenAI, Anthropic, etc.). This requirement is conditional and validation is enforced programmatically.
         headers : typing.Optional[typing.Dict[str, str]]
@@ -258,7 +258,7 @@ class RawLlmProviderKeyClient:
         name : typing.Optional[str]
         provider_name : typing.Optional[str]
-            Provider name - can be set to migrate legacy custom LLM providers to the new multi-provider format. Once set, it cannot be changed. Should only be set for custom LLM providers.
+            Provider name - can be set to migrate legacy custom LLM or Bedrock providers to the new multi-provider format. Once set, it cannot be changed. Should only be set for custom LLM and Bedrock providers.
         headers : typing.Optional[typing.Dict[str, str]]
@@ -433,7 +433,7 @@ class AsyncRawLlmProviderKeyClient:
         name : typing.Optional[str]
         provider_name : typing.Optional[str]
-            Provider name - required for custom LLM providers to uniquely identify them (e.g., 'ollama', 'vllm'). Must not be blank for custom providers. Should not be set for standard providers (OpenAI, Anthropic, etc.). This requirement is conditional and validation is enforced programmatically.
+            Provider name - required for custom LLM and Bedrock providers to uniquely identify them (e.g., 'ollama', 'vllm', 'Bedrock us-east-1'). Must not be blank for custom and Bedrock providers. Should not be set for standard providers (OpenAI, Anthropic, etc.). This requirement is conditional and validation is enforced programmatically.
         headers : typing.Optional[typing.Dict[str, str]]
@@ -569,7 +569,7 @@ class AsyncRawLlmProviderKeyClient:
         name : typing.Optional[str]
         provider_name : typing.Optional[str]
-            Provider name - can be set to migrate legacy custom LLM providers to the new multi-provider format. Once set, it cannot be changed. Should only be set for custom LLM providers.
+            Provider name - can be set to migrate legacy custom LLM or Bedrock providers to the new multi-provider format. Once set, it cannot be changed. Should only be set for custom LLM and Bedrock providers.
         headers : typing.Optional[typing.Dict[str, str]]

opik/rest_api/llm_provider_key/types/provider_api_key_write_provider.py CHANGED Viewed

@@ -3,5 +3,6 @@
 import typing
 ProviderApiKeyWriteProvider = typing.Union[
-    typing.Literal["openai", "anthropic", "gemini", "openrouter", "vertex-ai", "custom-llm"], typing.Any
+    typing.Literal["openai", "anthropic", "gemini", "openrouter", "vertex-ai", "bedrock", "custom-llm", "opik-free"],
+    typing.Any,
 ]

opik/rest_api/manual_evaluation/client.py CHANGED Viewed

@@ -27,6 +27,55 @@ class ManualEvaluationClient:
         """
         return self._raw_client
+    def evaluate_spans(
+        self,
+        *,
+        project_id: str,
+        entity_ids: typing.Sequence[str],
+        rule_ids: typing.Sequence[str],
+        entity_type: ManualEvaluationRequestEntityType,
+        request_options: typing.Optional[RequestOptions] = None,
+    ) -> ManualEvaluationResponse:
+        """
+        Manually trigger evaluation rules on selected spans. Bypasses sampling and enqueues all specified spans for evaluation.
+        Parameters
+        ----------
+        project_id : str
+            Project ID
+        entity_ids : typing.Sequence[str]
+            List of entity IDs (trace IDs or thread IDs) to evaluate
+        rule_ids : typing.Sequence[str]
+            List of automation rule IDs to apply
+        entity_type : ManualEvaluationRequestEntityType
+            Type of entity to evaluate (trace or thread)
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        ManualEvaluationResponse
+            Accepted - Evaluation request queued successfully
+        Examples
+        --------
+        from Opik import OpikApi
+        client = OpikApi(api_key="YOUR_API_KEY", workspace_name="YOUR_WORKSPACE_NAME", )
+        client.manual_evaluation.evaluate_spans(project_id='550e8400-e29b-41d4-a716-446655440000', entity_ids=['550e8400-e29b-41d4-a716-446655440000', '550e8400-e29b-41d4-a716-446655440001'], rule_ids=['660e8400-e29b-41d4-a716-446655440000'], entity_type="trace", )
+        """
+        _response = self._raw_client.evaluate_spans(
+            project_id=project_id,
+            entity_ids=entity_ids,
+            rule_ids=rule_ids,
+            entity_type=entity_type,
+            request_options=request_options,
+        )
+        return _response.data
     def evaluate_threads(
         self,
         *,
@@ -141,6 +190,58 @@ class AsyncManualEvaluationClient:
         """
         return self._raw_client
+    async def evaluate_spans(
+        self,
+        *,
+        project_id: str,
+        entity_ids: typing.Sequence[str],
+        rule_ids: typing.Sequence[str],
+        entity_type: ManualEvaluationRequestEntityType,
+        request_options: typing.Optional[RequestOptions] = None,
+    ) -> ManualEvaluationResponse:
+        """
+        Manually trigger evaluation rules on selected spans. Bypasses sampling and enqueues all specified spans for evaluation.
+        This is a thin async wrapper: every argument is forwarded unchanged to the raw client's ``evaluate_spans`` coroutine, which is awaited, and the ``data`` attribute of its response is returned. Nothing is caught here, so any exception raised by the raw client propagates to the caller.
+        Parameters
+        ----------
+        project_id : str
+            Project ID
+        entity_ids : typing.Sequence[str]
+            List of entity IDs (trace IDs or thread IDs) to evaluate
+        rule_ids : typing.Sequence[str]
+            List of automation rule IDs to apply
+        entity_type : ManualEvaluationRequestEntityType
+            Type of entity to evaluate (trace or thread)
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        ManualEvaluationResponse
+            Accepted - Evaluation request queued successfully
+        Examples
+        --------
+        from Opik import AsyncOpikApi
+        import asyncio
+        client = AsyncOpikApi(api_key="YOUR_API_KEY", workspace_name="YOUR_WORKSPACE_NAME", )
+        async def main() -> None:
+            await client.manual_evaluation.evaluate_spans(project_id='550e8400-e29b-41d4-a716-446655440000', entity_ids=['550e8400-e29b-41d4-a716-446655440000', '550e8400-e29b-41d4-a716-446655440001'], rule_ids=['660e8400-e29b-41d4-a716-446655440000'], entity_type="trace", )
+        asyncio.run(main())
+        """
+        # NOTE(review): the summary says this method evaluates spans, yet the
+        # `entity_ids` / `entity_type` descriptions and the example
+        # (entity_type="trace") only mention traces and threads - confirm the
+        # accepted values against ManualEvaluationRequestEntityType.
+        # NOTE(review): the example imports from `Opik`, while this module lives
+        # under the `opik` package - confirm the import path before copying it.
+        _response = await self._raw_client.evaluate_spans(
+            project_id=project_id,
+            entity_ids=entity_ids,
+            rule_ids=rule_ids,
+            entity_type=entity_type,
+            request_options=request_options,
+        )
+        # Callers of this client only get the parsed payload, not the HTTP wrapper.
+        return _response.data
     async def evaluate_threads(
         self,
         *,

opik/rest_api/manual_evaluation/raw_client.py CHANGED Viewed

@@ -21,6 +21,92 @@ class RawManualEvaluationClient:
     def __init__(self, *, client_wrapper: SyncClientWrapper):
         self._client_wrapper = client_wrapper
+    def evaluate_spans(
+        self,
+        *,
+        project_id: str,
+        entity_ids: typing.Sequence[str],
+        rule_ids: typing.Sequence[str],
+        entity_type: ManualEvaluationRequestEntityType,
+        request_options: typing.Optional[RequestOptions] = None,
+    ) -> HttpResponse[ManualEvaluationResponse]:
+        """
+        Manually trigger evaluation rules on selected spans. Bypasses sampling and enqueues all specified spans for evaluation.
+        Sends a POST to ``v1/private/manual-evaluation/spans`` with the four request fields as a JSON body and maps the response status code to a parsed result or an exception.
+        Parameters
+        ----------
+        project_id : str
+            Project ID
+        entity_ids : typing.Sequence[str]
+            List of entity IDs (trace IDs or thread IDs) to evaluate
+        rule_ids : typing.Sequence[str]
+            List of automation rule IDs to apply
+        entity_type : ManualEvaluationRequestEntityType
+            Type of entity to evaluate (trace or thread)
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        HttpResponse[ManualEvaluationResponse]
+            Accepted - Evaluation request queued successfully
+        Raises
+        ------
+        BadRequestError
+            If the response status code is 400.
+        NotFoundError
+            If the response status code is 404.
+        ApiError
+            For any other status code outside 200-299, or when the response body cannot be decoded as JSON.
+        """
+        # NOTE(review): the `entity_ids` / `entity_type` descriptions mention only
+        # traces and threads although this call targets the spans endpoint -
+        # confirm the accepted values against ManualEvaluationRequestEntityType.
+        # `omit=OMIT` is handed to the HTTP wrapper as-is; presumably it names the
+        # sentinel for fields to leave out of the payload - confirm.
+        _response = self._client_wrapper.httpx_client.request(
+            "v1/private/manual-evaluation/spans",
+            method="POST",
+            json={
+                "project_id": project_id,
+                "entity_ids": entity_ids,
+                "rule_ids": rule_ids,
+                "entity_type": entity_type,
+            },
+            headers={
+                "content-type": "application/json",
+            },
+            request_options=request_options,
+            omit=OMIT,
+        )
+        # Every `_response.json()` call below sits inside this `try`, so a body
+        # that fails to decode - even on a 2xx response - ends up as an ApiError.
+        try:
+            # Any 2xx status counts as success: parse the body into the response model.
+            if 200 <= _response.status_code < 300:
+                _data = typing.cast(
+                    ManualEvaluationResponse,
+                    parse_obj_as(
+                        type_=ManualEvaluationResponse,  # type: ignore
+                        object_=_response.json(),
+                    ),
+                )
+                return HttpResponse(response=_response, data=_data)
+            # 400 and 404 get dedicated exception types carrying the decoded JSON body.
+            if _response.status_code == 400:
+                raise BadRequestError(
+                    headers=dict(_response.headers),
+                    body=typing.cast(
+                        typing.Optional[typing.Any],
+                        parse_obj_as(
+                            type_=typing.Optional[typing.Any],  # type: ignore
+                            object_=_response.json(),
+                        ),
+                    ),
+                )
+            if _response.status_code == 404:
+                raise NotFoundError(
+                    headers=dict(_response.headers),
+                    body=typing.cast(
+                        typing.Optional[typing.Any],
+                        parse_obj_as(
+                            type_=typing.Optional[typing.Any],  # type: ignore
+                            object_=_response.json(),
+                        ),
+                    ),
+                )
+            # Unhandled status: decode the body so the generic ApiError below can carry it.
+            _response_json = _response.json()
+        except JSONDecodeError:
+            # Body was not valid JSON: report the raw text instead.
+            raise ApiError(status_code=_response.status_code, headers=dict(_response.headers), body=_response.text)
+        # Reached only for statuses not handled above whose body decoded as JSON.
+        raise ApiError(status_code=_response.status_code, headers=dict(_response.headers), body=_response_json)
     def evaluate_threads(
         self,
         *,
@@ -198,6 +284,92 @@ class AsyncRawManualEvaluationClient:
     def __init__(self, *, client_wrapper: AsyncClientWrapper):
         self._client_wrapper = client_wrapper
+    async def evaluate_spans(
+        self,
+        *,
+        project_id: str,
+        entity_ids: typing.Sequence[str],
+        rule_ids: typing.Sequence[str],
+        entity_type: ManualEvaluationRequestEntityType,
+        request_options: typing.Optional[RequestOptions] = None,
+    ) -> AsyncHttpResponse[ManualEvaluationResponse]:
+        """
+        Manually trigger evaluation rules on selected spans. Bypasses sampling and enqueues all specified spans for evaluation.
+        Awaits a POST to ``v1/private/manual-evaluation/spans`` with the four request fields as a JSON body and maps the response status code to a parsed result or an exception.
+        Parameters
+        ----------
+        project_id : str
+            Project ID
+        entity_ids : typing.Sequence[str]
+            List of entity IDs (trace IDs or thread IDs) to evaluate
+        rule_ids : typing.Sequence[str]
+            List of automation rule IDs to apply
+        entity_type : ManualEvaluationRequestEntityType
+            Type of entity to evaluate (trace or thread)
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        AsyncHttpResponse[ManualEvaluationResponse]
+            Accepted - Evaluation request queued successfully
+        Raises
+        ------
+        BadRequestError
+            If the response status code is 400.
+        NotFoundError
+            If the response status code is 404.
+        ApiError
+            For any other status code outside 200-299, or when the response body cannot be decoded as JSON.
+        """
+        # NOTE(review): the `entity_ids` / `entity_type` descriptions mention only
+        # traces and threads although this call targets the spans endpoint -
+        # confirm the accepted values against ManualEvaluationRequestEntityType.
+        # `omit=OMIT` is handed to the HTTP wrapper as-is; presumably it names the
+        # sentinel for fields to leave out of the payload - confirm.
+        _response = await self._client_wrapper.httpx_client.request(
+            "v1/private/manual-evaluation/spans",
+            method="POST",
+            json={
+                "project_id": project_id,
+                "entity_ids": entity_ids,
+                "rule_ids": rule_ids,
+                "entity_type": entity_type,
+            },
+            headers={
+                "content-type": "application/json",
+            },
+            request_options=request_options,
+            omit=OMIT,
+        )
+        # Every `_response.json()` call below sits inside this `try`, so a body
+        # that fails to decode - even on a 2xx response - ends up as an ApiError.
+        try:
+            # Any 2xx status counts as success: parse the body into the response model.
+            if 200 <= _response.status_code < 300:
+                _data = typing.cast(
+                    ManualEvaluationResponse,
+                    parse_obj_as(
+                        type_=ManualEvaluationResponse,  # type: ignore
+                        object_=_response.json(),
+                    ),
+                )
+                return AsyncHttpResponse(response=_response, data=_data)
+            # 400 and 404 get dedicated exception types carrying the decoded JSON body.
+            if _response.status_code == 400:
+                raise BadRequestError(
+                    headers=dict(_response.headers),
+                    body=typing.cast(
+                        typing.Optional[typing.Any],
+                        parse_obj_as(
+                            type_=typing.Optional[typing.Any],  # type: ignore
+                            object_=_response.json(),
+                        ),
+                    ),
+                )
+            if _response.status_code == 404:
+                raise NotFoundError(
+                    headers=dict(_response.headers),
+                    body=typing.cast(
+                        typing.Optional[typing.Any],
+                        parse_obj_as(
+                            type_=typing.Optional[typing.Any],  # type: ignore
+                            object_=_response.json(),
+                        ),
+                    ),
+                )
+            # Unhandled status: decode the body so the generic ApiError below can carry it.
+            _response_json = _response.json()
+        except JSONDecodeError:
+            # Body was not valid JSON: report the raw text instead.
+            raise ApiError(status_code=_response.status_code, headers=dict(_response.headers), body=_response.text)
+        # Reached only for statuses not handled above whose body decoded as JSON.
+        raise ApiError(status_code=_response.status_code, headers=dict(_response.headers), body=_response_json)
     async def evaluate_threads(
         self,
         *,

opik 1.9.41__py3-none-any.whl → 1.9.86__py3-none-any.whl

opik 1.9.41__py3-none-any.whl → 1.9.86__py3-none-any.whl