PyPI - opik - Versions diffs - 1.8.39__py3-none-any.whl → 1.9.71__py3-none-any.whl - Mend

opik 1.8.39-py3-none-any.whl → 1.9.71-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (592) hide show

opik/__init__.py +19 -3
opik/anonymizer/__init__.py +5 -0
opik/anonymizer/anonymizer.py +12 -0
opik/anonymizer/factory.py +80 -0
opik/anonymizer/recursive_anonymizer.py +64 -0
opik/anonymizer/rules.py +56 -0
opik/anonymizer/rules_anonymizer.py +35 -0
opik/api_objects/attachment/attachment_context.py +36 -0
opik/api_objects/attachment/attachments_extractor.py +153 -0
opik/api_objects/attachment/client.py +1 -0
opik/api_objects/attachment/converters.py +2 -0
opik/api_objects/attachment/decoder.py +18 -0
opik/api_objects/attachment/decoder_base64.py +83 -0
opik/api_objects/attachment/decoder_helpers.py +137 -0
opik/api_objects/data_helpers.py +79 -0
opik/api_objects/dataset/dataset.py +64 -4
opik/api_objects/dataset/rest_operations.py +11 -2
opik/api_objects/experiment/experiment.py +57 -57
opik/api_objects/experiment/experiment_item.py +2 -1
opik/api_objects/experiment/experiments_client.py +64 -0
opik/api_objects/experiment/helpers.py +35 -11
opik/api_objects/experiment/rest_operations.py +65 -5
opik/api_objects/helpers.py +8 -5
opik/api_objects/local_recording.py +81 -0
opik/api_objects/opik_client.py +600 -108
opik/api_objects/opik_query_language.py +39 -5
opik/api_objects/prompt/__init__.py +12 -2
opik/api_objects/prompt/base_prompt.py +69 -0
opik/api_objects/prompt/base_prompt_template.py +29 -0
opik/api_objects/prompt/chat/__init__.py +1 -0
opik/api_objects/prompt/chat/chat_prompt.py +210 -0
opik/api_objects/prompt/chat/chat_prompt_template.py +350 -0
opik/api_objects/prompt/chat/content_renderer_registry.py +203 -0
opik/api_objects/prompt/client.py +189 -47
opik/api_objects/prompt/text/__init__.py +1 -0
opik/api_objects/prompt/text/prompt.py +174 -0
opik/api_objects/prompt/{prompt_template.py → text/prompt_template.py} +10 -6
opik/api_objects/prompt/types.py +23 -0
opik/api_objects/search_helpers.py +89 -0
opik/api_objects/span/span_data.py +35 -25
opik/api_objects/threads/threads_client.py +39 -5
opik/api_objects/trace/trace_client.py +52 -2
opik/api_objects/trace/trace_data.py +15 -24
opik/api_objects/validation_helpers.py +3 -3
opik/cli/__init__.py +5 -0
opik/cli/__main__.py +6 -0
opik/cli/configure.py +66 -0
opik/cli/exports/__init__.py +131 -0
opik/cli/exports/dataset.py +278 -0
opik/cli/exports/experiment.py +784 -0
opik/cli/exports/project.py +685 -0
opik/cli/exports/prompt.py +578 -0
opik/cli/exports/utils.py +406 -0
opik/cli/harbor.py +39 -0
opik/cli/healthcheck.py +21 -0
opik/cli/imports/__init__.py +439 -0
opik/cli/imports/dataset.py +143 -0
opik/cli/imports/experiment.py +1192 -0
opik/cli/imports/project.py +262 -0
opik/cli/imports/prompt.py +177 -0
opik/cli/imports/utils.py +280 -0
opik/cli/main.py +49 -0
opik/cli/proxy.py +93 -0
opik/cli/usage_report/__init__.py +16 -0
opik/cli/usage_report/charts.py +783 -0
opik/cli/usage_report/cli.py +274 -0
opik/cli/usage_report/constants.py +9 -0
opik/cli/usage_report/extraction.py +749 -0
opik/cli/usage_report/pdf.py +244 -0
opik/cli/usage_report/statistics.py +78 -0
opik/cli/usage_report/utils.py +235 -0
opik/config.py +13 -7
opik/configurator/configure.py +17 -0
opik/datetime_helpers.py +12 -0
opik/decorator/arguments_helpers.py +9 -1
opik/decorator/base_track_decorator.py +205 -133
opik/decorator/context_manager/span_context_manager.py +123 -0
opik/decorator/context_manager/trace_context_manager.py +84 -0
opik/decorator/opik_args/__init__.py +13 -0
opik/decorator/opik_args/api_classes.py +71 -0
opik/decorator/opik_args/helpers.py +120 -0
opik/decorator/span_creation_handler.py +25 -6
opik/dict_utils.py +3 -3
opik/evaluation/__init__.py +13 -2
opik/evaluation/engine/engine.py +272 -75
opik/evaluation/engine/evaluation_tasks_executor.py +6 -3
opik/evaluation/engine/helpers.py +31 -6
opik/evaluation/engine/metrics_evaluator.py +237 -0
opik/evaluation/evaluation_result.py +168 -2
opik/evaluation/evaluator.py +533 -62
opik/evaluation/metrics/__init__.py +103 -4
opik/evaluation/metrics/aggregated_metric.py +35 -6
opik/evaluation/metrics/base_metric.py +1 -1
opik/evaluation/metrics/conversation/__init__.py +48 -0
opik/evaluation/metrics/conversation/conversation_thread_metric.py +56 -2
opik/evaluation/metrics/conversation/g_eval_wrappers.py +19 -0
opik/evaluation/metrics/conversation/helpers.py +14 -15
opik/evaluation/metrics/conversation/heuristics/__init__.py +14 -0
opik/evaluation/metrics/conversation/heuristics/degeneration/__init__.py +3 -0
opik/evaluation/metrics/conversation/heuristics/degeneration/metric.py +189 -0
opik/evaluation/metrics/conversation/heuristics/degeneration/phrases.py +12 -0
opik/evaluation/metrics/conversation/heuristics/knowledge_retention/__init__.py +3 -0
opik/evaluation/metrics/conversation/heuristics/knowledge_retention/metric.py +172 -0
opik/evaluation/metrics/conversation/llm_judges/__init__.py +32 -0
opik/evaluation/metrics/conversation/{conversational_coherence → llm_judges/conversational_coherence}/metric.py +22 -17
opik/evaluation/metrics/conversation/{conversational_coherence → llm_judges/conversational_coherence}/templates.py +1 -1
opik/evaluation/metrics/conversation/llm_judges/g_eval_wrappers.py +442 -0
opik/evaluation/metrics/conversation/{session_completeness → llm_judges/session_completeness}/metric.py +13 -7
opik/evaluation/metrics/conversation/{session_completeness → llm_judges/session_completeness}/templates.py +1 -1
opik/evaluation/metrics/conversation/llm_judges/user_frustration/__init__.py +0 -0
opik/evaluation/metrics/conversation/{user_frustration → llm_judges/user_frustration}/metric.py +21 -14
opik/evaluation/metrics/conversation/{user_frustration → llm_judges/user_frustration}/templates.py +1 -1
opik/evaluation/metrics/conversation/types.py +4 -5
opik/evaluation/metrics/conversation_types.py +9 -0
opik/evaluation/metrics/heuristics/bertscore.py +107 -0
opik/evaluation/metrics/heuristics/bleu.py +35 -15
opik/evaluation/metrics/heuristics/chrf.py +127 -0
opik/evaluation/metrics/heuristics/contains.py +47 -11
opik/evaluation/metrics/heuristics/distribution_metrics.py +331 -0
opik/evaluation/metrics/heuristics/gleu.py +113 -0
opik/evaluation/metrics/heuristics/language_adherence.py +123 -0
opik/evaluation/metrics/heuristics/meteor.py +119 -0
opik/evaluation/metrics/heuristics/prompt_injection.py +150 -0
opik/evaluation/metrics/heuristics/readability.py +129 -0
opik/evaluation/metrics/heuristics/rouge.py +26 -9
opik/evaluation/metrics/heuristics/spearman.py +88 -0
opik/evaluation/metrics/heuristics/tone.py +155 -0
opik/evaluation/metrics/heuristics/vader_sentiment.py +77 -0
opik/evaluation/metrics/llm_judges/answer_relevance/metric.py +20 -5
opik/evaluation/metrics/llm_judges/context_precision/metric.py +20 -6
opik/evaluation/metrics/llm_judges/context_recall/metric.py +20 -6
opik/evaluation/metrics/llm_judges/g_eval/__init__.py +5 -0
opik/evaluation/metrics/llm_judges/g_eval/metric.py +219 -68
opik/evaluation/metrics/llm_judges/g_eval/parser.py +102 -52
opik/evaluation/metrics/llm_judges/g_eval/presets.py +209 -0
opik/evaluation/metrics/llm_judges/g_eval_presets/__init__.py +36 -0
opik/evaluation/metrics/llm_judges/g_eval_presets/agent_assessment.py +77 -0
opik/evaluation/metrics/llm_judges/g_eval_presets/bias_classifier.py +181 -0
opik/evaluation/metrics/llm_judges/g_eval_presets/compliance_risk.py +41 -0
opik/evaluation/metrics/llm_judges/g_eval_presets/prompt_uncertainty.py +41 -0
opik/evaluation/metrics/llm_judges/g_eval_presets/qa_suite.py +146 -0
opik/evaluation/metrics/llm_judges/hallucination/metric.py +16 -3
opik/evaluation/metrics/llm_judges/llm_juries/__init__.py +3 -0
opik/evaluation/metrics/llm_judges/llm_juries/metric.py +76 -0
opik/evaluation/metrics/llm_judges/moderation/metric.py +16 -4
opik/evaluation/metrics/llm_judges/structure_output_compliance/__init__.py +0 -0
opik/evaluation/metrics/llm_judges/structure_output_compliance/metric.py +144 -0
opik/evaluation/metrics/llm_judges/structure_output_compliance/parser.py +79 -0
opik/evaluation/metrics/llm_judges/structure_output_compliance/schema.py +15 -0
opik/evaluation/metrics/llm_judges/structure_output_compliance/template.py +50 -0
opik/evaluation/metrics/llm_judges/syc_eval/__init__.py +0 -0
opik/evaluation/metrics/llm_judges/syc_eval/metric.py +252 -0
opik/evaluation/metrics/llm_judges/syc_eval/parser.py +82 -0
opik/evaluation/metrics/llm_judges/syc_eval/template.py +155 -0
opik/evaluation/metrics/llm_judges/trajectory_accuracy/metric.py +20 -5
opik/evaluation/metrics/llm_judges/usefulness/metric.py +16 -4
opik/evaluation/metrics/ragas_metric.py +43 -23
opik/evaluation/models/__init__.py +8 -0
opik/evaluation/models/base_model.py +107 -1
opik/evaluation/models/langchain/langchain_chat_model.py +15 -7
opik/evaluation/models/langchain/message_converters.py +97 -15
opik/evaluation/models/litellm/litellm_chat_model.py +156 -29
opik/evaluation/models/litellm/util.py +125 -0
opik/evaluation/models/litellm/warning_filters.py +16 -4
opik/evaluation/models/model_capabilities.py +187 -0
opik/evaluation/models/models_factory.py +25 -3
opik/evaluation/preprocessing.py +92 -0
opik/evaluation/report.py +70 -12
opik/evaluation/rest_operations.py +49 -45
opik/evaluation/samplers/__init__.py +4 -0
opik/evaluation/samplers/base_dataset_sampler.py +40 -0
opik/evaluation/samplers/random_dataset_sampler.py +48 -0
opik/evaluation/score_statistics.py +66 -0
opik/evaluation/scorers/__init__.py +4 -0
opik/evaluation/scorers/scorer_function.py +55 -0
opik/evaluation/scorers/scorer_wrapper_metric.py +130 -0
opik/evaluation/test_case.py +3 -2
opik/evaluation/test_result.py +1 -0
opik/evaluation/threads/evaluator.py +31 -3
opik/evaluation/threads/helpers.py +3 -2
opik/evaluation/types.py +9 -1
opik/exceptions.py +33 -0
opik/file_upload/file_uploader.py +13 -0
opik/file_upload/upload_options.py +2 -0
opik/hooks/__init__.py +23 -0
opik/hooks/anonymizer_hook.py +36 -0
opik/hooks/httpx_client_hook.py +112 -0
opik/httpx_client.py +12 -9
opik/id_helpers.py +18 -0
opik/integrations/adk/graph/subgraph_edges_builders.py +1 -2
opik/integrations/adk/helpers.py +16 -7
opik/integrations/adk/legacy_opik_tracer.py +7 -4
opik/integrations/adk/opik_tracer.py +14 -1
opik/integrations/adk/patchers/adk_otel_tracer/opik_adk_otel_tracer.py +7 -3
opik/integrations/adk/recursive_callback_injector.py +4 -7
opik/integrations/bedrock/converse/__init__.py +0 -0
opik/integrations/bedrock/converse/chunks_aggregator.py +188 -0
opik/integrations/bedrock/{converse_decorator.py → converse/converse_decorator.py} +4 -3
opik/integrations/bedrock/invoke_agent_decorator.py +5 -4
opik/integrations/bedrock/invoke_model/__init__.py +0 -0
opik/integrations/bedrock/invoke_model/chunks_aggregator/__init__.py +78 -0
opik/integrations/bedrock/invoke_model/chunks_aggregator/api.py +45 -0
opik/integrations/bedrock/invoke_model/chunks_aggregator/base.py +23 -0
opik/integrations/bedrock/invoke_model/chunks_aggregator/claude.py +121 -0
opik/integrations/bedrock/invoke_model/chunks_aggregator/format_detector.py +107 -0
opik/integrations/bedrock/invoke_model/chunks_aggregator/llama.py +108 -0
opik/integrations/bedrock/invoke_model/chunks_aggregator/mistral.py +118 -0
opik/integrations/bedrock/invoke_model/chunks_aggregator/nova.py +99 -0
opik/integrations/bedrock/invoke_model/invoke_model_decorator.py +178 -0
opik/integrations/bedrock/invoke_model/response_types.py +34 -0
opik/integrations/bedrock/invoke_model/stream_wrappers.py +122 -0
opik/integrations/bedrock/invoke_model/usage_converters.py +87 -0
opik/integrations/bedrock/invoke_model/usage_extraction.py +108 -0
opik/integrations/bedrock/opik_tracker.py +42 -4
opik/integrations/bedrock/types.py +19 -0
opik/integrations/crewai/crewai_decorator.py +8 -51
opik/integrations/crewai/opik_tracker.py +31 -10
opik/integrations/crewai/patchers/__init__.py +5 -0
opik/integrations/crewai/patchers/flow.py +118 -0
opik/integrations/crewai/patchers/litellm_completion.py +30 -0
opik/integrations/crewai/patchers/llm_client.py +207 -0
opik/integrations/dspy/callback.py +80 -17
opik/integrations/dspy/parsers.py +168 -0
opik/integrations/harbor/__init__.py +17 -0
opik/integrations/harbor/experiment_service.py +269 -0
opik/integrations/harbor/opik_tracker.py +528 -0
opik/integrations/haystack/opik_connector.py +2 -2
opik/integrations/haystack/opik_tracer.py +3 -7
opik/integrations/langchain/__init__.py +3 -1
opik/integrations/langchain/helpers.py +96 -0
opik/integrations/langchain/langgraph_async_context_bridge.py +131 -0
opik/integrations/langchain/langgraph_tracer_injector.py +88 -0
opik/integrations/langchain/opik_encoder_extension.py +1 -1
opik/integrations/langchain/opik_tracer.py +474 -229
opik/integrations/litellm/__init__.py +5 -0
opik/integrations/litellm/completion_chunks_aggregator.py +115 -0
opik/integrations/litellm/litellm_completion_decorator.py +242 -0
opik/integrations/litellm/opik_tracker.py +43 -0
opik/integrations/litellm/stream_patchers.py +151 -0
opik/integrations/llama_index/callback.py +146 -107
opik/integrations/openai/agents/opik_tracing_processor.py +1 -2
opik/integrations/openai/openai_chat_completions_decorator.py +2 -16
opik/integrations/openai/opik_tracker.py +1 -1
opik/integrations/sagemaker/auth.py +5 -1
opik/llm_usage/google_usage.py +3 -1
opik/llm_usage/opik_usage.py +7 -8
opik/llm_usage/opik_usage_factory.py +4 -2
opik/logging_messages.py +6 -0
opik/message_processing/batching/base_batcher.py +14 -21
opik/message_processing/batching/batch_manager.py +22 -10
opik/message_processing/batching/batch_manager_constuctors.py +10 -0
opik/message_processing/batching/batchers.py +59 -27
opik/message_processing/batching/flushing_thread.py +0 -3
opik/message_processing/emulation/__init__.py +0 -0
opik/message_processing/emulation/emulator_message_processor.py +578 -0
opik/message_processing/emulation/local_emulator_message_processor.py +140 -0
opik/message_processing/emulation/models.py +162 -0
opik/message_processing/encoder_helpers.py +79 -0
opik/message_processing/messages.py +56 -1
opik/message_processing/preprocessing/__init__.py +0 -0
opik/message_processing/preprocessing/attachments_preprocessor.py +70 -0
opik/message_processing/preprocessing/batching_preprocessor.py +53 -0
opik/message_processing/preprocessing/constants.py +1 -0
opik/message_processing/preprocessing/file_upload_preprocessor.py +38 -0
opik/message_processing/preprocessing/preprocessor.py +36 -0
opik/message_processing/processors/__init__.py +0 -0
opik/message_processing/processors/attachments_extraction_processor.py +146 -0
opik/message_processing/processors/message_processors.py +92 -0
opik/message_processing/processors/message_processors_chain.py +96 -0
opik/message_processing/{message_processors.py → processors/online_message_processor.py} +85 -29
opik/message_processing/queue_consumer.py +9 -3
opik/message_processing/streamer.py +71 -33
opik/message_processing/streamer_constructors.py +43 -10
opik/opik_context.py +16 -4
opik/plugins/pytest/hooks.py +5 -3
opik/rest_api/__init__.py +346 -15
opik/rest_api/alerts/__init__.py +7 -0
opik/rest_api/alerts/client.py +667 -0
opik/rest_api/alerts/raw_client.py +1015 -0
opik/rest_api/alerts/types/__init__.py +7 -0
opik/rest_api/alerts/types/get_webhook_examples_request_alert_type.py +5 -0
opik/rest_api/annotation_queues/__init__.py +4 -0
opik/rest_api/annotation_queues/client.py +668 -0
opik/rest_api/annotation_queues/raw_client.py +1019 -0
opik/rest_api/automation_rule_evaluators/client.py +34 -2
opik/rest_api/automation_rule_evaluators/raw_client.py +24 -0
opik/rest_api/client.py +15 -0
opik/rest_api/dashboards/__init__.py +4 -0
opik/rest_api/dashboards/client.py +462 -0
opik/rest_api/dashboards/raw_client.py +648 -0
opik/rest_api/datasets/client.py +1310 -44
opik/rest_api/datasets/raw_client.py +2269 -358
opik/rest_api/experiments/__init__.py +2 -2
opik/rest_api/experiments/client.py +191 -5
opik/rest_api/experiments/raw_client.py +301 -7
opik/rest_api/experiments/types/__init__.py +4 -1
opik/rest_api/experiments/types/experiment_update_status.py +5 -0
opik/rest_api/experiments/types/experiment_update_type.py +5 -0
opik/rest_api/experiments/types/experiment_write_status.py +5 -0
opik/rest_api/feedback_definitions/types/find_feedback_definitions_request_type.py +1 -1
opik/rest_api/llm_provider_key/client.py +20 -0
opik/rest_api/llm_provider_key/raw_client.py +20 -0
opik/rest_api/llm_provider_key/types/provider_api_key_write_provider.py +1 -1
opik/rest_api/manual_evaluation/__init__.py +4 -0
opik/rest_api/manual_evaluation/client.py +347 -0
opik/rest_api/manual_evaluation/raw_client.py +543 -0
opik/rest_api/optimizations/client.py +145 -9
opik/rest_api/optimizations/raw_client.py +237 -13
opik/rest_api/optimizations/types/optimization_update_status.py +3 -1
opik/rest_api/prompts/__init__.py +2 -2
opik/rest_api/prompts/client.py +227 -6
opik/rest_api/prompts/raw_client.py +331 -2
opik/rest_api/prompts/types/__init__.py +3 -1
opik/rest_api/prompts/types/create_prompt_version_detail_template_structure.py +5 -0
opik/rest_api/prompts/types/prompt_write_template_structure.py +5 -0
opik/rest_api/spans/__init__.py +0 -2
opik/rest_api/spans/client.py +238 -76
opik/rest_api/spans/raw_client.py +307 -95
opik/rest_api/spans/types/__init__.py +0 -2
opik/rest_api/traces/client.py +572 -161
opik/rest_api/traces/raw_client.py +736 -229
opik/rest_api/types/__init__.py +352 -17
opik/rest_api/types/aggregation_data.py +1 -0
opik/rest_api/types/alert.py +33 -0
opik/rest_api/types/alert_alert_type.py +5 -0
opik/rest_api/types/alert_page_public.py +24 -0
opik/rest_api/types/alert_public.py +33 -0
opik/rest_api/types/alert_public_alert_type.py +5 -0
opik/rest_api/types/alert_trigger.py +27 -0
opik/rest_api/types/alert_trigger_config.py +28 -0
opik/rest_api/types/alert_trigger_config_public.py +28 -0
opik/rest_api/types/alert_trigger_config_public_type.py +10 -0
opik/rest_api/types/alert_trigger_config_type.py +10 -0
opik/rest_api/types/alert_trigger_config_write.py +22 -0
opik/rest_api/types/alert_trigger_config_write_type.py +10 -0
opik/rest_api/types/alert_trigger_event_type.py +19 -0
opik/rest_api/types/alert_trigger_public.py +27 -0
opik/rest_api/types/alert_trigger_public_event_type.py +19 -0
opik/rest_api/types/alert_trigger_write.py +23 -0
opik/rest_api/types/alert_trigger_write_event_type.py +19 -0
opik/rest_api/types/alert_write.py +28 -0
opik/rest_api/types/alert_write_alert_type.py +5 -0
opik/rest_api/types/annotation_queue.py +42 -0
opik/rest_api/types/annotation_queue_batch.py +27 -0
opik/rest_api/types/annotation_queue_item_ids.py +19 -0
opik/rest_api/types/annotation_queue_page_public.py +28 -0
opik/rest_api/types/annotation_queue_public.py +38 -0
opik/rest_api/types/annotation_queue_public_scope.py +5 -0
opik/rest_api/types/annotation_queue_reviewer.py +20 -0
opik/rest_api/types/annotation_queue_reviewer_public.py +20 -0
opik/rest_api/types/annotation_queue_scope.py +5 -0
opik/rest_api/types/annotation_queue_write.py +31 -0
opik/rest_api/types/annotation_queue_write_scope.py +5 -0
opik/rest_api/types/audio_url.py +19 -0
opik/rest_api/types/audio_url_public.py +19 -0
opik/rest_api/types/audio_url_write.py +19 -0
opik/rest_api/types/automation_rule_evaluator.py +62 -2
opik/rest_api/types/automation_rule_evaluator_llm_as_judge.py +2 -0
opik/rest_api/types/automation_rule_evaluator_llm_as_judge_public.py +2 -0
opik/rest_api/types/automation_rule_evaluator_llm_as_judge_write.py +2 -0
opik/rest_api/types/automation_rule_evaluator_object_object_public.py +155 -0
opik/rest_api/types/automation_rule_evaluator_page_public.py +3 -2
opik/rest_api/types/automation_rule_evaluator_public.py +57 -2
opik/rest_api/types/automation_rule_evaluator_span_llm_as_judge.py +22 -0
opik/rest_api/types/automation_rule_evaluator_span_llm_as_judge_public.py +22 -0
opik/rest_api/types/automation_rule_evaluator_span_llm_as_judge_write.py +22 -0
opik/rest_api/types/automation_rule_evaluator_span_user_defined_metric_python.py +22 -0
opik/rest_api/types/automation_rule_evaluator_span_user_defined_metric_python_public.py +22 -0
opik/rest_api/types/automation_rule_evaluator_span_user_defined_metric_python_write.py +22 -0
opik/rest_api/types/automation_rule_evaluator_trace_thread_llm_as_judge.py +2 -0
opik/rest_api/types/automation_rule_evaluator_trace_thread_llm_as_judge_public.py +2 -0
opik/rest_api/types/automation_rule_evaluator_trace_thread_llm_as_judge_write.py +2 -0
opik/rest_api/types/automation_rule_evaluator_trace_thread_user_defined_metric_python.py +2 -0
opik/rest_api/types/automation_rule_evaluator_trace_thread_user_defined_metric_python_public.py +2 -0
opik/rest_api/types/automation_rule_evaluator_trace_thread_user_defined_metric_python_write.py +2 -0
opik/rest_api/types/automation_rule_evaluator_update.py +51 -1
opik/rest_api/types/automation_rule_evaluator_update_llm_as_judge.py +2 -0
opik/rest_api/types/automation_rule_evaluator_update_span_llm_as_judge.py +22 -0
opik/rest_api/types/automation_rule_evaluator_update_span_user_defined_metric_python.py +22 -0
opik/rest_api/types/automation_rule_evaluator_update_trace_thread_llm_as_judge.py +2 -0
opik/rest_api/types/automation_rule_evaluator_update_trace_thread_user_defined_metric_python.py +2 -0
opik/rest_api/types/automation_rule_evaluator_update_user_defined_metric_python.py +2 -0
opik/rest_api/types/automation_rule_evaluator_user_defined_metric_python.py +2 -0
opik/rest_api/types/automation_rule_evaluator_user_defined_metric_python_public.py +2 -0
opik/rest_api/types/automation_rule_evaluator_user_defined_metric_python_write.py +2 -0
opik/rest_api/types/automation_rule_evaluator_write.py +51 -1
opik/rest_api/types/boolean_feedback_definition.py +25 -0
opik/rest_api/types/boolean_feedback_definition_create.py +20 -0
opik/rest_api/types/boolean_feedback_definition_public.py +25 -0
opik/rest_api/types/boolean_feedback_definition_update.py +20 -0
opik/rest_api/types/boolean_feedback_detail.py +29 -0
opik/rest_api/types/boolean_feedback_detail_create.py +29 -0
opik/rest_api/types/boolean_feedback_detail_public.py +29 -0
opik/rest_api/types/boolean_feedback_detail_update.py +29 -0
opik/rest_api/types/dashboard_page_public.py +24 -0
opik/rest_api/types/dashboard_public.py +30 -0
opik/rest_api/types/dataset.py +4 -0
opik/rest_api/types/dataset_expansion.py +42 -0
opik/rest_api/types/dataset_expansion_response.py +39 -0
opik/rest_api/types/dataset_item.py +2 -0
opik/rest_api/types/dataset_item_changes_public.py +5 -0
opik/rest_api/types/dataset_item_compare.py +2 -0
opik/rest_api/types/dataset_item_filter.py +27 -0
opik/rest_api/types/dataset_item_filter_operator.py +21 -0
opik/rest_api/types/dataset_item_page_compare.py +5 -0
opik/rest_api/types/dataset_item_page_public.py +5 -0
opik/rest_api/types/dataset_item_public.py +2 -0
opik/rest_api/types/dataset_item_update.py +39 -0
opik/rest_api/types/dataset_item_write.py +1 -0
opik/rest_api/types/dataset_public.py +4 -0
opik/rest_api/types/dataset_public_status.py +5 -0
opik/rest_api/types/dataset_status.py +5 -0
opik/rest_api/types/dataset_version_diff.py +22 -0
opik/rest_api/types/dataset_version_diff_stats.py +24 -0
opik/rest_api/types/dataset_version_page_public.py +23 -0
opik/rest_api/types/dataset_version_public.py +59 -0
opik/rest_api/types/dataset_version_summary.py +46 -0
opik/rest_api/types/dataset_version_summary_public.py +46 -0
opik/rest_api/types/experiment.py +7 -2
opik/rest_api/types/experiment_group_response.py +2 -0
opik/rest_api/types/experiment_public.py +7 -2
opik/rest_api/types/experiment_public_status.py +5 -0
opik/rest_api/types/experiment_score.py +20 -0
opik/rest_api/types/experiment_score_public.py +20 -0
opik/rest_api/types/experiment_score_write.py +20 -0
opik/rest_api/types/experiment_status.py +5 -0
opik/rest_api/types/feedback.py +25 -1
opik/rest_api/types/feedback_create.py +20 -1
opik/rest_api/types/feedback_object_public.py +27 -1
opik/rest_api/types/feedback_public.py +25 -1
opik/rest_api/types/feedback_score_batch_item.py +2 -1
opik/rest_api/types/feedback_score_batch_item_thread.py +2 -1
opik/rest_api/types/feedback_score_public.py +4 -0
opik/rest_api/types/feedback_update.py +20 -1
opik/rest_api/types/group_content_with_aggregations.py +1 -0
opik/rest_api/types/group_detail.py +19 -0
opik/rest_api/types/group_details.py +20 -0
opik/rest_api/types/guardrail.py +1 -0
opik/rest_api/types/guardrail_write.py +1 -0
opik/rest_api/types/ids_holder.py +19 -0
opik/rest_api/types/image_url.py +20 -0
opik/rest_api/types/image_url_public.py +20 -0
opik/rest_api/types/image_url_write.py +20 -0
opik/rest_api/types/llm_as_judge_message.py +5 -1
opik/rest_api/types/llm_as_judge_message_content.py +26 -0
opik/rest_api/types/llm_as_judge_message_content_public.py +26 -0
opik/rest_api/types/llm_as_judge_message_content_write.py +26 -0
opik/rest_api/types/llm_as_judge_message_public.py +5 -1
opik/rest_api/types/llm_as_judge_message_write.py +5 -1
opik/rest_api/types/llm_as_judge_model_parameters.py +3 -0
opik/rest_api/types/llm_as_judge_model_parameters_public.py +3 -0
opik/rest_api/types/llm_as_judge_model_parameters_write.py +3 -0
opik/rest_api/types/manual_evaluation_request.py +38 -0
opik/rest_api/types/manual_evaluation_request_entity_type.py +5 -0
opik/rest_api/types/manual_evaluation_response.py +27 -0
opik/rest_api/types/optimization.py +4 -2
opik/rest_api/types/optimization_public.py +4 -2
opik/rest_api/types/optimization_public_status.py +3 -1
opik/rest_api/types/optimization_status.py +3 -1
opik/rest_api/types/optimization_studio_config.py +27 -0
opik/rest_api/types/optimization_studio_config_public.py +27 -0
opik/rest_api/types/optimization_studio_config_write.py +27 -0
opik/rest_api/types/optimization_studio_log.py +22 -0
opik/rest_api/types/optimization_write.py +4 -2
opik/rest_api/types/optimization_write_status.py +3 -1
opik/rest_api/types/project.py +1 -0
opik/rest_api/types/project_detailed.py +1 -0
opik/rest_api/types/project_reference.py +31 -0
opik/rest_api/types/project_reference_public.py +31 -0
opik/rest_api/types/project_stats_summary_item.py +1 -0
opik/rest_api/types/prompt.py +6 -0
opik/rest_api/types/prompt_detail.py +6 -0
opik/rest_api/types/prompt_detail_template_structure.py +5 -0
opik/rest_api/types/prompt_public.py +6 -0
opik/rest_api/types/prompt_public_template_structure.py +5 -0
opik/rest_api/types/prompt_template_structure.py +5 -0
opik/rest_api/types/prompt_version.py +3 -0
opik/rest_api/types/prompt_version_detail.py +3 -0
opik/rest_api/types/prompt_version_detail_template_structure.py +5 -0
opik/rest_api/types/prompt_version_link.py +1 -0
opik/rest_api/types/prompt_version_link_public.py +1 -0
opik/rest_api/types/prompt_version_page_public.py +5 -0
opik/rest_api/types/prompt_version_public.py +3 -0
opik/rest_api/types/prompt_version_public_template_structure.py +5 -0
opik/rest_api/types/prompt_version_template_structure.py +5 -0
opik/rest_api/types/prompt_version_update.py +33 -0
opik/rest_api/types/provider_api_key.py +9 -0
opik/rest_api/types/provider_api_key_provider.py +1 -1
opik/rest_api/types/provider_api_key_public.py +9 -0
opik/rest_api/types/provider_api_key_public_provider.py +1 -1
opik/rest_api/types/score_name.py +1 -0
opik/rest_api/types/service_toggles_config.py +18 -0
opik/rest_api/types/span.py +1 -2
opik/rest_api/types/span_enrichment_options.py +31 -0
opik/rest_api/types/span_experiment_item_bulk_write_view.py +1 -2
opik/rest_api/types/span_filter.py +23 -0
opik/rest_api/types/span_filter_operator.py +21 -0
opik/rest_api/types/span_filter_write.py +23 -0
opik/rest_api/types/span_filter_write_operator.py +21 -0
opik/rest_api/types/span_llm_as_judge_code.py +27 -0
opik/rest_api/types/span_llm_as_judge_code_public.py +27 -0
opik/rest_api/types/span_llm_as_judge_code_write.py +27 -0
opik/rest_api/types/span_public.py +1 -2
opik/rest_api/types/span_update.py +46 -0
opik/rest_api/types/span_user_defined_metric_python_code.py +20 -0
opik/rest_api/types/span_user_defined_metric_python_code_public.py +20 -0
opik/rest_api/types/span_user_defined_metric_python_code_write.py +20 -0
opik/rest_api/types/span_write.py +1 -2
opik/rest_api/types/studio_evaluation.py +20 -0
opik/rest_api/types/studio_evaluation_public.py +20 -0
opik/rest_api/types/studio_evaluation_write.py +20 -0
opik/rest_api/types/studio_llm_model.py +21 -0
opik/rest_api/types/studio_llm_model_public.py +21 -0
opik/rest_api/types/studio_llm_model_write.py +21 -0
opik/rest_api/types/studio_message.py +20 -0
opik/rest_api/types/studio_message_public.py +20 -0
opik/rest_api/types/studio_message_write.py +20 -0
opik/rest_api/types/studio_metric.py +21 -0
opik/rest_api/types/studio_metric_public.py +21 -0
opik/rest_api/types/studio_metric_write.py +21 -0
opik/rest_api/types/studio_optimizer.py +21 -0
opik/rest_api/types/studio_optimizer_public.py +21 -0
opik/rest_api/types/studio_optimizer_write.py +21 -0
opik/rest_api/types/studio_prompt.py +20 -0
opik/rest_api/types/studio_prompt_public.py +20 -0
opik/rest_api/types/studio_prompt_write.py +20 -0
opik/rest_api/types/trace.py +11 -2
opik/rest_api/types/trace_enrichment_options.py +32 -0
opik/rest_api/types/trace_experiment_item_bulk_write_view.py +1 -2
opik/rest_api/types/trace_filter.py +23 -0
opik/rest_api/types/trace_filter_operator.py +21 -0
opik/rest_api/types/trace_filter_write.py +23 -0
opik/rest_api/types/trace_filter_write_operator.py +21 -0
opik/rest_api/types/trace_public.py +11 -2
opik/rest_api/types/trace_thread_filter_write.py +23 -0
opik/rest_api/types/trace_thread_filter_write_operator.py +21 -0
opik/rest_api/types/trace_thread_identifier.py +1 -0
opik/rest_api/types/trace_update.py +39 -0
opik/rest_api/types/trace_write.py +1 -2
opik/rest_api/types/value_entry.py +2 -0
opik/rest_api/types/value_entry_compare.py +2 -0
opik/rest_api/types/value_entry_experiment_item_bulk_write_view.py +2 -0
opik/rest_api/types/value_entry_public.py +2 -0
opik/rest_api/types/video_url.py +19 -0
opik/rest_api/types/video_url_public.py +19 -0
opik/rest_api/types/video_url_write.py +19 -0
opik/rest_api/types/webhook.py +28 -0
opik/rest_api/types/webhook_examples.py +19 -0
opik/rest_api/types/webhook_public.py +28 -0
opik/rest_api/types/webhook_test_result.py +23 -0
opik/rest_api/types/webhook_test_result_status.py +5 -0
opik/rest_api/types/webhook_write.py +23 -0
opik/rest_api/types/welcome_wizard_tracking.py +22 -0
opik/rest_api/types/workspace_configuration.py +5 -0
opik/rest_api/welcome_wizard/__init__.py +4 -0
opik/rest_api/welcome_wizard/client.py +195 -0
opik/rest_api/welcome_wizard/raw_client.py +208 -0
opik/rest_api/workspaces/client.py +14 -2
opik/rest_api/workspaces/raw_client.py +10 -0
opik/s3_httpx_client.py +14 -1
opik/simulation/__init__.py +6 -0
opik/simulation/simulated_user.py +99 -0
opik/simulation/simulator.py +108 -0
opik/synchronization.py +5 -6
opik/{decorator/tracing_runtime_config.py → tracing_runtime_config.py} +6 -7
opik/types.py +36 -0
opik/validation/chat_prompt_messages.py +241 -0
opik/validation/feedback_score.py +3 -3
opik/validation/validator.py +28 -0
opik-1.9.71.dist-info/METADATA +370 -0
opik-1.9.71.dist-info/RECORD +1110 -0
opik/api_objects/prompt/prompt.py +0 -112
opik/cli.py +0 -193
opik/hooks.py +0 -13
opik/integrations/bedrock/chunks_aggregator.py +0 -55
opik/integrations/bedrock/helpers.py +0 -8
opik/rest_api/types/automation_rule_evaluator_object_public.py +0 -100
opik/rest_api/types/json_node_experiment_item_bulk_write_view.py +0 -5
opik-1.8.39.dist-info/METADATA +0 -339
opik-1.8.39.dist-info/RECORD +0 -790
/opik/{evaluation/metrics/conversation/conversational_coherence → decorator/context_manager}/__init__.py +0 -0
/opik/evaluation/metrics/conversation/{session_completeness → llm_judges/conversational_coherence}/__init__.py +0 -0
/opik/evaluation/metrics/conversation/{conversational_coherence → llm_judges/conversational_coherence}/schema.py +0 -0
/opik/evaluation/metrics/conversation/{user_frustration → llm_judges/session_completeness}/__init__.py +0 -0
/opik/evaluation/metrics/conversation/{session_completeness → llm_judges/session_completeness}/schema.py +0 -0
/opik/evaluation/metrics/conversation/{user_frustration → llm_judges/user_frustration}/schema.py +0 -0
/opik/integrations/bedrock/{stream_wrappers.py → converse/stream_wrappers.py} +0 -0
/opik/rest_api/{spans/types → types}/span_update_type.py +0 -0
{opik-1.8.39.dist-info → opik-1.9.71.dist-info}/WHEEL +0 -0
{opik-1.8.39.dist-info → opik-1.9.71.dist-info}/entry_points.txt +0 -0
{opik-1.8.39.dist-info → opik-1.9.71.dist-info}/licenses/LICENSE +0 -0
{opik-1.8.39.dist-info → opik-1.9.71.dist-info}/top_level.txt +0 -0

opik/cli/exports/experiment.py ADDED Viewed

@@ -0,0 +1,784 @@
+"""Experiment export functionality."""
+import sys
+from concurrent.futures import Future, ThreadPoolExecutor, as_completed
+from datetime import datetime
+from pathlib import Path
+from typing import Optional, List, Dict, Tuple
+import click
+from rich.console import Console
+from rich.progress import (
+    Progress,
+    SpinnerColumn,
+    TextColumn,
+    BarColumn,
+    TaskProgressColumn,
+)
+import opik
+from opik import exceptions
+from .utils import (
+    create_experiment_data_structure,
+    debug_print,
+    write_json_data,
+    write_csv_data,
+    print_export_summary,
+    should_skip_file,
+    trace_to_csv_rows,
+)
+from .dataset import export_experiment_datasets
+from .prompt import (
+    export_related_prompts_by_name,
+    export_prompts_by_ids,
+)
+# Shared rich console used for user-facing output throughout this module
+console = Console()
+# Number of trace IDs processed per batch in export_traces_by_ids
+BATCH_SIZE = 100
+# max_workers given to each ThreadPoolExecutor used to fetch and write traces
+MAX_WORKERS = 20
+def _fetch_trace_data(
+    client: opik.Opik,
+    trace_id: str,
+    project_name_cache: dict[str, str],
+    debug: bool,
+) -> Optional[Tuple[str, dict, str]]:
+    """Load one trace with its spans and resolve the name of its project.
+    Args:
+        client: Opik client used for the trace, project and span lookups.
+        trace_id: ID of the trace to load.
+        project_name_cache: Mapping of project ID to project name. It is
+            consulted first and filled in here when a project is looked up.
+        debug: When true, failures are reported through debug_print.
+    Returns:
+        Tuple of (trace_id, trace_data_dict, project_name), or None when the
+        trace has no project ID or any of the lookups raises.
+    """
+    try:
+        trace = client.get_trace_content(trace_id)
+        project_id = trace.project_id
+        # Without a project ID there is no project name to resolve
+        if not project_id:
+            return None
+        # Only call the API for projects that are not in the cache yet
+        if project_id not in project_name_cache:
+            try:
+                project_name_cache[project_id] = client.get_project(project_id).name
+            except Exception as e:
+                if debug:
+                    debug_print(
+                        f"Warning: Could not get project for trace {trace_id}: {e}",
+                        debug,
+                    )
+                return None
+        project_name = project_name_cache[project_id]
+        span_list = client.search_spans(
+            trace_id=trace_id,
+            max_results=1000,
+            truncate=False,
+        )
+        # Build the payload pieces in the same order as the resulting keys
+        trace_payload = trace.model_dump()
+        span_payloads = [span.model_dump() for span in span_list]
+        fetched_at = datetime.now().isoformat()
+        trace_data = {
+            "trace": trace_payload,
+            "spans": span_payloads,
+            "downloaded_at": fetched_at,
+            "project_name": project_name,
+        }
+        return (trace_id, trace_data, project_name)
+    except Exception as e:
+        # Any failure is reported (in debug mode) and turned into None
+        if debug:
+            import traceback
+            debug_print(
+                f"Error fetching trace {trace_id}: {e}\n{traceback.format_exc()}", debug
+            )
+        return None
+def _write_trace_file(
+    trace_id: str,
+    trace_data: dict,
+    project_name: str,
+    workspace_root: Path,
+    format: str,
+    force: bool,
+    debug: bool,
+) -> bool:
+    """Store one fetched trace under workspace_root/projects/PROJECT_NAME/.
+    Args:
+        trace_id: ID of the trace; used to build the file name.
+        trace_data: Trace payload handed to the CSV or JSON writer.
+        project_name: Name of the directory created under "projects".
+        workspace_root: Root directory of the exported workspace.
+        format: "csv" (case-insensitive) writes a CSV file; any other value
+            writes JSON.
+        force: Forwarded to should_skip_file together with the target path.
+        debug: When true, progress and tracebacks go through debug_print.
+    Returns:
+        True if the file was written; False if should_skip_file said to skip
+        it or if writing raised.
+    """
+    try:
+        target_dir = workspace_root / "projects" / project_name
+        target_dir.mkdir(parents=True, exist_ok=True)
+        as_csv = format.lower() == "csv"
+        file_name = f"trace_{trace_id}.csv" if as_csv else f"trace_{trace_id}.json"
+        target_file = target_dir / file_name
+        # Leave the file alone when the skip check says so
+        if should_skip_file(target_file, force):
+            if debug:
+                debug_print(f"Skipping trace {trace_id} (already exists)", debug)
+            return False
+        if as_csv:
+            write_csv_data(trace_data, target_file, trace_to_csv_rows)
+            written_message = f"Wrote CSV file: {target_file}"
+        else:
+            write_json_data(trace_data, target_file)
+            written_message = f"Wrote JSON file: {target_file}"
+        if debug:
+            debug_print(written_message, debug)
+        return True
+    except Exception as e:
+        console.print(f"[red]Error writing trace {trace_id} to file: {e}[/red]")
+        if debug:
+            import traceback
+            debug_print(f"Traceback: {traceback.format_exc()}", debug)
+        return False
+def export_traces_by_ids(
+    client: opik.Opik,
+    trace_ids: List[str],
+    workspace_root: Path,
+    max_traces: Optional[int],
+    format: str,
+    debug: bool,
+    force: bool,
+) -> tuple[int, int]:
+    """Fetch the given traces and write them to disk, one batch at a time.
+    Every batch of BATCH_SIZE IDs is fetched on a thread pool through
+    _fetch_trace_data; the traces that were fetched are then written on a
+    second thread pool through _write_trace_file.
+    Args:
+        client: Opik client handed to the fetch workers.
+        trace_ids: IDs of the traces to export.
+        workspace_root: Root directory handed to the write workers.
+        max_traces: When truthy, only the first max_traces IDs are exported.
+        format: Export format handed to the write workers.
+        debug: Enables debug output and error messages.
+        force: Handed to the write workers.
+    Returns:
+        Tuple of (exported_count, skipped_count): the number of writes that
+        returned True and the number that returned False. Traces that could
+        not be fetched are counted in neither.
+    """
+    if max_traces:
+        trace_ids = trace_ids[:max_traces]
+    if not trace_ids:
+        return 0, 0
+    exported_count = 0
+    skipped_count = 0
+    if debug:
+        debug_print(
+            f"Exporting {len(trace_ids)} trace(s) in batches of {BATCH_SIZE}", debug
+        )
+    # One project-name cache shared by all fetch workers
+    project_name_cache: dict[str, str] = {}
+    progress_columns = (
+        SpinnerColumn(),
+        TextColumn("[progress.description]{task.description}"),
+        BarColumn(),
+        TaskProgressColumn(),
+    )
+    with Progress(*progress_columns, console=console) as progress:
+        task = progress.add_task(
+            f"Exporting {len(trace_ids)} traces...", total=len(trace_ids)
+        )
+        for batch_start in range(0, len(trace_ids), BATCH_SIZE):
+            batch_end = min(batch_start + BATCH_SIZE, len(trace_ids))
+            batch_trace_ids = trace_ids[batch_start:batch_end]
+            if debug:
+                debug_print(
+                    f"Batch {batch_start // BATCH_SIZE + 1}: traces {batch_start + 1}-{batch_end}",
+                    debug,
+                )
+            # Phase 1: fetch every trace of the batch in parallel
+            fetched_traces: dict[str, Tuple[dict, str]] = {}
+            with ThreadPoolExecutor(max_workers=MAX_WORKERS) as fetch_executor:
+                fetch_futures = {
+                    fetch_executor.submit(
+                        _fetch_trace_data,
+                        client,
+                        batch_trace_id,
+                        project_name_cache,
+                        debug,
+                    ): batch_trace_id
+                    for batch_trace_id in batch_trace_ids
+                }
+                for done_fetch in as_completed(fetch_futures):
+                    try:
+                        fetch_result = done_fetch.result()
+                        if fetch_result is None:
+                            continue
+                        fetched_trace_id, trace_data, project_name = fetch_result
+                        fetched_traces[fetched_trace_id] = (trace_data, project_name)
+                    except Exception as e:
+                        if debug:
+                            trace_id = fetch_futures[done_fetch]
+                            console.print(
+                                f"[red]Error fetching trace {trace_id}: {e}[/red]"
+                            )
+            # Phase 2: write the fetched traces in parallel
+            with ThreadPoolExecutor(max_workers=MAX_WORKERS) as write_executor:
+                write_futures = {
+                    write_executor.submit(
+                        _write_trace_file,
+                        fetched_trace_id,
+                        trace_data,
+                        project_name,
+                        workspace_root,
+                        format,
+                        force,
+                        debug,
+                    ): fetched_trace_id
+                    for fetched_trace_id, (
+                        trace_data,
+                        project_name,
+                    ) in fetched_traces.items()
+                }
+                for done_write in as_completed(write_futures):
+                    try:
+                        if done_write.result():
+                            exported_count += 1
+                        else:
+                            skipped_count += 1
+                    except Exception as e:
+                        if debug:
+                            trace_id = write_futures[done_write]
+                            console.print(
+                                f"[red]Error writing trace {trace_id}: {e}[/red]"
+                            )
+                    finally:
+                        # Advance once per attempted write, whatever its outcome
+                        progress.update(
+                            task,
+                            advance=1,
+                            description=f"Exported {exported_count}/{len(trace_ids)} traces",
+                        )
+            # Traces that were never fetched had no write; advance for them too
+            for trace_id in batch_trace_ids:
+                if trace_id not in fetched_traces:
+                    progress.update(task, advance=1)
+    return exported_count, skipped_count
+def export_experiment_by_id(
+    client: opik.Opik,
+    output_dir: Path,
+    experiment_id: str,
+    max_traces: Optional[int],
+    force: bool,
+    debug: bool,
+    format: str,
+    trace_ids_collector: Optional[set[str]] = None,
+) -> tuple[Dict[str, int], int]:
+    """Export one experiment's JSON file and its related prompts.
+    Datasets and traces are not written here. The trace IDs found on the
+    experiment items are added to trace_ids_collector so that the caller can
+    export them afterwards.
+    Args:
+        client: Opik client used to look up the experiment.
+        output_dir: Directory that receives the experiment JSON file.
+        experiment_id: ID of the experiment to export.
+        max_traces: Not used by this function; kept for interface compatibility.
+        force: Rewrite the experiment file even if it already exists.
+        debug: Enables debug output.
+        format: Forwarded to export_related_prompts_by_name.
+        trace_ids_collector: Optional set that receives the trace IDs of the
+            experiment items.
+    Returns:
+        Tuple of (stats, file_written) where:
+        - stats: Dictionary with the keys "datasets", "prompts", "traces" and
+          their "*_skipped" counterparts. The same keys are present on every
+          return path; only "prompts" is filled in here.
+        - file_written: 1 if the experiment file was written, 0 if it was
+          skipped, the experiment was not found, or an error occurred.
+    """
+    try:
+        console.print(f"[blue]Fetching experiment by ID: {experiment_id}[/blue]")
+        experiment = client.get_experiment_by_id(experiment_id)
+        if not experiment:
+            console.print(f"[red]Experiment '{experiment_id}' not found[/red]")
+            return (_empty_experiment_stats(), 0)
+        debug_print(f"Found experiment: {experiment.name}", debug)
+        # Fetching the items can be slow for large experiments, so show a spinner
+        console.print("[blue]Fetching experiment items...[/blue]")
+        with Progress(
+            SpinnerColumn(),
+            TextColumn("[progress.description]{task.description}"),
+            console=console,
+        ) as progress:
+            task = progress.add_task("Getting experiment items...", total=None)
+            experiment_items = experiment.get_items()
+            progress.update(task, description="Got experiment items")
+        experiment_data = create_experiment_data_structure(experiment, experiment_items)
+        # The ID is part of the file name so experiments sharing a name do not collide.
+        # NOTE(review): experiment.name is used verbatim as a path component;
+        # confirm names cannot contain path separators.
+        experiment_file = (
+            output_dir / f"experiment_{experiment.name}_{experiment.id}.json"
+        )
+        experiment_file_written = False
+        if not experiment_file.exists() or force:
+            write_json_data(experiment_data, experiment_file)
+            experiment_file_written = True
+            debug_print(
+                f"Exported experiment: {experiment.name} (ID: {experiment.id})", debug
+            )
+        else:
+            debug_print(
+                f"Skipping experiment {experiment.name} (ID: {experiment.id}) (already exists)",
+                debug,
+            )
+        # Only the prompts related by name are exported here; traces are left
+        # to the caller, so their counters stay at zero.
+        stats = _empty_experiment_stats()
+        stats["prompts"] = export_related_prompts_by_name(
+            client, experiment, output_dir, force, debug, format
+        )
+        # Hand the trace IDs of the experiment items to the caller
+        trace_ids = [item.trace_id for item in experiment_items if item.trace_id]
+        if trace_ids_collector is not None:
+            trace_ids_collector.update(trace_ids)
+        if debug:
+            console.print(
+                f"[green]Experiment {experiment.name} exported with stats: {stats}[/green]"
+            )
+        return (stats, 1 if experiment_file_written else 0)
+    except Exception as e:
+        console.print(f"[red]Error exporting experiment {experiment_id}: {e}[/red]")
+        return (_empty_experiment_stats(), 0)
+def _empty_experiment_stats() -> Dict[str, int]:
+    """Return a zeroed stats dictionary with every key export_experiment_by_id reports."""
+    return {
+        "datasets": 0,
+        "datasets_skipped": 0,
+        "prompts": 0,
+        "prompts_skipped": 0,
+        "traces": 0,
+        "traces_skipped": 0,
+    }
+def export_experiment_by_name(
+    name: str,
+    workspace: str,
+    output_path: str,
+    dataset: Optional[str],
+    max_traces: Optional[int],
+    force: bool,
+    debug: bool,
+    format: str,
+    api_key: Optional[str] = None,
+) -> None:
+    """Export every experiment whose name exactly matches `name`.
+    Datasets and prompts referenced by the matching experiments are exported
+    once up front, then each experiment file is written, and finally the
+    trace IDs collected from all experiments are exported in a single pass.
+    Args:
+        name: Exact experiment name to look up.
+        workspace: Workspace name; also the directory created under output_path.
+        output_path: Root directory of the export.
+        dataset: When set, only experiments whose dataset_name equals this
+            value are exported.
+        max_traces: Upper bound on the total number of traces exported across
+            all matching experiments; a falsy value means no limit.
+        force: Forwarded to the export helpers to re-export existing files.
+        debug: Enables debug output.
+        format: Export format forwarded to the dataset, prompt and trace exporters.
+        api_key: Optional API key for the Opik client.
+    Prints a message and returns if no experiment matches. Exits the process
+    with status 1 if an unexpected error occurs.
+    """
+    try:
+        if debug:
+            debug_print(f"Exporting experiment: {name}", debug)
+        # Initialize client
+        if api_key:
+            client = opik.Opik(api_key=api_key, workspace=workspace)
+        else:
+            client = opik.Opik(workspace=workspace)
+        # Create output directories
+        output_dir = Path(output_path) / workspace / "experiments"
+        output_dir.mkdir(parents=True, exist_ok=True)
+        datasets_dir = Path(output_path) / workspace / "datasets"
+        datasets_dir.mkdir(parents=True, exist_ok=True)
+        if debug:
+            debug_print(f"Target directory: {output_dir}", debug)
+        # Look up the experiments by exact name
+        try:
+            experiments = client.get_experiments_by_name(name)
+            if not experiments:
+                console.print(f"[red]Experiment '{name}' not found[/red]")
+                return
+            if debug:
+                debug_print(
+                    f"Found {len(experiments)} experiment(s) with name '{name}'", debug
+                )
+            if len(experiments) > 1:
+                console.print(
+                    f"[blue]Found {len(experiments)} experiments with name '{name}', exporting all of them[/blue]"
+                )
+        except Exception as e:
+            console.print(f"[red]Experiment '{name}' not found: {e}[/red]")
+            return
+        # Filter experiments by dataset if specified (client-side filtering)
+        if dataset:
+            experiments = [exp for exp in experiments if exp.dataset_name == dataset]
+            if not experiments:
+                console.print(
+                    f"[yellow]No experiments found with name '{name}' using dataset '{dataset}'[/yellow]"
+                )
+                return
+            if debug:
+                debug_print(
+                    f"Filtered to {len(experiments)} experiment(s) using dataset '{dataset}'",
+                    debug,
+                )
+        # First pass: collect the datasets and prompt IDs used by the
+        # experiments (available without fetching experiment items)
+        unique_datasets: set[str] = set()
+        unique_prompt_ids: set[str] = set()
+        for experiment in experiments:
+            if experiment.dataset_name:
+                unique_datasets.add(experiment.dataset_name)
+            experiment_data = experiment.get_experiment_data()
+            if experiment_data.prompt_versions:
+                for prompt_version in experiment_data.prompt_versions:
+                    if prompt_version.prompt_id:
+                        unique_prompt_ids.add(prompt_version.prompt_id)
+        # Export all unique datasets once before processing experiments
+        datasets_exported = 0
+        datasets_skipped = 0
+        if unique_datasets:
+            if len(unique_datasets) > 1:
+                console.print(
+                    f"[blue]Exporting {len(unique_datasets)} unique dataset(s) used by these experiments...[/blue]"
+                )
+            datasets_exported, datasets_skipped = export_experiment_datasets(
+                client, unique_datasets, datasets_dir, format, debug, force
+            )
+        # Export all unique prompts once before processing experiments
+        prompts_dir = output_dir.parent / "prompts"
+        prompts_dir.mkdir(parents=True, exist_ok=True)
+        prompts_exported = 0
+        prompts_skipped = 0
+        if unique_prompt_ids:
+            if len(unique_prompt_ids) > 1:
+                console.print(
+                    f"[blue]Exporting {len(unique_prompt_ids)} unique prompt(s) used by these experiments...[/blue]"
+                )
+            prompts_exported, prompts_skipped = export_prompts_by_ids(
+                client, unique_prompt_ids, prompts_dir, format, debug, force
+            )
+        # Trace IDs are collected while the experiments are exported and
+        # written once afterwards, so shared traces are exported only once
+        all_trace_ids: set[str] = set()
+        exported_count = 0
+        skipped_count = 0
+        # Per-experiment stats only cover prompts related by name
+        aggregated_stats = {
+            "prompts": 0,
+            "prompts_skipped": 0,
+        }
+        for experiment in experiments:
+            if debug:
+                debug_print(
+                    f"Exporting experiment: {experiment.name} (ID: {experiment.id})",
+                    debug,
+                )
+            exp_stats, file_written = export_experiment_by_id(
+                client,
+                output_dir,
+                experiment.id,
+                max_traces,
+                force,
+                debug,
+                format,
+                all_trace_ids,
+            )
+            aggregated_stats["prompts"] += exp_stats.get("prompts", 0)
+            aggregated_stats["prompts_skipped"] += exp_stats.get("prompts_skipped", 0)
+            if file_written > 0:
+                exported_count += 1
+            else:
+                skipped_count += 1
+        # Export all unique traces once after collecting them from all experiments
+        workspace_root = output_dir.parent
+        traces_exported = 0
+        traces_skipped = 0
+        if all_trace_ids:
+            # Sort before truncating: a set has no stable order, so slicing
+            # list(set) would keep a different subset of traces on every run.
+            trace_ids_list = sorted(all_trace_ids)
+            if max_traces:
+                trace_ids_list = trace_ids_list[:max_traces]
+            if trace_ids_list:
+                if len(all_trace_ids) > 1:
+                    console.print(
+                        f"[blue]Exporting {len(trace_ids_list)} unique trace(s) from these experiments...[/blue]"
+                    )
+                # The limit is already applied above, so none is passed on
+                traces_exported, traces_skipped = export_traces_by_ids(
+                    client, trace_ids_list, workspace_root, None, format, debug, force
+                )
+        # Collect statistics for summary
+        stats = {
+            "experiments": exported_count,
+            "experiments_skipped": skipped_count,
+            "datasets": datasets_exported,
+            "datasets_skipped": datasets_skipped,
+            "prompts": prompts_exported + aggregated_stats["prompts"],
+            "prompts_skipped": prompts_skipped + aggregated_stats["prompts_skipped"],
+            "traces": traces_exported,
+            "traces_skipped": traces_skipped,
+        }
+        print_export_summary(stats, format)
+        if exported_count > 0:
+            if len(experiments) > 1:
+                console.print(
+                    f"[green]Successfully exported {exported_count} experiment(s) with name '{name}' to {output_dir}[/green]"
+                )
+            else:
+                console.print(
+                    f"[green]Successfully exported experiment '{name}' to {output_dir}[/green]"
+                )
+        else:
+            console.print(
+                f"[yellow]All {len(experiments)} experiment(s) with name '{name}' already exist (use --force to re-download)[/yellow]"
+            )
+    except Exception as e:
+        console.print(f"[red]Error exporting experiment: {e}[/red]")
+        sys.exit(1)
+def export_experiment_by_name_or_id(
+    name_or_id: str,
+    workspace: str,
+    output_path: str,
+    dataset: Optional[str],
+    max_traces: Optional[int],
+    force: bool,
+    debug: bool,
+    format: str,
+    api_key: Optional[str] = None,
+) -> None:
+    """Export an experiment by name or ID.
+    First tries to get the experiment by ID. If that raises
+    ExperimentNotFound, falls back to export_experiment_by_name.
+    Args:
+        name_or_id: Experiment ID, or exact experiment name.
+        workspace: Workspace name; also the directory created under output_path.
+        output_path: Root directory of the export.
+        dataset: Dataset filter; only applied by the name-based fallback, the
+            ID path does not use it.
+        max_traces: Upper bound on the number of traces exported; a falsy
+            value means no limit.
+        force: Forwarded to the export helpers to re-export existing files.
+        debug: Enables debug output.
+        format: Export format forwarded to the dataset and trace exporters.
+        api_key: Optional API key for the Opik client.
+    Exits the process with status 1 if an unexpected error occurs.
+    """
+    try:
+        if debug:
+            debug_print(f"Attempting to export experiment: {name_or_id}", debug)
+        # Initialize client
+        if api_key:
+            client = opik.Opik(api_key=api_key, workspace=workspace)
+        else:
+            client = opik.Opik(workspace=workspace)
+        # Create output directories
+        output_dir = Path(output_path) / workspace / "experiments"
+        output_dir.mkdir(parents=True, exist_ok=True)
+        datasets_dir = Path(output_path) / workspace / "datasets"
+        datasets_dir.mkdir(parents=True, exist_ok=True)
+        # Try to get experiment by ID first
+        try:
+            if debug:
+                debug_print(f"Trying to get experiment by ID: {name_or_id}", debug)
+            experiment = client.get_experiment_by_id(name_or_id)
+            if debug:
+                debug_print(
+                    f"Found experiment by ID: {experiment.name} (ID: {experiment.id})",
+                    debug,
+                )
+            # Trace IDs are collected during the experiment export and
+            # written afterwards
+            trace_ids_collector: set[str] = set()
+            exp_stats, file_written = export_experiment_by_id(
+                client,
+                output_dir,
+                name_or_id,
+                max_traces,
+                force,
+                debug,
+                format,
+                trace_ids_collector,
+            )
+            # Export the dataset the experiment refers to, if any
+            unique_datasets: set[str] = set()
+            if experiment.dataset_name:
+                unique_datasets.add(experiment.dataset_name)
+            datasets_exported = 0
+            datasets_skipped = 0
+            if unique_datasets:
+                datasets_exported, datasets_skipped = export_experiment_datasets(
+                    client, unique_datasets, datasets_dir, format, debug, force
+                )
+            # Export traces collected from experiment items
+            workspace_root = output_dir.parent
+            traces_exported = 0
+            traces_skipped = 0
+            if trace_ids_collector:
+                # Sort before truncating: a set has no stable order, so slicing
+                # list(set) would keep a different subset of traces on every run.
+                trace_ids_list = sorted(trace_ids_collector)
+                if max_traces:
+                    trace_ids_list = trace_ids_list[:max_traces]
+                if trace_ids_list:
+                    # The limit is already applied above, so none is passed on
+                    traces_exported, traces_skipped = export_traces_by_ids(
+                        client,
+                        trace_ids_list,
+                        workspace_root,
+                        None,
+                        format,
+                        debug,
+                        force,
+                    )
+            # Collect statistics for summary
+            stats = {
+                "experiments": 1 if file_written > 0 else 0,
+                "experiments_skipped": 0 if file_written > 0 else 1,
+                "datasets": datasets_exported,
+                "datasets_skipped": datasets_skipped,
+                "prompts": exp_stats.get("prompts", 0),
+                "prompts_skipped": exp_stats.get("prompts_skipped", 0),
+                "traces": traces_exported,
+                "traces_skipped": traces_skipped,
+            }
+            print_export_summary(stats, format)
+            if file_written > 0:
+                console.print(
+                    f"[green]Successfully exported experiment '{experiment.name}' (ID: {experiment.id}) to {output_dir}[/green]"
+                )
+            else:
+                console.print(
+                    f"[yellow]Experiment '{experiment.name}' (ID: {experiment.id}) already exists (use --force to re-download)[/yellow]"
+                )
+            return
+        except exceptions.ExperimentNotFound:
+            # Not an ID of an existing experiment: fall through to the
+            # name-based export below
+            if debug:
+                debug_print(
+                    f"Experiment not found by ID, trying by name: {name_or_id}", debug
+                )
+        # Reached only when the ID lookup raised ExperimentNotFound
+        export_experiment_by_name(
+            name_or_id,
+            workspace,
+            output_path,
+            dataset,
+            max_traces,
+            force,
+            debug,
+            format,
+            api_key,
+        )
+    except Exception as e:
+        console.print(f"[red]Error exporting experiment: {e}[/red]")
+        sys.exit(1)
+@click.command(name="experiment")
+@click.argument("name_or_id", type=str)
+@click.option(
+    "--dataset",
+    type=str,
+    help="Filter experiments by dataset name. Only experiments using this dataset will be exported.",
+)
+@click.option(
+    "--max-traces",
+    type=int,
+    help="Maximum total number of traces to export across all matched experiments.",
+)
+@click.option(
+    "--path",
+    "-p",
+    type=click.Path(file_okay=False, dir_okay=True, writable=True),
+    default="opik_exports",
+    help="Directory to save exported data. Defaults to opik_exports.",
+)
+@click.option(
+    "--force",
+    is_flag=True,
+    help="Re-download items even if they already exist locally.",
+)
+@click.option(
+    "--debug",
+    is_flag=True,
+    help="Enable debug output to show detailed information about the export process.",
+)
+@click.option(
+    "--format",
+    type=click.Choice(["json", "csv"], case_sensitive=False),
+    default="json",
+    help="Format for exporting data. Defaults to json.",
+)
+@click.pass_context
+def export_experiment_command(
+    ctx: click.Context,
+    name_or_id: str,
+    dataset: Optional[str],
+    max_traces: Optional[int],
+    path: str,
+    force: bool,
+    debug: bool,
+    format: str,
+) -> None:
+    """Export an experiment by ID or exact name to workspace/experiments.
+    The command will first try to find the experiment by ID. If not found, it will try by name.
+    """
+    # The workspace and API key are read from the click context object
+    # (presumably filled in by the parent command group). Treat a missing
+    # object the same way for both values and fail with a usage error instead
+    # of a TypeError/KeyError traceback when no workspace is available.
+    context_data = ctx.obj or {}
+    if "workspace" not in context_data:
+        raise click.UsageError(
+            "Workspace is not set in the CLI context; run this command through its parent command group."
+        )
+    workspace = context_data["workspace"]
+    api_key = context_data.get("api_key")
+    export_experiment_by_name_or_id(
+        name_or_id, workspace, path, dataset, max_traces, force, debug, format, api_key
+    )

opik 1.8.39__py3-none-any.whl → 1.9.71__py3-none-any.whl

opik 1.8.39py3-none-any.whl → 1.9.71py3-none-any.whl