judgeval 0.0.19__tar.gz → 0.0.20__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {judgeval-0.0.19 → judgeval-0.0.20}/PKG-INFO +1 -1
- {judgeval-0.0.19 → judgeval-0.0.20}/Pipfile +5 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/Pipfile.lock +638 -104
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/api_reference/trace.mdx +2 -1
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/data_datasets.mdx +30 -7
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/introduction.mdx +6 -1
- judgeval-0.0.20/docs/evaluation/scorers/execution_order.mdx +72 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/introduction.mdx +2 -2
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/unit_testing.mdx +2 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/getting_started.mdx +95 -36
- judgeval-0.0.20/docs/images/basic_trace_example.png +0 -0
- judgeval-0.0.20/docs/images/online_eval_fault.png +0 -0
- judgeval-0.0.20/docs/images/trace_ss.png +0 -0
- judgeval-0.0.20/docs/integration/langgraph.mdx +27 -0
- judgeval-0.0.20/docs/introduction.mdx +19 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/mint.json +8 -2
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/monitoring/tracing.mdx +17 -14
- {judgeval-0.0.19 → judgeval-0.0.20}/pyproject.toml +1 -1
- judgeval-0.0.20/src/demo/cookbooks/JNPR_Mist/test.py +21 -0
- judgeval-0.0.20/src/demo/cookbooks/langgraph_basic/agent.py +109 -0
- judgeval-0.0.20/src/demo/cookbooks/linkd/text2sql.py +14 -0
- judgeval-0.0.20/src/demo/customer_use/jnpr/mist/demo.py +131 -0
- judgeval-0.0.20/src/demo/customer_use/jnpr/mist/test.yaml +11 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/common/tracer.py +24 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/constants.py +1 -1
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/data/api_example.py +3 -16
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/data/datasets/dataset.py +114 -2
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/data/example.py +16 -15
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/data/result.py +3 -3
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/__init__.py +2 -2
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/__init__.py +6 -6
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/__init__.py +2 -2
- judgeval-0.0.20/src/judgeval/scorers/judgeval_scorers/api_scorers/execution_order.py +35 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/__init__.py +2 -2
- judgeval-0.0.20/src/judgeval/scorers/judgeval_scorers/local_implementations/execution_order/__init__.py +3 -0
- judgeval-0.0.19/src/judgeval/scorers/judgeval_scorers/local_implementations/tool_correctness/tool_correctness_scorer.py → judgeval-0.0.20/src/judgeval/scorers/judgeval_scorers/local_implementations/execution_order/execution_order.py +3 -3
- judgeval-0.0.19/docs/evaluation/scorers/tool_correctness.mdx +0 -50
- judgeval-0.0.19/docs/images/basic_trace_example.png +0 -0
- judgeval-0.0.19/docs/images/trace_screenshot.png +0 -0
- judgeval-0.0.19/docs/introduction.mdx +0 -90
- judgeval-0.0.19/src/demo/cookbooks/langgraph_basic/agent.py +0 -114
- judgeval-0.0.19/src/judgeval/scorers/judgeval_scorers/api_scorers/tool_correctness.py +0 -19
- judgeval-0.0.19/src/judgeval/scorers/judgeval_scorers/local_implementations/tool_correctness/__init__.py +0 -3
- {judgeval-0.0.19 → judgeval-0.0.20}/.github/workflows/ci.yaml +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/.gitignore +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/LICENSE.md +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/README.md +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/README.md +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/api_reference/judgment_client.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/development.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/essentials/code.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/essentials/images.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/essentials/markdown.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/essentials/navigation.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/essentials/reusable-snippets.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/essentials/settings.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/data_examples.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/judges.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/answer_correctness.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/answer_relevancy.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/classifier_scorer.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/comparison.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/contextual_precision.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/contextual_recall.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/contextual_relevancy.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/custom_scorers.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/faithfulness.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/hallucination.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/json_correctness.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/evaluation/scorers/summarization.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/favicon.svg +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/images/checks-passed.png +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/images/create_aggressive_scorer.png +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/images/create_scorer.png +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/images/evaluation_diagram.png +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/images/hero-dark.svg +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/images/hero-light.svg +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/judgment/introduction.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/logo/dark.svg +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/logo/light.svg +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/monitoring/introduction.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/monitoring/production_insights.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/notebooks/create_dataset.ipynb +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/notebooks/create_scorer.ipynb +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/notebooks/demo.ipynb +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/notebooks/prompt_scorer.ipynb +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/notebooks/quickstart.ipynb +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/quickstart.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/docs/snippets/snippet-intro.mdx +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/pytest.ini +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/anime_chatbot_agent/animeChatBot.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/ci_testing/ci_testing.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/ci_testing/travel_response.txt +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/custom_scorers/competitor_mentions.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/custom_scorers/text2sql.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/jpmorgan/demo.ipynb +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/jpmorgan/demo.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/jpmorgan/vectordbdocs.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/langchain_basic_rag/basic_agentic_rag.ipynb +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/langchain_basic_rag/tesla_q3.pdf +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/langchain_sales/example_product_price_id_mapping.json +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/langchain_sales/sales_agent_with_context.ipynb +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/langchain_sales/sample_product_catalog.txt +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/langgraph_basic/agent.ipynb +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/new_bot/basic_bot.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/openai_travel_agent/agent.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/openai_travel_agent/populate_db.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/openai_travel_agent/tools.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/rules_alerts/rules_bot.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/rules_alerts/rules_demo.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/cookbooks/rules_alerts/utils_helper.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/demo/customer_use/jnpr/srikar_demo.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/clients.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/common/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/common/exceptions.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/common/logger.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/common/utils.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/data/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/data/datasets/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/data/datasets/eval_dataset_client.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/data/datasets/utils.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/data/ground_truth.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/data/scorer_data.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/evaluation_run.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/judges/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/judges/base_judge.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/judges/litellm_judge.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/judges/mixture_of_judges.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/judges/together_judge.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/judges/utils.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/judgment_client.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/rules.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/run_evaluation.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/api_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/base_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/exceptions.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/answer_correctness.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/answer_relevancy.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/comparison.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/contextual_precision.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/contextual_recall.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/contextual_relevancy.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/faithfulness.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/groundedness.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/hallucination.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/instruction_adherence.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/json_correctness.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/api_scorers/summarization.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/classifiers/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/classifiers/text2sql/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/classifiers/text2sql/text2sql_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/answer_correctness_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/prompts.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/answer_relevancy_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/prompts.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/comparison/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/comparison/comparison_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/comparison/prompts.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_precision/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_precision/contextual_precision_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_precision/prompts.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_recall/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_recall/contextual_recall_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_recall/prompts.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_relevancy/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_relevancy/contextual_relevancy_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_relevancy/prompts.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/faithfulness/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/faithfulness/faithfulness_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/faithfulness/prompts.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/hallucination/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/hallucination/hallucination_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/hallucination/prompts.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/instruction_adherence/instruction_adherence.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/instruction_adherence/prompt.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/json_correctness/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/json_correctness/json_correctness_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/summarization/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/summarization/prompts.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/judgeval_scorers/local_implementations/summarization/summarization_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/prompt_scorer.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/score.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/scorers/utils.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/tracer/__init__.py +0 -0
- {judgeval-0.0.19 → judgeval-0.0.20}/src/judgeval/utils/alerts.py +0 -0