PyPI - langchain - Versions diffs - 0.3.26__py3-none-any.whl → 0.3.27__py3-none-any.whl - Mend

langchain 0.3.26-py3-none-any.whl → 0.3.27-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of langchain might be problematic. Click here for more details.

Files changed (580)

langchain/__init__.py +110 -96
langchain/_api/__init__.py +2 -2
langchain/_api/deprecation.py +3 -3
langchain/_api/module_import.py +51 -46
langchain/_api/path.py +1 -1
langchain/adapters/openai.py +8 -8
langchain/agents/__init__.py +15 -12
langchain/agents/agent.py +160 -133
langchain/agents/agent_iterator.py +31 -14
langchain/agents/agent_toolkits/__init__.py +7 -6
langchain/agents/agent_toolkits/ainetwork/toolkit.py +1 -1
langchain/agents/agent_toolkits/amadeus/toolkit.py +1 -1
langchain/agents/agent_toolkits/azure_cognitive_services.py +1 -1
langchain/agents/agent_toolkits/clickup/toolkit.py +1 -1
langchain/agents/agent_toolkits/conversational_retrieval/openai_functions.py +6 -4
langchain/agents/agent_toolkits/csv/__init__.py +4 -2
langchain/agents/agent_toolkits/file_management/__init__.py +1 -1
langchain/agents/agent_toolkits/file_management/toolkit.py +1 -1
langchain/agents/agent_toolkits/github/toolkit.py +9 -9
langchain/agents/agent_toolkits/gitlab/toolkit.py +1 -1
langchain/agents/agent_toolkits/json/base.py +1 -1
langchain/agents/agent_toolkits/multion/toolkit.py +1 -1
langchain/agents/agent_toolkits/office365/toolkit.py +1 -1
langchain/agents/agent_toolkits/openapi/base.py +1 -1
langchain/agents/agent_toolkits/openapi/planner.py +2 -2
langchain/agents/agent_toolkits/openapi/planner_prompt.py +10 -10
langchain/agents/agent_toolkits/openapi/prompt.py +1 -1
langchain/agents/agent_toolkits/openapi/toolkit.py +1 -1
langchain/agents/agent_toolkits/pandas/__init__.py +4 -2
langchain/agents/agent_toolkits/playwright/__init__.py +1 -1
langchain/agents/agent_toolkits/playwright/toolkit.py +1 -1
langchain/agents/agent_toolkits/powerbi/base.py +1 -1
langchain/agents/agent_toolkits/powerbi/chat_base.py +1 -1
langchain/agents/agent_toolkits/powerbi/prompt.py +2 -2
langchain/agents/agent_toolkits/powerbi/toolkit.py +1 -1
langchain/agents/agent_toolkits/python/__init__.py +4 -2
langchain/agents/agent_toolkits/spark/__init__.py +4 -2
langchain/agents/agent_toolkits/spark_sql/base.py +1 -1
langchain/agents/agent_toolkits/spark_sql/toolkit.py +1 -1
langchain/agents/agent_toolkits/sql/prompt.py +1 -1
langchain/agents/agent_toolkits/sql/toolkit.py +1 -1
langchain/agents/agent_toolkits/vectorstore/base.py +2 -2
langchain/agents/agent_toolkits/vectorstore/prompt.py +2 -4
langchain/agents/agent_toolkits/vectorstore/toolkit.py +12 -11
langchain/agents/agent_toolkits/xorbits/__init__.py +4 -2
langchain/agents/agent_toolkits/zapier/toolkit.py +1 -1
langchain/agents/agent_types.py +6 -6
langchain/agents/chat/base.py +6 -12
langchain/agents/chat/output_parser.py +9 -6
langchain/agents/chat/prompt.py +3 -4
langchain/agents/conversational/base.py +9 -5
langchain/agents/conversational/output_parser.py +4 -2
langchain/agents/conversational/prompt.py +2 -3
langchain/agents/conversational_chat/base.py +7 -5
langchain/agents/conversational_chat/output_parser.py +9 -11
langchain/agents/conversational_chat/prompt.py +5 -6
langchain/agents/format_scratchpad/__init__.py +3 -3
langchain/agents/format_scratchpad/log_to_messages.py +1 -1
langchain/agents/format_scratchpad/openai_functions.py +8 -6
langchain/agents/format_scratchpad/tools.py +5 -3
langchain/agents/format_scratchpad/xml.py +33 -2
langchain/agents/initialize.py +16 -8
langchain/agents/json_chat/base.py +18 -18
langchain/agents/json_chat/prompt.py +2 -3
langchain/agents/load_tools.py +2 -1
langchain/agents/loading.py +28 -18
langchain/agents/mrkl/base.py +9 -4
langchain/agents/mrkl/output_parser.py +17 -13
langchain/agents/mrkl/prompt.py +1 -2
langchain/agents/openai_assistant/base.py +80 -70
langchain/agents/openai_functions_agent/base.py +46 -37
langchain/agents/openai_functions_multi_agent/base.py +39 -26
langchain/agents/openai_tools/base.py +8 -8
langchain/agents/output_parsers/__init__.py +3 -3
langchain/agents/output_parsers/json.py +6 -6
langchain/agents/output_parsers/openai_functions.py +15 -7
langchain/agents/output_parsers/openai_tools.py +9 -4
langchain/agents/output_parsers/react_json_single_input.py +10 -5
langchain/agents/output_parsers/react_single_input.py +15 -11
langchain/agents/output_parsers/self_ask.py +3 -2
langchain/agents/output_parsers/tools.py +18 -13
langchain/agents/output_parsers/xml.py +99 -28
langchain/agents/react/agent.py +4 -4
langchain/agents/react/base.py +22 -17
langchain/agents/react/output_parser.py +5 -6
langchain/agents/react/textworld_prompt.py +0 -1
langchain/agents/react/wiki_prompt.py +14 -15
langchain/agents/schema.py +3 -2
langchain/agents/self_ask_with_search/base.py +19 -15
langchain/agents/self_ask_with_search/prompt.py +0 -1
langchain/agents/structured_chat/base.py +14 -11
langchain/agents/structured_chat/output_parser.py +16 -18
langchain/agents/structured_chat/prompt.py +3 -4
langchain/agents/tool_calling_agent/base.py +7 -6
langchain/agents/tools.py +2 -2
langchain/agents/utils.py +2 -3
langchain/agents/xml/base.py +5 -5
langchain/agents/xml/prompt.py +1 -2
langchain/cache.py +12 -12
langchain/callbacks/__init__.py +11 -11
langchain/callbacks/aim_callback.py +2 -2
langchain/callbacks/argilla_callback.py +1 -1
langchain/callbacks/arize_callback.py +1 -1
langchain/callbacks/arthur_callback.py +1 -1
langchain/callbacks/base.py +7 -7
langchain/callbacks/clearml_callback.py +1 -1
langchain/callbacks/comet_ml_callback.py +1 -1
langchain/callbacks/confident_callback.py +1 -1
langchain/callbacks/context_callback.py +1 -1
langchain/callbacks/flyte_callback.py +1 -1
langchain/callbacks/human.py +2 -2
langchain/callbacks/infino_callback.py +1 -1
langchain/callbacks/labelstudio_callback.py +1 -1
langchain/callbacks/llmonitor_callback.py +1 -1
langchain/callbacks/manager.py +5 -5
langchain/callbacks/mlflow_callback.py +2 -2
langchain/callbacks/openai_info.py +1 -1
langchain/callbacks/promptlayer_callback.py +1 -1
langchain/callbacks/sagemaker_callback.py +1 -1
langchain/callbacks/streaming_aiter.py +4 -1
langchain/callbacks/streaming_aiter_final_only.py +5 -3
langchain/callbacks/streaming_stdout_final_only.py +5 -3
langchain/callbacks/streamlit/__init__.py +3 -2
langchain/callbacks/streamlit/mutable_expander.py +1 -1
langchain/callbacks/streamlit/streamlit_callback_handler.py +3 -3
langchain/callbacks/tracers/__init__.py +1 -1
langchain/callbacks/tracers/comet.py +1 -1
langchain/callbacks/tracers/evaluation.py +1 -1
langchain/callbacks/tracers/log_stream.py +1 -1
langchain/callbacks/tracers/logging.py +1 -1
langchain/callbacks/tracers/stdout.py +1 -1
langchain/callbacks/trubrics_callback.py +1 -1
langchain/callbacks/utils.py +4 -4
langchain/callbacks/wandb_callback.py +1 -1
langchain/callbacks/whylabs_callback.py +1 -1
langchain/chains/api/base.py +36 -22
langchain/chains/api/news_docs.py +1 -2
langchain/chains/api/open_meteo_docs.py +1 -2
langchain/chains/api/openapi/requests_chain.py +1 -1
langchain/chains/api/openapi/response_chain.py +1 -1
langchain/chains/api/podcast_docs.py +1 -2
langchain/chains/api/prompt.py +1 -2
langchain/chains/api/tmdb_docs.py +1 -2
langchain/chains/base.py +88 -54
langchain/chains/chat_vector_db/prompts.py +2 -3
langchain/chains/combine_documents/__init__.py +1 -1
langchain/chains/combine_documents/base.py +23 -10
langchain/chains/combine_documents/map_reduce.py +38 -30
langchain/chains/combine_documents/map_rerank.py +33 -20
langchain/chains/combine_documents/reduce.py +47 -26
langchain/chains/combine_documents/refine.py +26 -17
langchain/chains/combine_documents/stuff.py +19 -12
langchain/chains/constitutional_ai/base.py +4 -4
langchain/chains/constitutional_ai/principles.py +22 -25
langchain/chains/constitutional_ai/prompts.py +25 -28
langchain/chains/conversation/base.py +5 -3
langchain/chains/conversation/memory.py +5 -5
langchain/chains/conversation/prompt.py +5 -5
langchain/chains/conversational_retrieval/base.py +41 -20
langchain/chains/conversational_retrieval/prompts.py +2 -3
langchain/chains/elasticsearch_database/base.py +8 -9
langchain/chains/elasticsearch_database/prompts.py +2 -3
langchain/chains/ernie_functions/__init__.py +2 -2
langchain/chains/example_generator.py +3 -1
langchain/chains/flare/base.py +26 -12
langchain/chains/graph_qa/cypher.py +2 -2
langchain/chains/graph_qa/falkordb.py +1 -1
langchain/chains/graph_qa/gremlin.py +1 -1
langchain/chains/graph_qa/neptune_sparql.py +1 -1
langchain/chains/graph_qa/prompts.py +2 -2
langchain/chains/history_aware_retriever.py +2 -1
langchain/chains/hyde/base.py +6 -5
langchain/chains/hyde/prompts.py +5 -6
langchain/chains/llm.py +77 -61
langchain/chains/llm_bash/__init__.py +2 -1
langchain/chains/llm_checker/base.py +7 -5
langchain/chains/llm_checker/prompt.py +3 -4
langchain/chains/llm_math/base.py +16 -9
langchain/chains/llm_math/prompt.py +1 -2
langchain/chains/llm_summarization_checker/base.py +9 -6
langchain/chains/llm_symbolic_math/__init__.py +2 -1
langchain/chains/loading.py +151 -95
langchain/chains/mapreduce.py +4 -3
langchain/chains/moderation.py +8 -9
langchain/chains/natbot/base.py +8 -8
langchain/chains/natbot/crawler.py +73 -76
langchain/chains/natbot/prompt.py +2 -3
langchain/chains/openai_functions/__init__.py +7 -7
langchain/chains/openai_functions/base.py +13 -10
langchain/chains/openai_functions/citation_fuzzy_match.py +12 -11
langchain/chains/openai_functions/extraction.py +19 -19
langchain/chains/openai_functions/openapi.py +35 -35
langchain/chains/openai_functions/qa_with_structure.py +19 -12
langchain/chains/openai_functions/tagging.py +2 -4
langchain/chains/openai_tools/extraction.py +7 -8
langchain/chains/qa_generation/base.py +4 -3
langchain/chains/qa_generation/prompt.py +5 -5
langchain/chains/qa_with_sources/base.py +14 -6
langchain/chains/qa_with_sources/loading.py +16 -8
langchain/chains/qa_with_sources/map_reduce_prompt.py +8 -9
langchain/chains/qa_with_sources/refine_prompts.py +0 -1
langchain/chains/qa_with_sources/retrieval.py +14 -5
langchain/chains/qa_with_sources/stuff_prompt.py +6 -7
langchain/chains/qa_with_sources/vector_db.py +17 -6
langchain/chains/query_constructor/base.py +34 -33
langchain/chains/query_constructor/ir.py +4 -4
langchain/chains/query_constructor/parser.py +37 -32
langchain/chains/query_constructor/prompt.py +5 -6
langchain/chains/question_answering/chain.py +21 -10
langchain/chains/question_answering/map_reduce_prompt.py +14 -14
langchain/chains/question_answering/map_rerank_prompt.py +3 -3
langchain/chains/question_answering/refine_prompts.py +2 -5
langchain/chains/question_answering/stuff_prompt.py +5 -5
langchain/chains/retrieval.py +1 -3
langchain/chains/retrieval_qa/base.py +34 -27
langchain/chains/retrieval_qa/prompt.py +1 -2
langchain/chains/router/__init__.py +3 -3
langchain/chains/router/base.py +24 -20
langchain/chains/router/embedding_router.py +12 -8
langchain/chains/router/llm_router.py +17 -16
langchain/chains/router/multi_prompt.py +2 -2
langchain/chains/router/multi_retrieval_qa.py +10 -5
langchain/chains/sequential.py +30 -18
langchain/chains/sql_database/prompt.py +14 -16
langchain/chains/sql_database/query.py +6 -5
langchain/chains/structured_output/__init__.py +1 -1
langchain/chains/structured_output/base.py +75 -67
langchain/chains/summarize/chain.py +11 -5
langchain/chains/summarize/map_reduce_prompt.py +0 -1
langchain/chains/summarize/stuff_prompt.py +0 -1
langchain/chains/transform.py +5 -6
langchain/chat_loaders/facebook_messenger.py +1 -1
langchain/chat_loaders/langsmith.py +1 -1
langchain/chat_loaders/utils.py +3 -3
langchain/chat_models/__init__.py +20 -19
langchain/chat_models/anthropic.py +1 -1
langchain/chat_models/azureml_endpoint.py +1 -1
langchain/chat_models/baidu_qianfan_endpoint.py +1 -1
langchain/chat_models/base.py +160 -123
langchain/chat_models/bedrock.py +1 -1
langchain/chat_models/fake.py +1 -1
langchain/chat_models/meta.py +1 -1
langchain/chat_models/pai_eas_endpoint.py +1 -1
langchain/chat_models/promptlayer_openai.py +1 -1
langchain/chat_models/volcengine_maas.py +1 -1
langchain/docstore/base.py +1 -1
langchain/document_loaders/__init__.py +9 -9
langchain/document_loaders/airbyte.py +3 -3
langchain/document_loaders/assemblyai.py +1 -1
langchain/document_loaders/azure_blob_storage_container.py +1 -1
langchain/document_loaders/azure_blob_storage_file.py +1 -1
langchain/document_loaders/baiducloud_bos_file.py +1 -1
langchain/document_loaders/base.py +1 -1
langchain/document_loaders/blob_loaders/__init__.py +1 -1
langchain/document_loaders/blockchain.py +1 -1
langchain/document_loaders/chatgpt.py +1 -1
langchain/document_loaders/college_confidential.py +1 -1
langchain/document_loaders/confluence.py +1 -1
langchain/document_loaders/email.py +1 -1
langchain/document_loaders/facebook_chat.py +1 -1
langchain/document_loaders/markdown.py +1 -1
langchain/document_loaders/notebook.py +1 -1
langchain/document_loaders/org_mode.py +1 -1
langchain/document_loaders/parsers/__init__.py +1 -1
langchain/document_loaders/parsers/docai.py +1 -1
langchain/document_loaders/parsers/generic.py +1 -1
langchain/document_loaders/parsers/html/__init__.py +1 -1
langchain/document_loaders/parsers/html/bs4.py +1 -1
langchain/document_loaders/parsers/language/cobol.py +1 -1
langchain/document_loaders/parsers/language/python.py +1 -1
langchain/document_loaders/parsers/msword.py +1 -1
langchain/document_loaders/parsers/pdf.py +5 -5
langchain/document_loaders/parsers/registry.py +1 -1
langchain/document_loaders/pdf.py +8 -8
langchain/document_loaders/powerpoint.py +1 -1
langchain/document_loaders/pyspark_dataframe.py +1 -1
langchain/document_loaders/telegram.py +2 -2
langchain/document_loaders/tencent_cos_directory.py +1 -1
langchain/document_loaders/unstructured.py +5 -5
langchain/document_loaders/url_playwright.py +1 -1
langchain/document_loaders/whatsapp_chat.py +1 -1
langchain/document_loaders/youtube.py +2 -2
langchain/document_transformers/__init__.py +3 -3
langchain/document_transformers/beautiful_soup_transformer.py +1 -1
langchain/document_transformers/doctran_text_extract.py +1 -1
langchain/document_transformers/doctran_text_qa.py +1 -1
langchain/document_transformers/doctran_text_translate.py +1 -1
langchain/document_transformers/embeddings_redundant_filter.py +3 -3
langchain/document_transformers/google_translate.py +1 -1
langchain/document_transformers/html2text.py +1 -1
langchain/document_transformers/nuclia_text_transform.py +1 -1
langchain/embeddings/__init__.py +5 -5
langchain/embeddings/base.py +33 -24
langchain/embeddings/cache.py +36 -31
langchain/embeddings/fake.py +1 -1
langchain/embeddings/huggingface.py +2 -2
langchain/evaluation/__init__.py +22 -22
langchain/evaluation/agents/trajectory_eval_chain.py +23 -23
langchain/evaluation/agents/trajectory_eval_prompt.py +6 -9
langchain/evaluation/comparison/__init__.py +1 -1
langchain/evaluation/comparison/eval_chain.py +20 -13
langchain/evaluation/comparison/prompt.py +1 -2
langchain/evaluation/criteria/__init__.py +1 -1
langchain/evaluation/criteria/eval_chain.py +20 -11
langchain/evaluation/criteria/prompt.py +2 -3
langchain/evaluation/embedding_distance/base.py +23 -20
langchain/evaluation/loading.py +15 -11
langchain/evaluation/parsing/base.py +4 -1
langchain/evaluation/parsing/json_distance.py +5 -2
langchain/evaluation/parsing/json_schema.py +12 -8
langchain/evaluation/qa/__init__.py +1 -1
langchain/evaluation/qa/eval_chain.py +12 -5
langchain/evaluation/qa/eval_prompt.py +7 -8
langchain/evaluation/qa/generate_chain.py +2 -1
langchain/evaluation/qa/generate_prompt.py +2 -4
langchain/evaluation/schema.py +38 -30
langchain/evaluation/scoring/__init__.py +1 -1
langchain/evaluation/scoring/eval_chain.py +22 -15
langchain/evaluation/scoring/prompt.py +0 -1
langchain/evaluation/string_distance/base.py +14 -9
langchain/globals.py +12 -11
langchain/graphs/__init__.py +6 -6
langchain/graphs/graph_document.py +1 -1
langchain/graphs/networkx_graph.py +2 -2
langchain/hub.py +9 -11
langchain/indexes/__init__.py +3 -3
langchain/indexes/_sql_record_manager.py +63 -46
langchain/indexes/prompts/entity_extraction.py +1 -2
langchain/indexes/prompts/entity_summarization.py +1 -2
langchain/indexes/prompts/knowledge_triplet_extraction.py +1 -3
langchain/indexes/vectorstore.py +35 -19
langchain/llms/__init__.py +13 -13
langchain/llms/ai21.py +1 -1
langchain/llms/azureml_endpoint.py +4 -4
langchain/llms/base.py +15 -7
langchain/llms/bedrock.py +1 -1
langchain/llms/cloudflare_workersai.py +1 -1
langchain/llms/gradient_ai.py +1 -1
langchain/llms/loading.py +1 -1
langchain/llms/openai.py +1 -1
langchain/llms/sagemaker_endpoint.py +1 -1
langchain/load/dump.py +1 -1
langchain/load/load.py +1 -1
langchain/load/serializable.py +3 -3
langchain/memory/__init__.py +3 -3
langchain/memory/buffer.py +9 -7
langchain/memory/chat_memory.py +14 -8
langchain/memory/chat_message_histories/__init__.py +1 -1
langchain/memory/chat_message_histories/astradb.py +1 -1
langchain/memory/chat_message_histories/cassandra.py +1 -1
langchain/memory/chat_message_histories/cosmos_db.py +1 -1
langchain/memory/chat_message_histories/dynamodb.py +1 -1
langchain/memory/chat_message_histories/elasticsearch.py +1 -1
langchain/memory/chat_message_histories/file.py +1 -1
langchain/memory/chat_message_histories/firestore.py +1 -1
langchain/memory/chat_message_histories/momento.py +1 -1
langchain/memory/chat_message_histories/mongodb.py +1 -1
langchain/memory/chat_message_histories/neo4j.py +1 -1
langchain/memory/chat_message_histories/postgres.py +1 -1
langchain/memory/chat_message_histories/redis.py +1 -1
langchain/memory/chat_message_histories/rocksetdb.py +1 -1
langchain/memory/chat_message_histories/singlestoredb.py +1 -1
langchain/memory/chat_message_histories/streamlit.py +1 -1
langchain/memory/chat_message_histories/upstash_redis.py +1 -1
langchain/memory/chat_message_histories/xata.py +1 -1
langchain/memory/chat_message_histories/zep.py +1 -1
langchain/memory/combined.py +13 -12
langchain/memory/entity.py +84 -61
langchain/memory/prompt.py +10 -11
langchain/memory/readonly.py +0 -2
langchain/memory/simple.py +1 -3
langchain/memory/summary.py +13 -11
langchain/memory/summary_buffer.py +17 -8
langchain/memory/utils.py +3 -2
langchain/memory/vectorstore.py +12 -5
langchain/memory/vectorstore_token_buffer_memory.py +5 -5
langchain/model_laboratory.py +12 -11
langchain/output_parsers/__init__.py +4 -4
langchain/output_parsers/boolean.py +7 -4
langchain/output_parsers/combining.py +10 -5
langchain/output_parsers/datetime.py +32 -31
langchain/output_parsers/enum.py +5 -3
langchain/output_parsers/fix.py +52 -52
langchain/output_parsers/format_instructions.py +6 -8
langchain/output_parsers/json.py +2 -2
langchain/output_parsers/list.py +2 -2
langchain/output_parsers/loading.py +9 -9
langchain/output_parsers/openai_functions.py +3 -3
langchain/output_parsers/openai_tools.py +1 -1
langchain/output_parsers/pandas_dataframe.py +43 -47
langchain/output_parsers/prompts.py +1 -2
langchain/output_parsers/rail_parser.py +1 -1
langchain/output_parsers/regex.py +7 -8
langchain/output_parsers/regex_dict.py +7 -10
langchain/output_parsers/retry.py +77 -78
langchain/output_parsers/structured.py +11 -6
langchain/output_parsers/yaml.py +15 -11
langchain/prompts/__init__.py +5 -3
langchain/prompts/base.py +5 -5
langchain/prompts/chat.py +8 -8
langchain/prompts/example_selector/__init__.py +3 -1
langchain/prompts/example_selector/semantic_similarity.py +2 -2
langchain/prompts/few_shot.py +1 -1
langchain/prompts/loading.py +3 -3
langchain/prompts/prompt.py +1 -1
langchain/retrievers/__init__.py +5 -5
langchain/retrievers/bedrock.py +2 -2
langchain/retrievers/bm25.py +1 -1
langchain/retrievers/contextual_compression.py +14 -8
langchain/retrievers/docarray.py +1 -1
langchain/retrievers/document_compressors/__init__.py +5 -4
langchain/retrievers/document_compressors/base.py +12 -6
langchain/retrievers/document_compressors/chain_extract.py +2 -2
langchain/retrievers/document_compressors/chain_extract_prompt.py +2 -3
langchain/retrievers/document_compressors/chain_filter.py +9 -9
langchain/retrievers/document_compressors/chain_filter_prompt.py +1 -2
langchain/retrievers/document_compressors/cohere_rerank.py +15 -15
langchain/retrievers/document_compressors/embeddings_filter.py +21 -17
langchain/retrievers/document_compressors/flashrank_rerank.py +1 -1
langchain/retrievers/document_compressors/listwise_rerank.py +7 -5
langchain/retrievers/ensemble.py +28 -25
langchain/retrievers/google_cloud_documentai_warehouse.py +1 -1
langchain/retrievers/google_vertex_ai_search.py +2 -2
langchain/retrievers/kendra.py +10 -10
langchain/retrievers/llama_index.py +1 -1
langchain/retrievers/merger_retriever.py +11 -11
langchain/retrievers/milvus.py +1 -1
langchain/retrievers/multi_query.py +32 -26
langchain/retrievers/multi_vector.py +20 -8
langchain/retrievers/parent_document_retriever.py +18 -9
langchain/retrievers/re_phraser.py +6 -5
langchain/retrievers/self_query/base.py +138 -127
langchain/retrievers/time_weighted_retriever.py +18 -7
langchain/retrievers/zilliz.py +1 -1
langchain/runnables/openai_functions.py +6 -2
langchain/schema/__init__.py +23 -23
langchain/schema/cache.py +1 -1
langchain/schema/callbacks/base.py +7 -7
langchain/schema/callbacks/manager.py +19 -19
langchain/schema/callbacks/tracers/base.py +1 -1
langchain/schema/callbacks/tracers/evaluation.py +1 -1
langchain/schema/callbacks/tracers/langchain.py +1 -1
langchain/schema/callbacks/tracers/langchain_v1.py +1 -1
langchain/schema/callbacks/tracers/log_stream.py +1 -1
langchain/schema/callbacks/tracers/schemas.py +8 -8
langchain/schema/callbacks/tracers/stdout.py +3 -3
langchain/schema/document.py +1 -1
langchain/schema/language_model.py +2 -2
langchain/schema/messages.py +12 -12
langchain/schema/output.py +3 -3
langchain/schema/output_parser.py +3 -3
langchain/schema/runnable/__init__.py +3 -3
langchain/schema/runnable/base.py +9 -9
langchain/schema/runnable/config.py +5 -5
langchain/schema/runnable/configurable.py +1 -1
langchain/schema/runnable/history.py +1 -1
langchain/schema/runnable/passthrough.py +1 -1
langchain/schema/runnable/utils.py +16 -16
langchain/schema/vectorstore.py +1 -1
langchain/smith/__init__.py +1 -1
langchain/smith/evaluation/__init__.py +2 -2
langchain/smith/evaluation/config.py +10 -7
langchain/smith/evaluation/name_generation.py +3 -3
langchain/smith/evaluation/progress.py +11 -2
langchain/smith/evaluation/runner_utils.py +179 -127
langchain/smith/evaluation/string_run_evaluator.py +75 -68
langchain/storage/__init__.py +2 -2
langchain/storage/_lc_store.py +4 -2
langchain/storage/encoder_backed.py +6 -2
langchain/storage/file_system.py +19 -16
langchain/storage/in_memory.py +1 -1
langchain/storage/upstash_redis.py +1 -1
langchain/text_splitter.py +15 -15
langchain/tools/__init__.py +28 -26
langchain/tools/ainetwork/app.py +1 -1
langchain/tools/ainetwork/base.py +1 -1
langchain/tools/ainetwork/owner.py +1 -1
langchain/tools/ainetwork/rule.py +1 -1
langchain/tools/ainetwork/transfer.py +1 -1
langchain/tools/ainetwork/value.py +1 -1
langchain/tools/amadeus/closest_airport.py +1 -1
langchain/tools/amadeus/flight_search.py +1 -1
langchain/tools/azure_cognitive_services/__init__.py +1 -1
langchain/tools/base.py +4 -4
langchain/tools/bearly/tool.py +1 -1
langchain/tools/bing_search/__init__.py +1 -1
langchain/tools/bing_search/tool.py +1 -1
langchain/tools/dataforseo_api_search/__init__.py +1 -1
langchain/tools/dataforseo_api_search/tool.py +1 -1
langchain/tools/ddg_search/tool.py +1 -1
langchain/tools/e2b_data_analysis/tool.py +2 -2
langchain/tools/edenai/__init__.py +1 -1
langchain/tools/file_management/__init__.py +1 -1
langchain/tools/file_management/copy.py +1 -1
langchain/tools/file_management/delete.py +1 -1
langchain/tools/gmail/__init__.py +2 -2
langchain/tools/gmail/get_message.py +1 -1
langchain/tools/gmail/search.py +1 -1
langchain/tools/gmail/send_message.py +1 -1
langchain/tools/google_finance/__init__.py +1 -1
langchain/tools/google_finance/tool.py +1 -1
langchain/tools/google_scholar/__init__.py +1 -1
langchain/tools/google_scholar/tool.py +1 -1
langchain/tools/google_search/__init__.py +1 -1
langchain/tools/google_search/tool.py +1 -1
langchain/tools/google_serper/__init__.py +1 -1
langchain/tools/google_serper/tool.py +1 -1
langchain/tools/google_trends/__init__.py +1 -1
langchain/tools/google_trends/tool.py +1 -1
langchain/tools/jira/tool.py +20 -1
langchain/tools/json/tool.py +25 -3
langchain/tools/memorize/tool.py +1 -1
langchain/tools/multion/__init__.py +1 -1
langchain/tools/multion/update_session.py +1 -1
langchain/tools/office365/__init__.py +2 -2
langchain/tools/office365/events_search.py +1 -1
langchain/tools/office365/messages_search.py +1 -1
langchain/tools/office365/send_event.py +1 -1
langchain/tools/office365/send_message.py +1 -1
langchain/tools/openapi/utils/api_models.py +6 -6
langchain/tools/playwright/__init__.py +5 -5
langchain/tools/playwright/click.py +1 -1
langchain/tools/playwright/extract_hyperlinks.py +1 -1
langchain/tools/playwright/get_elements.py +1 -1
langchain/tools/playwright/navigate.py +1 -1
langchain/tools/plugin.py +2 -2
langchain/tools/powerbi/tool.py +1 -1
langchain/tools/python/__init__.py +2 -1
langchain/tools/reddit_search/tool.py +1 -1
langchain/tools/render.py +2 -2
langchain/tools/requests/tool.py +2 -2
langchain/tools/searchapi/tool.py +1 -1
langchain/tools/searx_search/tool.py +1 -1
langchain/tools/slack/get_message.py +1 -1
langchain/tools/spark_sql/tool.py +1 -1
langchain/tools/sql_database/tool.py +1 -1
langchain/tools/tavily_search/__init__.py +1 -1
langchain/tools/tavily_search/tool.py +1 -1
langchain/tools/zapier/__init__.py +1 -1
langchain/tools/zapier/tool.py +24 -2
langchain/utilities/__init__.py +4 -4
langchain/utilities/arcee.py +4 -4
langchain/utilities/clickup.py +4 -4
langchain/utilities/dalle_image_generator.py +1 -1
langchain/utilities/dataforseo_api_search.py +1 -1
langchain/utilities/opaqueprompts.py +1 -1
langchain/utilities/reddit_search.py +1 -1
langchain/utilities/sql_database.py +1 -1
langchain/utilities/tavily_search.py +1 -1
langchain/utilities/vertexai.py +2 -2
langchain/utils/__init__.py +1 -1
langchain/utils/aiter.py +1 -1
langchain/utils/html.py +3 -3
langchain/utils/input.py +1 -1
langchain/utils/iter.py +1 -1
langchain/utils/json_schema.py +1 -3
langchain/utils/strings.py +1 -1
langchain/utils/utils.py +6 -6
langchain/vectorstores/__init__.py +5 -5
langchain/vectorstores/alibabacloud_opensearch.py +1 -1
langchain/vectorstores/azure_cosmos_db.py +1 -1
langchain/vectorstores/clickhouse.py +1 -1
langchain/vectorstores/elastic_vector_search.py +1 -1
langchain/vectorstores/elasticsearch.py +2 -2
langchain/vectorstores/myscale.py +1 -1
langchain/vectorstores/neo4j_vector.py +1 -1
langchain/vectorstores/pgembedding.py +1 -1
langchain/vectorstores/qdrant.py +1 -1
langchain/vectorstores/redis/__init__.py +1 -1
langchain/vectorstores/redis/base.py +1 -1
langchain/vectorstores/redis/filters.py +4 -4
langchain/vectorstores/redis/schema.py +6 -6
langchain/vectorstores/sklearn.py +2 -2
langchain/vectorstores/starrocks.py +1 -1
langchain/vectorstores/utils.py +1 -1
{langchain-0.3.26.dist-info → langchain-0.3.27.dist-info}/METADATA +4 -4
{langchain-0.3.26.dist-info → langchain-0.3.27.dist-info}/RECORD +580 -580
{langchain-0.3.26.dist-info → langchain-0.3.27.dist-info}/WHEEL +1 -1
{langchain-0.3.26.dist-info → langchain-0.3.27.dist-info}/entry_points.txt +0 -0
{langchain-0.3.26.dist-info → langchain-0.3.27.dist-info}/licenses/LICENSE +0 -0

langchain/smith/evaluation/runner_utils.py (changed)

@@ -98,10 +98,8 @@ class TestResult(dict):
         to_drop = [
             col
             for col in df.columns
-            if col.startswith("inputs.")
-            or col.startswith("outputs.")
+            if col.startswith(("inputs.", "outputs.", "reference"))
             or col in {"input", "output"}
-            or col.startswith("reference")
         ]
         return df.describe(include="all").drop(to_drop, axis=1)
@@ -110,10 +108,11 @@ class TestResult(dict):
         try:
             import pandas as pd
         except ImportError as e:
-            raise ImportError(
+            msg = (
                 "Pandas is required to convert the results to a dataframe."
                 " to install pandas, run `pip install pandas`."
-            ) from e
+            )
+            raise ImportError(msg) from e
         indices = []
         records = []
@@ -134,7 +133,7 @@ class TestResult(dict):
             if "reference" in result:
                 if isinstance(result["reference"], dict):
                     r.update(
-                        {f"reference.{k}": v for k, v in result["reference"].items()}
+                        {f"reference.{k}": v for k, v in result["reference"].items()},
                     )
                 else:
                     r["reference"] = result["reference"]
@@ -144,7 +143,7 @@ class TestResult(dict):
                     "error": result.get("Error"),
                     "execution_time": result["execution_time"],
                     "run_id": result.get("run_id"),
-                }
+                },
             )
             records.append(r)
             indices.append(example_id)
@@ -161,8 +160,9 @@ class EvalError(dict):
     def __getattr__(self, name: str) -> Any:
         try:
             return self[name]
-        except KeyError:
-            raise AttributeError(f"'EvalError' object has no attribute '{name}'")
+        except KeyError as e:
+            msg = f"'EvalError' object has no attribute '{name}'"
+            raise AttributeError(msg) from e
 def _wrap_in_chain_factory(
@@ -176,7 +176,7 @@ def _wrap_in_chain_factory(
         chain_class = chain.__class__.__name__
         if llm_or_chain_factory.memory is not None:
             memory_class = chain.memory.__class__.__name__
-            raise ValueError(
+            msg = (
                 "Cannot directly evaluate a chain with stateful memory."
                 " To evaluate this chain, pass in a chain constructor"
                 " that initializes fresh memory each time it is called."
@@ -189,14 +189,15 @@ def _wrap_in_chain_factory(
                 "(memory=new_memory, ...)\n\n"
                 f'run_on_dataset("{dataset_name}", chain_constructor, ...)'
             )
+            raise ValueError(msg)
         return lambda: chain
-    elif isinstance(llm_or_chain_factory, BaseLanguageModel):
+    if isinstance(llm_or_chain_factory, BaseLanguageModel):
         return llm_or_chain_factory
-    elif isinstance(llm_or_chain_factory, Runnable):
+    if isinstance(llm_or_chain_factory, Runnable):
         # Memory may exist here, but it's not elegant to check all those cases.
         lcf = llm_or_chain_factory
         return lambda: lcf
-    elif callable(llm_or_chain_factory):
+    if callable(llm_or_chain_factory):
         if is_traceable_function(llm_or_chain_factory):
             runnable_ = as_runnable(cast(Callable, llm_or_chain_factory))
             return lambda: runnable_
@@ -206,7 +207,7 @@ def _wrap_in_chain_factory(
             # It's an arbitrary function, wrap it in a RunnableLambda
             user_func = cast(Callable, llm_or_chain_factory)
             sig = inspect.signature(user_func)
-            logger.info(f"Wrapping function {sig} as RunnableLambda.")
+            logger.info("Wrapping function %s as RunnableLambda.", sig)
             wrapped = RunnableLambda(user_func)
             return lambda: wrapped
         constructor = cast(Callable, llm_or_chain_factory)
@@ -214,15 +215,14 @@ def _wrap_in_chain_factory(
             # It's not uncommon to do an LLM constructor instead of raw LLM,
             # so we'll unpack it for the user.
             return _model
-        elif is_traceable_function(cast(Callable, _model)):
+        if is_traceable_function(cast(Callable, _model)):
             runnable_ = as_runnable(cast(Callable, _model))
             return lambda: runnable_
-        elif not isinstance(_model, Runnable):
+        if not isinstance(_model, Runnable):
             # This is unlikely to happen - a constructor for a model function
             return lambda: RunnableLambda(constructor)
-        else:
-            # Typical correct case
-            return constructor
+        # Typical correct case
+        return constructor
     return llm_or_chain_factory
@@ -238,23 +238,24 @@ def _get_prompt(inputs: dict[str, Any]) -> str:
         InputFormatError: If the input format is invalid.
     """
     if not inputs:
-        raise InputFormatError("Inputs should not be empty.")
+        msg = "Inputs should not be empty."
+        raise InputFormatError(msg)
     prompts = []
     if "prompt" in inputs:
         if not isinstance(inputs["prompt"], str):
-            raise InputFormatError(
-                f"Expected string for 'prompt', got {type(inputs['prompt']).__name__}"
-            )
+            msg = f"Expected string for 'prompt', got {type(inputs['prompt']).__name__}"
+            raise InputFormatError(msg)
         prompts = [inputs["prompt"]]
     elif "prompts" in inputs:
         if not isinstance(inputs["prompts"], list) or not all(
             isinstance(i, str) for i in inputs["prompts"]
         ):
-            raise InputFormatError(
+            msg = (
                 "Expected list of strings for 'prompts',"
                 f" got {type(inputs['prompts']).__name__}"
             )
+            raise InputFormatError(msg)
         prompts = inputs["prompts"]
     elif len(inputs) == 1:
         prompt_ = next(iter(inputs.values()))
@@ -263,17 +264,15 @@ def _get_prompt(inputs: dict[str, Any]) -> str:
         elif isinstance(prompt_, list) and all(isinstance(i, str) for i in prompt_):
             prompts = prompt_
         else:
-            raise InputFormatError(f"LLM Run expects string prompt input. Got {inputs}")
+            msg = f"LLM Run expects string prompt input. Got {inputs}"
+            raise InputFormatError(msg)
     else:
-        raise InputFormatError(
-            f"LLM Run expects 'prompt' or 'prompts' in inputs. Got {inputs}"
-        )
+        msg = f"LLM Run expects 'prompt' or 'prompts' in inputs. Got {inputs}"
+        raise InputFormatError(msg)
     if len(prompts) == 1:
         return prompts[0]
-    else:
-        raise InputFormatError(
-            f"LLM Run expects single prompt input. Got {len(prompts)} prompts."
-        )
+    msg = f"LLM Run expects single prompt input. Got {len(prompts)} prompts."
+    raise InputFormatError(msg)
 class ChatModelInput(TypedDict):
@@ -298,7 +297,8 @@ def _get_messages(inputs: dict[str, Any]) -> dict:
         InputFormatError: If the input format is invalid.
     """
     if not inputs:
-        raise InputFormatError("Inputs should not be empty.")
+        msg = "Inputs should not be empty."
+        raise InputFormatError(msg)
     input_copy = inputs.copy()
     if "messages" in inputs:
         input_copy["input"] = input_copy.pop("messages")
@@ -313,16 +313,17 @@ def _get_messages(inputs: dict[str, Any]) -> dict:
         if len(raw_messages) == 1:
             input_copy["input"] = messages_from_dict(raw_messages[0])
         else:
-            raise InputFormatError(
+            msg = (
                 "Batch messages not supported. Please provide a"
                 " single list of messages."
             )
+            raise InputFormatError(msg)
         return input_copy
-    else:
-        raise InputFormatError(
-            f"Chat Run expects single List[dict] or List[List[dict]] 'messages'"
-            f" input. Got {inputs}"
-        )
+    msg = (
+        f"Chat Run expects single List[dict] or List[List[dict]] 'messages'"
+        f" input. Got {inputs}"
+    )
+    raise InputFormatError(msg)
 ## Shared data validation utilities
@@ -336,20 +337,21 @@ def _validate_example_inputs_for_language_model(
             isinstance(prompt_input, list)
             and all(isinstance(msg, BaseMessage) for msg in prompt_input)
         ):
-            raise InputFormatError(
+            msg = (
                 "When using an input_mapper to prepare dataset example inputs"
                 " for an LLM or chat model, the output must a single string or"
                 " a list of chat messages."
                 f"\nGot: {prompt_input} of type {type(prompt_input)}."
             )
+            raise InputFormatError(msg)
     else:
         try:
             _get_prompt(first_example.inputs or {})
         except InputFormatError:
             try:
                 _get_messages(first_example.inputs or {})
-            except InputFormatError:
-                raise InputFormatError(
+            except InputFormatError as err2:
+                msg = (
                     "Example inputs do not match language model input format. "
                     "Expected a dictionary with messages or a single prompt."
                     f" Got: {first_example.inputs}"
@@ -357,6 +359,7 @@ def _validate_example_inputs_for_language_model(
                     " to convert the example.inputs to a compatible format"
                     " for the llm or chat model you wish to evaluate."
                 )
+                raise InputFormatError(msg) from err2
 def _validate_example_inputs_for_chain(
@@ -369,16 +372,18 @@ def _validate_example_inputs_for_chain(
         first_inputs = input_mapper(first_example.inputs or {})
         missing_keys = set(chain.input_keys).difference(first_inputs)
         if not isinstance(first_inputs, dict):
-            raise InputFormatError(
+            msg = (
                 "When using an input_mapper to prepare dataset example"
                 " inputs for a chain, the mapped value must be a dictionary."
                 f"\nGot: {first_inputs} of type {type(first_inputs)}."
             )
+            raise InputFormatError(msg)
         if missing_keys:
-            raise InputFormatError(
+            msg = (
                 "Missing keys after loading example using input_mapper."
                 f"\nExpected: {chain.input_keys}. Got: {first_inputs.keys()}"
             )
+            raise InputFormatError(msg)
     else:
         first_inputs = first_example.inputs
         missing_keys = set(chain.input_keys).difference(first_inputs)
@@ -387,13 +392,14 @@ def _validate_example_inputs_for_chain(
             # Refrain from calling to validate.
             pass
         elif missing_keys:
-            raise InputFormatError(
+            msg = (
                 "Example inputs missing expected chain input keys."
                 " Please provide an input_mapper to convert the example.inputs"
                 " to a compatible format for the chain you wish to evaluate."
                 f"Expected: {chain.input_keys}. "
                 f"Got: {first_inputs.keys()}"
             )
+            raise InputFormatError(msg)
 def _validate_example_inputs(
@@ -410,7 +416,7 @@ def _validate_example_inputs(
             # Otherwise it's a runnable
             _validate_example_inputs_for_chain(example, chain, input_mapper)
         elif isinstance(chain, Runnable):
-            logger.debug(f"Skipping input validation for {chain}")
+            logger.debug("Skipping input validation for %s", chain)
 ## Shared Evaluator Setup Utilities
@@ -455,16 +461,19 @@ def _determine_input_key(
         input_key = config.input_key
         if run_inputs and input_key not in run_inputs:
             logger.warning(
-                f"Input key {input_key} not in chain's specified"
-                f" input keys {run_inputs}. Evaluation behavior may be undefined."
+                "Input key %s not in chain's specified input keys %s. "
+                "Evaluation behavior may be undefined.",
+                input_key,
+                run_inputs,
             )
     elif run_inputs and len(run_inputs) == 1:
         input_key = run_inputs[0]
     elif run_inputs is not None and len(run_inputs) > 1:
         logger.warning(
-            f"Chain expects multiple input keys: {run_inputs},"
-            f" Evaluator is likely to fail. Evaluation behavior may be undefined."
-            " Specify an input_key in the RunEvalConfig to avoid this warning."
+            "Chain expects multiple input keys: %s,"
+            " Evaluator is likely to fail. Evaluation behavior may be undefined."
+            " Specify an input_key in the RunEvalConfig to avoid this warning.",
+            run_inputs,
         )
     return input_key
@@ -479,16 +488,19 @@ def _determine_prediction_key(
         prediction_key = config.prediction_key
         if run_outputs and prediction_key not in run_outputs:
             logger.warning(
-                f"Prediction key {prediction_key} not in chain's specified"
-                f" output keys {run_outputs}. Evaluation behavior may be undefined."
+                "Prediction key %s not in chain's specified output keys %s. "
+                "Evaluation behavior may be undefined.",
+                prediction_key,
+                run_outputs,
             )
     elif run_outputs and len(run_outputs) == 1:
         prediction_key = run_outputs[0]
     elif run_outputs is not None and len(run_outputs) > 1:
         logger.warning(
-            f"Chain expects multiple output keys: {run_outputs},"
-            f" Evaluation behavior may be undefined. Specify a prediction_key"
-            " in the RunEvalConfig to avoid this warning."
+            "Chain expects multiple output keys: %s,"
+            " Evaluation behavior may be undefined. Specify a prediction_key"
+            " in the RunEvalConfig to avoid this warning.",
+            run_outputs,
         )
     return prediction_key
@@ -500,12 +512,13 @@ def _determine_reference_key(
     if config.reference_key:
         reference_key = config.reference_key
         if example_outputs and reference_key not in example_outputs:
-            raise ValueError(
+            msg = (
                 f"Reference key {reference_key} not in Dataset"
                 f" example outputs: {example_outputs}"
             )
+            raise ValueError(msg)
     elif example_outputs and len(example_outputs) == 1:
-        reference_key = list(example_outputs)[0]
+        reference_key = next(iter(example_outputs))
     else:
         reference_key = None
     return reference_key
@@ -544,15 +557,17 @@ def _construct_run_evaluator(
         # Assume we can decorate
         return run_evaluator_dec(eval_config)
     else:
-        raise ValueError(f"Unknown evaluator type: {type(eval_config)}")
+        msg = f"Unknown evaluator type: {type(eval_config)}"
+        raise ValueError(msg)  # noqa: TRY004
     if isinstance(evaluator_, StringEvaluator):
         if evaluator_.requires_reference and reference_key is None:
-            raise ValueError(
+            msg = (
                 f"Must specify reference_key in smith_eval.RunEvalConfig to use"
                 f" evaluator of type {eval_type_tag} with"
                 f" dataset with multiple output keys: {example_outputs}."
             )
+            raise ValueError(msg)
         run_evaluator = smith_eval.StringRunEvaluatorChain.from_run_and_data_type(
             evaluator_,
             run_type,
@@ -563,18 +578,18 @@ def _construct_run_evaluator(
             tags=[eval_type_tag],
         )
     elif isinstance(evaluator_, PairwiseStringEvaluator):
-        raise NotImplementedError(
+        msg = (
             f"Run evaluator for {eval_type_tag} is not implemented."
             " PairwiseStringEvaluators compare the outputs of two different models"
             " rather than the output of a single model."
             " Did you mean to use a StringEvaluator instead?"
             "\nSee: https://python.langchain.com/docs/guides/evaluation/string/"
         )
+        raise NotImplementedError(msg)
     else:
-        raise NotImplementedError(
-            f"Run evaluator for {eval_type_tag} is not implemented"
-        )
+        msg = f"Run evaluator for {eval_type_tag} is not implemented"
+        raise NotImplementedError(msg)
     return run_evaluator
@@ -611,10 +626,13 @@ def _load_run_evaluators(
     input_key, prediction_key, reference_key = None, None, None
     if config.evaluators or (
         config.custom_evaluators
-        and any([isinstance(e, StringEvaluator) for e in config.custom_evaluators])
+        and any(isinstance(e, StringEvaluator) for e in config.custom_evaluators)
     ):
         input_key, prediction_key, reference_key = _get_keys(
-            config, run_inputs, run_outputs, example_outputs
+            config,
+            run_inputs,
+            run_outputs,
+            example_outputs,
         )
     for eval_config in config.evaluators:
         run_evaluator = _construct_run_evaluator(
@@ -641,15 +659,16 @@ def _load_run_evaluators(
                     input_key=input_key,
                     prediction_key=prediction_key,
                     reference_key=reference_key,
-                )
+                ),
             )
         elif callable(custom_evaluator):
             run_evaluators.append(run_evaluator_dec(custom_evaluator))
         else:
-            raise ValueError(
+            msg = (
                 f"Unsupported custom evaluator: {custom_evaluator}."
                 f" Expected RunEvaluator or StringEvaluator."
             )
+            raise ValueError(msg)  # noqa: TRY004
     return run_evaluators
@@ -683,41 +702,45 @@ async def _arun_llm(
     """
     if input_mapper is not None:
         prompt_or_messages = input_mapper(inputs)
-        if (
-            isinstance(prompt_or_messages, str)
-            or isinstance(prompt_or_messages, list)
+        if isinstance(prompt_or_messages, str) or (
+            isinstance(prompt_or_messages, list)
             and all(isinstance(msg, BaseMessage) for msg in prompt_or_messages)
         ):
             return await llm.ainvoke(
                 prompt_or_messages,
                 config=RunnableConfig(
-                    callbacks=callbacks, tags=tags or [], metadata=metadata or {}
+                    callbacks=callbacks,
+                    tags=tags or [],
+                    metadata=metadata or {},
                 ),
             )
-        else:
-            raise InputFormatError(
-                "Input mapper returned invalid format"
-                f" {prompt_or_messages}"
-                "\nExpected a single string or list of chat messages."
-            )
+        msg = (
+            "Input mapper returned invalid format"
+            f" {prompt_or_messages}"
+            "\nExpected a single string or list of chat messages."
+        )
+        raise InputFormatError(msg)
-    else:
-        try:
-            prompt = _get_prompt(inputs)
-            llm_output: Union[str, BaseMessage] = await llm.ainvoke(
-                prompt,
-                config=RunnableConfig(
-                    callbacks=callbacks, tags=tags or [], metadata=metadata or {}
-                ),
-            )
-        except InputFormatError:
-            llm_inputs = _get_messages(inputs)
-            llm_output = await llm.ainvoke(
-                **llm_inputs,
-                config=RunnableConfig(
-                    callbacks=callbacks, tags=tags or [], metadata=metadata or {}
-                ),
-            )
+    try:
+        prompt = _get_prompt(inputs)
+        llm_output: Union[str, BaseMessage] = await llm.ainvoke(
+            prompt,
+            config=RunnableConfig(
+                callbacks=callbacks,
+                tags=tags or [],
+                metadata=metadata or {},
+            ),
+        )
+    except InputFormatError:
+        llm_inputs = _get_messages(inputs)
+        llm_output = await llm.ainvoke(
+            **llm_inputs,
+            config=RunnableConfig(
+                callbacks=callbacks,
+                tags=tags or [],
+                metadata=metadata or {},
+            ),
+        )
     return llm_output
@@ -742,12 +765,16 @@ async def _arun_chain(
         output = await chain.ainvoke(
             val,
             config=RunnableConfig(
-                callbacks=callbacks, tags=tags or [], metadata=metadata or {}
+                callbacks=callbacks,
+                tags=tags or [],
+                metadata=metadata or {},
             ),
         )
     else:
         runnable_config = RunnableConfig(
-            tags=tags or [], callbacks=callbacks, metadata=metadata or {}
+            tags=tags or [],
+            callbacks=callbacks,
+            metadata=metadata or {},
         )
         output = await chain.ainvoke(inputs_, config=runnable_config)
     return output
@@ -799,9 +826,11 @@ async def _arun_llm_or_chain(
         result = output
     except Exception as e:
         logger.warning(
-            f"{chain_or_llm} failed for example {example.id} "
-            f"with inputs {example.inputs}"
-            f"\n{repr(e)}"
+            "%s failed for example %s with inputs %s\n%s",
+            chain_or_llm,
+            example.id,
+            example.inputs,
+            e,
         )
         result = EvalError(Error=e)
     return result
@@ -837,30 +866,34 @@ def _run_llm(
     # Most of this is legacy code; we could probably remove a lot of it.
     if input_mapper is not None:
         prompt_or_messages = input_mapper(inputs)
-        if (
-            isinstance(prompt_or_messages, str)
-            or isinstance(prompt_or_messages, list)
+        if isinstance(prompt_or_messages, str) or (
+            isinstance(prompt_or_messages, list)
             and all(isinstance(msg, BaseMessage) for msg in prompt_or_messages)
         ):
             llm_output: Union[str, BaseMessage] = llm.invoke(
                 prompt_or_messages,
                 config=RunnableConfig(
-                    callbacks=callbacks, tags=tags or [], metadata=metadata or {}
+                    callbacks=callbacks,
+                    tags=tags or [],
+                    metadata=metadata or {},
                 ),
             )
         else:
-            raise InputFormatError(
+            msg = (
                 "Input mapper returned invalid format: "
                 f" {prompt_or_messages}"
                 "\nExpected a single string or list of chat messages."
             )
+            raise InputFormatError(msg)
     else:
         try:
             llm_prompts = _get_prompt(inputs)
             llm_output = llm.invoke(
                 llm_prompts,
                 config=RunnableConfig(
-                    callbacks=callbacks, tags=tags or [], metadata=metadata or {}
+                    callbacks=callbacks,
+                    tags=tags or [],
+                    metadata=metadata or {},
                 ),
             )
         except InputFormatError:
@@ -893,12 +926,16 @@ def _run_chain(
         output = chain.invoke(
             val,
             config=RunnableConfig(
-                callbacks=callbacks, tags=tags or [], metadata=metadata or {}
+                callbacks=callbacks,
+                tags=tags or [],
+                metadata=metadata or {},
             ),
         )
     else:
         runnable_config = RunnableConfig(
-            tags=tags or [], callbacks=callbacks, metadata=metadata or {}
+            tags=tags or [],
+            callbacks=callbacks,
+            metadata=metadata or {},
         )
         output = chain.invoke(inputs_, config=runnable_config)
     return output
@@ -952,9 +989,12 @@ def _run_llm_or_chain(
     except Exception as e:
         error_type = type(e).__name__
         logger.warning(
-            f"{chain_or_llm} failed for example {example.id} "
-            f"with inputs {example.inputs}"
-            f"\nError Type: {error_type}, Message: {e}"
+            "%s failed for example %s with inputs %s\nError Type: %s, Message: %s",
+            chain_or_llm,
+            example.id,
+            example.inputs,
+            error_type,
+            e,
         )
         result = EvalError(Error=e)
     return result
@@ -974,7 +1014,8 @@ def _prepare_eval_run(
     examples = list(client.list_examples(dataset_id=dataset.id, as_of=dataset_version))
     if not examples:
-        raise ValueError(f"Dataset {dataset_name} has no example rows.")
+        msg = f"Dataset {dataset_name} has no example rows."
+        raise ValueError(msg)
     modified_at = [ex.modified_at for ex in examples if ex.modified_at]
     # Should always be defined in practice when fetched,
     # but the typing permits None
@@ -999,7 +1040,7 @@ def _prepare_eval_run(
         )
     except (HTTPError, ValueError, LangSmithError) as e:
         if "already exists " not in str(e):
-            raise e
+            raise
         uid = uuid.uuid4()
         example_msg = f"""
 run_on_dataset(
@@ -1007,10 +1048,11 @@ run_on_dataset(
     project_name="{project_name} - {uid}", # Update since {project_name} already exists
 )
 """
-        raise ValueError(
+        msg = (
             f"Test project {project_name} already exists. Please use a different name:"
             f"\n\n{example_msg}"
         )
+        raise ValueError(msg) from e
     comparison_url = dataset.url + f"/compare?selectedSessions={project.id}"
     print(  # noqa: T201
         f"View the evaluation results for project '{project_name}'"
@@ -1081,9 +1123,9 @@ class _DatasetRunContainer:
                         run_id=None,
                         project_id=self.project.id,
                     )
-                except Exception as e:
-                    logger.error(
-                        f"Error running batch evaluator {repr(evaluator)}: {e}"
+                except Exception:
+                    logger.exception(
+                        "Error running batch evaluator %s", repr(evaluator)
                     )
         return aggregate_feedback
@@ -1096,7 +1138,7 @@ class _DatasetRunContainer:
                     eval_results = callback.logged_eval_results
                     for (_, example_id), v in eval_results.items():
                         all_eval_results.setdefault(str(example_id), {}).update(
-                            {"feedback": v}
+                            {"feedback": v},
                         )
                 elif isinstance(callback, LangChainTracer):
                     run = callback.latest_run
@@ -1111,7 +1153,7 @@ class _DatasetRunContainer:
                             "execution_time": execution_time,
                             "run_id": run_id,
                             "run": run,
-                        }
+                        },
                     )
                     all_runs[str(callback.example_id)] = run
         return cast(dict[str, _RowResult], all_eval_results), all_runs
@@ -1134,21 +1176,26 @@ class _DatasetRunContainer:
             aggregate_metrics=aggregate_feedback,
         )
-    def finish(self, batch_results: list, verbose: bool = False) -> TestResult:
+    def finish(
+        self,
+        batch_results: list,
+        verbose: bool = False,  # noqa: FBT001,FBT002
+    ) -> TestResult:
         results = self._collect_test_results(batch_results)
         if verbose:
             try:
                 agg_feedback = results.get_aggregate_feedback()
                 _display_aggregate_results(agg_feedback)
             except Exception as e:
-                logger.debug(f"Failed to print aggregate feedback: {repr(e)}")
+                logger.debug("Failed to print aggregate feedback: %s", e, exc_info=True)
         try:
             # Closing the project permits name changing and metric optimizations
             self.client.update_project(
-                self.project.id, end_time=datetime.now(timezone.utc)
+                self.project.id,
+                end_time=datetime.now(timezone.utc),
             )
         except Exception as e:
-            logger.debug(f"Failed to close project: {repr(e)}")
+            logger.debug("Failed to close project: %s", e, exc_info=True)
         return results
     @classmethod
@@ -1188,7 +1235,10 @@ class _DatasetRunContainer:
             run_metadata["revision_id"] = revision_id
         wrapped_model = _wrap_in_chain_factory(llm_or_chain_factory)
         run_evaluators = _setup_evaluation(
-            wrapped_model, examples, evaluation, dataset.data_type or DataType.kv
+            wrapped_model,
+            examples,
+            evaluation,
+            dataset.data_type or DataType.kv,
         )
         _validate_example_inputs(examples[0], wrapped_model, input_mapper)
         progress_bar = progress.ProgressBarCallback(len(examples))
@@ -1242,7 +1292,8 @@ def _display_aggregate_results(aggregate_results: pd.DataFrame) -> None:
         display(aggregate_results)
     else:
         formatted_string = aggregate_results.to_string(
-            float_format=lambda x: f"{x:.2f}", justify="right"
+            float_format=lambda x: f"{x:.2f}",
+            justify="right",
         )
         print("\n Experiment Results:")  # noqa: T201
         print(formatted_string)  # noqa: T201
@@ -1401,7 +1452,7 @@ def run_on_dataset(
                     ),
                     container.examples,
                     container.configs,
-                )
+                ),
             )
     return container.finish(batch_results, verbose=verbose)
@@ -1516,5 +1567,6 @@ or LangSmith's `RunEvaluator` classes.
 """  # noqa: E501
 run_on_dataset.__doc__ = _RUN_ON_DATASET_DOCSTRING
 arun_on_dataset.__doc__ = _RUN_ON_DATASET_DOCSTRING.replace(
-    "run_on_dataset(", "await arun_on_dataset("
+    "run_on_dataset(",
+    "await arun_on_dataset(",
 )

langchain 0.3.26__py3-none-any.whl → 0.3.27__py3-none-any.whl

Potentially problematic release.

langchain 0.3.26__py3-none-any.whl → 0.3.27__py3-none-any.whl