langchain-core 0.4.0.dev0__py3-none-any.whl → 1.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- langchain_core/__init__.py +1 -1
- langchain_core/_api/__init__.py +3 -4
- langchain_core/_api/beta_decorator.py +45 -70
- langchain_core/_api/deprecation.py +80 -80
- langchain_core/_api/path.py +22 -8
- langchain_core/_import_utils.py +10 -4
- langchain_core/agents.py +25 -21
- langchain_core/caches.py +53 -63
- langchain_core/callbacks/__init__.py +1 -8
- langchain_core/callbacks/base.py +341 -348
- langchain_core/callbacks/file.py +55 -44
- langchain_core/callbacks/manager.py +546 -683
- langchain_core/callbacks/stdout.py +29 -30
- langchain_core/callbacks/streaming_stdout.py +35 -36
- langchain_core/callbacks/usage.py +65 -70
- langchain_core/chat_history.py +48 -55
- langchain_core/document_loaders/base.py +46 -21
- langchain_core/document_loaders/langsmith.py +39 -36
- langchain_core/documents/__init__.py +0 -1
- langchain_core/documents/base.py +96 -74
- langchain_core/documents/compressor.py +12 -9
- langchain_core/documents/transformers.py +29 -28
- langchain_core/embeddings/fake.py +56 -57
- langchain_core/env.py +2 -3
- langchain_core/example_selectors/base.py +12 -0
- langchain_core/example_selectors/length_based.py +1 -1
- langchain_core/example_selectors/semantic_similarity.py +21 -25
- langchain_core/exceptions.py +15 -9
- langchain_core/globals.py +4 -163
- langchain_core/indexing/api.py +132 -125
- langchain_core/indexing/base.py +64 -67
- langchain_core/indexing/in_memory.py +26 -6
- langchain_core/language_models/__init__.py +15 -27
- langchain_core/language_models/_utils.py +267 -117
- langchain_core/language_models/base.py +92 -177
- langchain_core/language_models/chat_models.py +547 -407
- langchain_core/language_models/fake.py +11 -11
- langchain_core/language_models/fake_chat_models.py +72 -118
- langchain_core/language_models/llms.py +168 -242
- langchain_core/load/dump.py +8 -11
- langchain_core/load/load.py +32 -28
- langchain_core/load/mapping.py +2 -4
- langchain_core/load/serializable.py +50 -56
- langchain_core/messages/__init__.py +36 -51
- langchain_core/messages/ai.py +377 -150
- langchain_core/messages/base.py +239 -47
- langchain_core/messages/block_translators/__init__.py +111 -0
- langchain_core/messages/block_translators/anthropic.py +470 -0
- langchain_core/messages/block_translators/bedrock.py +94 -0
- langchain_core/messages/block_translators/bedrock_converse.py +297 -0
- langchain_core/messages/block_translators/google_genai.py +530 -0
- langchain_core/messages/block_translators/google_vertexai.py +21 -0
- langchain_core/messages/block_translators/groq.py +143 -0
- langchain_core/messages/block_translators/langchain_v0.py +301 -0
- langchain_core/messages/block_translators/openai.py +1010 -0
- langchain_core/messages/chat.py +2 -3
- langchain_core/messages/content.py +1423 -0
- langchain_core/messages/function.py +7 -7
- langchain_core/messages/human.py +44 -38
- langchain_core/messages/modifier.py +3 -2
- langchain_core/messages/system.py +40 -27
- langchain_core/messages/tool.py +160 -58
- langchain_core/messages/utils.py +527 -638
- langchain_core/output_parsers/__init__.py +1 -14
- langchain_core/output_parsers/base.py +68 -104
- langchain_core/output_parsers/json.py +13 -17
- langchain_core/output_parsers/list.py +11 -33
- langchain_core/output_parsers/openai_functions.py +56 -74
- langchain_core/output_parsers/openai_tools.py +68 -109
- langchain_core/output_parsers/pydantic.py +15 -13
- langchain_core/output_parsers/string.py +6 -2
- langchain_core/output_parsers/transform.py +17 -60
- langchain_core/output_parsers/xml.py +34 -44
- langchain_core/outputs/__init__.py +1 -1
- langchain_core/outputs/chat_generation.py +26 -11
- langchain_core/outputs/chat_result.py +1 -3
- langchain_core/outputs/generation.py +17 -6
- langchain_core/outputs/llm_result.py +15 -8
- langchain_core/prompt_values.py +29 -123
- langchain_core/prompts/__init__.py +3 -27
- langchain_core/prompts/base.py +48 -63
- langchain_core/prompts/chat.py +259 -288
- langchain_core/prompts/dict.py +19 -11
- langchain_core/prompts/few_shot.py +84 -90
- langchain_core/prompts/few_shot_with_templates.py +14 -12
- langchain_core/prompts/image.py +19 -14
- langchain_core/prompts/loading.py +6 -8
- langchain_core/prompts/message.py +7 -8
- langchain_core/prompts/prompt.py +42 -43
- langchain_core/prompts/string.py +37 -16
- langchain_core/prompts/structured.py +43 -46
- langchain_core/rate_limiters.py +51 -60
- langchain_core/retrievers.py +52 -192
- langchain_core/runnables/base.py +1727 -1683
- langchain_core/runnables/branch.py +52 -73
- langchain_core/runnables/config.py +89 -103
- langchain_core/runnables/configurable.py +128 -130
- langchain_core/runnables/fallbacks.py +93 -82
- langchain_core/runnables/graph.py +127 -127
- langchain_core/runnables/graph_ascii.py +63 -41
- langchain_core/runnables/graph_mermaid.py +87 -70
- langchain_core/runnables/graph_png.py +31 -36
- langchain_core/runnables/history.py +145 -161
- langchain_core/runnables/passthrough.py +141 -144
- langchain_core/runnables/retry.py +84 -68
- langchain_core/runnables/router.py +33 -37
- langchain_core/runnables/schema.py +79 -72
- langchain_core/runnables/utils.py +95 -139
- langchain_core/stores.py +85 -131
- langchain_core/structured_query.py +11 -15
- langchain_core/sys_info.py +31 -32
- langchain_core/tools/__init__.py +1 -14
- langchain_core/tools/base.py +221 -247
- langchain_core/tools/convert.py +144 -161
- langchain_core/tools/render.py +10 -10
- langchain_core/tools/retriever.py +12 -19
- langchain_core/tools/simple.py +52 -29
- langchain_core/tools/structured.py +56 -60
- langchain_core/tracers/__init__.py +1 -9
- langchain_core/tracers/_streaming.py +6 -7
- langchain_core/tracers/base.py +103 -112
- langchain_core/tracers/context.py +29 -48
- langchain_core/tracers/core.py +142 -105
- langchain_core/tracers/evaluation.py +30 -34
- langchain_core/tracers/event_stream.py +162 -117
- langchain_core/tracers/langchain.py +34 -36
- langchain_core/tracers/log_stream.py +87 -49
- langchain_core/tracers/memory_stream.py +3 -3
- langchain_core/tracers/root_listeners.py +18 -34
- langchain_core/tracers/run_collector.py +8 -20
- langchain_core/tracers/schemas.py +0 -125
- langchain_core/tracers/stdout.py +3 -3
- langchain_core/utils/__init__.py +1 -4
- langchain_core/utils/_merge.py +47 -9
- langchain_core/utils/aiter.py +70 -66
- langchain_core/utils/env.py +12 -9
- langchain_core/utils/function_calling.py +139 -206
- langchain_core/utils/html.py +7 -8
- langchain_core/utils/input.py +6 -6
- langchain_core/utils/interactive_env.py +6 -2
- langchain_core/utils/iter.py +48 -45
- langchain_core/utils/json.py +14 -4
- langchain_core/utils/json_schema.py +159 -43
- langchain_core/utils/mustache.py +32 -25
- langchain_core/utils/pydantic.py +67 -40
- langchain_core/utils/strings.py +5 -5
- langchain_core/utils/usage.py +1 -1
- langchain_core/utils/utils.py +104 -62
- langchain_core/vectorstores/base.py +131 -179
- langchain_core/vectorstores/in_memory.py +113 -182
- langchain_core/vectorstores/utils.py +23 -17
- langchain_core/version.py +1 -1
- langchain_core-1.0.0.dist-info/METADATA +68 -0
- langchain_core-1.0.0.dist-info/RECORD +172 -0
- {langchain_core-0.4.0.dev0.dist-info → langchain_core-1.0.0.dist-info}/WHEEL +1 -1
- langchain_core/beta/__init__.py +0 -1
- langchain_core/beta/runnables/__init__.py +0 -1
- langchain_core/beta/runnables/context.py +0 -448
- langchain_core/memory.py +0 -116
- langchain_core/messages/content_blocks.py +0 -1435
- langchain_core/prompts/pipeline.py +0 -133
- langchain_core/pydantic_v1/__init__.py +0 -30
- langchain_core/pydantic_v1/dataclasses.py +0 -23
- langchain_core/pydantic_v1/main.py +0 -23
- langchain_core/tracers/langchain_v1.py +0 -23
- langchain_core/utils/loading.py +0 -31
- langchain_core/v1/__init__.py +0 -1
- langchain_core/v1/chat_models.py +0 -1047
- langchain_core/v1/messages.py +0 -755
- langchain_core-0.4.0.dev0.dist-info/METADATA +0 -108
- langchain_core-0.4.0.dev0.dist-info/RECORD +0 -177
- langchain_core-0.4.0.dev0.dist-info/entry_points.txt +0 -4
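The file-level diff reproduced below covers langchain_core/language_models/llms.py. The most mechanical change, repeated across nearly every hunk, is the move from `Optional[...]`/`Union[...]` annotations to PEP 604 unions (`X | None`). As a hedged illustration only (the `EchoLLM` class and its behaviour are hypothetical, not part of the package), a custom LLM subclass written against the 1.0.0 signatures shown below might look like this:

```python
from typing import Any

from langchain_core.callbacks import CallbackManagerForLLMRun
from langchain_core.language_models.llms import LLM


class EchoLLM(LLM):
    """Toy LLM that echoes the prompt, truncated at the first stop word."""

    @property
    def _llm_type(self) -> str:
        # Identifier used for serialization/tracing; required by BaseLLM.
        return "echo"

    def _call(
        self,
        prompt: str,
        stop: list[str] | None = None,  # 1.0-style union instead of Optional[list[str]]
        run_manager: CallbackManagerForLLMRun | None = None,
        **kwargs: Any,
    ) -> str:
        text = prompt
        for token in stop or []:
            # Cut the echoed text at the first occurrence of any stop substring.
            text = text.split(token)[0]
        return text


print(EchoLLM().invoke("hello world", stop=[" "]))  # prints "hello"
```

The `invoke`/`batch`/`stream` surface is unchanged by the hunks below; what changes is the annotations, the docstrings, and the removal of the long-deprecated call-style entry points (see the migration sketch after the diff).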
langchain_core/language_models/llms.py +168 -242

@@ -7,21 +7,17 @@ import functools
 import inspect
 import json
 import logging
-import warnings
 from abc import ABC, abstractmethod
-from collections.abc import AsyncIterator, Iterator, Sequence
+from collections.abc import AsyncIterator, Callable, Iterator, Sequence
 from pathlib import Path
 from typing import (
     TYPE_CHECKING,
     Any,
-    Callable,
-    Optional,
-    Union,
     cast,
 )

 import yaml
-from pydantic import ConfigDict, Field, model_validator
+from pydantic import ConfigDict
 from tenacity import (
     RetryCallState,
     before_sleep_log,
@@ -33,7 +29,6 @@ from tenacity import (
 )
 from typing_extensions import override

-from langchain_core._api import deprecated
 from langchain_core.caches import BaseCache
 from langchain_core.callbacks import (
     AsyncCallbackManager,
@@ -51,10 +46,7 @@ from langchain_core.language_models.base import (
 )
 from langchain_core.load import dumpd
 from langchain_core.messages import (
-    AIMessage,
-    BaseMessage,
     convert_to_messages,
-    get_buffer_string,
 )
 from langchain_core.outputs import Generation, GenerationChunk, LLMResult, RunInfo
 from langchain_core.prompt_values import ChatPromptValue, PromptValue, StringPromptValue
@@ -76,16 +68,14 @@ def _log_error_once(msg: str) -> None:
 def create_base_retry_decorator(
     error_types: list[type[BaseException]],
     max_retries: int = 1,
-    run_manager: Optional[
-        Union[AsyncCallbackManagerForLLMRun, CallbackManagerForLLMRun]
-    ] = None,
+    run_manager: AsyncCallbackManagerForLLMRun | CallbackManagerForLLMRun | None = None,
 ) -> Callable[[Any], Any]:
     """Create a retry decorator for a given LLM and provided a list of error types.

     Args:
         error_types: List of error types to retry on.
-        max_retries: Number of retries.
-        run_manager: Callback manager for the run.
+        max_retries: Number of retries.
+        run_manager: Callback manager for the run.

     Returns:
         A retry decorator.
@@ -101,13 +91,17 @@ def create_base_retry_decorator(
             if isinstance(run_manager, AsyncCallbackManagerForLLMRun):
                 coro = run_manager.on_retry(retry_state)
                 try:
-                    loop = asyncio.get_event_loop()
-                    if loop.is_running():
-                        # TODO: Fix RUF006 - this task should have a reference
-                        # and be awaited somewhere
-                        loop.create_task(coro)  # noqa: RUF006
-                    else:
+                    try:
+                        loop = asyncio.get_event_loop()
+                    except RuntimeError:
                         asyncio.run(coro)
+                    else:
+                        if loop.is_running():
+                            # TODO: Fix RUF006 - this task should have a reference
+                            # and be awaited somewhere
+                            loop.create_task(coro)  # noqa: RUF006
+                        else:
+                            asyncio.run(coro)
                 except Exception as e:
                     _log_error_once(f"Error in on_retry: {e}")
                 else:
@@ -129,8 +123,9 @@ def create_base_retry_decorator(
     )


-def _resolve_cache(*, cache: Union[BaseCache, bool, None]) -> Optional[BaseCache]:
+def _resolve_cache(*, cache: BaseCache | bool | None) -> BaseCache | None:
     """Resolve the cache."""
+    llm_cache: BaseCache | None
     if isinstance(cache, BaseCache):
         llm_cache = cache
     elif cache is None:
@@ -155,14 +150,14 @@ def _resolve_cache(*, cache: Union[BaseCache, bool, None]) -> Optional[BaseCache]:
 def get_prompts(
     params: dict[str, Any],
     prompts: list[str],
-    cache: Union[BaseCache, bool, None] = None,  # noqa: FBT001
+    cache: BaseCache | bool | None = None,  # noqa: FBT001
 ) -> tuple[dict[int, list], str, list[int], list[str]]:
     """Get prompts that are already cached.

     Args:
         params: Dictionary of parameters.
         prompts: List of prompts.
-        cache: Cache object.
+        cache: Cache object.

     Returns:
         A tuple of existing prompts, llm_string, missing prompt indexes,
@@ -191,14 +186,14 @@ def get_prompts(
 async def aget_prompts(
     params: dict[str, Any],
     prompts: list[str],
-    cache: Union[BaseCache, bool, None] = None,  # noqa: FBT001
+    cache: BaseCache | bool | None = None,  # noqa: FBT001
 ) -> tuple[dict[int, list], str, list[int], list[str]]:
     """Get prompts that are already cached. Async version.

     Args:
         params: Dictionary of parameters.
         prompts: List of prompts.
-        cache: Cache object.
+        cache: Cache object.

     Returns:
         A tuple of existing prompts, llm_string, missing prompt indexes,
@@ -224,13 +219,13 @@ async def aget_prompts(


 def update_cache(
-    cache: Union[BaseCache, bool, None],  # noqa: FBT001
+    cache: BaseCache | bool | None,  # noqa: FBT001
     existing_prompts: dict[int, list],
     llm_string: str,
     missing_prompt_idxs: list[int],
     new_results: LLMResult,
     prompts: list[str],
-) -> Optional[dict]:
+) -> dict | None:
     """Update the cache and get the LLM output.

     Args:
@@ -257,13 +252,13 @@ def update_cache(


 async def aupdate_cache(
-    cache: Union[BaseCache, bool, None],  # noqa: FBT001
+    cache: BaseCache | bool | None,  # noqa: FBT001
     existing_prompts: dict[int, list],
     llm_string: str,
     missing_prompt_idxs: list[int],
     new_results: LLMResult,
     prompts: list[str],
-) -> Optional[dict]:
+) -> dict | None:
     """Update the cache and get the LLM output. Async version.

     Args:
@@ -295,26 +290,10 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     It should take in a prompt and return a string.
     """

-    callback_manager: Optional[BaseCallbackManager] = Field(default=None, exclude=True)
-    """[DEPRECATED]"""
-
     model_config = ConfigDict(
         arbitrary_types_allowed=True,
     )

-    @model_validator(mode="before")
-    @classmethod
-    def raise_deprecation(cls, values: dict) -> Any:
-        """Raise deprecation warning if callback_manager is used."""
-        if values.get("callback_manager") is not None:
-            warnings.warn(
-                "callback_manager is deprecated. Please use callbacks instead.",
-                DeprecationWarning,
-                stacklevel=5,
-            )
-            values["callbacks"] = values.pop("callback_manager", None)
-        return values
-
     @functools.cached_property
     def _serialized(self) -> dict[str, Any]:
         return dumpd(self)
@@ -324,7 +303,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     @property
     @override
     def OutputType(self) -> type[str]:
-        """Get the input type for this runnable."""
+        """Get the input type for this `Runnable`."""
         return str

     def _convert_input(self, model_input: LanguageModelInput) -> PromptValue:
@@ -342,7 +321,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):

     def _get_ls_params(
         self,
-        stop: Optional[list[str]] = None,
+        stop: list[str] | None = None,
         **kwargs: Any,
     ) -> LangSmithParams:
         """Get standard params for tracing."""
@@ -356,7 +335,9 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             ls_params["ls_stop"] = stop

         # model
-        if hasattr(self, "model") and isinstance(self.model, str):
+        if "model" in kwargs and isinstance(kwargs["model"], str):
+            ls_params["ls_model_name"] = kwargs["model"]
+        elif hasattr(self, "model") and isinstance(self.model, str):
             ls_params["ls_model_name"] = self.model
         elif hasattr(self, "model_name") and isinstance(self.model_name, str):
             ls_params["ls_model_name"] = self.model_name
@@ -379,9 +360,9 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     def invoke(
         self,
         input: LanguageModelInput,
-        config: Optional[RunnableConfig] = None,
+        config: RunnableConfig | None = None,
         *,
-        stop: Optional[list[str]] = None,
+        stop: list[str] | None = None,
         **kwargs: Any,
     ) -> str:
         config = ensure_config(config)
@@ -404,9 +385,9 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     async def ainvoke(
         self,
         input: LanguageModelInput,
-        config: Optional[RunnableConfig] = None,
+        config: RunnableConfig | None = None,
         *,
-        stop: Optional[list[str]] = None,
+        stop: list[str] | None = None,
         **kwargs: Any,
     ) -> str:
         config = ensure_config(config)
@@ -426,7 +407,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     def batch(
         self,
         inputs: list[LanguageModelInput],
-        config: Optional[Union[RunnableConfig, list[RunnableConfig]]] = None,
+        config: RunnableConfig | list[RunnableConfig] | None = None,
         *,
         return_exceptions: bool = False,
         **kwargs: Any,
@@ -473,7 +454,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     async def abatch(
         self,
         inputs: list[LanguageModelInput],
-        config: Optional[Union[RunnableConfig, list[RunnableConfig]]] = None,
+        config: RunnableConfig | list[RunnableConfig] | None = None,
         *,
         return_exceptions: bool = False,
         **kwargs: Any,
@@ -519,9 +500,9 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     def stream(
         self,
         input: LanguageModelInput,
-        config: Optional[RunnableConfig] = None,
+        config: RunnableConfig | None = None,
         *,
-        stop: Optional[list[str]] = None,
+        stop: list[str] | None = None,
         **kwargs: Any,
     ) -> Iterator[str]:
         if type(self)._stream == BaseLLM._stream:  # noqa: SLF001
@@ -556,7 +537,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             run_id=config.pop("run_id", None),
             batch_size=1,
         )
-        generation: Optional[GenerationChunk] = None
+        generation: GenerationChunk | None = None
         try:
             for chunk in self._stream(
                 prompt, stop=stop, run_manager=run_manager, **kwargs
@@ -586,9 +567,9 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     async def astream(
         self,
         input: LanguageModelInput,
-        config: Optional[RunnableConfig] = None,
+        config: RunnableConfig | None = None,
         *,
-        stop: Optional[list[str]] = None,
+        stop: list[str] | None = None,
         **kwargs: Any,
     ) -> AsyncIterator[str]:
         if (
@@ -626,7 +607,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             run_id=config.pop("run_id", None),
             batch_size=1,
         )
-        generation: Optional[GenerationChunk] = None
+        generation: GenerationChunk | None = None
         try:
             async for chunk in self._astream(
                 prompt,
@@ -659,20 +640,42 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     def _generate(
         self,
         prompts: list[str],
-        stop: Optional[list[str]] = None,
-        run_manager: Optional[CallbackManagerForLLMRun] = None,
+        stop: list[str] | None = None,
+        run_manager: CallbackManagerForLLMRun | None = None,
         **kwargs: Any,
     ) -> LLMResult:
-        """Run the LLM on the given prompts."""
+        """Run the LLM on the given prompts.
+
+        Args:
+            prompts: The prompts to generate from.
+            stop: Stop words to use when generating. Model output is cut off at the
+                first occurrence of any of the stop substrings.
+                If stop tokens are not supported consider raising NotImplementedError.
+            run_manager: Callback manager for the run.
+
+        Returns:
+            The LLM result.
+        """

     async def _agenerate(
         self,
         prompts: list[str],
-        stop: Optional[list[str]] = None,
-        run_manager: Optional[AsyncCallbackManagerForLLMRun] = None,
+        stop: list[str] | None = None,
+        run_manager: AsyncCallbackManagerForLLMRun | None = None,
         **kwargs: Any,
     ) -> LLMResult:
-        """Run the LLM on the given prompts."""
+        """Run the LLM on the given prompts.
+
+        Args:
+            prompts: The prompts to generate from.
+            stop: Stop words to use when generating. Model output is cut off at the
+                first occurrence of any of the stop substrings.
+                If stop tokens are not supported consider raising NotImplementedError.
+            run_manager: Callback manager for the run.
+
+        Returns:
+            The LLM result.
+        """
         return await run_in_executor(
             None,
             self._generate,
@@ -685,8 +688,8 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     def _stream(
         self,
         prompt: str,
-        stop: Optional[list[str]] = None,
-        run_manager: Optional[CallbackManagerForLLMRun] = None,
+        stop: list[str] | None = None,
+        run_manager: CallbackManagerForLLMRun | None = None,
         **kwargs: Any,
     ) -> Iterator[GenerationChunk]:
         """Stream the LLM on the given prompt.
@@ -705,16 +708,16 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             **kwargs: Arbitrary additional keyword arguments. These are usually passed
                 to the model provider API call.

-        Returns:
-            An iterator of GenerationChunks.
+        Yields:
+            Generation chunks.
         """
         raise NotImplementedError

     async def _astream(
         self,
         prompt: str,
-        stop: Optional[list[str]] = None,
-        run_manager: Optional[AsyncCallbackManagerForLLMRun] = None,
+        stop: list[str] | None = None,
+        run_manager: AsyncCallbackManagerForLLMRun | None = None,
         **kwargs: Any,
     ) -> AsyncIterator[GenerationChunk]:
         """An async version of the _stream method.
@@ -731,8 +734,8 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             **kwargs: Arbitrary additional keyword arguments. These are usually passed
                 to the model provider API call.

-        Returns:
-            An async iterator of GenerationChunks.
+        Yields:
+            Generation chunks.
         """
         iterator = await run_in_executor(
             None,
@@ -758,8 +761,8 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     def generate_prompt(
         self,
         prompts: list[PromptValue],
-        stop: Optional[list[str]] = None,
-        callbacks: Optional[Union[Callbacks, list[Callbacks]]] = None,
+        stop: list[str] | None = None,
+        callbacks: Callbacks | list[Callbacks] | None = None,
         **kwargs: Any,
     ) -> LLMResult:
         prompt_strings = [p.to_string() for p in prompts]
@@ -769,8 +772,8 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     async def agenerate_prompt(
         self,
         prompts: list[PromptValue],
-        stop: Optional[list[str]] = None,
-        callbacks: Optional[Union[Callbacks, list[Callbacks]]] = None,
+        stop: list[str] | None = None,
+        callbacks: Callbacks | list[Callbacks] | None = None,
         **kwargs: Any,
     ) -> LLMResult:
         prompt_strings = [p.to_string() for p in prompts]
@@ -781,7 +784,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     def _generate_helper(
         self,
         prompts: list[str],
-        stop: Optional[list[str]],
+        stop: list[str] | None,
         run_managers: list[CallbackManagerForLLMRun],
         *,
         new_arg_supported: bool,
@@ -804,7 +807,9 @@ class BaseLLM(BaseLanguageModel[str], ABC):
                 run_manager.on_llm_error(e, response=LLMResult(generations=[]))
             raise
         flattened_outputs = output.flatten()
-        for manager, flattened_output in zip(run_managers, flattened_outputs):
+        for manager, flattened_output in zip(
+            run_managers, flattened_outputs, strict=False
+        ):
             manager.on_llm_end(flattened_output)
         if run_managers:
             output.run = [
@@ -815,13 +820,13 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     def generate(
         self,
         prompts: list[str],
-        stop: Optional[list[str]] = None,
-        callbacks: Optional[Union[Callbacks, list[Callbacks]]] = None,
+        stop: list[str] | None = None,
+        callbacks: Callbacks | list[Callbacks] | None = None,
         *,
-        tags: Optional[Union[list[str], list[list[str]]]] = None,
-        metadata: Optional[Union[dict[str, Any], list[dict[str, Any]]]] = None,
-        run_name: Optional[Union[str, list[str]]] = None,
-        run_id: Optional[Union[uuid.UUID, list[Optional[uuid.UUID]]]] = None,
+        tags: list[str] | list[list[str]] | None = None,
+        metadata: dict[str, Any] | list[dict[str, Any]] | None = None,
+        run_name: str | list[str] | None = None,
+        run_id: uuid.UUID | list[uuid.UUID | None] | None = None,
         **kwargs: Any,
     ) -> LLMResult:
         """Pass a sequence of prompts to a model and return generations.
@@ -830,16 +835,17 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             API.

         Use this method when you want to:
-            1. take advantage of batched calls,
-            2. need more output from the model than just the top generated value,
-            3. are building chains that are agnostic to the underlying language model
-                type (e.g., pure text completion models vs chat models).
+
+        1. Take advantage of batched calls,
+        2. Need more output from the model than just the top generated value,
+        3. Are building chains that are agnostic to the underlying language model
+            type (e.g., pure text completion models vs chat models).

         Args:
             prompts: List of string prompts.
             stop: Stop words to use when generating. Model output is cut off at the
                 first occurrence of any of these substrings.
-            callbacks: Callbacks to pass through. Used for executing additional
+            callbacks: `Callbacks` to pass through. Used for executing additional
                 functionality, such as logging or streaming, throughout generation.
             tags: List of tags to associate with each prompt. If provided, the length
                 of the list must match the length of the prompts list.
@@ -853,9 +859,14 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             **kwargs: Arbitrary additional keyword arguments. These are usually passed
                 to the model provider API call.

+        Raises:
+            ValueError: If prompts is not a list.
+            ValueError: If the length of `callbacks`, `tags`, `metadata`, or
+                `run_name` (if provided) does not match the length of prompts.
+
         Returns:
-            An LLMResult, which contains a list of candidate Generations for each input
-                prompt and additional model provider-specific output.
+            An `LLMResult`, which contains a list of candidate `Generations` for each
+                input prompt and additional model provider-specific output.
         """
         if not isinstance(prompts, list):
             msg = (
@@ -905,14 +916,12 @@ class BaseLLM(BaseLanguageModel[str], ABC):
                 msg = "run_name must be a list of the same length as prompts"
                 raise ValueError(msg)
             callbacks = cast("list[Callbacks]", callbacks)
-            tags_list = cast(
-                "list[Optional[list[str]]]", tags or ([None] * len(prompts))
-            )
+            tags_list = cast("list[list[str] | None]", tags or ([None] * len(prompts)))
             metadata_list = cast(
-                "list[Optional[dict[str, Any]]]", metadata or ([{}] * len(prompts))
+                "list[dict[str, Any] | None]", metadata or ([{}] * len(prompts))
             )
             run_name_list = run_name or cast(
-                "list[Optional[str]]", ([None] * len(prompts))
+                "list[str | None]", ([None] * len(prompts))
             )
             callback_managers = [
                 CallbackManager.configure(
@@ -924,7 +933,9 @@ class BaseLLM(BaseLanguageModel[str], ABC):
                     meta,
                     self.metadata,
                 )
-                for callback, tag, meta in zip(callbacks, tags_list, metadata_list)
+                for callback, tag, meta in zip(
+                    callbacks, tags_list, metadata_list, strict=False
+                )
             ]
         else:
             # We've received a single callbacks arg to apply to all inputs
@@ -939,7 +950,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
                     self.metadata,
                 )
             ] * len(prompts)
-            run_name_list = [cast("Optional[str]", run_name)] * len(prompts)
+            run_name_list = [cast("str | None", run_name)] * len(prompts)
         run_ids_list = self._get_run_ids_list(run_id, prompts)
         params = self.dict()
         params["stop"] = stop
@@ -965,7 +976,11 @@ class BaseLLM(BaseLanguageModel[str], ABC):
                 run_id=run_id_,
             )[0]
             for callback_manager, prompt, run_name, run_id_ in zip(
-                callback_managers, prompts, run_name_list, run_ids_list
+                callback_managers,
+                prompts,
+                run_name_list,
+                run_ids_list,
+                strict=False,
             )
         ]
         return self._generate_helper(
@@ -1015,7 +1030,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):

     @staticmethod
     def _get_run_ids_list(
-        run_id: Optional[Union[uuid.UUID, list[Optional[uuid.UUID]]]], prompts: list
+        run_id: uuid.UUID | list[uuid.UUID | None] | None, prompts: list
     ) -> list:
         if run_id is None:
             return [None] * len(prompts)
@@ -1032,7 +1047,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
     async def _agenerate_helper(
         self,
         prompts: list[str],
-        stop: Optional[list[str]],
+        stop: list[str] | None,
         run_managers: list[AsyncCallbackManagerForLLMRun],
         *,
         new_arg_supported: bool,
@@ -1062,7 +1077,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             *[
                 run_manager.on_llm_end(flattened_output)
                 for run_manager, flattened_output in zip(
-                    run_managers, flattened_outputs
+                    run_managers, flattened_outputs, strict=False
                 )
             ]
         )
@@ -1075,13 +1090,13 @@ class BaseLLM(BaseLanguageModel[str], ABC):
    async def agenerate(
         self,
         prompts: list[str],
-        stop: Optional[list[str]] = None,
-        callbacks: Optional[Union[Callbacks, list[Callbacks]]] = None,
+        stop: list[str] | None = None,
+        callbacks: Callbacks | list[Callbacks] | None = None,
         *,
-        tags: Optional[Union[list[str], list[list[str]]]] = None,
-        metadata: Optional[Union[dict[str, Any], list[dict[str, Any]]]] = None,
-        run_name: Optional[Union[str, list[str]]] = None,
-        run_id: Optional[Union[uuid.UUID, list[Optional[uuid.UUID]]]] = None,
+        tags: list[str] | list[list[str]] | None = None,
+        metadata: dict[str, Any] | list[dict[str, Any]] | None = None,
+        run_name: str | list[str] | None = None,
+        run_id: uuid.UUID | list[uuid.UUID | None] | None = None,
         **kwargs: Any,
     ) -> LLMResult:
         """Asynchronously pass a sequence of prompts to a model and return generations.
@@ -1090,16 +1105,17 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             API.

         Use this method when you want to:
-            1. take advantage of batched calls,
-            2. need more output from the model than just the top generated value,
-            3. are building chains that are agnostic to the underlying language model
-                type (e.g., pure text completion models vs chat models).
+
+        1. Take advantage of batched calls,
+        2. Need more output from the model than just the top generated value,
+        3. Are building chains that are agnostic to the underlying language model
+            type (e.g., pure text completion models vs chat models).

         Args:
             prompts: List of string prompts.
             stop: Stop words to use when generating. Model output is cut off at the
                 first occurrence of any of these substrings.
-            callbacks: Callbacks to pass through. Used for executing additional
+            callbacks: `Callbacks` to pass through. Used for executing additional
                 functionality, such as logging or streaming, throughout generation.
             tags: List of tags to associate with each prompt. If provided, the length
                 of the list must match the length of the prompts list.
@@ -1113,9 +1129,13 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             **kwargs: Arbitrary additional keyword arguments. These are usually passed
                 to the model provider API call.

+        Raises:
+            ValueError: If the length of `callbacks`, `tags`, `metadata`, or
+                `run_name` (if provided) does not match the length of prompts.
+
         Returns:
-            An LLMResult, which contains a list of candidate Generations for each input
-                prompt and additional model provider-specific output.
+            An `LLMResult`, which contains a list of candidate `Generations` for each
+                input prompt and additional model provider-specific output.
         """
         if isinstance(metadata, list):
             metadata = [
@@ -1155,14 +1175,12 @@ class BaseLLM(BaseLanguageModel[str], ABC):
                 msg = "run_name must be a list of the same length as prompts"
                 raise ValueError(msg)
             callbacks = cast("list[Callbacks]", callbacks)
-            tags_list = cast(
-                "list[Optional[list[str]]]", tags or ([None] * len(prompts))
-            )
+            tags_list = cast("list[list[str] | None]", tags or ([None] * len(prompts)))
             metadata_list = cast(
-                "list[Optional[dict[str, Any]]]", metadata or ([{}] * len(prompts))
+                "list[dict[str, Any] | None]", metadata or ([{}] * len(prompts))
             )
             run_name_list = run_name or cast(
-                "list[Optional[str]]", ([None] * len(prompts))
+                "list[str | None]", ([None] * len(prompts))
             )
             callback_managers = [
                 AsyncCallbackManager.configure(
@@ -1174,7 +1192,9 @@ class BaseLLM(BaseLanguageModel[str], ABC):
                     meta,
                     self.metadata,
                 )
-                for callback, tag, meta in zip(callbacks, tags_list, metadata_list)
+                for callback, tag, meta in zip(
+                    callbacks, tags_list, metadata_list, strict=False
+                )
             ]
         else:
             # We've received a single callbacks arg to apply to all inputs
@@ -1189,7 +1209,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
                     self.metadata,
                 )
             ] * len(prompts)
-            run_name_list = [cast("Optional[str]", run_name)] * len(prompts)
+            run_name_list = [cast("str | None", run_name)] * len(prompts)
         run_ids_list = self._get_run_ids_list(run_id, prompts)
         params = self.dict()
         params["stop"] = stop
@@ -1219,7 +1239,11 @@ class BaseLLM(BaseLanguageModel[str], ABC):
                     run_id=run_id_,
                 )
                 for callback_manager, prompt, run_name, run_id_ in zip(
-                    callback_managers, prompts, run_name_list, run_ids_list
+                    callback_managers,
+                    prompts,
+                    run_name_list,
+                    run_ids_list,
+                    strict=False,
                 )
             ]
         )
@@ -1272,64 +1296,14 @@ class BaseLLM(BaseLanguageModel[str], ABC):
         generations = [existing_prompts[i] for i in range(len(prompts))]
         return LLMResult(generations=generations, llm_output=llm_output, run=run_info)

-    @deprecated("0.1.7", alternative="invoke", removal="1.0")
-    def __call__(
-        self,
-        prompt: str,
-        stop: Optional[list[str]] = None,
-        callbacks: Callbacks = None,
-        *,
-        tags: Optional[list[str]] = None,
-        metadata: Optional[dict[str, Any]] = None,
-        **kwargs: Any,
-    ) -> str:
-        """Check Cache and run the LLM on the given prompt and input.
-
-        Args:
-            prompt: The prompt to generate from.
-            stop: Stop words to use when generating. Model output is cut off at the
-                first occurrence of any of these substrings.
-            callbacks: Callbacks to pass through. Used for executing additional
-                functionality, such as logging or streaming, throughout generation.
-            tags: List of tags to associate with the prompt.
-            metadata: Metadata to associate with the prompt.
-            **kwargs: Arbitrary additional keyword arguments. These are usually passed
-                to the model provider API call.
-
-        Returns:
-            The generated text.
-
-        Raises:
-            ValueError: If the prompt is not a string.
-        """
-        if not isinstance(prompt, str):
-            msg = (
-                "Argument `prompt` is expected to be a string. Instead found "
-                f"{type(prompt)}. If you want to run the LLM on multiple prompts, use "
-                "`generate` instead."
-            )
-            raise ValueError(msg)  # noqa: TRY004
-        return (
-            self.generate(
-                [prompt],
-                stop=stop,
-                callbacks=callbacks,
-                tags=tags,
-                metadata=metadata,
-                **kwargs,
-            )
-            .generations[0][0]
-            .text
-        )
-
     async def _call_async(
         self,
         prompt: str,
-        stop: Optional[list[str]] = None,
+        stop: list[str] | None = None,
         callbacks: Callbacks = None,
         *,
-        tags: Optional[list[str]] = None,
-        metadata: Optional[dict[str, Any]] = None,
+        tags: list[str] | None = None,
+        metadata: dict[str, Any] | None = None,
         **kwargs: Any,
     ) -> str:
         """Check Cache and run the LLM on the given prompt and input."""
@@ -1343,52 +1317,8 @@ class BaseLLM(BaseLanguageModel[str], ABC):
         )
         return result.generations[0][0].text

-    @deprecated("0.1.7", alternative="invoke", removal="1.0")
-    @override
-    def predict(
-        self, text: str, *, stop: Optional[Sequence[str]] = None, **kwargs: Any
-    ) -> str:
-        stop_ = None if stop is None else list(stop)
-        return self(text, stop=stop_, **kwargs)
-
-    @deprecated("0.1.7", alternative="invoke", removal="1.0")
-    @override
-    def predict_messages(
-        self,
-        messages: list[BaseMessage],
-        *,
-        stop: Optional[Sequence[str]] = None,
-        **kwargs: Any,
-    ) -> BaseMessage:
-        text = get_buffer_string(messages)
-        stop_ = None if stop is None else list(stop)
-        content = self(text, stop=stop_, **kwargs)
-        return AIMessage(content=content)
-
-    @deprecated("0.1.7", alternative="ainvoke", removal="1.0")
-    @override
-    async def apredict(
-        self, text: str, *, stop: Optional[Sequence[str]] = None, **kwargs: Any
-    ) -> str:
-        stop_ = None if stop is None else list(stop)
-        return await self._call_async(text, stop=stop_, **kwargs)
-
-    @deprecated("0.1.7", alternative="ainvoke", removal="1.0")
-    @override
-    async def apredict_messages(
-        self,
-        messages: list[BaseMessage],
-        *,
-        stop: Optional[Sequence[str]] = None,
-        **kwargs: Any,
-    ) -> BaseMessage:
-        text = get_buffer_string(messages)
-        stop_ = None if stop is None else list(stop)
-        content = await self._call_async(text, stop=stop_, **kwargs)
-        return AIMessage(content=content)
-
     def __str__(self) -> str:
-        """Get a string representation of the object for printing."""
+        """Return a string representation of the object for printing."""
         cls_name = f"\033[1m{self.__class__.__name__}\033[0m"
         return f"{cls_name}\nParams: {self._identifying_params}"

@@ -1404,7 +1334,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
         starter_dict["_type"] = self._llm_type
         return starter_dict

-    def save(self, file_path: Union[Path, str]) -> None:
+    def save(self, file_path: Path | str) -> None:
         """Save the LLM.

         Args:
@@ -1414,11 +1344,9 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             ValueError: If the file path is not a string or Path object.

         Example:
-
-        .. code-block:: python
-
-            llm.save(file_path="path/llm.yaml")
-
+            ```python
+            llm.save(file_path="path/llm.yaml")
+            ```
         """
         # Convert file to Path object.
         save_path = Path(file_path)
@@ -1430,10 +1358,10 @@ class BaseLLM(BaseLanguageModel[str], ABC):
         prompt_dict = self.dict()

         if save_path.suffix == ".json":
-            with save_path.open("w") as f:
+            with save_path.open("w", encoding="utf-8") as f:
                 json.dump(prompt_dict, f, indent=4)
         elif save_path.suffix.endswith((".yaml", ".yml")):
-            with save_path.open("w") as f:
+            with save_path.open("w", encoding="utf-8") as f:
                 yaml.dump(prompt_dict, f, default_flow_style=False)
         else:
             msg = f"{save_path} must be json or yaml"
@@ -1474,8 +1402,8 @@ class LLM(BaseLLM):
     def _call(
         self,
         prompt: str,
-        stop: Optional[list[str]] = None,
-        run_manager: Optional[CallbackManagerForLLMRun] = None,
+        stop: list[str] | None = None,
+        run_manager: CallbackManagerForLLMRun | None = None,
         **kwargs: Any,
     ) -> str:
         """Run the LLM on the given input.
@@ -1498,8 +1426,8 @@ class LLM(BaseLLM):
     async def _acall(
         self,
         prompt: str,
-        stop: Optional[list[str]] = None,
-        run_manager: Optional[AsyncCallbackManagerForLLMRun] = None,
+        stop: list[str] | None = None,
+        run_manager: AsyncCallbackManagerForLLMRun | None = None,
         **kwargs: Any,
     ) -> str:
         """Async version of the _call method.
@@ -1532,11 +1460,10 @@ class LLM(BaseLLM):
     def _generate(
         self,
         prompts: list[str],
-        stop: Optional[list[str]] = None,
-        run_manager: Optional[CallbackManagerForLLMRun] = None,
+        stop: list[str] | None = None,
+        run_manager: CallbackManagerForLLMRun | None = None,
         **kwargs: Any,
     ) -> LLMResult:
-        """Run the LLM on the given prompt and input."""
         # TODO: add caching here.
         generations = []
         new_arg_supported = inspect.signature(self._call).parameters.get("run_manager")
@@ -1552,11 +1479,10 @@ class LLM(BaseLLM):
     async def _agenerate(
         self,
         prompts: list[str],
-        stop: Optional[list[str]] = None,
-        run_manager: Optional[AsyncCallbackManagerForLLMRun] = None,
+        stop: list[str] | None = None,
+        run_manager: AsyncCallbackManagerForLLMRun | None = None,
         **kwargs: Any,
     ) -> LLMResult:
-        """Async run the LLM on the given prompt and input."""
        generations = []
         new_arg_supported = inspect.signature(self._acall).parameters.get("run_manager")
         for prompt in prompts: