langchain-core 0.3.74__py3-none-any.whl → 0.3.76__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of langchain-core has been flagged as possibly problematic by the registry.

Files changed (122):
  1. langchain_core/_api/beta_decorator.py +18 -41
  2. langchain_core/_api/deprecation.py +20 -7
  3. langchain_core/_api/path.py +19 -2
  4. langchain_core/_import_utils.py +7 -0
  5. langchain_core/agents.py +10 -6
  6. langchain_core/beta/runnables/context.py +2 -3
  7. langchain_core/callbacks/base.py +11 -4
  8. langchain_core/callbacks/file.py +13 -2
  9. langchain_core/callbacks/manager.py +129 -78
  10. langchain_core/callbacks/usage.py +4 -2
  11. langchain_core/chat_history.py +10 -12
  12. langchain_core/document_loaders/base.py +34 -9
  13. langchain_core/document_loaders/langsmith.py +3 -0
  14. langchain_core/documents/base.py +36 -11
  15. langchain_core/documents/compressor.py +9 -6
  16. langchain_core/documents/transformers.py +4 -2
  17. langchain_core/embeddings/fake.py +8 -5
  18. langchain_core/env.py +2 -3
  19. langchain_core/example_selectors/base.py +12 -0
  20. langchain_core/exceptions.py +7 -0
  21. langchain_core/globals.py +17 -28
  22. langchain_core/indexing/api.py +56 -44
  23. langchain_core/indexing/base.py +7 -10
  24. langchain_core/indexing/in_memory.py +23 -3
  25. langchain_core/language_models/__init__.py +3 -2
  26. langchain_core/language_models/base.py +64 -39
  27. langchain_core/language_models/chat_models.py +130 -42
  28. langchain_core/language_models/fake_chat_models.py +10 -11
  29. langchain_core/language_models/llms.py +49 -17
  30. langchain_core/load/dump.py +5 -7
  31. langchain_core/load/load.py +15 -1
  32. langchain_core/load/serializable.py +38 -43
  33. langchain_core/memory.py +7 -3
  34. langchain_core/messages/ai.py +36 -16
  35. langchain_core/messages/base.py +13 -6
  36. langchain_core/messages/content_blocks.py +23 -2
  37. langchain_core/messages/human.py +2 -6
  38. langchain_core/messages/modifier.py +1 -1
  39. langchain_core/messages/system.py +2 -6
  40. langchain_core/messages/tool.py +36 -16
  41. langchain_core/messages/utils.py +198 -87
  42. langchain_core/output_parsers/base.py +5 -2
  43. langchain_core/output_parsers/json.py +4 -4
  44. langchain_core/output_parsers/list.py +7 -22
  45. langchain_core/output_parsers/openai_functions.py +3 -0
  46. langchain_core/output_parsers/openai_tools.py +8 -1
  47. langchain_core/output_parsers/pydantic.py +4 -0
  48. langchain_core/output_parsers/string.py +5 -1
  49. langchain_core/output_parsers/transform.py +2 -2
  50. langchain_core/output_parsers/xml.py +23 -22
  51. langchain_core/outputs/chat_generation.py +18 -7
  52. langchain_core/outputs/generation.py +14 -3
  53. langchain_core/outputs/llm_result.py +8 -1
  54. langchain_core/prompt_values.py +10 -4
  55. langchain_core/prompts/base.py +4 -9
  56. langchain_core/prompts/chat.py +88 -61
  57. langchain_core/prompts/dict.py +16 -8
  58. langchain_core/prompts/few_shot.py +9 -11
  59. langchain_core/prompts/few_shot_with_templates.py +5 -1
  60. langchain_core/prompts/image.py +12 -5
  61. langchain_core/prompts/message.py +5 -6
  62. langchain_core/prompts/pipeline.py +13 -8
  63. langchain_core/prompts/prompt.py +22 -8
  64. langchain_core/prompts/string.py +18 -10
  65. langchain_core/prompts/structured.py +7 -2
  66. langchain_core/rate_limiters.py +2 -2
  67. langchain_core/retrievers.py +7 -6
  68. langchain_core/runnables/base.py +842 -567
  69. langchain_core/runnables/branch.py +15 -20
  70. langchain_core/runnables/config.py +11 -17
  71. langchain_core/runnables/configurable.py +34 -19
  72. langchain_core/runnables/fallbacks.py +24 -17
  73. langchain_core/runnables/graph.py +47 -40
  74. langchain_core/runnables/graph_ascii.py +40 -17
  75. langchain_core/runnables/graph_mermaid.py +27 -15
  76. langchain_core/runnables/graph_png.py +27 -31
  77. langchain_core/runnables/history.py +56 -59
  78. langchain_core/runnables/passthrough.py +47 -24
  79. langchain_core/runnables/retry.py +10 -6
  80. langchain_core/runnables/router.py +10 -9
  81. langchain_core/runnables/schema.py +2 -0
  82. langchain_core/runnables/utils.py +51 -89
  83. langchain_core/stores.py +13 -25
  84. langchain_core/structured_query.py +3 -7
  85. langchain_core/sys_info.py +9 -8
  86. langchain_core/tools/base.py +30 -23
  87. langchain_core/tools/convert.py +24 -13
  88. langchain_core/tools/simple.py +35 -3
  89. langchain_core/tools/structured.py +26 -3
  90. langchain_core/tracers/_streaming.py +6 -7
  91. langchain_core/tracers/base.py +2 -2
  92. langchain_core/tracers/context.py +5 -1
  93. langchain_core/tracers/core.py +109 -39
  94. langchain_core/tracers/evaluation.py +22 -26
  95. langchain_core/tracers/event_stream.py +41 -28
  96. langchain_core/tracers/langchain.py +12 -3
  97. langchain_core/tracers/langchain_v1.py +10 -2
  98. langchain_core/tracers/log_stream.py +57 -18
  99. langchain_core/tracers/root_listeners.py +4 -20
  100. langchain_core/tracers/run_collector.py +6 -16
  101. langchain_core/tracers/schemas.py +5 -1
  102. langchain_core/utils/aiter.py +14 -6
  103. langchain_core/utils/env.py +3 -0
  104. langchain_core/utils/function_calling.py +49 -30
  105. langchain_core/utils/interactive_env.py +6 -2
  106. langchain_core/utils/iter.py +11 -3
  107. langchain_core/utils/json.py +5 -2
  108. langchain_core/utils/json_schema.py +15 -5
  109. langchain_core/utils/loading.py +5 -1
  110. langchain_core/utils/mustache.py +24 -15
  111. langchain_core/utils/pydantic.py +32 -4
  112. langchain_core/utils/utils.py +24 -8
  113. langchain_core/vectorstores/base.py +7 -20
  114. langchain_core/vectorstores/in_memory.py +18 -12
  115. langchain_core/vectorstores/utils.py +18 -12
  116. langchain_core/version.py +1 -1
  117. langchain_core-0.3.76.dist-info/METADATA +77 -0
  118. langchain_core-0.3.76.dist-info/RECORD +174 -0
  119. langchain_core-0.3.74.dist-info/METADATA +0 -108
  120. langchain_core-0.3.74.dist-info/RECORD +0 -174
  121. {langchain_core-0.3.74.dist-info → langchain_core-0.3.76.dist-info}/WHEEL +0 -0
  122. {langchain_core-0.3.74.dist-info → langchain_core-0.3.76.dist-info}/entry_points.txt +0 -0
langchain_core/language_models/chat_models.py:

@@ -46,6 +46,10 @@ from langchain_core.messages import (
     message_chunk_to_message,
 )
 from langchain_core.messages.ai import _LC_ID_PREFIX
+from langchain_core.output_parsers.openai_tools import (
+    JsonOutputKeyToolsParser,
+    PydanticToolsParser,
+)
 from langchain_core.outputs import (
     ChatGeneration,
     ChatGenerationChunk,
@@ -78,6 +82,11 @@ def _generate_response_from_error(error: BaseException) -> list[ChatGeneration]:
     if hasattr(error, "response"):
         response = error.response
         metadata: dict = {}
+        if hasattr(response, "json"):
+            try:
+                metadata["body"] = response.json()
+            except Exception:
+                metadata["body"] = getattr(response, "text", None)
         if hasattr(response, "headers"):
             try:
                 metadata["headers"] = dict(response.headers)
@@ -97,17 +106,18 @@ def _generate_response_from_error(error: BaseException) -> list[ChatGeneration]:
 
 
 def _format_for_tracing(messages: list[BaseMessage]) -> list[BaseMessage]:
-    """Format messages for tracing in on_chat_model_start.
+    """Format messages for tracing in ``on_chat_model_start``.
 
     - Update image content blocks to OpenAI Chat Completions format (backward
       compatibility).
-    - Add "type" key to content blocks that have a single key.
+    - Add ``type`` key to content blocks that have a single key.
 
     Args:
         messages: List of messages to format.
 
     Returns:
         List of messages formatted for tracing.
+
     """
     messages_to_trace = []
     for message in messages:
@@ -142,8 +152,6 @@ def _format_for_tracing(messages: list[BaseMessage]) -> list[BaseMessage]:
                         "type": key,
                         key: block[key],
                     }
-                else:
-                    pass
         messages_to_trace.append(message_to_trace)
 
     return messages_to_trace
@@ -153,10 +161,14 @@ def generate_from_stream(stream: Iterator[ChatGenerationChunk]) -> ChatResult:
     """Generate from a stream.
 
     Args:
-        stream: Iterator of ChatGenerationChunk.
+        stream: Iterator of ``ChatGenerationChunk``.
+
+    Raises:
+        ValueError: If no generations are found in the stream.
 
     Returns:
         ChatResult: Chat result.
+
     """
     generation = next(stream, None)
     if generation:
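A hedged usage sketch of generate_from_stream, whose docstring gains the Raises section above: it consumes an iterator of chunks, merges them, and wraps the merged generation in a ChatResult, raising ValueError if the iterator is empty. Illustrative only, assuming langchain-core is installed:

    from langchain_core.language_models.chat_models import generate_from_stream
    from langchain_core.messages import AIMessageChunk
    from langchain_core.outputs import ChatGenerationChunk

    chunks = iter(
        [
            ChatGenerationChunk(message=AIMessageChunk(content="Hello, ")),
            ChatGenerationChunk(message=AIMessageChunk(content="world!")),
        ]
    )
    result = generate_from_stream(chunks)
    # The chunks are merged into a single generation.
    print(result.generations[0].message.content)  # "Hello, world!"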
@@ -180,10 +192,11 @@ async def agenerate_from_stream(
     """Async generate from a stream.
 
     Args:
-        stream: Iterator of ChatGenerationChunk.
+        stream: Iterator of ``ChatGenerationChunk``.
 
     Returns:
         ChatResult: Chat result.
+
     """
     chunks = [chunk async for chunk in stream]
     return await run_in_executor(None, generate_from_stream, iter(chunks))
@@ -311,15 +324,16 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
     provided. This offers the best of both worlds.
     - If False (default), will always use streaming case if available.
 
-    The main reason for this flag is that code might be written using ``.stream()`` and
+    The main reason for this flag is that code might be written using ``stream()`` and
     a user may want to swap out a given model for another model whose the implementation
     does not properly support streaming.
+
     """
 
     @model_validator(mode="before")
     @classmethod
     def raise_deprecation(cls, values: dict) -> Any:
-        """Raise deprecation warning if callback_manager is used.
+        """Emit deprecation warning if ``callback_manager`` is used.
 
         Args:
             values (Dict): Values to validate.
@@ -327,8 +341,6 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
         Returns:
             Dict: Validated values.
 
-        Raises:
-            DeprecationWarning: If callback_manager is used.
         """
         if values.get("callback_manager") is not None:
             warnings.warn(
@@ -528,7 +540,7 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
             generations = [generations_with_error_metadata]
             run_manager.on_llm_error(
                 e,
-                response=LLMResult(generations=generations),  # type: ignore[arg-type]
+                response=LLMResult(generations=generations),
             )
             raise
 
@@ -622,7 +634,7 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
             generations = [generations_with_error_metadata]
             await run_manager.on_llm_error(
                 e,
-                response=LLMResult(generations=generations),  # type: ignore[arg-type]
+                response=LLMResult(generations=generations),
             )
             raise
 
@@ -653,6 +665,7 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
 
         Returns:
             List of ChatGeneration objects.
+
         """
         converted_generations = []
         for gen in cache_val:
@@ -758,10 +771,11 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
         API.
 
         Use this method when you want to:
-            1. take advantage of batched calls,
-            2. need more output from the model than just the top generated value,
-            3. are building chains that are agnostic to the underlying language model
-                type (e.g., pure text completion models vs chat models).
+
+        1. Take advantage of batched calls,
+        2. Need more output from the model than just the top generated value,
+        3. Are building chains that are agnostic to the underlying language model
+           type (e.g., pure text completion models vs chat models).
 
         Args:
             messages: List of list of messages.
@@ -778,7 +792,8 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
 
         Returns:
             An LLMResult, which contains a list of candidate Generations for each input
-                prompt and additional model provider-specific output.
+            prompt and additional model provider-specific output.
+
         """
         ls_structured_output_format = kwargs.pop(
             "ls_structured_output_format", None
@@ -835,17 +850,17 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
                 run_managers[i].on_llm_error(
                     e,
                     response=LLMResult(
-                        generations=[generations_with_error_metadata]  # type: ignore[list-item]
+                        generations=[generations_with_error_metadata]
                     ),
                 )
                 raise
         flattened_outputs = [
-            LLMResult(generations=[res.generations], llm_output=res.llm_output)  # type: ignore[list-item]
+            LLMResult(generations=[res.generations], llm_output=res.llm_output)
             for res in results
         ]
         llm_output = self._combine_llm_outputs([res.llm_output for res in results])
         generations = [res.generations for res in results]
-        output = LLMResult(generations=generations, llm_output=llm_output)  # type: ignore[arg-type]
+        output = LLMResult(generations=generations, llm_output=llm_output)
         if run_managers:
             run_infos = []
             for manager, flattened_output in zip(run_managers, flattened_outputs):
@@ -872,10 +887,11 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
         API.
 
         Use this method when you want to:
-            1. take advantage of batched calls,
-            2. need more output from the model than just the top generated value,
-            3. are building chains that are agnostic to the underlying language model
-                type (e.g., pure text completion models vs chat models).
+
+        1. Take advantage of batched calls,
+        2. Need more output from the model than just the top generated value,
+        3. Are building chains that are agnostic to the underlying language model
+           type (e.g., pure text completion models vs chat models).
 
         Args:
             messages: List of list of messages.
@@ -892,7 +908,8 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
 
         Returns:
             An LLMResult, which contains a list of candidate Generations for each input
-                prompt and additional model provider-specific output.
+            prompt and additional model provider-specific output.
+
         """
         ls_structured_output_format = kwargs.pop(
             "ls_structured_output_format", None
@@ -954,7 +971,7 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
                 await run_managers[i].on_llm_error(
                     res,
                     response=LLMResult(
-                        generations=[generations_with_error_metadata]  # type: ignore[list-item]
+                        generations=[generations_with_error_metadata]
                     ),
                 )
                 exceptions.append(res)
@@ -964,7 +981,7 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
                 *[
                     run_manager.on_llm_end(
                         LLMResult(
-                            generations=[res.generations],  # type: ignore[list-item, union-attr]
+                            generations=[res.generations],  # type: ignore[union-attr]
                             llm_output=res.llm_output,  # type: ignore[union-attr]
                         )
                     )
@@ -974,12 +991,12 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
             )
             raise exceptions[0]
         flattened_outputs = [
-            LLMResult(generations=[res.generations], llm_output=res.llm_output)  # type: ignore[list-item, union-attr]
+            LLMResult(generations=[res.generations], llm_output=res.llm_output)  # type: ignore[union-attr]
             for res in results
         ]
         llm_output = self._combine_llm_outputs([res.llm_output for res in results])  # type: ignore[union-attr]
         generations = [res.generations for res in results]  # type: ignore[union-attr]
-        output = LLMResult(generations=generations, llm_output=llm_output)  # type: ignore[arg-type]
+        output = LLMResult(generations=generations, llm_output=llm_output)
         await asyncio.gather(
             *[
                 run_manager.on_llm_end(flattened_output)
@@ -1172,7 +1189,17 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
         run_manager: Optional[CallbackManagerForLLMRun] = None,
         **kwargs: Any,
     ) -> ChatResult:
-        """Top Level call."""
+        """Generate the result.
+
+        Args:
+            messages: The messages to generate from.
+            stop: Optional list of stop words to use when generating.
+            run_manager: Optional callback manager to use for this call.
+            **kwargs: Additional keyword arguments to pass to the model.
+
+        Returns:
+            The chat result.
+        """
 
     async def _agenerate(
         self,
@@ -1181,7 +1208,17 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
         run_manager: Optional[AsyncCallbackManagerForLLMRun] = None,
         **kwargs: Any,
     ) -> ChatResult:
-        """Top Level call."""
+        """Generate the result.
+
+        Args:
+            messages: The messages to generate from.
+            stop: Optional list of stop words to use when generating.
+            run_manager: Optional callback manager to use for this call.
+            **kwargs: Additional keyword arguments to pass to the model.
+
+        Returns:
+            The chat result.
+        """
         return await run_in_executor(
             None,
             self._generate,
@@ -1198,6 +1235,17 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
         run_manager: Optional[CallbackManagerForLLMRun] = None,
         **kwargs: Any,
     ) -> Iterator[ChatGenerationChunk]:
+        """Stream the output of the model.
+
+        Args:
+            messages: The messages to generate from.
+            stop: Optional list of stop words to use when generating.
+            run_manager: Optional callback manager to use for this call.
+            **kwargs: Additional keyword arguments to pass to the model.
+
+        Yields:
+            The chat generation chunks.
+        """
         raise NotImplementedError
 
     async def _astream(
@@ -1207,6 +1255,17 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
         run_manager: Optional[AsyncCallbackManagerForLLMRun] = None,
         **kwargs: Any,
     ) -> AsyncIterator[ChatGenerationChunk]:
+        """Stream the output of the model.
+
+        Args:
+            messages: The messages to generate from.
+            stop: Optional list of stop words to use when generating.
+            run_manager: Optional callback manager to use for this call.
+            **kwargs: Additional keyword arguments to pass to the model.
+
+        Yields:
+            The chat generation chunks.
+        """
         iterator = await run_in_executor(
             None,
             self._stream,
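The newly documented _generate and _stream hooks are exactly what a custom chat model overrides. A hedged sketch of a minimal subclass wiring both hooks (illustrative; EchoChatModel is an assumed name and error handling is omitted):

    from collections.abc import Iterator
    from typing import Any, Optional

    from langchain_core.callbacks import CallbackManagerForLLMRun
    from langchain_core.language_models.chat_models import BaseChatModel
    from langchain_core.messages import AIMessage, AIMessageChunk, BaseMessage
    from langchain_core.outputs import ChatGeneration, ChatGenerationChunk, ChatResult

    class EchoChatModel(BaseChatModel):
        """Toy model that echoes the last message back."""

        @property
        def _llm_type(self) -> str:
            return "echo-chat-model"

        def _generate(
            self,
            messages: list[BaseMessage],
            stop: Optional[list[str]] = None,
            run_manager: Optional[CallbackManagerForLLMRun] = None,
            **kwargs: Any,
        ) -> ChatResult:
            text = str(messages[-1].content)
            return ChatResult(generations=[ChatGeneration(message=AIMessage(content=text))])

        def _stream(
            self,
            messages: list[BaseMessage],
            stop: Optional[list[str]] = None,
            run_manager: Optional[CallbackManagerForLLMRun] = None,
            **kwargs: Any,
        ) -> Iterator[ChatGenerationChunk]:
            # Yield the echoed text one character at a time.
            for char in str(messages[-1].content):
                yield ChatGenerationChunk(message=AIMessageChunk(content=char))

    model = EchoChatModel()
    print(model.invoke("hello").content)             # "hello"
    print([c.content for c in model.stream("hi")])   # ["h", "i"]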
@@ -1246,8 +1305,12 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
             **kwargs: Arbitrary additional keyword arguments. These are usually passed
                 to the model provider API call.
 
+        Raises:
+            ValueError: If the generation is not a chat generation.
+
         Returns:
             The model output message.
+
         """
         generation = self.generate(
             [messages], stop=stop, callbacks=callbacks, **kwargs
@@ -1288,6 +1351,7 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
 
         Returns:
             The model output string.
+
         """
         return self.predict(message, stop=stop, **kwargs)
 
@@ -1305,8 +1369,12 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
             **kwargs: Arbitrary additional keyword arguments. These are usually passed
                 to the model provider API call.
 
+        Raises:
+            ValueError: If the output is not a string.
+
         Returns:
             The predicted output string.
+
         """
         stop_ = None if stop is None else list(stop)
         result = self([HumanMessage(content=text)], stop=stop_, **kwargs)
@@ -1382,6 +1450,7 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
 
         Returns:
             A Runnable that returns a message.
+
         """
         raise NotImplementedError
 
@@ -1417,6 +1486,11 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
             will be caught and returned as well. The final output is always a dict
             with keys ``'raw'``, ``'parsed'``, and ``'parsing_error'``.
 
+        Raises:
+            ValueError: If there are any unsupported ``kwargs``.
+            NotImplementedError: If the model does not implement
+                ``with_structured_output()``.
+
         Returns:
             A Runnable that takes same inputs as a :class:`langchain_core.language_models.chat.BaseChatModel`.
 
@@ -1436,15 +1510,20 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
 
                 from pydantic import BaseModel
 
+
                 class AnswerWithJustification(BaseModel):
                     '''An answer to the user question along with justification for the answer.'''
+
                     answer: str
                     justification: str
 
+
                 llm = ChatModel(model="model-name", temperature=0)
                 structured_llm = llm.with_structured_output(AnswerWithJustification)
 
-                structured_llm.invoke("What weighs more a pound of bricks or a pound of feathers")
+                structured_llm.invoke(
+                    "What weighs more a pound of bricks or a pound of feathers"
+                )
 
                 # -> AnswerWithJustification(
                 #     answer='They weigh the same',
@@ -1456,15 +1535,22 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
 
                 from pydantic import BaseModel
 
+
                 class AnswerWithJustification(BaseModel):
                     '''An answer to the user question along with justification for the answer.'''
+
                     answer: str
                     justification: str
 
+
                 llm = ChatModel(model="model-name", temperature=0)
-                structured_llm = llm.with_structured_output(AnswerWithJustification, include_raw=True)
+                structured_llm = llm.with_structured_output(
+                    AnswerWithJustification, include_raw=True
+                )
 
-                structured_llm.invoke("What weighs more a pound of bricks or a pound of feathers")
+                structured_llm.invoke(
+                    "What weighs more a pound of bricks or a pound of feathers"
+                )
                 # -> {
                 #     'raw': AIMessage(content='', additional_kwargs={'tool_calls': [{'id': 'call_Ao02pnFYXD6GN1yzc0uXPsvF', 'function': {'arguments': '{"answer":"They weigh the same.","justification":"Both a pound of bricks and a pound of feathers weigh one pound. The weight is the same, but the volume or density of the objects may differ."}', 'name': 'AnswerWithJustification'}, 'type': 'function'}]}),
                 #     'parsed': AnswerWithJustification(answer='They weigh the same.', justification='Both a pound of bricks and a pound of feathers weigh one pound. The weight is the same, but the volume or density of the objects may differ.'),
@@ -1477,16 +1563,21 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
                 from pydantic import BaseModel
                 from langchain_core.utils.function_calling import convert_to_openai_tool
 
+
                 class AnswerWithJustification(BaseModel):
                     '''An answer to the user question along with justification for the answer.'''
+
                     answer: str
                     justification: str
 
+
                 dict_schema = convert_to_openai_tool(AnswerWithJustification)
                 llm = ChatModel(model="model-name", temperature=0)
                 structured_llm = llm.with_structured_output(dict_schema)
 
-                structured_llm.invoke("What weighs more a pound of bricks or a pound of feathers")
+                structured_llm.invoke(
+                    "What weighs more a pound of bricks or a pound of feathers"
+                )
                 # -> {
                 #     'answer': 'They weigh the same',
                 #     'justification': 'Both a pound of bricks and a pound of feathers weigh one pound. The weight is the same, but the volume and density of the two substances differ.'
@@ -1503,11 +1594,6 @@ class BaseChatModel(BaseLanguageModel[BaseMessage], ABC):
             msg = f"Received unsupported arguments {kwargs}"
             raise ValueError(msg)
 
-        from langchain_core.output_parsers.openai_tools import (
-            JsonOutputKeyToolsParser,
-            PydanticToolsParser,
-        )
-
         if type(self).bind_tools is BaseChatModel.bind_tools:
             msg = "with_structured_output is not implemented for this model."
             raise NotImplementedError(msg)
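This hunk drops the function-local import of the tool-output parsers; they are now imported at module level in the first hunk above. For context, the default with_structured_output path composes bind_tools with one of these parsers. A hedged sketch of roughly that composition done by hand (illustrative only, not the exact internals; llm is assumed to be a chat model that supports tool calling):

    from pydantic import BaseModel

    from langchain_core.output_parsers.openai_tools import PydanticToolsParser

    class Answer(BaseModel):
        answer: str
        justification: str

    # Bind the schema as a tool, then parse the resulting tool call back
    # into the Pydantic model.
    chain = llm.bind_tools([Answer]) | PydanticToolsParser(
        tools=[Answer], first_tool_only=True
    )
    # chain.invoke("What weighs more, a pound of bricks or a pound of feathers?")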
@@ -1544,8 +1630,10 @@
 class SimpleChatModel(BaseChatModel):
     """Simplified implementation for a chat model to inherit from.
 
-    **Note** This implementation is primarily here for backwards compatibility.
-    For new implementations, please use `BaseChatModel` directly.
+    .. note::
+        This implementation is primarily here for backwards compatibility. For new
+        implementations, please use ``BaseChatModel`` directly.
+
     """
 
     def _generate(
langchain_core/language_models/fake_chat_models.py:

@@ -75,12 +75,13 @@ class FakeListChatModel(SimpleChatModel):
     @override
     def _call(
         self,
-        messages: list[BaseMessage],
-        stop: Optional[list[str]] = None,
-        run_manager: Optional[CallbackManagerForLLMRun] = None,
+        *args: Any,
         **kwargs: Any,
     ) -> str:
-        """First try to lookup in queries, else return 'foo' or 'bar'."""
+        """Return the next response in the list.
+
+        Cycle back to the start if at the end.
+        """
         if self.sleep is not None:
             time.sleep(self.sleep)
         response = self.responses[self.i]
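A hedged usage sketch of the cycling behavior the new docstring describes (illustrative; assumes langchain-core is installed):

    from langchain_core.language_models.fake_chat_models import FakeListChatModel

    model = FakeListChatModel(responses=["a", "b"])
    print(model.invoke("first").content)   # "a"
    print(model.invoke("second").content)  # "b"
    print(model.invoke("third").content)   # cycles back to "a"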
@@ -223,11 +224,12 @@ class GenericFakeChatModel(BaseChatModel):
     This can be expanded to accept other types like Callables / dicts / strings
     to make the interface more generic if needed.
 
-    Note: if you want to pass a list, you can use `iter` to convert it to an iterator.
+    .. note::
+        if you want to pass a list, you can use ``iter`` to convert it to an iterator.
 
-    Please note that streaming is not implemented yet. We should try to implement it
-    in the future by delegating to invoke and then breaking the resulting output
-    into message chunks.
+    .. warning::
+        Streaming is not implemented yet. We should try to implement it in the future by
+        delegating to invoke and then breaking the resulting output into message chunks.
     """
 
     @override
@@ -238,7 +240,6 @@ class GenericFakeChatModel(BaseChatModel):
         run_manager: Optional[CallbackManagerForLLMRun] = None,
         **kwargs: Any,
     ) -> ChatResult:
-        """Top Level call."""
         message = next(self.messages)
         message_ = AIMessage(content=message) if isinstance(message, str) else message
         generation = ChatGeneration(message=message_)
@@ -251,7 +252,6 @@ class GenericFakeChatModel(BaseChatModel):
         run_manager: Optional[CallbackManagerForLLMRun] = None,
         **kwargs: Any,
     ) -> Iterator[ChatGenerationChunk]:
-        """Stream the output of the model."""
         chat_result = self._generate(
             messages, stop=stop, run_manager=run_manager, **kwargs
         )
@@ -361,7 +361,6 @@ class ParrotFakeChatModel(BaseChatModel):
         run_manager: Optional[CallbackManagerForLLMRun] = None,
         **kwargs: Any,
     ) -> ChatResult:
-        """Top Level call."""
         return ChatResult(generations=[ChatGeneration(message=messages[-1])])
 
     @property
langchain_core/language_models/llms.py:

@@ -131,6 +131,7 @@ def create_base_retry_decorator(
 
 def _resolve_cache(*, cache: Union[BaseCache, bool, None]) -> Optional[BaseCache]:
     """Resolve the cache."""
+    llm_cache: Optional[BaseCache]
     if isinstance(cache, BaseCache):
         llm_cache = cache
     elif cache is None:
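The added line pre-declares llm_cache so a type checker sees one Optional[BaseCache] type across the branches that follow (instance, None, True, False). A hedged generic sketch of the same pattern (illustrative, not the function's full body):

    from typing import Optional

    def resolve(flag: Optional[bool]) -> Optional[str]:
        resolved: Optional[str]  # declare once so every branch narrows the same name
        if flag is True:
            resolved = "enabled"
        elif flag is False:
            resolved = None
        else:
            resolved = "default"
        return resolved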
@@ -663,7 +664,18 @@ class BaseLLM(BaseLanguageModel[str], ABC):
         run_manager: Optional[CallbackManagerForLLMRun] = None,
         **kwargs: Any,
     ) -> LLMResult:
-        """Run the LLM on the given prompts."""
+        """Run the LLM on the given prompts.
+
+        Args:
+            prompts: The prompts to generate from.
+            stop: Stop words to use when generating. Model output is cut off at the
+                first occurrence of any of the stop substrings.
+                If stop tokens are not supported consider raising NotImplementedError.
+            run_manager: Callback manager for the run.
+
+        Returns:
+            The LLM result.
+        """
 
     async def _agenerate(
         self,
@@ -672,7 +684,18 @@ class BaseLLM(BaseLanguageModel[str], ABC):
         run_manager: Optional[AsyncCallbackManagerForLLMRun] = None,
         **kwargs: Any,
     ) -> LLMResult:
-        """Run the LLM on the given prompts."""
+        """Run the LLM on the given prompts.
+
+        Args:
+            prompts: The prompts to generate from.
+            stop: Stop words to use when generating. Model output is cut off at the
+                first occurrence of any of the stop substrings.
+                If stop tokens are not supported consider raising NotImplementedError.
+            run_manager: Callback manager for the run.
+
+        Returns:
+            The LLM result.
+        """
         return await run_in_executor(
             None,
             self._generate,
@@ -705,8 +728,8 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             **kwargs: Arbitrary additional keyword arguments. These are usually passed
                 to the model provider API call.
 
-        Returns:
-            An iterator of GenerationChunks.
+        Yields:
+            Generation chunks.
         """
         raise NotImplementedError
 
@@ -731,8 +754,8 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             **kwargs: Arbitrary additional keyword arguments. These are usually passed
                 to the model provider API call.
 
-        Returns:
-            An async iterator of GenerationChunks.
+        Yields:
+            Generation chunks.
         """
         iterator = await run_in_executor(
             None,
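The BaseLLM hooks above mirror the chat-model hooks: _generate/_agenerate return an LLMResult, while _stream/_astream yield generation chunks. A hedged sketch of the simplest way to satisfy them, via the LLM convenience class that only requires _call (illustrative; ReverseLLM is an assumed name):

    from typing import Any, Optional

    from langchain_core.callbacks import CallbackManagerForLLMRun
    from langchain_core.language_models.llms import LLM

    class ReverseLLM(LLM):
        """Toy completion model that reverses the prompt."""

        @property
        def _llm_type(self) -> str:
            return "reverse-llm"

        def _call(
            self,
            prompt: str,
            stop: Optional[list[str]] = None,
            run_manager: Optional[CallbackManagerForLLMRun] = None,
            **kwargs: Any,
        ) -> str:
            return prompt[::-1]

    model = ReverseLLM()
    print(model.invoke("stressed"))  # "desserts"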
@@ -830,10 +853,11 @@ class BaseLLM(BaseLanguageModel[str], ABC):
         API.
 
         Use this method when you want to:
-            1. take advantage of batched calls,
-            2. need more output from the model than just the top generated value,
-            3. are building chains that are agnostic to the underlying language model
-                type (e.g., pure text completion models vs chat models).
+
+        1. Take advantage of batched calls,
+        2. Need more output from the model than just the top generated value,
+        3. Are building chains that are agnostic to the underlying language model
+           type (e.g., pure text completion models vs chat models).
 
         Args:
             prompts: List of string prompts.
@@ -853,6 +877,11 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             **kwargs: Arbitrary additional keyword arguments. These are usually passed
                 to the model provider API call.
 
+        Raises:
+            ValueError: If prompts is not a list.
+            ValueError: If the length of ``callbacks``, ``tags``, ``metadata``, or
+                ``run_name`` (if provided) does not match the length of prompts.
+
         Returns:
             An LLMResult, which contains a list of candidate Generations for each input
                 prompt and additional model provider-specific output.
@@ -1090,10 +1119,11 @@ class BaseLLM(BaseLanguageModel[str], ABC):
         API.
 
         Use this method when you want to:
-            1. take advantage of batched calls,
-            2. need more output from the model than just the top generated value,
-            3. are building chains that are agnostic to the underlying language model
-                type (e.g., pure text completion models vs chat models).
+
+        1. Take advantage of batched calls,
+        2. Need more output from the model than just the top generated value,
+        3. Are building chains that are agnostic to the underlying language model
+           type (e.g., pure text completion models vs chat models).
 
         Args:
             prompts: List of string prompts.
@@ -1113,6 +1143,10 @@ class BaseLLM(BaseLanguageModel[str], ABC):
             **kwargs: Arbitrary additional keyword arguments. These are usually passed
                 to the model provider API call.
 
+        Raises:
+            ValueError: If the length of ``callbacks``, ``tags``, ``metadata``, or
+                ``run_name`` (if provided) does not match the length of prompts.
+
         Returns:
             An LLMResult, which contains a list of candidate Generations for each input
                 prompt and additional model provider-specific output.
@@ -1388,7 +1422,7 @@ class BaseLLM(BaseLanguageModel[str], ABC):
         return AIMessage(content=content)
 
     def __str__(self) -> str:
-        """Get a string representation of the object for printing."""
+        """Return a string representation of the object for printing."""
         cls_name = f"\033[1m{self.__class__.__name__}\033[0m"
         return f"{cls_name}\nParams: {self._identifying_params}"
 
@@ -1536,7 +1570,6 @@ class LLM(BaseLLM):
         run_manager: Optional[CallbackManagerForLLMRun] = None,
         **kwargs: Any,
     ) -> LLMResult:
-        """Run the LLM on the given prompt and input."""
         # TODO: add caching here.
         generations = []
         new_arg_supported = inspect.signature(self._call).parameters.get("run_manager")
@@ -1556,7 +1589,6 @@ class LLM(BaseLLM):
         run_manager: Optional[AsyncCallbackManagerForLLMRun] = None,
         **kwargs: Any,
     ) -> LLMResult:
-        """Async run the LLM on the given prompt and input."""
         generations = []
         new_arg_supported = inspect.signature(self._acall).parameters.get("run_manager")
         for prompt in prompts: