PyPI - langchain-core - Versions diffs - 1.0.0a8__py3-none-any.whl → 1.0.0rc2__py3-none-any.whl - Mend

langchain-core 1.0.0a8__py3-none-any.whl → 1.0.0rc2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of langchain-core might be problematic. Click here for more details.

Files changed (142) hide show

langchain_core/__init__.py +1 -1
langchain_core/_api/__init__.py +0 -1
langchain_core/_api/beta_decorator.py +17 -20
langchain_core/_api/deprecation.py +30 -35
langchain_core/_import_utils.py +1 -1
langchain_core/agents.py +10 -9
langchain_core/caches.py +46 -56
langchain_core/callbacks/__init__.py +1 -8
langchain_core/callbacks/base.py +232 -243
langchain_core/callbacks/file.py +33 -33
langchain_core/callbacks/manager.py +353 -416
langchain_core/callbacks/stdout.py +21 -22
langchain_core/callbacks/streaming_stdout.py +32 -32
langchain_core/callbacks/usage.py +54 -51
langchain_core/chat_history.py +43 -58
langchain_core/document_loaders/base.py +21 -21
langchain_core/document_loaders/langsmith.py +22 -22
langchain_core/documents/__init__.py +0 -1
langchain_core/documents/base.py +46 -49
langchain_core/documents/transformers.py +28 -29
langchain_core/embeddings/fake.py +50 -54
langchain_core/example_selectors/semantic_similarity.py +4 -6
langchain_core/exceptions.py +7 -8
langchain_core/indexing/api.py +19 -25
langchain_core/indexing/base.py +24 -24
langchain_core/language_models/__init__.py +11 -27
langchain_core/language_models/_utils.py +53 -54
langchain_core/language_models/base.py +30 -24
langchain_core/language_models/chat_models.py +123 -148
langchain_core/language_models/fake_chat_models.py +7 -7
langchain_core/language_models/llms.py +14 -16
langchain_core/load/dump.py +3 -4
langchain_core/load/load.py +7 -16
langchain_core/load/serializable.py +37 -36
langchain_core/messages/__init__.py +1 -16
langchain_core/messages/ai.py +122 -123
langchain_core/messages/base.py +31 -31
langchain_core/messages/block_translators/__init__.py +17 -17
langchain_core/messages/block_translators/anthropic.py +3 -3
langchain_core/messages/block_translators/bedrock_converse.py +3 -3
langchain_core/messages/block_translators/google_genai.py +5 -4
langchain_core/messages/block_translators/google_vertexai.py +4 -32
langchain_core/messages/block_translators/groq.py +117 -21
langchain_core/messages/block_translators/langchain_v0.py +3 -3
langchain_core/messages/block_translators/openai.py +5 -5
langchain_core/messages/chat.py +2 -6
langchain_core/messages/content.py +222 -209
langchain_core/messages/function.py +6 -10
langchain_core/messages/human.py +17 -24
langchain_core/messages/modifier.py +2 -2
langchain_core/messages/system.py +12 -22
langchain_core/messages/tool.py +53 -69
langchain_core/messages/utils.py +399 -417
langchain_core/output_parsers/__init__.py +1 -14
langchain_core/output_parsers/base.py +46 -47
langchain_core/output_parsers/json.py +3 -4
langchain_core/output_parsers/list.py +2 -2
langchain_core/output_parsers/openai_functions.py +46 -44
langchain_core/output_parsers/openai_tools.py +11 -16
langchain_core/output_parsers/pydantic.py +10 -11
langchain_core/output_parsers/string.py +2 -2
langchain_core/output_parsers/transform.py +2 -2
langchain_core/output_parsers/xml.py +1 -1
langchain_core/outputs/__init__.py +1 -1
langchain_core/outputs/chat_generation.py +14 -14
langchain_core/outputs/generation.py +6 -6
langchain_core/outputs/llm_result.py +5 -5
langchain_core/prompt_values.py +11 -11
langchain_core/prompts/__init__.py +3 -23
langchain_core/prompts/base.py +33 -38
langchain_core/prompts/chat.py +222 -229
langchain_core/prompts/dict.py +3 -3
langchain_core/prompts/few_shot.py +76 -83
langchain_core/prompts/few_shot_with_templates.py +7 -9
langchain_core/prompts/image.py +12 -14
langchain_core/prompts/loading.py +1 -1
langchain_core/prompts/message.py +3 -3
langchain_core/prompts/prompt.py +20 -23
langchain_core/prompts/string.py +20 -8
langchain_core/prompts/structured.py +26 -27
langchain_core/rate_limiters.py +50 -58
langchain_core/retrievers.py +41 -182
langchain_core/runnables/base.py +565 -597
langchain_core/runnables/branch.py +8 -8
langchain_core/runnables/config.py +37 -44
langchain_core/runnables/configurable.py +9 -10
langchain_core/runnables/fallbacks.py +9 -9
langchain_core/runnables/graph.py +46 -50
langchain_core/runnables/graph_ascii.py +19 -18
langchain_core/runnables/graph_mermaid.py +20 -31
langchain_core/runnables/graph_png.py +7 -7
langchain_core/runnables/history.py +22 -22
langchain_core/runnables/passthrough.py +11 -11
langchain_core/runnables/retry.py +3 -3
langchain_core/runnables/router.py +2 -2
langchain_core/runnables/schema.py +33 -33
langchain_core/runnables/utils.py +30 -34
langchain_core/stores.py +72 -102
langchain_core/sys_info.py +27 -29
langchain_core/tools/__init__.py +1 -14
langchain_core/tools/base.py +70 -71
langchain_core/tools/convert.py +100 -104
langchain_core/tools/render.py +9 -9
langchain_core/tools/retriever.py +7 -7
langchain_core/tools/simple.py +6 -7
langchain_core/tools/structured.py +18 -24
langchain_core/tracers/__init__.py +1 -9
langchain_core/tracers/base.py +35 -35
langchain_core/tracers/context.py +12 -17
langchain_core/tracers/event_stream.py +3 -3
langchain_core/tracers/langchain.py +8 -8
langchain_core/tracers/log_stream.py +17 -18
langchain_core/tracers/memory_stream.py +3 -3
langchain_core/tracers/root_listeners.py +2 -2
langchain_core/tracers/schemas.py +0 -129
langchain_core/tracers/stdout.py +1 -2
langchain_core/utils/__init__.py +1 -1
langchain_core/utils/aiter.py +32 -32
langchain_core/utils/env.py +5 -5
langchain_core/utils/function_calling.py +59 -154
langchain_core/utils/html.py +4 -4
langchain_core/utils/input.py +3 -3
langchain_core/utils/interactive_env.py +1 -1
langchain_core/utils/iter.py +20 -20
langchain_core/utils/json.py +1 -1
langchain_core/utils/json_schema.py +2 -2
langchain_core/utils/mustache.py +5 -5
langchain_core/utils/pydantic.py +17 -17
langchain_core/utils/strings.py +5 -5
langchain_core/utils/utils.py +25 -28
langchain_core/vectorstores/base.py +55 -87
langchain_core/vectorstores/in_memory.py +83 -85
langchain_core/vectorstores/utils.py +2 -2
langchain_core/version.py +1 -1
{langchain_core-1.0.0a8.dist-info → langchain_core-1.0.0rc2.dist-info}/METADATA +23 -11
langchain_core-1.0.0rc2.dist-info/RECORD +172 -0
langchain_core/memory.py +0 -120
langchain_core/pydantic_v1/__init__.py +0 -30
langchain_core/pydantic_v1/dataclasses.py +0 -23
langchain_core/pydantic_v1/main.py +0 -23
langchain_core-1.0.0a8.dist-info/RECORD +0 -176
{langchain_core-1.0.0a8.dist-info → langchain_core-1.0.0rc2.dist-info}/WHEEL +0 -0

langchain_core/messages/utils.py CHANGED Viewed

@@ -5,7 +5,6 @@ Some examples of what you can do with these functions include:
 * Convert messages to strings (serialization)
 * Convert messages from dicts to Message objects (deserialization)
 * Filter messages from a list of messages based on name, type or id etc.
 """
 from __future__ import annotations
@@ -87,6 +86,7 @@ AnyMessage = Annotated[
     | Annotated[ToolMessageChunk, Tag(tag="ToolMessageChunk")],
     Field(discriminator=Discriminator(_get_type)),
 ]
+"""A type representing any defined `Message` or `MessageChunk` type."""
 def get_buffer_string(
@@ -96,10 +96,8 @@ def get_buffer_string(
     Args:
         messages: Messages to be converted to strings.
-        human_prefix: The prefix to prepend to contents of ``HumanMessage``s.
-            Default is ``'Human'``.
-        ai_prefix: The prefix to prepend to contents of ``AIMessage``. Default is
-            ``'AI'``.
+        human_prefix: The prefix to prepend to contents of `HumanMessage`s.
+        ai_prefix: The prefix to prepend to contents of `AIMessage`.
     Returns:
         A single string concatenation of all input messages.
@@ -108,17 +106,16 @@ def get_buffer_string(
         ValueError: If an unsupported message type is encountered.
     Example:
-        .. code-block:: python
-            from langchain_core import AIMessage, HumanMessage
-            messages = [
-                HumanMessage(content="Hi, how are you?"),
-                AIMessage(content="Good, how are you?"),
-            ]
-            get_buffer_string(messages)
-            # -> "Human: Hi, how are you?\nAI: Good, how are you?"
+        ```python
+        from langchain_core import AIMessage, HumanMessage
+        messages = [
+            HumanMessage(content="Hi, how are you?"),
+            AIMessage(content="Good, how are you?"),
+        ]
+        get_buffer_string(messages)
+        # -> "Human: Hi, how are you?\nAI: Good, how are you?"
+        ```
     """
     string_messages = []
     for m in messages:
@@ -178,7 +175,7 @@ def _message_from_dict(message: dict) -> BaseMessage:
 def messages_from_dict(messages: Sequence[dict]) -> list[BaseMessage]:
-    """Convert a sequence of messages from dicts to ``Message`` objects.
+    """Convert a sequence of messages from dicts to `Message` objects.
     Args:
         messages: Sequence of messages (as dicts) to convert.
@@ -191,7 +188,7 @@ def messages_from_dict(messages: Sequence[dict]) -> list[BaseMessage]:
 def message_chunk_to_message(chunk: BaseMessage) -> BaseMessage:
-    """Convert a message chunk to a ``Message``.
+    """Convert a message chunk to a `Message`.
     Args:
         chunk: Message chunk to convert.
@@ -213,6 +210,7 @@ def message_chunk_to_message(chunk: BaseMessage) -> BaseMessage:
 MessageLikeRepresentation = (
     BaseMessage | list[str] | tuple[str, str] | str | dict[str, Any]
 )
+"""A type representing the various ways a message can be represented."""
 def _create_message_from_message_type(
@@ -224,24 +222,24 @@ def _create_message_from_message_type(
     id: str | None = None,
     **additional_kwargs: Any,
 ) -> BaseMessage:
-    """Create a message from a ``Message`` type and content string.
+    """Create a message from a `Message` type and content string.
     Args:
-        message_type: (str) the type of the message (e.g., ``'human'``, ``'ai'``, etc.).
+        message_type: (str) the type of the message (e.g., `'human'`, `'ai'`, etc.).
         content: (str) the content string.
-        name: (str) the name of the message. Default is None.
-        tool_call_id: (str) the tool call id. Default is None.
-        tool_calls: (list[dict[str, Any]]) the tool calls. Default is None.
-        id: (str) the id of the message. Default is None.
+        name: (str) the name of the message.
+        tool_call_id: (str) the tool call id.
+        tool_calls: (list[dict[str, Any]]) the tool calls.
+        id: (str) the id of the message.
         additional_kwargs: (dict[str, Any]) additional keyword arguments.
     Returns:
         a message of the appropriate type.
     Raises:
-        ValueError: if the message type is not one of ``'human'``, ``'user'``, ``'ai'``,
-            ``'assistant'``, ``'function'``, ``'tool'``, ``'system'``, or
-            ``'developer'``.
+        ValueError: if the message type is not one of `'human'`, `'user'`, `'ai'`,
+            `'assistant'`, `'function'`, `'tool'`, `'system'`, or
+            `'developer'`.
     """
     kwargs: dict[str, Any] = {}
     if name is not None:
@@ -307,21 +305,21 @@ def _create_message_from_message_type(
 def _convert_to_message(message: MessageLikeRepresentation) -> BaseMessage:
-    """Instantiate a ``Message`` from a variety of message formats.
+    """Instantiate a `Message` from a variety of message formats.
     The message format can be one of the following:
-    - ``BaseMessagePromptTemplate``
-    - ``BaseMessage``
-    - 2-tuple of (role string, template); e.g., (``'human'``, ``'{user_input}'``)
+    - `BaseMessagePromptTemplate`
+    - `BaseMessage`
+    - 2-tuple of (role string, template); e.g., (`'human'`, `'{user_input}'`)
     - dict: a message dict with role and content keys
-    - string: shorthand for (``'human'``, template); e.g., ``'{user_input}'``
+    - string: shorthand for (`'human'`, template); e.g., `'{user_input}'`
     Args:
         message: a representation of a message in one of the supported formats.
     Returns:
-        an instance of a message or a message template.
+        An instance of a message or a message template.
     Raises:
         NotImplementedError: if the message type is not supported.
@@ -423,79 +421,78 @@ def filter_messages(
     exclude_ids: Sequence[str] | None = None,
     exclude_tool_calls: Sequence[str] | bool | None = None,
 ) -> list[BaseMessage]:
-    """Filter messages based on ``name``, ``type`` or ``id``.
+    """Filter messages based on `name`, `type` or `id`.
     Args:
         messages: Sequence Message-like objects to filter.
-        include_names: Message names to include. Default is None.
-        exclude_names: Messages names to exclude. Default is None.
+        include_names: Message names to include.
+        exclude_names: Message names to exclude.
         include_types: Message types to include. Can be specified as string names
-            (e.g. ``'system'``, ``'human'``, ``'ai'``, ...) or as ``BaseMessage``
-            classes (e.g. ``SystemMessage``, ``HumanMessage``, ``AIMessage``, ...).
-            Default is None.
+            (e.g. `'system'`, `'human'`, `'ai'`, ...) or as `BaseMessage`
+            classes (e.g. `SystemMessage`, `HumanMessage`, `AIMessage`, ...).
         exclude_types: Message types to exclude. Can be specified as string names
-            (e.g. ``'system'``, ``'human'``, ``'ai'``, ...) or as ``BaseMessage``
-            classes (e.g. ``SystemMessage``, ``HumanMessage``, ``AIMessage``, ...).
-            Default is None.
-        include_ids: Message IDs to include. Default is None.
-        exclude_ids: Message IDs to exclude. Default is None.
-        exclude_tool_calls: Tool call IDs to exclude. Default is None.
+            (e.g. `'system'`, `'human'`, `'ai'`, ...) or as `BaseMessage`
+            classes (e.g. `SystemMessage`, `HumanMessage`, `AIMessage`, ...).
+        include_ids: Message IDs to include.
+        exclude_ids: Message IDs to exclude.
+        exclude_tool_calls: Tool call IDs to exclude.
             Can be one of the following:
-            - ``True``: all ``AIMessage``s with tool calls and all
-              ``ToolMessage``s will be excluded.
+            - `True`: all `AIMessage`s with tool calls and all
+                `ToolMessage` objects will be excluded.
             - a sequence of tool call IDs to exclude:
-              - ``ToolMessage``s with the corresponding tool call ID will be
-                excluded.
-              - The ``tool_calls`` in the AIMessage will be updated to exclude
-                matching tool calls. If all ``tool_calls`` are filtered from an
-                AIMessage, the whole message is excluded.
+                - `ToolMessage` objects with the corresponding tool call ID will be
+                    excluded.
+                - The `tool_calls` in the AIMessage will be updated to exclude
+                    matching tool calls. If all `tool_calls` are filtered from an
+                    AIMessage, the whole message is excluded.
     Returns:
-        A list of Messages that meets at least one of the ``incl_*`` conditions and none
-        of the ``excl_*`` conditions. If not ``incl_*`` conditions are specified then
+        A list of Messages that meets at least one of the `incl_*` conditions and none
+        of the `excl_*` conditions. If no `incl_*` conditions are specified then
         anything that is not explicitly excluded will be included.
     Raises:
         ValueError: If two incompatible arguments are provided.
     Example:
-        .. code-block:: python
-            from langchain_core.messages import (
-                filter_messages,
-                AIMessage,
-                HumanMessage,
-                SystemMessage,
-            )
-            messages = [
-                SystemMessage("you're a good assistant."),
-                HumanMessage("what's your name", id="foo", name="example_user"),
-                AIMessage("steve-o", id="bar", name="example_assistant"),
-                HumanMessage(
-                    "what's your favorite color",
-                    id="baz",
-                ),
-                AIMessage(
-                    "silicon blue",
-                    id="blah",
-                ),
-            ]
-            filter_messages(
-                messages,
-                incl_names=("example_user", "example_assistant"),
-                incl_types=("system",),
-                excl_ids=("bar",),
-            )
-        .. code-block:: python
-            [
-                SystemMessage("you're a good assistant."),
-                HumanMessage("what's your name", id="foo", name="example_user"),
-            ]
+        ```python
+        from langchain_core.messages import (
+            filter_messages,
+            AIMessage,
+            HumanMessage,
+            SystemMessage,
+        )
+        messages = [
+            SystemMessage("you're a good assistant."),
+            HumanMessage("what's your name", id="foo", name="example_user"),
+            AIMessage("steve-o", id="bar", name="example_assistant"),
+            HumanMessage(
+                "what's your favorite color",
+                id="baz",
+            ),
+            AIMessage(
+                "silicon blue",
+                id="blah",
+            ),
+        ]
+        filter_messages(
+            messages,
+            incl_names=("example_user", "example_assistant"),
+            incl_types=("system",),
+            excl_ids=("bar",),
+        )
+        ```
+        ```python
+        [
+            SystemMessage("you're a good assistant."),
+            HumanMessage("what's your name", id="foo", name="example_user"),
+        ]
+        ```
     """
     messages = convert_to_messages(messages)
     filtered: list[BaseMessage] = []
@@ -565,13 +562,12 @@ def merge_message_runs(
     r"""Merge consecutive Messages of the same type.
     !!! note
-        ToolMessages are not merged, as each has a distinct tool call id that can't be
-        merged.
+        `ToolMessage` objects are not merged, as each has a distinct tool call id that
+        can't be merged.
     Args:
         messages: Sequence Message-like objects to merge.
         chunk_separator: Specify the string to be inserted between message chunks.
-            Defaults to ``'\n'``.
     Returns:
         list of BaseMessages with consecutive runs of message types merged into single
@@ -579,87 +575,86 @@ def merge_message_runs(
         the merged content is a concatenation of the two strings with a new-line
         separator.
         The separator inserted between message chunks can be controlled by specifying
-        any string with ``chunk_separator``. If at least one of the messages has a list
+        any string with `chunk_separator`. If at least one of the messages has a list
         of content blocks, the merged content is a list of content blocks.
     Example:
+        ```python
+        from langchain_core.messages import (
+            merge_message_runs,
+            AIMessage,
+            HumanMessage,
+            SystemMessage,
+            ToolCall,
+        )
-        .. code-block:: python
-            from langchain_core.messages import (
-                merge_message_runs,
-                AIMessage,
-                HumanMessage,
-                SystemMessage,
-                ToolCall,
-            )
-            messages = [
-                SystemMessage("you're a good assistant."),
-                HumanMessage(
-                    "what's your favorite color",
-                    id="foo",
-                ),
-                HumanMessage(
-                    "wait your favorite food",
-                    id="bar",
-                ),
-                AIMessage(
+        messages = [
+            SystemMessage("you're a good assistant."),
+            HumanMessage(
+                "what's your favorite color",
+                id="foo",
+            ),
+            HumanMessage(
+                "wait your favorite food",
+                id="bar",
+            ),
+            AIMessage(
+                "my favorite colo",
+                tool_calls=[
+                    ToolCall(
+                        name="blah_tool", args={"x": 2}, id="123", type="tool_call"
+                    )
+                ],
+                id="baz",
+            ),
+            AIMessage(
+                [{"type": "text", "text": "my favorite dish is lasagna"}],
+                tool_calls=[
+                    ToolCall(
+                        name="blah_tool",
+                        args={"x": -10},
+                        id="456",
+                        type="tool_call",
+                    )
+                ],
+                id="blur",
+            ),
+        ]
+        merge_message_runs(messages)
+        ```
+        ```python
+        [
+            SystemMessage("you're a good assistant."),
+            HumanMessage(
+                "what's your favorite color\\n"
+                "wait your favorite food", id="foo",
+            ),
+            AIMessage(
+                [
                     "my favorite colo",
-                    tool_calls=[
-                        ToolCall(
-                            name="blah_tool", args={"x": 2}, id="123", type="tool_call"
-                        )
-                    ],
-                    id="baz",
-                ),
-                AIMessage(
-                    [{"type": "text", "text": "my favorite dish is lasagna"}],
-                    tool_calls=[
-                        ToolCall(
-                            name="blah_tool",
-                            args={"x": -10},
-                            id="456",
-                            type="tool_call",
-                        )
-                    ],
-                    id="blur",
-                ),
-            ]
-            merge_message_runs(messages)
-        .. code-block:: python
-            [
-                SystemMessage("you're a good assistant."),
-                HumanMessage(
-                    "what's your favorite color\\n"
-                    "wait your favorite food", id="foo",
-                ),
-                AIMessage(
-                    [
-                        "my favorite colo",
-                        {"type": "text", "text": "my favorite dish is lasagna"}
-                    ],
-                    tool_calls=[
-                        ToolCall({
-                            "name": "blah_tool",
-                            "args": {"x": 2},
-                            "id": "123",
-                            "type": "tool_call"
-                        }),
-                        ToolCall({
-                            "name": "blah_tool",
-                            "args": {"x": -10},
-                            "id": "456",
-                            "type": "tool_call"
-                        })
-                    ]
-                    id="baz"
-                ),
-            ]
+                    {"type": "text", "text": "my favorite dish is lasagna"}
+                ],
+                tool_calls=[
+                    ToolCall({
+                        "name": "blah_tool",
+                        "args": {"x": 2},
+                        "id": "123",
+                        "type": "tool_call"
+                    }),
+                    ToolCall({
+                        "name": "blah_tool",
+                        "args": {"x": -10},
+                        "id": "456",
+                        "type": "tool_call"
+                    })
+                ]
+                id="baz"
+            ),
+        ]
+        ```
     """
     if not messages:
         return []
@@ -706,153 +701,146 @@ def trim_messages(
 ) -> list[BaseMessage]:
     r"""Trim messages to be below a token count.
-    ``trim_messages`` can be used to reduce the size of a chat history to a specified
-    token count or specified message count.
+    `trim_messages` can be used to reduce the size of a chat history to a specified
+    token or message count.
     In either case, if passing the trimmed chat history back into a chat model
     directly, the resulting chat history should usually satisfy the following
     properties:
     1. The resulting chat history should be valid. Most chat models expect that chat
-       history starts with either (1) a ``HumanMessage`` or (2) a ``SystemMessage``
-       followed by a ``HumanMessage``. To achieve this, set ``start_on='human'``.
-       In addition, generally a ``ToolMessage`` can only appear after an ``AIMessage``
-       that involved a tool call.
-       Please see the following link for more information about messages:
-       https://python.langchain.com/docs/concepts/#messages
+        history starts with either (1) a `HumanMessage` or (2) a `SystemMessage`
+        followed by a `HumanMessage`. To achieve this, set `start_on='human'`.
+        In addition, generally a `ToolMessage` can only appear after an `AIMessage`
+        that involved a tool call.
     2. It includes recent messages and drops old messages in the chat history.
-       To achieve this set the ``strategy='last'``.
-    3. Usually, the new chat history should include the ``SystemMessage`` if it
-       was present in the original chat history since the ``SystemMessage`` includes
-       special instructions to the chat model. The ``SystemMessage`` is almost always
-       the first message in the history if present. To achieve this set the
-       ``include_system=True``.
+        To achieve this set the `strategy='last'`.
+    3. Usually, the new chat history should include the `SystemMessage` if it
+        was present in the original chat history since the `SystemMessage` includes
+        special instructions to the chat model. The `SystemMessage` is almost always
+        the first message in the history if present. To achieve this set the
+        `include_system=True`.
     !!! note
-        The examples below show how to configure ``trim_messages`` to achieve a behavior
+        The examples below show how to configure `trim_messages` to achieve a behavior
         consistent with the above properties.
     Args:
         messages: Sequence of Message-like objects to trim.
         max_tokens: Max token count of trimmed messages.
-        token_counter: Function or llm for counting tokens in a ``BaseMessage`` or a
-            list of ``BaseMessage``. If a ``BaseLanguageModel`` is passed in then
-            ``BaseLanguageModel.get_num_tokens_from_messages()`` will be used.
-            Set to ``len`` to count the number of **messages** in the chat history.
+        token_counter: Function or llm for counting tokens in a `BaseMessage` or a
+            list of `BaseMessage`. If a `BaseLanguageModel` is passed in then
+            `BaseLanguageModel.get_num_tokens_from_messages()` will be used.
+            Set to `len` to count the number of **messages** in the chat history.
             !!! note
-                Use ``count_tokens_approximately`` to get fast, approximate token
+                Use `count_tokens_approximately` to get fast, approximate token
                 counts.
-                This is recommended for using ``trim_messages`` on the hot path, where
+                This is recommended for using `trim_messages` on the hot path, where
                 exact token counting is not necessary.
         strategy: Strategy for trimming.
-            - ``'first'``: Keep the first ``<= n_count`` tokens of the messages.
-            - ``'last'``: Keep the last ``<= n_count`` tokens of the messages.
-            Default is ``'last'``.
+            - `'first'`: Keep the first `<= n_count` tokens of the messages.
+            - `'last'`: Keep the last `<= n_count` tokens of the messages.
         allow_partial: Whether to split a message if only part of the message can be
-            included. If ``strategy='last'`` then the last partial contents of a message
-            are included. If ``strategy='first'`` then the first partial contents of a
+            included. If `strategy='last'` then the last partial contents of a message
+            are included. If `strategy='first'` then the first partial contents of a
             message are included.
-            Default is False.
         end_on: The message type to end on. If specified then every message after the
-            last occurrence of this type is ignored. If ``strategy='last'`` then this
-            is done before we attempt to get the last ``max_tokens``. If
-            ``strategy='first'`` then this is done after we get the first
-            ``max_tokens``. Can be specified as string names (e.g. ``'system'``,
-            ``'human'``, ``'ai'``, ...) or as ``BaseMessage`` classes (e.g.
-            ``SystemMessage``, ``HumanMessage``, ``AIMessage``, ...). Can be a single
+            last occurrence of this type is ignored. If `strategy='last'` then this
+            is done before we attempt to get the last `max_tokens`. If
+            `strategy='first'` then this is done after we get the first
+            `max_tokens`. Can be specified as string names (e.g. `'system'`,
+            `'human'`, `'ai'`, ...) or as `BaseMessage` classes (e.g.
+            `SystemMessage`, `HumanMessage`, `AIMessage`, ...). Can be a single
             type or a list of types.
-            Default is None.
         start_on: The message type to start on. Should only be specified if
-            ``strategy='last'``. If specified then every message before
+            `strategy='last'`. If specified then every message before
             the first occurrence of this type is ignored. This is done after we trim
-            the initial messages to the last ``max_tokens``. Does not
-            apply to a ``SystemMessage`` at index 0 if ``include_system=True``. Can be
-            specified as string names (e.g. ``'system'``, ``'human'``, ``'ai'``, ...) or
-            as ``BaseMessage`` classes (e.g. ``SystemMessage``, ``HumanMessage``,
-            ``AIMessage``, ...). Can be a single type or a list of types.
-            Default is None.
-        include_system: Whether to keep the SystemMessage if there is one at index 0.
-            Should only be specified if ``strategy="last"``.
-            Default is False.
-        text_splitter: Function or ``langchain_text_splitters.TextSplitter`` for
+            the initial messages to the last `max_tokens`. Does not
+            apply to a `SystemMessage` at index 0 if `include_system=True`. Can be
+            specified as string names (e.g. `'system'`, `'human'`, `'ai'`, ...) or
+            as `BaseMessage` classes (e.g. `SystemMessage`, `HumanMessage`,
+            `AIMessage`, ...). Can be a single type or a list of types.
+        include_system: Whether to keep the `SystemMessage` if there is one at index
+            `0`. Should only be specified if `strategy="last"`.
+        text_splitter: Function or `langchain_text_splitters.TextSplitter` for
             splitting the string contents of a message. Only used if
-            ``allow_partial=True``. If ``strategy='last'`` then the last split tokens
-            from a partial message will be included. if ``strategy='first'`` then the
+            `allow_partial=True`. If `strategy='last'` then the last split tokens
+            from a partial message will be included. if `strategy='first'` then the
             first split tokens from a partial message will be included. Token splitter
             assumes that separators are kept, so that split contents can be directly
             concatenated to recreate the original text. Defaults to splitting on
             newlines.
     Returns:
-        list of trimmed ``BaseMessage``.
+        List of trimmed `BaseMessage`.
     Raises:
         ValueError: if two incompatible arguments are specified or an unrecognized
-            ``strategy`` is specified.
+            `strategy` is specified.
     Example:
-        Trim chat history based on token count, keeping the ``SystemMessage`` if
-        present, and ensuring that the chat history starts with a ``HumanMessage`` (
-        or a ``SystemMessage`` followed by a ``HumanMessage``).
-        .. code-block:: python
-            from langchain_core.messages import (
-                AIMessage,
-                HumanMessage,
-                BaseMessage,
-                SystemMessage,
-                trim_messages,
-            )
-            messages = [
-                SystemMessage(
-                    "you're a good assistant, you always respond with a joke."
-                ),
-                HumanMessage("i wonder why it's called langchain"),
-                AIMessage(
-                    'Well, I guess they thought "WordRope" and "SentenceString" just '
-                    "didn't have the same ring to it!"
-                ),
-                HumanMessage("and who is harrison chasing anyways"),
-                AIMessage(
-                    "Hmmm let me think.\n\nWhy, he's probably chasing after the last "
-                    "cup of coffee in the office!"
-                ),
-                HumanMessage("what do you call a speechless parrot"),
-            ]
-            trim_messages(
-                messages,
-                max_tokens=45,
-                strategy="last",
-                token_counter=ChatOpenAI(model="gpt-4o"),
-                # Most chat models expect that chat history starts with either:
-                # (1) a HumanMessage or
-                # (2) a SystemMessage followed by a HumanMessage
-                start_on="human",
-                # Usually, we want to keep the SystemMessage
-                # if it's present in the original history.
-                # The SystemMessage has special instructions for the model.
-                include_system=True,
-                allow_partial=False,
-            )
+        Trim chat history based on token count, keeping the `SystemMessage` if
+        present, and ensuring that the chat history starts with a `HumanMessage` (
+        or a `SystemMessage` followed by a `HumanMessage`).
+        ```python
+        from langchain_core.messages import (
+            AIMessage,
+            HumanMessage,
+            BaseMessage,
+            SystemMessage,
+            trim_messages,
+        )
-        .. code-block:: python
+        messages = [
+            SystemMessage("you're a good assistant, you always respond with a joke."),
+            HumanMessage("i wonder why it's called langchain"),
+            AIMessage(
+                'Well, I guess they thought "WordRope" and "SentenceString" just '
+                "didn't have the same ring to it!"
+            ),
+            HumanMessage("and who is harrison chasing anyways"),
+            AIMessage(
+                "Hmmm let me think.\n\nWhy, he's probably chasing after the last "
+                "cup of coffee in the office!"
+            ),
+            HumanMessage("what do you call a speechless parrot"),
+        ]
+        trim_messages(
+            messages,
+            max_tokens=45,
+            strategy="last",
+            token_counter=ChatOpenAI(model="gpt-4o"),
+            # Most chat models expect that chat history starts with either:
+            # (1) a HumanMessage or
+            # (2) a SystemMessage followed by a HumanMessage
+            start_on="human",
+            # Usually, we want to keep the SystemMessage
+            # if it's present in the original history.
+            # The SystemMessage has special instructions for the model.
+            include_system=True,
+            allow_partial=False,
+        )
+        ```
-            [
-                SystemMessage(
-                    content="you're a good assistant, you always respond with a joke."
-                ),
-                HumanMessage(content="what do you call a speechless parrot"),
-            ]
+        ```python
+        [
+            SystemMessage(
+                content="you're a good assistant, you always respond with a joke."
+            ),
+            HumanMessage(content="what do you call a speechless parrot"),
+        ]
+        ```
-        Trim chat history based on the message count, keeping the ``SystemMessage`` if
-        present, and ensuring that the chat history starts with a ``HumanMessage`` (
-        or a ``SystemMessage`` followed by a ``HumanMessage``).
+        Trim chat history based on the message count, keeping the `SystemMessage` if
+        present, and ensuring that the chat history starts with a `HumanMessage` (
+        or a `SystemMessage` followed by a `HumanMessage`).
             trim_messages(
                 messages,
@@ -874,100 +862,95 @@ def trim_messages(
                 allow_partial=False,
             )
-        .. code-block:: python
-            [
-                SystemMessage(
-                    content="you're a good assistant, you always respond with a joke."
-                ),
-                HumanMessage(content="and who is harrison chasing anyways"),
-                AIMessage(
-                    content="Hmmm let me think.\n\nWhy, he's probably chasing after "
-                    "the last cup of coffee in the office!"
-                ),
-                HumanMessage(content="what do you call a speechless parrot"),
-            ]
+        ```python
+        [
+            SystemMessage(
+                content="you're a good assistant, you always respond with a joke."
+            ),
+            HumanMessage(content="and who is harrison chasing anyways"),
+            AIMessage(
+                content="Hmmm let me think.\n\nWhy, he's probably chasing after "
+                "the last cup of coffee in the office!"
+            ),
+            HumanMessage(content="what do you call a speechless parrot"),
+        ]
+        ```
         Trim chat history using a custom token counter function that counts the
         number of tokens in each message.
-        .. code-block:: python
-            messages = [
-                SystemMessage("This is a 4 token text. The full message is 10 tokens."),
-                HumanMessage(
-                    "This is a 4 token text. The full message is 10 tokens.", id="first"
-                ),
-                AIMessage(
-                    [
-                        {"type": "text", "text": "This is the FIRST 4 token block."},
-                        {"type": "text", "text": "This is the SECOND 4 token block."},
-                    ],
-                    id="second",
-                ),
-                HumanMessage(
-                    "This is a 4 token text. The full message is 10 tokens.", id="third"
-                ),
-                AIMessage(
-                    "This is a 4 token text. The full message is 10 tokens.",
-                    id="fourth",
-                ),
-            ]
-            def dummy_token_counter(messages: list[BaseMessage]) -> int:
-                # treat each message like it adds 3 default tokens at the beginning
-                # of the message and at the end of the message. 3 + 4 + 3 = 10 tokens
-                # per message.
-                default_content_len = 4
-                default_msg_prefix_len = 3
-                default_msg_suffix_len = 3
-                count = 0
-                for msg in messages:
-                    if isinstance(msg.content, str):
-                        count += (
-                            default_msg_prefix_len
-                            + default_content_len
-                            + default_msg_suffix_len
-                        )
-                    if isinstance(msg.content, list):
-                        count += (
-                            default_msg_prefix_len
-                            + len(msg.content) * default_content_len
-                            + default_msg_suffix_len
-                        )
-                return count
-        First 30 tokens, allowing partial messages:
-            .. code-block:: python
-                trim_messages(
-                    messages,
-                    max_tokens=30,
-                    token_counter=dummy_token_counter,
-                    strategy="first",
-                    allow_partial=True,
-                )
-            .. code-block:: python
+        ```python
+        messages = [
+            SystemMessage("This is a 4 token text. The full message is 10 tokens."),
+            HumanMessage(
+                "This is a 4 token text. The full message is 10 tokens.", id="first"
+            ),
+            AIMessage(
                 [
-                    SystemMessage(
-                        "This is a 4 token text. The full message is 10 tokens."
-                    ),
-                    HumanMessage(
-                        "This is a 4 token text. The full message is 10 tokens.",
-                        id="first",
-                    ),
-                    AIMessage(
-                        [{"type": "text", "text": "This is the FIRST 4 token block."}],
-                        id="second",
-                    ),
-                ]
+                    {"type": "text", "text": "This is the FIRST 4 token block."},
+                    {"type": "text", "text": "This is the SECOND 4 token block."},
+                ],
+                id="second",
+            ),
+            HumanMessage(
+                "This is a 4 token text. The full message is 10 tokens.", id="third"
+            ),
+            AIMessage(
+                "This is a 4 token text. The full message is 10 tokens.",
+                id="fourth",
+            ),
+        ]
+        def dummy_token_counter(messages: list[BaseMessage]) -> int:
+            # treat each message like it adds 3 default tokens at the beginning
+            # of the message and at the end of the message. 3 + 4 + 3 = 10 tokens
+            # per message.
+            default_content_len = 4
+            default_msg_prefix_len = 3
+            default_msg_suffix_len = 3
+            count = 0
+            for msg in messages:
+                if isinstance(msg.content, str):
+                    count += (
+                        default_msg_prefix_len
+                        + default_content_len
+                        + default_msg_suffix_len
+                    )
+                if isinstance(msg.content, list):
+                    count += (
+                        default_msg_prefix_len
+                        + len(msg.content) * default_content_len
+                        + default_msg_suffix_len
+                    )
+            return count
+        ```
+        First 30 tokens, allowing partial messages:
+        ```python
+        trim_messages(
+            messages,
+            max_tokens=30,
+            token_counter=dummy_token_counter,
+            strategy="first",
+            allow_partial=True,
+        )
+        ```
+        ```python
+        [
+            SystemMessage("This is a 4 token text. The full message is 10 tokens."),
+            HumanMessage(
+                "This is a 4 token text. The full message is 10 tokens.",
+                id="first",
+            ),
+            AIMessage(
+                [{"type": "text", "text": "This is the FIRST 4 token block."}],
+                id="second",
+            ),
+        ]
+        ```
     """
     # Validate arguments
     if start_on and strategy == "first":
@@ -1042,21 +1025,21 @@ def convert_to_openai_messages(
         messages: Message-like object or iterable of objects whose contents are
             in OpenAI, Anthropic, Bedrock Converse, or VertexAI formats.
         text_format: How to format string or text block contents:
-                - ``'string'``:
+                - `'string'`:
                     If a message has a string content, this is left as a string. If
-                    a message has content blocks that are all of type ``'text'``, these
+                    a message has content blocks that are all of type `'text'`, these
                     are joined with a newline to make a single string. If a message has
-                    content blocks and at least one isn't of type ``'text'``, then
+                    content blocks and at least one isn't of type `'text'`, then
                     all blocks are left as dicts.
-                - ``'block'``:
+                - `'block'`:
                     If a message has a string content, this is turned into a list
-                    with a single content block of type ``'text'``. If a message has
+                    with a single content block of type `'text'`. If a message has
                     content blocks these are left as is.
         include_id: Whether to include message ids in the openai messages, if they
                     are present in the source messages.
     Raises:
-        ValueError: if an unrecognized ``text_format`` is specified, or if a message
+        ValueError: if an unrecognized `text_format` is specified, or if a message
             content block is missing expected keys.
     Returns:
@@ -1070,50 +1053,49 @@ def convert_to_openai_messages(
             message dicts is returned.
     Example:
+        ```python
+        from langchain_core.messages import (
+            convert_to_openai_messages,
+            AIMessage,
+            SystemMessage,
+            ToolMessage,
+        )
-        .. code-block:: python
-            from langchain_core.messages import (
-                convert_to_openai_messages,
-                AIMessage,
-                SystemMessage,
-                ToolMessage,
-            )
-            messages = [
-                SystemMessage([{"type": "text", "text": "foo"}]),
-                {
-                    "role": "user",
-                    "content": [
-                        {"type": "text", "text": "whats in this"},
-                        {
-                            "type": "image_url",
-                            "image_url": {"url": "data:image/png;base64,'/9j/4AAQSk'"},
-                        },
-                    ],
-                },
-                AIMessage(
-                    "",
-                    tool_calls=[
-                        {
-                            "name": "analyze",
-                            "args": {"baz": "buz"},
-                            "id": "1",
-                            "type": "tool_call",
-                        }
-                    ],
-                ),
-                ToolMessage("foobar", tool_call_id="1", name="bar"),
-                {"role": "assistant", "content": "thats nice"},
-            ]
-            oai_messages = convert_to_openai_messages(messages)
-            # -> [
-            #   {'role': 'system', 'content': 'foo'},
-            #   {'role': 'user', 'content': [{'type': 'text', 'text': 'whats in this'}, {'type': 'image_url', 'image_url': {'url': "data:image/png;base64,'/9j/4AAQSk'"}}]},
-            #   {'role': 'assistant', 'tool_calls': [{'type': 'function', 'id': '1','function': {'name': 'analyze', 'arguments': '{"baz": "buz"}'}}], 'content': ''},
-            #   {'role': 'tool', 'name': 'bar', 'content': 'foobar'},
-            #   {'role': 'assistant', 'content': 'thats nice'}
-            # ]
+        messages = [
+            SystemMessage([{"type": "text", "text": "foo"}]),
+            {
+                "role": "user",
+                "content": [
+                    {"type": "text", "text": "whats in this"},
+                    {
+                        "type": "image_url",
+                        "image_url": {"url": "data:image/png;base64,'/9j/4AAQSk'"},
+                    },
+                ],
+            },
+            AIMessage(
+                "",
+                tool_calls=[
+                    {
+                        "name": "analyze",
+                        "args": {"baz": "buz"},
+                        "id": "1",
+                        "type": "tool_call",
+                    }
+                ],
+            ),
+            ToolMessage("foobar", tool_call_id="1", name="bar"),
+            {"role": "assistant", "content": "thats nice"},
+        ]
+        oai_messages = convert_to_openai_messages(messages)
+        # -> [
+        #   {'role': 'system', 'content': 'foo'},
+        #   {'role': 'user', 'content': [{'type': 'text', 'text': 'whats in this'}, {'type': 'image_url', 'image_url': {'url': "data:image/png;base64,'/9j/4AAQSk'"}}]},
+        #   {'role': 'assistant', 'tool_calls': [{'type': 'function', 'id': '1','function': {'name': 'analyze', 'arguments': '{"baz": "buz"}'}}], 'content': ''},
+        #   {'role': 'tool', 'name': 'bar', 'content': 'foobar'},
+        #   {'role': 'assistant', 'content': 'thats nice'}
+        # ]
+        ```
     !!! version-added "Added in version 0.3.11"
@@ -1695,13 +1677,13 @@ def count_tokens_approximately(
     Args:
         messages: List of messages to count tokens for.
         chars_per_token: Number of characters per token to use for the approximation.
-            Default is 4 (one token corresponds to ~4 chars for common English text).
+            One token corresponds to ~4 chars for common English text.
             You can also specify float values for more fine-grained control.
-            `See more here. <https://platform.openai.com/tokenizer>`__
-        extra_tokens_per_message: Number of extra tokens to add per message.
-            Default is 3 (special tokens, including beginning/end of message).
+            [See more here](https://platform.openai.com/tokenizer).
+        extra_tokens_per_message: Number of extra tokens to add per message, e.g.
+            special tokens, including beginning/end of message.
             You can also specify float values for more fine-grained control.
-            `See more here. <https://github.com/openai/openai-cookbook/blob/main/examples/How_to_count_tokens_with_tiktoken.ipynb>`__
+            [See more here](https://github.com/openai/openai-cookbook/blob/main/examples/How_to_count_tokens_with_tiktoken.ipynb).
         count_name: Whether to include message names in the count.
             Enabled by default.

langchain-core 1.0.0a8__py3-none-any.whl → 1.0.0rc2__py3-none-any.whl

Potentially problematic release.

langchain-core 1.0.0a8__py3-none-any.whl → 1.0.0rc2__py3-none-any.whl