PyPI - langchain-core - Versions diffs - 1.0.0a8__py3-none-any.whl → 1.0.0rc2__py3-none-any.whl - Mend

langchain-core 1.0.0a8__py3-none-any.whl → 1.0.0rc2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of langchain-core might be problematic. Click here for more details.

Files changed (142) hide show

langchain_core/__init__.py +1 -1
langchain_core/_api/__init__.py +0 -1
langchain_core/_api/beta_decorator.py +17 -20
langchain_core/_api/deprecation.py +30 -35
langchain_core/_import_utils.py +1 -1
langchain_core/agents.py +10 -9
langchain_core/caches.py +46 -56
langchain_core/callbacks/__init__.py +1 -8
langchain_core/callbacks/base.py +232 -243
langchain_core/callbacks/file.py +33 -33
langchain_core/callbacks/manager.py +353 -416
langchain_core/callbacks/stdout.py +21 -22
langchain_core/callbacks/streaming_stdout.py +32 -32
langchain_core/callbacks/usage.py +54 -51
langchain_core/chat_history.py +43 -58
langchain_core/document_loaders/base.py +21 -21
langchain_core/document_loaders/langsmith.py +22 -22
langchain_core/documents/__init__.py +0 -1
langchain_core/documents/base.py +46 -49
langchain_core/documents/transformers.py +28 -29
langchain_core/embeddings/fake.py +50 -54
langchain_core/example_selectors/semantic_similarity.py +4 -6
langchain_core/exceptions.py +7 -8
langchain_core/indexing/api.py +19 -25
langchain_core/indexing/base.py +24 -24
langchain_core/language_models/__init__.py +11 -27
langchain_core/language_models/_utils.py +53 -54
langchain_core/language_models/base.py +30 -24
langchain_core/language_models/chat_models.py +123 -148
langchain_core/language_models/fake_chat_models.py +7 -7
langchain_core/language_models/llms.py +14 -16
langchain_core/load/dump.py +3 -4
langchain_core/load/load.py +7 -16
langchain_core/load/serializable.py +37 -36
langchain_core/messages/__init__.py +1 -16
langchain_core/messages/ai.py +122 -123
langchain_core/messages/base.py +31 -31
langchain_core/messages/block_translators/__init__.py +17 -17
langchain_core/messages/block_translators/anthropic.py +3 -3
langchain_core/messages/block_translators/bedrock_converse.py +3 -3
langchain_core/messages/block_translators/google_genai.py +5 -4
langchain_core/messages/block_translators/google_vertexai.py +4 -32
langchain_core/messages/block_translators/groq.py +117 -21
langchain_core/messages/block_translators/langchain_v0.py +3 -3
langchain_core/messages/block_translators/openai.py +5 -5
langchain_core/messages/chat.py +2 -6
langchain_core/messages/content.py +222 -209
langchain_core/messages/function.py +6 -10
langchain_core/messages/human.py +17 -24
langchain_core/messages/modifier.py +2 -2
langchain_core/messages/system.py +12 -22
langchain_core/messages/tool.py +53 -69
langchain_core/messages/utils.py +399 -417
langchain_core/output_parsers/__init__.py +1 -14
langchain_core/output_parsers/base.py +46 -47
langchain_core/output_parsers/json.py +3 -4
langchain_core/output_parsers/list.py +2 -2
langchain_core/output_parsers/openai_functions.py +46 -44
langchain_core/output_parsers/openai_tools.py +11 -16
langchain_core/output_parsers/pydantic.py +10 -11
langchain_core/output_parsers/string.py +2 -2
langchain_core/output_parsers/transform.py +2 -2
langchain_core/output_parsers/xml.py +1 -1
langchain_core/outputs/__init__.py +1 -1
langchain_core/outputs/chat_generation.py +14 -14
langchain_core/outputs/generation.py +6 -6
langchain_core/outputs/llm_result.py +5 -5
langchain_core/prompt_values.py +11 -11
langchain_core/prompts/__init__.py +3 -23
langchain_core/prompts/base.py +33 -38
langchain_core/prompts/chat.py +222 -229
langchain_core/prompts/dict.py +3 -3
langchain_core/prompts/few_shot.py +76 -83
langchain_core/prompts/few_shot_with_templates.py +7 -9
langchain_core/prompts/image.py +12 -14
langchain_core/prompts/loading.py +1 -1
langchain_core/prompts/message.py +3 -3
langchain_core/prompts/prompt.py +20 -23
langchain_core/prompts/string.py +20 -8
langchain_core/prompts/structured.py +26 -27
langchain_core/rate_limiters.py +50 -58
langchain_core/retrievers.py +41 -182
langchain_core/runnables/base.py +565 -597
langchain_core/runnables/branch.py +8 -8
langchain_core/runnables/config.py +37 -44
langchain_core/runnables/configurable.py +9 -10
langchain_core/runnables/fallbacks.py +9 -9
langchain_core/runnables/graph.py +46 -50
langchain_core/runnables/graph_ascii.py +19 -18
langchain_core/runnables/graph_mermaid.py +20 -31
langchain_core/runnables/graph_png.py +7 -7
langchain_core/runnables/history.py +22 -22
langchain_core/runnables/passthrough.py +11 -11
langchain_core/runnables/retry.py +3 -3
langchain_core/runnables/router.py +2 -2
langchain_core/runnables/schema.py +33 -33
langchain_core/runnables/utils.py +30 -34
langchain_core/stores.py +72 -102
langchain_core/sys_info.py +27 -29
langchain_core/tools/__init__.py +1 -14
langchain_core/tools/base.py +70 -71
langchain_core/tools/convert.py +100 -104
langchain_core/tools/render.py +9 -9
langchain_core/tools/retriever.py +7 -7
langchain_core/tools/simple.py +6 -7
langchain_core/tools/structured.py +18 -24
langchain_core/tracers/__init__.py +1 -9
langchain_core/tracers/base.py +35 -35
langchain_core/tracers/context.py +12 -17
langchain_core/tracers/event_stream.py +3 -3
langchain_core/tracers/langchain.py +8 -8
langchain_core/tracers/log_stream.py +17 -18
langchain_core/tracers/memory_stream.py +3 -3
langchain_core/tracers/root_listeners.py +2 -2
langchain_core/tracers/schemas.py +0 -129
langchain_core/tracers/stdout.py +1 -2
langchain_core/utils/__init__.py +1 -1
langchain_core/utils/aiter.py +32 -32
langchain_core/utils/env.py +5 -5
langchain_core/utils/function_calling.py +59 -154
langchain_core/utils/html.py +4 -4
langchain_core/utils/input.py +3 -3
langchain_core/utils/interactive_env.py +1 -1
langchain_core/utils/iter.py +20 -20
langchain_core/utils/json.py +1 -1
langchain_core/utils/json_schema.py +2 -2
langchain_core/utils/mustache.py +5 -5
langchain_core/utils/pydantic.py +17 -17
langchain_core/utils/strings.py +5 -5
langchain_core/utils/utils.py +25 -28
langchain_core/vectorstores/base.py +55 -87
langchain_core/vectorstores/in_memory.py +83 -85
langchain_core/vectorstores/utils.py +2 -2
langchain_core/version.py +1 -1
{langchain_core-1.0.0a8.dist-info → langchain_core-1.0.0rc2.dist-info}/METADATA +23 -11
langchain_core-1.0.0rc2.dist-info/RECORD +172 -0
langchain_core/memory.py +0 -120
langchain_core/pydantic_v1/__init__.py +0 -30
langchain_core/pydantic_v1/dataclasses.py +0 -23
langchain_core/pydantic_v1/main.py +0 -23
langchain_core-1.0.0a8.dist-info/RECORD +0 -176
{langchain_core-1.0.0a8.dist-info → langchain_core-1.0.0rc2.dist-info}/WHEEL +0 -0

langchain_core/document_loaders/langsmith.py CHANGED Viewed

@@ -22,22 +22,22 @@ class LangSmithLoader(BaseLoader):
     ??? note "Lazy load"
-        .. code-block:: python
+        ```python
+        from langchain_core.document_loaders import LangSmithLoader
-            from langchain_core.document_loaders import LangSmithLoader
+        loader = LangSmithLoader(dataset_id="...", limit=100)
+        docs = []
+        for doc in loader.lazy_load():
+            docs.append(doc)
+        ```
-            loader = LangSmithLoader(dataset_id="...", limit=100)
-            docs = []
-            for doc in loader.lazy_load():
-                docs.append(doc)
-        .. code-block:: python
-            # -> [Document("...", metadata={"inputs": {...}, "outputs": {...}, ...}), ...]
+        ```python
+        # -> [Document("...", metadata={"inputs": {...}, "outputs": {...}, ...}), ...]
+        ```
     !!! version-added "Added in version 0.2.34"
-    """  # noqa: E501
+    """
     def __init__(
         self,
@@ -60,15 +60,15 @@ class LangSmithLoader(BaseLoader):
         """Create a LangSmith loader.
         Args:
-            dataset_id: The ID of the dataset to filter by. Defaults to None.
-            dataset_name: The name of the dataset to filter by. Defaults to None.
-            content_key: The inputs key to set as Document page content. ``'.'`` characters
-                are interpreted as nested keys. E.g. ``content_key="first.second"`` will
+            dataset_id: The ID of the dataset to filter by.
+            dataset_name: The name of the dataset to filter by.
+            content_key: The inputs key to set as Document page content. `'.'` characters
+                are interpreted as nested keys. E.g. `content_key="first.second"` will
                 result in
-                ``Document(page_content=format_content(example.inputs["first"]["second"]))``
+                `Document(page_content=format_content(example.inputs["first"]["second"]))`
             format_content: Function for converting the content extracted from the example
                 inputs into a string. Defaults to JSON-encoding the contents.
-            example_ids: The IDs of the examples to filter by. Defaults to None.
+            example_ids: The IDs of the examples to filter by.
             as_of: The dataset version tag OR
                 timestamp to retrieve the examples as of.
                 Response examples will only be those that were present at the time
@@ -76,17 +76,17 @@ class LangSmithLoader(BaseLoader):
             splits: A list of dataset splits, which are
                 divisions of your dataset such as 'train', 'test', or 'validation'.
                 Returns examples only from the specified splits.
-            inline_s3_urls: Whether to inline S3 URLs. Defaults to True.
-            offset: The offset to start from. Defaults to 0.
+            inline_s3_urls: Whether to inline S3 URLs.
+            offset: The offset to start from.
             limit: The maximum number of examples to return.
-            metadata: Metadata to filter by. Defaults to None.
+            metadata: Metadata to filter by.
             filter: A structured filter string to apply to the examples.
             client: LangSmith Client. If not provided will be initialized from below args.
             client_kwargs: Keyword args to pass to LangSmith client init. Should only be
-                specified if ``client`` isn't.
+                specified if `client` isn't.
         Raises:
-            ValueError: If both ``client`` and ``client_kwargs`` are provided.
+            ValueError: If both `client` and `client_kwargs` are provided.
         """  # noqa: E501
         if client and client_kwargs:
             raise ValueError

langchain_core/documents/__init__.py CHANGED Viewed

@@ -2,7 +2,6 @@
 **Document** module is a collection of classes that handle documents
 and their transformations.
 """
 from typing import TYPE_CHECKING

langchain_core/documents/base.py CHANGED Viewed

@@ -57,52 +57,51 @@ class Blob(BaseMedia):
     Example: Initialize a blob from in-memory data
-        .. code-block:: python
+    ```python
+    from langchain_core.documents import Blob
-            from langchain_core.documents import Blob
+    blob = Blob.from_data("Hello, world!")
-            blob = Blob.from_data("Hello, world!")
+    # Read the blob as a string
+    print(blob.as_string())
-            # Read the blob as a string
-            print(blob.as_string())
+    # Read the blob as bytes
+    print(blob.as_bytes())
-            # Read the blob as bytes
-            print(blob.as_bytes())
-            # Read the blob as a byte stream
-            with blob.as_bytes_io() as f:
-                print(f.read())
+    # Read the blob as a byte stream
+    with blob.as_bytes_io() as f:
+        print(f.read())
+    ```
     Example: Load from memory and specify mime-type and metadata
-        .. code-block:: python
-            from langchain_core.documents import Blob
+    ```python
+    from langchain_core.documents import Blob
-            blob = Blob.from_data(
-                data="Hello, world!",
-                mime_type="text/plain",
-                metadata={"source": "https://example.com"},
-            )
+    blob = Blob.from_data(
+        data="Hello, world!",
+        mime_type="text/plain",
+        metadata={"source": "https://example.com"},
+    )
+    ```
     Example: Load the blob from a file
-        .. code-block:: python
-            from langchain_core.documents import Blob
-            blob = Blob.from_path("path/to/file.txt")
+    ```python
+    from langchain_core.documents import Blob
-            # Read the blob as a string
-            print(blob.as_string())
+    blob = Blob.from_path("path/to/file.txt")
-            # Read the blob as bytes
-            print(blob.as_bytes())
+    # Read the blob as a string
+    print(blob.as_string())
-            # Read the blob as a byte stream
-            with blob.as_bytes_io() as f:
-                print(f.read())
+    # Read the blob as bytes
+    print(blob.as_bytes())
+    # Read the blob as a byte stream
+    with blob.as_bytes_io() as f:
+        print(f.read())
+    ```
     """
     data: bytes | str | None = None
@@ -112,7 +111,7 @@ class Blob(BaseMedia):
     encoding: str = "utf-8"
     """Encoding to use if decoding the bytes into a string.
-    Use utf-8 as default encoding, if decoding to string.
+    Use `utf-8` as default encoding, if decoding to string.
     """
     path: PathLike | None = None
     """Location where the original content was found."""
@@ -128,7 +127,7 @@ class Blob(BaseMedia):
         If a path is associated with the blob, it will default to the path location.
-        Unless explicitly set via a metadata field called "source", in which
+        Unless explicitly set via a metadata field called `"source"`, in which
         case that value will be used instead.
         """
         if self.metadata and "source" in self.metadata:
@@ -212,11 +211,11 @@ class Blob(BaseMedia):
         """Load the blob from a path like object.
         Args:
-            path: path like object to file to be read
+            path: Path-like object to file to be read
             encoding: Encoding to use if decoding the bytes into a string
-            mime_type: if provided, will be set as the mime-type of the data
-            guess_type: If True, the mimetype will be guessed from the file extension,
-                        if a mime-type was not provided
+            mime_type: If provided, will be set as the mime-type of the data
+            guess_type: If `True`, the mimetype will be guessed from the file extension,
+                if a mime-type was not provided
             metadata: Metadata to associate with the blob
         Returns:
@@ -249,10 +248,10 @@ class Blob(BaseMedia):
         """Initialize the blob from in-memory data.
         Args:
-            data: the in-memory data associated with the blob
+            data: The in-memory data associated with the blob
             encoding: Encoding to use if decoding the bytes into a string
-            mime_type: if provided, will be set as the mime-type of the data
-            path: if provided, will be set as the source from which the data came
+            mime_type: If provided, will be set as the mime-type of the data
+            path: If provided, will be set as the source from which the data came
             metadata: Metadata to associate with the blob
         Returns:
@@ -278,15 +277,13 @@ class Document(BaseMedia):
     """Class for storing a piece of text and associated metadata.
     Example:
+        ```python
+        from langchain_core.documents import Document
-        .. code-block:: python
-            from langchain_core.documents import Document
-            document = Document(
-                page_content="Hello, world!", metadata={"source": "https://example.com"}
-            )
+        document = Document(
+            page_content="Hello, world!", metadata={"source": "https://example.com"}
+        )
+        ```
     """
     page_content: str
@@ -306,7 +303,7 @@ class Document(BaseMedia):
     @classmethod
     def get_lc_namespace(cls) -> list[str]:
-        """Get the namespace of the langchain object.
+        """Get the namespace of the LangChain object.
         Returns:
             ["langchain", "schema", "document"]

langchain_core/documents/transformers.py CHANGED Viewed

@@ -20,35 +20,34 @@ class BaseDocumentTransformer(ABC):
     sequence of transformed Documents.
     Example:
-        .. code-block:: python
-            class EmbeddingsRedundantFilter(BaseDocumentTransformer, BaseModel):
-                embeddings: Embeddings
-                similarity_fn: Callable = cosine_similarity
-                similarity_threshold: float = 0.95
-                class Config:
-                    arbitrary_types_allowed = True
-                def transform_documents(
-                    self, documents: Sequence[Document], **kwargs: Any
-                ) -> Sequence[Document]:
-                    stateful_documents = get_stateful_documents(documents)
-                    embedded_documents = _get_embeddings_from_stateful_docs(
-                        self.embeddings, stateful_documents
-                    )
-                    included_idxs = _filter_similar_embeddings(
-                        embedded_documents,
-                        self.similarity_fn,
-                        self.similarity_threshold,
-                    )
-                    return [stateful_documents[i] for i in sorted(included_idxs)]
-                async def atransform_documents(
-                    self, documents: Sequence[Document], **kwargs: Any
-                ) -> Sequence[Document]:
-                    raise NotImplementedError
+        ```python
+        class EmbeddingsRedundantFilter(BaseDocumentTransformer, BaseModel):
+            embeddings: Embeddings
+            similarity_fn: Callable = cosine_similarity
+            similarity_threshold: float = 0.95
+            class Config:
+                arbitrary_types_allowed = True
+            def transform_documents(
+                self, documents: Sequence[Document], **kwargs: Any
+            ) -> Sequence[Document]:
+                stateful_documents = get_stateful_documents(documents)
+                embedded_documents = _get_embeddings_from_stateful_docs(
+                    self.embeddings, stateful_documents
+                )
+                included_idxs = _filter_similar_embeddings(
+                    embedded_documents,
+                    self.similarity_fn,
+                    self.similarity_threshold,
+                )
+                return [stateful_documents[i] for i in sorted(included_idxs)]
+            async def atransform_documents(
+                self, documents: Sequence[Document], **kwargs: Any
+            ) -> Sequence[Document]:
+                raise NotImplementedError
+        ```
     """
     @abstractmethod

langchain_core/embeddings/fake.py CHANGED Viewed

@@ -18,40 +18,38 @@ class FakeEmbeddings(Embeddings, BaseModel):
     This embedding model creates embeddings by sampling from a normal distribution.
-    Do not use this outside of testing, as it is not a real embedding model.
+    !!! warning
+        Do not use this outside of testing, as it is not a real embedding model.
     Instantiate:
-        .. code-block:: python
+        ```python
+        from langchain_core.embeddings import FakeEmbeddings
-            from langchain_core.embeddings import FakeEmbeddings
-            embed = FakeEmbeddings(size=100)
+        embed = FakeEmbeddings(size=100)
+        ```
     Embed single text:
-        .. code-block:: python
-            input_text = "The meaning of life is 42"
-            vector = embed.embed_query(input_text)
-            print(vector[:3])
-        .. code-block:: python
-            [-0.700234640213188, -0.581266257710429, -1.1328482266445354]
+        ```python
+        input_text = "The meaning of life is 42"
+        vector = embed.embed_query(input_text)
+        print(vector[:3])
+        ```
+        ```python
+        [-0.700234640213188, -0.581266257710429, -1.1328482266445354]
+        ```
     Embed multiple texts:
-        .. code-block:: python
-            input_texts = ["Document 1...", "Document 2..."]
-            vectors = embed.embed_documents(input_texts)
-            print(len(vectors))
-            # The first 3 coordinates for the first vector
-            print(vectors[0][:3])
-        .. code-block:: python
-            2
-            [-0.5670477847544458, -0.31403828652395727, -0.5840547508955257]
+        ```python
+        input_texts = ["Document 1...", "Document 2..."]
+        vectors = embed.embed_documents(input_texts)
+        print(len(vectors))
+        # The first 3 coordinates for the first vector
+        print(vectors[0][:3])
+        ```
+        ```python
+        2
+        [-0.5670477847544458, -0.31403828652395727, -0.5840547508955257]
+        ```
     """
     size: int
@@ -75,40 +73,38 @@ class DeterministicFakeEmbedding(Embeddings, BaseModel):
     This embedding model creates embeddings by sampling from a normal distribution
     with a seed based on the hash of the text.
-    Do not use this outside of testing, as it is not a real embedding model.
+    !!! warning
+        Do not use this outside of testing, as it is not a real embedding model.
     Instantiate:
-        .. code-block:: python
+        ```python
+        from langchain_core.embeddings import DeterministicFakeEmbedding
-            from langchain_core.embeddings import DeterministicFakeEmbedding
-            embed = DeterministicFakeEmbedding(size=100)
+        embed = DeterministicFakeEmbedding(size=100)
+        ```
     Embed single text:
-        .. code-block:: python
-            input_text = "The meaning of life is 42"
-            vector = embed.embed_query(input_text)
-            print(vector[:3])
-        .. code-block:: python
-            [-0.700234640213188, -0.581266257710429, -1.1328482266445354]
+        ```python
+        input_text = "The meaning of life is 42"
+        vector = embed.embed_query(input_text)
+        print(vector[:3])
+        ```
+        ```python
+        [-0.700234640213188, -0.581266257710429, -1.1328482266445354]
+        ```
     Embed multiple texts:
-        .. code-block:: python
-            input_texts = ["Document 1...", "Document 2..."]
-            vectors = embed.embed_documents(input_texts)
-            print(len(vectors))
-            # The first 3 coordinates for the first vector
-            print(vectors[0][:3])
-        .. code-block:: python
-            2
-            [-0.5670477847544458, -0.31403828652395727, -0.5840547508955257]
+        ```python
+        input_texts = ["Document 1...", "Document 2..."]
+        vectors = embed.embed_documents(input_texts)
+        print(len(vectors))
+        # The first 3 coordinates for the first vector
+        print(vectors[0][:3])
+        ```
+        ```python
+        2
+        [-0.5670477847544458, -0.31403828652395727, -0.5840547508955257]
+        ```
     """
     size: int

langchain_core/example_selectors/semantic_similarity.py CHANGED Viewed

@@ -154,7 +154,7 @@ class SemanticSimilarityExampleSelector(_VectorStoreExampleSelector):
             examples: List of examples to use in the prompt.
             embeddings: An initialized embedding API interface, e.g. OpenAIEmbeddings().
             vectorstore_cls: A vector store DB interface class, e.g. FAISS.
-            k: Number of examples to select. Default is 4.
+            k: Number of examples to select.
             input_keys: If provided, the search is based on the input variables
                 instead of all variables.
             example_keys: If provided, keys to filter examples to.
@@ -198,7 +198,7 @@ class SemanticSimilarityExampleSelector(_VectorStoreExampleSelector):
             examples: List of examples to use in the prompt.
             embeddings: An initialized embedding API interface, e.g. OpenAIEmbeddings().
             vectorstore_cls: A vector store DB interface class, e.g. FAISS.
-            k: Number of examples to select. Default is 4.
+            k: Number of examples to select.
             input_keys: If provided, the search is based on the input variables
                 instead of all variables.
             example_keys: If provided, keys to filter examples to.
@@ -285,9 +285,8 @@ class MaxMarginalRelevanceExampleSelector(_VectorStoreExampleSelector):
             examples: List of examples to use in the prompt.
             embeddings: An initialized embedding API interface, e.g. OpenAIEmbeddings().
             vectorstore_cls: A vector store DB interface class, e.g. FAISS.
-            k: Number of examples to select. Default is 4.
+            k: Number of examples to select.
             fetch_k: Number of Documents to fetch to pass to MMR algorithm.
-                Default is 20.
             input_keys: If provided, the search is based on the input variables
                 instead of all variables.
             example_keys: If provided, keys to filter examples to.
@@ -333,9 +332,8 @@ class MaxMarginalRelevanceExampleSelector(_VectorStoreExampleSelector):
             examples: List of examples to use in the prompt.
             embeddings: An initialized embedding API interface, e.g. OpenAIEmbeddings().
             vectorstore_cls: A vector store DB interface class, e.g. FAISS.
-            k: Number of examples to select. Default is 4.
+            k: Number of examples to select.
             fetch_k: Number of Documents to fetch to pass to MMR algorithm.
-                Default is 20.
             input_keys: If provided, the search is based on the input variables
                 instead of all variables.
             example_keys: If provided, keys to filter examples to.

langchain_core/exceptions.py CHANGED Viewed

@@ -16,7 +16,7 @@ class OutputParserException(ValueError, LangChainException):  # noqa: N818
     """Exception that output parsers should raise to signify a parsing error.
     This exists to differentiate parsing errors from other code or execution errors
-    that also may arise inside the output parser. OutputParserExceptions will be
+    that also may arise inside the output parser. `OutputParserException` will be
     available to catch and handle in ways to fix the parsing error, while other
     errors will be raised.
     """
@@ -28,24 +28,23 @@ class OutputParserException(ValueError, LangChainException):  # noqa: N818
         llm_output: str | None = None,
         send_to_llm: bool = False,  # noqa: FBT001,FBT002
     ):
-        """Create an OutputParserException.
+        """Create an `OutputParserException`.
         Args:
             error: The error that's being re-raised or an error message.
             observation: String explanation of error which can be passed to a
-                model to try and remediate the issue. Defaults to None.
+                model to try and remediate the issue.
             llm_output: String model output which is error-ing.
-                Defaults to None.
             send_to_llm: Whether to send the observation and llm_output back to an Agent
-                after an OutputParserException has been raised.
+                after an `OutputParserException` has been raised.
                 This gives the underlying model driving the agent the context that the
                 previous output was improperly structured, in the hopes that it will
                 update the output to the correct format.
-                Defaults to False.
         Raises:
-            ValueError: If ``send_to_llm`` is True but either observation or
-                ``llm_output`` are not provided.
+            ValueError: If `send_to_llm` is True but either observation or
+                `llm_output` are not provided.
         """
         if isinstance(error, str):
             error = create_message(

langchain_core/indexing/api.py CHANGED Viewed

@@ -299,9 +299,9 @@ def index(
     are not able to specify the uid of the document.
     !!! warning "Behavior changed in 0.3.25"
-        Added ``scoped_full`` cleanup mode.
+        Added `scoped_full` cleanup mode.
-    !!! important
+    !!! warning
         * In full mode, the loader should be returning
           the entire dataset, and not just a subset of the dataset.
@@ -315,7 +315,7 @@ def index(
           chunks, and we index them using a batch size of 5, we'll have 3 batches
           all with the same source id. In general, to avoid doing too much
           redundant work select as big a batch size as possible.
-        * The ``scoped_full`` mode is suitable if determining an appropriate batch size
+        * The `scoped_full` mode is suitable if determining an appropriate batch size
           is challenging or if your data loader cannot return the entire dataset at
           once. This mode keeps track of source IDs in memory, which should be fine
           for most use cases. If your dataset is large (10M+ docs), you will likely
@@ -326,8 +326,8 @@ def index(
         record_manager: Timestamped set to keep track of which documents were
             updated.
         vector_store: VectorStore or DocumentIndex to index the documents into.
-        batch_size: Batch size to use when indexing. Default is 100.
-        cleanup: How to handle clean up of documents. Default is None.
+        batch_size: Batch size to use when indexing.
+        cleanup: How to handle clean up of documents.
             - incremental: Cleans up all documents that haven't been updated AND
               that are associated with source ids that were seen during indexing.
@@ -342,15 +342,12 @@ def index(
               source ids that were seen during indexing.
             - None: Do not delete any documents.
         source_id_key: Optional key that helps identify the original source
-            of the document. Default is None.
+            of the document.
         cleanup_batch_size: Batch size to use when cleaning up documents.
-            Default is 1_000.
         force_update: Force update documents even if they are present in the
             record manager. Useful if you are re-indexing with updated embeddings.
-            Default is False.
         key_encoder: Hashing algorithm to use for hashing the document content and
-            metadata. Default is "sha1".
-            Other options include "blake2b", "sha256", and "sha512".
+            metadata. Options include "blake2b", "sha256", and "sha512".
             !!! version-added "Added in version 0.3.66"
@@ -381,8 +378,8 @@ def index(
         ValueError: If vectorstore does not have
             "delete" and "add_documents" required methods.
         ValueError: If source_id_key is not None, but is not a string or callable.
-        TypeError: If ``vectorstore`` is not a VectorStore or a DocumentIndex.
-        AssertionError: If ``source_id`` is None when cleanup mode is incremental.
+        TypeError: If `vectorstore` is not a VectorStore or a DocumentIndex.
+        AssertionError: If `source_id` is None when cleanup mode is incremental.
             (should be unreachable code).
     """
     # Behavior is deprecated, but we keep it for backwards compatibility.
@@ -640,9 +637,9 @@ async def aindex(
     are not able to specify the uid of the document.
     !!! warning "Behavior changed in 0.3.25"
-        Added ``scoped_full`` cleanup mode.
+        Added `scoped_full` cleanup mode.
-    !!! important
+    !!! warning
         * In full mode, the loader should be returning
           the entire dataset, and not just a subset of the dataset.
@@ -656,7 +653,7 @@ async def aindex(
           chunks, and we index them using a batch size of 5, we'll have 3 batches
           all with the same source id. In general, to avoid doing too much
           redundant work select as big a batch size as possible.
-        * The ``scoped_full`` mode is suitable if determining an appropriate batch size
+        * The `scoped_full` mode is suitable if determining an appropriate batch size
           is challenging or if your data loader cannot return the entire dataset at
           once. This mode keeps track of source IDs in memory, which should be fine
           for most use cases. If your dataset is large (10M+ docs), you will likely
@@ -667,8 +664,8 @@ async def aindex(
         record_manager: Timestamped set to keep track of which documents were
             updated.
         vector_store: VectorStore or DocumentIndex to index the documents into.
-        batch_size: Batch size to use when indexing. Default is 100.
-        cleanup: How to handle clean up of documents. Default is None.
+        batch_size: Batch size to use when indexing.
+        cleanup: How to handle clean up of documents.
             - incremental: Cleans up all documents that haven't been updated AND
               that are associated with source ids that were seen during indexing.
@@ -683,15 +680,12 @@ async def aindex(
               source ids that were seen during indexing.
             - None: Do not delete any documents.
         source_id_key: Optional key that helps identify the original source
-            of the document. Default is None.
+            of the document.
         cleanup_batch_size: Batch size to use when cleaning up documents.
-            Default is 1_000.
         force_update: Force update documents even if they are present in the
             record manager. Useful if you are re-indexing with updated embeddings.
-            Default is False.
         key_encoder: Hashing algorithm to use for hashing the document content and
-            metadata. Default is "sha1".
-            Other options include "blake2b", "sha256", and "sha512".
+            metadata. Options include "blake2b", "sha256", and "sha512".
             !!! version-added "Added in version 0.3.66"
@@ -722,9 +716,9 @@ async def aindex(
         ValueError: If vectorstore does not have
             "adelete" and "aadd_documents" required methods.
         ValueError: If source_id_key is not None, but is not a string or callable.
-        TypeError: If ``vector_store`` is not a VectorStore or DocumentIndex.
-        AssertionError: If ``source_id_key`` is None when cleanup mode is
-            incremental or ``scoped_full`` (should be unreachable).
+        TypeError: If `vector_store` is not a VectorStore or DocumentIndex.
+        AssertionError: If `source_id_key` is None when cleanup mode is
+            incremental or `scoped_full` (should be unreachable).
     """
     # Behavior is deprecated, but we keep it for backwards compatibility.
     # # Warn only once per process.

langchain-core 1.0.0a8__py3-none-any.whl → 1.0.0rc2__py3-none-any.whl

Potentially problematic release.

langchain-core 1.0.0a8__py3-none-any.whl → 1.0.0rc2__py3-none-any.whl