PyPI - llama-index-vector-stores-opensearch - Versions diffs - 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl - Mend

llama-index-vector-stores-opensearch 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of llama-index-vector-stores-opensearch might be problematic. Click here for more details.

Files changed (5)

llama_index/vector_stores/opensearch/base.py CHANGED Viewed

@@ -1,12 +1,18 @@
 """Elasticsearch/Opensearch vector store."""
+import asyncio
 import json
 import uuid
 from typing import Any, Dict, Iterable, List, Optional, Union, cast
+import nest_asyncio
+from llama_index.core.bridge.pydantic import PrivateAttr
 from llama_index.core.schema import BaseNode, MetadataMode, TextNode
 from llama_index.core.vector_stores.types import (
     MetadataFilters,
-    VectorStore,
+    BasePydanticVectorStore,
     VectorStoreQuery,
     VectorStoreQueryMode,
     VectorStoreQueryResult,
@@ -15,9 +21,9 @@ from llama_index.core.vector_stores.utils import (
     metadata_dict_to_node,
     node_to_metadata_dict,
 )
-from opensearchpy import OpenSearch
+from opensearchpy import AsyncOpenSearch
 from opensearchpy.exceptions import NotFoundError
-from opensearchpy.helpers import bulk
+from opensearchpy.helpers import async_bulk
 IMPORT_OPENSEARCH_PY_ERROR = (
     "Could not import OpenSearch. Please install it with `pip install opensearch-py`."
@@ -28,14 +34,14 @@ INVALID_HYBRID_QUERY_ERROR = (
 MATCH_ALL_QUERY = {"match_all": {}}  # type: Dict
-def _import_opensearch() -> Any:
+def _import_async_opensearch() -> Any:
     """Import OpenSearch if available, otherwise raise error."""
-    return OpenSearch
+    return AsyncOpenSearch
-def _import_bulk() -> Any:
+def _import_async_bulk() -> Any:
     """Import bulk if available, otherwise raise error."""
-    return bulk
+    return async_bulk
 def _import_not_found_error() -> Any:
@@ -43,21 +49,21 @@ def _import_not_found_error() -> Any:
     return NotFoundError
-def _get_opensearch_client(opensearch_url: str, **kwargs: Any) -> Any:
-    """Get OpenSearch client from the opensearch_url, otherwise raise error."""
+def _get_async_opensearch_client(opensearch_url: str, **kwargs: Any) -> Any:
+    """Get AsyncOpenSearch client from the opensearch_url, otherwise raise error."""
     try:
-        opensearch = _import_opensearch()
+        opensearch = _import_async_opensearch()
         client = opensearch(opensearch_url, **kwargs)
     except ValueError as e:
         raise ValueError(
-            f"OpenSearch client string provided is not in proper format. "
+            f"AsyncOpenSearch client string provided is not in proper format. "
             f"Got error: {e} "
         )
     return client
-def _bulk_ingest_embeddings(
+async def _bulk_ingest_embeddings(
     client: Any,
     index_name: str,
     embeddings: List[List[float]],
@@ -70,20 +76,20 @@ def _bulk_ingest_embeddings(
     max_chunk_bytes: Optional[int] = 1 * 1024 * 1024,
     is_aoss: bool = False,
 ) -> List[str]:
-    """Bulk Ingest Embeddings into given index."""
+    """Async Bulk Ingest Embeddings into given index."""
     if not mapping:
         mapping = {}
-    bulk = _import_bulk()
+    async_bulk = _import_async_bulk()
     not_found_error = _import_not_found_error()
     requests = []
     return_ids = []
     mapping = mapping
     try:
-        client.indices.get(index=index_name)
+        await client.indices.get(index=index_name)
     except not_found_error:
-        client.indices.create(index=index_name, body=mapping)
+        await client.indices.create(index=index_name, body=mapping)
     for i, text in enumerate(texts):
         metadata = metadatas[i] if metadatas else {}
@@ -101,9 +107,9 @@ def _bulk_ingest_embeddings(
             request["_id"] = _id
         requests.append(request)
         return_ids.append(_id)
-    bulk(client, requests, max_chunk_bytes=max_chunk_bytes)
+    await async_bulk(client, requests, max_chunk_bytes=max_chunk_bytes)
     if not is_aoss:
-        client.indices.refresh(index=index_name)
+        await client.indices.refresh(index=index_name)
     return return_ids
@@ -134,7 +140,8 @@ def _knn_search_query(
     k: int,
     filters: Optional[MetadataFilters] = None,
 ) -> Dict:
-    """Do knn search.
+    """
+    Do knn search.
     If there are no filters do approx-knn search.
     If there are (pre)-filters, do an exhaustive exact knn search using 'painless
@@ -242,7 +249,8 @@ def _is_aoss_enabled(http_auth: Any) -> bool:
 class OpensearchVectorClient:
-    """Object encapsulating an Opensearch index that has vector search enabled.
+    """
+    Object encapsulating an Opensearch index that has vector search enabled.
     If the index does not yet exist, it is created during init.
     Therefore, the underlying index is assumed to either:
@@ -310,15 +318,22 @@ class OpensearchVectorClient:
                 }
             },
         }
-        self._os_client = _get_opensearch_client(self._endpoint, **kwargs)
+        self._os_client = _get_async_opensearch_client(self._endpoint, **kwargs)
         not_found_error = _import_not_found_error()
+        event_loop = asyncio.get_event_loop()
         try:
-            self._os_client.indices.get(index=self._index)
+            event_loop.run_until_complete(
+                self._os_client.indices.get(index=self._index)
+            )
         except not_found_error:
-            self._os_client.indices.create(index=self._index, body=idx_conf)
-            self._os_client.indices.refresh(index=self._index)
+            event_loop.run_until_complete(
+                self._os_client.indices.create(index=self._index, body=idx_conf)
+            )
+            event_loop.run_until_complete(
+                self._os_client.indices.refresh(index=self._index)
+            )
-    def index_results(self, nodes: List[BaseNode], **kwargs: Any) -> List[str]:
+    async def index_results(self, nodes: List[BaseNode], **kwargs: Any) -> List[str]:
         """Store results in the index."""
         embeddings: List[List[float]] = []
         texts: List[str] = []
@@ -330,7 +345,7 @@ class OpensearchVectorClient:
             texts.append(node.get_content(metadata_mode=MetadataMode.NONE))
             metadatas.append(node_to_metadata_dict(node, remove_text=True))
-        return _bulk_ingest_embeddings(
+        return await _bulk_ingest_embeddings(
             self._os_client,
             self._index,
             embeddings,
@@ -344,15 +359,16 @@ class OpensearchVectorClient:
             is_aoss=self.is_aoss,
         )
-    def delete_doc_id(self, doc_id: str) -> None:
-        """Delete a document.
+    async def delete_doc_id(self, doc_id: str) -> None:
+        """
+        Delete a document.
         Args:
             doc_id (str): document id
         """
-        self._os_client.delete(index=self._index, id=doc_id)
+        await self._os_client.delete(index=self._index, id=doc_id)
-    def query(
+    async def aquery(
         self,
         query_mode: VectorStoreQueryMode,
         query_str: Optional[str],
@@ -378,7 +394,7 @@ class OpensearchVectorClient:
             )
             params = None
-        res = self._os_client.search(
+        res = await self._os_client.search(
             index=self._index, body=search_query, params=params
         )
         nodes = []
@@ -418,8 +434,9 @@ class OpensearchVectorClient:
         return VectorStoreQueryResult(nodes=nodes, ids=ids, similarities=scores)
-class OpensearchVectorStore(VectorStore):
-    """Elasticsearch/Opensearch vector store.
+class OpensearchVectorStore(BasePydanticVectorStore):
+    """
+    Elasticsearch/Opensearch vector store.
     Args:
         client (OpensearchVectorClient): Vector index client to use
@@ -427,12 +444,15 @@ class OpensearchVectorStore(VectorStore):
     """
     stores_text: bool = True
+    _client: OpensearchVectorClient = PrivateAttr(default=None)
     def __init__(
         self,
         client: OpensearchVectorClient,
     ) -> None:
         """Initialize params."""
+        super().__init__()
+        nest_asyncio.apply()
         self._client = client
     @property
@@ -445,13 +465,30 @@ class OpensearchVectorStore(VectorStore):
         nodes: List[BaseNode],
         **add_kwargs: Any,
     ) -> List[str]:
-        """Add nodes to index.
+        """
+        Add nodes to index.
+        Args:
+            nodes: List[BaseNode]: list of nodes with embeddings.
+        """
+        return asyncio.get_event_loop().run_until_complete(
+            self.async_add(nodes, **add_kwargs)
+        )
+    async def async_add(
+        self,
+        nodes: List[BaseNode],
+        **add_kwargs: Any,
+    ) -> List[str]:
+        """
+        Async add nodes to index.
         Args:
             nodes: List[BaseNode]: list of nodes with embeddings.
         """
-        self._client.index_results(nodes)
+        await self._client.index_results(nodes)
         return [result.node_id for result in nodes]
     def delete(self, ref_doc_id: str, **delete_kwargs: Any) -> None:
@@ -462,10 +499,35 @@ class OpensearchVectorStore(VectorStore):
             ref_doc_id (str): The doc_id of the document to delete.
         """
-        self._client.delete_doc_id(ref_doc_id)
+        asyncio.get_event_loop().run_until_complete(
+            self.adelete(ref_doc_id, **delete_kwargs)
+        )
+    async def adelete(self, ref_doc_id: str, **delete_kwargs: Any) -> None:
+        """
+        Async delete nodes using with ref_doc_id.
+        Args:
+            ref_doc_id (str): The doc_id of the document to delete.
+        """
+        await self._client.delete_doc_id(ref_doc_id)
     def query(self, query: VectorStoreQuery, **kwargs: Any) -> VectorStoreQueryResult:
-        """Query index for top k most similar nodes.
+        """
+        Query index for top k most similar nodes.
+        Args:
+            query (VectorStoreQuery): Store query object.
+        """
+        return asyncio.get_event_loop().run_until_complete(self.aquery(query, **kwargs))
+    async def aquery(
+        self, query: VectorStoreQuery, **kwargs: Any
+    ) -> VectorStoreQueryResult:
+        """
+        Async query index for top k most similar nodes.
         Args:
             query (VectorStoreQuery): Store query object.
@@ -473,7 +535,7 @@ class OpensearchVectorStore(VectorStore):
         """
         query_embedding = cast(List[float], query.query_embedding)
-        return self._client.query(
+        return await self._client.aquery(
             query.mode,
             query.query_str,
             query_embedding,

{llama_index_vector_stores_opensearch-0.1.3.dist-info → llama_index_vector_stores_opensearch-0.1.5.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: llama-index-vector-stores-opensearch
-Version: 0.1.3
+Version: 0.1.5
 Summary: llama-index vector_stores opensearch integration
 License: MIT
 Author: Your Name
@@ -11,9 +11,8 @@ Classifier: Programming Language :: Python :: 3
 Classifier: Programming Language :: Python :: 3.9
 Classifier: Programming Language :: Python :: 3.10
 Classifier: Programming Language :: Python :: 3.11
-Classifier: Programming Language :: Python :: 3.12
 Requires-Dist: llama-index-core (>=0.10.1,<0.11.0)
-Requires-Dist: opensearch-py (>=2.4.2,<3.0.0)
+Requires-Dist: opensearch-py[async] (>=2.4.2,<3.0.0)
 Description-Content-Type: text/markdown
 # LlamaIndex Vector_Stores Integration: Opensearch

llama_index_vector_stores_opensearch-0.1.5.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,5 @@
+llama_index/vector_stores/opensearch/__init__.py,sha256=U1_XAkZb6zcskOk4s10NB8Tjs9AZRGdRQLzOGpbWdBA,176
+llama_index/vector_stores/opensearch/base.py,sha256=IHHfsgsjY_9JKroivl-cFVyS74kQnzIIJCDMqEP7tfk,16877
+llama_index_vector_stores_opensearch-0.1.5.dist-info/METADATA,sha256=fsdPGHC07vUnALJftvDl8ZIFTEnQZxwZo1B1lGStLA0,677
+llama_index_vector_stores_opensearch-0.1.5.dist-info/WHEEL,sha256=d2fvjOD7sXsVzChCqf0Ty0JbHKBaLYwDbGQDwQTnJ50,88
+llama_index_vector_stores_opensearch-0.1.5.dist-info/RECORD,,

{llama_index_vector_stores_opensearch-0.1.3.dist-info → llama_index_vector_stores_opensearch-0.1.5.dist-info}/WHEEL RENAMED Viewed

@@ -1,4 +1,4 @@
 Wheel-Version: 1.0
-Generator: poetry-core 1.8.1
+Generator: poetry-core 1.7.0
 Root-Is-Purelib: true
 Tag: py3-none-any

llama_index_vector_stores_opensearch-0.1.3.dist-info/RECORD DELETED Viewed

@@ -1,5 +0,0 @@
-llama_index/vector_stores/opensearch/__init__.py,sha256=U1_XAkZb6zcskOk4s10NB8Tjs9AZRGdRQLzOGpbWdBA,176
-llama_index/vector_stores/opensearch/base.py,sha256=ohHZzOn3XAb3rXNFTq6YC6fNuGgQuKMdHIwPY0f2Wmo,15115
-llama_index_vector_stores_opensearch-0.1.3.dist-info/METADATA,sha256=yN7RT9C1S24AA0S9AGXoyzSm693GeKZtbExCp7bjc9A,721
-llama_index_vector_stores_opensearch-0.1.3.dist-info/WHEEL,sha256=FMvqSimYX_P7y0a7UY-_Mc83r5zkBZsCYPm7Lr0Bsq4,88
-llama_index_vector_stores_opensearch-0.1.3.dist-info/RECORD,,

llama-index-vector-stores-opensearch 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl

Potentially problematic release.

llama-index-vector-stores-opensearch 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl