alita-sdk 0.3.205__py3-none-any.whl → 0.3.207__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (42)
  1. alita_sdk/runtime/clients/client.py +314 -11
  2. alita_sdk/runtime/langchain/assistant.py +22 -21
  3. alita_sdk/runtime/langchain/interfaces/llm_processor.py +1 -4
  4. alita_sdk/runtime/langchain/langraph_agent.py +6 -1
  5. alita_sdk/runtime/langchain/store_manager.py +4 -4
  6. alita_sdk/runtime/toolkits/application.py +5 -10
  7. alita_sdk/runtime/toolkits/tools.py +11 -21
  8. alita_sdk/runtime/tools/vectorstore.py +25 -11
  9. alita_sdk/runtime/utils/streamlit.py +505 -222
  10. alita_sdk/runtime/utils/toolkit_runtime.py +147 -0
  11. alita_sdk/runtime/utils/toolkit_utils.py +157 -0
  12. alita_sdk/runtime/utils/utils.py +5 -0
  13. alita_sdk/tools/__init__.py +2 -0
  14. alita_sdk/tools/ado/repos/repos_wrapper.py +20 -13
  15. alita_sdk/tools/bitbucket/api_wrapper.py +5 -5
  16. alita_sdk/tools/bitbucket/cloud_api_wrapper.py +54 -29
  17. alita_sdk/tools/elitea_base.py +9 -4
  18. alita_sdk/tools/gitlab/__init__.py +22 -10
  19. alita_sdk/tools/gitlab/api_wrapper.py +278 -253
  20. alita_sdk/tools/gitlab/tools.py +354 -376
  21. alita_sdk/tools/llm/llm_utils.py +0 -6
  22. alita_sdk/tools/memory/__init__.py +54 -10
  23. alita_sdk/tools/openapi/__init__.py +14 -3
  24. alita_sdk/tools/sharepoint/__init__.py +2 -1
  25. alita_sdk/tools/sharepoint/api_wrapper.py +11 -3
  26. alita_sdk/tools/testrail/api_wrapper.py +39 -16
  27. alita_sdk/tools/utils/content_parser.py +77 -13
  28. {alita_sdk-0.3.205.dist-info → alita_sdk-0.3.207.dist-info}/METADATA +1 -1
  29. {alita_sdk-0.3.205.dist-info → alita_sdk-0.3.207.dist-info}/RECORD +32 -40
  30. alita_sdk/community/analysis/__init__.py +0 -0
  31. alita_sdk/community/analysis/ado_analyse/__init__.py +0 -103
  32. alita_sdk/community/analysis/ado_analyse/api_wrapper.py +0 -261
  33. alita_sdk/community/analysis/github_analyse/__init__.py +0 -98
  34. alita_sdk/community/analysis/github_analyse/api_wrapper.py +0 -166
  35. alita_sdk/community/analysis/gitlab_analyse/__init__.py +0 -110
  36. alita_sdk/community/analysis/gitlab_analyse/api_wrapper.py +0 -172
  37. alita_sdk/community/analysis/jira_analyse/__init__.py +0 -141
  38. alita_sdk/community/analysis/jira_analyse/api_wrapper.py +0 -252
  39. alita_sdk/runtime/llms/alita.py +0 -259
  40. {alita_sdk-0.3.205.dist-info → alita_sdk-0.3.207.dist-info}/WHEEL +0 -0
  41. {alita_sdk-0.3.205.dist-info → alita_sdk-0.3.207.dist-info}/licenses/LICENSE +0 -0
  42. {alita_sdk-0.3.205.dist-info → alita_sdk-0.3.207.dist-info}/top_level.txt +0 -0
alita_sdk/runtime/tools/vectorstore.py
@@ -1,6 +1,9 @@
 import json
 import math
-from typing import Any, Optional, List, Dict, Callable
+import types
+from typing import Any, Optional, List, Dict, Callable, Generator
+
+from langchain_core.documents import Document
 from pydantic import BaseModel, model_validator, Field
 from ..langchain.tools.vector import VectorAdapter
 from langchain_core.messages import HumanMessage
@@ -8,6 +11,7 @@ from alita_sdk.tools.elitea_base import BaseToolApiWrapper
 from logging import getLogger

 from ..utils.logging import dispatch_custom_event
+from ..utils.utils import IndexerKeywords

 logger = getLogger(__name__)

@@ -197,25 +201,29 @@ class VectorStoreWrapper(BaseToolApiWrapper):
             for doc_str, meta, db_id in zip(data['documents'], data['metadatas'], data['ids']):
                 doc = json.loads(doc_str)
                 doc_id = str(meta['id'])
+                dependent_docs = meta.get(IndexerKeywords.DEPENDENT_DOCS.value, [])
+                parent_id = meta.get(IndexerKeywords.PARENT.value, -1)
                 result[doc_id] = {
                     'metadata': meta,
                     'document': doc,
-                    'id': db_id
+                    'id': db_id,
+                    IndexerKeywords.DEPENDENT_DOCS.value: dependent_docs,
+                    IndexerKeywords.PARENT.value: parent_id
                 }
         except Exception as e:
             logger.error(f"Failed to get indexed data from vectorstore: {str(e)}. Continuing with empty index.")
         return result

-    def _reduce_duplicates(self, documents, store) -> List[Any]:
+    def _reduce_duplicates(self, documents: Generator[Document, None, None], store) -> List[Any]:
         """Remove documents already indexed in the vectorstore based on metadata 'id' and 'updated_on' fields."""

         self._log_data("Verification of documents to index started", tool_name="index_documents")

-        data = self._get_indexed_data(store)
-        indexed_ids = set(data.keys())
+        indexed_data = self._get_indexed_data(store)
+        indexed_ids = set(indexed_data.keys())
         if not indexed_ids:
             self._log_data("Vectorstore is empty, indexing all incoming documents", tool_name="index_documents")
-            return documents
+            return list(documents)

         final_docs = []
         docs_to_remove = []
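
The new metadata keys come from the IndexerKeywords enum now imported from ..utils.utils (entry 12 in the file list, +5 lines). Its definition is not shown in this diff; below is a minimal sketch consistent with the .value accesses above — the member names are taken from the diff, the string values are assumptions:

# Sketch only: the real IndexerKeywords lives in alita_sdk/runtime/utils/utils.py.
from enum import Enum

class IndexerKeywords(Enum):
    DEPENDENT_DOCS = "dependent_docs"  # assumed value: ids of docs derived from this one
    PARENT = "parent_id"               # assumed value: id of the doc this one came from

# Each entry returned by _get_indexed_data then carries the dependency links:
meta = {"id": "42", IndexerKeywords.DEPENDENT_DOCS.value: ["42_1", "42_2"]}
dependent_docs = meta.get(IndexerKeywords.DEPENDENT_DOCS.value, [])  # ["42_1", "42_2"]
parent_id = meta.get(IndexerKeywords.PARENT.value, -1)               # -1 (default)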
@@ -226,13 +234,17 @@ class VectorStoreWrapper(BaseToolApiWrapper):
             if doc_id in indexed_ids:
                 # document has been indexed already, then verify `updated_on`
                 to_index_updated_on = document.metadata.get('updated_on')
-                indexed_meta = data[doc_id]['metadata']
+                indexed_meta = indexed_data[doc_id]['metadata']
                 indexed_updated_on = indexed_meta.get('updated_on')
                 if to_index_updated_on and indexed_updated_on and to_index_updated_on == indexed_updated_on:
                     # same updated_on, skip indexing
                     continue
                 # if updated_on is missing or different, we will re-index the document and remove old one
-                docs_to_remove.append(data[doc_id]['id'])
+                # parent doc removal
+                docs_to_remove.append(indexed_data[doc_id]['id'])
+                # mark dependent docs for removal
+                for dependent_doc_id in indexed_data[doc_id][IndexerKeywords.DEPENDENT_DOCS.value]:
+                    docs_to_remove.append(indexed_data[dependent_doc_id]['id'])
             else:
                 final_docs.append(document)

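Why the extra loop matters: when a parent document is re-indexed, any documents derived from it are now purged as well, so stale chunks cannot linger in the store. A standalone sketch of this cascading removal — plain-string keys stand in for the IndexerKeywords values, and all ids are invented:

# indexed_data mirrors the structure built by _get_indexed_data above.
indexed_data = {
    "doc-1":       {"id": "db-101", "dependent_docs": ["doc-1-chunk"], "parent_id": -1},
    "doc-1-chunk": {"id": "db-102", "dependent_docs": [], "parent_id": "doc-1"},
}

docs_to_remove = []
doc_id = "doc-1"  # incoming document whose `updated_on` changed
docs_to_remove.append(indexed_data[doc_id]["id"])      # parent entry
for dep_id in indexed_data[doc_id]["dependent_docs"]:  # cascade to derived docs
    docs_to_remove.append(indexed_data[dep_id]["id"])

print(docs_to_remove)  # ['db-101', 'db-102']

Note that indexed_data[dependent_doc_id] assumes every dependent id is itself present in the index; a .get() guard would make the cascade tolerant of partially indexed dependents.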
@@ -245,7 +257,7 @@ class VectorStoreWrapper(BaseToolApiWrapper):

         return final_docs

-    def index_documents(self, documents, progress_step: int = 20, clean_index: bool = True):
+    def index_documents(self, documents: Generator[Document, None, None], progress_step: int = 20, clean_index: bool = True):
         """ Index documents in the vectorstore.

         Args:
@@ -269,6 +281,8 @@ class VectorStoreWrapper(BaseToolApiWrapper):
                                tool_name="index_documents")
             except Exception as e:
                 logger.warning(f"Failed to clean index: {str(e)}. Continuing with re-indexing.")
+            if isinstance(documents, types.GeneratorType):
+                documents = list(documents)
         else:
             # remove duplicates based on metadata 'id' and 'updated_on' fields
             documents = self._reduce_duplicates(documents, self.vectoradapter.vectorstore)
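
The new isinstance guard exists because index_documents may now receive a generator (per the new type hint), while the code after this branch needs len(documents) and list concatenation — and a generator can only be consumed once. A small sketch of the pitfall and the fix, using nothing beyond the standard library:

import types

def stream_docs():
    yield "a"
    yield "b"

documents = stream_docs()
# len(documents) would raise TypeError, and a second pass would see an
# exhausted generator, so materialize it once up front:
if isinstance(documents, types.GeneratorType):
    documents = list(documents)

assert len(documents) == 2
assert documents + ["c"] == ["a", "b", "c"]  # concatenation now works too

The else branch needs no guard because _reduce_duplicates already returns a list.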
@@ -281,7 +295,7 @@ class VectorStoreWrapper(BaseToolApiWrapper):
         # if func is provided, apply it to documents
         # used for processing of documents before indexing,
         # e.g. to avoid time-consuming operations for documents that are already indexed
-        self.process_document_func(documents) if self.process_document_func else None
+        dependent_docs_generator = self.process_document_func(documents) if self.process_document_func else []

         # notify user about missed required metadata fields: id, updated_on
         # it is not required to have them, but it is recommended to have them for proper re-indexing and duplicate detection
@@ -292,7 +306,7 @@ class VectorStoreWrapper(BaseToolApiWrapper):
         logger.debug(f"Indexing documents: {documents}")
         logger.debug(self.vectoradapter)

-        documents = list(documents)
+        documents = documents + list(dependent_docs_generator)
         total_docs = len(documents)
         documents_count = 0
         _documents = []
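
Taken together, the last two hunks promote process_document_func from a fire-and-forget side effect into a producer of dependent documents, which are appended to the parent batch so total_docs counts both. A sketch with a hypothetical chunking callback — fake_process is invented for illustration; the real callback is supplied by the caller:

from typing import Iterable, List
from langchain_core.documents import Document

def fake_process(docs: List[Document]) -> Iterable[Document]:
    # Invented stand-in for process_document_func: one derived "chunk" per parent.
    for d in docs:
        yield Document(page_content=d.page_content[:5],
                       metadata={"parent_id": d.metadata.get("id")})

documents = [Document(page_content="hello world", metadata={"id": "1"})]
dependent_docs_generator = fake_process(documents)

# Mirrors the final hunk: parents first, then derived docs.
documents = documents + list(dependent_docs_generator)
total_docs = len(documents)  # 2 — progress reporting now covers both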