PyPI - davidkhala.ai - Versions diffs - 0.1.3__tar.gz → 0.1.4__tar.gz - Mend

davidkhala.ai 0.1.3 (tar.gz) → 0.1.4 (tar.gz)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (28) hide show

{davidkhala_ai-0.1.3 → davidkhala_ai-0.1.4}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: davidkhala.ai
-Version: 0.1.3
+Version: 0.1.4
 Summary: misc AI modules
 Requires-Python: >=3.13
 Provides-Extra: ali

{davidkhala_ai-0.1.3 → davidkhala_ai-0.1.4}/davidkhala/ai/agent/dify/knowledge.py RENAMED Viewed

@@ -141,13 +141,40 @@ class Dataset(API):
                 'limit': size
             })
-        def list_documents(self) -> Iterable[list[DocumentDict]]:
-            return Iterator(self.paginate_documents, None)
+        def list_documents(self) -> Iterable[DocumentDict]:
+            for document_batch in Iterator(self.paginate_documents, None):
+                for document in document_batch:
+                    yield document
         def has_document(self, name) -> bool:
             return any(name == item['name'] for row in self.list_documents() for item in row)
+class ChunkDict(TypedDict):
+    id: str
+    position: int
+    document_id: str
+    content: str
+    sign_content: str  # trimmed version of content
+    answer: Optional[str]  # only used in QA chunk
+    word_count: int
+    tokens: int
+    keywords: Optional[list[str]]
+    index_node_id: str  # chunk 在向量索引中的节点 ID
+    index_node_hash: str  # hash of sign_content
+    hit_count: int
+    enabled: bool
+    status: str  # 'completed'
+    created_at: int  # timestamp
+    updated_at: int  # timestamp
+    completed_at: int  # timestamp
+    created_by: str  # user id
+    child_chunks: list
+    error: Optional
+    stopped_at: Optional[int]  # timestamp
+    disabled_at: Optional[int]  # timestamp
 class Document(API):
     def __init__(self, d: Dataset.Instance, document_id: str):
         super().__init__(d.api_key, f"{d.base_url}/documents/{document_id}")
@@ -162,10 +189,14 @@ class Document(API):
     def get(self):
         return self.request(self.base_url, "GET")
     def paginate_chunks(self, page=1, size=20):
         return self.request(f"{self.base_url}/segments", "GET", params={
-            'page':page,
-            'limit':size
+            'page': page,
+            'limit': size
         })
-    def list_chunks(self)->Iterable[list]: # TODO ChunkDict
-        return Iterator(self.paginate_chunks, None)
+    def list_chunks(self) -> Iterable[ChunkDict]:
+        for chunk_batch in Iterator(self.paginate_chunks, None):
+            for chunk in chunk_batch:
+                yield chunk

{davidkhala_ai-0.1.3 → davidkhala_ai-0.1.4}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [project]
 name = "davidkhala.ai"
-version = "0.1.3"
+version = "0.1.4"
 description = "misc AI modules"
 readme = "README.md"
 requires-python = ">=3.13"