ws-bom-robot-app 0.0.24__py3-none-any.whl → 0.0.25__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ws_bom_robot_app/llm/main.py +1 -0
- ws_bom_robot_app/llm/vector_store/generator.py +13 -5
- ws_bom_robot_app/llm/vector_store/integration/dropbox.py +1 -1
- ws_bom_robot_app/llm/vector_store/integration/manager.py +2 -0
- ws_bom_robot_app/llm/vector_store/integration/sharepoint.py +59 -4
- ws_bom_robot_app/llm/vector_store/loader/base.py +34 -30
- ws_bom_robot_app/llm/vector_store/loader/docling.py +35 -0
- {ws_bom_robot_app-0.0.24.dist-info → ws_bom_robot_app-0.0.25.dist-info}/METADATA +16 -6
- {ws_bom_robot_app-0.0.24.dist-info → ws_bom_robot_app-0.0.25.dist-info}/RECORD +11 -10
- {ws_bom_robot_app-0.0.24.dist-info → ws_bom_robot_app-0.0.25.dist-info}/WHEEL +0 -0
- {ws_bom_robot_app-0.0.24.dist-info → ws_bom_robot_app-0.0.25.dist-info}/top_level.txt +0 -0
ws_bom_robot_app/llm/main.py
CHANGED
|
@@ -25,6 +25,7 @@ async def invoke(rq: InvokeRequest) -> str:
|
|
|
25
25
|
|
|
26
26
|
async def __stream(rq: StreamRequest,queue: Queue,formatted: bool = True) -> None:
|
|
27
27
|
await rq.initialize()
|
|
28
|
+
#os.environ["KMP_DUPLICATE_LIB_OK"] = "TRUE"
|
|
28
29
|
if formatted:
|
|
29
30
|
agent_handler = AgentHandler(queue,rq.thread_id)
|
|
30
31
|
else:
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import os, gc, shutil, traceback
|
|
1
|
+
import os, gc, shutil, logging, traceback
|
|
2
2
|
import asyncio, aiofiles, aiofiles.os
|
|
3
3
|
from fastapi import HTTPException
|
|
4
4
|
from fastapi.responses import StreamingResponse
|
|
@@ -67,7 +67,9 @@ async def kb(rq: KbRequest) -> VectorDbResponse:
|
|
|
67
67
|
documents.extend(await loaders.load())
|
|
68
68
|
except Exception as e:
|
|
69
69
|
tb = traceback.format_exc()
|
|
70
|
-
|
|
70
|
+
_error = f"File loader failure: {e} | {tb}"
|
|
71
|
+
logging.warning(_error)
|
|
72
|
+
return VectorDbResponse(success = False, error = _error)
|
|
71
73
|
except Exception as e:
|
|
72
74
|
await _cleanup_directory(working_path)
|
|
73
75
|
return VectorDbResponse(success = False, error = f"Failed to download file {e}")
|
|
@@ -78,7 +80,9 @@ async def kb(rq: KbRequest) -> VectorDbResponse:
|
|
|
78
80
|
except Exception as e:
|
|
79
81
|
await _cleanup_directory(working_path)
|
|
80
82
|
tb = traceback.format_exc()
|
|
81
|
-
|
|
83
|
+
_error = f"Endpoint failure: {e} | {tb}"
|
|
84
|
+
logging.warning(_error)
|
|
85
|
+
return VectorDbResponse(success = False, error = _error)
|
|
82
86
|
|
|
83
87
|
if rq.integrations:
|
|
84
88
|
tasks = []
|
|
@@ -95,7 +99,9 @@ async def kb(rq: KbRequest) -> VectorDbResponse:
|
|
|
95
99
|
except Exception as e:
|
|
96
100
|
await _cleanup_directory(working_path)
|
|
97
101
|
tb = traceback.format_exc()
|
|
98
|
-
|
|
102
|
+
_error = f"Integration failure: {e} | {tb}"
|
|
103
|
+
logging.warning(_error)
|
|
104
|
+
return VectorDbResponse(success=False, error=_error)
|
|
99
105
|
|
|
100
106
|
#cleanup
|
|
101
107
|
await _cleanup_directory(working_path)
|
|
@@ -116,7 +122,9 @@ async def kb(rq: KbRequest) -> VectorDbResponse:
|
|
|
116
122
|
del documents
|
|
117
123
|
gc.collect()
|
|
118
124
|
else:
|
|
119
|
-
|
|
125
|
+
_error = "No documents found in the knowledgebase folder"
|
|
126
|
+
logging.warning(_error)
|
|
127
|
+
return VectorDbResponse(success = False, error = _error)
|
|
120
128
|
|
|
121
129
|
async def kb_stream_file(filename: str):
|
|
122
130
|
file_path = os.path.join(config.robot_data_folder, config.robot_data_db_folder, config.robot_data_db_folder_out, filename)
|
|
@@ -12,7 +12,7 @@ class DropboxParams(BaseModel):
|
|
|
12
12
|
Attributes:
|
|
13
13
|
remote_url (str): The URL of the remote Dropbox location, e.g. 'dropbox://demo-directory' or 'dropbox://demo-directory/sub-directory'.
|
|
14
14
|
token (str): The authentication token for accessing Dropbox.
|
|
15
|
-
create app: https://www.dropbox.com/developers, with file.content.read permission, and generate token.
|
|
15
|
+
create app: https://www.dropbox.com/developers, with file.content.read permission, and generate token, or use existing app: https://www.dropbox.com/account/connected_apps / https://www.dropbox.com/developers/apps?_tk=pilot_lp&_ad=topbar4&_camp=myapps
|
|
16
16
|
recursive (bool, optional): A flag indicating whether to search directories recursively. Defaults to False.
|
|
17
17
|
extension (list[str], optional): A list of file extensions to filter by. Defaults to None, e.g. ['.pdf', '.docx'].
|
|
18
18
|
"""
|
|
@@ -9,6 +9,7 @@ from ws_bom_robot_app.llm.vector_store.integration.googledrive import GoogleDriv
|
|
|
9
9
|
from ws_bom_robot_app.llm.vector_store.integration.jira import Jira
|
|
10
10
|
from ws_bom_robot_app.llm.vector_store.integration.s3 import S3
|
|
11
11
|
from ws_bom_robot_app.llm.vector_store.integration.sftp import Sftp
|
|
12
|
+
from ws_bom_robot_app.llm.vector_store.integration.sharepoint import Sharepoint
|
|
12
13
|
from ws_bom_robot_app.llm.vector_store.integration.sitemap import Sitemap
|
|
13
14
|
from ws_bom_robot_app.llm.vector_store.integration.slack import Slack
|
|
14
15
|
|
|
@@ -23,6 +24,7 @@ class IntegrationManager:
|
|
|
23
24
|
"llmkbjira": Jira,
|
|
24
25
|
"llmkbs3": S3,
|
|
25
26
|
"llmkbsftp": Sftp,
|
|
27
|
+
"llmkbsharepoint": Sharepoint,
|
|
26
28
|
"llmkbsitemap": Sitemap,
|
|
27
29
|
"llmkbslack": Slack,
|
|
28
30
|
|
|
@@ -1,12 +1,27 @@
|
|
|
1
|
-
import asyncio
|
|
1
|
+
import asyncio, logging, traceback
|
|
2
|
+
from dataclasses import dataclass
|
|
2
3
|
from ws_bom_robot_app.llm.vector_store.integration.base import IntegrationStrategy, UnstructuredIngest
|
|
3
|
-
from unstructured_ingest.v2.processes.connectors.sharepoint import SharepointIndexerConfig, SharepointDownloaderConfig, SharepointConnectionConfig, SharepointAccessConfig
|
|
4
|
+
from unstructured_ingest.v2.processes.connectors.sharepoint import SharepointIndexerConfig, SharepointIndexer, SharepointDownloaderConfig, SharepointConnectionConfig, SharepointAccessConfig
|
|
4
5
|
from langchain_core.documents import Document
|
|
5
6
|
from ws_bom_robot_app.llm.vector_store.loader.base import Loader
|
|
6
7
|
from typing import Union, Optional
|
|
7
8
|
from pydantic import BaseModel, Field, AliasChoices
|
|
8
9
|
|
|
9
10
|
class SharepointParams(BaseModel):
|
|
11
|
+
"""
|
|
12
|
+
SharepointParams is a Pydantic model that defines the parameters required to connect to a SharePoint site.
|
|
13
|
+
|
|
14
|
+
Attributes:
|
|
15
|
+
client_id (str): The client ID for SharePoint authentication.
|
|
16
|
+
client_secret (str): The client secret for SharePoint authentication.
|
|
17
|
+
site_url (str): The URL of the SharePoint site. i.e. site collection level: https://<tenant>.sharepoint.com/sites/<site-collection-name>, or root site: https://<tenant>.sharepoint.com
|
|
18
|
+
site_path (str, optional): The path in the SharePoint site from which to start parsing files, for example "Shared Documents". Defaults to None.
|
|
19
|
+
recursive (bool, optional): Whether to recursively access subdirectories. Defaults to False.
|
|
20
|
+
omit_files (bool, optional): Whether to omit files from the results. Defaults to False.
|
|
21
|
+
omit_pages (bool, optional): Whether to omit pages from the results. Defaults to False.
|
|
22
|
+
omit_lists (bool, optional): Whether to omit lists from the results. Defaults to False.
|
|
23
|
+
extension (list[str], optional): A list of file extensions to include, e.g. [".pdf"]. Defaults to None.
|
|
24
|
+
"""
|
|
10
25
|
client_id : str = Field(validation_alias=AliasChoices("clientId","client_id"))
|
|
11
26
|
client_secret : str = Field(validation_alias=AliasChoices("clientSecret","client_secret"))
|
|
12
27
|
site_url: str = Field(validation_alias=AliasChoices("siteUrl","site_url"))
|
|
@@ -40,12 +55,52 @@ class Sharepoint(IntegrationStrategy):
|
|
|
40
55
|
site=self.__data.site_url,
|
|
41
56
|
permissions_config=None
|
|
42
57
|
)
|
|
43
|
-
self.__unstructured_ingest.pipeline(
|
|
58
|
+
pipeline = self.__unstructured_ingest.pipeline(
|
|
44
59
|
indexer_config,
|
|
45
60
|
downloader_config,
|
|
46
61
|
connection_config,
|
|
47
|
-
extension=self.__data.extension)
|
|
62
|
+
extension=self.__data.extension)
|
|
63
|
+
current_indexer_process = pipeline.indexer_step.process
|
|
64
|
+
pipeline.indexer_step.process = CustomSharepointIndexer(**vars(current_indexer_process))
|
|
65
|
+
pipeline.run()
|
|
48
66
|
async def load(self) -> list[Document]:
|
|
49
67
|
await asyncio.to_thread(self.run)
|
|
50
68
|
await asyncio.sleep(1)
|
|
51
69
|
return await Loader(self.working_directory).load()
|
|
70
|
+
|
|
71
|
+
@dataclass
|
|
72
|
+
class CustomSharepointIndexer(SharepointIndexer):
|
|
73
|
+
def __init__(self, **kwargs):
|
|
74
|
+
# Initialize all attributes from the base indexer
|
|
75
|
+
for key, value in kwargs.items():
|
|
76
|
+
setattr(self, key, value)
|
|
77
|
+
def list_files(self, folder, recursive):
|
|
78
|
+
try:
|
|
79
|
+
_files = super().list_files(folder, recursive)
|
|
80
|
+
return _files
|
|
81
|
+
except Exception as e:
|
|
82
|
+
tb = traceback.format_exc()
|
|
83
|
+
logging.error(f"Error listing sharepoint files: {e} \n {tb}")
|
|
84
|
+
return []
|
|
85
|
+
def file_to_file_data(self, client, file):
|
|
86
|
+
try:
|
|
87
|
+
return super().file_to_file_data(client, file)
|
|
88
|
+
except Exception as e:
|
|
89
|
+
tb = traceback.format_exc()
|
|
90
|
+
logging.error(f"Error converting sharepoint file {file} to data: {e} \n {tb}")
|
|
91
|
+
return None
|
|
92
|
+
def list_pages(self, client):
|
|
93
|
+
try:
|
|
94
|
+
_pages = super().list_pages(client)
|
|
95
|
+
_allowed_content_type = None
|
|
96
|
+
for page in _pages:
|
|
97
|
+
# determine the allowed content type from the first page (Home.aspx)
|
|
98
|
+
if not _allowed_content_type:
|
|
99
|
+
_allowed_content_type = page.content_type_id
|
|
100
|
+
if not page.content_type_id == _allowed_content_type:
|
|
101
|
+
_pages.remove_child(page)
|
|
102
|
+
return _pages
|
|
103
|
+
except Exception as e:
|
|
104
|
+
tb = traceback.format_exc()
|
|
105
|
+
logging.error(f"Error listing sharepoint pages: {e} \n {tb}")
|
|
106
|
+
return []
|
|
@@ -1,21 +1,18 @@
|
|
|
1
|
-
|
|
2
1
|
import asyncio, gc, logging, os, traceback
|
|
3
2
|
from typing import Any, Optional
|
|
4
3
|
from langchain_community.document_loaders import DirectoryLoader
|
|
5
4
|
from langchain_community.document_loaders.base import BaseLoader
|
|
6
5
|
from langchain_community.document_loaders.merge import MergedDataLoader
|
|
7
6
|
from langchain_core.documents import Document
|
|
8
|
-
from langchain_unstructured import UnstructuredLoader
|
|
9
7
|
from pydantic import BaseModel
|
|
10
8
|
from ws_bom_robot_app.config import config
|
|
11
9
|
from ws_bom_robot_app.llm.vector_store.loader.json_loader import JsonLoader
|
|
10
|
+
from ws_bom_robot_app.llm.vector_store.loader.docling import DoclingLoader
|
|
11
|
+
from langchain_community.document_loaders import CSVLoader, UnstructuredPowerPointLoader, UnstructuredEmailLoader, UnstructuredXMLLoader, TextLoader, UnstructuredHTMLLoader
|
|
12
12
|
|
|
13
13
|
class LoaderConfig(BaseModel):
|
|
14
14
|
loader: type[BaseLoader]
|
|
15
|
-
kwargs: Optional[dict[str, Any]] = {
|
|
16
|
-
'chunking_strategy': 'basic',
|
|
17
|
-
'max_characters': 10_000
|
|
18
|
-
}
|
|
15
|
+
kwargs: Optional[dict[str, Any]] = {}
|
|
19
16
|
#post_processors: Optional[list[Callable[[str], str]]] = None
|
|
20
17
|
|
|
21
18
|
class Loader():
|
|
@@ -25,39 +22,46 @@ class Loader():
|
|
|
25
22
|
|
|
26
23
|
_list: dict[str, LoaderConfig | None] = {
|
|
27
24
|
'.json': LoaderConfig(loader=JsonLoader),
|
|
28
|
-
'.csv': LoaderConfig(loader=
|
|
29
|
-
'.xls':
|
|
30
|
-
'.xlsx': LoaderConfig(loader=
|
|
31
|
-
'.eml': LoaderConfig(loader=
|
|
32
|
-
'.msg': LoaderConfig(loader=
|
|
25
|
+
'.csv': LoaderConfig(loader=CSVLoader),
|
|
26
|
+
'.xls': None,
|
|
27
|
+
'.xlsx': LoaderConfig(loader=DoclingLoader),
|
|
28
|
+
'.eml': LoaderConfig(loader=UnstructuredEmailLoader,kwargs={"strategy":"auto", "process_attachments": False}),
|
|
29
|
+
'.msg': LoaderConfig(loader=UnstructuredEmailLoader,kwargs={"strategy":"auto", "process_attachments": False}),
|
|
33
30
|
'.epub': None,
|
|
34
|
-
'.md': LoaderConfig(loader=
|
|
31
|
+
'.md': LoaderConfig(loader=TextLoader),
|
|
35
32
|
'.org': None,
|
|
36
33
|
'.odt': None,
|
|
37
34
|
'.ppt': None,
|
|
38
|
-
'.pptx': LoaderConfig(loader=
|
|
39
|
-
'.txt': LoaderConfig(loader=
|
|
35
|
+
'.pptx': LoaderConfig(loader=UnstructuredPowerPointLoader,kwargs={"strategy":"auto"}), #docling issue with WMF https://github.com/DS4SD/docling/issues/594
|
|
36
|
+
'.txt': LoaderConfig(loader=TextLoader),
|
|
40
37
|
'.rst': None,
|
|
41
38
|
'.rtf': None,
|
|
42
39
|
'.tsv': None,
|
|
43
40
|
'.text': None,
|
|
44
41
|
'.log': None,
|
|
45
|
-
'.htm': LoaderConfig(loader=
|
|
46
|
-
'.html': LoaderConfig(loader=
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
'
|
|
55
|
-
'.
|
|
56
|
-
'.
|
|
42
|
+
'.htm': LoaderConfig(loader=UnstructuredHTMLLoader,kwargs={"strategy":"auto"}),
|
|
43
|
+
'.html': LoaderConfig(loader=UnstructuredHTMLLoader,kwargs={"strategy":"auto"}),
|
|
44
|
+
".pdf": LoaderConfig(loader=DoclingLoader),
|
|
45
|
+
#'.pdf': LoaderConfig(loader=UnstructuredLoader,kwargs={
|
|
46
|
+
# 'strategy':'ocr_only', #https://docs.unstructured.io/open-source/core-functionality/partitioning auto,ocr_only,hi_res
|
|
47
|
+
# 'split_pdf_page': False,
|
|
48
|
+
# 'chunking_strategy': 'basic',
|
|
49
|
+
# 'max_characters': 10_000,
|
|
50
|
+
# 'include_page_breaks': True,
|
|
51
|
+
# 'include_orig_elements': False}),
|
|
52
|
+
#'.png': LoaderConfig(loader=UnstructuredLoader,kwargs={"strategy":"ocr_only"}),
|
|
53
|
+
#'.jpg': LoaderConfig(loader=UnstructuredLoader,kwargs={"strategy":"ocr_only"}),
|
|
54
|
+
#'.jpeg': LoaderConfig(loader=UnstructuredLoader,kwargs={"strategy":"ocr_only"}),
|
|
55
|
+
'.png': LoaderConfig(loader=DoclingLoader),
|
|
56
|
+
'.jpg': LoaderConfig(loader=DoclingLoader),
|
|
57
|
+
'.jpeg': LoaderConfig(loader=DoclingLoader),
|
|
58
|
+
'.gif': None,
|
|
59
|
+
".emf": None,
|
|
60
|
+
".wmf": None,
|
|
57
61
|
'.tiff': None,
|
|
58
62
|
'.doc': None, #see liberoffice dependency
|
|
59
|
-
'.docx': LoaderConfig(loader=
|
|
60
|
-
'.xml': LoaderConfig(loader=
|
|
63
|
+
'.docx': LoaderConfig(loader=DoclingLoader),
|
|
64
|
+
'.xml': LoaderConfig(loader=UnstructuredXMLLoader,kwargs={"strategy":"auto"}),
|
|
61
65
|
'.js': None,
|
|
62
66
|
'.py': None,
|
|
63
67
|
'.c': None,
|
|
@@ -81,7 +85,7 @@ class Loader():
|
|
|
81
85
|
loader_configs = {}
|
|
82
86
|
for ext, loader_config in Loader._list.items():
|
|
83
87
|
if loader_config:
|
|
84
|
-
if all([self._runtime_options.loader_strategy != "",loader_config.kwargs
|
|
88
|
+
if all([self._runtime_options.loader_strategy != "",loader_config.kwargs and "strategy" in loader_config.kwargs]): # type: ignore
|
|
85
89
|
loader_config.kwargs["strategy"] = self._runtime_options.loader_strategy # type: ignore
|
|
86
90
|
loader_key = (loader_config.loader, tuple(loader_config.kwargs.items())) # type: ignore
|
|
87
91
|
if loader_key not in loader_configs:
|
|
@@ -122,7 +126,7 @@ class Loader():
|
|
|
122
126
|
return _documents
|
|
123
127
|
except Exception as e:
|
|
124
128
|
logging.warning(f"Attempt {attempt+1} load document failed: {e}")
|
|
125
|
-
await asyncio.sleep(
|
|
129
|
+
await asyncio.sleep(2)
|
|
126
130
|
if attempt == MAX_RETRIES - 1:
|
|
127
131
|
tb = traceback.format_exc()
|
|
128
132
|
logging.error(f"Failed to load documents: {e} | {tb}")
|
|
@@ -0,0 +1,35 @@
|
|
|
1
|
+
import os, logging, traceback
|
|
2
|
+
from typing import Iterator, AsyncIterator, Optional
|
|
3
|
+
from langchain_core.document_loaders import BaseLoader
|
|
4
|
+
from langchain_core.documents import Document
|
|
5
|
+
from langchain_core.runnables import run_in_executor
|
|
6
|
+
from docling.document_converter import DocumentConverter, ConversionResult, ConversionStatus
|
|
7
|
+
|
|
8
|
+
class DoclingLoader(BaseLoader):
|
|
9
|
+
def __init__(self, file_path: str | list[str]) -> None:
|
|
10
|
+
self._file_paths = file_path if isinstance(file_path, list) else [file_path]
|
|
11
|
+
self._converter = DocumentConverter()
|
|
12
|
+
def load(self) -> list[Document]:
|
|
13
|
+
"""Load data into Document objects."""
|
|
14
|
+
return list(self.lazy_load())
|
|
15
|
+
async def aload(self) -> list[Document]:
|
|
16
|
+
"""Load data into Document objects."""
|
|
17
|
+
return [document async for document in self.alazy_load()]
|
|
18
|
+
async def alazy_load(self) -> AsyncIterator[Document]:
|
|
19
|
+
"""A lazy loader for Documents."""
|
|
20
|
+
iterator = await run_in_executor(None, self.lazy_load)
|
|
21
|
+
done = object()
|
|
22
|
+
while True:
|
|
23
|
+
doc = await run_in_executor(None, next, iterator, done) # type: ignore[call-arg, arg-type]
|
|
24
|
+
if doc is done:
|
|
25
|
+
break
|
|
26
|
+
yield doc # type: ignore[misc]
|
|
27
|
+
def lazy_load(self) -> Iterator[Document]:
|
|
28
|
+
for source in self._file_paths:
|
|
29
|
+
try:
|
|
30
|
+
_result = self._converter.convert(os.path.abspath(source),raises_on_error=True)
|
|
31
|
+
doc = _result.document
|
|
32
|
+
text = doc.export_to_markdown()
|
|
33
|
+
yield Document(page_content=text, metadata={"source": source})
|
|
34
|
+
except Exception as e:
|
|
35
|
+
logging.warning(f"Failed to load document from {source}: {e} | {traceback.format_exc()}")
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: ws_bom_robot_app
|
|
3
|
-
Version: 0.0.
|
|
3
|
+
Version: 0.0.25
|
|
4
4
|
Summary: A FastAPI application serving ws bom/robot/llm platform ai.
|
|
5
5
|
Home-page: https://github.com/websolutespa/bom
|
|
6
6
|
Author: Websolute Spa
|
|
@@ -21,10 +21,8 @@ Requires-Dist: langchain-openai==0.2.10
|
|
|
21
21
|
Requires-Dist: langchain-community==0.3.8
|
|
22
22
|
Requires-Dist: langchain-core==0.3.21
|
|
23
23
|
Requires-Dist: faiss-cpu==1.9.0
|
|
24
|
-
Requires-Dist:
|
|
25
|
-
Requires-Dist:
|
|
26
|
-
Requires-Dist: unstructured[all-docs]==0.16.11
|
|
27
|
-
Requires-Dist: langchain_unstructured==0.1.5
|
|
24
|
+
Requires-Dist: unstructured==0.16.11
|
|
25
|
+
Requires-Dist: unstructured[image]
|
|
28
26
|
Requires-Dist: unstructured-ingest==0.3.8
|
|
29
27
|
Requires-Dist: unstructured-ingest[azure]
|
|
30
28
|
Requires-Dist: unstructured-ingest[confluence]
|
|
@@ -35,6 +33,7 @@ Requires-Dist: unstructured-ingest[google_drive]
|
|
|
35
33
|
Requires-Dist: unstructured-ingest[jira]
|
|
36
34
|
Requires-Dist: unstructured-ingest[s3]
|
|
37
35
|
Requires-Dist: unstructured-ingest[sftp]
|
|
36
|
+
Requires-Dist: unstructured-ingest[sharepoint]
|
|
38
37
|
Requires-Dist: unstructured-ingest[slack]
|
|
39
38
|
Requires-Dist: html5lib==1.1
|
|
40
39
|
Requires-Dist: markdownify==0.14.1
|
|
@@ -214,11 +213,22 @@ launch debugger
|
|
|
214
213
|
streamlit run debugger.py --server.port 6002
|
|
215
214
|
```
|
|
216
215
|
|
|
216
|
+
dockerize base image
|
|
217
|
+
|
|
218
|
+
```pwsh
|
|
219
|
+
<# cpu #>
|
|
220
|
+
docker build -f Dockerfile-robot-base-cpu -t ghcr.io/websolutespa/ws-bom-robot-base:cpu .
|
|
221
|
+
docker push ghcr.io/websolutespa/ws-bom-robot-base:cpu
|
|
222
|
+
<# gpu #>
|
|
223
|
+
docker build -f Dockerfile-robot-base-gpu -t ghcr.io/websolutespa/ws-bom-robot-base:gpu .
|
|
224
|
+
docker push ghcr.io/websolutespa/ws-bom-robot-base:gpu
|
|
225
|
+
```
|
|
226
|
+
|
|
217
227
|
dockerize app from src
|
|
218
228
|
|
|
219
229
|
```pwsh
|
|
220
230
|
docker build -f Dockerfile-src -t ws-bom-robot-app:src .
|
|
221
|
-
docker run --name ws-bom-robot-app-src -d -v "$(pwd)/ws_bom_robot_app:/app/ws_bom_robot_app" -p 6001:6001 ws-bom-robot-app:src
|
|
231
|
+
docker run --name ws-bom-robot-app-src -d -v "$(pwd)/ws_bom_robot_app:/app/ws_bom_robot_app" -v "$(pwd)/.data:/app/.data" -p 6001:6001 ws-bom-robot-app:src
|
|
222
232
|
```
|
|
223
233
|
|
|
224
234
|
### ✈️ publish
|
|
@@ -11,7 +11,7 @@ ws_bom_robot_app/llm/agent_handler.py,sha256=Qz3h1eZdA6pkurEbr8sQwl-0FdjugaO5Q9s
|
|
|
11
11
|
ws_bom_robot_app/llm/agent_lcel.py,sha256=jkSLMy6y_ZFvWT8bhBBYHY5CO-ea8oMSPMXMahFUBFc,2666
|
|
12
12
|
ws_bom_robot_app/llm/api.py,sha256=vBu_TFTlBjp7e3J-WmlZbXn_TbB550x-NpQN4YsO7To,3004
|
|
13
13
|
ws_bom_robot_app/llm/defaut_prompt.py,sha256=pn5a4lNLWE1NngHYjA_7tD8GasePMgsgude5fIJxsW0,756
|
|
14
|
-
ws_bom_robot_app/llm/main.py,sha256
|
|
14
|
+
ws_bom_robot_app/llm/main.py,sha256=_uW3Iy9iPJbxDfpyoReu3mbYY8a9dS1V6tZU-z6BELo,3547
|
|
15
15
|
ws_bom_robot_app/llm/settings.py,sha256=EkFGCppORenStH9W4e6_dYvQ-5p6xiEMpmUHBqNqG9M,117
|
|
16
16
|
ws_bom_robot_app/llm/models/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
17
17
|
ws_bom_robot_app/llm/models/api.py,sha256=KlVUbApyz6uuWefAN9K4B_vWDSps5hLW6hNg1Eo3TBQ,6996
|
|
@@ -31,26 +31,27 @@ ws_bom_robot_app/llm/utils/kb.py,sha256=jja45WCbNI7SGEgqDS99nErlwB5eY8Ga7BMnhdMH
|
|
|
31
31
|
ws_bom_robot_app/llm/utils/print.py,sha256=ZonoLPcfM6Cpw4_Ec455LiCovExOwvnIgvw1QORSCBY,799
|
|
32
32
|
ws_bom_robot_app/llm/utils/webhooks.py,sha256=LAAZqyN6VhV13wu4X-X85TwdDgAV2rNvIwQFIIc0FJM,2114
|
|
33
33
|
ws_bom_robot_app/llm/vector_store/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
34
|
-
ws_bom_robot_app/llm/vector_store/generator.py,sha256=
|
|
34
|
+
ws_bom_robot_app/llm/vector_store/generator.py,sha256=Xg-srcH_03lqPHkMn1EXP56GbY1CYa2zIbjvNfcQqyM,6192
|
|
35
35
|
ws_bom_robot_app/llm/vector_store/integration/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
36
36
|
ws_bom_robot_app/llm/vector_store/integration/azure.py,sha256=R37TaPQP-HJJJiaKE9rmMc9kpeXeRvdebbTY_982om0,3392
|
|
37
37
|
ws_bom_robot_app/llm/vector_store/integration/base.py,sha256=IvIu8RkISuurrVKr2YPG96fsOI2kqhaEGyTGzjB-jCI,1550
|
|
38
38
|
ws_bom_robot_app/llm/vector_store/integration/confluence.py,sha256=4fiRHB3J-SHZZxNGHwVkCrT-xSPbc91z4WrDE9fy6xU,2505
|
|
39
|
-
ws_bom_robot_app/llm/vector_store/integration/dropbox.py,sha256=
|
|
39
|
+
ws_bom_robot_app/llm/vector_store/integration/dropbox.py,sha256=yhGvHTN0TEpUfhdvvV7RX5MxBwTUyddAX95Fgqp3mCg,2629
|
|
40
40
|
ws_bom_robot_app/llm/vector_store/integration/gcs.py,sha256=fFDVDUR6eNB7FVTzDSEpMHFEWMgG16GLnpSf_mqGDdE,3184
|
|
41
41
|
ws_bom_robot_app/llm/vector_store/integration/github.py,sha256=18PO30AZcgTn6PHhid3MwImVAdmKBNkr0kmAPgOetGw,2663
|
|
42
42
|
ws_bom_robot_app/llm/vector_store/integration/googledrive.py,sha256=R6hr8iEgrR3QMOzIj5jY6w1x8pZ1LGdh4xM_q7g_ttc,3738
|
|
43
43
|
ws_bom_robot_app/llm/vector_store/integration/jira.py,sha256=o5iINIblp_yNszp54nf7fW97aqjs0A5G89N8sYrd1ds,2771
|
|
44
|
-
ws_bom_robot_app/llm/vector_store/integration/manager.py,sha256=
|
|
44
|
+
ws_bom_robot_app/llm/vector_store/integration/manager.py,sha256=5Fl3XML6f1wmgraigpUwIFIXh7QFPX0RI0YFgFxBAvg,1700
|
|
45
45
|
ws_bom_robot_app/llm/vector_store/integration/s3.py,sha256=3kh-VmH84IW7DdSLvOk6td1VBJ9aohlVJsk5F3cYj0U,3320
|
|
46
46
|
ws_bom_robot_app/llm/vector_store/integration/sftp.py,sha256=WNzjjS1EUykgFB-8e7QkecSa1r1jTJqKyGzR25uJCtM,2848
|
|
47
|
-
ws_bom_robot_app/llm/vector_store/integration/sharepoint.py,sha256=
|
|
47
|
+
ws_bom_robot_app/llm/vector_store/integration/sharepoint.py,sha256=zqqn-6qPrK50Phch4nZHJTgaPyPkGe7W2InGL_Ru6vE,5376
|
|
48
48
|
ws_bom_robot_app/llm/vector_store/integration/sitemap.py,sha256=nPbIywp-ZwWbWStvjvYVgHqqejyYFr8eZhBc8ycTuaU,4206
|
|
49
49
|
ws_bom_robot_app/llm/vector_store/integration/slack.py,sha256=FMjESXm2QetFXI6i8epze7Kbbu22fV8CVaxb71AHnJ8,2572
|
|
50
50
|
ws_bom_robot_app/llm/vector_store/loader/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
51
|
-
ws_bom_robot_app/llm/vector_store/loader/base.py,sha256=
|
|
51
|
+
ws_bom_robot_app/llm/vector_store/loader/base.py,sha256=SWV7T6BcsV8nvnUAHHZ9Q2oFUEnfwM33jpJCry5vbIA,5847
|
|
52
|
+
ws_bom_robot_app/llm/vector_store/loader/docling.py,sha256=aHHfMf2JsZo0o6jrRDlImY0Oi9NFhVQk8Wg5ePAPa50,1721
|
|
52
53
|
ws_bom_robot_app/llm/vector_store/loader/json_loader.py,sha256=qo9ejRZyKv_k6jnGgXnu1W5uqsMMtgqK_uvPpZQ0p74,833
|
|
53
|
-
ws_bom_robot_app-0.0.
|
|
54
|
-
ws_bom_robot_app-0.0.
|
|
55
|
-
ws_bom_robot_app-0.0.
|
|
56
|
-
ws_bom_robot_app-0.0.
|
|
54
|
+
ws_bom_robot_app-0.0.25.dist-info/METADATA,sha256=TObdL0LhroQrJaqOUTwLEY9gqyk_ct-yDPJzcOWps_w,7478
|
|
55
|
+
ws_bom_robot_app-0.0.25.dist-info/WHEEL,sha256=PZUExdf71Ui_so67QXpySuHtCi3-J3wvF4ORK6k_S8U,91
|
|
56
|
+
ws_bom_robot_app-0.0.25.dist-info/top_level.txt,sha256=Yl0akyHVbynsBX_N7wx3H3ZTkcMLjYyLJs5zBMDAKcM,17
|
|
57
|
+
ws_bom_robot_app-0.0.25.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|