ws-bom-robot-app 0.0.85__tar.gz → 0.0.87__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (83)
  1. {ws_bom_robot_app-0.0.85/ws_bom_robot_app.egg-info → ws_bom_robot_app-0.0.87}/PKG-INFO +20 -20
  2. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/requirements.txt +20 -20
  3. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/setup.py +1 -1
  4. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/config.py +3 -1
  5. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/agent_description.py +123 -123
  6. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/agent_handler.py +174 -166
  7. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/agent_lcel.py +50 -50
  8. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/api.py +65 -3
  9. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/defaut_prompt.py +15 -15
  10. ws_bom_robot_app-0.0.87/ws_bom_robot_app/llm/evaluator.py +319 -0
  11. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/feedbacks/feedback_manager.py +66 -66
  12. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/main.py +158 -158
  13. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/models/api.py +1 -1
  14. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/models/feedback.py +30 -30
  15. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/nebuly_handler.py +185 -185
  16. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/providers/llm_manager.py +27 -9
  17. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/tools/tool_builder.py +68 -65
  18. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/tools/tool_manager.py +332 -330
  19. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/tools/utils.py +41 -41
  20. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/utils/agent.py +34 -34
  21. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/utils/cms.py +114 -114
  22. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/utils/download.py +183 -183
  23. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/utils/print.py +29 -29
  24. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/generator.py +137 -137
  25. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/shopify.py +143 -143
  26. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/thron.py +102 -102
  27. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/loader/json_loader.py +25 -25
  28. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/task_manager.py +14 -10
  29. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87/ws_bom_robot_app.egg-info}/PKG-INFO +20 -20
  30. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app.egg-info/SOURCES.txt +1 -0
  31. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app.egg-info/requires.txt +19 -19
  32. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/MANIFEST.in +0 -0
  33. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/README.md +0 -0
  34. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/pyproject.toml +0 -0
  35. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/setup.cfg +0 -0
  36. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/__init__.py +0 -0
  37. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/auth.py +0 -0
  38. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/cron_manager.py +0 -0
  39. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/__init__.py +0 -0
  40. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/agent_context.py +0 -0
  41. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/feedbacks/__init__.py +0 -0
  42. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/models/__init__.py +0 -0
  43. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/models/base.py +0 -0
  44. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/models/kb.py +0 -0
  45. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/providers/__init__.py +0 -0
  46. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/tools/__init__.py +0 -0
  47. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/tools/models/__init__.py +0 -0
  48. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/tools/models/main.py +0 -0
  49. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/utils/__init__.py +0 -0
  50. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/utils/chunker.py +0 -0
  51. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/utils/cleanup.py +0 -0
  52. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/utils/secrets.py +0 -0
  53. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/utils/webhooks.py +0 -0
  54. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/__init__.py +0 -0
  55. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/db/__init__.py +0 -0
  56. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/db/base.py +0 -0
  57. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/db/chroma.py +0 -0
  58. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/db/faiss.py +0 -0
  59. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/db/manager.py +0 -0
  60. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/db/qdrant.py +0 -0
  61. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/__init__.py +0 -0
  62. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/azure.py +0 -0
  63. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/base.py +0 -0
  64. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/confluence.py +0 -0
  65. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/dropbox.py +0 -0
  66. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/gcs.py +0 -0
  67. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/github.py +0 -0
  68. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/googledrive.py +0 -0
  69. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/jira.py +0 -0
  70. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/manager.py +0 -0
  71. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/s3.py +0 -0
  72. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/sftp.py +0 -0
  73. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/sharepoint.py +0 -0
  74. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/sitemap.py +0 -0
  75. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/integration/slack.py +0 -0
  76. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/loader/__init__.py +0 -0
  77. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/loader/base.py +0 -0
  78. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/llm/vector_store/loader/docling.py +0 -0
  79. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/main.py +0 -0
  80. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/subprocess_runner.py +0 -0
  81. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app/util.py +0 -0
  82. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app.egg-info/dependency_links.txt +0 -0
  83. {ws_bom_robot_app-0.0.85 → ws_bom_robot_app-0.0.87}/ws_bom_robot_app.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ws_bom_robot_app
3
- Version: 0.0.85
3
+ Version: 0.0.87
4
4
  Summary: A FastAPI application serving ws bom/robot/llm platform ai.
5
5
  Home-page: https://github.com/websolutespa/bom
6
6
  Author: Websolute Spa
@@ -17,26 +17,26 @@ Requires-Dist: pydantic==2.11.7
17
17
  Requires-Dist: pydantic-settings==2.10.1
18
18
  Requires-Dist: fastapi[standard]==0.116.1
19
19
  Requires-Dist: chevron==0.14.0
20
- Requires-Dist: langchain==0.3.26
21
- Requires-Dist: langchain-community==0.3.26
22
- Requires-Dist: langchain-core==0.3.72
23
- Requires-Dist: langchain-openai==0.3.27
24
- Requires-Dist: langchain-anthropic==0.3.6
25
- Requires-Dist: langchain-ibm==0.3.14
26
- Requires-Dist: langchain-google-genai==2.0.7
27
- Requires-Dist: langchain-google-vertexai==2.0.27
28
- Requires-Dist: langchain-groq==0.3.6
29
- Requires-Dist: langchain-ollama==0.3.3
30
- Requires-Dist: faiss-cpu==1.11.0
31
- Requires-Dist: chromadb==1.0.15
32
- Requires-Dist: langchain_chroma==0.2.5
33
- Requires-Dist: fastembed==0.7.1
20
+ Requires-Dist: langchain==0.3.27
21
+ Requires-Dist: langchain-community==0.3.29
22
+ Requires-Dist: langchain-core==0.3.75
23
+ Requires-Dist: langchain-openai==0.3.32
24
+ Requires-Dist: langchain-anthropic==0.3.19
25
+ Requires-Dist: langchain-ibm==0.3.17
26
+ Requires-Dist: langchain-google-genai==2.1.10
27
+ Requires-Dist: langchain-google-vertexai==2.0.28
28
+ Requires-Dist: langchain-groq==0.3.7
29
+ Requires-Dist: langchain-ollama==0.3.7
30
+ Requires-Dist: openevals==0.1.0
31
+ Requires-Dist: faiss-cpu==1.12.0
32
+ Requires-Dist: chromadb==1.0.20
33
+ Requires-Dist: langchain-chroma==0.2.5
34
34
  Requires-Dist: langchain-qdrant==0.2.0
35
- Requires-Dist: qdrant-client==1.15.0
35
+ Requires-Dist: qdrant-client[fastembed]==1.15.1
36
36
  Requires-Dist: lark==1.2.2
37
- Requires-Dist: unstructured==0.18.11
37
+ Requires-Dist: unstructured==0.18.14
38
38
  Requires-Dist: unstructured[image]
39
- Requires-Dist: unstructured-ingest==1.2.6
39
+ Requires-Dist: unstructured-ingest==1.2.11
40
40
  Requires-Dist: unstructured-ingest[azure]
41
41
  Requires-Dist: unstructured-ingest[confluence]
42
42
  Requires-Dist: unstructured-ingest[dropbox]
@@ -49,9 +49,9 @@ Requires-Dist: unstructured-ingest[sftp]
49
49
  Requires-Dist: unstructured-ingest[sharepoint]
50
50
  Requires-Dist: unstructured-ingest[slack]
51
51
  Requires-Dist: html5lib==1.1
52
- Requires-Dist: markdownify==1.1.0
52
+ Requires-Dist: markdownify==1.2.0
53
53
  Requires-Dist: duckduckgo-search==8.0.4
54
- Requires-Dist: langchain_google_community==2.0.7
54
+ Requires-Dist: langchain-google-community==2.0.7
55
55
  Requires-Dist: trafilatura==2.0.0
56
56
  Dynamic: author
57
57
  Dynamic: author-email
@@ -8,30 +8,30 @@ fastapi[standard]==0.116.1
8
8
  chevron==0.14.0
9
9
 
10
10
  #framework
11
- langchain==0.3.26
12
- langchain-community==0.3.26
13
- langchain-core==0.3.72
14
- langchain-openai==0.3.27
15
- langchain-anthropic==0.3.6 #issue get_models() from 0.3.7
16
- langchain-ibm==0.3.14
17
- langchain-google-genai==2.0.7 #waiting for new release: https://github.com/langchain-ai/langchain-google/issues/711
18
- langchain-google-vertexai==2.0.27
19
- langchain-groq==0.3.6
20
- langchain-ollama==0.3.3
11
+ langchain==0.3.27
12
+ langchain-community==0.3.29
13
+ langchain-core==0.3.75
14
+ langchain-openai==0.3.32
15
+ langchain-anthropic==0.3.19
16
+ langchain-ibm==0.3.17
17
+ langchain-google-genai==2.1.10
18
+ langchain-google-vertexai==2.0.28
19
+ langchain-groq==0.3.7
20
+ langchain-ollama==0.3.7
21
+ openevals==0.1.0 #langsmith evaluation
21
22
 
22
23
  #vector DB
23
- faiss-cpu==1.11.0
24
- chromadb==1.0.15
25
- langchain_chroma==0.2.5
26
- fastembed==0.7.1 #qdrant sparse embedding
24
+ faiss-cpu==1.12.0
25
+ chromadb==1.0.20
26
+ langchain-chroma==0.2.5
27
27
  langchain-qdrant==0.2.0
28
- qdrant-client==1.15.0
28
+ qdrant-client[fastembed]==1.15.1
29
29
  lark==1.2.2 #self-query retriever
30
30
 
31
31
  #loaders
32
- unstructured==0.18.11
32
+ unstructured==0.18.14
33
33
  unstructured[image]
34
- unstructured-ingest==1.2.6
34
+ unstructured-ingest==1.2.11
35
35
  unstructured-ingest[azure]
36
36
  unstructured-ingest[confluence]
37
37
  unstructured-ingest[dropbox]
@@ -46,9 +46,9 @@ unstructured-ingest[slack]
46
46
  html5lib==1.1 #beautifulsoup4 parser
47
47
 
48
48
  #integrations
49
- markdownify==1.1.0 #sitemap
49
+ markdownify==1.2.0 #sitemap
50
50
 
51
- ##tools
51
+ #tools
52
52
  duckduckgo-search==8.0.4
53
- langchain_google_community==2.0.7
53
+ langchain-google-community==2.0.7
54
54
  trafilatura==2.0.0
@@ -4,7 +4,7 @@ _requirements = [line.split('#')[0].strip() for line in open("requirements.txt")
4
4
 
5
5
  setup(
6
6
  name="ws_bom_robot_app",
7
- version="0.0.85",
7
+ version="0.0.87",
8
8
  description="A FastAPI application serving ws bom/robot/llm platform ai.",
9
9
  long_description=open("README.md", encoding='utf-8').read(),
10
10
  long_description_content_type="text/markdown",
@@ -36,11 +36,12 @@ class Settings(BaseSettings):
36
36
  OLLAMA_API_URL: str = 'http://localhost:11434'
37
37
  GROQ_API_KEY: str = ''
38
38
  GOOGLE_API_KEY: str = ''
39
+ GOOGLE_APPLICATION_CREDENTIALS: str = '' # path to google credentials iam file, e.d. ./.secrets/google-credentials.json
39
40
  WATSONX_URL: str = ''
40
41
  WATSONX_APIKEY: str = ''
41
42
  WATSONX_PROJECTID: str = ''
42
43
  NEBULY_API_URL: str ='https://backend.nebuly.com/'
43
- GOOGLE_APPLICATION_CREDENTIALS: str = '' # path to google credentials iam file, e.d. ./.secrets/google-credentials.json
44
+ LANGSMITH_API_KEY: str = '' # app-wide api key to run evaluation
44
45
  model_config = ConfigDict(
45
46
  env_file='./.env',
46
47
  extra='ignore',
@@ -61,6 +62,7 @@ class Settings(BaseSettings):
61
62
  os.environ["WATSONX_APIKEY"] = self.WATSONX_APIKEY
62
63
  os.environ["WATSONX_PROJECTID"] = self.WATSONX_PROJECTID
63
64
  os.environ["NEBULY_API_URL"] = self.NEBULY_API_URL
65
+ os.environ["LANGSMITH_API_KEY"] = self.LANGSMITH_API_KEY
64
66
  # dir
65
67
  os.makedirs(self.robot_data_folder, exist_ok=True)
66
68
  for subfolder in [self.robot_data_db_folder, self.robot_data_attachment_folder, 'db']:
@@ -1,123 +1,123 @@
1
- import json, requests, re
2
- from typing import Any
3
- from abc import ABC, abstractmethod
4
- from langchain_core.prompts import ChatPromptTemplate
5
- from langchain_core.messages import AIMessage
6
- from langchain_core.runnables import RunnableSerializable
7
- from langchain_core.runnables import RunnableLambda
8
- from bs4 import BeautifulSoup
9
- from ws_bom_robot_app.llm.models.api import LlmRules
10
- from ws_bom_robot_app.llm.providers.llm_manager import LlmInterface
11
- from ws_bom_robot_app.llm.utils.agent import get_rules
12
-
13
- # SafeDict helper class
14
- class SafeDict(dict):
15
- def __missing__(self, key):
16
- return ''
17
-
18
- # Strategy Interface
19
- class AgentDescriptorStrategy(ABC):
20
- @abstractmethod
21
- def enrich_prompt(self, prompt: str, input: dict) -> str:
22
- pass
23
-
24
- @abstractmethod
25
- def rule_input(self, input: dict) -> str:
26
- pass
27
-
28
- # Concrete Strategy for Default Agent
29
- class DefaultAgentDescriptor(AgentDescriptorStrategy):
30
- def enrich_prompt(self, prompt: str, input: dict) -> str:
31
- # Default enrichment logic (could be minimal or no-op)
32
- return prompt.format_map(SafeDict(input))
33
-
34
- def rule_input(self, input: dict) -> str:
35
- return input.get('content', "")
36
-
37
- # Concrete Strategy for URL2Text Agent
38
- class URL2TextAgentDescriptor(AgentDescriptorStrategy):
39
- def enrich_prompt(self, prompt: str, input: dict) -> str:
40
- input["context"] = self._get_page_text(input)
41
- return prompt.format_map(SafeDict(input))
42
-
43
- def rule_input(self, input: dict) -> str:
44
- return input.get('context', "")
45
-
46
- def _get_page_text(self, input: dict) -> str:
47
- url = input.get("content", "")
48
- exclusions = input.get("exclude", {})
49
- response = requests.get(url)
50
- response.raise_for_status()
51
- soup = BeautifulSoup(response.content, 'html5lib')
52
- classes_to_exclude = exclusions.get("classes", [])
53
- ids_to_exclude = exclusions.get("ids", [])
54
- for class_name in classes_to_exclude:
55
- for element in soup.find_all(class_=class_name):
56
- element.extract()
57
- for id_name in ids_to_exclude:
58
- for element in soup.find_all(id=id_name):
59
- element.extract()
60
- for script in soup(["script", "noscript", "style", "head", "footer", "iframe"]):
61
- script.extract()
62
- return re.sub(' +', ' ', soup.get_text())
63
-
64
-
65
- class AgentDescriptor:
66
- # Dictionary to hold all agent strategies
67
- _list: dict[str,AgentDescriptorStrategy] = {
68
- "default": DefaultAgentDescriptor(),
69
- "url2text": URL2TextAgentDescriptor(),
70
- }
71
-
72
- # Functions to manage strategies
73
- @staticmethod
74
- def add_strategy(name: str, strategy: AgentDescriptorStrategy):
75
- """_summary_
76
- add a new strategy to the dictionary
77
- Args:
78
- name (str): name of the strategy, in lowercase
79
- strategy (AgentDescriptorStrategy): class implementing the strategy
80
- Examples:
81
- AgentDescriptor.add_strategy("custom_agent_descriptor", CustomAgentDescriptor())
82
- """
83
- AgentDescriptor._list[name.lower()] = strategy
84
-
85
- @staticmethod
86
- def get_strategy(name: str) -> AgentDescriptorStrategy:
87
- return AgentDescriptor._list.get(name.lower(), DefaultAgentDescriptor())
88
-
89
- def __init__(self, llm: LlmInterface, prompt: str, mode: str, rules: LlmRules = None):
90
- self.__prompt = prompt
91
- self.__llm = llm
92
- self.rules= rules
93
- self.strategy = self.get_strategy(mode) # Selects the strategy from the dictionary
94
-
95
- async def __create_prompt(self, input_dict: dict):
96
- input_data = json.loads(input_dict.get("input", {}))
97
- system = self.strategy.enrich_prompt(self.__prompt, input_data)
98
- if self.rules:
99
- rule_input = self.strategy.rule_input(input_data)
100
- rules_prompt = await get_rules(self.__llm.get_embeddings(), self.rules, rule_input)
101
- system += rules_prompt
102
- return ChatPromptTemplate.from_messages(
103
- [
104
- ("system", system),
105
- ("user", input_data.get("content", ""))
106
- ]
107
- )
108
-
109
- def __create_agent_descriptor(self, content) -> RunnableSerializable[Any, Any]:
110
- content = json.loads(content)
111
- agent = (
112
- {
113
- "input": lambda x: x["input"],
114
- }
115
- | RunnableLambda(self.__create_prompt)
116
- | self.__llm.get_llm()
117
- )
118
- return agent
119
-
120
- async def run_agent(self, content) -> Any:
121
- agent_descriptor = self.__create_agent_descriptor(content)
122
- response: AIMessage = await agent_descriptor.ainvoke({"input": content})
123
- return response
1
+ import json, requests, re
2
+ from typing import Any
3
+ from abc import ABC, abstractmethod
4
+ from langchain_core.prompts import ChatPromptTemplate
5
+ from langchain_core.messages import AIMessage
6
+ from langchain_core.runnables import RunnableSerializable
7
+ from langchain_core.runnables import RunnableLambda
8
+ from bs4 import BeautifulSoup
9
+ from ws_bom_robot_app.llm.models.api import LlmRules
10
+ from ws_bom_robot_app.llm.providers.llm_manager import LlmInterface
11
+ from ws_bom_robot_app.llm.utils.agent import get_rules
12
+
13
+ # SafeDict helper class
14
+ class SafeDict(dict):
15
+ def __missing__(self, key):
16
+ return ''
17
+
18
+ # Strategy Interface
19
+ class AgentDescriptorStrategy(ABC):
20
+ @abstractmethod
21
+ def enrich_prompt(self, prompt: str, input: dict) -> str:
22
+ pass
23
+
24
+ @abstractmethod
25
+ def rule_input(self, input: dict) -> str:
26
+ pass
27
+
28
+ # Concrete Strategy for Default Agent
29
+ class DefaultAgentDescriptor(AgentDescriptorStrategy):
30
+ def enrich_prompt(self, prompt: str, input: dict) -> str:
31
+ # Default enrichment logic (could be minimal or no-op)
32
+ return prompt.format_map(SafeDict(input))
33
+
34
+ def rule_input(self, input: dict) -> str:
35
+ return input.get('content', "")
36
+
37
+ # Concrete Strategy for URL2Text Agent
38
+ class URL2TextAgentDescriptor(AgentDescriptorStrategy):
39
+ def enrich_prompt(self, prompt: str, input: dict) -> str:
40
+ input["context"] = self._get_page_text(input)
41
+ return prompt.format_map(SafeDict(input))
42
+
43
+ def rule_input(self, input: dict) -> str:
44
+ return input.get('context', "")
45
+
46
+ def _get_page_text(self, input: dict) -> str:
47
+ url = input.get("content", "")
48
+ exclusions = input.get("exclude", {})
49
+ response = requests.get(url)
50
+ response.raise_for_status()
51
+ soup = BeautifulSoup(response.content, 'html5lib')
52
+ classes_to_exclude = exclusions.get("classes", [])
53
+ ids_to_exclude = exclusions.get("ids", [])
54
+ for class_name in classes_to_exclude:
55
+ for element in soup.find_all(class_=class_name):
56
+ element.extract()
57
+ for id_name in ids_to_exclude:
58
+ for element in soup.find_all(id=id_name):
59
+ element.extract()
60
+ for script in soup(["script", "noscript", "style", "head", "footer", "iframe"]):
61
+ script.extract()
62
+ return re.sub(' +', ' ', soup.get_text())
63
+
64
+
65
+ class AgentDescriptor:
66
+ # Dictionary to hold all agent strategies
67
+ _list: dict[str,AgentDescriptorStrategy] = {
68
+ "default": DefaultAgentDescriptor(),
69
+ "url2text": URL2TextAgentDescriptor(),
70
+ }
71
+
72
+ # Functions to manage strategies
73
+ @staticmethod
74
+ def add_strategy(name: str, strategy: AgentDescriptorStrategy):
75
+ """_summary_
76
+ add a new strategy to the dictionary
77
+ Args:
78
+ name (str): name of the strategy, in lowercase
79
+ strategy (AgentDescriptorStrategy): class implementing the strategy
80
+ Examples:
81
+ AgentDescriptor.add_strategy("custom_agent_descriptor", CustomAgentDescriptor())
82
+ """
83
+ AgentDescriptor._list[name.lower()] = strategy
84
+
85
+ @staticmethod
86
+ def get_strategy(name: str) -> AgentDescriptorStrategy:
87
+ return AgentDescriptor._list.get(name.lower(), DefaultAgentDescriptor())
88
+
89
+ def __init__(self, llm: LlmInterface, prompt: str, mode: str, rules: LlmRules = None):
90
+ self.__prompt = prompt
91
+ self.__llm = llm
92
+ self.rules= rules
93
+ self.strategy = self.get_strategy(mode) # Selects the strategy from the dictionary
94
+
95
+ async def __create_prompt(self, input_dict: dict):
96
+ input_data = json.loads(input_dict.get("input", {}))
97
+ system = self.strategy.enrich_prompt(self.__prompt, input_data)
98
+ if self.rules:
99
+ rule_input = self.strategy.rule_input(input_data)
100
+ rules_prompt = await get_rules(self.__llm.get_embeddings(), self.rules, rule_input)
101
+ system += rules_prompt
102
+ return ChatPromptTemplate.from_messages(
103
+ [
104
+ ("system", system),
105
+ ("user", input_data.get("content", ""))
106
+ ]
107
+ )
108
+
109
+ def __create_agent_descriptor(self, content) -> RunnableSerializable[Any, Any]:
110
+ content = json.loads(content)
111
+ agent = (
112
+ {
113
+ "input": lambda x: x["input"],
114
+ }
115
+ | RunnableLambda(self.__create_prompt)
116
+ | self.__llm.get_llm()
117
+ )
118
+ return agent
119
+
120
+ async def run_agent(self, content) -> Any:
121
+ agent_descriptor = self.__create_agent_descriptor(content)
122
+ response: AIMessage = await agent_descriptor.ainvoke({"input": content})
123
+ return response