beswarm-0.1.37-py3-none-any.whl → beswarm-0.1.39-py3-none-any.whl
This diff shows the changes between publicly released versions of the package as they appear in their public registry. It is provided for informational purposes only.
- beswarm/aient/setup.py +1 -1
- beswarm/aient/src/aient/models/claude.py +0 -67
- beswarm/aient/src/aient/models/groq.py +0 -34
- beswarm/aient/src/aient/plugins/config.py +3 -12
- beswarm/aient/src/aient/plugins/websearch.py +1 -1
- beswarm/aient/src/aient/utils/scripts.py +0 -23
- {beswarm-0.1.37.dist-info → beswarm-0.1.39.dist-info}/METADATA +3 -3
- {beswarm-0.1.37.dist-info → beswarm-0.1.39.dist-info}/RECORD +10 -11
- beswarm/aient/test/test_langchain_search_old.py +0 -235
- {beswarm-0.1.37.dist-info → beswarm-0.1.39.dist-info}/WHEEL +0 -0
- {beswarm-0.1.37.dist-info → beswarm-0.1.39.dist-info}/top_level.txt +0 -0
beswarm/aient/setup.py
CHANGED
@@ -4,7 +4,7 @@ from setuptools import setup, find_packages
 
 setup(
     name="aient",
-    version="1.0.
+    version="1.0.95",
     description="Aient: The Awakening of Agent.",
     long_description=Path.open(Path("README.md"), encoding="utf-8").read(),
     long_description_content_type="text/markdown",
beswarm/aient/src/aient/models/claude.py
CHANGED
@@ -2,7 +2,6 @@ import os
 import re
 import json
 import copy
-import tiktoken
 import requests
 
 from .base import BaseLLM
@@ -65,39 +64,6 @@ class claude(BaseLLM):
         self.conversation[convo_id] = claudeConversation()
         self.system_prompt = system_prompt or self.system_prompt
 
-    def __truncate_conversation(self, convo_id: str = "default") -> None:
-        """
-        Truncate the conversation
-        """
-        while True:
-            if (
-                self.get_token_count(convo_id) > self.truncate_limit
-                and len(self.conversation[convo_id]) > 1
-            ):
-                # Don't remove the first message
-                self.conversation[convo_id].pop(1)
-            else:
-                break
-
-    def get_token_count(self, convo_id: str = "default") -> int:
-        """
-        Get token count
-        """
-        tiktoken.model.MODEL_TO_ENCODING["claude-2.1"] = "cl100k_base"
-        encoding = tiktoken.encoding_for_model(self.engine)
-
-        num_tokens = 0
-        for message in self.conversation[convo_id]:
-            # every message follows <im_start>{role/name}\n{content}<im_end>\n
-            num_tokens += 5
-            for key, value in message.items():
-                if value:
-                    num_tokens += len(encoding.encode(value))
-                if key == "name":  # if there's a name, the role is omitted
-                    num_tokens += 5  # role is always required and always 1 token
-        num_tokens += 5  # every reply is primed with <im_start>assistant
-        return num_tokens
-
     def ask_stream(
         self,
         prompt: str,
@@ -267,39 +233,6 @@ class claude3(BaseLLM):
         self.conversation[convo_id] = list()
         self.system_prompt = system_prompt or self.system_prompt
 
-    def __truncate_conversation(self, convo_id: str = "default") -> None:
-        """
-        Truncate the conversation
-        """
-        while True:
-            if (
-                self.get_token_count(convo_id) > self.truncate_limit
-                and len(self.conversation[convo_id]) > 1
-            ):
-                # Don't remove the first message
-                self.conversation[convo_id].pop(1)
-            else:
-                break
-
-    def get_token_count(self, convo_id: str = "default") -> int:
-        """
-        Get token count
-        """
-        tiktoken.model.MODEL_TO_ENCODING["claude-2.1"] = "cl100k_base"
-        encoding = tiktoken.encoding_for_model(self.engine)
-
-        num_tokens = 0
-        for message in self.conversation[convo_id]:
-            # every message follows <im_start>{role/name}\n{content}<im_end>\n
-            num_tokens += 5
-            for key, value in message.items():
-                if value:
-                    num_tokens += len(encoding.encode(value))
-                if key == "name":  # if there's a name, the role is omitted
-                    num_tokens += 5  # role is always required and always 1 token
-        num_tokens += 5  # every reply is primed with <im_start>assistant
-        return num_tokens
-
     def ask_stream(
         self,
         prompt: str,
beswarm/aient/src/aient/models/groq.py
CHANGED
@@ -1,7 +1,6 @@
 import os
 import json
 import requests
-import tiktoken
 
 from .base import BaseLLM
 
@@ -52,39 +51,6 @@ class groq(BaseLLM):
         self.conversation[convo_id] = list()
         self.system_prompt = system_prompt or self.system_prompt
 
-    def __truncate_conversation(self, convo_id: str = "default") -> None:
-        """
-        Truncate the conversation
-        """
-        while True:
-            if (
-                self.get_token_count(convo_id) > self.truncate_limit
-                and len(self.conversation[convo_id]) > 1
-            ):
-                # Don't remove the first message
-                self.conversation[convo_id].pop(1)
-            else:
-                break
-
-    def get_token_count(self, convo_id: str = "default") -> int:
-        """
-        Get token count
-        """
-        # tiktoken.model.MODEL_TO_ENCODING["mixtral-8x7b-32768"] = "cl100k_base"
-        encoding = tiktoken.get_encoding("cl100k_base")
-
-        num_tokens = 0
-        for message in self.conversation[convo_id]:
-            # every message follows <im_start>{role/name}\n{content}<im_end>\n
-            num_tokens += 5
-            for key, value in message.items():
-                if value:
-                    num_tokens += len(encoding.encode(value))
-                if key == "name":  # if there's a name, the role is omitted
-                    num_tokens += 5  # role is always required and always 1 token
-        num_tokens += 5  # every reply is primed with <im_start>assistant
-        return num_tokens
-
     def ask_stream(
         self,
         prompt: str,
beswarm/aient/src/aient/plugins/config.py
CHANGED
@@ -3,8 +3,7 @@ import json
 import inspect
 
 from .registry import registry
-from ..utils.
-from ..utils.prompt import search_key_word_prompt, arxiv_doc_user_prompt
+from ..utils.prompt import search_key_word_prompt
 
 async def get_tools_result_async(function_call_name, function_full_response, function_call_max_tokens, engine, robot, api_key, api_url, use_plugins, model, add_message, convo_id, language):
     function_response = ""
@@ -26,10 +25,7 @@ async def get_tools_result_async(function_call_name, function_full_response, fun
                 yield chunk
             else:
                 function_response = "\n\n".join(chunk)
-
-        # function_response = yield from eval(function_call_name)(prompt, keywords)
-        function_call_max_tokens = 32000
-        function_response, text_len = cut_message(function_response, function_call_max_tokens, engine)
+
         if function_response:
             function_response = (
                 f"You need to response the following question: {prompt}. Search results is provided inside <Search_results></Search_results> XML tags. Your task is to think about the question step by step and then answer the above question in {language} based on the Search results provided. Please response in {language} and adopt a style that is logical, in-depth, and detailed. Note: In order to make the answer appear highly professional, you should be an expert in textual analysis, aiming to make the answer precise and comprehensive. Directly response markdown format, without using markdown code blocks. For each sentence quoting search results, a markdown ordered superscript number url link must be used to indicate the source, e.g., [¹](https://www.example.com)"
@@ -40,18 +36,13 @@ async def get_tools_result_async(function_call_name, function_full_response, fun
             ).format(function_response)
         else:
             function_response = "无法找到相关信息,停止使用 tools"
-
-        # self.add_to_conversation(user_prompt, "user", convo_id=convo_id)
+
     elif function_to_call:
         prompt = json.loads(function_full_response)
         if inspect.iscoroutinefunction(function_to_call):
            function_response = await function_to_call(**prompt)
         else:
            function_response = function_to_call(**prompt)
-        function_response, text_len = cut_message(function_response, function_call_max_tokens, engine)
-
-        # if function_call_name == "download_read_arxiv_pdf":
-        #     add_message(arxiv_doc_user_prompt, "user", convo_id=convo_id)
 
     function_response = (
         f"function_response:{function_response}"
beswarm/aient/src/aient/plugins/websearch.py
CHANGED
@@ -6,7 +6,6 @@ import threading
 import time as record_time
 from itertools import islice
 from bs4 import BeautifulSoup
-from duckduckgo_search import DDGS
 from .registry import register_tool
 
 class ThreadWithReturnValue(threading.Thread):
@@ -178,6 +177,7 @@ def get_url_content(url: str) -> str:
 
 def getddgsearchurl(query, max_results=4):
     try:
+        from duckduckgo_search import DDGS
         results = []
         with DDGS() as ddgs:
             ddgs_gen = ddgs.text(query, safesearch='Off', timelimit='y', backend="lite")
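The two websearch.py hunks above move the duckduckgo_search import from module level to inside getddgsearchurl(), so the plugin module can still be imported when the optional dependency is absent. A minimal sketch of that deferred-import pattern (the ImportError guard and error message are illustrative additions, not code from this diff):

```python
# Sketch: import the optional dependency only when the search tool is called.
def getddgsearchurl(query, max_results=4):
    try:
        from duckduckgo_search import DDGS  # deferred, optional dependency
    except ImportError as exc:  # illustrative guard, not present in the diff
        raise RuntimeError(
            'duckduckgo-search is not installed; install the "search" extra'
        ) from exc
    urls = []
    with DDGS() as ddgs:
        # same text() call as the real function above
        for result in ddgs.text(query, safesearch='Off', timelimit='y', backend="lite"):
            urls.append(result.get("href"))
            if len(urls) >= max_results:
                break
    return urls
```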
beswarm/aient/src/aient/utils/scripts.py
CHANGED
@@ -1,33 +1,10 @@
 import os
 import json
-import base64
-import tiktoken
 import requests
 import urllib.parse
 
 from ..core.utils import get_image_message
 
-def get_encode_text(text, model_name):
-    tiktoken.get_encoding("cl100k_base")
-    model_name = "gpt-3.5-turbo"
-    encoding = tiktoken.encoding_for_model(model_name)
-    encode_text = encoding.encode(text, disallowed_special=())
-    return encoding, encode_text
-
-def get_text_token_len(text, model_name):
-    encoding, encode_text = get_encode_text(text, model_name)
-    return len(encode_text)
-
-def cut_message(message: str, max_tokens: int, model_name: str):
-    if type(message) != str:
-        message = str(message)
-    encoding, encode_text = get_encode_text(message, model_name)
-    if len(encode_text) > max_tokens:
-        encode_text = encode_text[:max_tokens]
-        message = encoding.decode(encode_text)
-        encode_text = encoding.encode(message, disallowed_special=())
-    return message, len(encode_text)
-
 def get_doc_from_url(url):
     filename = urllib.parse.unquote(url.split("/")[-1])
     response = requests.get(url, stream=True)
{beswarm-0.1.37.dist-info → beswarm-0.1.39.dist-info}/METADATA
CHANGED
@@ -1,12 +1,11 @@
 Metadata-Version: 2.4
 Name: beswarm
-Version: 0.1.
+Version: 0.1.39
 Summary: MAS
 Requires-Python: >=3.11
 Description-Content-Type: text/markdown
 Requires-Dist: beautifulsoup4>=4.13.4
 Requires-Dist: diskcache>=5.6.3
-Requires-Dist: duckduckgo-search==5.3.1
 Requires-Dist: fake-useragent>=2.2.0
 Requires-Dist: fastapi>=0.115.12
 Requires-Dist: grep-ast>=0.8.1
@@ -27,8 +26,9 @@ Requires-Dist: pyperclip>=1.9.0
 Requires-Dist: pytz>=2025.2
 Requires-Dist: requests>=2.32.3
 Requires-Dist: scipy>=1.15.2
-Requires-Dist: tiktoken==0.6.0
 Requires-Dist: tqdm>=4.67.1
+Provides-Extra: search
+Requires-Dist: duckduckgo-search==5.3.1; extra == "search"
 
 # beswarm
 
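The METADATA hunks drop the hard tiktoken and duckduckgo-search requirements and re-declare the latter behind a new "search" extra. The Provides-Extra / conditional Requires-Dist pair above is what setuptools emits for an optional extra; a hypothetical packaging sketch (beswarm's actual build configuration is not part of this diff):

```python
# Hypothetical setup.py fragment: declaring duckduckgo-search under an optional
# "search" extra produces the Provides-Extra / Requires-Dist lines shown above.
from setuptools import setup, find_packages

setup(
    name="example-package",  # placeholder, not beswarm's real config
    version="0.0.1",
    packages=find_packages(),
    extras_require={
        "search": ["duckduckgo-search==5.3.1"],
    },
)
```

With the extra in place, a default install no longer pulls in duckduckgo-search; users who need the search tool opt in with something like `pip install "beswarm[search]"`.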
{beswarm-0.1.37.dist-info → beswarm-0.1.39.dist-info}/RECORD
CHANGED
@@ -1,7 +1,7 @@
 beswarm/__init__.py,sha256=HZjUOJtZR5QhMuDbq-wukQQn1VrBusNWai_ysGo-VVI,20
 beswarm/utils.py,sha256=AdDCcqAIIKQEMl7PfryVgeT9G5sHe7QNsZnrvmTGA8E,283
 beswarm/aient/main.py,sha256=SiYAIgQlLJqYusnTVEJOx1WNkSJKMImhgn5aWjfroxg,3814
-beswarm/aient/setup.py,sha256=
+beswarm/aient/setup.py,sha256=gX6fAYtVyLi9NHeEKPMGPF4IxtQ9MvEnJy1besWMS5U,487
 beswarm/aient/src/aient/__init__.py,sha256=SRfF7oDVlOOAi6nGKiJIUK6B_arqYLO9iSMp-2IZZps,21
 beswarm/aient/src/aient/core/__init__.py,sha256=NxjebTlku35S4Dzr16rdSqSTWUvvwEeACe8KvHJnjPg,34
 beswarm/aient/src/aient/core/log_config.py,sha256=kz2_yJv1p-o3lUQOwA3qh-LSc3wMHv13iCQclw44W9c,274
@@ -17,14 +17,14 @@ beswarm/aient/src/aient/models/__init__.py,sha256=ouNDNvoBBpIFrLsk09Q_sq23HR0GbL
 beswarm/aient/src/aient/models/audio.py,sha256=kRd-8-WXzv4vwvsTGwnstK-WR8--vr9CdfCZzu8y9LA,1934
 beswarm/aient/src/aient/models/base.py,sha256=z-Z0pJfTN2x0cuwfvu0BdMRY9O-RmLwHEnBIJN1x4Fg,6719
 beswarm/aient/src/aient/models/chatgpt.py,sha256=-NWkkKxTCyraPYT0YN37NA2rUfOaDNXtvFSQmIE5tS8,45066
-beswarm/aient/src/aient/models/claude.py,sha256=
+beswarm/aient/src/aient/models/claude.py,sha256=JezghW7y0brl4Y5qiSHvnYR5prQCFywX4RViHt39pGI,26037
 beswarm/aient/src/aient/models/duckduckgo.py,sha256=1l7vYCs9SG5SWPCbcl7q6pCcB5AUF_r-a4l9frz3Ogo,8115
 beswarm/aient/src/aient/models/gemini.py,sha256=chGLc-8G_DAOxr10HPoOhvVFW1RvMgHd6mt--VyAW98,14730
-beswarm/aient/src/aient/models/groq.py,sha256=
+beswarm/aient/src/aient/models/groq.py,sha256=eXfSOaPxgQEtk4U8qseArN8rFYOFBfMsPwRcDW1nERo,8790
 beswarm/aient/src/aient/models/vertex.py,sha256=qVD5l1Q538xXUPulxG4nmDjXE1VoV4yuAkTCpIeJVw0,16795
 beswarm/aient/src/aient/plugins/__init__.py,sha256=p3KO6Aa3Lupos4i2SjzLQw1hzQTigOAfEHngsldrsyk,986
 beswarm/aient/src/aient/plugins/arXiv.py,sha256=yHjb6PS3GUWazpOYRMKMzghKJlxnZ5TX8z9F6UtUVow,1461
-beswarm/aient/src/aient/plugins/config.py,sha256=
+beswarm/aient/src/aient/plugins/config.py,sha256=Vp6CG9ocdC_FAlCMEGtKj45xamir76DFxdJVvURNtog,6539
 beswarm/aient/src/aient/plugins/excute_command.py,sha256=u-JOZ21dDcDx1j3O0KVIHAsa6MNuOxHFBdV3iCnTih0,5413
 beswarm/aient/src/aient/plugins/get_time.py,sha256=Ih5XIW5SDAIhrZ9W4Qe5Hs1k4ieKPUc_LAd6ySNyqZk,654
 beswarm/aient/src/aient/plugins/image.py,sha256=ZElCIaZznE06TN9xW3DrSukS7U3A5_cjk1Jge4NzPxw,2072
@@ -32,13 +32,13 @@ beswarm/aient/src/aient/plugins/list_directory.py,sha256=5ubm-mfrj-tanGSDp4M_Tmb
 beswarm/aient/src/aient/plugins/read_file.py,sha256=cJxGnhcz1_gjkgeemVyixLUiCvf-dWm-UtDfrbFdlLE,4857
 beswarm/aient/src/aient/plugins/registry.py,sha256=YknzhieU_8nQ3oKlUSSWDB4X7t2Jx0JnqT2Jd9Xsvfk,3574
 beswarm/aient/src/aient/plugins/run_python.py,sha256=dgcUwBunMuDkaSKR5bToudVzSdrXVewktDDFUz_iIOQ,4589
-beswarm/aient/src/aient/plugins/websearch.py,sha256=
+beswarm/aient/src/aient/plugins/websearch.py,sha256=a-JJZjEZ5MEQ9WBMkD7okBHYehLSzApoLMiyqBnxDqs,15193
 beswarm/aient/src/aient/plugins/write_file.py,sha256=qmT6iQ3mDyVAa9Sld1jfJq0KPZj0w2kRIHq0JyjpGeA,1853
 beswarm/aient/src/aient/prompt/__init__.py,sha256=GBtn6-JDT8KHFCcuPpfSNE_aGddg5p4FEyMCy4BfwGs,20
 beswarm/aient/src/aient/prompt/agent.py,sha256=3VycHGnUq9OdR5pd_RM0AeLESlpAgBcmzrsesfq82X0,23856
 beswarm/aient/src/aient/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 beswarm/aient/src/aient/utils/prompt.py,sha256=UcSzKkFE4-h_1b6NofI6xgk3GoleqALRKY8VBaXLjmI,11311
-beswarm/aient/src/aient/utils/scripts.py,sha256=
+beswarm/aient/src/aient/utils/scripts.py,sha256=JbYHsU3LLtxBcuO_2MWbSgpHpCgtVQe9FGEFJpUyejc,25926
 beswarm/aient/test/chatgpt.py,sha256=Hvl7FuDt1c74N5TVBmhErOPvJbJJzA7FNp5VoZM4u30,4957
 beswarm/aient/test/claude.py,sha256=IyB4qI1eJLwlSfDNSnt2FhbQWYyBighHUjJxEXc3osQ,1095
 beswarm/aient/test/test.py,sha256=rldnoLQdtRR8IKFSIzTti7eIK2MpPMoi9gL5qD8_K44,29
@@ -58,7 +58,6 @@ beswarm/aient/test/test_get_token_dict.py,sha256=QuR67aUbS9hTwBjndsr1u7-juopEe1K
 beswarm/aient/test/test_google_search.py,sha256=rPaKqD_N3ogHYE5DrMfRmKumcVAHKC7LcYw5euR_zGM,1035
 beswarm/aient/test/test_jieba.py,sha256=ydqIrPtJ71cgbQSXpkS_g1kSiBzEpk0mjv6N-6ETw4g,1139
 beswarm/aient/test/test_json.py,sha256=cbKSwwSwt1A9sdn5vO_5cGca0x2rR4skejAgb8uDDu0,2284
-beswarm/aient/test/test_langchain_search_old.py,sha256=QGZSYi-aBB5qrKPI64qfgENbGozfrSGQBpNZpHt0d7k,9066
 beswarm/aient/test/test_logging.py,sha256=DFZ2KqrTVH6FQ5BKJIQudZxWRUdkzWka2QjmtVYPXvw,995
 beswarm/aient/test/test_ollama.py,sha256=ywy9l06S1g1AnWQvlBbhpac7i-hBB9bpwi-pk0Afivc,1325
 beswarm/aient/test/test_plugin.py,sha256=0sBwpf1YdKba-IVPZwBMKbLR7buHfudLS9NOETm7BTc,779
@@ -128,7 +127,7 @@ beswarm/tools/repomap.py,sha256=CwvwoN5Swr42EzrORTTeV8MMb7mPviy4a4b0fxBu50k,4082
 beswarm/tools/search_arxiv.py,sha256=9slwBemXjEqrd7-YgVmyMijPXlkhZCybEDRVhWVQ9B0,7937
 beswarm/tools/think.py,sha256=WLw-7jNIsnS6n8MMSYUin_f-BGLENFmnKM2LISEp0co,1760
 beswarm/tools/worker.py,sha256=FfKCx7KFNbMRoAXtjU1_nJQjx9WHny7KBq8OXSYICJs,5334
-beswarm-0.1.
-beswarm-0.1.
-beswarm-0.1.
-beswarm-0.1.
+beswarm-0.1.39.dist-info/METADATA,sha256=pOFh4a12JYNDKCeFjK6k9LoB6JGlqvc7EFVNVSWsqg8,3208
+beswarm-0.1.39.dist-info/WHEEL,sha256=0CuiUZ_p9E4cD6NyLD6UG80LBXYyiSYZOKDm5lp32xk,91
+beswarm-0.1.39.dist-info/top_level.txt,sha256=pJw4O87wvt5882smuSO6DfByJz7FJ8SxxT8h9fHCmpo,8
+beswarm-0.1.39.dist-info/RECORD,,
beswarm/aient/test/test_langchain_search_old.py
DELETED
@@ -1,235 +0,0 @@
-import os
-import re
-
-import sys
-sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
-import config
-
-from langchain.chat_models import ChatOpenAI
-
-
-from langchain.chains import RetrievalQA, RetrievalQAWithSourcesChain
-
-from langchain.prompts.chat import (
-    ChatPromptTemplate,
-    SystemMessagePromptTemplate,
-    HumanMessagePromptTemplate,
-)
-from langchain.embeddings.openai import OpenAIEmbeddings
-from langchain.vectorstores import Chroma
-from langchain.text_splitter import CharacterTextSplitter
-
-from langchain.document_loaders import UnstructuredPDFLoader
-
-def getmd5(string):
-    import hashlib
-    md5_hash = hashlib.md5()
-    md5_hash.update(string.encode('utf-8'))
-    md5_hex = md5_hash.hexdigest()
-    return md5_hex
-
-from utils.sitemap import SitemapLoader
-async def get_doc_from_sitemap(url):
-    # https://www.langchain.asia/modules/indexes/document_loaders/examples/sitemap#%E8%BF%87%E6%BB%A4%E7%AB%99%E7%82%B9%E5%9C%B0%E5%9B%BE-url-
-    sitemap_loader = SitemapLoader(web_path=url)
-    docs = await sitemap_loader.load()
-    return docs
-
-async def get_doc_from_local(docpath, doctype="md"):
-    from langchain.document_loaders import DirectoryLoader
-    # 加载文件夹中的所有txt类型的文件
-    loader = DirectoryLoader(docpath, glob='**/*.' + doctype)
-    # 将数据转成 document 对象,每个文件会作为一个 document
-    documents = loader.load()
-    return documents
-
-system_template="""Use the following pieces of context to answer the users question.
-If you don't know the answer, just say "Hmm..., I'm not sure.", don't try to make up an answer.
-ALWAYS return a "Sources" part in your answer.
-The "Sources" part should be a reference to the source of the document from which you got your answer.
-
-Example of your response should be:
-
-```
-The answer is foo
-
-Sources:
-1. abc
-2. xyz
-```
-Begin!
-----------------
-{summaries}
-"""
-messages = [
-    SystemMessagePromptTemplate.from_template(system_template),
-    HumanMessagePromptTemplate.from_template("{question}")
-]
-prompt = ChatPromptTemplate.from_messages(messages)
-
-def get_chain(store, llm):
-    chain_type_kwargs = {"prompt": prompt}
-    chain = RetrievalQAWithSourcesChain.from_chain_type(
-        llm,
-        chain_type="stuff",
-        retriever=store.as_retriever(),
-        chain_type_kwargs=chain_type_kwargs,
-        reduce_k_below_max_tokens=True
-    )
-    return chain
-
-async def docQA(docpath, query_message, persist_db_path="db", model = "gpt-3.5-turbo"):
-    chatllm = ChatOpenAI(temperature=0.5, openai_api_base=config.bot_api_url.v1_url, model_name=model, openai_api_key=config.API)
-    embeddings = OpenAIEmbeddings(openai_api_base=config.bot_api_url.v1_url, openai_api_key=config.API)
-
-    sitemap = "sitemap.xml"
-    match = re.match(r'^(https?|ftp)://[^\s/$.?#].[^\s]*$', docpath)
-    if match:
-        doc_method = get_doc_from_sitemap
-        docpath = os.path.join(docpath, sitemap)
-    else:
-        doc_method = get_doc_from_local
-
-    persist_db_path = getmd5(docpath)
-    if not os.path.exists(persist_db_path):
-        documents = await doc_method(docpath)
-        # 初始化加载器
-        text_splitter = CharacterTextSplitter(chunk_size=100, chunk_overlap=50)
-        # 持久化数据
-        split_docs = text_splitter.split_documents(documents)
-        vector_store = Chroma.from_documents(split_docs, embeddings, persist_directory=persist_db_path)
-        vector_store.persist()
-    else:
-        # 加载数据
-        vector_store = Chroma(persist_directory=persist_db_path, embedding_function=embeddings)
-
-    # 创建问答对象
-    qa = get_chain(vector_store, chatllm)
-    # qa = RetrievalQA.from_chain_type(llm=chatllm, chain_type="stuff", retriever=vector_store.as_retriever(), return_source_documents=True)
-    # 进行问答
-    result = qa({"question": query_message})
-    return result
-
-
-def persist_emdedding_pdf(docurl, persist_db_path):
-    embeddings = OpenAIEmbeddings(openai_api_base=config.bot_api_url.v1_url, openai_api_key=os.environ.get('API', None))
-    filename = get_doc_from_url(docurl)
-    docpath = os.getcwd() + "/" + filename
-    loader = UnstructuredPDFLoader(docpath)
-    documents = loader.load()
-    # 初始化加载器
-    text_splitter = CharacterTextSplitter(chunk_size=100, chunk_overlap=25)
-    # 切割加载的 document
-    split_docs = text_splitter.split_documents(documents)
-    vector_store = Chroma.from_documents(split_docs, embeddings, persist_directory=persist_db_path)
-    vector_store.persist()
-    os.remove(docpath)
-    return vector_store
-
-async def pdfQA(docurl, docpath, query_message, model="gpt-3.5-turbo"):
-    chatllm = ChatOpenAI(temperature=0.5, openai_api_base=config.bot_api_url.v1_url, model_name=model, openai_api_key=os.environ.get('API', None))
-    embeddings = OpenAIEmbeddings(openai_api_base=config.bot_api_url.v1_url, openai_api_key=os.environ.get('API', None))
-    persist_db_path = getmd5(docpath)
-    if not os.path.exists(persist_db_path):
-        vector_store = persist_emdedding_pdf(docurl, persist_db_path)
-    else:
-        vector_store = Chroma(persist_directory=persist_db_path, embedding_function=embeddings)
-    qa = RetrievalQA.from_chain_type(llm=chatllm, chain_type="stuff", retriever=vector_store.as_retriever(), return_source_documents=True)
-    result = qa({"query": query_message})
-    return result['result']
-
-
-def pdf_search(docurl, query_message, model="gpt-3.5-turbo"):
-    chatllm = ChatOpenAI(temperature=0.5, openai_api_base=config.bot_api_url.v1_url, model_name=model, openai_api_key=os.environ.get('API', None))
-    embeddings = OpenAIEmbeddings(openai_api_base=config.bot_api_url.v1_url, openai_api_key=os.environ.get('API', None))
-    filename = get_doc_from_url(docurl)
-    docpath = os.getcwd() + "/" + filename
-    loader = UnstructuredPDFLoader(docpath)
-    try:
-        documents = loader.load()
-    except:
-        print("pdf load error! docpath:", docpath)
-        return ""
-    os.remove(docpath)
-    # 初始化加载器
-    text_splitter = CharacterTextSplitter(chunk_size=100, chunk_overlap=25)
-    # 切割加载的 document
-    split_docs = text_splitter.split_documents(documents)
-    vector_store = Chroma.from_documents(split_docs, embeddings)
-    # 创建问答对象
-    qa = RetrievalQA.from_chain_type(llm=chatllm, chain_type="stuff", retriever=vector_store.as_retriever(),return_source_documents=True)
-    # 进行问答
-    result = qa({"query": query_message})
-    return result['result']
-
-def summary_each_url(threads, chainllm, prompt):
-    summary_prompt = PromptTemplate(
-        input_variables=["web_summary", "question", "language"],
-        template=(
-            "You need to response the following question: {question}."
-            "Your task is answer the above question in {language} based on the Search results provided. Provide a detailed and in-depth response"
-            "If there is no relevant content in the search results, just answer None, do not make any explanations."
-            "Search results: {web_summary}."
-        ),
-    )
-    summary_threads = []
-
-    for t in threads:
-        tmp = t.join()
-        print(tmp)
-        chain = LLMChain(llm=chainllm, prompt=summary_prompt)
-        chain_thread = ThreadWithReturnValue(target=chain.run, args=({"web_summary": tmp, "question": prompt, "language": config.LANGUAGE},))
-        chain_thread.start()
-        summary_threads.append(chain_thread)
-
-    url_result = ""
-    for t in summary_threads:
-        tmp = t.join()
-        print("summary", tmp)
-        if tmp != "None":
-            url_result += "\n\n" + tmp
-    return url_result
-
-def get_search_results(prompt: str, context_max_tokens: int):
-
-    url_text_list = get_url_text_list(prompt)
-    useful_source_text = "\n\n".join(url_text_list)
-    # useful_source_text = summary_each_url(threads, chainllm, prompt)
-
-    useful_source_text, search_tokens_len = cut_message(useful_source_text, context_max_tokens)
-    print("search tokens len", search_tokens_len, "\n\n")
-
-    return useful_source_text
-
-from typing import Any
-from langchain.schema.output import LLMResult
-from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler
-class ChainStreamHandler(StreamingStdOutCallbackHandler):
-    def __init__(self):
-        self.tokens = []
-        # 记得结束后这里置true
-        self.finish = False
-        self.answer = ""
-
-    def on_llm_new_token(self, token: str, **kwargs):
-        # print(token)
-        self.tokens.append(token)
-        # yield ''.join(self.tokens)
-        # print(''.join(self.tokens))
-
-    def on_llm_end(self, response: LLMResult, **kwargs: Any) -> None:
-        self.finish = 1
-
-    def on_llm_error(self, error: Exception, **kwargs: Any) -> None:
-        print(str(error))
-        self.tokens.append(str(error))
-
-    def generate_tokens(self):
-        while not self.finish or self.tokens:
-            if self.tokens:
-                data = self.tokens.pop(0)
-                self.answer += data
-                yield data
-            else:
-                pass
-        return self.answer
{beswarm-0.1.37.dist-info → beswarm-0.1.39.dist-info}/WHEEL
File without changes

{beswarm-0.1.37.dist-info → beswarm-0.1.39.dist-info}/top_level.txt
File without changes