hjxdl 0.1.38__py3-none-any.whl → 0.1.39__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- hdl/_version.py +2 -2
- hdl/utils/llm/chat.py +41 -121
- hdl/utils/llm/llama_chat.py +122 -0
- {hjxdl-0.1.38.dist-info → hjxdl-0.1.39.dist-info}/METADATA +1 -1
- {hjxdl-0.1.38.dist-info → hjxdl-0.1.39.dist-info}/RECORD +7 -6
- {hjxdl-0.1.38.dist-info → hjxdl-0.1.39.dist-info}/WHEEL +0 -0
- {hjxdl-0.1.38.dist-info → hjxdl-0.1.39.dist-info}/top_level.txt +0 -0
hdl/_version.py
CHANGED
hdl/utils/llm/chat.py
CHANGED
@@ -1,6 +1,8 @@
 import typing as t
+import asyncio
+from concurrent.futures import ProcessPoolExecutor
+
 
-from llama_cpp import Llama
 from openai import OpenAI
 from ..desc.template import FN_TEMPLATE
 from ..desc.func_desc import FN_DESC
@@ -85,126 +87,6 @@ def chat_oai_invoke(
     return response.choices[0].message.content
 
 
-class GGUF_M(Llama):
-    def __init__(
-        self,
-        model_path :str,
-        device: str='gpu',
-        generation_kwargs: dict = {},
-        server_ip: str = "127.0.0.1",
-        server_port: int = 8000,
-        *args,
-        **kwargs
-    ):
-        """Initialize the model with the specified parameters.
-
-        Args:
-            model_path (str): The path to the model.
-            device (str, optional): The device to use, either 'gpu' or 'cpu'. Defaults to 'gpu'.
-            generation_kwargs (dict, optional): Additional generation keyword arguments. Defaults to {}.
-            server_ip (str, optional): The IP address of the server. Defaults to "127.0.0.1".
-            server_port (int, optional): The port of the server. Defaults to 8000.
-            *args: Variable length argument list.
-            **kwargs: Arbitrary keyword arguments.
-
-        Raises:
-            KeyError: If 'num_threads' or 'max_context_length' is missing in generation_kwargs.
-        """
-        print("正在从本地加载模型...")
-        if device.lower() == 'cpu':
-            super().__init__(
-                model_path=model_path,
-                n_threads=generation_kwargs['num_threads'],
-                n_ctx=generation_kwargs['max_context_length'],
-                *args,
-                **kwargs
-            )
-        else:
-            super().__init__(
-                model_path=model_path,
-                n_threads=generation_kwargs['num_threads'],
-                n_ctx=generation_kwargs['max_context_length'],
-                n_gpu_layers=-1,
-                flash_attn=True,
-                *args,
-                **kwargs
-            )
-        self.generation_kwargs = generation_kwargs
-
-    def invoke(
-        self,
-        prompt : str,
-        stop: list[str] | None = ["USER:", "ASSISTANT:"],
-        # history: list = [],
-        **kwargs: t.Any,
-    ) -> str:
-        """Invoke the model to generate a response based on the given prompt.
-
-        Args:
-            prompt (str): The prompt to be used for generating the response.
-            stop (list[str], optional): List of strings that indicate when the model should stop generating the response. Defaults to ["USER:", "ASSISTANT:"].
-            **kwargs: Additional keyword arguments to be passed to the model.
-
-        Returns:
-            str: The generated response based on the prompt.
-        """
-        prompt_final = f"USER:\n{prompt}\nASSISTANT:\n"
-
-        result = self.create_completion(
-            prompt_final,
-            repeat_penalty=self.generation_kwargs["repetition_penalty"],
-            max_tokens=self.generation_kwargs["max_new_tokens"],
-            stop=stop,
-            echo=False,
-            temperature=self.generation_kwargs["temperature"],
-            mirostat_mode = 2,
-            mirostat_tau=4.0,
-            mirostat_eta=1.1
-        )
-        resp = result['choices'][0]['text']
-        # history.append(
-        #     [prompt, resp]
-        # )
-        return resp
-
-    def stream(
-        self,
-        prompt: str,
-        stop: list[str] | None = ["USER:", "ASSISTANT:"],
-        # history: list = [],
-        **kwargs: t.Any,
-    ):
-        """Generate text responses based on the given prompt using the model.
-
-        Args:
-            prompt (str): The prompt to generate text responses.
-            stop (list[str], optional): List of strings to stop the generation. Defaults to ["USER:", "ASSISTANT:"].
-            **kwargs: Additional keyword arguments for the model.
-
-        Yields:
-            str: Text responses generated by the model based on the prompt.
-        """
-        prompt = f"USER:\n{prompt}\nASSISTANT:\n"
-        output = self.create_completion(
-            prompt,
-            stream=True,
-            repeat_penalty=self.generation_kwargs["repetition_penalty"],
-            max_tokens=self.generation_kwargs["max_new_tokens"],
-            stop=stop,
-            echo=False,
-            temperature=self.generation_kwargs["temperature"],
-            mirostat_mode = 2,
-            mirostat_tau=4.0,
-            mirostat_eta=1.1
-        )
-        # history.append([])
-        for chunk in output:
-            item = chunk['choices'][0]['text']
-            # self.resps[-1].append(item)
-            yield chunk['choices'][0]['text']
-        # self.resps[-1] = "".join(self.resps[-1])
-
-
 class OpenAI_M():
     def __init__(
         self,
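The class deleted above is not dropped from the package: it reappears verbatim as the new module hdl/utils/llm/llama_chat.py added further below. Callers that previously imported GGUF_M from the chat module would therefore need to switch import paths, roughly as sketched here (illustrative; this diff shows no re-export from chat.py, and any compatibility shim elsewhere in the package is not visible from these hunks):

```python
# Import-path migration implied by this diff (illustrative, not taken from package docs).
# hjxdl 0.1.38:
#     from hdl.utils.llm.chat import GGUF_M
# hjxdl 0.1.39:
from hdl.utils.llm.llama_chat import GGUF_M
```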
@@ -377,6 +259,44 @@ class OpenAI_M():
                 print(e)
                 return ""
 
+    async def get_tool_result_async(
+        self,
+        prompt: str,
+        **kwargs: t.Any
+    ):
+        """
+        Asynchronous version of the get_tool_result function that can run in parallel using multiprocessing.
+
+        Args:
+            prompt (str): The prompt to get the decision for.
+            **kwargs: Additional keyword arguments to pass to the decision function.
+
+        Returns:
+            str: The result from the selected tool based on the decision made.
+        """
+        decision_dict_str = await asyncio.to_thread(self.get_decision, prompt, **kwargs)
+        try:
+            decision_dict = json.loads(decision_dict_str)
+        except Exception as e:
+            print(e)
+            return ""
+        func_name = decision_dict.get("function_name", None)
+        if func_name is None:
+            return ""
+        else:
+            try:
+                for tool in self.tools:
+                    if tool.__name__ == func_name:
+                        tool_final = tool
+                func_kwargs = decision_dict.get("params")
+
+                loop = asyncio.get_running_loop()
+                with ProcessPoolExecutor() as pool:
+                    result = await loop.run_in_executor(pool, tool_final, **func_kwargs)
+                return result
+            except Exception as e:
+                print(e)
+                return ""
 
     def agent_response(
         self,
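For orientation, a minimal sketch of how the new asynchronous tool path might be driven. It relies only on what this hunk shows; the wrapper function and question below are illustrative, and construction of the OpenAI_M instance is left out because its __init__ signature is not part of this diff.

```python
# Hypothetical driver for OpenAI_M.get_tool_result_async (not part of this diff).
import asyncio

from hdl.utils.llm.chat import OpenAI_M


async def answer_with_tools(llm: OpenAI_M, question: str) -> str:
    # get_decision runs in a worker thread via asyncio.to_thread, and the
    # selected tool is dispatched to a ProcessPoolExecutor by the new method.
    return await llm.get_tool_result_async(question)


# Assuming `llm` is an already-configured OpenAI_M instance with a `tools` list:
#     print(asyncio.run(answer_with_tools(llm, "What's the weather in Paris?")))
```

One caveat: `loop.run_in_executor` only forwards positional arguments, so the `**func_kwargs` call in the added code will raise a `TypeError` whenever the decision returns named parameters; wrapping the call as `functools.partial(tool_final, **func_kwargs)` is the usual workaround.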
hdl/utils/llm/llama_chat.py
ADDED
@@ -0,0 +1,122 @@
+import typing as t
+
+from llama_cpp import Llama
+
+class GGUF_M(Llama):
+    def __init__(
+        self,
+        model_path :str,
+        device: str='gpu',
+        generation_kwargs: dict = {},
+        server_ip: str = "127.0.0.1",
+        server_port: int = 8000,
+        *args,
+        **kwargs
+    ):
+        """Initialize the model with the specified parameters.
+
+        Args:
+            model_path (str): The path to the model.
+            device (str, optional): The device to use, either 'gpu' or 'cpu'. Defaults to 'gpu'.
+            generation_kwargs (dict, optional): Additional generation keyword arguments. Defaults to {}.
+            server_ip (str, optional): The IP address of the server. Defaults to "127.0.0.1".
+            server_port (int, optional): The port of the server. Defaults to 8000.
+            *args: Variable length argument list.
+            **kwargs: Arbitrary keyword arguments.
+
+        Raises:
+            KeyError: If 'num_threads' or 'max_context_length' is missing in generation_kwargs.
+        """
+        print("正在从本地加载模型...")
+        if device.lower() == 'cpu':
+            super().__init__(
+                model_path=model_path,
+                n_threads=generation_kwargs['num_threads'],
+                n_ctx=generation_kwargs['max_context_length'],
+                *args,
+                **kwargs
+            )
+        else:
+            super().__init__(
+                model_path=model_path,
+                n_threads=generation_kwargs['num_threads'],
+                n_ctx=generation_kwargs['max_context_length'],
+                n_gpu_layers=-1,
+                flash_attn=True,
+                *args,
+                **kwargs
+            )
+        self.generation_kwargs = generation_kwargs
+
+    def invoke(
+        self,
+        prompt : str,
+        stop: list[str] | None = ["USER:", "ASSISTANT:"],
+        # history: list = [],
+        **kwargs: t.Any,
+    ) -> str:
+        """Invoke the model to generate a response based on the given prompt.
+
+        Args:
+            prompt (str): The prompt to be used for generating the response.
+            stop (list[str], optional): List of strings that indicate when the model should stop generating the response. Defaults to ["USER:", "ASSISTANT:"].
+            **kwargs: Additional keyword arguments to be passed to the model.
+
+        Returns:
+            str: The generated response based on the prompt.
+        """
+        prompt_final = f"USER:\n{prompt}\nASSISTANT:\n"
+
+        result = self.create_completion(
+            prompt_final,
+            repeat_penalty=self.generation_kwargs["repetition_penalty"],
+            max_tokens=self.generation_kwargs["max_new_tokens"],
+            stop=stop,
+            echo=False,
+            temperature=self.generation_kwargs["temperature"],
+            mirostat_mode = 2,
+            mirostat_tau=4.0,
+            mirostat_eta=1.1
+        )
+        resp = result['choices'][0]['text']
+        # history.append(
+        #     [prompt, resp]
+        # )
+        return resp
+
+    def stream(
+        self,
+        prompt: str,
+        stop: list[str] | None = ["USER:", "ASSISTANT:"],
+        # history: list = [],
+        **kwargs: t.Any,
+    ):
+        """Generate text responses based on the given prompt using the model.
+
+        Args:
+            prompt (str): The prompt to generate text responses.
+            stop (list[str], optional): List of strings to stop the generation. Defaults to ["USER:", "ASSISTANT:"].
+            **kwargs: Additional keyword arguments for the model.
+
+        Yields:
+            str: Text responses generated by the model based on the prompt.
+        """
+        prompt = f"USER:\n{prompt}\nASSISTANT:\n"
+        output = self.create_completion(
+            prompt,
+            stream=True,
+            repeat_penalty=self.generation_kwargs["repetition_penalty"],
+            max_tokens=self.generation_kwargs["max_new_tokens"],
+            stop=stop,
+            echo=False,
+            temperature=self.generation_kwargs["temperature"],
+            mirostat_mode = 2,
+            mirostat_tau=4.0,
+            mirostat_eta=1.1
+        )
+        # history.append([])
+        for chunk in output:
+            item = chunk['choices'][0]['text']
+            # self.resps[-1].append(item)
+            yield chunk['choices'][0]['text']
+        # self.resps[-1] = "".join(self.resps[-1])
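A minimal usage sketch for the relocated class, assuming nothing beyond what the file above defines. The model path and the values in generation_kwargs are placeholders; the dictionary keys are the ones GGUF_M actually reads (num_threads and max_context_length in __init__, repetition_penalty, max_new_tokens and temperature in invoke/stream).

```python
# Hypothetical usage of the relocated GGUF_M class (path and values are placeholders).
from hdl.utils.llm.llama_chat import GGUF_M

generation_kwargs = {
    "num_threads": 8,             # read in __init__ as n_threads
    "max_context_length": 4096,   # read in __init__ as n_ctx
    "repetition_penalty": 1.1,    # forwarded to create_completion as repeat_penalty
    "max_new_tokens": 512,        # forwarded as max_tokens
    "temperature": 0.7,           # forwarded as temperature
}

model = GGUF_M(
    model_path="/path/to/model.gguf",  # placeholder path to a local GGUF file
    device="cpu",
    generation_kwargs=generation_kwargs,
)

# Single-shot completion.
print(model.invoke("Hello, who are you?"))

# Token-by-token streaming.
for token in model.stream("Tell me a short story."):
    print(token, end="", flush=True)
```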
{hjxdl-0.1.38.dist-info → hjxdl-0.1.39.dist-info}/RECORD
CHANGED
@@ -1,5 +1,5 @@
 hdl/__init__.py,sha256=GffnD0jLJdhkd-vo989v40N90sQbofkayRBwxc6TVhQ,72
-hdl/_version.py,sha256=
+hdl/_version.py,sha256=6nXIPX9zBoWwZZ8FWkd2Pe2QAfUPdNNa0BUqqXMd0RE,413
 hdl/args/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 hdl/args/loss_args.py,sha256=s7YzSdd7IjD24rZvvOrxLLFqMZQb9YylxKeyelSdrTk,70
 hdl/controllers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -127,14 +127,15 @@ hdl/utils/desc/template.py,sha256=a3NcSihzZMm9Bk76iDVe54_xBDceGmLebS0XMONE3nk,11
 hdl/utils/general/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 hdl/utils/general/glob.py,sha256=8-RCnt6L297wMIfn34ZAMCsGCZUjHG3MGglGZI1cX0g,491
 hdl/utils/llm/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-hdl/utils/llm/chat.py,sha256=
+hdl/utils/llm/chat.py,sha256=rQKsIqw2pj2CkhfOaJ2Oahgt3XgmkgrHBgkxs6dfE0U,10770
 hdl/utils/llm/embs.py,sha256=Tf0FOYrOFZp7qQpEPiSCXzlgyHH0X9HVTUtsup74a9E,7174
 hdl/utils/llm/extract.py,sha256=2sK_WJzmYIc8iuWaM9DA6Nw3_6q1O4lJ5pKpcZo-bBA,6512
+hdl/utils/llm/llama_chat.py,sha256=watcHGOaz-bv3x-yDucYlGk5f8FiqfFhwWogrl334fk,4387
 hdl/utils/schedulers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 hdl/utils/schedulers/norm_lr.py,sha256=bDwCmdEK-WkgxQMFBiMuchv8Mm7C0-GZJ6usm-PQk14,4461
 hdl/utils/weather/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 hdl/utils/weather/weather.py,sha256=k11o6wM15kF8b9NMlEfrg68ak-SfSYLN3nOOflFUv-I,4381
-hjxdl-0.1.
-hjxdl-0.1.
-hjxdl-0.1.
-hjxdl-0.1.
+hjxdl-0.1.39.dist-info/METADATA,sha256=DUifflUXAgFT-Jaxbmb2ZvDnjb-0nhkFKYSuyZAeN6Q,737
+hjxdl-0.1.39.dist-info/WHEEL,sha256=UvcQYKBHoFqaQd6LKyqHw9fxEolWLQnlzP0h_LgJAfI,91
+hjxdl-0.1.39.dist-info/top_level.txt,sha256=-kxwTM5JPhylp06z3zAVO3w6_h7wtBfBo2zgM6YZoTk,4
+hjxdl-0.1.39.dist-info/RECORD,,
{hjxdl-0.1.38.dist-info → hjxdl-0.1.39.dist-info}/WHEEL
File without changes
{hjxdl-0.1.38.dist-info → hjxdl-0.1.39.dist-info}/top_level.txt
File without changes