not-again-ai 0.10.3__py3-none-any.whl → 0.11.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- not_again_ai/llm/openai_api/chat_completion.py +12 -12
- not_again_ai/local_llm/chat_completion.py +11 -0
- not_again_ai/local_llm/ollama/chat_completion.py +19 -4
- not_again_ai/local_llm/ollama/model_mapping.py +1 -0
- {not_again_ai-0.10.3.dist-info → not_again_ai-0.11.0.dist-info}/METADATA +5 -5
- {not_again_ai-0.10.3.dist-info → not_again_ai-0.11.0.dist-info}/RECORD +9 -9
- {not_again_ai-0.10.3.dist-info → not_again_ai-0.11.0.dist-info}/LICENSE +0 -0
- {not_again_ai-0.10.3.dist-info → not_again_ai-0.11.0.dist-info}/WHEEL +0 -0
- {not_again_ai-0.10.3.dist-info → not_again_ai-0.11.0.dist-info}/entry_points.txt +0 -0
```diff
--- a/not_again_ai/llm/openai_api/chat_completion.py
+++ b/not_again_ai/llm/openai_api/chat_completion.py
@@ -32,8 +32,8 @@ def chat_completion(
         https://platform.openai.com/docs/models/model-endpoint-compatibility
             for details on which models work with the Chat API.
         client (OpenAI): An instance of the OpenAI client.
-        tools (list[dict[str, Any]], optional):
-            Defaults to None.
+        tools (list[dict[str, Any]], optional): A list of tools the model may call.
+            Use this to provide a list of functions the model may generate JSON inputs for. Defaults to None.
         tool_choice (str, optional): The tool choice to use. Can be "auto", "required", "none", or a specific function name.
             Note the function name cannot be any of "auto", "required", or "none". Defaults to "auto".
         max_tokens (int, optional): The maximum number of tokens to generate in the chat completion.
@@ -58,21 +58,21 @@ def chat_completion(
 
     Returns:
         dict[str, Any]: A dictionary with the following keys:
-
+            finish_reason (str): The reason the model stopped generating further tokens.
                 Can be 'stop', 'length', or 'tool_calls'.
-
-
-
+            tool_names (list[str], optional): The names of the tools called by the model.
+            tool_args_list (list[dict], optional): The arguments of the tools called by the model.
+            message (str | dict): The content of the generated assistant message.
                 If json_mode is True, this will be a dictionary.
-
+            logprobs (list[dict[str, Any] | list[dict[str, Any]]]): If logprobs[1] is between 1 and 5, each element in the list
                 will be a list of dictionaries containing the token, logprob, and bytes for the top `logprobs[1]` logprobs. Otherwise,
                 this will be a list of dictionaries containing the token, logprob, and bytes for each token in the message.
-
-
+            choices (list[dict], optional): A list of chat completion choices if n > 1 where each dict contains the above fields.
+            completion_tokens (int): The number of tokens used by the model to generate the completion.
                 NOTE: If n > 1 this is the sum of all completions.
-
-
-
+            prompt_tokens (int): The number of tokens in the messages sent to the model.
+            system_fingerprint (str, optional): If seed is set, a unique identifier for the model used to generate the response.
+            response_duration (float): The time, in seconds, taken to generate the response from the API.
     """
     response_format = {"type": "json_object"} if json_mode else None
 
```
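Taken together, these two hunks document the tool-calling surface of the OpenAI-backed `chat_completion`: pass `tools` (and optionally `tool_choice`), then read any resulting calls back from the `tool_names` and `tool_args_list` keys. The following is a hypothetical usage sketch rather than code from the package; the model name, the example weather tool, and the `openai_client()` helper (the module appears in the RECORD below, but the helper's name and signature are assumed) are illustrative only.

```python
from not_again_ai.llm.openai_api.chat_completion import chat_completion
from not_again_ai.llm.openai_api.openai_client import openai_client  # assumed helper name

# One function tool in the OpenAI function-calling schema (illustrative).
tools = [
    {
        "type": "function",
        "function": {
            "name": "get_current_weather",
            "description": "Get the current weather for a location.",
            "parameters": {
                "type": "object",
                "properties": {"location": {"type": "string"}},
                "required": ["location"],
            },
        },
    }
]

client = openai_client()
response = chat_completion(
    messages=[{"role": "user", "content": "What is the weather in Boston?"}],
    model="gpt-4o-mini",  # assumed model name
    client=client,
    tools=tools,
    tool_choice="auto",
    max_tokens=200,
)

# Per the docstring above, tool calls surface as parallel lists.
if response.get("finish_reason") == "tool_calls":
    for name, args in zip(response["tool_names"], response["tool_args_list"]):
        print(name, args)
```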
```diff
--- a/not_again_ai/local_llm/chat_completion.py
+++ b/not_again_ai/local_llm/chat_completion.py
@@ -11,6 +11,7 @@ def chat_completion(
     messages: list[dict[str, Any]],
     model: str,
     client: OpenAI | Client,
+    tools: list[dict[str, Any]] | None = None,
     max_tokens: int | None = None,
     temperature: float = 0.7,
     json_mode: bool = False,
@@ -25,6 +26,8 @@ def chat_completion(
         messages (list[dict[str, Any]]): A list of messages to send to the model.
         model (str): The model name to use.
         client (OpenAI | Client): The client object to use for chat completion.
+        tools (list[dict[str, Any]], optional): A list of tools the model may call.
+            Use this to provide a list of functions the model may generate JSON inputs for. Defaults to None.
         max_tokens (int, optional): The maximum number of tokens to generate.
         temperature (float, optional): The temperature of the model. Increasing the temperature will make the model answer more creatively.
         json_mode (bool, optional): This will structure the response as a valid JSON object.
@@ -34,6 +37,9 @@ def chat_completion(
         dict[str, Any]: A dictionary with the following keys
             message (str | dict): The content of the generated assistant message.
                 If json_mode is True, this will be a dictionary.
+            tool_names (list[str], optional): The names of the tools called by the model.
+                If the model does not support tools, a ResponseError is raised.
+            tool_args_list (list[dict], optional): The arguments of the tools called by the model.
             prompt_tokens (int): The number of tokens in the messages sent to the model.
             completion_tokens (int): The number of tokens used by the model to generate the completion.
             response_duration (float): The time, in seconds, taken to generate the response by using the model.
@@ -45,6 +51,7 @@ def chat_completion(
             messages=messages,
             model=model,
             client=client,
+            tools=tools,
             max_tokens=max_tokens,
             temperature=temperature,
             json_mode=json_mode,
@@ -56,6 +63,7 @@ def chat_completion(
             messages=messages,
             model=model,
             client=client,
+            tools=tools,
             max_tokens=max_tokens,
             temperature=temperature,
             json_mode=json_mode,
@@ -68,6 +76,9 @@ def chat_completion(
     # Parse the responses to be consistent
     response_data = {}
     response_data["message"] = response.get("message")
+    if response.get("tool_names") and response.get("tool_args_list"):
+        response_data["tool_names"] = response.get("tool_names")
+        response_data["tool_args_list"] = response.get("tool_args_list")
     response_data["completion_tokens"] = response.get("completion_tokens")
     response_data["prompt_tokens"] = response.get("prompt_tokens")
     response_data["response_duration"] = response.get("response_duration")
```
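Because this wrapper only forwards `tools` to whichever backend matches the client type and then copies `tool_names`/`tool_args_list` into its normalized response, a caller can switch between the OpenAI and Ollama backends without changing the call site. Below is a small, hypothetical sketch using an Ollama `Client`; the model tag and the tool definition are assumptions for illustration, not values taken from the package.

```python
from ollama import Client

from not_again_ai.local_llm.chat_completion import chat_completion

# One function tool in the same JSON-schema style shown above (illustrative).
tools = [
    {
        "type": "function",
        "function": {
            "name": "add_numbers",
            "description": "Add two integers.",
            "parameters": {
                "type": "object",
                "properties": {"a": {"type": "integer"}, "b": {"type": "integer"}},
                "required": ["a", "b"],
            },
        },
    }
]

response = chat_completion(
    messages=[{"role": "user", "content": "What is 2 + 2? Use the tool."}],
    model="llama3.1",  # assumed local Ollama model tag
    client=Client(),   # defaults to the local Ollama server
    tools=tools,
    max_tokens=100,
)

# tool_names / tool_args_list are only present when the model actually called a tool.
print(response["message"])
print(response.get("tool_names"), response.get("tool_args_list"))
```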
```diff
--- a/not_again_ai/local_llm/ollama/chat_completion.py
+++ b/not_again_ai/local_llm/ollama/chat_completion.py
@@ -13,6 +13,7 @@ def chat_completion(
     messages: list[dict[str, Any]],
     model: str,
     client: Client,
+    tools: list[dict[str, Any]] | None = None,
     max_tokens: int | None = None,
     context_window: int | None = None,
     temperature: float = 0.8,
@@ -27,6 +28,8 @@ def chat_completion(
         messages (list[dict[str, Any]]): A list of messages to send to the model.
         model (str): The model to use.
         client (Client): The Ollama client.
+        tools (list[dict[str, Any]], optional): A list of tools the model may call.
+            Use this to provide a list of functions the model may generate JSON inputs for. Defaults to None.
         max_tokens (int, optional): The maximum number of tokens to generate. Ollama calls this `num_predict`.
         context_window (int, optional): The number of tokens to consider as context. Ollama calls this `num_ctx`.
         temperature (float, optional): The temperature of the model. Increasing the temperature will make the model answer more creatively.
@@ -38,6 +41,9 @@ def chat_completion(
         dict[str, Any]: A dictionary with the following keys
             message (str | dict): The content of the generated assistant message.
                 If json_mode is True, this will be a dictionary.
+            tool_names (list[str], optional): The names of the tools called by the model.
+                If the model does not support tools, a ResponseError is raised.
+            tool_args_list (list[dict], optional): The arguments of the tools called by the model.
             prompt_tokens (int): The number of tokens in the messages sent to the model.
             completion_tokens (int): The number of tokens used by the model to generate the completion.
             response_duration (float): The time, in seconds, taken to generate the response by using the model.
@@ -59,6 +65,8 @@ def chat_completion(
     }
     if json_mode:
         all_args["format"] = "json"
+    if tools:
+        all_args["tools"] = tools
 
     try:
         start_time = time.time()
@@ -78,19 +86,26 @@ def chat_completion(
     response_data: dict[str, Any] = {}
 
     # Handle getting the message returned by the model
-    message = response["message"].get("content",
+    message = response["message"].get("content", "")
     if message and json_mode:
         with contextlib.suppress(json.JSONDecodeError):
            message = json.loads(message)
-
-
+    response_data["message"] = message
+
+    # Try getting tool calls
+    if response["message"].get("tool_calls"):
+        tool_calls = response["message"]["tool_calls"]
+        tool_names = [tool_call["function"]["name"] for tool_call in tool_calls]
+        tool_args_list = [tool_call["function"]["arguments"] for tool_call in tool_calls]
+        response_data["tool_names"] = tool_names
+        response_data["tool_args_list"] = tool_args_list
 
     tokenizer = load_tokenizer(model)
     prompt_tokens = num_tokens_from_messages(messages, tokenizer)
     response_data["prompt_tokens"] = prompt_tokens
 
     # Get the number of tokens generated
-    response_data["completion_tokens"] = response.get("eval_count", None)
+    response_data["completion_tokens"] = response.get("eval_count", None)
     if response_data["completion_tokens"] is None:
         response_data["completion_tokens"] = num_tokens_in_string(str(response_data["message"]), tokenizer)
 
```
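To make the new parsing branch concrete, here is a standalone sketch that runs the same extraction logic against a hand-written response dict (no live Ollama call), showing the shape of the `tool_names` and `tool_args_list` keys the function returns. The example response content is invented purely for illustration.

```python
# Hand-written stand-in for an Ollama chat response that contains one tool call.
response = {
    "message": {
        "content": "",
        "tool_calls": [
            {"function": {"name": "get_current_weather", "arguments": {"location": "Boston"}}},
        ],
    },
    "eval_count": 12,
}

response_data: dict = {}
# Same steps as the added lines above: grab the message, then the tool calls.
response_data["message"] = response["message"].get("content", "")

if response["message"].get("tool_calls"):
    tool_calls = response["message"]["tool_calls"]
    response_data["tool_names"] = [t["function"]["name"] for t in tool_calls]
    response_data["tool_args_list"] = [t["function"]["arguments"] for t in tool_calls]

print(response_data)
# {'message': '', 'tool_names': ['get_current_weather'], 'tool_args_list': [{'location': 'Boston'}]}
```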
```diff
--- a/not_again_ai/local_llm/ollama/model_mapping.py
+++ b/not_again_ai/local_llm/ollama/model_mapping.py
@@ -7,6 +7,7 @@ i.e. all phi3 models will start with "phi3".
 OLLAMA_MODEL_MAPPING = {
     "phi3": "microsoft/Phi-3-mini-4k-instruct",
     "llama3:": "nvidia/Llama3-ChatQA-1.5-8B",  # Using this version to get around needed to accept an agreement to get access to the tokenizer
+    "llama3.1": "unsloth/Meta-Llama-3.1-8B-Instruct",
     "gemma": "google/gemma-1.1-7b-it",  # Requires HF_TOKEN set and accepting the agreement on the HF model page
     "qwen2": "Qwen/Qwen2-7B-Instruct",
     "granite-code": "ibm-granite/granite-34b-code-instruct",
```
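The mapping's module docstring (quoted in the hunk header) indicates that the keys are treated as prefixes of Ollama model names, presumably consumed by the `load_tokenizer` call seen in the Ollama chat completion diff above. The function below is only a hypothetical illustration of how such a prefix table resolves the new `llama3.1` entry; it is not the package's actual lookup code.

```python
# Illustrative prefix lookup over a trimmed copy of the mapping (assumption:
# the real helper does something equivalent when choosing a HF tokenizer repo).
OLLAMA_MODEL_MAPPING = {
    "phi3": "microsoft/Phi-3-mini-4k-instruct",
    "llama3:": "nvidia/Llama3-ChatQA-1.5-8B",
    "llama3.1": "unsloth/Meta-Llama-3.1-8B-Instruct",  # new in 0.11.0
}


def resolve_hf_repo(ollama_model: str) -> str | None:
    """Return the Hugging Face repo whose key prefixes the Ollama model tag."""
    for prefix, hf_repo in OLLAMA_MODEL_MAPPING.items():
        if ollama_model.startswith(prefix):
            return hf_repo
    return None


print(resolve_hf_repo("llama3.1:8b-instruct-q4_0"))  # unsloth/Meta-Llama-3.1-8B-Instruct
```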
````diff
--- not_again_ai-0.10.3.dist-info/METADATA
+++ not_again_ai-0.11.0.dist-info/METADATA
@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: not-again-ai
-Version: 0.10.3
+Version: 0.11.0
 Summary: Designed to once and for all collect all the little things that come up over and over again in AI projects and put them in one place.
 Home-page: https://github.com/DaveCoDev/not-again-ai
 License: MIT
@@ -24,15 +24,15 @@ Provides-Extra: viz
 Requires-Dist: jinja2 (>=3.1,<4.0) ; extra == "local-llm"
 Requires-Dist: loguru (==0.7.2)
 Requires-Dist: numpy (>=1.26,<2.0) ; extra == "statistics" or extra == "viz"
-Requires-Dist: ollama (>=0.
-Requires-Dist: openai (>=1.
+Requires-Dist: ollama (>=0.3,<0.4) ; extra == "local-llm"
+Requires-Dist: openai (>=1.37,<2.0) ; extra == "llm"
 Requires-Dist: pandas (>=2.2,<3.0) ; extra == "viz"
 Requires-Dist: python-liquid (>=1.12,<2.0) ; extra == "llm"
 Requires-Dist: scikit-learn (>=1.5,<2.0) ; extra == "statistics"
 Requires-Dist: scipy (>=1.14,<2.0) ; extra == "statistics"
 Requires-Dist: seaborn (>=0.13,<0.14) ; extra == "viz"
 Requires-Dist: tiktoken (>=0.7,<0.8) ; extra == "llm"
-Requires-Dist: transformers (>=4.
+Requires-Dist: transformers (>=4.43,<5.0) ; extra == "local-llm"
 Project-URL: Documentation, https://github.com/DaveCoDev/not-again-ai
 Project-URL: Repository, https://github.com/DaveCoDev/not-again-ai
 Description-Content-Type: text/markdown
@@ -295,7 +295,7 @@ installed package to indicate that inline type annotations should be checked.
 
 ## Typos
 
-
+Check for typos using [typos](https://github.com/crate-ci/typos)
 
 ```bash
 (.venv) $ nox -s typos
````
```diff
--- not_again_ai-0.10.3.dist-info/RECORD
+++ not_again_ai-0.11.0.dist-info/RECORD
@@ -4,20 +4,20 @@ not_again_ai/base/file_system.py,sha256=KNQmacO4Q__CQuq2oPzWrg3rQO48n3evglc9bNiP
 not_again_ai/base/parallel.py,sha256=fcYhKBYBWvob84iKp3O93wvFFdXeidljZsShgBLTNGA,3448
 not_again_ai/llm/__init__.py,sha256=_wNUL6FDaT369Z8W48FsaC_NkcOZ-ib2MMUvnaLOS-0,451
 not_again_ai/llm/openai_api/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-not_again_ai/llm/openai_api/chat_completion.py,sha256=
+not_again_ai/llm/openai_api/chat_completion.py,sha256=PRFi5Sl1K5GOgfWDYygHlmS-Ks1ZE6ETBzinZsz5GCc,8954
 not_again_ai/llm/openai_api/context_management.py,sha256=BJSG100_qw9MeTCZGztDV5CBXjVOxU4x7gyoRlLxWnI,3561
 not_again_ai/llm/openai_api/embeddings.py,sha256=4OBnxZicrY6q4dQhuPqMdAnifyjwrsKMTDj-kVre0yc,2500
 not_again_ai/llm/openai_api/openai_client.py,sha256=6pZw2xw9X-ceV22rhApwFJ2tAKCxi-SxkjxBsTBZ2Nw,2470
 not_again_ai/llm/openai_api/prompts.py,sha256=7cDfvIKCTYM0t5lK34FLLqYf-SR_cynDXIXw3zWDizA,7094
 not_again_ai/llm/openai_api/tokens.py,sha256=31neIrY66ejJQ10VB3EWnkN00wuw9vMpCS8tsw2WtFg,4392
 not_again_ai/local_llm/__init__.py,sha256=BsUn39U3QQaw6yomQHfp_HIPHRIBoMAgjcP3CDADx04,882
-not_again_ai/local_llm/chat_completion.py,sha256=
+not_again_ai/local_llm/chat_completion.py,sha256=buZQGV2sChaSi5cgiAcOd9gi4lAEzFIGGIqV-1qazAc,4174
 not_again_ai/local_llm/huggingface/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 not_again_ai/local_llm/huggingface/chat_completion.py,sha256=Y6uMbxLG8TaMVi3hJGrMl_G9Y1N_0dld5Kv1iqYnoao,2300
 not_again_ai/local_llm/huggingface/helpers.py,sha256=YPr8KbQ8Ac_Mn_nBcrFuL3bCl-IuDCdaRvYVCocy8Gk,734
 not_again_ai/local_llm/ollama/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-not_again_ai/local_llm/ollama/chat_completion.py,sha256=
-not_again_ai/local_llm/ollama/model_mapping.py,sha256=
+not_again_ai/local_llm/ollama/chat_completion.py,sha256=C8uU-yq7FL9OLdflZVjbNkEOofmD2A3Hcsd8k-59iS4,5053
+not_again_ai/local_llm/ollama/model_mapping.py,sha256=sJqPg97OO68O0k5MFkTjRLIn9gB7gCRAcyUEjxMfizo,891
 not_again_ai/local_llm/ollama/ollama_client.py,sha256=dktyw7aKFq4EA3dU7Le5UpfsSq3Oh_POmYSrAI4qLi8,765
 not_again_ai/local_llm/ollama/service.py,sha256=XczbxISTAp4KHnIkqRZaMsfBohH-TAHrjZ8T9x3cRAY,2900
 not_again_ai/local_llm/ollama/tokens.py,sha256=k7K7enOSuCJRHteDG0x-CbuivQ2uAtKK3e0Jr7-BUd4,3952
@@ -32,8 +32,8 @@ not_again_ai/viz/distributions.py,sha256=OyWwJaNI6lMRm_iSrhq-CORLNvXfeuLSgDtVo3u
 not_again_ai/viz/scatterplot.py,sha256=5CUOWeknbBOaZPeX9oPin5sBkRKEwk8qeFH45R-9LlY,2292
 not_again_ai/viz/time_series.py,sha256=pOGZqXp_2nd6nKo-PUQNCtmMh__69jxQ6bQibTGLwZA,5212
 not_again_ai/viz/utils.py,sha256=hN7gwxtBt3U6jQni2K8j5m5pCXpaJDoNzGhBBikEU28,238
-not_again_ai-0.
-not_again_ai-0.
-not_again_ai-0.
-not_again_ai-0.
-not_again_ai-0.
+not_again_ai-0.11.0.dist-info/LICENSE,sha256=btjOgNGpp-ux5xOo1Gx1MddxeWtT9sof3s3Nui29QfA,1071
+not_again_ai-0.11.0.dist-info/METADATA,sha256=S7IbgUSScGSxAeKWmyxk4hpy4qS-eLqpmfDfFEZq4Ok,15517
+not_again_ai-0.11.0.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
+not_again_ai-0.11.0.dist-info/entry_points.txt,sha256=EMJegugnmJUd-jMUA_qIRMIPAasbei8gP6O4-ER0BxQ,61
+not_again_ai-0.11.0.dist-info/RECORD,,
```
File without changes
|
File without changes
|
File without changes
|