lollms-client 1.5.6__py3-none-any.whl → 1.7.10__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- lollms_client/__init__.py +1 -1
- lollms_client/llm_bindings/azure_openai/__init__.py +2 -2
- lollms_client/llm_bindings/claude/__init__.py +125 -34
- lollms_client/llm_bindings/gemini/__init__.py +261 -159
- lollms_client/llm_bindings/grok/__init__.py +52 -14
- lollms_client/llm_bindings/groq/__init__.py +2 -2
- lollms_client/llm_bindings/hugging_face_inference_api/__init__.py +2 -2
- lollms_client/llm_bindings/litellm/__init__.py +1 -1
- lollms_client/llm_bindings/llamacpp/__init__.py +18 -11
- lollms_client/llm_bindings/lollms/__init__.py +76 -21
- lollms_client/llm_bindings/lollms_webui/__init__.py +1 -1
- lollms_client/llm_bindings/mistral/__init__.py +2 -2
- lollms_client/llm_bindings/novita_ai/__init__.py +142 -6
- lollms_client/llm_bindings/ollama/__init__.py +307 -89
- lollms_client/llm_bindings/open_router/__init__.py +2 -2
- lollms_client/llm_bindings/openai/__init__.py +81 -20
- lollms_client/llm_bindings/openllm/__init__.py +362 -506
- lollms_client/llm_bindings/openwebui/__init__.py +333 -171
- lollms_client/llm_bindings/perplexity/__init__.py +2 -2
- lollms_client/llm_bindings/pythonllamacpp/__init__.py +3 -3
- lollms_client/llm_bindings/tensor_rt/__init__.py +1 -1
- lollms_client/llm_bindings/transformers/__init__.py +428 -632
- lollms_client/llm_bindings/vllm/__init__.py +1 -1
- lollms_client/lollms_agentic.py +4 -2
- lollms_client/lollms_base_binding.py +61 -0
- lollms_client/lollms_core.py +512 -1890
- lollms_client/lollms_discussion.py +25 -11
- lollms_client/lollms_llm_binding.py +112 -261
- lollms_client/lollms_mcp_binding.py +34 -75
- lollms_client/lollms_stt_binding.py +85 -52
- lollms_client/lollms_tti_binding.py +23 -37
- lollms_client/lollms_ttm_binding.py +24 -42
- lollms_client/lollms_tts_binding.py +28 -17
- lollms_client/lollms_ttv_binding.py +24 -42
- lollms_client/lollms_types.py +4 -2
- lollms_client/stt_bindings/whisper/__init__.py +108 -23
- lollms_client/stt_bindings/whispercpp/__init__.py +7 -1
- lollms_client/tti_bindings/diffusers/__init__.py +418 -810
- lollms_client/tti_bindings/diffusers/server/main.py +1051 -0
- lollms_client/tti_bindings/gemini/__init__.py +182 -239
- lollms_client/tti_bindings/leonardo_ai/__init__.py +6 -3
- lollms_client/tti_bindings/lollms/__init__.py +4 -1
- lollms_client/tti_bindings/novita_ai/__init__.py +5 -2
- lollms_client/tti_bindings/openai/__init__.py +10 -11
- lollms_client/tti_bindings/stability_ai/__init__.py +5 -3
- lollms_client/ttm_bindings/audiocraft/__init__.py +7 -12
- lollms_client/ttm_bindings/beatoven_ai/__init__.py +7 -3
- lollms_client/ttm_bindings/lollms/__init__.py +4 -17
- lollms_client/ttm_bindings/replicate/__init__.py +7 -4
- lollms_client/ttm_bindings/stability_ai/__init__.py +7 -4
- lollms_client/ttm_bindings/topmediai/__init__.py +6 -3
- lollms_client/tts_bindings/bark/__init__.py +7 -10
- lollms_client/tts_bindings/lollms/__init__.py +6 -1
- lollms_client/tts_bindings/piper_tts/__init__.py +8 -11
- lollms_client/tts_bindings/xtts/__init__.py +157 -74
- lollms_client/tts_bindings/xtts/server/main.py +241 -280
- {lollms_client-1.5.6.dist-info → lollms_client-1.7.10.dist-info}/METADATA +113 -5
- lollms_client-1.7.10.dist-info/RECORD +89 -0
- lollms_client-1.5.6.dist-info/RECORD +0 -87
- {lollms_client-1.5.6.dist-info → lollms_client-1.7.10.dist-info}/WHEEL +0 -0
- {lollms_client-1.5.6.dist-info → lollms_client-1.7.10.dist-info}/licenses/LICENSE +0 -0
- {lollms_client-1.5.6.dist-info → lollms_client-1.7.10.dist-info}/top_level.txt +0 -0
lollms_client/llm_bindings/novita_ai/__init__.py

@@ -19,8 +19,6 @@ BindingName = "NovitaAIBinding"
 API_BASE_URL = "https://api.novita.ai"
 
 # A hardcoded list of models based on Novita AI's documentation.
-# The API is OpenAI-compatible but does not provide a models listing endpoint.
-# Sourced from: https://docs.novita.ai/language-model/models
 _FALLBACK_MODELS = [
     {'model_name': 'meta-llama/Llama-3-8B-Instruct', 'display_name': 'Llama 3 8B Instruct', 'description': 'Meta\'s Llama 3 8B instruction-tuned model.', 'owned_by': 'Meta'},
     {'model_name': 'meta-llama/Llama-3-70B-Instruct', 'display_name': 'Llama 3 70B Instruct', 'description': 'Meta\'s Llama 3 70B instruction-tuned model.', 'owned_by': 'Meta'},

@@ -28,6 +26,7 @@ _FALLBACK_MODELS = [
     {'model_name': 'mistralai/Mistral-7B-Instruct-v0.2', 'display_name': 'Mistral 7B Instruct v0.2', 'description': 'Mistral AI\'s 7B instruction-tuned model.', 'owned_by': 'Mistral AI'},
     {'model_name': 'google/gemma-7b-it', 'display_name': 'Gemma 7B IT', 'description': 'Google\'s Gemma 7B instruction-tuned model.', 'owned_by': 'Google'},
     {'model_name': 'google/gemma-2-9b-it', 'display_name': 'Gemma 2 9B IT', 'description': 'Google\'s next-generation Gemma 2 9B instruction-tuned model.', 'owned_by': 'Google'},
+    {'model_name': 'deepseek/deepseek-r1', 'display_name': 'Deepseek R1', 'description': 'Deepseek R1 reasoning model.', 'owned_by': 'Deepseek AI'},
     {'model_name': 'deepseek-ai/deepseek-coder-33b-instruct', 'display_name': 'Deepseek Coder 33B Instruct', 'description': 'A powerful coding model from Deepseek AI.', 'owned_by': 'Deepseek AI'},
 ]
 
@@ -73,6 +72,119 @@ class NovitaAIBinding(LollmsLLMBinding):
         if frequency_penalty is not None: params['frequency_penalty'] = frequency_penalty
         return params
 
+    def generate_text(self,
+                      prompt: str,
+                      images: Optional[List[str]] = None,
+                      system_prompt: str = "",
+                      n_predict: Optional[int] = 2048,
+                      stream: Optional[bool] = False,
+                      temperature: float = 0.7,
+                      top_k: int = 50, # Not supported by Novita API
+                      top_p: float = 0.9,
+                      repeat_penalty: float = 1.1, # maps to frequency_penalty
+                      repeat_last_n: int = 64, # Not supported
+                      seed: Optional[int] = None, # Not supported
+                      n_threads: Optional[int] = None, # Not applicable
+                      ctx_size: int | None = None, # Determined by model
+                      streaming_callback: Optional[Callable[[str, MSG_TYPE], None]] = None,
+                      split: Optional[bool] = False,
+                      user_keyword: Optional[str] = "!@>user:",
+                      ai_keyword: Optional[str] = "!@>assistant:",
+                      think: Optional[bool] = False,
+                      reasoning_effort: Optional[str] = "low", # low, medium, high
+                      reasoning_summary: Optional[bool] = False, # auto
+                      ) -> Union[str, dict]:
+        """
+        Generate text using Novita AI.
+        """
+        # Build messages
+        messages = []
+        if system_prompt and system_prompt.strip():
+            messages.append({"role": "system", "content": system_prompt})
+
+        if split:
+            # Simple split logic to support history if provided in prompt string
+            # This is a basic fallback; usually chat() is preferred for history
+            msgs = self.split_discussion(prompt, user_keyword, ai_keyword)
+            messages.extend(msgs)
+        else:
+            messages.append({"role": "user", "content": prompt})
+
+        if images:
+            ASCIIColors.warning("Novita AI API does not support images in this binding yet. They will be ignored.")
+
+        # Construct parameters
+        # Map repeat_penalty to frequency_penalty loosely if needed, or just pass as is if supported
+        # Novita supports standard OpenAI params
+        api_params = self._construct_parameters(
+            temperature, top_p, n_predict, 0.0, repeat_penalty
+        )
+
+        payload = {
+            "model": self.model_name,
+            "messages": messages,
+            "stream": stream,
+            **api_params
+        }
+
+        url = f"{API_BASE_URL}/v1/chat/completions"
+        full_response_text = ""
+
+        try:
+            if stream:
+                with requests.post(url, headers=self.headers, json=payload, stream=True) as response:
+                    response.raise_for_status()
+                    for line in response.iter_lines():
+                        if line:
+                            decoded_line = line.decode('utf-8')
+                            if decoded_line.startswith("data:"):
+                                content = decoded_line[len("data: "):].strip()
+                                if content == "[DONE]":
+                                    break
+                                try:
+                                    chunk = json.loads(content)
+                                    delta = chunk.get("choices", [{}])[0].get("delta", {})
+                                    text_chunk = delta.get("content", "")
+                                    # Deepseek R1 might output thinking in content or reasoning_content field
+                                    # Standard OpenAI compatible R1 usually puts thought in <think> tags or reasoning_content
+                                    reasoning_chunk = delta.get("reasoning_content", "")
+
+                                    if reasoning_chunk:
+                                        # If we get reasoning content field, wrap it in <think> for lollms UI if think is enabled
+                                        if think:
+                                            formatted_reasoning = f"<think>{reasoning_chunk}</think>" # Naive streaming wrap, might be broken tags
+                                            # Better to just stream it if UI handles it, or just text
+                                            if streaming_callback:
+                                                streaming_callback(reasoning_chunk, MSG_TYPE.MSG_TYPE_CHUNK)
+                                        else:
+                                            # If think disabled, we might skip reasoning or just show it?
+                                            # Typically we want to show it.
+                                            pass
+
+                                    if text_chunk:
+                                        full_response_text += text_chunk
+                                        if streaming_callback:
+                                            if not streaming_callback(text_chunk, MSG_TYPE.MSG_TYPE_CHUNK):
+                                                break
+                                except json.JSONDecodeError:
+                                    continue
+                return full_response_text
+            else:
+                response = requests.post(url, headers=self.headers, json=payload)
+                response.raise_for_status()
+                data = response.json()
+                choice = data["choices"][0]["message"]
+                content = choice.get("content", "")
+                reasoning = choice.get("reasoning_content", "")
+
+                if think and reasoning:
+                    return f"<think>\n{reasoning}\n</think>\n{content}"
+                return content
+
+        except Exception as e:
+            trace_exception(e)
+            return {"status": False, "error": str(e)}
+
     def chat(self,
              discussion: LollmsDiscussion,
              branch_tip_id: Optional[str] = None,
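For orientation, here is a minimal usage sketch of the new `generate_text` method with a streaming callback. Only the method signature and error-return shape are taken from the diff above; the constructor arguments (`model_name`, `service_key`) and the `MSG_TYPE` import path are assumptions, since this diff does not show `__init__`.

```python
# Hypothetical usage sketch; constructor parameters are assumed, not shown in this diff.
from lollms_client.llm_bindings.novita_ai import NovitaAIBinding
from lollms_client.lollms_types import MSG_TYPE  # assumed location of MSG_TYPE

def on_chunk(chunk: str, msg_type: MSG_TYPE) -> bool:
    print(chunk, end="", flush=True)
    return True  # the streaming loop above stops if the callback returns False

binding = NovitaAIBinding(model_name="deepseek/deepseek-r1",
                          service_key="YOUR_NOVITA_API_KEY")  # assumed __init__ params
result = binding.generate_text(
    "Explain tail-call optimization in one paragraph.",
    stream=True,
    think=True,  # also forward reasoning_content chunks when the model emits them
    streaming_callback=on_chunk,
)
if isinstance(result, dict):  # error path returns {"status": False, "error": ...}
    print(result["error"])
```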
@@ -86,7 +198,10 @@ class NovitaAIBinding(LollmsLLMBinding):
              seed: Optional[int] = None, # Not supported
              n_threads: Optional[int] = None, # Not applicable
              ctx_size: Optional[int] = None, # Determined by model
-             streaming_callback: Optional[Callable[[str, MSG_TYPE], None]] = None
+             streaming_callback: Optional[Callable[[str, MSG_TYPE], None]] = None,
+             think: Optional[bool] = False,
+             reasoning_effort: Optional[str] = "low", # low, medium, high
+             reasoning_summary: Optional[bool] = False, # auto
              ) -> Union[str, dict]:
         """
         Conduct a chat session with a Novita AI model using a LollmsDiscussion object.
@@ -139,6 +254,19 @@ class NovitaAIBinding(LollmsLLMBinding):
                                 chunk = json.loads(content)
                                 delta = chunk.get("choices", [{}])[0].get("delta", {})
                                 text_chunk = delta.get("content", "")
+
+                                # Support for reasoning content if provided (e.g. Deepseek R1)
+                                reasoning_chunk = delta.get("reasoning_content", "")
+                                if reasoning_chunk and think:
+                                    # Simple handling: stream it as regular chunk or specific type if supported
+                                    # Lollms typically expects <think> tags in the text if it's mixed
+                                    # Since we can't easily inject tags in a stream without state,
+                                    # we assume the model output might contain them or we just output reasoning.
+                                    # For now, append to text.
+                                    if streaming_callback:
+                                        # We could prefix with <think> if it's the start, but that's complex in stateless loop
+                                        streaming_callback(reasoning_chunk, MSG_TYPE.MSG_TYPE_CHUNK)
+
                                 if text_chunk:
                                     full_response_text += text_chunk
                                     if streaming_callback:
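The comments in this hunk note that `<think>` tags cannot easily be injected inside a stateless streaming loop. As an illustration of what that would take (not part of this package), a small stateful wrapper around the callback could open the tag on the first reasoning chunk and close it when normal content resumes:

```python
# Illustrative sketch, not part of the package: a stateful wrapper that
# brackets streamed reasoning chunks with <think>...</think> tags, which the
# stateless loop above deliberately avoids doing.
from typing import Any, Callable

class ThinkTagInjector:
    """Wraps a lollms-style streaming callback; emits <think> before the first
    reasoning chunk and </think> once regular content resumes."""
    def __init__(self, callback: Callable[[str, Any], bool]):
        self.callback = callback
        self.in_think = False

    def on_reasoning(self, chunk: str, msg_type: Any) -> bool:
        if not self.in_think:
            self.in_think = True
            self.callback("<think>", msg_type)  # open once, on first reasoning chunk
        return self.callback(chunk, msg_type)

    def on_content(self, chunk: str, msg_type: Any) -> bool:
        if self.in_think:
            self.in_think = False
            self.callback("</think>", msg_type)  # close when normal content resumes
        return self.callback(chunk, msg_type)
```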
@@ -152,7 +280,15 @@ class NovitaAIBinding(LollmsLLMBinding):
                 response = requests.post(url, headers=self.headers, json=payload)
                 response.raise_for_status()
                 data = response.json()
-
+                choice = data["choices"][0]["message"]
+                content = choice.get("content", "")
+                reasoning = choice.get("reasoning_content", "")
+
+                if think and reasoning:
+                    return f"<think>\n{reasoning}\n</think>\n{content}"
+
+                return content
+
         except requests.exceptions.HTTPError as e:
             try:
                 error_details = e.response.json()
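On the non-streaming path, reasoning comes back inline as `<think>\n...\n</think>\n` followed by the answer, per the f-string above. A caller that wants the two parts separately could split them with a regex; this helper is a sketch under that format assumption, not part of the package:

```python
# Sketch: separate the <think> block that chat()/generate_text() prepend
# (when think=True) from the final answer text.
import re

def split_think(text: str) -> tuple[str, str]:
    """Return (reasoning, answer); reasoning is "" if no <think> block is present."""
    match = re.match(r"<think>\n?(.*?)\n?</think>\n?(.*)", text, re.DOTALL)
    if match:
        return match.group(1), match.group(2)
    return "", text
```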
@@ -211,7 +347,7 @@ class NovitaAIBinding(LollmsLLMBinding):
             "supports_vision": False
         }
 
-    def
+    def list_models(self) -> List[Dict[str, str]]:
         """
         Lists available models. Novita AI API does not have a models endpoint,
         so a hardcoded list from their documentation is returned.
@@ -242,7 +378,7 @@ if __name__ == '__main__':
 
     # --- List Models ---
     ASCIIColors.cyan("\n--- Listing Models (static list) ---")
-    models = binding.
+    models = binding.list_models()
     if models:
         ASCIIColors.green(f"Found {len(models)} models.")
         for m in models: