PyPI - webscout - Versions diffs - 8.2.4__py3-none-any.whl → 8.2.6__py3-none-any.whl - Mend

webscout 8.2.4__py3-none-any.whl → 8.2.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of webscout might be problematic. Click here for more details.

Files changed (110)

webscout/AIauto.py +112 -22
webscout/AIutel.py +240 -344
webscout/Extra/autocoder/autocoder.py +66 -5
webscout/Extra/gguf.py +2 -0
webscout/Provider/AISEARCH/scira_search.py +3 -5
webscout/Provider/Aitopia.py +75 -51
webscout/Provider/AllenAI.py +64 -67
webscout/Provider/ChatGPTClone.py +33 -34
webscout/Provider/ChatSandbox.py +342 -0
webscout/Provider/Cloudflare.py +79 -32
webscout/Provider/Deepinfra.py +69 -56
webscout/Provider/ElectronHub.py +48 -39
webscout/Provider/ExaChat.py +36 -20
webscout/Provider/GPTWeb.py +24 -18
webscout/Provider/GithubChat.py +52 -49
webscout/Provider/GizAI.py +285 -0
webscout/Provider/Glider.py +39 -28
webscout/Provider/Groq.py +48 -20
webscout/Provider/HeckAI.py +18 -36
webscout/Provider/Jadve.py +30 -37
webscout/Provider/LambdaChat.py +36 -59
webscout/Provider/MCPCore.py +18 -21
webscout/Provider/Marcus.py +23 -14
webscout/Provider/Nemotron.py +218 -0
webscout/Provider/Netwrck.py +35 -26
webscout/Provider/OPENAI/__init__.py +1 -1
webscout/Provider/OPENAI/exachat.py +4 -0
webscout/Provider/OPENAI/scirachat.py +3 -4
webscout/Provider/OPENAI/textpollinations.py +20 -22
webscout/Provider/OPENAI/toolbaz.py +1 -0
webscout/Provider/PI.py +22 -13
webscout/Provider/StandardInput.py +42 -30
webscout/Provider/TeachAnything.py +24 -12
webscout/Provider/TextPollinationsAI.py +78 -76
webscout/Provider/TwoAI.py +120 -88
webscout/Provider/TypliAI.py +305 -0
webscout/Provider/Venice.py +24 -22
webscout/Provider/VercelAI.py +31 -12
webscout/Provider/WiseCat.py +1 -1
webscout/Provider/WrDoChat.py +370 -0
webscout/Provider/__init__.py +11 -13
webscout/Provider/ai4chat.py +5 -3
webscout/Provider/akashgpt.py +59 -66
webscout/Provider/asksteve.py +53 -44
webscout/Provider/cerebras.py +77 -31
webscout/Provider/chatglm.py +47 -37
webscout/Provider/elmo.py +38 -32
webscout/Provider/freeaichat.py +57 -43
webscout/Provider/granite.py +24 -21
webscout/Provider/hermes.py +27 -20
webscout/Provider/learnfastai.py +25 -20
webscout/Provider/llmchatco.py +48 -78
webscout/Provider/multichat.py +13 -3
webscout/Provider/scira_chat.py +50 -30
webscout/Provider/scnet.py +27 -21
webscout/Provider/searchchat.py +16 -24
webscout/Provider/sonus.py +37 -39
webscout/Provider/toolbaz.py +24 -46
webscout/Provider/turboseek.py +37 -41
webscout/Provider/typefully.py +30 -22
webscout/Provider/typegpt.py +47 -51
webscout/Provider/uncovr.py +46 -40
webscout/__init__.py +0 -1
webscout/cli.py +256 -0
webscout/conversation.py +305 -448
webscout/exceptions.py +3 -0
webscout/swiftcli/__init__.py +80 -794
webscout/swiftcli/core/__init__.py +7 -0
webscout/swiftcli/core/cli.py +297 -0
webscout/swiftcli/core/context.py +104 -0
webscout/swiftcli/core/group.py +241 -0
webscout/swiftcli/decorators/__init__.py +28 -0
webscout/swiftcli/decorators/command.py +221 -0
webscout/swiftcli/decorators/options.py +220 -0
webscout/swiftcli/decorators/output.py +252 -0
webscout/swiftcli/exceptions.py +21 -0
webscout/swiftcli/plugins/__init__.py +9 -0
webscout/swiftcli/plugins/base.py +135 -0
webscout/swiftcli/plugins/manager.py +262 -0
webscout/swiftcli/utils/__init__.py +59 -0
webscout/swiftcli/utils/formatting.py +252 -0
webscout/swiftcli/utils/parsing.py +267 -0
webscout/version.py +1 -1
{webscout-8.2.4.dist-info → webscout-8.2.6.dist-info}/METADATA +166 -45
{webscout-8.2.4.dist-info → webscout-8.2.6.dist-info}/RECORD +89 -89
{webscout-8.2.4.dist-info → webscout-8.2.6.dist-info}/WHEEL +1 -1
webscout-8.2.6.dist-info/entry_points.txt +3 -0
{webscout-8.2.4.dist-info → webscout-8.2.6.dist-info}/top_level.txt +0 -1
inferno/__init__.py +0 -6
inferno/__main__.py +0 -9
inferno/cli.py +0 -6
inferno/lol.py +0 -589
webscout/LLM.py +0 -442
webscout/Local/__init__.py +0 -12
webscout/Local/__main__.py +0 -9
webscout/Local/api.py +0 -576
webscout/Local/cli.py +0 -516
webscout/Local/config.py +0 -75
webscout/Local/llm.py +0 -287
webscout/Local/model_manager.py +0 -253
webscout/Local/server.py +0 -721
webscout/Local/utils.py +0 -93
webscout/Provider/Chatify.py +0 -175
webscout/Provider/PizzaGPT.py +0 -228
webscout/Provider/askmyai.py +0 -158
webscout/Provider/gaurish.py +0 -244
webscout/Provider/promptrefine.py +0 -193
webscout/Provider/tutorai.py +0 -270
webscout-8.2.4.dist-info/entry_points.txt +0 -5
{webscout-8.2.4.dist-info → webscout-8.2.6.dist-info}/licenses/LICENSE.md +0 -0

webscout/Provider/scira_chat.py CHANGED Viewed

@@ -1,11 +1,12 @@
 from os import system
-import requests
+from curl_cffi import CurlError
+from curl_cffi.requests import Session
 import json
 import uuid
 import re
-from typing import Any, Dict, Optional, Union
+from typing import Any, Dict, Optional, Union, List
 from webscout.AIutel import Optimizers
-from webscout.AIutel import Conversation
+from webscout.AIutel import Conversation, sanitize_stream # Import sanitize_stream
 from webscout.AIutel import AwesomePrompts
 from webscout.AIbase import Provider
 from webscout import exceptions
@@ -17,15 +18,14 @@ class SciraAI(Provider):
     """
     AVAILABLE_MODELS = {
-        "scira-default": "Grok3",
-        "scira-grok-3-mini": "Grok3-mini", # thinking model
+        "scira-default": "Grok3-mini", # thinking model
+        "scira-grok-3": "Grok3",
+        "scira-anthropic": "Sonnet 3.7 thinking",
         "scira-vision" : "Grok2-Vision", # vision model
         "scira-4.1-mini": "GPT4.1-mini",
         "scira-qwq": "QWQ-32B",
         "scira-o4-mini": "o4-mini",
         "scira-google": "gemini 2.5 flash"
     }
     def __init__(
@@ -92,9 +92,9 @@ class SciraAI(Provider):
             "Sec-Fetch-Site": "same-origin"
         }
-        self.session = requests.Session()
+        self.session = Session() # Use curl_cffi Session
         self.session.headers.update(self.headers)
-        self.session.proxies.update(proxies)
+        self.session.proxies = proxies # Assign proxies directly
         self.is_conversation = is_conversation
         self.max_tokens_to_sample = max_tokens
@@ -150,12 +150,23 @@ class SciraAI(Provider):
         return self.fingerprint
+    @staticmethod
+    def _scira_extractor(chunk: Union[str, Dict[str, Any]]) -> Optional[str]:
+        """Extracts content from the Scira stream format '0:"..."'."""
+        if isinstance(chunk, str):
+            match = re.search(r'0:"(.*?)"(?=,|$)', chunk) # Look for 0:"...", possibly followed by comma or end of string
+            if match:
+                # Decode potential unicode escapes like \u00e9 and handle escaped quotes/backslashes
+                content = match.group(1).encode().decode('unicode_escape')
+                return content.replace('\\\\', '\\').replace('\\"', '"')
+        return None
     def ask(
         self,
         prompt: str,
         optimizer: str = None,
         conversationally: bool = False,
-    ) -> Dict[str, Any]:
+    ) -> Dict[str, Any]: # Note: Stream parameter removed as API doesn't seem to support it
         conversation_prompt = self.conversation.gen_complete_prompt(prompt)
         if optimizer:
             if optimizer in self.__available_optimizers:
@@ -181,10 +192,16 @@ class SciraAI(Provider):
         }
         try:
-            response = self.session.post(self.url, json=payload, timeout=self.timeout)
+            # Use curl_cffi post with impersonate
+            response = self.session.post(
+                self.url,
+                json=payload,
+                timeout=self.timeout,
+                impersonate="chrome120" # Add impersonate
+            )
             if response.status_code != 200:
                 # Try to get response content for better error messages
-                try:
+                try: # Use try-except for reading response content
                     error_content = response.text
                 except:
                     error_content = "<could not read response content>"
@@ -192,7 +209,10 @@ class SciraAI(Provider):
                 if response.status_code in [403, 429]:
                     print(f"Received status code {response.status_code}, refreshing identity...")
                     self.refresh_identity()
-                    response = self.session.post(self.url, json=payload, timeout=self.timeout)
+                    response = self.session.post(
+                        self.url, json=payload, timeout=self.timeout,
+                        impersonate="chrome120" # Add impersonate to retry
+                    )
                     if not response.ok:
                         raise exceptions.FailedToGenerateResponseError(
                             f"Failed to generate response after identity refresh - ({response.status_code}, {response.reason}) - {error_content}"
@@ -203,28 +223,27 @@ class SciraAI(Provider):
                         f"Request failed with status code {response.status_code}. Response: {error_content}"
                     )
-            full_response = ""
-            debug_lines = []
-            # Collect the first few lines for debugging
-            for i, line in enumerate(response.iter_lines()):
-                if line:
-                    try:
-                        line_str = line.decode('utf-8')
-                        debug_lines.append(line_str)
+            response_text_raw = response.text # Get raw response text
-                        # Format 2: 0:"content" (quoted format)
-                        match = re.search(r'0:"(.*?)"', line_str)
-                        if match:
-                            content = match.group(1)
-                            full_response += content
-                            continue
+            # Process the text using sanitize_stream line by line
+            processed_stream = sanitize_stream(
+                data=response_text_raw.splitlines(), # Split into lines
+                intro_value=None, # No simple prefix
+                to_json=False,    # Content is not JSON
+                content_extractor=self._scira_extractor # Use the specific extractor
+            )
+            # Aggregate the results from the generator
+            full_response = ""
+            for content in processed_stream:
+                if content and isinstance(content, str):
+                    full_response += content
-                    except: pass
             self.last_response = {"text": full_response}
             self.conversation.update_chat_history(prompt, full_response)
             return {"text": full_response}
+        except CurlError as e: # Catch CurlError
+            raise exceptions.FailedToGenerateResponseError(f"Request failed (CurlError): {e}") from e
         except Exception as e:
             raise exceptions.FailedToGenerateResponseError(f"Request failed: {e}")
@@ -242,7 +261,8 @@ class SciraAI(Provider):
     def get_message(self, response: dict) -> str:
         assert isinstance(response, dict), "Response should be of dict data-type only"
-        return response["text"].replace('\\n', '\n').replace('\\n\\n', '\n\n')
+        # Extractor handles formatting
+        return response.get("text", "").replace('\\n', '\n').replace('\\n\\n', '\n\n')
 if __name__ == "__main__":
     print("-" * 100)

webscout/Provider/scnet.py CHANGED Viewed

@@ -4,7 +4,7 @@ import json
 import secrets
 from typing import Any, Dict, Optional, Generator, Union
-from webscout.AIutel import Optimizers, Conversation, AwesomePrompts
+from webscout.AIutel import Optimizers, Conversation, AwesomePrompts, sanitize_stream
 from webscout.AIbase import Provider
 from webscout import exceptions
@@ -29,7 +29,10 @@ class SCNet(Provider):
         is_conversation: bool = True,
         max_tokens: int = 2048, # Note: max_tokens is not used by this API
         timeout: int = 30,
-        intro: Optional[str] = None,
+        intro: Optional[str] = ("You are a helpful, advanced LLM assistant. "
+            "You must always answer in English, regardless of the user's language. "
+            "If the user asks in another language, politely respond in English only. "
+            "Be clear, concise, and helpful."),
         filepath: Optional[str] = None,
         update_file: bool = True,
         proxies: Optional[dict] = None,
@@ -86,6 +89,13 @@ class SCNet(Provider):
         self.conversation = Conversation(is_conversation, max_tokens, filepath, update_file)
         self.conversation.history_offset = history_offset
+    @staticmethod
+    def _scnet_extractor(chunk: Union[str, Dict[str, Any]]) -> Optional[str]:
+        """Extracts content from SCNet stream JSON objects."""
+        if isinstance(chunk, dict):
+            return chunk.get("content")
+        return None
     def ask(
         self,
         prompt: str,
@@ -126,25 +136,21 @@ class SCNet(Provider):
                 response.raise_for_status() # Check for HTTP errors
                 streaming_text = ""
-                # Iterate over bytes and decode manually
-                for line_bytes in response.iter_lines():
-                    if line_bytes:
-                        line = line_bytes.decode('utf-8') # Decode bytes
-                        if line.startswith("data:"):
-                            data = line[5:].strip()
-                            if data and data != "[done]":
-                                try:
-                                    obj = json.loads(data)
-                                    content = obj.get("content", "")
-                                    streaming_text += content
-                                    resp = {"text": content}
-                                    # Yield dict or raw string
-                                    yield resp if not raw else content
-                                except (json.JSONDecodeError, UnicodeDecodeError):
-                                    continue
-                            elif data == "[done]":
-                                break
+                # Use sanitize_stream
+                processed_stream = sanitize_stream(
+                    data=response.iter_content(chunk_size=None), # Pass byte iterator
+                    intro_value="data:",
+                    to_json=True,     # Stream sends JSON
+                    skip_markers=["[done]"],
+                    content_extractor=self._scnet_extractor, # Use the specific extractor
+                    yield_raw_on_error=False # Skip non-JSON lines or lines where extractor fails
+                )
+                for content_chunk in processed_stream:
+                    # content_chunk is the string extracted by _scnet_extractor
+                    if content_chunk and isinstance(content_chunk, str):
+                        streaming_text += content_chunk
+                        yield {"text": content_chunk} if not raw else content_chunk
                 # Update history and last response after stream finishes
                 self.last_response = {"text": streaming_text}
                 self.conversation.update_chat_history(prompt, streaming_text)

webscout/Provider/searchchat.py CHANGED Viewed

@@ -6,7 +6,7 @@ from typing import Any, Dict, Optional, Generator, Union
 from webscout.AIutel import Optimizers
 from webscout.AIutel import Conversation
-from webscout.AIutel import AwesomePrompts
+from webscout.AIutel import AwesomePrompts, sanitize_stream # Import sanitize_stream
 from webscout.AIbase import Provider
 from webscout import exceptions
 from webscout.litagent import LitAgent
@@ -183,33 +183,25 @@ class SearchChatAI(Provider):
                         )
                 streaming_text = ""
-                # Iterate over bytes and decode manually
-                for line_bytes in response.iter_lines():
-                    if line_bytes:
-                        line = line_bytes.decode('utf-8')
-                        if line.startswith('data: '):
-                            data_str = line[6:]  # Remove 'data: ' prefix
-                            if data_str == '[DONE]':
-                                break
-                            try:
-                                data = json.loads(data_str)
-                                if "choices" in data and len(data["choices"]) > 0:
-                                    delta = data["choices"][0].get("delta", {})
-                                    if "content" in delta and delta["content"] is not None:
-                                        content = delta["content"]
-                                        streaming_text += content
-                                        resp = dict(text=content)
-                                        # Yield dict or raw string
-                                        yield resp if not raw else content
-                            except (json.JSONDecodeError, UnicodeDecodeError):
-                                continue
+                # Use sanitize_stream
+                processed_stream = sanitize_stream(
+                    data=response.iter_content(chunk_size=None), # Pass byte iterator
+                    intro_value="data:",
+                    to_json=True,     # Stream sends JSON
+                    skip_markers=["[DONE]"],
+                    content_extractor=lambda chunk: chunk.get('choices', [{}])[0].get('delta', {}).get('content') if isinstance(chunk, dict) else None,
+                    yield_raw_on_error=False # Skip non-JSON or lines where extractor fails
+                )
+                for content_chunk in processed_stream:
+                    # content_chunk is the string extracted by the content_extractor
+                    if content_chunk and isinstance(content_chunk, str):
+                        streaming_text += content_chunk
+                        yield dict(text=content_chunk) if not raw else content_chunk
                 # Update history and last response after stream finishes
                 self.last_response = {"text": streaming_text}
                 self.conversation.update_chat_history(prompt, streaming_text)
             except CurlError as e: # Catch CurlError
                 raise exceptions.FailedToGenerateResponseError(f"Request failed (CurlError): {str(e)}") from e
             except Exception as e: # Catch other potential exceptions

webscout/Provider/sonus.py CHANGED Viewed

@@ -4,7 +4,7 @@ import json
 from typing import Any, Dict, Optional, Generator, Union
 from webscout.AIutel import Optimizers
 from webscout.AIutel import Conversation
-from webscout.AIutel import AwesomePrompts
+from webscout.AIutel import AwesomePrompts, sanitize_stream # Import sanitize_stream
 from webscout.AIbase import Provider
 from webscout import exceptions
 from webscout.litagent import LitAgent
@@ -78,6 +78,13 @@ class SonusAI(Provider):
         )
         self.conversation.history_offset = history_offset
+    @staticmethod
+    def _sonus_extractor(chunk: Union[str, Dict[str, Any]]) -> Optional[str]:
+        """Extracts content from Sonus stream JSON objects."""
+        if isinstance(chunk, dict) and "content" in chunk:
+            return chunk.get("content")
+        return None
     def ask(
         self,
         prompt: str,
@@ -124,30 +131,22 @@ class SonusAI(Provider):
                     raise exceptions.FailedToGenerateResponseError(
                         f"Request failed with status code {response.status_code} - {response.text}"
                     )
                 streaming_text = ""
-                # Iterate over bytes and decode manually
-                for line_bytes in response.iter_lines():
-                    if line_bytes:
-                        try:
-                            # Decode the line and remove 'data: ' prefix if present
-                            line = line_bytes.decode('utf-8')
-                            if line.startswith('data: '):
-                                line = line[6:]
-                            # Handle potential empty lines after prefix removal
-                            if not line.strip():
-                                continue
+                # Use sanitize_stream
+                processed_stream = sanitize_stream(
+                    data=response.iter_content(chunk_size=None), # Pass byte iterator
+                    intro_value="data:",
+                    to_json=True,     # Stream sends JSON
+                    content_extractor=self._sonus_extractor, # Use the specific extractor
+                    yield_raw_on_error=False # Skip non-JSON lines or lines where extractor fails
+                )
-                            data = json.loads(line)
-                            if "content" in data:
-                                content = data["content"]
-                                streaming_text += content
-                                resp = dict(text=content)
-                                # Yield dict or raw string
-                                yield resp if raw else resp
-                        except (json.JSONDecodeError, UnicodeDecodeError):
-                            continue
+                for content_chunk in processed_stream:
+                    # content_chunk is the string extracted by _sonus_extractor
+                    if content_chunk and isinstance(content_chunk, str):
+                        streaming_text += content_chunk
+                        yield dict(text=content_chunk) if not raw else content_chunk
                 # Update history and last response after stream finishes
                 self.last_response = {"text": streaming_text}
@@ -173,23 +172,22 @@ class SonusAI(Provider):
                         f"Request failed with status code {response.status_code} - {response.text}"
                     )
+                response_text_raw = response.text # Get raw text
+                # Use sanitize_stream to process the non-streaming text
+                processed_stream = sanitize_stream(
+                    data=response_text_raw.splitlines(), # Split into lines
+                    intro_value="data:",
+                    to_json=True,
+                    content_extractor=self._sonus_extractor,
+                    yield_raw_on_error=False
+                )
+                # Aggregate the results
                 full_response = ""
-                # Process the full response text which might contain multiple JSON objects
-                # Split by lines and process each potential JSON object
-                for line in response.text.splitlines():
-                    if line:
-                        try:
-                            if line.startswith('data: '):
-                                line = line[6:]
-                            if not line.strip():
-                                continue
-                            data = json.loads(line)
-                            if "content" in data:
-                                full_response += data["content"]
-                        except (json.JSONDecodeError, UnicodeDecodeError):
-                            continue
+                for content in processed_stream:
+                    if content and isinstance(content, str):
+                        full_response += content
                 self.last_response = {"text": full_response}
                 self.conversation.update_chat_history(prompt, full_response)

webscout/Provider/toolbaz.py CHANGED Viewed

@@ -13,7 +13,7 @@ from typing import Any, Dict, Optional, Generator, Union, List
 from webscout import exceptions
 from webscout.AIutel import Optimizers
 from webscout.AIutel import Conversation
-from webscout.AIutel import AwesomePrompts
+from webscout.AIutel import AwesomePrompts, sanitize_stream # Import sanitize_stream
 from webscout.AIbase import Provider
 class Toolbaz(Provider):
@@ -26,6 +26,7 @@ class Toolbaz(Provider):
         "gemini-2.0-flash-thinking",
         "gemini-2.0-flash",
         "gemini-1.5-flash",
+        "o3-mini",
         "gpt-4o-latest",
         "gpt-4o",
         "deepseek-r1",
@@ -111,6 +112,13 @@ class Toolbaz(Provider):
         )
         self.conversation.history_offset = history_offset
+    @staticmethod
+    def _toolbaz_extractor(chunk: Union[str, Dict[str, Any]]) -> Optional[str]:
+        """Removes [model:...] tags from a string chunk."""
+        if isinstance(chunk, str):
+            return re.sub(r"\[model:.*?\]", "", chunk)
+        return None
     def random_string(self, length):
         return ''.join(random.choices(string.ascii_letters + string.digits, k=length))
@@ -207,53 +215,23 @@ class Toolbaz(Provider):
                 )
                 resp.raise_for_status()
-                buffer = ""
-                tag_start = "[model:"
                 streaming_text = ""
-                # Iterate over bytes and decode manually
-                for chunk_bytes in resp.iter_content(chunk_size=1024): # Read in larger chunks
-                    if chunk_bytes:
-                        text = chunk_bytes.decode(errors="ignore")
-                        buffer += text
-                        processed_buffer = ""
-                        last_processed_index = 0
-                        # Find all complete tags and process text between them
-                        for match in re.finditer(r"\[model:.*?\]", buffer):
-                            # Add text before the tag
-                            segment = buffer[last_processed_index:match.start()]
-                            if segment:
-                                processed_buffer += segment
-                            last_processed_index = match.end()
-                        # Add remaining text after the last complete tag
-                        processed_buffer += buffer[last_processed_index:]
-                        # Now, check for incomplete tag at the end
-                        last_tag_start_index = processed_buffer.rfind(tag_start)
-                        if last_tag_start_index != -1:
-                            # Text before the potential incomplete tag
-                            text_to_yield = processed_buffer[:last_tag_start_index]
-                            # Keep the potential incomplete tag start for the next iteration
-                            buffer = processed_buffer[last_tag_start_index:]
-                        else:
-                            # No potential incomplete tag found, yield everything processed
-                            text_to_yield = processed_buffer
-                            buffer = "" # Clear buffer as everything is processed
-                        if text_to_yield:
-                            streaming_text += text_to_yield
-                            # Yield dict or raw string
-                            yield {"text": text_to_yield} if not raw else text_to_yield
-                # Process any remaining text in the buffer after the loop finishes
-                # Remove any potential tags (complete or incomplete)
-                final_text = re.sub(r"\[model:.*?\]", "", buffer)
-                if final_text:
-                    streaming_text += final_text
-                    yield {"text": final_text} if not raw else final_text
+                # Use sanitize_stream with the custom extractor
+                # It will decode bytes and yield processed string chunks
+                processed_stream = sanitize_stream(
+                    data=resp.iter_content(chunk_size=None), # Pass byte iterator
+                    intro_value=None, # No simple prefix
+                    to_json=False,    # Content is text
+                    content_extractor=self._toolbaz_extractor, # Use the tag remover
+                    yield_raw_on_error=True # Yield even if extractor somehow fails (though unlikely for regex)
+                )
+                for content_chunk in processed_stream:
+                    # content_chunk is the string with tags removed
+                    if content_chunk and isinstance(content_chunk, str):
+                        streaming_text += content_chunk
+                        yield {"text": content_chunk} if not raw else content_chunk
                 self.last_response = {"text": streaming_text}
                 self.conversation.update_chat_history(prompt, streaming_text)

webscout/Provider/turboseek.py CHANGED Viewed

@@ -4,10 +4,10 @@ import json
 from webscout.AIutel import Optimizers
 from webscout.AIutel import Conversation
-from webscout.AIutel import AwesomePrompts, sanitize_stream
+from webscout.AIutel import AwesomePrompts, sanitize_stream # Import sanitize_stream
 from webscout.AIbase import Provider
 from webscout import exceptions
-from typing import Union, Any, AsyncGenerator, Dict
+from typing import Optional, Union, Any, AsyncGenerator, Dict
 from webscout.litagent import LitAgent
 class TurboSeek(Provider):
@@ -88,6 +88,13 @@ class TurboSeek(Provider):
         )
         self.conversation.history_offset = history_offset
+    @staticmethod
+    def _turboseek_extractor(chunk: Union[str, Dict[str, Any]]) -> Optional[str]:
+        """Extracts content from TurboSeek stream JSON objects."""
+        if isinstance(chunk, dict) and "text" in chunk:
+            return chunk.get("text") # json.loads already handles unicode escapes
+        return None
     def ask(
         self,
         prompt: str,
@@ -142,24 +149,24 @@ class TurboSeek(Provider):
                     raise exceptions.FailedToGenerateResponseError(
                         f"Failed to generate response - ({response.status_code}, {response.reason}) - {response.text}"
                     )
                 streaming_text = ""
-                # Iterate over bytes and decode manually
-                for value_bytes in response.iter_lines():
-                    try:
-                        if value_bytes and value_bytes.startswith(b"data: "): # Check for bytes
-                            # Decode bytes to string
-                            line = value_bytes[6:].decode('utf-8')
-                            data = json.loads(line)
-                            if "text" in data:
-                                # Decode potential unicode escapes
-                                content = data["text"].encode().decode('unicode_escape')
-                                streaming_text += content
-                                resp = dict(text=content)
-                                self.last_response.update(resp) # Update last_response incrementally
-                                # Yield raw bytes or dict based on flag
-                                yield value_bytes if raw else resp
-                    except (json.decoder.JSONDecodeError, UnicodeDecodeError):
-                        pass # Ignore lines that are not valid JSON or cannot be decoded
+                # Use sanitize_stream with the custom extractor
+                processed_stream = sanitize_stream(
+                    data=response.iter_content(chunk_size=None), # Pass byte iterator
+                    intro_value="data:",
+                    to_json=True,     # Stream sends JSON
+                    content_extractor=self._turboseek_extractor, # Use the specific extractor
+                    yield_raw_on_error=False # Skip non-JSON lines or lines where extractor fails
+                )
+                for content_chunk in processed_stream:
+                    # content_chunk is the string extracted by _turboseek_extractor
+                    if content_chunk and isinstance(content_chunk, str):
+                        streaming_text += content_chunk
+                        self.last_response.update(dict(text=streaming_text)) # Update last_response incrementally
+                        yield dict(text=content_chunk) if not raw else content_chunk # Yield dict or raw string
                 # Update conversation history after stream finishes
                 if streaming_text: # Only update if content was received
                     self.conversation.update_chat_history(
@@ -174,21 +181,15 @@ class TurboSeek(Provider):
         def for_non_stream():
             # Aggregate the stream using the updated for_stream logic
             full_text = ""
-            for chunk_data in for_stream():
-                 # Ensure chunk_data is a dict (not raw) and has 'text'
-                if isinstance(chunk_data, dict) and "text" in chunk_data:
-                    full_text += chunk_data["text"]
-                # If raw=True, chunk_data is bytes, decode and process if needed (though raw non-stream is less common)
-                elif isinstance(chunk_data, bytes):
-                     try:
-                         if chunk_data.startswith(b"data: "):
-                             line = chunk_data[6:].decode('utf-8')
-                             data = json.loads(line)
-                             if "text" in data:
-                                 content = data["text"].encode().decode('unicode_escape')
-                                 full_text += content
-                     except (json.decoder.JSONDecodeError, UnicodeDecodeError):
-                         pass
+            try:
+                # Ensure raw=False so for_stream yields dicts
+                for chunk_data in for_stream():
+                    if isinstance(chunk_data, dict) and "text" in chunk_data:
+                        full_text += chunk_data["text"]
+                    elif isinstance(chunk_data, str): # Handle case where raw=True was passed
+                        full_text += chunk_data
+            except Exception as e:
+                raise exceptions.FailedToGenerateResponseError(f"Failed to aggregate non-stream response: {e}") from e
             # last_response and history are updated within for_stream
             # Ensure last_response reflects the complete aggregated text
             self.last_response = {"text": full_text}
@@ -241,7 +242,7 @@ class TurboSeek(Provider):
             str: Message extracted
         """
         assert isinstance(response, dict), "Response should be of dict data-type only"
-        # Text is already decoded in ask method
+        # Unicode escapes are handled by json.loads within sanitize_stream
         return response.get("text", "")
 if __name__ == '__main__':
@@ -250,13 +251,9 @@ if __name__ == '__main__':
     try: # Add try-except block for testing
         ai = TurboSeek(timeout=60)
         print("[bold blue]Testing Stream:[/bold blue]")
-        response_stream = ai.chat("hello buddy", stream=True)
-        full_stream_response = ""
+        response_stream = ai.chat("yooooooooooo", stream=True)
         for chunk in response_stream:
             print(chunk, end="", flush=True)
-            full_stream_response += chunk
-        print("\n[bold green]Stream Test Complete.[/bold green]\n")
         # Optional: Test non-stream
         # print("[bold blue]Testing Non-Stream:[/bold blue]")
         # response_non_stream = ai.chat("What is the capital of France?", stream=False)
@@ -267,4 +264,3 @@ if __name__ == '__main__':
         print(f"\n[bold red]API Error:[/bold red] {e}")
     except Exception as e:
         print(f"\n[bold red]An unexpected error occurred:[/bold red] {e}")

webscout 8.2.4__py3-none-any.whl → 8.2.6__py3-none-any.whl

Potentially problematic release.

webscout 8.2.4__py3-none-any.whl → 8.2.6__py3-none-any.whl