webscout-8.3-py3-none-any.whl → webscout-8.3.2-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of webscout might be problematic.

Files changed (120)
  1. webscout/AIauto.py +4 -4
  2. webscout/AIbase.py +61 -1
  3. webscout/AIutel.py +46 -53
  4. webscout/Bing_search.py +418 -0
  5. webscout/Extra/YTToolkit/ytapi/patterns.py +45 -45
  6. webscout/Extra/YTToolkit/ytapi/stream.py +1 -1
  7. webscout/Extra/YTToolkit/ytapi/video.py +10 -10
  8. webscout/Extra/autocoder/autocoder_utiles.py +1 -1
  9. webscout/Extra/gguf.py +706 -177
  10. webscout/Litlogger/formats.py +9 -0
  11. webscout/Litlogger/handlers.py +18 -0
  12. webscout/Litlogger/logger.py +43 -1
  13. webscout/Provider/AISEARCH/genspark_search.py +7 -7
  14. webscout/Provider/AISEARCH/scira_search.py +3 -2
  15. webscout/Provider/GeminiProxy.py +140 -0
  16. webscout/Provider/LambdaChat.py +7 -1
  17. webscout/Provider/MCPCore.py +78 -75
  18. webscout/Provider/OPENAI/BLACKBOXAI.py +1046 -1017
  19. webscout/Provider/OPENAI/GeminiProxy.py +328 -0
  20. webscout/Provider/OPENAI/Qwen3.py +303 -303
  21. webscout/Provider/OPENAI/README.md +5 -0
  22. webscout/Provider/OPENAI/README_AUTOPROXY.md +238 -0
  23. webscout/Provider/OPENAI/TogetherAI.py +355 -0
  24. webscout/Provider/OPENAI/__init__.py +16 -1
  25. webscout/Provider/OPENAI/autoproxy.py +332 -0
  26. webscout/Provider/OPENAI/base.py +101 -14
  27. webscout/Provider/OPENAI/chatgpt.py +15 -2
  28. webscout/Provider/OPENAI/chatgptclone.py +14 -3
  29. webscout/Provider/OPENAI/deepinfra.py +339 -328
  30. webscout/Provider/OPENAI/e2b.py +295 -74
  31. webscout/Provider/OPENAI/mcpcore.py +109 -70
  32. webscout/Provider/OPENAI/opkfc.py +18 -6
  33. webscout/Provider/OPENAI/scirachat.py +59 -50
  34. webscout/Provider/OPENAI/toolbaz.py +2 -10
  35. webscout/Provider/OPENAI/writecream.py +166 -166
  36. webscout/Provider/OPENAI/x0gpt.py +367 -367
  37. webscout/Provider/OPENAI/xenai.py +514 -0
  38. webscout/Provider/OPENAI/yep.py +389 -383
  39. webscout/Provider/STT/__init__.py +3 -0
  40. webscout/Provider/STT/base.py +281 -0
  41. webscout/Provider/STT/elevenlabs.py +265 -0
  42. webscout/Provider/TTI/__init__.py +4 -1
  43. webscout/Provider/TTI/aiarta.py +399 -365
  44. webscout/Provider/TTI/base.py +74 -2
  45. webscout/Provider/TTI/bing.py +231 -0
  46. webscout/Provider/TTI/fastflux.py +63 -30
  47. webscout/Provider/TTI/gpt1image.py +149 -0
  48. webscout/Provider/TTI/imagen.py +196 -0
  49. webscout/Provider/TTI/magicstudio.py +60 -29
  50. webscout/Provider/TTI/piclumen.py +43 -32
  51. webscout/Provider/TTI/pixelmuse.py +232 -225
  52. webscout/Provider/TTI/pollinations.py +43 -32
  53. webscout/Provider/TTI/together.py +287 -0
  54. webscout/Provider/TTI/utils.py +2 -1
  55. webscout/Provider/TTS/README.md +1 -0
  56. webscout/Provider/TTS/__init__.py +2 -1
  57. webscout/Provider/TTS/freetts.py +140 -0
  58. webscout/Provider/TTS/speechma.py +45 -39
  59. webscout/Provider/TogetherAI.py +366 -0
  60. webscout/Provider/UNFINISHED/ChutesAI.py +314 -0
  61. webscout/Provider/UNFINISHED/fetch_together_models.py +95 -0
  62. webscout/Provider/XenAI.py +324 -0
  63. webscout/Provider/__init__.py +8 -0
  64. webscout/Provider/deepseek_assistant.py +378 -0
  65. webscout/Provider/scira_chat.py +3 -2
  66. webscout/Provider/toolbaz.py +0 -1
  67. webscout/auth/__init__.py +44 -0
  68. webscout/auth/api_key_manager.py +189 -0
  69. webscout/auth/auth_system.py +100 -0
  70. webscout/auth/config.py +76 -0
  71. webscout/auth/database.py +400 -0
  72. webscout/auth/exceptions.py +67 -0
  73. webscout/auth/middleware.py +248 -0
  74. webscout/auth/models.py +130 -0
  75. webscout/auth/providers.py +257 -0
  76. webscout/auth/rate_limiter.py +254 -0
  77. webscout/auth/request_models.py +127 -0
  78. webscout/auth/request_processing.py +226 -0
  79. webscout/auth/routes.py +526 -0
  80. webscout/auth/schemas.py +103 -0
  81. webscout/auth/server.py +312 -0
  82. webscout/auth/static/favicon.svg +11 -0
  83. webscout/auth/swagger_ui.py +203 -0
  84. webscout/auth/templates/components/authentication.html +237 -0
  85. webscout/auth/templates/components/base.html +103 -0
  86. webscout/auth/templates/components/endpoints.html +750 -0
  87. webscout/auth/templates/components/examples.html +491 -0
  88. webscout/auth/templates/components/footer.html +75 -0
  89. webscout/auth/templates/components/header.html +27 -0
  90. webscout/auth/templates/components/models.html +286 -0
  91. webscout/auth/templates/components/navigation.html +70 -0
  92. webscout/auth/templates/static/api.js +455 -0
  93. webscout/auth/templates/static/icons.js +168 -0
  94. webscout/auth/templates/static/main.js +784 -0
  95. webscout/auth/templates/static/particles.js +201 -0
  96. webscout/auth/templates/static/styles.css +3353 -0
  97. webscout/auth/templates/static/ui.js +374 -0
  98. webscout/auth/templates/swagger_ui.html +170 -0
  99. webscout/client.py +49 -3
  100. webscout/litagent/Readme.md +12 -3
  101. webscout/litagent/agent.py +99 -62
  102. webscout/scout/core/scout.py +104 -26
  103. webscout/scout/element.py +139 -18
  104. webscout/swiftcli/core/cli.py +14 -3
  105. webscout/swiftcli/decorators/output.py +59 -9
  106. webscout/update_checker.py +31 -49
  107. webscout/version.py +1 -1
  108. webscout/webscout_search.py +4 -12
  109. webscout/webscout_search_async.py +3 -10
  110. webscout/yep_search.py +2 -11
  111. {webscout-8.3.dist-info → webscout-8.3.2.dist-info}/METADATA +41 -11
  112. {webscout-8.3.dist-info → webscout-8.3.2.dist-info}/RECORD +116 -68
  113. {webscout-8.3.dist-info → webscout-8.3.2.dist-info}/entry_points.txt +1 -1
  114. webscout/Provider/HF_space/__init__.py +0 -0
  115. webscout/Provider/HF_space/qwen_qwen2.py +0 -206
  116. webscout/Provider/OPENAI/api.py +0 -1035
  117. webscout/Provider/TTI/artbit.py +0 -0
  118. {webscout-8.3.dist-info → webscout-8.3.2.dist-info}/WHEEL +0 -0
  119. {webscout-8.3.dist-info → webscout-8.3.2.dist-info}/licenses/LICENSE.md +0 -0
  120. {webscout-8.3.dist-info → webscout-8.3.2.dist-info}/top_level.txt +0 -0
@@ -1,304 +1,304 @@
- import requests
- import json
- import time
- import uuid
- from typing import List, Dict, Optional, Union, Generator, Any
-
- from webscout.Provider.OPENAI.base import OpenAICompatibleProvider, BaseChat, BaseCompletions
- from webscout.Provider.OPENAI.utils import (
-     ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
-     ChatCompletionMessage, CompletionUsage,
-     get_last_user_message, get_system_prompt,
-     count_tokens
- )
-
- class Completions(BaseCompletions):
-     def __init__(self, client: 'Qwen3'):
-         self._client = client
-
-     def create(
-         self,
-         *,
-         model: str,
-         messages: List[Dict[str, str]],
-         max_tokens: Optional[int] = 2048,
-         stream: bool = False,
-         temperature: Optional[float] = None,
-         top_p: Optional[float] = None,
-         timeout: Optional[int] = None,
-         proxies: Optional[dict] = None,
-         **kwargs: Any
-     ) -> Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]:
-         payload = {
-             "data": [
-                 get_last_user_message(messages),
-                 {
-                     "thinking_budget": kwargs.get("thinking_budget", 38),
-                     "model": self._client.get_model(model),
-                     "sys_prompt": get_system_prompt(messages)
-                 },
-                 None, None
-             ],
-             "event_data": None,
-             "fn_index": 13,
-             "trigger_id": 31,
-             "session_hash": str(uuid.uuid4()).replace('-', '')
-         }
-
-         request_id = f"chatcmpl-{uuid.uuid4()}"
-         created_time = int(time.time())
-
-         if stream:
-             return self._create_stream(request_id, created_time, model, payload, timeout=timeout, proxies=proxies)
-         else:
-             return self._create_non_stream(request_id, created_time, model, payload, timeout=timeout, proxies=proxies)
-
-     def _create_stream(
-         self, request_id: str, created_time: int, model: str, payload: Dict[str, Any],
-         timeout: Optional[int] = None, proxies: Optional[dict] = None
-     ) -> Generator[ChatCompletionChunk, None, None]:
-         original_proxies = self._client.session.proxies.copy()
-         if proxies is not None:
-             self._client.session.proxies = proxies
-         else:
-             self._client.session.proxies = {}
-         try:
-             session = self._client.session
-             headers = self._client.headers
-             # Step 1: Join the queue
-             join_resp = session.post(self._client.api_endpoint, headers=headers, json=payload, timeout=timeout if timeout is not None else self._client.timeout)
-             join_resp.raise_for_status()
-             event_id = join_resp.json().get('event_id')
-             session_hash = payload["session_hash"]
-
-             # Step 2: Stream data
-             params = {'session_hash': session_hash}
-             stream_resp = session.get(self._client.url + "/gradio_api/queue/data", headers=self._client.stream_headers, params=params, stream=True, timeout=timeout if timeout is not None else self._client.timeout)
-             stream_resp.raise_for_status()
-
-             # --- New logic to yield all content, tool reasoning, and status, similar to Reasoning class ---
-             is_thinking_tag_open = False  # True if <think> has been yielded and not yet </think>
-
-             for line in stream_resp.iter_lines():
-                 if line:
-                     decoded_line = line.decode('utf-8')
-                     if decoded_line.startswith('data: '):
-                         try:
-                             json_data = json.loads(decoded_line[6:])
-                             if json_data.get('msg') == 'process_generating':
-                                 if 'output' in json_data and 'data' in json_data['output'] and len(json_data['output']['data']) > 5:
-                                     updates_list = json_data['output']['data'][5]  # This is a list of operations
-                                     for op_details in updates_list:
-                                         action = op_details[0]
-                                         path = op_details[1]
-                                         value = op_details[2]
-
-                                         content_to_yield = None
-                                         is_current_op_tool = False
-                                         is_current_op_text = False
-
-                                         # Case 1: Adding a new content block (tool or text object)
-                                         if action == "add" and isinstance(value, dict) and "type" in value:
-                                             if len(path) == 4 and path[0] == "value" and path[2] == "content":
-                                                 block_type = value.get("type")
-                                                 content_to_yield = value.get("content")
-                                                 if block_type == "tool":
-                                                     is_current_op_tool = True
-                                                 elif block_type == "text":
-                                                     is_current_op_text = True
-
-                                         # Case 2: Appending content string to an existing block
-                                         elif action == "append" and isinstance(value, str):
-                                             if len(path) == 5 and path[0] == "value" and path[2] == "content" and path[4] == "content":
-                                                 block_index = path[3]  # 0 for tool's content, 1 for text's content
-                                                 content_to_yield = value
-                                                 if block_index == 0:  # Appending to tool's content
-                                                     is_current_op_tool = True
-                                                 elif block_index == 1:  # Appending to text's content
-                                                     is_current_op_text = True
-
-                                         # Case 3: Tool status update (e.g., "End of Thought")
-                                         elif action == "replace" and len(path) == 6 and \
-                                                 path[0] == "value" and path[2] == "content" and \
-                                                 path[3] == 0 and path[4] == "options" and path[5] == "status":  # path[3]==0 ensures it's the tool block
-                                             if value == "done":  # Tool block processing is complete
-                                                 if is_thinking_tag_open:
-                                                     delta = ChoiceDelta(content="</think>\n\n", role="assistant")
-                                                     yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
-                                                     is_thinking_tag_open = False
-                                             continue  # This operation itself doesn't yield visible content
-
-                                         # Yielding logic
-                                         if is_current_op_tool and content_to_yield:
-                                             if not is_thinking_tag_open:
-                                                 delta = ChoiceDelta(content="<think>", role="assistant")
-                                                 yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
-                                                 is_thinking_tag_open = True
-
-                                             delta = ChoiceDelta(content=content_to_yield, role="assistant")
-                                             yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
-
-                                         elif is_current_op_text and content_to_yield:
-                                             if is_thinking_tag_open:  # If text starts, close any open thinking tag
-                                                 delta = ChoiceDelta(content="</think>", role="assistant")
-                                                 yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
-                                                 is_thinking_tag_open = False
-
-                                             delta = ChoiceDelta(content=content_to_yield, role="assistant")
-                                             yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
-
-                             if json_data.get('msg') == 'process_completed':
-                                 if is_thinking_tag_open:  # Ensure </think> is yielded if process completes mid-thought
-                                     delta = ChoiceDelta(content="</think>", role="assistant")
-                                     yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
-                                     is_thinking_tag_open = False
-                                 break
-                         except json.JSONDecodeError:
-                             continue
-                         except Exception as e:
-                             # Log or handle other potential exceptions
-                             continue
-
-             # After the loop, ensure the tag is closed if the stream broke for reasons other than 'process_completed'
-             if is_thinking_tag_open:
-                 delta = ChoiceDelta(content="</think>", role="assistant")
-                 yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
-         finally:
-             self._client.session.proxies = original_proxies
-
-     def _create_non_stream(
-         self, request_id: str, created_time: int, model: str, payload: Dict[str, Any],
-         timeout: Optional[int] = None, proxies: Optional[dict] = None
-     ) -> ChatCompletion:
-         original_proxies = self._client.session.proxies.copy()
-         if proxies is not None:
-             self._client.session.proxies = proxies
-         else:
-             self._client.session.proxies = {}
-         try:
-             # For non-streaming, just call the join endpoint and parse the result
-             session = self._client.session
-             headers = self._client.headers
-             resp = session.post(self._client.api_endpoint, headers=headers, json=payload, timeout=timeout if timeout is not None else self._client.timeout)
-             resp.raise_for_status()
-             data = resp.json()
-             # Return the full content as a single message, including all tool and text reasoning if present
-             output = ""
-             if 'output' in data and 'data' in data['output'] and len(data['output']['data']) > 5:
-                 updates = data['output']['data'][5]
-                 parts = []
-                 for update in updates:
-                     if isinstance(update, list) and len(update) > 2 and isinstance(update[2], str):
-                         parts.append(update[2])
-                     elif isinstance(update, list) and isinstance(update[1], list) and len(update[1]) > 4:
-                         if update[1][4] == "content":
-                             parts.append(update[2])
-                         elif update[1][4] == "options" and update[2] != "done":
-                             parts.append(str(update[2]))
-                     elif isinstance(update, dict):
-                         if update.get('type') == 'tool':
-                             parts.append(update.get('content', ''))
-                         elif update.get('type') == 'text':
-                             parts.append(update.get('content', ''))
-                 output = "\n".join([str(p) for p in parts if p])
-             else:
-                 output = data.get('output', {}).get('data', ["", "", "", "", "", [["", "", ""]]])[5][0][2]
-             message = ChatCompletionMessage(role="assistant", content=output)
-             choice = Choice(index=0, message=message, finish_reason="stop")
-             # Use count_tokens to compute usage
-             prompt_tokens = count_tokens([m.get('content', '') for m in payload['data'] if isinstance(m, dict) and 'content' in m or isinstance(m, str)])
-             completion_tokens = count_tokens(output)
-             usage = CompletionUsage(
-                 prompt_tokens=prompt_tokens,
-                 completion_tokens=completion_tokens,
-                 total_tokens=prompt_tokens + completion_tokens
-             )
-             completion = ChatCompletion(
-                 id=request_id,
-                 choices=[choice],
-                 created=created_time,
-                 model=model,
-                 usage=usage,
-             )
-             return completion
-         finally:
-             self._client.session.proxies = original_proxies
-
- class Chat(BaseChat):
-     def __init__(self, client: 'Qwen3'):
-         self.completions = Completions(client)
-
- class Qwen3(OpenAICompatibleProvider):
-     url = "https://qwen-qwen3-demo.hf.space"
-     api_endpoint = "https://qwen-qwen3-demo.hf.space/gradio_api/queue/join?__theme=system"
-     AVAILABLE_MODELS = [
-         "qwen3-235b-a22b",
-         "qwen3-32b",
-         "qwen3-30b-a3b",
-         "qwen3-14b",
-         "qwen3-8b",
-         "qwen3-4b",
-         "qwen3-1.7b",
-         "qwen3-0.6b",
-     ]
-     MODEL_ALIASES = {
-         "qwen-3-235b": "qwen3-235b-a22b",
-         "qwen-3-30b": "qwen3-30b-a3b",
-         "qwen-3-32b": "qwen3-32b",
-         "qwen-3-14b": "qwen3-14b",
-         "qwen-3-4b": "qwen3-4b",
-         "qwen-3-1.7b": "qwen3-1.7b",
-         "qwen-3-0.6b": "qwen3-0.6b"
-     }
-
-     def __init__(self):
-         self.timeout = 30
-         self.session = requests.Session()
-         self.session.proxies = {}
-         self.headers = {
-             'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64; rv:136.0) Gecko/20100101 Firefox/136.0',
-             'Accept': '*/*',
-             'Accept-Language': 'en-US,en;q=0.5',
-             'Accept-Encoding': 'gzip, deflate, br, zstd',
-             'Referer': f'{self.url}/?__theme=system',
-             'content-type': 'application/json',
-             'Origin': self.url,
-             'Connection': 'keep-alive',
-             'Sec-Fetch-Dest': 'empty',
-             'Sec-Fetch-Mode': 'cors',
-             'Sec-Fetch-Site': 'same-origin',
-             'Pragma': 'no-cache',
-             'Cache-Control': 'no-cache',
-         }
-         self.stream_headers = {
-             'Accept': 'text/event-stream',
-             'Accept-Language': 'en-US,en;q=0.5',
-             'Referer': f'{self.url}/?__theme=system',
-             'User-Agent': self.headers['User-Agent'],
-         }
-         self.session.headers.update(self.headers)
-         self.chat = Chat(self)
-
-     def get_model(self, model):
-         return self.MODEL_ALIASES.get(model, model)
-
-     @property
-     def models(self):
-         class _ModelList:
-             def list(inner_self):
-                 return type(self).AVAILABLE_MODELS
-         return _ModelList()
-
- if __name__ == "__main__":
-     client = Qwen3()
-     from rich import print
-     resp = client.chat.completions.create(
-         model="qwen3-14b",
-         messages=[
-             {"role": "system", "content": "You are a helpful assistant."},
-             {"role": "user", "content": "Hello "}
-         ],
-         stream=True
-     )
-     for chunk in resp:
+ import requests
+ import json
+ import time
+ import uuid
+ from typing import List, Dict, Optional, Union, Generator, Any
+
+ from webscout.Provider.OPENAI.base import OpenAICompatibleProvider, BaseChat, BaseCompletions
+ from webscout.Provider.OPENAI.utils import (
+     ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
+     ChatCompletionMessage, CompletionUsage,
+     get_last_user_message, get_system_prompt,
+     count_tokens
+ )
+
+ class Completions(BaseCompletions):
+     def __init__(self, client: 'Qwen3'):
+         self._client = client
+
+     def create(
+         self,
+         *,
+         model: str,
+         messages: List[Dict[str, str]],
+         max_tokens: Optional[int] = 2048,
+         stream: bool = False,
+         temperature: Optional[float] = None,
+         top_p: Optional[float] = None,
+         timeout: Optional[int] = None,
+         proxies: Optional[dict] = None,
+         **kwargs: Any
+     ) -> Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]:
+         payload = {
+             "data": [
+                 get_last_user_message(messages),
+                 {
+                     "thinking_budget": kwargs.get("thinking_budget", 38),
+                     "model": self._client.get_model(model),
+                     "sys_prompt": get_system_prompt(messages)
+                 },
+                 None, None
+             ],
+             "event_data": None,
+             "fn_index": 13,
+             "trigger_id": 31,
+             "session_hash": str(uuid.uuid4()).replace('-', '')
+         }
+
+         request_id = f"chatcmpl-{uuid.uuid4()}"
+         created_time = int(time.time())
+
+         if stream:
+             return self._create_stream(request_id, created_time, model, payload, timeout=timeout, proxies=proxies)
+         else:
+             return self._create_non_stream(request_id, created_time, model, payload, timeout=timeout, proxies=proxies)
+
+     def _create_stream(
+         self, request_id: str, created_time: int, model: str, payload: Dict[str, Any],
+         timeout: Optional[int] = None, proxies: Optional[dict] = None
+     ) -> Generator[ChatCompletionChunk, None, None]:
+         original_proxies = self._client.session.proxies.copy()
+         if proxies is not None:
+             self._client.session.proxies = proxies
+         else:
+             self._client.session.proxies = {}
+         try:
+             session = self._client.session
+             headers = self._client.headers
+             # Step 1: Join the queue
+             join_resp = session.post(self._client.api_endpoint, headers=headers, json=payload, timeout=timeout if timeout is not None else self._client.timeout)
+             join_resp.raise_for_status()
+             event_id = join_resp.json().get('event_id')
+             session_hash = payload["session_hash"]
+
+             # Step 2: Stream data
+             params = {'session_hash': session_hash}
+             stream_resp = session.get(self._client.url + "/gradio_api/queue/data", headers=self._client.stream_headers, params=params, stream=True, timeout=timeout if timeout is not None else self._client.timeout)
+             stream_resp.raise_for_status()
+
+             # --- New logic to yield all content, tool reasoning, and status, similar to Reasoning class ---
+             is_thinking_tag_open = False  # True if <think> has been yielded and not yet </think>
+
+             for line in stream_resp.iter_lines():
+                 if line:
+                     decoded_line = line.decode('utf-8')
+                     if decoded_line.startswith('data: '):
+                         try:
+                             json_data = json.loads(decoded_line[6:])
+                             if json_data.get('msg') == 'process_generating':
+                                 if 'output' in json_data and 'data' in json_data['output'] and len(json_data['output']['data']) > 5:
+                                     updates_list = json_data['output']['data'][5]  # This is a list of operations
+                                     for op_details in updates_list:
+                                         action = op_details[0]
+                                         path = op_details[1]
+                                         value = op_details[2]
+
+                                         content_to_yield = None
+                                         is_current_op_tool = False
+                                         is_current_op_text = False
+
+                                         # Case 1: Adding a new content block (tool or text object)
+                                         if action == "add" and isinstance(value, dict) and "type" in value:
+                                             if len(path) == 4 and path[0] == "value" and path[2] == "content":
+                                                 block_type = value.get("type")
+                                                 content_to_yield = value.get("content")
+                                                 if block_type == "tool":
+                                                     is_current_op_tool = True
+                                                 elif block_type == "text":
+                                                     is_current_op_text = True
+
+                                         # Case 2: Appending content string to an existing block
+                                         elif action == "append" and isinstance(value, str):
+                                             if len(path) == 5 and path[0] == "value" and path[2] == "content" and path[4] == "content":
+                                                 block_index = path[3]  # 0 for tool's content, 1 for text's content
+                                                 content_to_yield = value
+                                                 if block_index == 0:  # Appending to tool's content
+                                                     is_current_op_tool = True
+                                                 elif block_index == 1:  # Appending to text's content
+                                                     is_current_op_text = True
+
+                                         # Case 3: Tool status update (e.g., "End of Thought")
+                                         elif action == "replace" and len(path) == 6 and \
+                                                 path[0] == "value" and path[2] == "content" and \
+                                                 path[3] == 0 and path[4] == "options" and path[5] == "status":  # path[3]==0 ensures it's the tool block
+                                             if value == "done":  # Tool block processing is complete
+                                                 if is_thinking_tag_open:
+                                                     delta = ChoiceDelta(content="</think>\n\n", role="assistant")
+                                                     yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
+                                                     is_thinking_tag_open = False
+                                             continue  # This operation itself doesn't yield visible content
+
+                                         # Yielding logic
+                                         if is_current_op_tool and content_to_yield:
+                                             if not is_thinking_tag_open:
+                                                 delta = ChoiceDelta(content="<think>", role="assistant")
+                                                 yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
+                                                 is_thinking_tag_open = True
+
+                                             delta = ChoiceDelta(content=content_to_yield, role="assistant")
+                                             yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
+
+                                         elif is_current_op_text and content_to_yield:
+                                             if is_thinking_tag_open:  # If text starts, close any open thinking tag
+                                                 delta = ChoiceDelta(content="</think>", role="assistant")
+                                                 yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
+                                                 is_thinking_tag_open = False
+
+                                             delta = ChoiceDelta(content=content_to_yield, role="assistant")
+                                             yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
+
+                             if json_data.get('msg') == 'process_completed':
+                                 if is_thinking_tag_open:  # Ensure </think> is yielded if process completes mid-thought
+                                     delta = ChoiceDelta(content="</think>", role="assistant")
+                                     yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
+                                     is_thinking_tag_open = False
+                                 break
+                         except json.JSONDecodeError:
+                             continue
+                         except Exception as e:
+                             # Log or handle other potential exceptions
+                             continue
+
+             # After the loop, ensure the tag is closed if the stream broke for reasons other than 'process_completed'
+             if is_thinking_tag_open:
+                 delta = ChoiceDelta(content="</think>", role="assistant")
+                 yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
+         finally:
+             self._client.session.proxies = original_proxies
+
+     def _create_non_stream(
+         self, request_id: str, created_time: int, model: str, payload: Dict[str, Any],
+         timeout: Optional[int] = None, proxies: Optional[dict] = None
+     ) -> ChatCompletion:
+         original_proxies = self._client.session.proxies.copy()
+         if proxies is not None:
+             self._client.session.proxies = proxies
+         else:
+             self._client.session.proxies = {}
+         try:
+             # For non-streaming, just call the join endpoint and parse the result
+             session = self._client.session
+             headers = self._client.headers
+             resp = session.post(self._client.api_endpoint, headers=headers, json=payload, timeout=timeout if timeout is not None else self._client.timeout)
+             resp.raise_for_status()
+             data = resp.json()
+             # Return the full content as a single message, including all tool and text reasoning if present
+             output = ""
+             if 'output' in data and 'data' in data['output'] and len(data['output']['data']) > 5:
+                 updates = data['output']['data'][5]
+                 parts = []
+                 for update in updates:
+                     if isinstance(update, list) and len(update) > 2 and isinstance(update[2], str):
+                         parts.append(update[2])
+                     elif isinstance(update, list) and isinstance(update[1], list) and len(update[1]) > 4:
+                         if update[1][4] == "content":
+                             parts.append(update[2])
+                         elif update[1][4] == "options" and update[2] != "done":
+                             parts.append(str(update[2]))
+                     elif isinstance(update, dict):
+                         if update.get('type') == 'tool':
+                             parts.append(update.get('content', ''))
+                         elif update.get('type') == 'text':
+                             parts.append(update.get('content', ''))
+                 output = "\n".join([str(p) for p in parts if p])
+             else:
+                 output = data.get('output', {}).get('data', ["", "", "", "", "", [["", "", ""]]])[5][0][2]
+             message = ChatCompletionMessage(role="assistant", content=output)
+             choice = Choice(index=0, message=message, finish_reason="stop")
+             # Use count_tokens to compute usage
+             prompt_tokens = count_tokens([m.get('content', '') for m in payload['data'] if isinstance(m, dict) and 'content' in m or isinstance(m, str)])
+             completion_tokens = count_tokens(output)
+             usage = CompletionUsage(
+                 prompt_tokens=prompt_tokens,
+                 completion_tokens=completion_tokens,
+                 total_tokens=prompt_tokens + completion_tokens
+             )
+             completion = ChatCompletion(
+                 id=request_id,
+                 choices=[choice],
+                 created=created_time,
+                 model=model,
+                 usage=usage,
+             )
+             return completion
+         finally:
+             self._client.session.proxies = original_proxies
+
+ class Chat(BaseChat):
+     def __init__(self, client: 'Qwen3'):
+         self.completions = Completions(client)
+
+ class Qwen3(OpenAICompatibleProvider):
+     url = "https://qwen-qwen3-demo.hf.space"
+     api_endpoint = "https://qwen-qwen3-demo.hf.space/gradio_api/queue/join?__theme=system"
+     AVAILABLE_MODELS = [
+         "qwen3-235b-a22b",
+         "qwen3-32b",
+         "qwen3-30b-a3b",
+         "qwen3-14b",
+         "qwen3-8b",
+         "qwen3-4b",
+         "qwen3-1.7b",
+         "qwen3-0.6b",
+     ]
+     MODEL_ALIASES = {
+         "qwen-3-235b": "qwen3-235b-a22b",
+         "qwen-3-30b": "qwen3-30b-a3b",
+         "qwen-3-32b": "qwen3-32b",
+         "qwen-3-14b": "qwen3-14b",
+         "qwen-3-4b": "qwen3-4b",
+         "qwen-3-1.7b": "qwen3-1.7b",
+         "qwen-3-0.6b": "qwen3-0.6b"
+     }
+
+     def __init__(self):
+         self.timeout = 30
+         self.session = requests.Session()
+         self.session.proxies = {}
+         self.headers = {
+             'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64; rv:136.0) Gecko/20100101 Firefox/136.0',
+             'Accept': '*/*',
+             'Accept-Language': 'en-US,en;q=0.5',
+             'Accept-Encoding': 'gzip, deflate, br, zstd',
+             'Referer': f'{self.url}/?__theme=system',
+             'content-type': 'application/json',
+             'Origin': self.url,
+             'Connection': 'keep-alive',
+             'Sec-Fetch-Dest': 'empty',
+             'Sec-Fetch-Mode': 'cors',
+             'Sec-Fetch-Site': 'same-origin',
+             'Pragma': 'no-cache',
+             'Cache-Control': 'no-cache',
+         }
+         self.stream_headers = {
+             'Accept': 'text/event-stream',
+             'Accept-Language': 'en-US,en;q=0.5',
+             'Referer': f'{self.url}/?__theme=system',
+             'User-Agent': self.headers['User-Agent'],
+         }
+         self.session.headers.update(self.headers)
+         self.chat = Chat(self)
+
+     def get_model(self, model):
+         return self.MODEL_ALIASES.get(model, model)
+
+     @property
+     def models(self):
+         class _ModelList:
+             def list(inner_self):
+                 return type(self).AVAILABLE_MODELS
+         return _ModelList()
+
+ if __name__ == "__main__":
+     client = Qwen3()
+     from rich import print
+     resp = client.chat.completions.create(
+         model="qwen3-14b",
+         messages=[
+             {"role": "system", "content": "You are a helpful assistant."},
+             {"role": "user", "content": "Hello "}
+         ],
+         stream=True
+     )
+     for chunk in resp:
      print(chunk, end="", flush=True)
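
For readers unfamiliar with Gradio Spaces: the Qwen3 provider above does not call a conventional REST completion endpoint. It first POSTs its payload to the Space's queue-join endpoint, then opens a server-sent-events stream keyed by the same session_hash and parses the "data:" lines from it. The following is a minimal standalone sketch of that two-step protocol, using only values visible in the diff (endpoint paths, fn_index 13, trigger_id 31); error handling and the <think>-tag bookkeeping are omitted.

    # Sketch of the Gradio queue protocol used by the Qwen3 provider above.
    import json
    import uuid
    import requests

    url = "https://qwen-qwen3-demo.hf.space"
    session_hash = uuid.uuid4().hex  # same as str(uuid.uuid4()).replace('-', '')

    payload = {
        "data": [
            "Hello",  # last user message
            {"thinking_budget": 38, "model": "qwen3-14b", "sys_prompt": ""},
            None, None,
        ],
        "event_data": None,
        "fn_index": 13,
        "trigger_id": 31,
        "session_hash": session_hash,
    }

    # Step 1: join the queue; the response carries an event_id.
    join = requests.post(f"{url}/gradio_api/queue/join?__theme=system", json=payload, timeout=30)
    join.raise_for_status()

    # Step 2: read the SSE stream for this session until the job completes.
    stream = requests.get(
        f"{url}/gradio_api/queue/data",
        params={"session_hash": session_hash},
        stream=True,
        timeout=30,
    )
    for line in stream.iter_lines():
        if line and line.startswith(b"data: "):
            event = json.loads(line[6:])
            if event.get("msg") == "process_completed":
                break

The provider's _create_stream builds on exactly this loop, additionally translating the process_generating patch operations into OpenAI-style chunks.
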
@@ -65,6 +65,11 @@ Currently, the following providers are implemented with OpenAI-compatible interf
  - TwoAI
  - oivscode
  - Qwen3
+ - TogetherAI
+ - PiAI
+ - FalconH1
+ - XenAI
+ - GeminiProxy
  ---

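
Because the streaming path wraps tool reasoning in <think>...</think> markers, a caller that wants only the final answer has to strip them. Below is a hedged consumer sketch against the OpenAI-compatible interface the README hunk refers to, using the Qwen3 provider defined in this diff; it assumes the chunk objects expose choices[0].delta.content as attributes, which is how their constructors in the diff suggest they are read.

    # Hedged sketch: separate <think> reasoning from the visible answer when
    # consuming the Qwen3 provider's stream.
    import re
    from webscout.Provider.OPENAI.Qwen3 import Qwen3

    client = Qwen3()
    resp = client.chat.completions.create(
        model="qwen3-14b",
        messages=[
            {"role": "system", "content": "You are a helpful assistant."},
            {"role": "user", "content": "Hello"},
        ],
        stream=True,
    )

    # Concatenate the streamed deltas, then drop the <think> block.
    text = "".join(chunk.choices[0].delta.content or "" for chunk in resp)
    answer = re.sub(r"<think>.*?</think>", "", text, flags=re.DOTALL).strip()
    print(answer)

The same pattern should apply to the providers added in this release (TogetherAI, XenAI, GeminiProxy, and the rest), since the README lists them under the same OpenAI-compatible interface.
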