webscout 8.2.8__py3-none-any.whl → 8.2.9__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- webscout/AIauto.py +32 -14
- webscout/AIbase.py +96 -37
- webscout/AIutel.py +491 -87
- webscout/Bard.py +441 -323
- webscout/Extra/GitToolkit/__init__.py +10 -10
- webscout/Extra/YTToolkit/ytapi/video.py +232 -232
- webscout/Litlogger/README.md +10 -0
- webscout/Litlogger/__init__.py +7 -59
- webscout/Litlogger/formats.py +4 -0
- webscout/Litlogger/handlers.py +103 -0
- webscout/Litlogger/levels.py +13 -0
- webscout/Litlogger/logger.py +92 -0
- webscout/Provider/AISEARCH/Perplexity.py +332 -358
- webscout/Provider/AISEARCH/felo_search.py +9 -35
- webscout/Provider/AISEARCH/genspark_search.py +30 -56
- webscout/Provider/AISEARCH/hika_search.py +4 -16
- webscout/Provider/AISEARCH/iask_search.py +410 -436
- webscout/Provider/AISEARCH/monica_search.py +4 -30
- webscout/Provider/AISEARCH/scira_search.py +6 -32
- webscout/Provider/AISEARCH/webpilotai_search.py +38 -64
- webscout/Provider/Blackboxai.py +153 -35
- webscout/Provider/Deepinfra.py +339 -339
- webscout/Provider/ExaChat.py +358 -358
- webscout/Provider/Gemini.py +169 -169
- webscout/Provider/GithubChat.py +1 -2
- webscout/Provider/Glider.py +3 -3
- webscout/Provider/HeckAI.py +171 -81
- webscout/Provider/OPENAI/BLACKBOXAI.py +766 -735
- webscout/Provider/OPENAI/Cloudflare.py +7 -7
- webscout/Provider/OPENAI/FreeGemini.py +6 -5
- webscout/Provider/OPENAI/NEMOTRON.py +8 -20
- webscout/Provider/OPENAI/Qwen3.py +283 -0
- webscout/Provider/OPENAI/README.md +952 -1253
- webscout/Provider/OPENAI/TwoAI.py +357 -0
- webscout/Provider/OPENAI/__init__.py +5 -1
- webscout/Provider/OPENAI/ai4chat.py +40 -40
- webscout/Provider/OPENAI/api.py +808 -649
- webscout/Provider/OPENAI/c4ai.py +3 -3
- webscout/Provider/OPENAI/chatgpt.py +555 -555
- webscout/Provider/OPENAI/chatgptclone.py +493 -487
- webscout/Provider/OPENAI/chatsandbox.py +4 -3
- webscout/Provider/OPENAI/copilot.py +242 -0
- webscout/Provider/OPENAI/deepinfra.py +5 -2
- webscout/Provider/OPENAI/e2b.py +63 -5
- webscout/Provider/OPENAI/exaai.py +416 -410
- webscout/Provider/OPENAI/exachat.py +444 -443
- webscout/Provider/OPENAI/freeaichat.py +2 -2
- webscout/Provider/OPENAI/glider.py +5 -2
- webscout/Provider/OPENAI/groq.py +5 -2
- webscout/Provider/OPENAI/heckai.py +308 -307
- webscout/Provider/OPENAI/mcpcore.py +8 -2
- webscout/Provider/OPENAI/multichat.py +4 -4
- webscout/Provider/OPENAI/netwrck.py +6 -5
- webscout/Provider/OPENAI/oivscode.py +287 -0
- webscout/Provider/OPENAI/opkfc.py +496 -496
- webscout/Provider/OPENAI/pydantic_imports.py +172 -0
- webscout/Provider/OPENAI/scirachat.py +15 -9
- webscout/Provider/OPENAI/sonus.py +304 -303
- webscout/Provider/OPENAI/standardinput.py +433 -433
- webscout/Provider/OPENAI/textpollinations.py +4 -4
- webscout/Provider/OPENAI/toolbaz.py +413 -413
- webscout/Provider/OPENAI/typefully.py +3 -3
- webscout/Provider/OPENAI/typegpt.py +11 -5
- webscout/Provider/OPENAI/uncovrAI.py +463 -462
- webscout/Provider/OPENAI/utils.py +90 -79
- webscout/Provider/OPENAI/venice.py +431 -425
- webscout/Provider/OPENAI/wisecat.py +387 -381
- webscout/Provider/OPENAI/writecream.py +3 -3
- webscout/Provider/OPENAI/x0gpt.py +365 -378
- webscout/Provider/OPENAI/yep.py +39 -13
- webscout/Provider/TTI/README.md +55 -101
- webscout/Provider/TTI/__init__.py +4 -9
- webscout/Provider/TTI/aiarta.py +365 -0
- webscout/Provider/TTI/artbit.py +0 -0
- webscout/Provider/TTI/base.py +64 -0
- webscout/Provider/TTI/fastflux.py +200 -0
- webscout/Provider/TTI/magicstudio.py +201 -0
- webscout/Provider/TTI/piclumen.py +203 -0
- webscout/Provider/TTI/pixelmuse.py +225 -0
- webscout/Provider/TTI/pollinations.py +221 -0
- webscout/Provider/TTI/utils.py +11 -0
- webscout/Provider/TTS/__init__.py +2 -1
- webscout/Provider/TTS/base.py +159 -159
- webscout/Provider/TTS/openai_fm.py +129 -0
- webscout/Provider/TextPollinationsAI.py +308 -308
- webscout/Provider/TwoAI.py +239 -44
- webscout/Provider/UNFINISHED/Youchat.py +330 -330
- webscout/Provider/UNFINISHED/puterjs.py +635 -0
- webscout/Provider/UNFINISHED/test_lmarena.py +119 -119
- webscout/Provider/Writecream.py +246 -246
- webscout/Provider/__init__.py +2 -0
- webscout/Provider/ai4chat.py +33 -8
- webscout/Provider/koala.py +169 -169
- webscout/Provider/oivscode.py +309 -0
- webscout/Provider/samurai.py +3 -2
- webscout/Provider/typegpt.py +3 -3
- webscout/Provider/uncovr.py +368 -368
- webscout/client.py +70 -0
- webscout/litprinter/__init__.py +58 -58
- webscout/optimizers.py +419 -419
- webscout/scout/README.md +3 -1
- webscout/scout/core/crawler.py +134 -64
- webscout/scout/core/scout.py +148 -109
- webscout/scout/element.py +106 -88
- webscout/swiftcli/Readme.md +323 -323
- webscout/swiftcli/plugins/manager.py +9 -2
- webscout/version.py +1 -1
- webscout/zeroart/__init__.py +134 -134
- webscout/zeroart/effects.py +100 -100
- webscout/zeroart/fonts.py +1238 -1238
- {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/METADATA +159 -35
- {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/RECORD +116 -161
- {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/WHEEL +1 -1
- {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/entry_points.txt +1 -0
- webscout/Litlogger/Readme.md +0 -175
- webscout/Litlogger/core/__init__.py +0 -6
- webscout/Litlogger/core/level.py +0 -23
- webscout/Litlogger/core/logger.py +0 -165
- webscout/Litlogger/handlers/__init__.py +0 -12
- webscout/Litlogger/handlers/console.py +0 -33
- webscout/Litlogger/handlers/file.py +0 -143
- webscout/Litlogger/handlers/network.py +0 -173
- webscout/Litlogger/styles/__init__.py +0 -7
- webscout/Litlogger/styles/colors.py +0 -249
- webscout/Litlogger/styles/formats.py +0 -458
- webscout/Litlogger/styles/text.py +0 -87
- webscout/Litlogger/utils/__init__.py +0 -6
- webscout/Litlogger/utils/detectors.py +0 -153
- webscout/Litlogger/utils/formatters.py +0 -200
- webscout/Provider/TTI/AiForce/README.md +0 -159
- webscout/Provider/TTI/AiForce/__init__.py +0 -22
- webscout/Provider/TTI/AiForce/async_aiforce.py +0 -224
- webscout/Provider/TTI/AiForce/sync_aiforce.py +0 -245
- webscout/Provider/TTI/FreeAIPlayground/README.md +0 -99
- webscout/Provider/TTI/FreeAIPlayground/__init__.py +0 -9
- webscout/Provider/TTI/FreeAIPlayground/async_freeaiplayground.py +0 -181
- webscout/Provider/TTI/FreeAIPlayground/sync_freeaiplayground.py +0 -180
- webscout/Provider/TTI/ImgSys/README.md +0 -174
- webscout/Provider/TTI/ImgSys/__init__.py +0 -23
- webscout/Provider/TTI/ImgSys/async_imgsys.py +0 -202
- webscout/Provider/TTI/ImgSys/sync_imgsys.py +0 -195
- webscout/Provider/TTI/MagicStudio/README.md +0 -101
- webscout/Provider/TTI/MagicStudio/__init__.py +0 -2
- webscout/Provider/TTI/MagicStudio/async_magicstudio.py +0 -111
- webscout/Provider/TTI/MagicStudio/sync_magicstudio.py +0 -109
- webscout/Provider/TTI/Nexra/README.md +0 -155
- webscout/Provider/TTI/Nexra/__init__.py +0 -22
- webscout/Provider/TTI/Nexra/async_nexra.py +0 -286
- webscout/Provider/TTI/Nexra/sync_nexra.py +0 -258
- webscout/Provider/TTI/PollinationsAI/README.md +0 -146
- webscout/Provider/TTI/PollinationsAI/__init__.py +0 -23
- webscout/Provider/TTI/PollinationsAI/async_pollinations.py +0 -311
- webscout/Provider/TTI/PollinationsAI/sync_pollinations.py +0 -265
- webscout/Provider/TTI/aiarta/README.md +0 -134
- webscout/Provider/TTI/aiarta/__init__.py +0 -2
- webscout/Provider/TTI/aiarta/async_aiarta.py +0 -482
- webscout/Provider/TTI/aiarta/sync_aiarta.py +0 -440
- webscout/Provider/TTI/artbit/README.md +0 -100
- webscout/Provider/TTI/artbit/__init__.py +0 -22
- webscout/Provider/TTI/artbit/async_artbit.py +0 -155
- webscout/Provider/TTI/artbit/sync_artbit.py +0 -148
- webscout/Provider/TTI/fastflux/README.md +0 -129
- webscout/Provider/TTI/fastflux/__init__.py +0 -22
- webscout/Provider/TTI/fastflux/async_fastflux.py +0 -261
- webscout/Provider/TTI/fastflux/sync_fastflux.py +0 -252
- webscout/Provider/TTI/huggingface/README.md +0 -114
- webscout/Provider/TTI/huggingface/__init__.py +0 -22
- webscout/Provider/TTI/huggingface/async_huggingface.py +0 -199
- webscout/Provider/TTI/huggingface/sync_huggingface.py +0 -195
- webscout/Provider/TTI/piclumen/README.md +0 -161
- webscout/Provider/TTI/piclumen/__init__.py +0 -23
- webscout/Provider/TTI/piclumen/async_piclumen.py +0 -268
- webscout/Provider/TTI/piclumen/sync_piclumen.py +0 -233
- webscout/Provider/TTI/pixelmuse/README.md +0 -79
- webscout/Provider/TTI/pixelmuse/__init__.py +0 -4
- webscout/Provider/TTI/pixelmuse/async_pixelmuse.py +0 -249
- webscout/Provider/TTI/pixelmuse/sync_pixelmuse.py +0 -182
- webscout/Provider/TTI/talkai/README.md +0 -139
- webscout/Provider/TTI/talkai/__init__.py +0 -4
- webscout/Provider/TTI/talkai/async_talkai.py +0 -229
- webscout/Provider/TTI/talkai/sync_talkai.py +0 -207
- webscout/Provider/UNFINISHED/oivscode.py +0 -351
- {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/licenses/LICENSE.md +0 -0
- {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/top_level.txt +0 -0
|
@@ -12,7 +12,7 @@ from uuid import uuid4
|
|
|
12
12
|
from .base import OpenAICompatibleProvider, BaseChat, BaseCompletions
|
|
13
13
|
from .utils import (
|
|
14
14
|
ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
|
|
15
|
-
ChatCompletionMessage, CompletionUsage
|
|
15
|
+
ChatCompletionMessage, CompletionUsage, count_tokens
|
|
16
16
|
)
|
|
17
17
|
|
|
18
18
|
from webscout.AIutel import sanitize_stream
|
|
@@ -123,9 +123,9 @@ class Completions(BaseCompletions):
|
|
|
123
123
|
delta = ChoiceDelta(content=content_chunk)
|
|
124
124
|
choice = Choice(index=0, delta=delta, finish_reason=None)
|
|
125
125
|
|
|
126
|
-
# Estimate token usage
|
|
127
|
-
prompt_tokens =
|
|
128
|
-
completion_tokens =
|
|
126
|
+
# Estimate token usage using count_tokens
|
|
127
|
+
prompt_tokens = count_tokens([msg.get("content", "") for msg in payload["messages"]])
|
|
128
|
+
completion_tokens = count_tokens(accumulated_content)
|
|
129
129
|
|
|
130
130
|
chunk = ChatCompletionChunk(
|
|
131
131
|
id=request_id,
|
|
@@ -202,9 +202,9 @@ class Completions(BaseCompletions):
|
|
|
202
202
|
finish_reason="stop"
|
|
203
203
|
)
|
|
204
204
|
|
|
205
|
-
# Estimate token usage
|
|
206
|
-
prompt_tokens =
|
|
207
|
-
completion_tokens =
|
|
205
|
+
# Estimate token usage using count_tokens
|
|
206
|
+
prompt_tokens = count_tokens([msg.get("content", "") for msg in payload["messages"]])
|
|
207
|
+
completion_tokens = count_tokens(full_content)
|
|
208
208
|
usage = CompletionUsage(
|
|
209
209
|
prompt_tokens=prompt_tokens,
|
|
210
210
|
completion_tokens=completion_tokens,
|
|
@@ -22,7 +22,8 @@ from webscout.Provider.OPENAI.utils import (
|
|
|
22
22
|
ChoiceDelta,
|
|
23
23
|
CompletionUsage,
|
|
24
24
|
format_prompt,
|
|
25
|
-
get_system_prompt
|
|
25
|
+
get_system_prompt,
|
|
26
|
+
count_tokens
|
|
26
27
|
)
|
|
27
28
|
|
|
28
29
|
# ANSI escape codes for formatting
|
|
@@ -100,7 +101,7 @@ class Completions(BaseCompletions):
|
|
|
100
101
|
for text_chunk in processed_stream:
|
|
101
102
|
if text_chunk and isinstance(text_chunk, str):
|
|
102
103
|
streaming_text += text_chunk
|
|
103
|
-
completion_tokens +=
|
|
104
|
+
completion_tokens += count_tokens(text_chunk)
|
|
104
105
|
|
|
105
106
|
delta = ChoiceDelta(content=text_chunk, role="assistant")
|
|
106
107
|
choice = Choice(index=0, delta=delta, finish_reason=None)
|
|
@@ -160,9 +161,9 @@ class Completions(BaseCompletions):
|
|
|
160
161
|
# Skip invalid JSON
|
|
161
162
|
pass
|
|
162
163
|
|
|
163
|
-
# Create usage statistics
|
|
164
|
-
prompt_tokens =
|
|
165
|
-
completion_tokens =
|
|
164
|
+
# Create usage statistics using count_tokens
|
|
165
|
+
prompt_tokens = count_tokens(str(payload))
|
|
166
|
+
completion_tokens = count_tokens(full_text_response)
|
|
166
167
|
total_tokens = prompt_tokens + completion_tokens
|
|
167
168
|
|
|
168
169
|
usage = CompletionUsage(
|
|
@@ -9,7 +9,7 @@ from typing import List, Dict, Optional, Union, Generator, Any
|
|
|
9
9
|
from webscout.Provider.OPENAI.base import OpenAICompatibleProvider, BaseChat, BaseCompletions
|
|
10
10
|
from webscout.Provider.OPENAI.utils import (
|
|
11
11
|
ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
|
|
12
|
-
ChatCompletionMessage, CompletionUsage, format_prompt
|
|
12
|
+
ChatCompletionMessage, CompletionUsage, format_prompt, count_tokens
|
|
13
13
|
)
|
|
14
14
|
try:
|
|
15
15
|
from webscout.litagent import LitAgent
|
|
@@ -89,8 +89,8 @@ class Completions(BaseCompletions):
|
|
|
89
89
|
pass
|
|
90
90
|
message = ChatCompletionMessage(role="assistant", content=full_response_content)
|
|
91
91
|
choice = Choice(index=0, message=message, finish_reason="stop")
|
|
92
|
-
prompt_tokens =
|
|
93
|
-
completion_tokens =
|
|
92
|
+
prompt_tokens = count_tokens(payload.get("content", ""))
|
|
93
|
+
completion_tokens = count_tokens(full_response_content)
|
|
94
94
|
usage = CompletionUsage(
|
|
95
95
|
prompt_tokens=prompt_tokens,
|
|
96
96
|
completion_tokens=completion_tokens,
|
|
@@ -111,16 +111,10 @@ class Chat(BaseChat):
|
|
|
111
111
|
|
|
112
112
|
class NEMOTRON(OpenAICompatibleProvider):
|
|
113
113
|
AVAILABLE_MODELS = [
|
|
114
|
-
"
|
|
115
|
-
"
|
|
114
|
+
"gpt4o",
|
|
115
|
+
"nemotron70b",
|
|
116
116
|
]
|
|
117
117
|
|
|
118
|
-
# Model mapping for payload
|
|
119
|
-
MODEL_PAYLOAD_MAPPING = {
|
|
120
|
-
"NEMOTRON/gpt4o": "gpt4o",
|
|
121
|
-
"NEMOTRON/nemotron70b": "nemotron70b",
|
|
122
|
-
}
|
|
123
|
-
|
|
124
118
|
API_BASE_URL = "https://nemotron.one/api/chat"
|
|
125
119
|
def __init__(
|
|
126
120
|
self,
|
|
@@ -183,18 +177,12 @@ class NEMOTRON(OpenAICompatibleProvider):
|
|
|
183
177
|
Returns:
|
|
184
178
|
NEMOTRON model name for API payload
|
|
185
179
|
"""
|
|
186
|
-
#
|
|
187
|
-
if model_alias.
|
|
188
|
-
base_model = model_alias.split("/")[1]
|
|
189
|
-
if base_model in ["gpt4o", "nemotron70b"]:
|
|
190
|
-
return base_model
|
|
191
|
-
|
|
192
|
-
# Handle direct model names
|
|
193
|
-
if model_alias in ["gpt4o", "nemotron70b"]:
|
|
180
|
+
# Accept only direct model names
|
|
181
|
+
if model_alias in self.AVAILABLE_MODELS:
|
|
194
182
|
return model_alias
|
|
195
183
|
|
|
196
184
|
# Case-insensitive matching
|
|
197
|
-
for m in
|
|
185
|
+
for m in self.AVAILABLE_MODELS:
|
|
198
186
|
if m.lower() == model_alias.lower():
|
|
199
187
|
return m
|
|
200
188
|
|
|
@@ -0,0 +1,283 @@
|
|
|
1
|
+
import requests
|
|
2
|
+
import json
|
|
3
|
+
import time
|
|
4
|
+
import uuid
|
|
5
|
+
from typing import List, Dict, Optional, Union, Generator, Any
|
|
6
|
+
|
|
7
|
+
from webscout.Provider.OPENAI.base import OpenAICompatibleProvider, BaseChat, BaseCompletions
|
|
8
|
+
from webscout.Provider.OPENAI.utils import (
|
|
9
|
+
ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
|
|
10
|
+
ChatCompletionMessage, CompletionUsage,
|
|
11
|
+
get_last_user_message, get_system_prompt,
|
|
12
|
+
count_tokens
|
|
13
|
+
)
|
|
14
|
+
|
|
15
|
+
class Completions(BaseCompletions):
    """OpenAI-style ``chat.completions`` endpoint backed by the Qwen3 Gradio demo.

    Requests are POSTed to the client's ``api_endpoint`` (the Gradio queue
    ``join`` URL).  In streaming mode the incremental results are then read
    from ``<client.url>/gradio_api/queue/data`` as ``data: ``-prefixed lines.
    """

    def __init__(self, client: 'Qwen3'):
        """Keep a reference to the owning client (session, headers, URLs, timeout)."""
        self._client = client

    def create(
        self,
        *,
        model: str,
        messages: List[Dict[str, str]],
        max_tokens: Optional[int] = 2048,
        stream: bool = False,
        temperature: Optional[float] = None,
        top_p: Optional[float] = None,
        **kwargs: Any
    ) -> Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]:
        """Build the Gradio payload and dispatch to the streaming or blocking path.

        Args:
            model: Model name or alias; resolved through ``client.get_model``.
            messages: Chat history.  Only the last user message and the system
                prompt (as extracted by the imported helpers) are sent.
            max_tokens, temperature, top_p: Accepted for signature
                compatibility; they are not included in the payload built here.
            stream: When true, return a generator of ``ChatCompletionChunk``.
            **kwargs: ``thinking_budget`` is honoured (default 38); any other
                keyword is ignored.

        Returns:
            A ``ChatCompletion`` or, when ``stream`` is true, a generator of
            ``ChatCompletionChunk`` objects.
        """
        payload = {
            "data": [
                get_last_user_message(messages),
                {
                    "thinking_budget": kwargs.get("thinking_budget", 38),
                    "model": self._client.get_model(model),
                    "sys_prompt": get_system_prompt(messages)
                },
                None, None
            ],
            "event_data": None,
            # NOTE(review): fn_index / trigger_id presumably identify the demo's
            # chat handler inside the Gradio app -- confirm against the space config.
            "fn_index": 13,
            "trigger_id": 31,
            "session_hash": str(uuid.uuid4()).replace('-', '')
        }

        request_id = f"chatcmpl-{uuid.uuid4()}"
        created_time = int(time.time())

        if stream:
            return self._create_stream(request_id, created_time, model, payload)
        else:
            return self._create_non_stream(request_id, created_time, model, payload)

    @staticmethod
    def _classify_op(op_details):
        """Classify one ``[action, path, value]`` patch operation.

        Returns a ``(kind, content)`` pair where ``kind`` is ``"tool"``,
        ``"text"``, ``"tool_done"`` or ``None`` (nothing to emit).  Malformed
        operations raise ``IndexError``/``TypeError``; the caller treats those
        as "skip this event".
        """
        action, path, value = op_details[0], op_details[1], op_details[2]

        # Case 1: a new content block (tool or text object) is added.
        if action == "add" and isinstance(value, dict) and "type" in value:
            if len(path) == 4 and path[0] == "value" and path[2] == "content":
                block_type = value.get("type")
                if block_type in ("tool", "text"):
                    return block_type, value.get("content")
            return None, None

        # Case 2: a string is appended to an existing block's content.
        if action == "append" and isinstance(value, str):
            if len(path) == 5 and path[0] == "value" and path[2] == "content" and path[4] == "content":
                block_index = path[3]  # 0 -> tool block, 1 -> text block
                if block_index == 0:
                    return "tool", value
                if block_index == 1:
                    return "text", value
            return None, None

        # Case 3: status update on the tool block (path[3] == 0); "done" ends the thought.
        if (
            action == "replace" and len(path) == 6
            and path[0] == "value" and path[2] == "content"
            and path[3] == 0 and path[4] == "options" and path[5] == "status"
        ):
            if value == "done":
                return "tool_done", None

        return None, None

    def _create_stream(
        self, request_id: str, created_time: int, model: str, payload: Dict[str, Any]
    ) -> Generator[ChatCompletionChunk, None, None]:
        """Join the queue, then yield chunks as the server streams patch operations.

        Tool-block content is wrapped in ``<think>`` ... ``</think>`` markers;
        text-block content is yielded as-is.  The closing marker is always
        emitted if the stream ends while a thought is still open.

        Raises:
            requests.HTTPError: if either HTTP request returns an error status.
        """
        session = self._client.session

        # Step 1: join the queue.
        join_resp = session.post(
            self._client.api_endpoint,
            headers=self._client.headers,
            json=payload,
            timeout=self._client.timeout,
        )
        join_resp.raise_for_status()

        # Step 2: open the event stream for the same session hash.
        stream_resp = session.get(
            self._client.url + "/gradio_api/queue/data",
            headers=self._client.stream_headers,
            params={'session_hash': payload["session_hash"]},
            stream=True,
            timeout=self._client.timeout,
        )

        def make_chunk(text):
            delta = ChoiceDelta(content=text, role="assistant")
            return ChatCompletionChunk(
                id=request_id,
                choices=[Choice(index=0, delta=delta)],
                created=created_time,
                model=model,
            )

        is_thinking_tag_open = False  # True between a yielded <think> and its </think>

        try:
            stream_resp.raise_for_status()
            for raw_line in stream_resp.iter_lines():
                if not raw_line:
                    continue
                decoded_line = raw_line.decode('utf-8')
                if not decoded_line.startswith('data: '):
                    continue
                try:
                    event = json.loads(decoded_line[6:])
                    msg = event.get('msg')
                    if msg == 'process_generating':
                        if 'output' in event and 'data' in event['output'] and len(event['output']['data']) > 5:
                            # Element 5 holds the list of patch operations.
                            for op_details in event['output']['data'][5]:
                                kind, content = self._classify_op(op_details)

                                if kind == "tool_done":
                                    if is_thinking_tag_open:
                                        yield make_chunk("</think>\n\n")
                                        is_thinking_tag_open = False
                                    continue

                                if not content:
                                    continue

                                if kind == "tool":
                                    if not is_thinking_tag_open:
                                        yield make_chunk("<think>")
                                        is_thinking_tag_open = True
                                    yield make_chunk(content)
                                elif kind == "text":
                                    # Text starting implies the thought is over.
                                    if is_thinking_tag_open:
                                        yield make_chunk("</think>")
                                        is_thinking_tag_open = False
                                    yield make_chunk(content)
                    elif msg == 'process_completed':
                        break
                except (ValueError, LookupError, TypeError, AttributeError):
                    # Best effort: an undecodable or unexpectedly shaped event
                    # is skipped rather than aborting the whole stream.
                    continue
        finally:
            # Release the connection even if the consumer stops iterating early.
            stream_resp.close()

        # Close a thought left open by completion or by the stream simply ending.
        if is_thinking_tag_open:
            yield make_chunk("</think>")

    @staticmethod
    def _extract_output_text(data):
        """Collect textual pieces from ``data['output']['data'][5]``; "" if absent."""
        output_block = data.get('output') if isinstance(data, dict) else None
        if not isinstance(output_block, dict):
            return ""
        output_data = output_block.get('data')
        if not isinstance(output_data, (list, tuple)) or len(output_data) <= 5:
            return ""
        updates = output_data[5]
        if not isinstance(updates, list):
            return ""

        parts = []
        for update in updates:
            if isinstance(update, list):
                if len(update) < 3:
                    continue  # no value slot to read
                path, value = update[1], update[2]
                if isinstance(value, str):
                    parts.append(value)
                elif isinstance(path, list) and len(path) > 4:
                    if path[4] == "content":
                        parts.append(value)
                    elif path[4] == "options" and value != "done":
                        parts.append(str(value))
            elif isinstance(update, dict):
                if update.get('type') in ('tool', 'text'):
                    parts.append(update.get('content', ''))
        return "\n".join([str(p) for p in parts if p])

    @staticmethod
    def _prompt_texts(payload):
        """Return the strings in ``payload['data']`` that count as prompt text."""
        texts = []
        for item in payload['data']:
            if isinstance(item, str):
                texts.append(item)
            elif isinstance(item, dict) and 'content' in item:
                texts.append(item.get('content', ''))
        return texts

    def _create_non_stream(
        self, request_id: str, created_time: int, model: str, payload: Dict[str, Any]
    ) -> ChatCompletion:
        """POST to the join endpoint once and wrap whatever text it returns.

        NOTE(review): only the join response is parsed here; if the service
        delivers results exclusively through the event stream, ``content`` will
        be empty -- confirm against the live API.

        Raises:
            requests.HTTPError: if the request returns an error status.
        """
        session = self._client.session
        resp = session.post(
            self._client.api_endpoint,
            headers=self._client.headers,
            json=payload,
            timeout=self._client.timeout,
        )
        resp.raise_for_status()
        output = self._extract_output_text(resp.json())

        message = ChatCompletionMessage(role="assistant", content=output)
        choice = Choice(index=0, message=message, finish_reason="stop")

        # Estimate usage with count_tokens.
        prompt_tokens = count_tokens(self._prompt_texts(payload))
        completion_tokens = count_tokens(output)
        usage = CompletionUsage(
            prompt_tokens=prompt_tokens,
            completion_tokens=completion_tokens,
            total_tokens=prompt_tokens + completion_tokens
        )
        return ChatCompletion(
            id=request_id,
            choices=[choice],
            created=created_time,
            model=model,
            usage=usage,
        )
|
|
206
|
+
|
|
207
|
+
class Chat(BaseChat):
    """Container that exposes a ``completions`` handler for a Qwen3 client."""

    def __init__(self, client: 'Qwen3'):
        """Create the ``Completions`` handler bound to *client*."""
        handler = Completions(client)
        self.completions = handler
|
|
210
|
+
|
|
211
|
+
class Qwen3(OpenAICompatibleProvider):
    """Client for the Qwen3 demo hosted as a Hugging Face Gradio space.

    Holds the HTTP session, the request headers and the model catalogue, and
    exposes the chat interface as ``client.chat.completions.create(...)``.
    """

    url = "https://qwen-qwen3-demo.hf.space"
    api_endpoint = "https://qwen-qwen3-demo.hf.space/gradio_api/queue/join?__theme=system"
    AVAILABLE_MODELS = [
        "qwen3-235b-a22b",
        "qwen3-32b",
        "qwen3-30b-a3b",
        "qwen3-14b",
        "qwen3-8b",
        "qwen3-4b",
        "qwen3-1.7b",
        "qwen3-0.6b",
    ]
    # Friendly ``qwen-3-*`` spellings mapped onto the names in AVAILABLE_MODELS.
    MODEL_ALIASES = {
        "qwen-3-235b": "qwen3-235b-a22b",
        "qwen-3-30b": "qwen3-30b-a3b",
        "qwen-3-32b": "qwen3-32b",
        "qwen-3-14b": "qwen3-14b",
        "qwen-3-8b": "qwen3-8b",  # previously the only listed model without an alias
        "qwen-3-4b": "qwen3-4b",
        "qwen-3-1.7b": "qwen3-1.7b",
        "qwen-3-0.6b": "qwen3-0.6b"
    }

    def __init__(self, timeout: Optional[int] = None):
        """Create the session and header sets used by the completions handler.

        Args:
            timeout: Passed unchanged as ``timeout=`` to every request; with
                ``None`` the requests library applies no time limit.
        """
        self.timeout = timeout
        self.session = requests.Session()
        # Headers for the JSON POST that joins the queue.
        # NOTE(review): 'br' and 'zstd' are advertised in Accept-Encoding;
        # confirm the runtime has decoders for them installed.
        self.headers = {
            'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64; rv:136.0) Gecko/20100101 Firefox/136.0',
            'Accept': '*/*',
            'Accept-Language': 'en-US,en;q=0.5',
            'Accept-Encoding': 'gzip, deflate, br, zstd',
            'Referer': f'{self.url}/?__theme=system',
            'content-type': 'application/json',
            'Origin': self.url,
            'Connection': 'keep-alive',
            'Sec-Fetch-Dest': 'empty',
            'Sec-Fetch-Mode': 'cors',
            'Sec-Fetch-Site': 'same-origin',
            'Pragma': 'no-cache',
            'Cache-Control': 'no-cache',
        }
        # Headers for the GET that reads the event stream.
        self.stream_headers = {
            'Accept': 'text/event-stream',
            'Accept-Language': 'en-US,en;q=0.5',
            'Referer': f'{self.url}/?__theme=system',
            'User-Agent': self.headers['User-Agent'],
        }
        self.session.headers.update(self.headers)
        self.chat = Chat(self)

    def get_model(self, model):
        """Resolve an alias to its model name; unknown names pass through unchanged."""
        return self.MODEL_ALIASES.get(model, model)

    @property
    def models(self):
        """Return an object whose ``list()`` yields ``AVAILABLE_MODELS``."""
        class _ModelList:
            def list(inner_self):
                return type(self).AVAILABLE_MODELS
        return _ModelList()
|
|
270
|
+
|
|
271
|
+
if __name__ == "__main__":
    # Manual smoke test: stream one short conversation and print each chunk.
    from rich import print

    demo_messages = [
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "Hello "},
    ]
    client = Qwen3()
    chunk_stream = client.chat.completions.create(
        model="qwen3-14b",
        messages=demo_messages,
        stream=True,
    )
    for chunk in chunk_stream:
        print(chunk, end="", flush=True)
|