webscout 8.2.8__py3-none-any.whl → 8.2.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (184)
  1. webscout/AIauto.py +32 -14
  2. webscout/AIbase.py +96 -37
  3. webscout/AIutel.py +491 -87
  4. webscout/Bard.py +441 -323
  5. webscout/Extra/GitToolkit/__init__.py +10 -10
  6. webscout/Extra/YTToolkit/ytapi/video.py +232 -232
  7. webscout/Litlogger/README.md +10 -0
  8. webscout/Litlogger/__init__.py +7 -59
  9. webscout/Litlogger/formats.py +4 -0
  10. webscout/Litlogger/handlers.py +103 -0
  11. webscout/Litlogger/levels.py +13 -0
  12. webscout/Litlogger/logger.py +92 -0
  13. webscout/Provider/AISEARCH/Perplexity.py +332 -358
  14. webscout/Provider/AISEARCH/felo_search.py +9 -35
  15. webscout/Provider/AISEARCH/genspark_search.py +30 -56
  16. webscout/Provider/AISEARCH/hika_search.py +4 -16
  17. webscout/Provider/AISEARCH/iask_search.py +410 -436
  18. webscout/Provider/AISEARCH/monica_search.py +4 -30
  19. webscout/Provider/AISEARCH/scira_search.py +6 -32
  20. webscout/Provider/AISEARCH/webpilotai_search.py +38 -64
  21. webscout/Provider/Blackboxai.py +153 -35
  22. webscout/Provider/Deepinfra.py +339 -339
  23. webscout/Provider/ExaChat.py +358 -358
  24. webscout/Provider/Gemini.py +169 -169
  25. webscout/Provider/GithubChat.py +1 -2
  26. webscout/Provider/Glider.py +3 -3
  27. webscout/Provider/HeckAI.py +171 -81
  28. webscout/Provider/OPENAI/BLACKBOXAI.py +766 -735
  29. webscout/Provider/OPENAI/Cloudflare.py +7 -7
  30. webscout/Provider/OPENAI/FreeGemini.py +6 -5
  31. webscout/Provider/OPENAI/NEMOTRON.py +8 -20
  32. webscout/Provider/OPENAI/Qwen3.py +283 -0
  33. webscout/Provider/OPENAI/README.md +952 -1253
  34. webscout/Provider/OPENAI/TwoAI.py +357 -0
  35. webscout/Provider/OPENAI/__init__.py +5 -1
  36. webscout/Provider/OPENAI/ai4chat.py +40 -40
  37. webscout/Provider/OPENAI/api.py +808 -649
  38. webscout/Provider/OPENAI/c4ai.py +3 -3
  39. webscout/Provider/OPENAI/chatgpt.py +555 -555
  40. webscout/Provider/OPENAI/chatgptclone.py +493 -487
  41. webscout/Provider/OPENAI/chatsandbox.py +4 -3
  42. webscout/Provider/OPENAI/copilot.py +242 -0
  43. webscout/Provider/OPENAI/deepinfra.py +5 -2
  44. webscout/Provider/OPENAI/e2b.py +63 -5
  45. webscout/Provider/OPENAI/exaai.py +416 -410
  46. webscout/Provider/OPENAI/exachat.py +444 -443
  47. webscout/Provider/OPENAI/freeaichat.py +2 -2
  48. webscout/Provider/OPENAI/glider.py +5 -2
  49. webscout/Provider/OPENAI/groq.py +5 -2
  50. webscout/Provider/OPENAI/heckai.py +308 -307
  51. webscout/Provider/OPENAI/mcpcore.py +8 -2
  52. webscout/Provider/OPENAI/multichat.py +4 -4
  53. webscout/Provider/OPENAI/netwrck.py +6 -5
  54. webscout/Provider/OPENAI/oivscode.py +287 -0
  55. webscout/Provider/OPENAI/opkfc.py +496 -496
  56. webscout/Provider/OPENAI/pydantic_imports.py +172 -0
  57. webscout/Provider/OPENAI/scirachat.py +15 -9
  58. webscout/Provider/OPENAI/sonus.py +304 -303
  59. webscout/Provider/OPENAI/standardinput.py +433 -433
  60. webscout/Provider/OPENAI/textpollinations.py +4 -4
  61. webscout/Provider/OPENAI/toolbaz.py +413 -413
  62. webscout/Provider/OPENAI/typefully.py +3 -3
  63. webscout/Provider/OPENAI/typegpt.py +11 -5
  64. webscout/Provider/OPENAI/uncovrAI.py +463 -462
  65. webscout/Provider/OPENAI/utils.py +90 -79
  66. webscout/Provider/OPENAI/venice.py +431 -425
  67. webscout/Provider/OPENAI/wisecat.py +387 -381
  68. webscout/Provider/OPENAI/writecream.py +3 -3
  69. webscout/Provider/OPENAI/x0gpt.py +365 -378
  70. webscout/Provider/OPENAI/yep.py +39 -13
  71. webscout/Provider/TTI/README.md +55 -101
  72. webscout/Provider/TTI/__init__.py +4 -9
  73. webscout/Provider/TTI/aiarta.py +365 -0
  74. webscout/Provider/TTI/artbit.py +0 -0
  75. webscout/Provider/TTI/base.py +64 -0
  76. webscout/Provider/TTI/fastflux.py +200 -0
  77. webscout/Provider/TTI/magicstudio.py +201 -0
  78. webscout/Provider/TTI/piclumen.py +203 -0
  79. webscout/Provider/TTI/pixelmuse.py +225 -0
  80. webscout/Provider/TTI/pollinations.py +221 -0
  81. webscout/Provider/TTI/utils.py +11 -0
  82. webscout/Provider/TTS/__init__.py +2 -1
  83. webscout/Provider/TTS/base.py +159 -159
  84. webscout/Provider/TTS/openai_fm.py +129 -0
  85. webscout/Provider/TextPollinationsAI.py +308 -308
  86. webscout/Provider/TwoAI.py +239 -44
  87. webscout/Provider/UNFINISHED/Youchat.py +330 -330
  88. webscout/Provider/UNFINISHED/puterjs.py +635 -0
  89. webscout/Provider/UNFINISHED/test_lmarena.py +119 -119
  90. webscout/Provider/Writecream.py +246 -246
  91. webscout/Provider/__init__.py +2 -0
  92. webscout/Provider/ai4chat.py +33 -8
  93. webscout/Provider/koala.py +169 -169
  94. webscout/Provider/oivscode.py +309 -0
  95. webscout/Provider/samurai.py +3 -2
  96. webscout/Provider/typegpt.py +3 -3
  97. webscout/Provider/uncovr.py +368 -368
  98. webscout/client.py +70 -0
  99. webscout/litprinter/__init__.py +58 -58
  100. webscout/optimizers.py +419 -419
  101. webscout/scout/README.md +3 -1
  102. webscout/scout/core/crawler.py +134 -64
  103. webscout/scout/core/scout.py +148 -109
  104. webscout/scout/element.py +106 -88
  105. webscout/swiftcli/Readme.md +323 -323
  106. webscout/swiftcli/plugins/manager.py +9 -2
  107. webscout/version.py +1 -1
  108. webscout/zeroart/__init__.py +134 -134
  109. webscout/zeroart/effects.py +100 -100
  110. webscout/zeroart/fonts.py +1238 -1238
  111. {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/METADATA +159 -35
  112. {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/RECORD +116 -161
  113. {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/WHEEL +1 -1
  114. {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/entry_points.txt +1 -0
  115. webscout/Litlogger/Readme.md +0 -175
  116. webscout/Litlogger/core/__init__.py +0 -6
  117. webscout/Litlogger/core/level.py +0 -23
  118. webscout/Litlogger/core/logger.py +0 -165
  119. webscout/Litlogger/handlers/__init__.py +0 -12
  120. webscout/Litlogger/handlers/console.py +0 -33
  121. webscout/Litlogger/handlers/file.py +0 -143
  122. webscout/Litlogger/handlers/network.py +0 -173
  123. webscout/Litlogger/styles/__init__.py +0 -7
  124. webscout/Litlogger/styles/colors.py +0 -249
  125. webscout/Litlogger/styles/formats.py +0 -458
  126. webscout/Litlogger/styles/text.py +0 -87
  127. webscout/Litlogger/utils/__init__.py +0 -6
  128. webscout/Litlogger/utils/detectors.py +0 -153
  129. webscout/Litlogger/utils/formatters.py +0 -200
  130. webscout/Provider/TTI/AiForce/README.md +0 -159
  131. webscout/Provider/TTI/AiForce/__init__.py +0 -22
  132. webscout/Provider/TTI/AiForce/async_aiforce.py +0 -224
  133. webscout/Provider/TTI/AiForce/sync_aiforce.py +0 -245
  134. webscout/Provider/TTI/FreeAIPlayground/README.md +0 -99
  135. webscout/Provider/TTI/FreeAIPlayground/__init__.py +0 -9
  136. webscout/Provider/TTI/FreeAIPlayground/async_freeaiplayground.py +0 -181
  137. webscout/Provider/TTI/FreeAIPlayground/sync_freeaiplayground.py +0 -180
  138. webscout/Provider/TTI/ImgSys/README.md +0 -174
  139. webscout/Provider/TTI/ImgSys/__init__.py +0 -23
  140. webscout/Provider/TTI/ImgSys/async_imgsys.py +0 -202
  141. webscout/Provider/TTI/ImgSys/sync_imgsys.py +0 -195
  142. webscout/Provider/TTI/MagicStudio/README.md +0 -101
  143. webscout/Provider/TTI/MagicStudio/__init__.py +0 -2
  144. webscout/Provider/TTI/MagicStudio/async_magicstudio.py +0 -111
  145. webscout/Provider/TTI/MagicStudio/sync_magicstudio.py +0 -109
  146. webscout/Provider/TTI/Nexra/README.md +0 -155
  147. webscout/Provider/TTI/Nexra/__init__.py +0 -22
  148. webscout/Provider/TTI/Nexra/async_nexra.py +0 -286
  149. webscout/Provider/TTI/Nexra/sync_nexra.py +0 -258
  150. webscout/Provider/TTI/PollinationsAI/README.md +0 -146
  151. webscout/Provider/TTI/PollinationsAI/__init__.py +0 -23
  152. webscout/Provider/TTI/PollinationsAI/async_pollinations.py +0 -311
  153. webscout/Provider/TTI/PollinationsAI/sync_pollinations.py +0 -265
  154. webscout/Provider/TTI/aiarta/README.md +0 -134
  155. webscout/Provider/TTI/aiarta/__init__.py +0 -2
  156. webscout/Provider/TTI/aiarta/async_aiarta.py +0 -482
  157. webscout/Provider/TTI/aiarta/sync_aiarta.py +0 -440
  158. webscout/Provider/TTI/artbit/README.md +0 -100
  159. webscout/Provider/TTI/artbit/__init__.py +0 -22
  160. webscout/Provider/TTI/artbit/async_artbit.py +0 -155
  161. webscout/Provider/TTI/artbit/sync_artbit.py +0 -148
  162. webscout/Provider/TTI/fastflux/README.md +0 -129
  163. webscout/Provider/TTI/fastflux/__init__.py +0 -22
  164. webscout/Provider/TTI/fastflux/async_fastflux.py +0 -261
  165. webscout/Provider/TTI/fastflux/sync_fastflux.py +0 -252
  166. webscout/Provider/TTI/huggingface/README.md +0 -114
  167. webscout/Provider/TTI/huggingface/__init__.py +0 -22
  168. webscout/Provider/TTI/huggingface/async_huggingface.py +0 -199
  169. webscout/Provider/TTI/huggingface/sync_huggingface.py +0 -195
  170. webscout/Provider/TTI/piclumen/README.md +0 -161
  171. webscout/Provider/TTI/piclumen/__init__.py +0 -23
  172. webscout/Provider/TTI/piclumen/async_piclumen.py +0 -268
  173. webscout/Provider/TTI/piclumen/sync_piclumen.py +0 -233
  174. webscout/Provider/TTI/pixelmuse/README.md +0 -79
  175. webscout/Provider/TTI/pixelmuse/__init__.py +0 -4
  176. webscout/Provider/TTI/pixelmuse/async_pixelmuse.py +0 -249
  177. webscout/Provider/TTI/pixelmuse/sync_pixelmuse.py +0 -182
  178. webscout/Provider/TTI/talkai/README.md +0 -139
  179. webscout/Provider/TTI/talkai/__init__.py +0 -4
  180. webscout/Provider/TTI/talkai/async_talkai.py +0 -229
  181. webscout/Provider/TTI/talkai/sync_talkai.py +0 -207
  182. webscout/Provider/UNFINISHED/oivscode.py +0 -351
  183. {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/licenses/LICENSE.md +0 -0
  184. {webscout-8.2.8.dist-info → webscout-8.2.9.dist-info}/top_level.txt +0 -0
@@ -12,7 +12,7 @@ from uuid import uuid4
12
12
  from .base import OpenAICompatibleProvider, BaseChat, BaseCompletions
13
13
  from .utils import (
14
14
  ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
15
- ChatCompletionMessage, CompletionUsage
15
+ ChatCompletionMessage, CompletionUsage, count_tokens
16
16
  )
17
17
 
18
18
  from webscout.AIutel import sanitize_stream
@@ -123,9 +123,9 @@ class Completions(BaseCompletions):
123
123
  delta = ChoiceDelta(content=content_chunk)
124
124
  choice = Choice(index=0, delta=delta, finish_reason=None)
125
125
 
126
- # Estimate token usage (very rough estimate)
127
- prompt_tokens = sum(len(msg.get("content", "")) // 4 for msg in payload["messages"])
128
- completion_tokens = len(accumulated_content) // 4
126
+ # Estimate token usage using count_tokens
127
+ prompt_tokens = count_tokens([msg.get("content", "") for msg in payload["messages"]])
128
+ completion_tokens = count_tokens(accumulated_content)
129
129
 
130
130
  chunk = ChatCompletionChunk(
131
131
  id=request_id,
@@ -202,9 +202,9 @@ class Completions(BaseCompletions):
202
202
  finish_reason="stop"
203
203
  )
204
204
 
205
- # Estimate token usage (very rough estimate)
206
- prompt_tokens = sum(len(msg.get("content", "")) // 4 for msg in payload["messages"])
207
- completion_tokens = len(full_content) // 4
205
+ # Estimate token usage using count_tokens
206
+ prompt_tokens = count_tokens([msg.get("content", "") for msg in payload["messages"]])
207
+ completion_tokens = count_tokens(full_content)
208
208
  usage = CompletionUsage(
209
209
  prompt_tokens=prompt_tokens,
210
210
  completion_tokens=completion_tokens,
@@ -22,7 +22,8 @@ from webscout.Provider.OPENAI.utils import (
22
22
  ChoiceDelta,
23
23
  CompletionUsage,
24
24
  format_prompt,
25
- get_system_prompt
25
+ get_system_prompt,
26
+ count_tokens
26
27
  )
27
28
 
28
29
  # ANSI escape codes for formatting
@@ -100,7 +101,7 @@ class Completions(BaseCompletions):
100
101
  for text_chunk in processed_stream:
101
102
  if text_chunk and isinstance(text_chunk, str):
102
103
  streaming_text += text_chunk
103
- completion_tokens += len(text_chunk) // 4 # Rough estimate
104
+ completion_tokens += count_tokens(text_chunk)
104
105
 
105
106
  delta = ChoiceDelta(content=text_chunk, role="assistant")
106
107
  choice = Choice(index=0, delta=delta, finish_reason=None)
@@ -160,9 +161,9 @@ class Completions(BaseCompletions):
160
161
  # Skip invalid JSON
161
162
  pass
162
163
 
163
- # Create usage statistics (rough estimate)
164
- prompt_tokens = len(str(payload)) // 4
165
- completion_tokens = len(full_text_response) // 4
164
+ # Create usage statistics using count_tokens
165
+ prompt_tokens = count_tokens(str(payload))
166
+ completion_tokens = count_tokens(full_text_response)
166
167
  total_tokens = prompt_tokens + completion_tokens
167
168
 
168
169
  usage = CompletionUsage(
@@ -9,7 +9,7 @@ from typing import List, Dict, Optional, Union, Generator, Any
9
9
  from webscout.Provider.OPENAI.base import OpenAICompatibleProvider, BaseChat, BaseCompletions
10
10
  from webscout.Provider.OPENAI.utils import (
11
11
  ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
12
- ChatCompletionMessage, CompletionUsage, format_prompt
12
+ ChatCompletionMessage, CompletionUsage, format_prompt, count_tokens
13
13
  )
14
14
  try:
15
15
  from webscout.litagent import LitAgent
@@ -89,8 +89,8 @@ class Completions(BaseCompletions):
89
89
  pass
90
90
  message = ChatCompletionMessage(role="assistant", content=full_response_content)
91
91
  choice = Choice(index=0, message=message, finish_reason="stop")
92
- prompt_tokens = len(payload.get("content", "")) // 4
93
- completion_tokens = len(full_response_content) // 4
92
+ prompt_tokens = count_tokens(payload.get("content", ""))
93
+ completion_tokens = count_tokens(full_response_content)
94
94
  usage = CompletionUsage(
95
95
  prompt_tokens=prompt_tokens,
96
96
  completion_tokens=completion_tokens,
@@ -111,16 +111,10 @@ class Chat(BaseChat):
111
111
 
112
112
  class NEMOTRON(OpenAICompatibleProvider):
113
113
  AVAILABLE_MODELS = [
114
- "NEMOTRON/gpt4o",
115
- "NEMOTRON/nemotron70b",
114
+ "gpt4o",
115
+ "nemotron70b",
116
116
  ]
117
117
 
118
- # Model mapping for payload
119
- MODEL_PAYLOAD_MAPPING = {
120
- "NEMOTRON/gpt4o": "gpt4o",
121
- "NEMOTRON/nemotron70b": "nemotron70b",
122
- }
123
-
124
118
  API_BASE_URL = "https://nemotron.one/api/chat"
125
119
  def __init__(
126
120
  self,
@@ -183,18 +177,12 @@ class NEMOTRON(OpenAICompatibleProvider):
183
177
  Returns:
184
178
  NEMOTRON model name for API payload
185
179
  """
186
- # Handle NEMOTRON/ prefix aliases for payload
187
- if model_alias.startswith("NEMOTRON/"):
188
- base_model = model_alias.split("/")[1]
189
- if base_model in ["gpt4o", "nemotron70b"]:
190
- return base_model
191
-
192
- # Handle direct model names
193
- if model_alias in ["gpt4o", "nemotron70b"]:
180
+ # Accept only direct model names
181
+ if model_alias in self.AVAILABLE_MODELS:
194
182
  return model_alias
195
183
 
196
184
  # Case-insensitive matching
197
- for m in ["gpt4o", "nemotron70b"]:
185
+ for m in self.AVAILABLE_MODELS:
198
186
  if m.lower() == model_alias.lower():
199
187
  return m
200
188
 
@@ -0,0 +1,283 @@
1
+ import requests
2
+ import json
3
+ import time
4
+ import uuid
5
+ from typing import List, Dict, Optional, Union, Generator, Any
6
+
7
+ from webscout.Provider.OPENAI.base import OpenAICompatibleProvider, BaseChat, BaseCompletions
8
+ from webscout.Provider.OPENAI.utils import (
9
+ ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
10
+ ChatCompletionMessage, CompletionUsage,
11
+ get_last_user_message, get_system_prompt,
12
+ count_tokens
13
+ )
14
+
15
class Completions(BaseCompletions):
    """Chat-completions endpoint backed by the Qwen3 Gradio demo queue.

    A request is served in two HTTP calls: a POST to ``client.api_endpoint``
    enqueues the job, then a GET on ``<client.url>/gradio_api/queue/data``
    returns ``data: <json>`` event lines carrying incremental update
    operations. Both the streaming and the non-streaming path read that event
    stream; the non-streaming path simply concatenates every piece.

    Reasoning ("tool") content is wrapped in ``<think>`` / ``</think>`` tags so
    that it can be told apart from the answer text.
    """

    def __init__(self, client: 'Qwen3'):
        """Keep a reference to the owning client (session, headers, URLs, timeout)."""
        self._client = client

    def create(
        self,
        *,
        model: str,
        messages: List[Dict[str, str]],
        max_tokens: Optional[int] = 2048,
        stream: bool = False,
        temperature: Optional[float] = None,
        top_p: Optional[float] = None,
        **kwargs: Any
    ) -> Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]:
        """Build the queue payload and dispatch to the stream / non-stream path.

        Args:
            model: Model name or alias; resolved through ``client.get_model``.
            messages: OpenAI-style message dicts. Only the last user message
                and the system prompt are sent to the backend.
            max_tokens, temperature, top_p: Accepted for interface
                compatibility; they are not part of the payload sent upstream.
            stream: When true, return a generator of ``ChatCompletionChunk``.
            **kwargs: ``thinking_budget`` (default 38) is forwarded; other keys
                are ignored.

        Returns:
            A ``ChatCompletion``, or a generator of ``ChatCompletionChunk``
            when ``stream`` is true.
        """
        payload = {
            "data": [
                get_last_user_message(messages),
                {
                    "thinking_budget": kwargs.get("thinking_budget", 38),
                    "model": self._client.get_model(model),
                    "sys_prompt": get_system_prompt(messages)
                },
                None, None
            ],
            "event_data": None,
            # NOTE(review): fn_index / trigger_id presumably identify the chat
            # handler in the demo app's current layout - confirm if the space changes.
            "fn_index": 13,
            "trigger_id": 31,
            "session_hash": str(uuid.uuid4()).replace('-', '')
        }

        request_id = f"chatcmpl-{uuid.uuid4()}"
        created_time = int(time.time())

        if stream:
            return self._create_stream(request_id, created_time, model, payload)
        else:
            return self._create_non_stream(request_id, created_time, model, payload)

    @staticmethod
    def _classify_op(op: Any) -> tuple:
        """Classify one update operation as ``(kind, text)``.

        ``kind`` is ``"tool"`` (reasoning content), ``"text"`` (answer
        content), ``"done"`` (the tool block reported status ``"done"``) or
        ``None`` for anything else, including malformed operations.
        """
        if not isinstance(op, (list, tuple)) or len(op) < 3:
            return None, None
        action, path, value = op[0], op[1], op[2]
        if not isinstance(path, (list, tuple)):
            return None, None

        # A new content block (tool or text object) is added.
        if action == "add" and isinstance(value, dict) and "type" in value:
            if len(path) == 4 and path[0] == "value" and path[2] == "content":
                block_type = value.get("type")
                if block_type in ("tool", "text"):
                    return block_type, value.get("content")
            return None, None

        # A string is appended to an existing block's content.
        if action == "append" and isinstance(value, str):
            if len(path) == 5 and path[0] == "value" and path[2] == "content" and path[4] == "content":
                # Block index 0 is the tool block, 1 is the text block.
                if path[3] == 0:
                    return "tool", value
                if path[3] == 1:
                    return "text", value
            return None, None

        # Status update on the tool block (path[3] == 0).
        if (
            action == "replace" and len(path) == 6
            and path[0] == "value" and path[2] == "content"
            and path[3] == 0 and path[4] == "options" and path[5] == "status"
        ):
            if value == "done":
                return "done", None
        return None, None

    def _iter_content(self, payload: Dict[str, Any]) -> Generator[str, None, None]:
        """Enqueue ``payload`` and yield the response as text pieces.

        Yields reasoning and answer fragments in arrival order, inserting
        ``<think>`` before the first reasoning fragment and a closing
        ``</think>`` when reasoning ends, the process completes, or the stream
        stops early.

        Raises:
            requests.HTTPError: If either HTTP call returns an error status.
        """
        session = self._client.session

        # Step 1: join the queue.
        join_resp = session.post(
            self._client.api_endpoint,
            headers=self._client.headers,
            json=payload,
            timeout=self._client.timeout,
        )
        join_resp.raise_for_status()

        # Step 2: read the event stream for this session.
        stream_resp = session.get(
            self._client.url + "/gradio_api/queue/data",
            headers=self._client.stream_headers,
            params={'session_hash': payload["session_hash"]},
            stream=True,
            timeout=self._client.timeout,
        )
        try:
            stream_resp.raise_for_status()
            thinking_open = False  # True between an emitted <think> and its </think>

            for raw_line in stream_resp.iter_lines():
                if not raw_line:
                    continue
                line = raw_line.decode('utf-8')
                if not line.startswith('data: '):
                    continue
                try:
                    event = json.loads(line[6:])
                except json.JSONDecodeError:
                    # Skip lines that are not valid JSON events.
                    continue
                if not isinstance(event, dict):
                    continue

                msg = event.get('msg')
                if msg == 'process_generating':
                    output = event.get('output')
                    data = output.get('data') if isinstance(output, dict) else None
                    if not (isinstance(data, list) and len(data) > 5 and isinstance(data[5], list)):
                        continue
                    for op in data[5]:
                        kind, text = self._classify_op(op)
                        if kind == "done":
                            if thinking_open:
                                thinking_open = False
                                yield "</think>\n\n"
                        elif kind == "tool" and isinstance(text, str) and text:
                            if not thinking_open:
                                thinking_open = True
                                yield "<think>"
                            yield text
                        elif kind == "text" and isinstance(text, str) and text:
                            # Answer text starts: close any open thinking tag first.
                            if thinking_open:
                                thinking_open = False
                                yield "</think>"
                            yield text
                elif msg == 'process_completed':
                    break

            # Close the tag if the process completed, or the stream ended, mid-thought.
            if thinking_open:
                yield "</think>"
        finally:
            # Release the connection even if the consumer stops iterating early.
            stream_resp.close()

    def _create_stream(
        self, request_id: str, created_time: int, model: str, payload: Dict[str, Any]
    ) -> Generator[ChatCompletionChunk, None, None]:
        """Yield one ``ChatCompletionChunk`` per text piece of the response."""
        for piece in self._iter_content(payload):
            delta = ChoiceDelta(content=piece, role="assistant")
            yield ChatCompletionChunk(
                id=request_id,
                choices=[Choice(index=0, delta=delta)],
                created=created_time,
                model=model,
            )

    def _create_non_stream(
        self, request_id: str, created_time: int, model: str, payload: Dict[str, Any]
    ) -> ChatCompletion:
        """Collect the whole response and return it as a single ``ChatCompletion``.

        The join endpoint only enqueues the job, so the content is read from
        the same event stream as the streaming path and concatenated
        (reasoning stays wrapped in ``<think>`` tags).
        """
        output = "".join(self._iter_content(payload))
        message = ChatCompletionMessage(role="assistant", content=output)
        choice = Choice(index=0, message=message, finish_reason="stop")

        # Prompt usage is estimated from the text actually sent upstream:
        # the user message (data[0]) and the system prompt (data[1]["sys_prompt"]).
        request_data = payload.get("data") or []
        prompt_parts = []
        if request_data and isinstance(request_data[0], str) and request_data[0]:
            prompt_parts.append(request_data[0])
        if len(request_data) > 1 and isinstance(request_data[1], dict):
            sys_prompt = request_data[1].get("sys_prompt")
            if isinstance(sys_prompt, str) and sys_prompt:
                prompt_parts.append(sys_prompt)
        prompt_tokens = count_tokens(prompt_parts)
        completion_tokens = count_tokens(output)
        usage = CompletionUsage(
            prompt_tokens=prompt_tokens,
            completion_tokens=completion_tokens,
            total_tokens=prompt_tokens + completion_tokens
        )
        completion = ChatCompletion(
            id=request_id,
            choices=[choice],
            created=created_time,
            model=model,
            usage=usage,
        )
        return completion
206
+
207
class Chat(BaseChat):
    """Namespace object exposing ``chat.completions`` for a Qwen3 client."""

    def __init__(self, client: 'Qwen3'):
        """Create the completions endpoint bound to ``client``."""
        completions_endpoint = Completions(client)
        self.completions = completions_endpoint
210
+
211
class Qwen3(OpenAICompatibleProvider):
    """OpenAI-compatible client for the Qwen3 demo space.

    Holds the HTTP session, the header sets used for the queue-join request
    and for the event stream, and the model catalogue. Completions are reached
    through ``client.chat.completions.create(...)``.
    """

    url = "https://qwen-qwen3-demo.hf.space"
    api_endpoint = "https://qwen-qwen3-demo.hf.space/gradio_api/queue/join?__theme=system"
    AVAILABLE_MODELS = [
        "qwen3-235b-a22b",
        "qwen3-32b",
        "qwen3-30b-a3b",
        "qwen3-14b",
        "qwen3-8b",
        "qwen3-4b",
        "qwen3-1.7b",
        "qwen3-0.6b",
    ]
    # Alternative spellings mapped onto the names in AVAILABLE_MODELS.
    MODEL_ALIASES = {
        "qwen-3-235b": "qwen3-235b-a22b",
        "qwen-3-30b": "qwen3-30b-a3b",
        "qwen-3-32b": "qwen3-32b",
        "qwen-3-14b": "qwen3-14b",
        "qwen-3-4b": "qwen3-4b",
        "qwen-3-1.7b": "qwen3-1.7b",
        "qwen-3-0.6b": "qwen3-0.6b"
    }

    def __init__(self, timeout: Optional[int] = None):
        """Set up the session and headers.

        Args:
            timeout: Value passed as ``timeout`` to every HTTP call made by the
                completions endpoint; ``None`` is passed through unchanged.
        """
        self.timeout = timeout
        self.session = requests.Session()

        user_agent = 'Mozilla/5.0 (X11; Linux x86_64; rv:136.0) Gecko/20100101 Firefox/136.0'
        referer = f'{self.url}/?__theme=system'

        # Headers for the JSON queue-join request.
        self.headers = {
            'User-Agent': user_agent,
            'Accept': '*/*',
            'Accept-Language': 'en-US,en;q=0.5',
            'Accept-Encoding': 'gzip, deflate, br, zstd',
            'Referer': referer,
            'content-type': 'application/json',
            'Origin': self.url,
            'Connection': 'keep-alive',
            'Sec-Fetch-Dest': 'empty',
            'Sec-Fetch-Mode': 'cors',
            'Sec-Fetch-Site': 'same-origin',
            'Pragma': 'no-cache',
            'Cache-Control': 'no-cache',
        }
        # Headers for the event-stream request.
        self.stream_headers = {
            'Accept': 'text/event-stream',
            'Accept-Language': 'en-US,en;q=0.5',
            'Referer': referer,
            'User-Agent': user_agent,
        }
        self.session.headers.update(self.headers)
        self.chat = Chat(self)

    def get_model(self, model):
        """Return the backend model name for ``model``.

        Known aliases are translated; any other value is returned unchanged.
        """
        try:
            return self.MODEL_ALIASES[model]
        except KeyError:
            return model

    @property
    def models(self):
        """Object whose ``list()`` returns ``AVAILABLE_MODELS`` of this client's class."""
        owner = self

        class _ModelList:
            def list(inner_self):
                return type(owner).AVAILABLE_MODELS

        return _ModelList()
270
+
271
if __name__ == "__main__":
    # Manual smoke test: stream one short conversation and print each chunk.
    from rich import print

    client = Qwen3()
    demo_messages = [
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "Hello "}
    ]
    resp = client.chat.completions.create(
        model="qwen3-14b",
        messages=demo_messages,
        stream=True
    )
    for chunk in resp:
        print(chunk, end="", flush=True)