webscout 8.2.9__py3-none-any.whl → 8.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of webscout might be problematic.
- webscout/AIauto.py +2 -2
- webscout/Provider/Blackboxai.py +2 -0
- webscout/Provider/ChatSandbox.py +2 -1
- webscout/Provider/Deepinfra.py +1 -1
- webscout/Provider/HeckAI.py +1 -1
- webscout/Provider/LambdaChat.py +1 -0
- webscout/Provider/MCPCore.py +7 -3
- webscout/Provider/OPENAI/BLACKBOXAI.py +1017 -766
- webscout/Provider/OPENAI/Cloudflare.py +31 -14
- webscout/Provider/OPENAI/FalconH1.py +457 -0
- webscout/Provider/OPENAI/FreeGemini.py +29 -13
- webscout/Provider/OPENAI/NEMOTRON.py +26 -14
- webscout/Provider/OPENAI/PI.py +427 -0
- webscout/Provider/OPENAI/Qwen3.py +303 -282
- webscout/Provider/OPENAI/TwoAI.py +29 -12
- webscout/Provider/OPENAI/__init__.py +3 -1
- webscout/Provider/OPENAI/ai4chat.py +33 -23
- webscout/Provider/OPENAI/api.py +78 -12
- webscout/Provider/OPENAI/base.py +2 -0
- webscout/Provider/OPENAI/c4ai.py +31 -10
- webscout/Provider/OPENAI/chatgpt.py +41 -22
- webscout/Provider/OPENAI/chatgptclone.py +32 -13
- webscout/Provider/OPENAI/chatsandbox.py +7 -3
- webscout/Provider/OPENAI/copilot.py +26 -10
- webscout/Provider/OPENAI/deepinfra.py +327 -321
- webscout/Provider/OPENAI/e2b.py +77 -99
- webscout/Provider/OPENAI/exaai.py +13 -10
- webscout/Provider/OPENAI/exachat.py +10 -6
- webscout/Provider/OPENAI/flowith.py +7 -3
- webscout/Provider/OPENAI/freeaichat.py +10 -6
- webscout/Provider/OPENAI/glider.py +10 -6
- webscout/Provider/OPENAI/heckai.py +11 -8
- webscout/Provider/OPENAI/llmchatco.py +9 -7
- webscout/Provider/OPENAI/mcpcore.py +10 -7
- webscout/Provider/OPENAI/multichat.py +3 -1
- webscout/Provider/OPENAI/netwrck.py +10 -6
- webscout/Provider/OPENAI/oivscode.py +12 -9
- webscout/Provider/OPENAI/opkfc.py +14 -3
- webscout/Provider/OPENAI/scirachat.py +14 -8
- webscout/Provider/OPENAI/sonus.py +10 -6
- webscout/Provider/OPENAI/standardinput.py +18 -9
- webscout/Provider/OPENAI/textpollinations.py +14 -7
- webscout/Provider/OPENAI/toolbaz.py +16 -10
- webscout/Provider/OPENAI/typefully.py +14 -7
- webscout/Provider/OPENAI/typegpt.py +10 -6
- webscout/Provider/OPENAI/uncovrAI.py +22 -8
- webscout/Provider/OPENAI/venice.py +10 -6
- webscout/Provider/OPENAI/writecream.py +166 -163
- webscout/Provider/OPENAI/x0gpt.py +367 -365
- webscout/Provider/OPENAI/yep.py +384 -382
- webscout/Provider/PI.py +2 -1
- webscout/Provider/__init__.py +0 -2
- webscout/Provider/granite.py +41 -6
- webscout/Provider/oivscode.py +37 -37
- webscout/Provider/scnet.py +1 -0
- webscout/version.py +1 -1
- {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/METADATA +2 -1
- {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/RECORD +62 -61
- {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/WHEEL +1 -1
- webscout/Provider/ChatGPTGratis.py +0 -194
- {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/entry_points.txt +0 -0
- {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/licenses/LICENSE.md +0 -0
- {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/top_level.txt +0 -0
webscout/Provider/OPENAI/Cloudflare.py

@@ -31,6 +31,8 @@ class Completions(BaseCompletions):
         stream: bool = False,
         temperature: Optional[float] = None,
         top_p: Optional[float] = None,
+        timeout: Optional[int] = None,
+        proxies: Optional[dict] = None,
         **kwargs: Any
     ) -> Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]:
         """
@@ -68,7 +70,9 @@ class Completions(BaseCompletions):
                 request_id=request_id,
                 created_time=created_time,
                 model=model,
-                payload=payload
+                payload=payload,
+                timeout=timeout,
+                proxies=proxies
             )
 
         # Otherwise use non-streaming implementation
@@ -76,7 +80,9 @@ class Completions(BaseCompletions):
             request_id=request_id,
             created_time=created_time,
             model=model,
-            payload=payload
+            payload=payload,
+            timeout=timeout,
+            proxies=proxies
         )
 
     def _create_streaming(
@@ -85,9 +91,14 @@ class Completions(BaseCompletions):
         request_id: str,
         created_time: int,
         model: str,
-        payload: Dict[str, Any]
+        payload: Dict[str, Any],
+        timeout: Optional[int] = None,
+        proxies: Optional[dict] = None
     ) -> Generator[ChatCompletionChunk, None, None]:
         """Implementation for streaming chat completions."""
+        original_proxies = self._client.session.proxies
+        if proxies is not None:
+            self._client.session.proxies = proxies
         try:
             response = self._client.session.post(
                 self._client.chat_endpoint,
@@ -95,7 +106,7 @@ class Completions(BaseCompletions):
                 cookies=self._client.cookies,
                 data=json.dumps(payload),
                 stream=True,
-                timeout=self._client.timeout,
+                timeout=timeout if timeout is not None else self._client.timeout,
                 impersonate="chrome120"
             )
             response.raise_for_status()
@@ -152,6 +163,9 @@ class Completions(BaseCompletions):
             raise IOError(f"Cloudflare streaming request failed (CurlError): {e}") from e
         except Exception as e:
             raise IOError(f"Cloudflare streaming request failed: {e}") from e
+        finally:
+            if proxies is not None:
+                self._client.session.proxies = original_proxies
 
     def _create_non_streaming(
         self,
@@ -159,9 +173,14 @@ class Completions(BaseCompletions):
         request_id: str,
         created_time: int,
         model: str,
-        payload: Dict[str, Any]
+        payload: Dict[str, Any],
+        timeout: Optional[int] = None,
+        proxies: Optional[dict] = None
     ) -> ChatCompletion:
         """Implementation for non-streaming chat completions."""
+        original_proxies = self._client.session.proxies
+        if proxies is not None:
+            self._client.session.proxies = proxies
         try:
             response = self._client.session.post(
                 self._client.chat_endpoint,
@@ -169,7 +188,7 @@ class Completions(BaseCompletions):
                 cookies=self._client.cookies,
                 data=json.dumps(payload),
                 stream=True,  # Still use streaming API but collect all chunks
-                timeout=self._client.timeout,
+                timeout=timeout if timeout is not None else self._client.timeout,
                 impersonate="chrome120"
             )
             response.raise_for_status()
@@ -226,6 +245,9 @@ class Completions(BaseCompletions):
             raise IOError(f"Cloudflare request failed (CurlError): {e}") from e
         except Exception as e:
             raise IOError(f"Cloudflare request failed: {e}") from e
+        finally:
+            if proxies is not None:
+                self._client.session.proxies = original_proxies
 
     @staticmethod
     def _cloudflare_extractor(chunk: Union[str, Dict[str, Any]]) -> Optional[str]:
@@ -315,23 +337,19 @@ class Cloudflare(OpenAICompatibleProvider):
     def __init__(
         self,
         api_key: Optional[str] = None, # Not used but included for compatibility
-        timeout: int = 30,
-        proxies: dict = {},
     ):
         """
         Initialize the Cloudflare client.
 
         Args:
             api_key: Not used but included for compatibility with OpenAI interface
-            timeout: Request timeout in seconds
-            proxies: Optional proxy configuration
         """
-        self.timeout = timeout
-        self.proxies = proxies
+        self.timeout = 30
         self.chat_endpoint = "https://playground.ai.cloudflare.com/api/inference"
 
         # Initialize session
         self.session = Session()
+        self.session.proxies = {}
 
         # Set headers
         self.headers = {
@@ -358,9 +376,8 @@ class Cloudflare(OpenAICompatibleProvider):
             '__cf_bm': uuid4().hex,
         }
 
-        # Apply headers
+        # Apply headers to session
         self.session.headers.update(self.headers)
-        self.session.proxies = proxies
 
         # Initialize chat interface
         self.chat = Chat(self)
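With these changes, the Cloudflare provider's create() accepts per-request timeout and proxies overrides, applies them only for the duration of the call, and restores the session's original proxies in a finally block. A minimal usage sketch under that assumption; the import path follows the file list above, while the model id and proxy URL are illustrative placeholders, not values taken from the diff:

# Hedged sketch: model id and proxy URL are placeholders.
from webscout.Provider.OPENAI.Cloudflare import Cloudflare

client = Cloudflare()
response = client.chat.completions.create(
    model="@cf/meta/llama-3.1-8b-instruct",      # placeholder model id
    messages=[{"role": "user", "content": "Hello!"}],
    timeout=60,                                   # overrides the default 30 s for this call only
    proxies={"https": "http://127.0.0.1:8080"},   # applied for this request, then restored
)
print(response.choices[0].message.content)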
webscout/Provider/OPENAI/FalconH1.py (new file)

@@ -0,0 +1,457 @@
+import requests
+import json
+import time
+import uuid
+from typing import List, Dict, Optional, Union, Generator, Any
+
+from webscout.Provider.OPENAI.base import OpenAICompatibleProvider, BaseChat, BaseCompletions
+from webscout.Provider.OPENAI.utils import (
+    ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
+    ChatCompletionMessage, CompletionUsage,
+    get_system_prompt,
+    count_tokens,
+    format_prompt
+)
+from webscout.litagent import LitAgent
+
+def convert_openai_to_falcon_history(messages: List[Dict[str, str]]) -> list:
+    """
+    Converts a list of OpenAI-style chat messages to Falcon/Gradio chat history format.
+
+    Args:
+        messages (List[Dict[str, str]]):
+            A list of message dictionaries, each with 'role' and 'content' keys, following the OpenAI API format.
+
+    Returns:
+        list: A single-turn Falcon/Gradio chat history in the format [[prompt, None]].
+    """
+    prompt = format_prompt(messages, add_special_tokens=False, do_continue=True, include_system=True)
+    return [[prompt, None]]
+
+class Completions(BaseCompletions):
+    """
+    Handles text completion requests for the FalconH1 provider, supporting both streaming and non-streaming modes.
+
+    Attributes:
+        _client (Any): Reference to the FalconH1 client instance.
+        _last_yielded_content_stream (str): Tracks the last yielded content in streaming mode.
+    """
+    def __init__(self, client):
+        """
+        Initializes the Completions handler.
+
+        Args:
+            client: The FalconH1 client instance.
+        """
+        self._client = client
+        self._last_yielded_content_stream = ""
+
+    def create(
+        self,
+        *,
+        model: str,
+        messages: List[Dict[str, str]],
+        max_tokens: Optional[int] = 1024,
+        stream: bool = False,
+        temperature: Optional[float] = 0.1,
+        top_p: Optional[float] = 1.0,
+        timeout: Optional[int] = None,
+        proxies: Optional[dict] = None,
+        **kwargs: Any
+    ) -> Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]:
+        """
+        Creates a chat completion using the FalconH1 API, supporting both streaming and non-streaming responses.
+
+        Args:
+            model (str): The model identifier to use for completion.
+            messages (List[Dict[str, str]]): List of chat messages in OpenAI format.
+            max_tokens (Optional[int]): Maximum number of tokens to generate in the completion.
+            stream (bool): Whether to stream the response as chunks.
+            temperature (Optional[float]): Sampling temperature.
+            top_p (Optional[float]): Nucleus sampling probability.
+            timeout (Optional[int]): Request timeout in seconds.
+            proxies (Optional[dict]): Optional proxy settings for the request.
+            **kwargs: Additional keyword arguments for advanced options (e.g., top_k, repetition_penalty).
+
+        Returns:
+            Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]: The chat completion result or a generator yielding streamed chunks.
+        """
+        session_hash = str(uuid.uuid4()).replace('-', '')
+        chat_history = convert_openai_to_falcon_history(messages)
+        if not chat_history or chat_history[-1][0] is None:
+            raise ValueError("Messages must contain at least one user message for Falcon API.")
+        resolved_model_name = self._client.get_model(model)
+        payload_data = [
+            chat_history,
+            resolved_model_name,
+            temperature,
+            max_tokens,
+            top_p,
+            kwargs.get("top_k", 20),
+            kwargs.get("repetition_penalty", 1.2)
+        ]
+        payload = {
+            "data": payload_data,
+            "event_data": None,
+            "fn_index": 5,
+            "trigger_id": 12,
+            "session_hash": session_hash
+        }
+        request_id = f"chatcmpl-{uuid.uuid4()}"
+        created_time = int(time.time())
+        if stream:
+            self._last_yielded_content_stream = ""
+            return self._create_stream(request_id, created_time, resolved_model_name, payload, session_hash, timeout=timeout, proxies=proxies)
+        else:
+            return self._create_non_stream(request_id, created_time, resolved_model_name, payload, session_hash, timeout=timeout, proxies=proxies)
+
+    def _create_stream(
+        self, request_id: str, created_time: int, model: str, payload: Dict[str, Any], session_hash: str,
+        timeout: Optional[int] = None, proxies: Optional[dict] = None
+    ) -> Generator[ChatCompletionChunk, None, None]:
+        """
+        Internal method to handle streaming chat completions from the FalconH1 API.
+
+        Args:
+            request_id (str): Unique request identifier.
+            created_time (int): Timestamp of request creation.
+            model (str): Model identifier.
+            payload (Dict[str, Any]): Request payload for the API.
+            session_hash (str): Unique session hash for the request.
+            timeout (Optional[int]): Request timeout in seconds.
+            proxies (Optional[dict]): Optional proxy settings.
+
+        Yields:
+            ChatCompletionChunk: Chunks of the chat completion as they are received from the API.
+        """
+        original_proxies = self._client.session.proxies.copy()
+        if proxies is not None:
+            self._client.session.proxies = proxies
+        else:
+            self._client.session.proxies = {}
+        try:
+            session = self._client.session
+            join_resp = session.post(
+                self._client.api_join_endpoint,
+                headers=self._client.headers,
+                json=payload,
+                timeout=timeout if timeout is not None else self._client.timeout
+            )
+            join_resp.raise_for_status()
+            data_url = f"{self._client.api_data_endpoint}?session_hash={session_hash}"
+            stream_resp = session.get(
+                data_url,
+                headers=self._client.stream_headers,
+                stream=True,
+                timeout=timeout if timeout is not None else self._client.timeout
+            )
+            stream_resp.raise_for_status()
+            for line in stream_resp.iter_lines():
+                if line:
+                    decoded_line = line.decode('utf-8')
+                    if decoded_line.startswith('data: '):
+                        try:
+                            json_data = json.loads(decoded_line[6:])
+                            msg_type = json_data.get('msg')
+                            if msg_type == 'process_generating':
+                                output_field = json_data.get('output', {})
+                                data_field = output_field.get('data')
+                                if data_field and isinstance(data_field, list) and len(data_field) > 0:
+                                    inner_data = data_field[0]
+                                    content_to_yield = None
+                                    if isinstance(inner_data, list) and len(inner_data) > 0:
+                                        if isinstance(inner_data[0], list) and len(inner_data[0]) == 3 and inner_data[0][0] == "append":
+                                            content_to_yield = inner_data[0][2]
+                                        elif isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and \
+                                             isinstance(inner_data[0][1], str):
+                                            current_full_response = inner_data[0][1]
+                                            if current_full_response.startswith(self._last_yielded_content_stream):
+                                                content_to_yield = current_full_response[len(self._last_yielded_content_stream):]
+                                            else:
+                                                content_to_yield = current_full_response
+                                            self._last_yielded_content_stream = current_full_response
+                                    if content_to_yield:
+                                        delta = ChoiceDelta(content=content_to_yield, role="assistant")
+                                        yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
+                            elif msg_type == 'process_completed' or msg_type == 'close_stream':
+                                break
+                        except json.JSONDecodeError:
+                            continue
+                        except Exception as e:
+                            continue
+        finally:
+            self._client.session.proxies = original_proxies
+
+    def _create_non_stream(
+        self, request_id: str, created_time: int, model: str, payload: Dict[str, Any], session_hash: str,
+        timeout: Optional[int] = None, proxies: Optional[dict] = None
+    ) -> ChatCompletion:
+        """
+        Internal method to handle non-streaming chat completions from the FalconH1 API.
+
+        Args:
+            request_id (str): Unique request identifier.
+            created_time (int): Timestamp of request creation.
+            model (str): Model identifier.
+            payload (Dict[str, Any]): Request payload for the API.
+            session_hash (str): Unique session hash for the request.
+            timeout (Optional[int]): Request timeout in seconds.
+            proxies (Optional[dict]): Optional proxy settings.
+
+        Returns:
+            ChatCompletion: The full chat completion result.
+        """
+        original_proxies = self._client.session.proxies.copy()
+        if proxies is not None:
+            self._client.session.proxies = proxies
+        else:
+            self._client.session.proxies = {}
+        full_response_content = ""
+        last_full_response_chunk_ns = ""
+        response_parts = []
+        try:
+            session = self._client.session
+            join_resp = session.post(
+                self._client.api_join_endpoint, headers=self._client.headers, json=payload,
+                timeout=timeout if timeout is not None else self._client.timeout
+            )
+            join_resp.raise_for_status()
+            data_url = f"{self._client.api_data_endpoint}?session_hash={session_hash}"
+            overall_start_time = time.time()
+            effective_timeout = timeout if timeout is not None else self._client.timeout
+            while True:
+                if time.time() - overall_start_time > effective_timeout:
+                    raise TimeoutError("Timeout waiting for non-stream response completion.")
+                stream_resp = session.get(
+                    data_url, headers=self._client.stream_headers, stream=True,
+                    timeout=effective_timeout
+                )
+                stream_resp.raise_for_status()
+                found_completion_message = False
+                for line in stream_resp.iter_lines():
+                    if time.time() - overall_start_time > effective_timeout:
+                        raise TimeoutError("Timeout during non-stream response processing.")
+                    if line:
+                        decoded_line = line.decode('utf-8')
+                        if decoded_line.startswith('data: '):
+                            try:
+                                json_data = json.loads(decoded_line[6:])
+                                msg_type = json_data.get('msg')
+                                if msg_type == 'process_generating':
+                                    output_field = json_data.get('output', {})
+                                    data_field = output_field.get('data')
+                                    if data_field and isinstance(data_field, list) and len(data_field) > 0:
+                                        inner_data = data_field[0]
+                                        current_chunk_text = None
+                                        if isinstance(inner_data, list) and len(inner_data) > 0:
+                                            if isinstance(inner_data[0], list) and len(inner_data[0]) == 3 and inner_data[0][0] == "append":
+                                                current_chunk_text = inner_data[0][2]
+                                            elif isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and isinstance(inner_data[0][1], str):
+                                                current_full_response = inner_data[0][1]
+                                                if current_full_response.startswith(last_full_response_chunk_ns):
+                                                    current_chunk_text = current_full_response[len(last_full_response_chunk_ns):]
+                                                else:
+                                                    current_chunk_text = current_full_response
+                                                last_full_response_chunk_ns = current_full_response
+                                        if current_chunk_text:
+                                            response_parts.append(current_chunk_text)
+                                elif msg_type == 'process_completed' or msg_type == 'close_stream':
+                                    if msg_type == 'process_completed':
+                                        output_field = json_data.get('output', {})
+                                        data_field = output_field.get('data')
+                                        if data_field and isinstance(data_field, list) and len(data_field) > 0:
+                                            inner_data = data_field[0]
+                                            if isinstance(inner_data, list) and len(inner_data) > 0 and \
+                                               isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and \
+                                               isinstance(inner_data[0][1], str):
+                                                final_full_response = inner_data[0][1]
+                                                if final_full_response != last_full_response_chunk_ns:
+                                                    if final_full_response.startswith(last_full_response_chunk_ns):
+                                                        response_parts.append(final_full_response[len(last_full_response_chunk_ns):])
+                                                    else:
+                                                        response_parts = [final_full_response]
+                                                    last_full_response_chunk_ns = final_full_response
+                                    found_completion_message = True
+                                    break
+                            except json.JSONDecodeError:
+                                continue
+                            except Exception as e:
+                                raise e
+                if found_completion_message:
+                    break
+            full_response_content = "".join(response_parts)
+            message = ChatCompletionMessage(role="assistant", content=full_response_content)
+            choice = Choice(index=0, message=message, finish_reason="stop")
+
+            # Simplified token counting without history iteration
+            chat_history = payload['data'][0]
+            prompt = chat_history[0][0] if chat_history and chat_history[0] and chat_history[0][0] else ""
+            prompt_tokens = count_tokens(prompt)
+            completion_tokens = count_tokens(full_response_content)
+            usage = CompletionUsage(
+                prompt_tokens=prompt_tokens,
+                completion_tokens=completion_tokens,
+                total_tokens=prompt_tokens + completion_tokens
+            )
+            return ChatCompletion(
+                id=request_id, choices=[choice], created=created_time,
+                model=model, usage=usage
+            )
+        finally:
+            self._client.session.proxies = original_proxies
+
+class Chat(BaseChat):
+    """
+    Provides a chat interface for the FalconH1 provider, exposing the completions API.
+
+    Attributes:
+        completions (Completions): The completions handler for chat requests.
+    """
+    def __init__(self, client):
+        """
+        Initializes the Chat interface for FalconH1.
+
+        Args:
+            client: The FalconH1 client instance.
+        """
+        self.completions = Completions(client)
+
+class FalconH1(OpenAICompatibleProvider):
+    """
+    FalconH1 provider implementation compatible with the OpenAI API interface.
+    Handles chat completions using FalconH1 models via the Hugging Face Spaces API.
+
+    Attributes:
+        base_url (str): Base URL for the FalconH1 API.
+        api_join_endpoint (str): Endpoint for joining the chat queue.
+        api_data_endpoint (str): Endpoint for retrieving chat data.
+        AVAILABLE_MODELS (List[str]): List of supported FalconH1 model identifiers.
+        timeout (int): Default request timeout in seconds.
+        session (requests.Session): HTTP session for API requests.
+        headers (dict): Default HTTP headers for requests.
+        stream_headers (dict): HTTP headers for streaming requests.
+        chat (Chat): Chat interface for completions.
+    """
+    base_url = "https://tiiuae-falcon-h1-playground.hf.space"
+    api_join_endpoint = f"{base_url}/gradio_api/queue/join?__theme=dark"
+    api_data_endpoint = f"{base_url}/gradio_api/queue/data"
+    AVAILABLE_MODELS = [
+        "Falcon-H1-34B-Instruct",
+        "Falcon-H1-7B-Instruct",
+        "Falcon-H1-3B-Instruct",
+        "Falcon-H1-1.5B-Deep-Instruct",
+        "Falcon-H1-1.5B-Instruct",
+        "Falcon-H1-0.5B-Instruct",
+    ]
+    def __init__(self, timeout: int = 120, proxies: Optional[dict] = None):
+        """
+        Initializes the FalconH1 provider with optional timeout and proxy settings.
+
+        Args:
+            timeout (int): Default request timeout in seconds (default: 120).
+            proxies (Optional[dict]): Optional proxy settings for HTTP requests.
+        """
+        self.timeout = timeout
+        self.session = requests.Session()
+        if proxies:
+            self.session.proxies = proxies
+        else:
+            self.session.proxies = {}
+        self.headers = {
+            'User-Agent': LitAgent().random(),
+            'Accept': '*/*',
+            'Accept-Language': 'en-US,en;q=0.9,en-IN;q=0.8',
+            'Accept-Encoding': 'gzip, deflate, br, zstd',
+            'Referer': f'{self.base_url}/?__theme=dark',
+            'Content-Type': 'application/json',
+            'Origin': self.base_url,
+            'Connection': 'keep-alive',
+            'Sec-Fetch-Dest': 'empty',
+            'Sec-Fetch-Mode': 'cors',
+            'Sec-Fetch-Site': 'same-origin',
+            'DNT': '1',
+            'Sec-GPC': '1',
+        }
+        self.stream_headers = {
+            'Accept': 'text/event-stream',
+            'Accept-Language': self.headers['Accept-Language'],
+            'Referer': self.headers['Referer'],
+            'User-Agent': self.headers['User-Agent'],
+            'Connection': 'keep-alive',
+            'Cache-Control': 'no-cache',
+        }
+        self.session.headers.update(self.headers)
+        self.chat = Chat(self)
+    def get_model(self, model_identifier: str) -> str:
+        """
+        Returns the resolved model name for the given identifier.
+
+        Args:
+            model_identifier (str): The model identifier string.
+
+        Returns:
+            str: The resolved model name (currently returns the identifier as-is).
+        """
+        return model_identifier
+    @property
+    def models(self):
+        """
+        Returns a list-like object containing available FalconH1 models.
+
+        Returns:
+            ModelList: An object with a .list() method returning model data objects.
+        """
+        class ModelData:
+            def __init__(self, id_str):
+                self.id = id_str
+        class ModelList:
+            def __init__(self, models_available):
+                self.data = [ModelData(m) for m in models_available]
+            def list(self):
+                return self.data
+        return ModelList(self.AVAILABLE_MODELS)
+
+if __name__ == "__main__":
+    """
+    Example usage of the FalconH1 provider for both non-streaming and streaming chat completions.
+    """
+    print("FalconH1 Provider Example")
+    client = FalconH1()
+    print("\n--- Non-Streaming Example ---")
+    try:
+        response = client.chat.completions.create(
+            model="Falcon-H1-34B-Instruct",
+            messages=[
+                {"role": "system", "content": "You are a helpful AI assistant named Falcon."},
+                {"role": "user", "content": "Hello, what is your name and what can you do?"}
+            ]
+        )
+        print(f"ID: {response.id}")
+        print(f"Model: {response.model}")
+        if response.choices:
+            print(f"Response: {response.choices[0].message.content}")
+        if response.usage:
+            print(f"Usage: {response.usage}")
+    except Exception as e:
+        print(f"Error in non-streaming example: {e}")
+    print("\n--- Streaming Example ---")
+    try:
+        stream_response = client.chat.completions.create(
+            model="Falcon-H1-34B-Instruct",
+            messages=[
+                {"role": "user", "content": "Tell me a short story about a brave falcon."}
+            ],
+            stream=True,
+            max_tokens=150
+        )
+        print("Streaming response:")
+        full_streamed_content = ""
+        for chunk in stream_response:
+            if chunk.choices and chunk.choices[0].delta and chunk.choices[0].delta.content:
+                content_piece = chunk.choices[0].delta.content
+                print(content_piece, end="", flush=True)
+                full_streamed_content += content_piece
+        print("\n--- End of Stream ---")
+    except Exception as e:
+        print(f"Error in streaming example: {e}")
+
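The module's __main__ block already demonstrates basic and streaming completions. A short complementary sketch, assuming the import path from the file list above, that exercises the models property and the per-request timeout/proxies overrides defined in this file (the proxy URL is a placeholder):

# Hedged sketch: the proxy URL is a placeholder, not a value from the diff.
from webscout.Provider.OPENAI.FalconH1 import FalconH1

client = FalconH1(timeout=120)

# Enumerate the models exposed by the `models` property.
for m in client.models.list():
    print(m.id)

# Per-request overrides: timeout and proxies apply to this call only;
# the session's original proxies are restored in the provider's finally block.
reply = client.chat.completions.create(
    model="Falcon-H1-0.5B-Instruct",
    messages=[{"role": "user", "content": "Summarize Falcon-H1 in one sentence."}],
    timeout=90,
    proxies={"https": "http://127.0.0.1:8080"},
)
print(reply.choices[0].message.content)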