webscout 2025.10.19.2__py3-none-any.whl → 2025.10.22.1__py3-none-any.whl

This diff compares the contents of two publicly released versions of the package, as published to a supported public registry. It is provided for informational purposes only.

Potentially problematic release: this version of webscout might be problematic.

@@ -1,452 +0,0 @@
- import requests
- import json
- import time
- import uuid
- from typing import List, Dict, Optional, Union, Generator, Any
-
- from webscout.Provider.OPENAI.base import OpenAICompatibleProvider, BaseChat, BaseCompletions
- from webscout.Provider.OPENAI.utils import (
-     ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
-     ChatCompletionMessage, CompletionUsage,
-     get_system_prompt,
-     count_tokens,
-     format_prompt
- )
- from webscout.litagent import LitAgent
-
- def convert_openai_to_falcon_history(messages: List[Dict[str, str]]) -> list:
-     """
-     Converts a list of OpenAI-style chat messages to Falcon/Gradio chat history format.
-
-     Args:
-         messages (List[Dict[str, str]]):
-             A list of message dictionaries, each with 'role' and 'content' keys, following the OpenAI API format.
-
-     Returns:
-         list: A single-turn Falcon/Gradio chat history in the format [[prompt, None]].
-     """
-     prompt = format_prompt(messages, add_special_tokens=False, do_continue=True, include_system=True)
-     return [[prompt, None]]
-
- class Completions(BaseCompletions):
-     """
-     Handles text completion requests for the FalconH1 provider, supporting both streaming and non-streaming modes.
-
-     Attributes:
-         _client (Any): Reference to the FalconH1 client instance.
-         _last_yielded_content_stream (str): Tracks the last yielded content in streaming mode.
-     """
-     def __init__(self, client):
-         """
-         Initializes the Completions handler.
-
-         Args:
-             client: The FalconH1 client instance.
-         """
-         self._client = client
-         self._last_yielded_content_stream = ""
-
-     def create(
-         self,
-         *,
-         model: str,
-         messages: List[Dict[str, str]],
-         max_tokens: Optional[int] = 1024,
-         stream: bool = False,
-         temperature: Optional[float] = 0.1,
-         top_p: Optional[float] = 1.0,
-         timeout: Optional[int] = None,
-         proxies: Optional[dict] = None,
-         **kwargs: Any
-     ) -> Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]:
-         """
-         Creates a chat completion using the FalconH1 API, supporting both streaming and non-streaming responses.
-
-         Args:
-             model (str): The model identifier to use for completion.
-             messages (List[Dict[str, str]]): List of chat messages in OpenAI format.
-             max_tokens (Optional[int]): Maximum number of tokens to generate in the completion.
-             stream (bool): Whether to stream the response as chunks.
-             temperature (Optional[float]): Sampling temperature.
-             top_p (Optional[float]): Nucleus sampling probability.
-             timeout (Optional[int]): Request timeout in seconds.
-             proxies (Optional[dict]): Optional proxy settings for the request.
-             **kwargs: Additional keyword arguments for advanced options (e.g., top_k, repetition_penalty).
-
-         Returns:
-             Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]: The chat completion result or a generator yielding streamed chunks.
-         """
-         session_hash = str(uuid.uuid4()).replace('-', '')
-         chat_history = convert_openai_to_falcon_history(messages)
-         if not chat_history or chat_history[-1][0] is None:
-             raise ValueError("Messages must contain at least one user message for Falcon API.")
-         resolved_model_name = self._client.get_model(model)
-         payload_data = [
-             chat_history,
-             resolved_model_name,
-             temperature,
-             max_tokens,
-             top_p,
-             kwargs.get("top_k", 20),
-             kwargs.get("repetition_penalty", 1.2)
-         ]
-         payload = {
-             "data": payload_data,
-             "event_data": None,
-             "fn_index": 5,
-             "trigger_id": 12,
-             "session_hash": session_hash
-         }
-         request_id = f"chatcmpl-{uuid.uuid4()}"
-         created_time = int(time.time())
-         if stream:
-             self._last_yielded_content_stream = ""
-             return self._create_stream(request_id, created_time, resolved_model_name, payload, session_hash, timeout=timeout, proxies=proxies)
-         else:
-             return self._create_non_stream(request_id, created_time, resolved_model_name, payload, session_hash, timeout=timeout, proxies=proxies)
-
-     def _create_stream(
-         self, request_id: str, created_time: int, model: str, payload: Dict[str, Any], session_hash: str,
-         timeout: Optional[int] = None, proxies: Optional[dict] = None
-     ) -> Generator[ChatCompletionChunk, None, None]:
-         """
-         Internal method to handle streaming chat completions from the FalconH1 API.
-
-         Args:
-             request_id (str): Unique request identifier.
-             created_time (int): Timestamp of request creation.
-             model (str): Model identifier.
-             payload (Dict[str, Any]): Request payload for the API.
-             session_hash (str): Unique session hash for the request.
-             timeout (Optional[int]): Request timeout in seconds.
-             proxies (Optional[dict]): Optional proxy settings.
-
-         Yields:
-             ChatCompletionChunk: Chunks of the chat completion as they are received from the API.
-         """
-         original_proxies = self._client.session.proxies.copy()
-         if proxies is not None:
-             self._client.session.proxies = proxies
-         else:
-             self._client.session.proxies = {}
-         try:
-             session = self._client.session
-             join_resp = session.post(
-                 self._client.api_join_endpoint,
-                 headers=self._client.headers,
-                 json=payload,
-                 timeout=timeout if timeout is not None else self._client.timeout
-             )
-             join_resp.raise_for_status()
-             data_url = f"{self._client.api_data_endpoint}?session_hash={session_hash}"
-             stream_resp = session.get(
-                 data_url,
-                 headers=self._client.stream_headers,
-                 stream=True,
-                 timeout=timeout if timeout is not None else self._client.timeout
-             )
-             stream_resp.raise_for_status()
-             for line in stream_resp.iter_lines():
-                 if line:
-                     decoded_line = line.decode('utf-8')
-                     if decoded_line.startswith('data: '):
-                         try:
-                             json_data = json.loads(decoded_line[6:])
-                             msg_type = json_data.get('msg')
-                             if msg_type == 'process_generating':
-                                 output_field = json_data.get('output', {})
-                                 data_field = output_field.get('data')
-                                 if data_field and isinstance(data_field, list) and len(data_field) > 0:
-                                     inner_data = data_field[0]
-                                     content_to_yield = None
-                                     if isinstance(inner_data, list) and len(inner_data) > 0:
-                                         if isinstance(inner_data[0], list) and len(inner_data[0]) == 3 and inner_data[0][0] == "append":
-                                             content_to_yield = inner_data[0][2]
-                                         elif isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and \
-                                                 isinstance(inner_data[0][1], str):
-                                             current_full_response = inner_data[0][1]
-                                             if current_full_response.startswith(self._last_yielded_content_stream):
-                                                 content_to_yield = current_full_response[len(self._last_yielded_content_stream):]
-                                             else:
-                                                 content_to_yield = current_full_response
-                                             self._last_yielded_content_stream = current_full_response
-                                     if content_to_yield:
-                                         delta = ChoiceDelta(content=content_to_yield, role="assistant")
-                                         yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
-                             elif msg_type == 'process_completed' or msg_type == 'close_stream':
-                                 break
-                         except json.JSONDecodeError:
-                             continue
-                         except Exception as e:
-                             continue
-         finally:
-             self._client.session.proxies = original_proxies
-
-     def _create_non_stream(
-         self, request_id: str, created_time: int, model: str, payload: Dict[str, Any], session_hash: str,
-         timeout: Optional[int] = None, proxies: Optional[dict] = None
-     ) -> ChatCompletion:
-         """
-         Internal method to handle non-streaming chat completions from the FalconH1 API.
-
-         Args:
-             request_id (str): Unique request identifier.
-             created_time (int): Timestamp of request creation.
-             model (str): Model identifier.
-             payload (Dict[str, Any]): Request payload for the API.
-             session_hash (str): Unique session hash for the request.
-             timeout (Optional[int]): Request timeout in seconds.
-             proxies (Optional[dict]): Optional proxy settings.
-
-         Returns:
-             ChatCompletion: The full chat completion result.
-         """
-         original_proxies = self._client.session.proxies.copy()
-         if proxies is not None:
-             self._client.session.proxies = proxies
-         else:
-             self._client.session.proxies = {}
-         full_response_content = ""
-         last_full_response_chunk_ns = ""
-         response_parts = []
-         try:
-             session = self._client.session
-             join_resp = session.post(
-                 self._client.api_join_endpoint, headers=self._client.headers, json=payload,
-                 timeout=timeout if timeout is not None else self._client.timeout
-             )
-             join_resp.raise_for_status()
-             data_url = f"{self._client.api_data_endpoint}?session_hash={session_hash}"
-             overall_start_time = time.time()
-             effective_timeout = timeout if timeout is not None else self._client.timeout
-             while True:
-                 if time.time() - overall_start_time > effective_timeout:
-                     raise TimeoutError("Timeout waiting for non-stream response completion.")
-                 stream_resp = session.get(
-                     data_url, headers=self._client.stream_headers, stream=True,
-                     timeout=effective_timeout
-                 )
-                 stream_resp.raise_for_status()
-                 found_completion_message = False
-                 for line in stream_resp.iter_lines():
-                     if time.time() - overall_start_time > effective_timeout:
-                         raise TimeoutError("Timeout during non-stream response processing.")
-                     if line:
-                         decoded_line = line.decode('utf-8')
-                         if decoded_line.startswith('data: '):
-                             try:
-                                 json_data = json.loads(decoded_line[6:])
-                                 msg_type = json_data.get('msg')
-                                 if msg_type == 'process_generating':
-                                     output_field = json_data.get('output', {})
-                                     data_field = output_field.get('data')
-                                     if data_field and isinstance(data_field, list) and len(data_field) > 0:
-                                         inner_data = data_field[0]
-                                         current_chunk_text = None
-                                         if isinstance(inner_data, list) and len(inner_data) > 0:
-                                             if isinstance(inner_data[0], list) and len(inner_data[0]) == 3 and inner_data[0][0] == "append":
-                                                 current_chunk_text = inner_data[0][2]
-                                             elif isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and isinstance(inner_data[0][1], str):
-                                                 current_full_response = inner_data[0][1]
-                                                 if current_full_response.startswith(last_full_response_chunk_ns):
-                                                     current_chunk_text = current_full_response[len(last_full_response_chunk_ns):]
-                                                 else:
-                                                     current_chunk_text = current_full_response
-                                                 last_full_response_chunk_ns = current_full_response
-                                         if current_chunk_text:
-                                             response_parts.append(current_chunk_text)
-                                 elif msg_type == 'process_completed' or msg_type == 'close_stream':
-                                     if msg_type == 'process_completed':
-                                         output_field = json_data.get('output', {})
-                                         data_field = output_field.get('data')
-                                         if data_field and isinstance(data_field, list) and len(data_field) > 0:
-                                             inner_data = data_field[0]
-                                             if isinstance(inner_data, list) and len(inner_data) > 0 and \
-                                                     isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and \
-                                                     isinstance(inner_data[0][1], str):
-                                                 final_full_response = inner_data[0][1]
-                                                 if final_full_response != last_full_response_chunk_ns:
-                                                     if final_full_response.startswith(last_full_response_chunk_ns):
-                                                         response_parts.append(final_full_response[len(last_full_response_chunk_ns):])
-                                                     else:
-                                                         response_parts = [final_full_response]
-                                                     last_full_response_chunk_ns = final_full_response
-                                     found_completion_message = True
-                                     break
-                             except json.JSONDecodeError:
-                                 continue
-                             except Exception as e:
-                                 raise e
-                 if found_completion_message:
-                     break
-             full_response_content = "".join(response_parts)
-             message = ChatCompletionMessage(role="assistant", content=full_response_content)
-             choice = Choice(index=0, message=message, finish_reason="stop")
-
-             # Simplified token counting without history iteration
-             chat_history = payload['data'][0]
-             prompt = chat_history[0][0] if chat_history and chat_history[0] and chat_history[0][0] else ""
-             prompt_tokens = count_tokens(prompt)
-             completion_tokens = count_tokens(full_response_content)
-             usage = CompletionUsage(
-                 prompt_tokens=prompt_tokens,
-                 completion_tokens=completion_tokens,
-                 total_tokens=prompt_tokens + completion_tokens
-             )
-             return ChatCompletion(
-                 id=request_id, choices=[choice], created=created_time,
-                 model=model, usage=usage
-             )
-         finally:
-             self._client.session.proxies = original_proxies
-
- class Chat(BaseChat):
-     """
-     Provides a chat interface for the FalconH1 provider, exposing the completions API.
-
-     Attributes:
-         completions (Completions): The completions handler for chat requests.
-     """
-     def __init__(self, client):
-         """
-         Initializes the Chat interface for FalconH1.
-
-         Args:
-             client: The FalconH1 client instance.
-         """
-         self.completions = Completions(client)
-
- class FalconH1(OpenAICompatibleProvider):
-     """
-     FalconH1 provider implementation compatible with the OpenAI API interface.
-     Handles chat completions using FalconH1 models via the Hugging Face Spaces API.
-
-     Attributes:
-         base_url (str): Base URL for the FalconH1 API.
-         api_join_endpoint (str): Endpoint for joining the chat queue.
-         api_data_endpoint (str): Endpoint for retrieving chat data.
-         AVAILABLE_MODELS (List[str]): List of supported FalconH1 model identifiers.
-         timeout (int): Default request timeout in seconds.
-         session (requests.Session): HTTP session for API requests.
-         headers (dict): Default HTTP headers for requests.
-         stream_headers (dict): HTTP headers for streaming requests.
-         chat (Chat): Chat interface for completions.
-     """
-     base_url = "https://tiiuae-falcon-h1-playground.hf.space"
-     api_join_endpoint = f"{base_url}/gradio_api/queue/join?__theme=dark"
-     api_data_endpoint = f"{base_url}/gradio_api/queue/data"
-     AVAILABLE_MODELS = [
-         "Falcon-H1-34B-Instruct",
-         "Falcon-H1-7B-Instruct",
-         "Falcon-H1-3B-Instruct",
-         "Falcon-H1-1.5B-Deep-Instruct",
-         "Falcon-H1-1.5B-Instruct",
-         "Falcon-H1-0.5B-Instruct",
-     ]
-     def __init__(self, timeout: int = 120, proxies: Optional[dict] = None):
-         """
-         Initializes the FalconH1 provider with optional timeout and proxy settings.
-
-         Args:
-             timeout (int): Default request timeout in seconds (default: 120).
-             proxies (Optional[dict]): Optional proxy settings for HTTP requests.
-         """
-         super().__init__(proxies=proxies)
-         self.timeout = timeout
-         self.headers = {
-             'User-Agent': LitAgent().random(),
-             'Accept': '*/*',
-             'Accept-Language': 'en-US,en;q=0.9,en-IN;q=0.8',
-             'Accept-Encoding': 'gzip, deflate, br, zstd',
-             'Referer': f'{self.base_url}/?__theme=dark',
-             'Content-Type': 'application/json',
-             'Origin': self.base_url,
-             'Connection': 'keep-alive',
-             'Sec-Fetch-Dest': 'empty',
-             'Sec-Fetch-Mode': 'cors',
-             'Sec-Fetch-Site': 'same-origin',
-             'DNT': '1',
-             'Sec-GPC': '1',
-         }
-         self.stream_headers = {
-             'Accept': 'text/event-stream',
-             'Accept-Language': self.headers['Accept-Language'],
-             'Referer': self.headers['Referer'],
-             'User-Agent': self.headers['User-Agent'],
-             'Connection': 'keep-alive',
-             'Cache-Control': 'no-cache',
-         }
-         self.session.headers.update(self.headers)
-         self.chat = Chat(self)
-     def get_model(self, model_identifier: str) -> str:
-         """
-         Returns the resolved model name for the given identifier.
-
-         Args:
-             model_identifier (str): The model identifier string.
-
-         Returns:
-             str: The resolved model name (currently returns the identifier as-is).
-         """
-         return model_identifier
-     @property
-     def models(self):
-         """
-         Returns a list-like object containing available FalconH1 models.
-
-         Returns:
-             ModelList: An object with a .list() method returning model data objects.
-         """
-         class ModelData:
-             def __init__(self, id_str):
-                 self.id = id_str
-         class ModelList:
-             def __init__(self, models_available):
-                 self.data = [ModelData(m) for m in models_available]
-             def list(self):
-                 return self.data
-         return ModelList(self.AVAILABLE_MODELS)
-
- if __name__ == "__main__":
-     """
-     Example usage of the FalconH1 provider for both non-streaming and streaming chat completions.
-     """
-     print("FalconH1 Provider Example")
-     client = FalconH1()
-     print("\n--- Non-Streaming Example ---")
-     try:
-         response = client.chat.completions.create(
-             model="Falcon-H1-34B-Instruct",
-             messages=[
-                 {"role": "system", "content": "You are a helpful AI assistant named Falcon."},
-                 {"role": "user", "content": "Hello, what is your name and what can you do?"}
-             ]
-         )
-         print(f"ID: {response.id}")
-         print(f"Model: {response.model}")
-         if response.choices:
-             print(f"Response: {response.choices[0].message.content}")
-         if response.usage:
-             print(f"Usage: {response.usage}")
-     except Exception as e:
-         print(f"Error in non-streaming example: {e}")
-     print("\n--- Streaming Example ---")
-     try:
-         stream_response = client.chat.completions.create(
-             model="Falcon-H1-34B-Instruct",
-             messages=[
-                 {"role": "user", "content": "Tell me a short story about a brave falcon."}
-             ],
-             stream=True,
-             max_tokens=150
-         )
-         print("Streaming response:")
-         full_streamed_content = ""
-         for chunk in stream_response:
-             if chunk.choices and chunk.choices[0].delta and chunk.choices[0].delta.content:
-                 content_piece = chunk.choices[0].delta.content
-                 print(content_piece, end="", flush=True)
-                 full_streamed_content += content_piece
-         print("\n--- End of Stream ---")
-     except Exception as e:
-         print(f"Error in streaming example: {e}")