webscout 8.2.9__py3-none-any.whl → 8.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of webscout might be problematic.

Files changed (63)
  1. webscout/AIauto.py +2 -2
  2. webscout/Provider/Blackboxai.py +2 -0
  3. webscout/Provider/ChatSandbox.py +2 -1
  4. webscout/Provider/Deepinfra.py +1 -1
  5. webscout/Provider/HeckAI.py +1 -1
  6. webscout/Provider/LambdaChat.py +1 -0
  7. webscout/Provider/MCPCore.py +7 -3
  8. webscout/Provider/OPENAI/BLACKBOXAI.py +1017 -766
  9. webscout/Provider/OPENAI/Cloudflare.py +31 -14
  10. webscout/Provider/OPENAI/FalconH1.py +457 -0
  11. webscout/Provider/OPENAI/FreeGemini.py +29 -13
  12. webscout/Provider/OPENAI/NEMOTRON.py +26 -14
  13. webscout/Provider/OPENAI/PI.py +427 -0
  14. webscout/Provider/OPENAI/Qwen3.py +303 -282
  15. webscout/Provider/OPENAI/TwoAI.py +29 -12
  16. webscout/Provider/OPENAI/__init__.py +3 -1
  17. webscout/Provider/OPENAI/ai4chat.py +33 -23
  18. webscout/Provider/OPENAI/api.py +78 -12
  19. webscout/Provider/OPENAI/base.py +2 -0
  20. webscout/Provider/OPENAI/c4ai.py +31 -10
  21. webscout/Provider/OPENAI/chatgpt.py +41 -22
  22. webscout/Provider/OPENAI/chatgptclone.py +32 -13
  23. webscout/Provider/OPENAI/chatsandbox.py +7 -3
  24. webscout/Provider/OPENAI/copilot.py +26 -10
  25. webscout/Provider/OPENAI/deepinfra.py +327 -321
  26. webscout/Provider/OPENAI/e2b.py +77 -99
  27. webscout/Provider/OPENAI/exaai.py +13 -10
  28. webscout/Provider/OPENAI/exachat.py +10 -6
  29. webscout/Provider/OPENAI/flowith.py +7 -3
  30. webscout/Provider/OPENAI/freeaichat.py +10 -6
  31. webscout/Provider/OPENAI/glider.py +10 -6
  32. webscout/Provider/OPENAI/heckai.py +11 -8
  33. webscout/Provider/OPENAI/llmchatco.py +9 -7
  34. webscout/Provider/OPENAI/mcpcore.py +10 -7
  35. webscout/Provider/OPENAI/multichat.py +3 -1
  36. webscout/Provider/OPENAI/netwrck.py +10 -6
  37. webscout/Provider/OPENAI/oivscode.py +12 -9
  38. webscout/Provider/OPENAI/opkfc.py +14 -3
  39. webscout/Provider/OPENAI/scirachat.py +14 -8
  40. webscout/Provider/OPENAI/sonus.py +10 -6
  41. webscout/Provider/OPENAI/standardinput.py +18 -9
  42. webscout/Provider/OPENAI/textpollinations.py +14 -7
  43. webscout/Provider/OPENAI/toolbaz.py +16 -10
  44. webscout/Provider/OPENAI/typefully.py +14 -7
  45. webscout/Provider/OPENAI/typegpt.py +10 -6
  46. webscout/Provider/OPENAI/uncovrAI.py +22 -8
  47. webscout/Provider/OPENAI/venice.py +10 -6
  48. webscout/Provider/OPENAI/writecream.py +166 -163
  49. webscout/Provider/OPENAI/x0gpt.py +367 -365
  50. webscout/Provider/OPENAI/yep.py +384 -382
  51. webscout/Provider/PI.py +2 -1
  52. webscout/Provider/__init__.py +0 -2
  53. webscout/Provider/granite.py +41 -6
  54. webscout/Provider/oivscode.py +37 -37
  55. webscout/Provider/scnet.py +1 -0
  56. webscout/version.py +1 -1
  57. {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/METADATA +2 -1
  58. {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/RECORD +62 -61
  59. {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/WHEEL +1 -1
  60. webscout/Provider/ChatGPTGratis.py +0 -194
  61. {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/entry_points.txt +0 -0
  62. {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/licenses/LICENSE.md +0 -0
  63. {webscout-8.2.9.dist-info → webscout-8.3.dist-info}/top_level.txt +0 -0
webscout/Provider/OPENAI/Cloudflare.py

@@ -31,6 +31,8 @@ class Completions(BaseCompletions):
         stream: bool = False,
         temperature: Optional[float] = None,
         top_p: Optional[float] = None,
+        timeout: Optional[int] = None,
+        proxies: Optional[dict] = None,
         **kwargs: Any
     ) -> Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]:
         """
@@ -68,7 +70,9 @@ class Completions(BaseCompletions):
                 request_id=request_id,
                 created_time=created_time,
                 model=model,
-                payload=payload
+                payload=payload,
+                timeout=timeout,
+                proxies=proxies
             )
 
         # Otherwise use non-streaming implementation
@@ -76,7 +80,9 @@ class Completions(BaseCompletions):
             request_id=request_id,
             created_time=created_time,
             model=model,
-            payload=payload
+            payload=payload,
+            timeout=timeout,
+            proxies=proxies
         )
 
     def _create_streaming(
@@ -85,9 +91,14 @@
         request_id: str,
         created_time: int,
         model: str,
-        payload: Dict[str, Any]
+        payload: Dict[str, Any],
+        timeout: Optional[int] = None,
+        proxies: Optional[dict] = None
     ) -> Generator[ChatCompletionChunk, None, None]:
         """Implementation for streaming chat completions."""
+        original_proxies = self._client.session.proxies
+        if proxies is not None:
+            self._client.session.proxies = proxies
         try:
             response = self._client.session.post(
                 self._client.chat_endpoint,
@@ -95,7 +106,7 @@
                 cookies=self._client.cookies,
                 data=json.dumps(payload),
                 stream=True,
-                timeout=self._client.timeout,
+                timeout=timeout if timeout is not None else self._client.timeout,
                 impersonate="chrome120"
             )
             response.raise_for_status()
@@ -152,6 +163,9 @@
             raise IOError(f"Cloudflare streaming request failed (CurlError): {e}") from e
         except Exception as e:
             raise IOError(f"Cloudflare streaming request failed: {e}") from e
+        finally:
+            if proxies is not None:
+                self._client.session.proxies = original_proxies
 
     def _create_non_streaming(
         self,
@@ -159,9 +173,14 @@
         request_id: str,
         created_time: int,
         model: str,
-        payload: Dict[str, Any]
+        payload: Dict[str, Any],
+        timeout: Optional[int] = None,
+        proxies: Optional[dict] = None
    ) -> ChatCompletion:
         """Implementation for non-streaming chat completions."""
+        original_proxies = self._client.session.proxies
+        if proxies is not None:
+            self._client.session.proxies = proxies
         try:
             response = self._client.session.post(
                 self._client.chat_endpoint,
@@ -169,7 +188,7 @@
                 cookies=self._client.cookies,
                 data=json.dumps(payload),
                 stream=True, # Still use streaming API but collect all chunks
-                timeout=self._client.timeout,
+                timeout=timeout if timeout is not None else self._client.timeout,
                 impersonate="chrome120"
             )
             response.raise_for_status()
@@ -226,6 +245,9 @@
             raise IOError(f"Cloudflare request failed (CurlError): {e}") from e
         except Exception as e:
             raise IOError(f"Cloudflare request failed: {e}") from e
+        finally:
+            if proxies is not None:
+                self._client.session.proxies = original_proxies
 
     @staticmethod
     def _cloudflare_extractor(chunk: Union[str, Dict[str, Any]]) -> Optional[str]:
@@ -315,23 +337,19 @@ class Cloudflare(OpenAICompatibleProvider):
     def __init__(
         self,
         api_key: Optional[str] = None, # Not used but included for compatibility
-        timeout: int = 30,
-        proxies: dict = {},
     ):
         """
         Initialize the Cloudflare client.
 
         Args:
             api_key: Not used but included for compatibility with OpenAI interface
-            timeout: Request timeout in seconds
-            proxies: Optional proxy configuration
         """
-        self.timeout = timeout
-        self.proxies = proxies
+        self.timeout = 30
         self.chat_endpoint = "https://playground.ai.cloudflare.com/api/inference"
 
         # Initialize session
         self.session = Session()
+        self.session.proxies = {}
 
         # Set headers
        self.headers = {
@@ -358,9 +376,8 @@
             '__cf_bm': uuid4().hex,
         }
 
-        # Apply headers and proxies to session
+        # Apply headers to session
         self.session.headers.update(self.headers)
-        self.session.proxies = proxies
 
         # Initialize chat interface
         self.chat = Chat(self)
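
Note: the hunks above move the Cloudflare provider's timeout and proxies from constructor arguments to per-request overrides on create(), with a fixed 30-second client default. A minimal usage sketch follows; it is not taken from the package, and the import path, model id, proxy URL and timeout value are illustrative assumptions.

    # Hedged sketch of the new per-request overrides (all values are placeholders).
    from webscout.Provider.OPENAI.Cloudflare import Cloudflare  # assumed import path

    client = Cloudflare()  # client-level timeout is now fixed at 30s
    response = client.chat.completions.create(
        model="@cf/meta/llama-3.1-8b-instruct",            # illustrative model id
        messages=[{"role": "user", "content": "Hello!"}],
        timeout=60,                                        # per-request override of the 30s default
        proxies={"https": "http://127.0.0.1:8080"},        # applied for this request, then restored
    )
    print(response.choices[0].message.content)
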
webscout/Provider/OPENAI/FalconH1.py (new file)

@@ -0,0 +1,457 @@
+import requests
+import json
+import time
+import uuid
+from typing import List, Dict, Optional, Union, Generator, Any
+
+from webscout.Provider.OPENAI.base import OpenAICompatibleProvider, BaseChat, BaseCompletions
+from webscout.Provider.OPENAI.utils import (
+    ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
+    ChatCompletionMessage, CompletionUsage,
+    get_system_prompt,
+    count_tokens,
+    format_prompt
+)
+from webscout.litagent import LitAgent
+
+def convert_openai_to_falcon_history(messages: List[Dict[str, str]]) -> list:
+    """
+    Converts a list of OpenAI-style chat messages to Falcon/Gradio chat history format.
+
+    Args:
+        messages (List[Dict[str, str]]):
+            A list of message dictionaries, each with 'role' and 'content' keys, following the OpenAI API format.
+
+    Returns:
+        list: A single-turn Falcon/Gradio chat history in the format [[prompt, None]].
+    """
+    prompt = format_prompt(messages, add_special_tokens=False, do_continue=True, include_system=True)
+    return [[prompt, None]]
+
+class Completions(BaseCompletions):
+    """
+    Handles text completion requests for the FalconH1 provider, supporting both streaming and non-streaming modes.
+
+    Attributes:
+        _client (Any): Reference to the FalconH1 client instance.
+        _last_yielded_content_stream (str): Tracks the last yielded content in streaming mode.
+    """
+    def __init__(self, client):
+        """
+        Initializes the Completions handler.
+
+        Args:
+            client: The FalconH1 client instance.
+        """
+        self._client = client
+        self._last_yielded_content_stream = ""
+
+    def create(
+        self,
+        *,
+        model: str,
+        messages: List[Dict[str, str]],
+        max_tokens: Optional[int] = 1024,
+        stream: bool = False,
+        temperature: Optional[float] = 0.1,
+        top_p: Optional[float] = 1.0,
+        timeout: Optional[int] = None,
+        proxies: Optional[dict] = None,
+        **kwargs: Any
+    ) -> Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]:
+        """
+        Creates a chat completion using the FalconH1 API, supporting both streaming and non-streaming responses.
+
+        Args:
+            model (str): The model identifier to use for completion.
+            messages (List[Dict[str, str]]): List of chat messages in OpenAI format.
+            max_tokens (Optional[int]): Maximum number of tokens to generate in the completion.
+            stream (bool): Whether to stream the response as chunks.
+            temperature (Optional[float]): Sampling temperature.
+            top_p (Optional[float]): Nucleus sampling probability.
+            timeout (Optional[int]): Request timeout in seconds.
+            proxies (Optional[dict]): Optional proxy settings for the request.
+            **kwargs: Additional keyword arguments for advanced options (e.g., top_k, repetition_penalty).
+
+        Returns:
+            Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]: The chat completion result or a generator yielding streamed chunks.
+        """
+        session_hash = str(uuid.uuid4()).replace('-', '')
+        chat_history = convert_openai_to_falcon_history(messages)
+        if not chat_history or chat_history[-1][0] is None:
+            raise ValueError("Messages must contain at least one user message for Falcon API.")
+        resolved_model_name = self._client.get_model(model)
+        payload_data = [
+            chat_history,
+            resolved_model_name,
+            temperature,
+            max_tokens,
+            top_p,
+            kwargs.get("top_k", 20),
+            kwargs.get("repetition_penalty", 1.2)
+        ]
+        payload = {
+            "data": payload_data,
+            "event_data": None,
+            "fn_index": 5,
+            "trigger_id": 12,
+            "session_hash": session_hash
+        }
+        request_id = f"chatcmpl-{uuid.uuid4()}"
+        created_time = int(time.time())
+        if stream:
+            self._last_yielded_content_stream = ""
+            return self._create_stream(request_id, created_time, resolved_model_name, payload, session_hash, timeout=timeout, proxies=proxies)
+        else:
+            return self._create_non_stream(request_id, created_time, resolved_model_name, payload, session_hash, timeout=timeout, proxies=proxies)
+
+    def _create_stream(
+        self, request_id: str, created_time: int, model: str, payload: Dict[str, Any], session_hash: str,
+        timeout: Optional[int] = None, proxies: Optional[dict] = None
+    ) -> Generator[ChatCompletionChunk, None, None]:
+        """
+        Internal method to handle streaming chat completions from the FalconH1 API.
+
+        Args:
+            request_id (str): Unique request identifier.
+            created_time (int): Timestamp of request creation.
+            model (str): Model identifier.
+            payload (Dict[str, Any]): Request payload for the API.
+            session_hash (str): Unique session hash for the request.
+            timeout (Optional[int]): Request timeout in seconds.
+            proxies (Optional[dict]): Optional proxy settings.
+
+        Yields:
+            ChatCompletionChunk: Chunks of the chat completion as they are received from the API.
+        """
+        original_proxies = self._client.session.proxies.copy()
+        if proxies is not None:
+            self._client.session.proxies = proxies
+        else:
+            self._client.session.proxies = {}
+        try:
+            session = self._client.session
+            join_resp = session.post(
+                self._client.api_join_endpoint,
+                headers=self._client.headers,
+                json=payload,
+                timeout=timeout if timeout is not None else self._client.timeout
+            )
+            join_resp.raise_for_status()
+            data_url = f"{self._client.api_data_endpoint}?session_hash={session_hash}"
+            stream_resp = session.get(
+                data_url,
+                headers=self._client.stream_headers,
+                stream=True,
+                timeout=timeout if timeout is not None else self._client.timeout
+            )
+            stream_resp.raise_for_status()
+            for line in stream_resp.iter_lines():
+                if line:
+                    decoded_line = line.decode('utf-8')
+                    if decoded_line.startswith('data: '):
+                        try:
+                            json_data = json.loads(decoded_line[6:])
+                            msg_type = json_data.get('msg')
+                            if msg_type == 'process_generating':
+                                output_field = json_data.get('output', {})
+                                data_field = output_field.get('data')
+                                if data_field and isinstance(data_field, list) and len(data_field) > 0:
+                                    inner_data = data_field[0]
+                                    content_to_yield = None
+                                    if isinstance(inner_data, list) and len(inner_data) > 0:
+                                        if isinstance(inner_data[0], list) and len(inner_data[0]) == 3 and inner_data[0][0] == "append":
+                                            content_to_yield = inner_data[0][2]
+                                        elif isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and \
+                                                isinstance(inner_data[0][1], str):
+                                            current_full_response = inner_data[0][1]
+                                            if current_full_response.startswith(self._last_yielded_content_stream):
+                                                content_to_yield = current_full_response[len(self._last_yielded_content_stream):]
+                                            else:
+                                                content_to_yield = current_full_response
+                                            self._last_yielded_content_stream = current_full_response
+                                    if content_to_yield:
+                                        delta = ChoiceDelta(content=content_to_yield, role="assistant")
+                                        yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
+                            elif msg_type == 'process_completed' or msg_type == 'close_stream':
+                                break
+                        except json.JSONDecodeError:
+                            continue
+                        except Exception as e:
+                            continue
+        finally:
+            self._client.session.proxies = original_proxies
+
+    def _create_non_stream(
+        self, request_id: str, created_time: int, model: str, payload: Dict[str, Any], session_hash: str,
+        timeout: Optional[int] = None, proxies: Optional[dict] = None
+    ) -> ChatCompletion:
+        """
+        Internal method to handle non-streaming chat completions from the FalconH1 API.
+
+        Args:
+            request_id (str): Unique request identifier.
+            created_time (int): Timestamp of request creation.
+            model (str): Model identifier.
+            payload (Dict[str, Any]): Request payload for the API.
+            session_hash (str): Unique session hash for the request.
+            timeout (Optional[int]): Request timeout in seconds.
+            proxies (Optional[dict]): Optional proxy settings.
+
+        Returns:
+            ChatCompletion: The full chat completion result.
+        """
+        original_proxies = self._client.session.proxies.copy()
+        if proxies is not None:
+            self._client.session.proxies = proxies
+        else:
+            self._client.session.proxies = {}
+        full_response_content = ""
+        last_full_response_chunk_ns = ""
+        response_parts = []
+        try:
+            session = self._client.session
+            join_resp = session.post(
+                self._client.api_join_endpoint, headers=self._client.headers, json=payload,
+                timeout=timeout if timeout is not None else self._client.timeout
+            )
+            join_resp.raise_for_status()
+            data_url = f"{self._client.api_data_endpoint}?session_hash={session_hash}"
+            overall_start_time = time.time()
+            effective_timeout = timeout if timeout is not None else self._client.timeout
+            while True:
+                if time.time() - overall_start_time > effective_timeout:
+                    raise TimeoutError("Timeout waiting for non-stream response completion.")
+                stream_resp = session.get(
+                    data_url, headers=self._client.stream_headers, stream=True,
+                    timeout=effective_timeout
+                )
+                stream_resp.raise_for_status()
+                found_completion_message = False
+                for line in stream_resp.iter_lines():
+                    if time.time() - overall_start_time > effective_timeout:
+                        raise TimeoutError("Timeout during non-stream response processing.")
+                    if line:
+                        decoded_line = line.decode('utf-8')
+                        if decoded_line.startswith('data: '):
+                            try:
+                                json_data = json.loads(decoded_line[6:])
+                                msg_type = json_data.get('msg')
+                                if msg_type == 'process_generating':
+                                    output_field = json_data.get('output', {})
+                                    data_field = output_field.get('data')
+                                    if data_field and isinstance(data_field, list) and len(data_field) > 0:
+                                        inner_data = data_field[0]
+                                        current_chunk_text = None
+                                        if isinstance(inner_data, list) and len(inner_data) > 0:
+                                            if isinstance(inner_data[0], list) and len(inner_data[0]) == 3 and inner_data[0][0] == "append":
+                                                current_chunk_text = inner_data[0][2]
+                                            elif isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and isinstance(inner_data[0][1], str):
+                                                current_full_response = inner_data[0][1]
+                                                if current_full_response.startswith(last_full_response_chunk_ns):
+                                                    current_chunk_text = current_full_response[len(last_full_response_chunk_ns):]
+                                                else:
+                                                    current_chunk_text = current_full_response
+                                                last_full_response_chunk_ns = current_full_response
+                                        if current_chunk_text:
+                                            response_parts.append(current_chunk_text)
+                                elif msg_type == 'process_completed' or msg_type == 'close_stream':
+                                    if msg_type == 'process_completed':
+                                        output_field = json_data.get('output', {})
+                                        data_field = output_field.get('data')
+                                        if data_field and isinstance(data_field, list) and len(data_field) > 0:
+                                            inner_data = data_field[0]
+                                            if isinstance(inner_data, list) and len(inner_data) > 0 and \
+                                                    isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and \
+                                                    isinstance(inner_data[0][1], str):
+                                                final_full_response = inner_data[0][1]
+                                                if final_full_response != last_full_response_chunk_ns:
+                                                    if final_full_response.startswith(last_full_response_chunk_ns):
+                                                        response_parts.append(final_full_response[len(last_full_response_chunk_ns):])
+                                                    else:
+                                                        response_parts = [final_full_response]
+                                                    last_full_response_chunk_ns = final_full_response
+                                    found_completion_message = True
+                                    break
+                            except json.JSONDecodeError:
+                                continue
+                            except Exception as e:
+                                raise e
+                if found_completion_message:
+                    break
+            full_response_content = "".join(response_parts)
+            message = ChatCompletionMessage(role="assistant", content=full_response_content)
+            choice = Choice(index=0, message=message, finish_reason="stop")
+
+            # Simplified token counting without history iteration
+            chat_history = payload['data'][0]
+            prompt = chat_history[0][0] if chat_history and chat_history[0] and chat_history[0][0] else ""
+            prompt_tokens = count_tokens(prompt)
+            completion_tokens = count_tokens(full_response_content)
+            usage = CompletionUsage(
+                prompt_tokens=prompt_tokens,
+                completion_tokens=completion_tokens,
+                total_tokens=prompt_tokens + completion_tokens
+            )
+            return ChatCompletion(
+                id=request_id, choices=[choice], created=created_time,
+                model=model, usage=usage
+            )
+        finally:
+            self._client.session.proxies = original_proxies
+
+class Chat(BaseChat):
+    """
+    Provides a chat interface for the FalconH1 provider, exposing the completions API.
+
+    Attributes:
+        completions (Completions): The completions handler for chat requests.
+    """
+    def __init__(self, client):
+        """
+        Initializes the Chat interface for FalconH1.
+
+        Args:
+            client: The FalconH1 client instance.
+        """
+        self.completions = Completions(client)
+
+class FalconH1(OpenAICompatibleProvider):
+    """
+    FalconH1 provider implementation compatible with the OpenAI API interface.
+    Handles chat completions using FalconH1 models via the Hugging Face Spaces API.
+
+    Attributes:
+        base_url (str): Base URL for the FalconH1 API.
+        api_join_endpoint (str): Endpoint for joining the chat queue.
+        api_data_endpoint (str): Endpoint for retrieving chat data.
+        AVAILABLE_MODELS (List[str]): List of supported FalconH1 model identifiers.
+        timeout (int): Default request timeout in seconds.
+        session (requests.Session): HTTP session for API requests.
+        headers (dict): Default HTTP headers for requests.
+        stream_headers (dict): HTTP headers for streaming requests.
+        chat (Chat): Chat interface for completions.
+    """
+    base_url = "https://tiiuae-falcon-h1-playground.hf.space"
+    api_join_endpoint = f"{base_url}/gradio_api/queue/join?__theme=dark"
+    api_data_endpoint = f"{base_url}/gradio_api/queue/data"
+    AVAILABLE_MODELS = [
+        "Falcon-H1-34B-Instruct",
+        "Falcon-H1-7B-Instruct",
+        "Falcon-H1-3B-Instruct",
+        "Falcon-H1-1.5B-Deep-Instruct",
+        "Falcon-H1-1.5B-Instruct",
+        "Falcon-H1-0.5B-Instruct",
+    ]
+    def __init__(self, timeout: int = 120, proxies: Optional[dict] = None):
+        """
+        Initializes the FalconH1 provider with optional timeout and proxy settings.
+
+        Args:
+            timeout (int): Default request timeout in seconds (default: 120).
+            proxies (Optional[dict]): Optional proxy settings for HTTP requests.
+        """
+        self.timeout = timeout
+        self.session = requests.Session()
+        if proxies:
+            self.session.proxies = proxies
+        else:
+            self.session.proxies = {}
+        self.headers = {
+            'User-Agent': LitAgent().random(),
+            'Accept': '*/*',
+            'Accept-Language': 'en-US,en;q=0.9,en-IN;q=0.8',
+            'Accept-Encoding': 'gzip, deflate, br, zstd',
+            'Referer': f'{self.base_url}/?__theme=dark',
+            'Content-Type': 'application/json',
+            'Origin': self.base_url,
+            'Connection': 'keep-alive',
+            'Sec-Fetch-Dest': 'empty',
+            'Sec-Fetch-Mode': 'cors',
+            'Sec-Fetch-Site': 'same-origin',
+            'DNT': '1',
+            'Sec-GPC': '1',
+        }
+        self.stream_headers = {
+            'Accept': 'text/event-stream',
+            'Accept-Language': self.headers['Accept-Language'],
+            'Referer': self.headers['Referer'],
+            'User-Agent': self.headers['User-Agent'],
+            'Connection': 'keep-alive',
+            'Cache-Control': 'no-cache',
+        }
+        self.session.headers.update(self.headers)
+        self.chat = Chat(self)
+    def get_model(self, model_identifier: str) -> str:
+        """
+        Returns the resolved model name for the given identifier.
+
+        Args:
+            model_identifier (str): The model identifier string.
+
+        Returns:
+            str: The resolved model name (currently returns the identifier as-is).
+        """
+        return model_identifier
+    @property
+    def models(self):
+        """
+        Returns a list-like object containing available FalconH1 models.
+
+        Returns:
+            ModelList: An object with a .list() method returning model data objects.
+        """
+        class ModelData:
+            def __init__(self, id_str):
+                self.id = id_str
+        class ModelList:
+            def __init__(self, models_available):
+                self.data = [ModelData(m) for m in models_available]
+            def list(self):
+                return self.data
+        return ModelList(self.AVAILABLE_MODELS)
+
+if __name__ == "__main__":
+    """
+    Example usage of the FalconH1 provider for both non-streaming and streaming chat completions.
+    """
+    print("FalconH1 Provider Example")
+    client = FalconH1()
+    print("\n--- Non-Streaming Example ---")
+    try:
+        response = client.chat.completions.create(
+            model="Falcon-H1-34B-Instruct",
+            messages=[
+                {"role": "system", "content": "You are a helpful AI assistant named Falcon."},
+                {"role": "user", "content": "Hello, what is your name and what can you do?"}
+            ]
+        )
+        print(f"ID: {response.id}")
+        print(f"Model: {response.model}")
+        if response.choices:
+            print(f"Response: {response.choices[0].message.content}")
+        if response.usage:
+            print(f"Usage: {response.usage}")
+    except Exception as e:
+        print(f"Error in non-streaming example: {e}")
+    print("\n--- Streaming Example ---")
+    try:
+        stream_response = client.chat.completions.create(
+            model="Falcon-H1-34B-Instruct",
+            messages=[
+                {"role": "user", "content": "Tell me a short story about a brave falcon."}
+            ],
+            stream=True,
+            max_tokens=150
+        )
+        print("Streaming response:")
+        full_streamed_content = ""
+        for chunk in stream_response:
+            if chunk.choices and chunk.choices[0].delta and chunk.choices[0].delta.content:
+                content_piece = chunk.choices[0].delta.content
+                print(content_piece, end="", flush=True)
+                full_streamed_content += content_piece
+        print("\n--- End of Stream ---")
+    except Exception as e:
+        print(f"Error in streaming example: {e}")
+
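
The new FalconH1 provider ships its own __main__ demo (above). For the pieces that demo does not exercise, here is a hedged sketch of the per-request timeout/proxies overrides and the models listing; the proxy URL is a placeholder and the import path is assumed.

    # Hedged sketch: model listing and per-request overrides on the new FalconH1 provider.
    from webscout.Provider.OPENAI.FalconH1 import FalconH1  # assumed import path

    client = FalconH1(timeout=120)
    for m in client.models.list():                 # ModelData objects exposing .id
        print(m.id)

    reply = client.chat.completions.create(
        model="Falcon-H1-0.5B-Instruct",
        messages=[{"role": "user", "content": "One fun fact about falcons, please."}],
        timeout=45,                                # per-request override of the 120s default
        proxies={"https": "http://127.0.0.1:8080"},  # placeholder proxy, restored after the call
    )
    print(reply.choices[0].message.content)
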