webscout 2025.10.19.2__py3-none-any.whl → 2025.10.22.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of webscout might be problematic. Click here for more details.
- webscout/Provider/DeepAI.py +1 -1
- webscout/Provider/Flowith.py +1 -1
- webscout/Provider/GMI.py +4 -1
- webscout/Provider/OLLAMA.py +3 -2
- webscout/Provider/OPENAI/DeepAI.py +145 -57
- webscout/Provider/OPENAI/flowith.py +3 -2
- webscout/Provider/OPENAI/gmi.py +4 -1
- webscout/version.py +1 -1
- webscout/version.py.bak +1 -1
- {webscout-2025.10.19.2.dist-info → webscout-2025.10.22.1.dist-info}/METADATA +1 -1
- {webscout-2025.10.19.2.dist-info → webscout-2025.10.22.1.dist-info}/RECORD +15 -17
- webscout/Provider/OPENAI/FalconH1.py +0 -452
- webscout/Provider/deepseek_assistant.py +0 -378
- {webscout-2025.10.19.2.dist-info → webscout-2025.10.22.1.dist-info}/WHEEL +0 -0
- {webscout-2025.10.19.2.dist-info → webscout-2025.10.22.1.dist-info}/entry_points.txt +0 -0
- {webscout-2025.10.19.2.dist-info → webscout-2025.10.22.1.dist-info}/licenses/LICENSE.md +0 -0
- {webscout-2025.10.19.2.dist-info → webscout-2025.10.22.1.dist-info}/top_level.txt +0 -0
|
@@ -1,452 +0,0 @@
|
|
|
1
|
-
import requests
|
|
2
|
-
import json
|
|
3
|
-
import time
|
|
4
|
-
import uuid
|
|
5
|
-
from typing import List, Dict, Optional, Union, Generator, Any
|
|
6
|
-
|
|
7
|
-
from webscout.Provider.OPENAI.base import OpenAICompatibleProvider, BaseChat, BaseCompletions
|
|
8
|
-
from webscout.Provider.OPENAI.utils import (
|
|
9
|
-
ChatCompletionChunk, ChatCompletion, Choice, ChoiceDelta,
|
|
10
|
-
ChatCompletionMessage, CompletionUsage,
|
|
11
|
-
get_system_prompt,
|
|
12
|
-
count_tokens,
|
|
13
|
-
format_prompt
|
|
14
|
-
)
|
|
15
|
-
from webscout.litagent import LitAgent
|
|
16
|
-
|
|
17
|
-
def convert_openai_to_falcon_history(messages: List[Dict[str, str]]) -> list:
|
|
18
|
-
"""
|
|
19
|
-
Converts a list of OpenAI-style chat messages to Falcon/Gradio chat history format.
|
|
20
|
-
|
|
21
|
-
Args:
|
|
22
|
-
messages (List[Dict[str, str]]):
|
|
23
|
-
A list of message dictionaries, each with 'role' and 'content' keys, following the OpenAI API format.
|
|
24
|
-
|
|
25
|
-
Returns:
|
|
26
|
-
list: A single-turn Falcon/Gradio chat history in the format [[prompt, None]].
|
|
27
|
-
"""
|
|
28
|
-
prompt = format_prompt(messages, add_special_tokens=False, do_continue=True, include_system=True)
|
|
29
|
-
return [[prompt, None]]
|
|
30
|
-
|
|
31
|
-
class Completions(BaseCompletions):
|
|
32
|
-
"""
|
|
33
|
-
Handles text completion requests for the FalconH1 provider, supporting both streaming and non-streaming modes.
|
|
34
|
-
|
|
35
|
-
Attributes:
|
|
36
|
-
_client (Any): Reference to the FalconH1 client instance.
|
|
37
|
-
_last_yielded_content_stream (str): Tracks the last yielded content in streaming mode.
|
|
38
|
-
"""
|
|
39
|
-
def __init__(self, client):
|
|
40
|
-
"""
|
|
41
|
-
Initializes the Completions handler.
|
|
42
|
-
|
|
43
|
-
Args:
|
|
44
|
-
client: The FalconH1 client instance.
|
|
45
|
-
"""
|
|
46
|
-
self._client = client
|
|
47
|
-
self._last_yielded_content_stream = ""
|
|
48
|
-
|
|
49
|
-
def create(
|
|
50
|
-
self,
|
|
51
|
-
*,
|
|
52
|
-
model: str,
|
|
53
|
-
messages: List[Dict[str, str]],
|
|
54
|
-
max_tokens: Optional[int] = 1024,
|
|
55
|
-
stream: bool = False,
|
|
56
|
-
temperature: Optional[float] = 0.1,
|
|
57
|
-
top_p: Optional[float] = 1.0,
|
|
58
|
-
timeout: Optional[int] = None,
|
|
59
|
-
proxies: Optional[dict] = None,
|
|
60
|
-
**kwargs: Any
|
|
61
|
-
) -> Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]:
|
|
62
|
-
"""
|
|
63
|
-
Creates a chat completion using the FalconH1 API, supporting both streaming and non-streaming responses.
|
|
64
|
-
|
|
65
|
-
Args:
|
|
66
|
-
model (str): The model identifier to use for completion.
|
|
67
|
-
messages (List[Dict[str, str]]): List of chat messages in OpenAI format.
|
|
68
|
-
max_tokens (Optional[int]): Maximum number of tokens to generate in the completion.
|
|
69
|
-
stream (bool): Whether to stream the response as chunks.
|
|
70
|
-
temperature (Optional[float]): Sampling temperature.
|
|
71
|
-
top_p (Optional[float]): Nucleus sampling probability.
|
|
72
|
-
timeout (Optional[int]): Request timeout in seconds.
|
|
73
|
-
proxies (Optional[dict]): Optional proxy settings for the request.
|
|
74
|
-
**kwargs: Additional keyword arguments for advanced options (e.g., top_k, repetition_penalty).
|
|
75
|
-
|
|
76
|
-
Returns:
|
|
77
|
-
Union[ChatCompletion, Generator[ChatCompletionChunk, None, None]]: The chat completion result or a generator yielding streamed chunks.
|
|
78
|
-
"""
|
|
79
|
-
session_hash = str(uuid.uuid4()).replace('-', '')
|
|
80
|
-
chat_history = convert_openai_to_falcon_history(messages)
|
|
81
|
-
if not chat_history or chat_history[-1][0] is None:
|
|
82
|
-
raise ValueError("Messages must contain at least one user message for Falcon API.")
|
|
83
|
-
resolved_model_name = self._client.get_model(model)
|
|
84
|
-
payload_data = [
|
|
85
|
-
chat_history,
|
|
86
|
-
resolved_model_name,
|
|
87
|
-
temperature,
|
|
88
|
-
max_tokens,
|
|
89
|
-
top_p,
|
|
90
|
-
kwargs.get("top_k", 20),
|
|
91
|
-
kwargs.get("repetition_penalty", 1.2)
|
|
92
|
-
]
|
|
93
|
-
payload = {
|
|
94
|
-
"data": payload_data,
|
|
95
|
-
"event_data": None,
|
|
96
|
-
"fn_index": 5,
|
|
97
|
-
"trigger_id": 12,
|
|
98
|
-
"session_hash": session_hash
|
|
99
|
-
}
|
|
100
|
-
request_id = f"chatcmpl-{uuid.uuid4()}"
|
|
101
|
-
created_time = int(time.time())
|
|
102
|
-
if stream:
|
|
103
|
-
self._last_yielded_content_stream = ""
|
|
104
|
-
return self._create_stream(request_id, created_time, resolved_model_name, payload, session_hash, timeout=timeout, proxies=proxies)
|
|
105
|
-
else:
|
|
106
|
-
return self._create_non_stream(request_id, created_time, resolved_model_name, payload, session_hash, timeout=timeout, proxies=proxies)
|
|
107
|
-
|
|
108
|
-
def _create_stream(
|
|
109
|
-
self, request_id: str, created_time: int, model: str, payload: Dict[str, Any], session_hash: str,
|
|
110
|
-
timeout: Optional[int] = None, proxies: Optional[dict] = None
|
|
111
|
-
) -> Generator[ChatCompletionChunk, None, None]:
|
|
112
|
-
"""
|
|
113
|
-
Internal method to handle streaming chat completions from the FalconH1 API.
|
|
114
|
-
|
|
115
|
-
Args:
|
|
116
|
-
request_id (str): Unique request identifier.
|
|
117
|
-
created_time (int): Timestamp of request creation.
|
|
118
|
-
model (str): Model identifier.
|
|
119
|
-
payload (Dict[str, Any]): Request payload for the API.
|
|
120
|
-
session_hash (str): Unique session hash for the request.
|
|
121
|
-
timeout (Optional[int]): Request timeout in seconds.
|
|
122
|
-
proxies (Optional[dict]): Optional proxy settings.
|
|
123
|
-
|
|
124
|
-
Yields:
|
|
125
|
-
ChatCompletionChunk: Chunks of the chat completion as they are received from the API.
|
|
126
|
-
"""
|
|
127
|
-
original_proxies = self._client.session.proxies.copy()
|
|
128
|
-
if proxies is not None:
|
|
129
|
-
self._client.session.proxies = proxies
|
|
130
|
-
else:
|
|
131
|
-
self._client.session.proxies = {}
|
|
132
|
-
try:
|
|
133
|
-
session = self._client.session
|
|
134
|
-
join_resp = session.post(
|
|
135
|
-
self._client.api_join_endpoint,
|
|
136
|
-
headers=self._client.headers,
|
|
137
|
-
json=payload,
|
|
138
|
-
timeout=timeout if timeout is not None else self._client.timeout
|
|
139
|
-
)
|
|
140
|
-
join_resp.raise_for_status()
|
|
141
|
-
data_url = f"{self._client.api_data_endpoint}?session_hash={session_hash}"
|
|
142
|
-
stream_resp = session.get(
|
|
143
|
-
data_url,
|
|
144
|
-
headers=self._client.stream_headers,
|
|
145
|
-
stream=True,
|
|
146
|
-
timeout=timeout if timeout is not None else self._client.timeout
|
|
147
|
-
)
|
|
148
|
-
stream_resp.raise_for_status()
|
|
149
|
-
for line in stream_resp.iter_lines():
|
|
150
|
-
if line:
|
|
151
|
-
decoded_line = line.decode('utf-8')
|
|
152
|
-
if decoded_line.startswith('data: '):
|
|
153
|
-
try:
|
|
154
|
-
json_data = json.loads(decoded_line[6:])
|
|
155
|
-
msg_type = json_data.get('msg')
|
|
156
|
-
if msg_type == 'process_generating':
|
|
157
|
-
output_field = json_data.get('output', {})
|
|
158
|
-
data_field = output_field.get('data')
|
|
159
|
-
if data_field and isinstance(data_field, list) and len(data_field) > 0:
|
|
160
|
-
inner_data = data_field[0]
|
|
161
|
-
content_to_yield = None
|
|
162
|
-
if isinstance(inner_data, list) and len(inner_data) > 0:
|
|
163
|
-
if isinstance(inner_data[0], list) and len(inner_data[0]) == 3 and inner_data[0][0] == "append":
|
|
164
|
-
content_to_yield = inner_data[0][2]
|
|
165
|
-
elif isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and \
|
|
166
|
-
isinstance(inner_data[0][1], str):
|
|
167
|
-
current_full_response = inner_data[0][1]
|
|
168
|
-
if current_full_response.startswith(self._last_yielded_content_stream):
|
|
169
|
-
content_to_yield = current_full_response[len(self._last_yielded_content_stream):]
|
|
170
|
-
else:
|
|
171
|
-
content_to_yield = current_full_response
|
|
172
|
-
self._last_yielded_content_stream = current_full_response
|
|
173
|
-
if content_to_yield:
|
|
174
|
-
delta = ChoiceDelta(content=content_to_yield, role="assistant")
|
|
175
|
-
yield ChatCompletionChunk(id=request_id, choices=[Choice(index=0, delta=delta)], created=created_time, model=model)
|
|
176
|
-
elif msg_type == 'process_completed' or msg_type == 'close_stream':
|
|
177
|
-
break
|
|
178
|
-
except json.JSONDecodeError:
|
|
179
|
-
continue
|
|
180
|
-
except Exception as e:
|
|
181
|
-
continue
|
|
182
|
-
finally:
|
|
183
|
-
self._client.session.proxies = original_proxies
|
|
184
|
-
|
|
185
|
-
def _create_non_stream(
|
|
186
|
-
self, request_id: str, created_time: int, model: str, payload: Dict[str, Any], session_hash: str,
|
|
187
|
-
timeout: Optional[int] = None, proxies: Optional[dict] = None
|
|
188
|
-
) -> ChatCompletion:
|
|
189
|
-
"""
|
|
190
|
-
Internal method to handle non-streaming chat completions from the FalconH1 API.
|
|
191
|
-
|
|
192
|
-
Args:
|
|
193
|
-
request_id (str): Unique request identifier.
|
|
194
|
-
created_time (int): Timestamp of request creation.
|
|
195
|
-
model (str): Model identifier.
|
|
196
|
-
payload (Dict[str, Any]): Request payload for the API.
|
|
197
|
-
session_hash (str): Unique session hash for the request.
|
|
198
|
-
timeout (Optional[int]): Request timeout in seconds.
|
|
199
|
-
proxies (Optional[dict]): Optional proxy settings.
|
|
200
|
-
|
|
201
|
-
Returns:
|
|
202
|
-
ChatCompletion: The full chat completion result.
|
|
203
|
-
"""
|
|
204
|
-
original_proxies = self._client.session.proxies.copy()
|
|
205
|
-
if proxies is not None:
|
|
206
|
-
self._client.session.proxies = proxies
|
|
207
|
-
else:
|
|
208
|
-
self._client.session.proxies = {}
|
|
209
|
-
full_response_content = ""
|
|
210
|
-
last_full_response_chunk_ns = ""
|
|
211
|
-
response_parts = []
|
|
212
|
-
try:
|
|
213
|
-
session = self._client.session
|
|
214
|
-
join_resp = session.post(
|
|
215
|
-
self._client.api_join_endpoint, headers=self._client.headers, json=payload,
|
|
216
|
-
timeout=timeout if timeout is not None else self._client.timeout
|
|
217
|
-
)
|
|
218
|
-
join_resp.raise_for_status()
|
|
219
|
-
data_url = f"{self._client.api_data_endpoint}?session_hash={session_hash}"
|
|
220
|
-
overall_start_time = time.time()
|
|
221
|
-
effective_timeout = timeout if timeout is not None else self._client.timeout
|
|
222
|
-
while True:
|
|
223
|
-
if time.time() - overall_start_time > effective_timeout:
|
|
224
|
-
raise TimeoutError("Timeout waiting for non-stream response completion.")
|
|
225
|
-
stream_resp = session.get(
|
|
226
|
-
data_url, headers=self._client.stream_headers, stream=True,
|
|
227
|
-
timeout=effective_timeout
|
|
228
|
-
)
|
|
229
|
-
stream_resp.raise_for_status()
|
|
230
|
-
found_completion_message = False
|
|
231
|
-
for line in stream_resp.iter_lines():
|
|
232
|
-
if time.time() - overall_start_time > effective_timeout:
|
|
233
|
-
raise TimeoutError("Timeout during non-stream response processing.")
|
|
234
|
-
if line:
|
|
235
|
-
decoded_line = line.decode('utf-8')
|
|
236
|
-
if decoded_line.startswith('data: '):
|
|
237
|
-
try:
|
|
238
|
-
json_data = json.loads(decoded_line[6:])
|
|
239
|
-
msg_type = json_data.get('msg')
|
|
240
|
-
if msg_type == 'process_generating':
|
|
241
|
-
output_field = json_data.get('output', {})
|
|
242
|
-
data_field = output_field.get('data')
|
|
243
|
-
if data_field and isinstance(data_field, list) and len(data_field) > 0:
|
|
244
|
-
inner_data = data_field[0]
|
|
245
|
-
current_chunk_text = None
|
|
246
|
-
if isinstance(inner_data, list) and len(inner_data) > 0:
|
|
247
|
-
if isinstance(inner_data[0], list) and len(inner_data[0]) == 3 and inner_data[0][0] == "append":
|
|
248
|
-
current_chunk_text = inner_data[0][2]
|
|
249
|
-
elif isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and isinstance(inner_data[0][1], str):
|
|
250
|
-
current_full_response = inner_data[0][1]
|
|
251
|
-
if current_full_response.startswith(last_full_response_chunk_ns):
|
|
252
|
-
current_chunk_text = current_full_response[len(last_full_response_chunk_ns):]
|
|
253
|
-
else:
|
|
254
|
-
current_chunk_text = current_full_response
|
|
255
|
-
last_full_response_chunk_ns = current_full_response
|
|
256
|
-
if current_chunk_text:
|
|
257
|
-
response_parts.append(current_chunk_text)
|
|
258
|
-
elif msg_type == 'process_completed' or msg_type == 'close_stream':
|
|
259
|
-
if msg_type == 'process_completed':
|
|
260
|
-
output_field = json_data.get('output', {})
|
|
261
|
-
data_field = output_field.get('data')
|
|
262
|
-
if data_field and isinstance(data_field, list) and len(data_field) > 0:
|
|
263
|
-
inner_data = data_field[0]
|
|
264
|
-
if isinstance(inner_data, list) and len(inner_data) > 0 and \
|
|
265
|
-
isinstance(inner_data[0], list) and len(inner_data[0]) == 2 and \
|
|
266
|
-
isinstance(inner_data[0][1], str):
|
|
267
|
-
final_full_response = inner_data[0][1]
|
|
268
|
-
if final_full_response != last_full_response_chunk_ns:
|
|
269
|
-
if final_full_response.startswith(last_full_response_chunk_ns):
|
|
270
|
-
response_parts.append(final_full_response[len(last_full_response_chunk_ns):])
|
|
271
|
-
else:
|
|
272
|
-
response_parts = [final_full_response]
|
|
273
|
-
last_full_response_chunk_ns = final_full_response
|
|
274
|
-
found_completion_message = True
|
|
275
|
-
break
|
|
276
|
-
except json.JSONDecodeError:
|
|
277
|
-
continue
|
|
278
|
-
except Exception as e:
|
|
279
|
-
raise e
|
|
280
|
-
if found_completion_message:
|
|
281
|
-
break
|
|
282
|
-
full_response_content = "".join(response_parts)
|
|
283
|
-
message = ChatCompletionMessage(role="assistant", content=full_response_content)
|
|
284
|
-
choice = Choice(index=0, message=message, finish_reason="stop")
|
|
285
|
-
|
|
286
|
-
# Simplified token counting without history iteration
|
|
287
|
-
chat_history = payload['data'][0]
|
|
288
|
-
prompt = chat_history[0][0] if chat_history and chat_history[0] and chat_history[0][0] else ""
|
|
289
|
-
prompt_tokens = count_tokens(prompt)
|
|
290
|
-
completion_tokens = count_tokens(full_response_content)
|
|
291
|
-
usage = CompletionUsage(
|
|
292
|
-
prompt_tokens=prompt_tokens,
|
|
293
|
-
completion_tokens=completion_tokens,
|
|
294
|
-
total_tokens=prompt_tokens + completion_tokens
|
|
295
|
-
)
|
|
296
|
-
return ChatCompletion(
|
|
297
|
-
id=request_id, choices=[choice], created=created_time,
|
|
298
|
-
model=model, usage=usage
|
|
299
|
-
)
|
|
300
|
-
finally:
|
|
301
|
-
self._client.session.proxies = original_proxies
|
|
302
|
-
|
|
303
|
-
class Chat(BaseChat):
|
|
304
|
-
"""
|
|
305
|
-
Provides a chat interface for the FalconH1 provider, exposing the completions API.
|
|
306
|
-
|
|
307
|
-
Attributes:
|
|
308
|
-
completions (Completions): The completions handler for chat requests.
|
|
309
|
-
"""
|
|
310
|
-
def __init__(self, client):
|
|
311
|
-
"""
|
|
312
|
-
Initializes the Chat interface for FalconH1.
|
|
313
|
-
|
|
314
|
-
Args:
|
|
315
|
-
client: The FalconH1 client instance.
|
|
316
|
-
"""
|
|
317
|
-
self.completions = Completions(client)
|
|
318
|
-
|
|
319
|
-
class FalconH1(OpenAICompatibleProvider):
|
|
320
|
-
"""
|
|
321
|
-
FalconH1 provider implementation compatible with the OpenAI API interface.
|
|
322
|
-
Handles chat completions using FalconH1 models via the Hugging Face Spaces API.
|
|
323
|
-
|
|
324
|
-
Attributes:
|
|
325
|
-
base_url (str): Base URL for the FalconH1 API.
|
|
326
|
-
api_join_endpoint (str): Endpoint for joining the chat queue.
|
|
327
|
-
api_data_endpoint (str): Endpoint for retrieving chat data.
|
|
328
|
-
AVAILABLE_MODELS (List[str]): List of supported FalconH1 model identifiers.
|
|
329
|
-
timeout (int): Default request timeout in seconds.
|
|
330
|
-
session (requests.Session): HTTP session for API requests.
|
|
331
|
-
headers (dict): Default HTTP headers for requests.
|
|
332
|
-
stream_headers (dict): HTTP headers for streaming requests.
|
|
333
|
-
chat (Chat): Chat interface for completions.
|
|
334
|
-
"""
|
|
335
|
-
base_url = "https://tiiuae-falcon-h1-playground.hf.space"
|
|
336
|
-
api_join_endpoint = f"{base_url}/gradio_api/queue/join?__theme=dark"
|
|
337
|
-
api_data_endpoint = f"{base_url}/gradio_api/queue/data"
|
|
338
|
-
AVAILABLE_MODELS = [
|
|
339
|
-
"Falcon-H1-34B-Instruct",
|
|
340
|
-
"Falcon-H1-7B-Instruct",
|
|
341
|
-
"Falcon-H1-3B-Instruct",
|
|
342
|
-
"Falcon-H1-1.5B-Deep-Instruct",
|
|
343
|
-
"Falcon-H1-1.5B-Instruct",
|
|
344
|
-
"Falcon-H1-0.5B-Instruct",
|
|
345
|
-
]
|
|
346
|
-
def __init__(self, timeout: int = 120, proxies: Optional[dict] = None):
|
|
347
|
-
"""
|
|
348
|
-
Initializes the FalconH1 provider with optional timeout and proxy settings.
|
|
349
|
-
|
|
350
|
-
Args:
|
|
351
|
-
timeout (int): Default request timeout in seconds (default: 120).
|
|
352
|
-
proxies (Optional[dict]): Optional proxy settings for HTTP requests.
|
|
353
|
-
"""
|
|
354
|
-
super().__init__(proxies=proxies)
|
|
355
|
-
self.timeout = timeout
|
|
356
|
-
self.headers = {
|
|
357
|
-
'User-Agent': LitAgent().random(),
|
|
358
|
-
'Accept': '*/*',
|
|
359
|
-
'Accept-Language': 'en-US,en;q=0.9,en-IN;q=0.8',
|
|
360
|
-
'Accept-Encoding': 'gzip, deflate, br, zstd',
|
|
361
|
-
'Referer': f'{self.base_url}/?__theme=dark',
|
|
362
|
-
'Content-Type': 'application/json',
|
|
363
|
-
'Origin': self.base_url,
|
|
364
|
-
'Connection': 'keep-alive',
|
|
365
|
-
'Sec-Fetch-Dest': 'empty',
|
|
366
|
-
'Sec-Fetch-Mode': 'cors',
|
|
367
|
-
'Sec-Fetch-Site': 'same-origin',
|
|
368
|
-
'DNT': '1',
|
|
369
|
-
'Sec-GPC': '1',
|
|
370
|
-
}
|
|
371
|
-
self.stream_headers = {
|
|
372
|
-
'Accept': 'text/event-stream',
|
|
373
|
-
'Accept-Language': self.headers['Accept-Language'],
|
|
374
|
-
'Referer': self.headers['Referer'],
|
|
375
|
-
'User-Agent': self.headers['User-Agent'],
|
|
376
|
-
'Connection': 'keep-alive',
|
|
377
|
-
'Cache-Control': 'no-cache',
|
|
378
|
-
}
|
|
379
|
-
self.session.headers.update(self.headers)
|
|
380
|
-
self.chat = Chat(self)
|
|
381
|
-
def get_model(self, model_identifier: str) -> str:
|
|
382
|
-
"""
|
|
383
|
-
Returns the resolved model name for the given identifier.
|
|
384
|
-
|
|
385
|
-
Args:
|
|
386
|
-
model_identifier (str): The model identifier string.
|
|
387
|
-
|
|
388
|
-
Returns:
|
|
389
|
-
str: The resolved model name (currently returns the identifier as-is).
|
|
390
|
-
"""
|
|
391
|
-
return model_identifier
|
|
392
|
-
@property
|
|
393
|
-
def models(self):
|
|
394
|
-
"""
|
|
395
|
-
Returns a list-like object containing available FalconH1 models.
|
|
396
|
-
|
|
397
|
-
Returns:
|
|
398
|
-
ModelList: An object with a .list() method returning model data objects.
|
|
399
|
-
"""
|
|
400
|
-
class ModelData:
|
|
401
|
-
def __init__(self, id_str):
|
|
402
|
-
self.id = id_str
|
|
403
|
-
class ModelList:
|
|
404
|
-
def __init__(self, models_available):
|
|
405
|
-
self.data = [ModelData(m) for m in models_available]
|
|
406
|
-
def list(self):
|
|
407
|
-
return self.data
|
|
408
|
-
return ModelList(self.AVAILABLE_MODELS)
|
|
409
|
-
|
|
410
|
-
if __name__ == "__main__":
|
|
411
|
-
"""
|
|
412
|
-
Example usage of the FalconH1 provider for both non-streaming and streaming chat completions.
|
|
413
|
-
"""
|
|
414
|
-
print("FalconH1 Provider Example")
|
|
415
|
-
client = FalconH1()
|
|
416
|
-
print("\n--- Non-Streaming Example ---")
|
|
417
|
-
try:
|
|
418
|
-
response = client.chat.completions.create(
|
|
419
|
-
model="Falcon-H1-34B-Instruct",
|
|
420
|
-
messages=[
|
|
421
|
-
{"role": "system", "content": "You are a helpful AI assistant named Falcon."},
|
|
422
|
-
{"role": "user", "content": "Hello, what is your name and what can you do?"}
|
|
423
|
-
]
|
|
424
|
-
)
|
|
425
|
-
print(f"ID: {response.id}")
|
|
426
|
-
print(f"Model: {response.model}")
|
|
427
|
-
if response.choices:
|
|
428
|
-
print(f"Response: {response.choices[0].message.content}")
|
|
429
|
-
if response.usage:
|
|
430
|
-
print(f"Usage: {response.usage}")
|
|
431
|
-
except Exception as e:
|
|
432
|
-
print(f"Error in non-streaming example: {e}")
|
|
433
|
-
print("\n--- Streaming Example ---")
|
|
434
|
-
try:
|
|
435
|
-
stream_response = client.chat.completions.create(
|
|
436
|
-
model="Falcon-H1-34B-Instruct",
|
|
437
|
-
messages=[
|
|
438
|
-
{"role": "user", "content": "Tell me a short story about a brave falcon."}
|
|
439
|
-
],
|
|
440
|
-
stream=True,
|
|
441
|
-
max_tokens=150
|
|
442
|
-
)
|
|
443
|
-
print("Streaming response:")
|
|
444
|
-
full_streamed_content = ""
|
|
445
|
-
for chunk in stream_response:
|
|
446
|
-
if chunk.choices and chunk.choices[0].delta and chunk.choices[0].delta.content:
|
|
447
|
-
content_piece = chunk.choices[0].delta.content
|
|
448
|
-
print(content_piece, end="", flush=True)
|
|
449
|
-
full_streamed_content += content_piece
|
|
450
|
-
print("\n--- End of Stream ---")
|
|
451
|
-
except Exception as e:
|
|
452
|
-
print(f"Error in streaming example: {e}")
|