webscout 8.2.6__py3-none-any.whl → 8.2.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of webscout might be problematic. Click here for more details.

Files changed (292):
  1. webscout/AIutel.py +97 -87
  2. webscout/version.py +1 -1
  3. {webscout-8.2.6.dist-info → webscout-8.2.7.dist-info}/METADATA +2 -15
  4. webscout-8.2.7.dist-info/RECORD +26 -0
  5. {webscout-8.2.6.dist-info → webscout-8.2.7.dist-info}/WHEEL +1 -1
  6. webscout-8.2.7.dist-info/entry_points.txt +3 -0
  7. webscout-8.2.7.dist-info/top_level.txt +1 -0
  8. webscout/Extra/GitToolkit/__init__.py +0 -10
  9. webscout/Extra/GitToolkit/gitapi/__init__.py +0 -12
  10. webscout/Extra/GitToolkit/gitapi/repository.py +0 -195
  11. webscout/Extra/GitToolkit/gitapi/user.py +0 -96
  12. webscout/Extra/GitToolkit/gitapi/utils.py +0 -62
  13. webscout/Extra/YTToolkit/YTdownloader.py +0 -957
  14. webscout/Extra/YTToolkit/__init__.py +0 -3
  15. webscout/Extra/YTToolkit/transcriber.py +0 -476
  16. webscout/Extra/YTToolkit/ytapi/__init__.py +0 -6
  17. webscout/Extra/YTToolkit/ytapi/channel.py +0 -307
  18. webscout/Extra/YTToolkit/ytapi/errors.py +0 -13
  19. webscout/Extra/YTToolkit/ytapi/extras.py +0 -45
  20. webscout/Extra/YTToolkit/ytapi/https.py +0 -88
  21. webscout/Extra/YTToolkit/ytapi/patterns.py +0 -61
  22. webscout/Extra/YTToolkit/ytapi/playlist.py +0 -59
  23. webscout/Extra/YTToolkit/ytapi/pool.py +0 -8
  24. webscout/Extra/YTToolkit/ytapi/query.py +0 -40
  25. webscout/Extra/YTToolkit/ytapi/stream.py +0 -63
  26. webscout/Extra/YTToolkit/ytapi/utils.py +0 -62
  27. webscout/Extra/YTToolkit/ytapi/video.py +0 -232
  28. webscout/Extra/__init__.py +0 -7
  29. webscout/Extra/autocoder/__init__.py +0 -9
  30. webscout/Extra/autocoder/autocoder.py +0 -910
  31. webscout/Extra/autocoder/autocoder_utiles.py +0 -332
  32. webscout/Extra/gguf.py +0 -684
  33. webscout/Extra/tempmail/__init__.py +0 -28
  34. webscout/Extra/tempmail/async_utils.py +0 -141
  35. webscout/Extra/tempmail/base.py +0 -161
  36. webscout/Extra/tempmail/cli.py +0 -187
  37. webscout/Extra/tempmail/emailnator.py +0 -84
  38. webscout/Extra/tempmail/mail_tm.py +0 -361
  39. webscout/Extra/tempmail/temp_mail_io.py +0 -292
  40. webscout/Extra/weather.py +0 -194
  41. webscout/Extra/weather_ascii.py +0 -76
  42. webscout/Litlogger/__init__.py +0 -67
  43. webscout/Litlogger/core/__init__.py +0 -6
  44. webscout/Litlogger/core/level.py +0 -23
  45. webscout/Litlogger/core/logger.py +0 -165
  46. webscout/Litlogger/handlers/__init__.py +0 -12
  47. webscout/Litlogger/handlers/console.py +0 -33
  48. webscout/Litlogger/handlers/file.py +0 -143
  49. webscout/Litlogger/handlers/network.py +0 -173
  50. webscout/Litlogger/styles/__init__.py +0 -7
  51. webscout/Litlogger/styles/colors.py +0 -249
  52. webscout/Litlogger/styles/formats.py +0 -458
  53. webscout/Litlogger/styles/text.py +0 -87
  54. webscout/Litlogger/utils/__init__.py +0 -6
  55. webscout/Litlogger/utils/detectors.py +0 -153
  56. webscout/Litlogger/utils/formatters.py +0 -200
  57. webscout/Provider/AI21.py +0 -177
  58. webscout/Provider/AISEARCH/DeepFind.py +0 -250
  59. webscout/Provider/AISEARCH/ISou.py +0 -256
  60. webscout/Provider/AISEARCH/Perplexity.py +0 -359
  61. webscout/Provider/AISEARCH/__init__.py +0 -10
  62. webscout/Provider/AISEARCH/felo_search.py +0 -228
  63. webscout/Provider/AISEARCH/genspark_search.py +0 -208
  64. webscout/Provider/AISEARCH/hika_search.py +0 -198
  65. webscout/Provider/AISEARCH/iask_search.py +0 -436
  66. webscout/Provider/AISEARCH/monica_search.py +0 -246
  67. webscout/Provider/AISEARCH/scira_search.py +0 -322
  68. webscout/Provider/AISEARCH/webpilotai_search.py +0 -281
  69. webscout/Provider/Aitopia.py +0 -316
  70. webscout/Provider/AllenAI.py +0 -447
  71. webscout/Provider/Andi.py +0 -228
  72. webscout/Provider/Blackboxai.py +0 -229
  73. webscout/Provider/ChatGPTClone.py +0 -237
  74. webscout/Provider/ChatGPTGratis.py +0 -194
  75. webscout/Provider/ChatSandbox.py +0 -342
  76. webscout/Provider/Cloudflare.py +0 -325
  77. webscout/Provider/Cohere.py +0 -208
  78. webscout/Provider/Deepinfra.py +0 -338
  79. webscout/Provider/ElectronHub.py +0 -773
  80. webscout/Provider/ExaAI.py +0 -261
  81. webscout/Provider/ExaChat.py +0 -358
  82. webscout/Provider/Free2GPT.py +0 -241
  83. webscout/Provider/GPTWeb.py +0 -249
  84. webscout/Provider/Gemini.py +0 -169
  85. webscout/Provider/GithubChat.py +0 -370
  86. webscout/Provider/GizAI.py +0 -285
  87. webscout/Provider/Glider.py +0 -222
  88. webscout/Provider/Groq.py +0 -801
  89. webscout/Provider/HF_space/__init__.py +0 -0
  90. webscout/Provider/HF_space/qwen_qwen2.py +0 -206
  91. webscout/Provider/HeckAI.py +0 -257
  92. webscout/Provider/HuggingFaceChat.py +0 -469
  93. webscout/Provider/Hunyuan.py +0 -283
  94. webscout/Provider/Jadve.py +0 -291
  95. webscout/Provider/Koboldai.py +0 -381
  96. webscout/Provider/LambdaChat.py +0 -411
  97. webscout/Provider/Llama3.py +0 -259
  98. webscout/Provider/MCPCore.py +0 -315
  99. webscout/Provider/Marcus.py +0 -206
  100. webscout/Provider/Nemotron.py +0 -218
  101. webscout/Provider/Netwrck.py +0 -270
  102. webscout/Provider/OLLAMA.py +0 -396
  103. webscout/Provider/OPENAI/__init__.py +0 -28
  104. webscout/Provider/OPENAI/ai4chat.py +0 -286
  105. webscout/Provider/OPENAI/base.py +0 -46
  106. webscout/Provider/OPENAI/c4ai.py +0 -367
  107. webscout/Provider/OPENAI/chatgpt.py +0 -549
  108. webscout/Provider/OPENAI/chatgptclone.py +0 -481
  109. webscout/Provider/OPENAI/deepinfra.py +0 -309
  110. webscout/Provider/OPENAI/e2b.py +0 -1350
  111. webscout/Provider/OPENAI/exaai.py +0 -404
  112. webscout/Provider/OPENAI/exachat.py +0 -437
  113. webscout/Provider/OPENAI/freeaichat.py +0 -352
  114. webscout/Provider/OPENAI/glider.py +0 -316
  115. webscout/Provider/OPENAI/groq.py +0 -354
  116. webscout/Provider/OPENAI/heckai.py +0 -341
  117. webscout/Provider/OPENAI/llmchatco.py +0 -327
  118. webscout/Provider/OPENAI/mcpcore.py +0 -376
  119. webscout/Provider/OPENAI/multichat.py +0 -368
  120. webscout/Provider/OPENAI/netwrck.py +0 -350
  121. webscout/Provider/OPENAI/opkfc.py +0 -488
  122. webscout/Provider/OPENAI/scirachat.py +0 -462
  123. webscout/Provider/OPENAI/sonus.py +0 -294
  124. webscout/Provider/OPENAI/standardinput.py +0 -425
  125. webscout/Provider/OPENAI/textpollinations.py +0 -329
  126. webscout/Provider/OPENAI/toolbaz.py +0 -406
  127. webscout/Provider/OPENAI/typegpt.py +0 -346
  128. webscout/Provider/OPENAI/uncovrAI.py +0 -455
  129. webscout/Provider/OPENAI/utils.py +0 -211
  130. webscout/Provider/OPENAI/venice.py +0 -413
  131. webscout/Provider/OPENAI/wisecat.py +0 -381
  132. webscout/Provider/OPENAI/writecream.py +0 -156
  133. webscout/Provider/OPENAI/x0gpt.py +0 -371
  134. webscout/Provider/OPENAI/yep.py +0 -327
  135. webscout/Provider/OpenGPT.py +0 -209
  136. webscout/Provider/Openai.py +0 -496
  137. webscout/Provider/PI.py +0 -429
  138. webscout/Provider/Perplexitylabs.py +0 -415
  139. webscout/Provider/QwenLM.py +0 -254
  140. webscout/Provider/Reka.py +0 -214
  141. webscout/Provider/StandardInput.py +0 -290
  142. webscout/Provider/TTI/AiForce/__init__.py +0 -22
  143. webscout/Provider/TTI/AiForce/async_aiforce.py +0 -224
  144. webscout/Provider/TTI/AiForce/sync_aiforce.py +0 -245
  145. webscout/Provider/TTI/FreeAIPlayground/__init__.py +0 -9
  146. webscout/Provider/TTI/FreeAIPlayground/async_freeaiplayground.py +0 -181
  147. webscout/Provider/TTI/FreeAIPlayground/sync_freeaiplayground.py +0 -180
  148. webscout/Provider/TTI/ImgSys/__init__.py +0 -23
  149. webscout/Provider/TTI/ImgSys/async_imgsys.py +0 -202
  150. webscout/Provider/TTI/ImgSys/sync_imgsys.py +0 -195
  151. webscout/Provider/TTI/MagicStudio/__init__.py +0 -2
  152. webscout/Provider/TTI/MagicStudio/async_magicstudio.py +0 -111
  153. webscout/Provider/TTI/MagicStudio/sync_magicstudio.py +0 -109
  154. webscout/Provider/TTI/Nexra/__init__.py +0 -22
  155. webscout/Provider/TTI/Nexra/async_nexra.py +0 -286
  156. webscout/Provider/TTI/Nexra/sync_nexra.py +0 -258
  157. webscout/Provider/TTI/PollinationsAI/__init__.py +0 -23
  158. webscout/Provider/TTI/PollinationsAI/async_pollinations.py +0 -311
  159. webscout/Provider/TTI/PollinationsAI/sync_pollinations.py +0 -265
  160. webscout/Provider/TTI/__init__.py +0 -12
  161. webscout/Provider/TTI/aiarta/__init__.py +0 -2
  162. webscout/Provider/TTI/aiarta/async_aiarta.py +0 -482
  163. webscout/Provider/TTI/aiarta/sync_aiarta.py +0 -440
  164. webscout/Provider/TTI/artbit/__init__.py +0 -22
  165. webscout/Provider/TTI/artbit/async_artbit.py +0 -155
  166. webscout/Provider/TTI/artbit/sync_artbit.py +0 -148
  167. webscout/Provider/TTI/fastflux/__init__.py +0 -22
  168. webscout/Provider/TTI/fastflux/async_fastflux.py +0 -261
  169. webscout/Provider/TTI/fastflux/sync_fastflux.py +0 -252
  170. webscout/Provider/TTI/huggingface/__init__.py +0 -22
  171. webscout/Provider/TTI/huggingface/async_huggingface.py +0 -199
  172. webscout/Provider/TTI/huggingface/sync_huggingface.py +0 -195
  173. webscout/Provider/TTI/piclumen/__init__.py +0 -23
  174. webscout/Provider/TTI/piclumen/async_piclumen.py +0 -268
  175. webscout/Provider/TTI/piclumen/sync_piclumen.py +0 -233
  176. webscout/Provider/TTI/pixelmuse/__init__.py +0 -4
  177. webscout/Provider/TTI/pixelmuse/async_pixelmuse.py +0 -249
  178. webscout/Provider/TTI/pixelmuse/sync_pixelmuse.py +0 -182
  179. webscout/Provider/TTI/talkai/__init__.py +0 -4
  180. webscout/Provider/TTI/talkai/async_talkai.py +0 -229
  181. webscout/Provider/TTI/talkai/sync_talkai.py +0 -207
  182. webscout/Provider/TTS/__init__.py +0 -8
  183. webscout/Provider/TTS/base.py +0 -159
  184. webscout/Provider/TTS/deepgram.py +0 -156
  185. webscout/Provider/TTS/elevenlabs.py +0 -111
  186. webscout/Provider/TTS/gesserit.py +0 -128
  187. webscout/Provider/TTS/murfai.py +0 -113
  188. webscout/Provider/TTS/parler.py +0 -111
  189. webscout/Provider/TTS/speechma.py +0 -180
  190. webscout/Provider/TTS/streamElements.py +0 -333
  191. webscout/Provider/TTS/utils.py +0 -280
  192. webscout/Provider/TeachAnything.py +0 -233
  193. webscout/Provider/TextPollinationsAI.py +0 -306
  194. webscout/Provider/TwoAI.py +0 -280
  195. webscout/Provider/TypliAI.py +0 -305
  196. webscout/Provider/Venice.py +0 -258
  197. webscout/Provider/VercelAI.py +0 -253
  198. webscout/Provider/WiseCat.py +0 -233
  199. webscout/Provider/WrDoChat.py +0 -370
  200. webscout/Provider/Writecream.py +0 -237
  201. webscout/Provider/WritingMate.py +0 -269
  202. webscout/Provider/Youchat.py +0 -330
  203. webscout/Provider/__init__.py +0 -178
  204. webscout/Provider/ai4chat.py +0 -203
  205. webscout/Provider/aimathgpt.py +0 -189
  206. webscout/Provider/akashgpt.py +0 -335
  207. webscout/Provider/asksteve.py +0 -212
  208. webscout/Provider/bagoodex.py +0 -145
  209. webscout/Provider/cerebras.py +0 -288
  210. webscout/Provider/chatglm.py +0 -215
  211. webscout/Provider/cleeai.py +0 -213
  212. webscout/Provider/copilot.py +0 -425
  213. webscout/Provider/elmo.py +0 -283
  214. webscout/Provider/freeaichat.py +0 -285
  215. webscout/Provider/geminiapi.py +0 -208
  216. webscout/Provider/geminiprorealtime.py +0 -160
  217. webscout/Provider/granite.py +0 -235
  218. webscout/Provider/hermes.py +0 -266
  219. webscout/Provider/julius.py +0 -223
  220. webscout/Provider/koala.py +0 -268
  221. webscout/Provider/learnfastai.py +0 -325
  222. webscout/Provider/llama3mitril.py +0 -215
  223. webscout/Provider/llmchat.py +0 -255
  224. webscout/Provider/llmchatco.py +0 -306
  225. webscout/Provider/meta.py +0 -798
  226. webscout/Provider/multichat.py +0 -364
  227. webscout/Provider/scira_chat.py +0 -297
  228. webscout/Provider/scnet.py +0 -243
  229. webscout/Provider/searchchat.py +0 -292
  230. webscout/Provider/sonus.py +0 -258
  231. webscout/Provider/talkai.py +0 -194
  232. webscout/Provider/toolbaz.py +0 -353
  233. webscout/Provider/turboseek.py +0 -266
  234. webscout/Provider/typefully.py +0 -330
  235. webscout/Provider/typegpt.py +0 -289
  236. webscout/Provider/uncovr.py +0 -368
  237. webscout/Provider/x0gpt.py +0 -299
  238. webscout/Provider/yep.py +0 -389
  239. webscout/litagent/__init__.py +0 -29
  240. webscout/litagent/agent.py +0 -455
  241. webscout/litagent/constants.py +0 -60
  242. webscout/litprinter/__init__.py +0 -59
  243. webscout/scout/__init__.py +0 -8
  244. webscout/scout/core/__init__.py +0 -7
  245. webscout/scout/core/crawler.py +0 -140
  246. webscout/scout/core/scout.py +0 -568
  247. webscout/scout/core/search_result.py +0 -96
  248. webscout/scout/core/text_analyzer.py +0 -63
  249. webscout/scout/core/text_utils.py +0 -277
  250. webscout/scout/core/web_analyzer.py +0 -52
  251. webscout/scout/core.py +0 -881
  252. webscout/scout/element.py +0 -460
  253. webscout/scout/parsers/__init__.py +0 -69
  254. webscout/scout/parsers/html5lib_parser.py +0 -172
  255. webscout/scout/parsers/html_parser.py +0 -236
  256. webscout/scout/parsers/lxml_parser.py +0 -178
  257. webscout/scout/utils.py +0 -37
  258. webscout/swiftcli/__init__.py +0 -95
  259. webscout/swiftcli/core/__init__.py +0 -7
  260. webscout/swiftcli/core/cli.py +0 -297
  261. webscout/swiftcli/core/context.py +0 -104
  262. webscout/swiftcli/core/group.py +0 -241
  263. webscout/swiftcli/decorators/__init__.py +0 -28
  264. webscout/swiftcli/decorators/command.py +0 -221
  265. webscout/swiftcli/decorators/options.py +0 -220
  266. webscout/swiftcli/decorators/output.py +0 -252
  267. webscout/swiftcli/exceptions.py +0 -21
  268. webscout/swiftcli/plugins/__init__.py +0 -9
  269. webscout/swiftcli/plugins/base.py +0 -135
  270. webscout/swiftcli/plugins/manager.py +0 -262
  271. webscout/swiftcli/utils/__init__.py +0 -59
  272. webscout/swiftcli/utils/formatting.py +0 -252
  273. webscout/swiftcli/utils/parsing.py +0 -267
  274. webscout/zeroart/__init__.py +0 -55
  275. webscout/zeroart/base.py +0 -60
  276. webscout/zeroart/effects.py +0 -99
  277. webscout/zeroart/fonts.py +0 -816
  278. webscout-8.2.6.dist-info/RECORD +0 -307
  279. webscout-8.2.6.dist-info/entry_points.txt +0 -3
  280. webscout-8.2.6.dist-info/top_level.txt +0 -2
  281. webstoken/__init__.py +0 -30
  282. webstoken/classifier.py +0 -189
  283. webstoken/keywords.py +0 -216
  284. webstoken/language.py +0 -128
  285. webstoken/ner.py +0 -164
  286. webstoken/normalizer.py +0 -35
  287. webstoken/processor.py +0 -77
  288. webstoken/sentiment.py +0 -206
  289. webstoken/stemmer.py +0 -73
  290. webstoken/tagger.py +0 -60
  291. webstoken/tokenizer.py +0 -158
  292. {webscout-8.2.6.dist-info → webscout-8.2.7.dist-info}/licenses/LICENSE.md +0 -0
@@ -1,469 +0,0 @@
1
- from curl_cffi.requests import Session
2
- from curl_cffi import CurlError
3
- import uuid
4
- import json
5
- import time
6
- import random
7
- import re
8
- from typing import Any, Dict, List, Optional, Union, Generator
9
-
10
- from webscout.AIutel import Conversation
11
- from webscout.AIbase import Provider
12
- from webscout import exceptions
13
- from webscout.litagent import LitAgent
14
-
15
class HuggingFaceChat(Provider):
    """
    A class to interact with the Hugging Face Chat API.
    Uses cookies for authentication and supports streaming responses.

    One server-side conversation is kept per model id in
    ``self._conversation_data``; prompts are sent as-is because the visible
    code relies on the remote conversation to carry the chat state.
    """

    # Default model ids. ``update_available_models`` replaces this list on the
    # instance when the live list can be scraped from the chat page.
    AVAILABLE_MODELS = [
        'meta-llama/Llama-3.3-70B-Instruct',
        'Qwen/Qwen3-235B-A22B',
        'Qwen/Qwen2.5-72B-Instruct',
        'CohereForAI/c4ai-command-r-plus-08-2024',
        'deepseek-ai/DeepSeek-R1-Distill-Qwen-32B',
        'nvidia/Llama-3.1-Nemotron-70B-Instruct-HF',
        'Qwen/QwQ-32B',
        'google/gemma-3-27b-it',
        'mistralai/Mistral-Small-3.1-24B-Instruct-2503',
        'Qwen/Qwen2.5-VL-32B-Instruct',
        'microsoft/Phi-4',
        'NousResearch/Hermes-3-Llama-3.1-8B',
        'internal/task',
    ]

    def __init__(
        self,
        is_conversation: bool = True,
        max_tokens: int = 2000,  # Note: max_tokens is not sent to this API
        timeout: int = 60,
        filepath: str = None,
        update_file: bool = True,
        proxies: Optional[dict] = None,
        model: str = "Qwen/QwQ-32B",
        cookie_path: str = "cookies.json",
        assistantId: str = None,
        system_prompt: str = "You are a helpful assistant. Please answer the following question.",
    ):
        """Initialize the HuggingFaceChat client.

        Args:
            is_conversation: Passed to ``Conversation``.
            max_tokens: Stored as ``max_tokens_to_sample`` and passed to
                ``Conversation``; never sent to the remote API.
            timeout: Timeout (seconds) used when posting a message.
            filepath: Passed to ``Conversation`` (history file).
            update_file: Passed to ``Conversation``.
            proxies: Proxy mapping assigned to the session; ``None`` means
                no proxies.
            model: Model id used by ``ask``/``chat``.
            cookie_path: JSON file holding exported browser cookies.
            assistantId: Sent as ``assistantId`` when a conversation is
                created; ``None`` when not provided.
            system_prompt: Sent as ``preprompt`` when a conversation is
                created.
        """
        self.url = "https://huggingface.co/chat"
        self.cookie_path = cookie_path
        self.session = Session()
        # Headers sent with every request.
        self.headers = {
            "Content-Type": "application/json",
            "Accept": "*/*",
            "Accept-Language": "en-US,en;q=0.9",
            "Origin": "https://huggingface.co",
            "Referer": "https://huggingface.co/chat",  # overridden per conversation
            "Sec-Fetch-Dest": "empty",
            "Sec-Fetch-Mode": "cors",
            "Sec-Fetch-Site": "same-origin",
            "DNT": "1",
            "Priority": "u=1, i"
        }

        self.session.headers.update(self.headers)
        # A fresh dict per instance: a mutable default would be shared by
        # every client created without explicit proxies.
        self.session.proxies = proxies if proxies is not None else {}
        self.system_prompt = system_prompt
        self.assistantId = assistantId or None  # falsy values are normalised to None

        # Load cookies for authentication and attach them to the session.
        self.cookies = self.load_cookies()
        if self.cookies:
            for name, value in self.cookies.items():
                self.session.cookies.set(name, value, domain="huggingface.co")

        # Refresh the model list (network call; falls back to the defaults).
        self.update_available_models()

        self.model = model

        # Provider settings
        self.is_conversation = is_conversation
        self.max_tokens_to_sample = max_tokens
        self.timeout = timeout
        self.last_response = {}

        # Local history object; in this class it is only used for saving
        # the exchange to a file.
        self.conversation = Conversation(is_conversation, max_tokens, filepath, update_file)

        # model id -> {"conversationId": ..., "messageId": ...}
        self._conversation_data = {}

    def update_available_models(self):
        """Replace ``self.AVAILABLE_MODELS`` with the live list when available."""
        try:
            models = self.get_models()
            if models:
                self.AVAILABLE_MODELS = models
        except Exception:
            # Deliberate best-effort: keep the default list if fetching fails.
            pass

    @classmethod
    def get_models(cls):
        """Fetch available model ids from the HuggingFace chat page.

        The page embeds the model list as a JavaScript object literal; it is
        rewritten into JSON with regular expressions before parsing.

        Returns:
            A list of model ids, or ``cls.AVAILABLE_MODELS`` when the page
            cannot be fetched or parsed.
        """
        try:
            # Temporary session, closed on exit so the handle is not leaked.
            with Session() as temp_session:
                response = temp_session.get(
                    "https://huggingface.co/chat",
                    impersonate="chrome110"
                )
                response.raise_for_status()
                text = response.text

            models_match = re.search(r'models:(\[.+?\]),oldModels:', text)
            if not models_match:
                return cls.AVAILABLE_MODELS

            models_text = models_match.group(1)
            # Drop the nested "parameters" objects and JS-only tokens.
            models_text = re.sub(r',parameters:{[^}]+?}', '', models_text)
            models_text = models_text.replace('void 0', 'null')
            # Quote bare object keys so the literal becomes valid JSON.
            models_text = re.sub(r'([{,])([A-Za-z0-9_]+?):', r'\1"\2":', models_text)

            models_data = json.loads(models_text)
            return [model["id"] for model in models_data]
        except Exception:  # network, HTTP, regex/JSON shape errors
            return cls.AVAILABLE_MODELS

    def load_cookies(self):
        """Load cookies from the JSON file at ``self.cookie_path``.

        The file is expected to hold a list of objects with ``name`` and
        ``value`` keys and an optional ``expirationDate`` (compared against
        ``time.time()``). Expired or incomplete entries are skipped.

        Returns:
            ``{name: value}``; an empty dict when the file is missing or
            malformed.
        """
        try:
            with open(self.cookie_path, 'r', encoding="utf-8") as f:
                cookies_data = json.load(f)

            now = time.time()
            return {
                cookie['name']: cookie['value']
                for cookie in cookies_data
                if 'name' in cookie and 'value' in cookie
                and ('expirationDate' not in cookie or cookie['expirationDate'] > now)
            }
        except (OSError, ValueError, TypeError, KeyError):
            # Best-effort: without usable cookies the client runs unauthenticated.
            return {}

    def create_conversation(self, model: str):
        """Create a new conversation with the specified model.

        On success the conversation id and a placeholder message id are
        stored in ``self._conversation_data[model]``, replacing any previous
        entry for that model.

        Returns:
            The conversation id, or ``None`` when the request fails, returns
            a non-200 status, or the reply carries no ``conversationId``.

        Raises:
            exceptions.AuthenticationError: The server answered 401.
        """
        url = "https://huggingface.co/chat/conversation"
        payload = {"model": model, "assistantId": self.assistantId, "preprompt": self.system_prompt}

        # Referer is specific to the model page for this request.
        headers = self.headers.copy()
        headers["Referer"] = f"https://huggingface.co/chat/models/{model}"

        try:
            response = self.session.post(
                url,
                json=payload,
                headers=headers,
                impersonate="chrome110"
            )

            if response.status_code == 401:
                raise exceptions.AuthenticationError("Authentication failed. Please check your cookies.")

            if response.status_code != 200:
                return None

            conversation_id = response.json().get("conversationId")
            if not conversation_id:
                return None

            # Always overwrite: a fresh conversation supersedes any stale entry.
            self._conversation_data[model] = {
                "conversationId": conversation_id,
                "messageId": str(uuid.uuid4())  # placeholder until refreshed
            }
            return conversation_id
        except exceptions.AuthenticationError:
            # Must not be swallowed by the generic handler below.
            raise
        except Exception:  # CurlError, JSON decoding errors, ...
            return None

    def fetch_message_id(self, conversation_id: str) -> str:
        """Fetch the latest message ID for a conversation.

        Reads the conversation's ``__data.json`` and follows the index
        references in ``nodes[1]["data"]`` to the id of the last message.

        Returns:
            The message id, or a random UUID string when the data cannot be
            fetched or has an unexpected shape.
        """
        try:
            url = f"https://huggingface.co/chat/conversation/{conversation_id}/__data.json?x-sveltekit-invalidated=11"
            response = self.session.get(
                url,
                headers=self.headers,
                impersonate="chrome110"
            )
            response.raise_for_status()

            # The body may contain several JSON documents, one per line;
            # use the first object that has a "nodes" key.
            json_data = None
            for line in response.text.split('\n'):
                if not line.strip():
                    continue
                try:
                    parsed = json.loads(line)
                except json.JSONDecodeError:
                    continue
                if isinstance(parsed, dict) and "nodes" in parsed:
                    json_data = parsed
                    break

            if not json_data:
                return str(uuid.uuid4())

            if json_data.get("nodes", []) and json_data["nodes"][-1].get("type") == "error":
                return str(uuid.uuid4())

            # Values in ``data`` are indices into ``data`` itself.
            data = json_data["nodes"][1]["data"]
            keys = data[data[0]["messages"]]
            message_keys = data[keys[-1]]
            return data[message_keys["id"]]
        except Exception:  # network errors and unexpected payload shapes
            return str(uuid.uuid4())

    def generate_boundary(self):
        """Generate a random boundary for multipart/form-data requests"""
        boundary_chars = "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789"
        suffix = "".join(random.choice(boundary_chars) for _ in range(16))
        return "----WebKitFormBoundary" + suffix

    def process_response(self, response, prompt: str):
        """Process a streaming response and yield its content.

        Each non-empty line of the response is parsed as a JSON event.

        Yields:
            ``{"text": token}`` for every answer token (or the final answer
            when no tokens were streamed). If reasoning tokens were received,
            a single ``{"text": "<think>...</think>\\n", "is_reasoning": True}``
            chunk is yielded before the first answer text, or at the end of
            the stream when there is no answer text.

        Returns:
            The accumulated answer text (generator return value).

        Side effects:
            Sets ``self.last_response`` when answer text was received and,
            if ``self.conversation.file`` is set, appends the exchange to the
            conversation history.
        """
        full_text = ""
        reasoning_text = ""
        reasoning_emitted = False

        def reasoning_chunk():
            return {"text": f"<think>\n{reasoning_text}\n</think>\n", "is_reasoning": True}

        # Decode manually instead of passing decode_unicode=True, so this
        # works whether the client hands back bytes or str lines.
        for raw_line in response.iter_lines():
            if not raw_line:
                continue
            if isinstance(raw_line, (bytes, bytearray)):
                line = raw_line.decode("utf-8", errors="replace")
            else:
                line = raw_line

            try:
                data = json.loads(line)
            except json.JSONDecodeError:
                continue

            if not isinstance(data, dict) or "type" not in data:
                continue

            event_type = data["type"]
            if event_type == "stream" and "token" in data:
                token = data["token"].replace("\u0000", "")
                if reasoning_text and not reasoning_emitted:
                    reasoning_emitted = True
                    yield reasoning_chunk()
                full_text += token
                yield {"text": token}
            elif event_type == "finalAnswer":
                final_text = data.get("text", "")
                # Only used when nothing was streamed token by token.
                if final_text and not full_text:
                    if reasoning_text and not reasoning_emitted:
                        reasoning_emitted = True
                        yield reasoning_chunk()
                    full_text = final_text
                    yield {"text": final_text}
            elif event_type == "reasoning":
                if data.get("subtype") == "stream" and "token" in data:
                    reasoning_text += data["token"]

        # Reasoning without any answer text: still surface it once.
        if reasoning_text and not reasoning_emitted:
            yield reasoning_chunk()

        if full_text:
            if reasoning_text:
                recorded_text = f"<think>\n{reasoning_text}\n</think>\n{full_text}"
            else:
                recorded_text = full_text
            self.last_response = {"text": recorded_text}
            # History is only persisted when a history file is configured.
            if self.conversation.file:
                self.conversation.update_chat_history(prompt, recorded_text)

        return full_text

    def _prepare_message(self, model: str, prompt: str, web_search: bool):
        """Return ``(url, request_data)`` for sending ``prompt`` to ``model``.

        Creates the conversation for ``model`` if none exists yet and
        refreshes the stored message id before building the payload.

        Raises:
            exceptions.FailedToGenerateResponseError: The conversation could
                not be created.
        """
        if model not in self._conversation_data:
            conversation_id = self.create_conversation(model)
            if not conversation_id:
                raise exceptions.FailedToGenerateResponseError(f"Failed to create conversation with model {model}")
        else:
            conversation_id = self._conversation_data[model]["conversationId"]

        # fetch_message_id falls back to a random UUID on failure, so this
        # never leaves the entry without an id.
        message_id = self.fetch_message_id(conversation_id)
        self._conversation_data[model]["messageId"] = message_id

        url = f"https://huggingface.co/chat/conversation/{conversation_id}"
        # The prompt is sent directly; no combined history prompt is built.
        request_data = {
            "inputs": prompt,
            "id": message_id,
            "is_retry": False,
            "is_continue": False,
            "web_search": web_search,
            "tools": ["66e85bb396d054c5771bc6cb", "00000000000000000000000a"]
        }
        return url, request_data

    def _send_message(self, url: str, request_data: dict):
        """POST ``request_data`` to ``url`` and return the streaming response.

        Tries multipart/form-data first and falls back to a plain JSON body
        when that attempt errors or does not return 200. Raises whatever the
        final ``raise_for_status`` raises.
        """
        boundary = self.generate_boundary()
        multipart_headers = self.headers.copy()
        multipart_headers["Content-Type"] = f"multipart/form-data; boundary={boundary}"

        data_json = json.dumps(request_data, separators=(',', ':'))
        body = (
            f"--{boundary}\r\n"
            'Content-Disposition: form-data; name="data"\r\n'
            "Content-Type: application/json\r\n\r\n"
            f"{data_json}\r\n"
            f"--{boundary}--\r\n"
        ).encode("utf-8")
        # Length of the encoded bytes, not of the str.
        multipart_headers["Content-Length"] = str(len(body))

        response = None
        try:
            response = self.session.post(
                url,
                data=body,
                headers=multipart_headers,
                stream=True,
                timeout=self.timeout,
                impersonate="chrome110"
            )
            response.raise_for_status()
        except Exception:
            response = None  # any failure here triggers the JSON fallback

        if response is None or response.status_code != 200:
            response = self.session.post(
                url,
                json=request_data,
                headers=self.headers,
                stream=True,
                timeout=self.timeout,
                impersonate="chrome110"
            )

        response.raise_for_status()
        return response

    def _next_untried_model(self, tried):
        """Return the next model after ``self.model`` not in ``tried``, or ``None``."""
        models = self.AVAILABLE_MODELS
        if len(models) <= 1:
            return None
        start = models.index(self.model) if self.model in models else 0
        for offset in range(1, len(models) + 1):
            candidate = models[(start + offset) % len(models)]
            if candidate not in tried:
                return candidate
        return None

    def ask(
        self,
        prompt: str,
        stream: bool = False,  # API supports streaming
        raw: bool = False,
        optimizer: str = None,  # Note: optimizer is not used by this API
        conversationally: bool = False,  # Note: conversationally is not used by this API
        web_search: bool = False,
    ) -> Union[Dict[str, Any], Generator]:
        """Send a message to the HuggingFace Chat API.

        If a request fails before any output was produced, the next model in
        ``AVAILABLE_MODELS`` that has not been tried yet is selected
        (``self.model`` is updated) and the prompt is sent again; each model
        is tried at most once per call.

        Args:
            prompt: Text sent as the message.
            stream: Return a generator of chunks instead of one result.
            raw: For non-stream calls, return the text as ``str`` instead of
                ``{"text": ...}``.
            optimizer: Unused.
            conversationally: Unused.
            web_search: Forwarded as ``web_search`` in the request.

        Returns:
            A generator of ``{"text": ...}`` dicts when ``stream`` is true,
            otherwise ``{"text": ...}`` (or ``str`` when ``raw``).

        Raises:
            exceptions.AuthenticationError: The server answered 401.
            exceptions.FailedToGenerateResponseError: The conversation could
                not be created or every attempt failed.
        """
        first_model = self.model
        first_attempt = self._prepare_message(first_model, prompt, web_search)

        def for_stream():
            attempt = first_attempt
            tried_models = {first_model}
            while True:
                produced_output = False
                try:
                    response = self._send_message(*attempt)
                    for chunk in self.process_response(response, prompt):
                        produced_output = True
                        yield chunk
                    return
                except exceptions.AuthenticationError:
                    raise
                except Exception as e:
                    failed = getattr(e, 'response', None)
                    if failed is not None and getattr(failed, 'status_code', None) == 401:
                        raise exceptions.AuthenticationError(
                            "Authentication failed. Please check your cookies."
                        ) from e

                    # Retrying after partial output would duplicate text, so
                    # only fall back when nothing has been yielded yet.
                    fallback = None if produced_output else self._next_untried_model(tried_models)
                    if fallback is not None:
                        tried_models.add(fallback)
                        self.model = fallback
                        if self.create_conversation(fallback):
                            attempt = self._prepare_message(fallback, prompt, web_search)
                            continue

                    raise exceptions.FailedToGenerateResponseError(
                        f"Request failed after trying fallback: {str(e)}"
                    ) from e

        def for_non_stream():
            # Aggregate the chunks produced by for_stream.
            response_text = ""
            try:
                for chunk_data in for_stream():
                    if isinstance(chunk_data, dict) and "text" in chunk_data:
                        response_text += chunk_data["text"]
                    elif raw and isinstance(chunk_data, str):
                        response_text += chunk_data
            except Exception as e:
                # Keep partial text if any was received; otherwise re-raise.
                if not response_text:
                    raise exceptions.FailedToGenerateResponseError(
                        f"Failed to get non-stream response: {str(e)}"
                    ) from e

            # last_response and history are updated inside process_response.
            return response_text if raw else {"text": response_text}

        return for_stream() if stream else for_non_stream()

    def chat(
        self,
        prompt: str,
        stream: bool = False,
        optimizer: str = None,  # Note: optimizer is not used by this API
        conversationally: bool = False,  # Note: conversationally is not used by this API
        web_search: bool = False
    ) -> Union[str, Generator]:
        """Generate a response to a prompt.

        Returns:
            The response text, or a generator of text pieces when ``stream``
            is true.
        """
        def for_stream_chat():
            gen = self.ask(
                prompt, stream=True, raw=False,
                optimizer=optimizer, conversationally=conversationally, web_search=web_search
            )
            for response_dict in gen:
                yield self.get_message(response_dict)

        def for_non_stream_chat():
            response_data = self.ask(
                prompt, stream=False, raw=False,
                optimizer=optimizer, conversationally=conversationally, web_search=web_search
            )
            return self.get_message(response_data)

        return for_stream_chat() if stream else for_non_stream_chat()

    def get_message(self, response: dict) -> str:
        """Extract message text from response"""
        assert isinstance(response, dict), "Response should be of dict data-type only"
        return response.get("text", "")