webscout 8.2.6__py3-none-any.whl → 8.2.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of webscout might be problematic. Click here for more details.

Files changed (292) hide show
  1. webscout/AIutel.py +97 -87
  2. webscout/version.py +1 -1
  3. {webscout-8.2.6.dist-info → webscout-8.2.7.dist-info}/METADATA +2 -15
  4. webscout-8.2.7.dist-info/RECORD +26 -0
  5. {webscout-8.2.6.dist-info → webscout-8.2.7.dist-info}/WHEEL +1 -1
  6. webscout-8.2.7.dist-info/entry_points.txt +3 -0
  7. webscout-8.2.7.dist-info/top_level.txt +1 -0
  8. webscout/Extra/GitToolkit/__init__.py +0 -10
  9. webscout/Extra/GitToolkit/gitapi/__init__.py +0 -12
  10. webscout/Extra/GitToolkit/gitapi/repository.py +0 -195
  11. webscout/Extra/GitToolkit/gitapi/user.py +0 -96
  12. webscout/Extra/GitToolkit/gitapi/utils.py +0 -62
  13. webscout/Extra/YTToolkit/YTdownloader.py +0 -957
  14. webscout/Extra/YTToolkit/__init__.py +0 -3
  15. webscout/Extra/YTToolkit/transcriber.py +0 -476
  16. webscout/Extra/YTToolkit/ytapi/__init__.py +0 -6
  17. webscout/Extra/YTToolkit/ytapi/channel.py +0 -307
  18. webscout/Extra/YTToolkit/ytapi/errors.py +0 -13
  19. webscout/Extra/YTToolkit/ytapi/extras.py +0 -45
  20. webscout/Extra/YTToolkit/ytapi/https.py +0 -88
  21. webscout/Extra/YTToolkit/ytapi/patterns.py +0 -61
  22. webscout/Extra/YTToolkit/ytapi/playlist.py +0 -59
  23. webscout/Extra/YTToolkit/ytapi/pool.py +0 -8
  24. webscout/Extra/YTToolkit/ytapi/query.py +0 -40
  25. webscout/Extra/YTToolkit/ytapi/stream.py +0 -63
  26. webscout/Extra/YTToolkit/ytapi/utils.py +0 -62
  27. webscout/Extra/YTToolkit/ytapi/video.py +0 -232
  28. webscout/Extra/__init__.py +0 -7
  29. webscout/Extra/autocoder/__init__.py +0 -9
  30. webscout/Extra/autocoder/autocoder.py +0 -910
  31. webscout/Extra/autocoder/autocoder_utiles.py +0 -332
  32. webscout/Extra/gguf.py +0 -684
  33. webscout/Extra/tempmail/__init__.py +0 -28
  34. webscout/Extra/tempmail/async_utils.py +0 -141
  35. webscout/Extra/tempmail/base.py +0 -161
  36. webscout/Extra/tempmail/cli.py +0 -187
  37. webscout/Extra/tempmail/emailnator.py +0 -84
  38. webscout/Extra/tempmail/mail_tm.py +0 -361
  39. webscout/Extra/tempmail/temp_mail_io.py +0 -292
  40. webscout/Extra/weather.py +0 -194
  41. webscout/Extra/weather_ascii.py +0 -76
  42. webscout/Litlogger/__init__.py +0 -67
  43. webscout/Litlogger/core/__init__.py +0 -6
  44. webscout/Litlogger/core/level.py +0 -23
  45. webscout/Litlogger/core/logger.py +0 -165
  46. webscout/Litlogger/handlers/__init__.py +0 -12
  47. webscout/Litlogger/handlers/console.py +0 -33
  48. webscout/Litlogger/handlers/file.py +0 -143
  49. webscout/Litlogger/handlers/network.py +0 -173
  50. webscout/Litlogger/styles/__init__.py +0 -7
  51. webscout/Litlogger/styles/colors.py +0 -249
  52. webscout/Litlogger/styles/formats.py +0 -458
  53. webscout/Litlogger/styles/text.py +0 -87
  54. webscout/Litlogger/utils/__init__.py +0 -6
  55. webscout/Litlogger/utils/detectors.py +0 -153
  56. webscout/Litlogger/utils/formatters.py +0 -200
  57. webscout/Provider/AI21.py +0 -177
  58. webscout/Provider/AISEARCH/DeepFind.py +0 -250
  59. webscout/Provider/AISEARCH/ISou.py +0 -256
  60. webscout/Provider/AISEARCH/Perplexity.py +0 -359
  61. webscout/Provider/AISEARCH/__init__.py +0 -10
  62. webscout/Provider/AISEARCH/felo_search.py +0 -228
  63. webscout/Provider/AISEARCH/genspark_search.py +0 -208
  64. webscout/Provider/AISEARCH/hika_search.py +0 -198
  65. webscout/Provider/AISEARCH/iask_search.py +0 -436
  66. webscout/Provider/AISEARCH/monica_search.py +0 -246
  67. webscout/Provider/AISEARCH/scira_search.py +0 -322
  68. webscout/Provider/AISEARCH/webpilotai_search.py +0 -281
  69. webscout/Provider/Aitopia.py +0 -316
  70. webscout/Provider/AllenAI.py +0 -447
  71. webscout/Provider/Andi.py +0 -228
  72. webscout/Provider/Blackboxai.py +0 -229
  73. webscout/Provider/ChatGPTClone.py +0 -237
  74. webscout/Provider/ChatGPTGratis.py +0 -194
  75. webscout/Provider/ChatSandbox.py +0 -342
  76. webscout/Provider/Cloudflare.py +0 -325
  77. webscout/Provider/Cohere.py +0 -208
  78. webscout/Provider/Deepinfra.py +0 -338
  79. webscout/Provider/ElectronHub.py +0 -773
  80. webscout/Provider/ExaAI.py +0 -261
  81. webscout/Provider/ExaChat.py +0 -358
  82. webscout/Provider/Free2GPT.py +0 -241
  83. webscout/Provider/GPTWeb.py +0 -249
  84. webscout/Provider/Gemini.py +0 -169
  85. webscout/Provider/GithubChat.py +0 -370
  86. webscout/Provider/GizAI.py +0 -285
  87. webscout/Provider/Glider.py +0 -222
  88. webscout/Provider/Groq.py +0 -801
  89. webscout/Provider/HF_space/__init__.py +0 -0
  90. webscout/Provider/HF_space/qwen_qwen2.py +0 -206
  91. webscout/Provider/HeckAI.py +0 -257
  92. webscout/Provider/HuggingFaceChat.py +0 -469
  93. webscout/Provider/Hunyuan.py +0 -283
  94. webscout/Provider/Jadve.py +0 -291
  95. webscout/Provider/Koboldai.py +0 -381
  96. webscout/Provider/LambdaChat.py +0 -411
  97. webscout/Provider/Llama3.py +0 -259
  98. webscout/Provider/MCPCore.py +0 -315
  99. webscout/Provider/Marcus.py +0 -206
  100. webscout/Provider/Nemotron.py +0 -218
  101. webscout/Provider/Netwrck.py +0 -270
  102. webscout/Provider/OLLAMA.py +0 -396
  103. webscout/Provider/OPENAI/__init__.py +0 -28
  104. webscout/Provider/OPENAI/ai4chat.py +0 -286
  105. webscout/Provider/OPENAI/base.py +0 -46
  106. webscout/Provider/OPENAI/c4ai.py +0 -367
  107. webscout/Provider/OPENAI/chatgpt.py +0 -549
  108. webscout/Provider/OPENAI/chatgptclone.py +0 -481
  109. webscout/Provider/OPENAI/deepinfra.py +0 -309
  110. webscout/Provider/OPENAI/e2b.py +0 -1350
  111. webscout/Provider/OPENAI/exaai.py +0 -404
  112. webscout/Provider/OPENAI/exachat.py +0 -437
  113. webscout/Provider/OPENAI/freeaichat.py +0 -352
  114. webscout/Provider/OPENAI/glider.py +0 -316
  115. webscout/Provider/OPENAI/groq.py +0 -354
  116. webscout/Provider/OPENAI/heckai.py +0 -341
  117. webscout/Provider/OPENAI/llmchatco.py +0 -327
  118. webscout/Provider/OPENAI/mcpcore.py +0 -376
  119. webscout/Provider/OPENAI/multichat.py +0 -368
  120. webscout/Provider/OPENAI/netwrck.py +0 -350
  121. webscout/Provider/OPENAI/opkfc.py +0 -488
  122. webscout/Provider/OPENAI/scirachat.py +0 -462
  123. webscout/Provider/OPENAI/sonus.py +0 -294
  124. webscout/Provider/OPENAI/standardinput.py +0 -425
  125. webscout/Provider/OPENAI/textpollinations.py +0 -329
  126. webscout/Provider/OPENAI/toolbaz.py +0 -406
  127. webscout/Provider/OPENAI/typegpt.py +0 -346
  128. webscout/Provider/OPENAI/uncovrAI.py +0 -455
  129. webscout/Provider/OPENAI/utils.py +0 -211
  130. webscout/Provider/OPENAI/venice.py +0 -413
  131. webscout/Provider/OPENAI/wisecat.py +0 -381
  132. webscout/Provider/OPENAI/writecream.py +0 -156
  133. webscout/Provider/OPENAI/x0gpt.py +0 -371
  134. webscout/Provider/OPENAI/yep.py +0 -327
  135. webscout/Provider/OpenGPT.py +0 -209
  136. webscout/Provider/Openai.py +0 -496
  137. webscout/Provider/PI.py +0 -429
  138. webscout/Provider/Perplexitylabs.py +0 -415
  139. webscout/Provider/QwenLM.py +0 -254
  140. webscout/Provider/Reka.py +0 -214
  141. webscout/Provider/StandardInput.py +0 -290
  142. webscout/Provider/TTI/AiForce/__init__.py +0 -22
  143. webscout/Provider/TTI/AiForce/async_aiforce.py +0 -224
  144. webscout/Provider/TTI/AiForce/sync_aiforce.py +0 -245
  145. webscout/Provider/TTI/FreeAIPlayground/__init__.py +0 -9
  146. webscout/Provider/TTI/FreeAIPlayground/async_freeaiplayground.py +0 -181
  147. webscout/Provider/TTI/FreeAIPlayground/sync_freeaiplayground.py +0 -180
  148. webscout/Provider/TTI/ImgSys/__init__.py +0 -23
  149. webscout/Provider/TTI/ImgSys/async_imgsys.py +0 -202
  150. webscout/Provider/TTI/ImgSys/sync_imgsys.py +0 -195
  151. webscout/Provider/TTI/MagicStudio/__init__.py +0 -2
  152. webscout/Provider/TTI/MagicStudio/async_magicstudio.py +0 -111
  153. webscout/Provider/TTI/MagicStudio/sync_magicstudio.py +0 -109
  154. webscout/Provider/TTI/Nexra/__init__.py +0 -22
  155. webscout/Provider/TTI/Nexra/async_nexra.py +0 -286
  156. webscout/Provider/TTI/Nexra/sync_nexra.py +0 -258
  157. webscout/Provider/TTI/PollinationsAI/__init__.py +0 -23
  158. webscout/Provider/TTI/PollinationsAI/async_pollinations.py +0 -311
  159. webscout/Provider/TTI/PollinationsAI/sync_pollinations.py +0 -265
  160. webscout/Provider/TTI/__init__.py +0 -12
  161. webscout/Provider/TTI/aiarta/__init__.py +0 -2
  162. webscout/Provider/TTI/aiarta/async_aiarta.py +0 -482
  163. webscout/Provider/TTI/aiarta/sync_aiarta.py +0 -440
  164. webscout/Provider/TTI/artbit/__init__.py +0 -22
  165. webscout/Provider/TTI/artbit/async_artbit.py +0 -155
  166. webscout/Provider/TTI/artbit/sync_artbit.py +0 -148
  167. webscout/Provider/TTI/fastflux/__init__.py +0 -22
  168. webscout/Provider/TTI/fastflux/async_fastflux.py +0 -261
  169. webscout/Provider/TTI/fastflux/sync_fastflux.py +0 -252
  170. webscout/Provider/TTI/huggingface/__init__.py +0 -22
  171. webscout/Provider/TTI/huggingface/async_huggingface.py +0 -199
  172. webscout/Provider/TTI/huggingface/sync_huggingface.py +0 -195
  173. webscout/Provider/TTI/piclumen/__init__.py +0 -23
  174. webscout/Provider/TTI/piclumen/async_piclumen.py +0 -268
  175. webscout/Provider/TTI/piclumen/sync_piclumen.py +0 -233
  176. webscout/Provider/TTI/pixelmuse/__init__.py +0 -4
  177. webscout/Provider/TTI/pixelmuse/async_pixelmuse.py +0 -249
  178. webscout/Provider/TTI/pixelmuse/sync_pixelmuse.py +0 -182
  179. webscout/Provider/TTI/talkai/__init__.py +0 -4
  180. webscout/Provider/TTI/talkai/async_talkai.py +0 -229
  181. webscout/Provider/TTI/talkai/sync_talkai.py +0 -207
  182. webscout/Provider/TTS/__init__.py +0 -8
  183. webscout/Provider/TTS/base.py +0 -159
  184. webscout/Provider/TTS/deepgram.py +0 -156
  185. webscout/Provider/TTS/elevenlabs.py +0 -111
  186. webscout/Provider/TTS/gesserit.py +0 -128
  187. webscout/Provider/TTS/murfai.py +0 -113
  188. webscout/Provider/TTS/parler.py +0 -111
  189. webscout/Provider/TTS/speechma.py +0 -180
  190. webscout/Provider/TTS/streamElements.py +0 -333
  191. webscout/Provider/TTS/utils.py +0 -280
  192. webscout/Provider/TeachAnything.py +0 -233
  193. webscout/Provider/TextPollinationsAI.py +0 -306
  194. webscout/Provider/TwoAI.py +0 -280
  195. webscout/Provider/TypliAI.py +0 -305
  196. webscout/Provider/Venice.py +0 -258
  197. webscout/Provider/VercelAI.py +0 -253
  198. webscout/Provider/WiseCat.py +0 -233
  199. webscout/Provider/WrDoChat.py +0 -370
  200. webscout/Provider/Writecream.py +0 -237
  201. webscout/Provider/WritingMate.py +0 -269
  202. webscout/Provider/Youchat.py +0 -330
  203. webscout/Provider/__init__.py +0 -178
  204. webscout/Provider/ai4chat.py +0 -203
  205. webscout/Provider/aimathgpt.py +0 -189
  206. webscout/Provider/akashgpt.py +0 -335
  207. webscout/Provider/asksteve.py +0 -212
  208. webscout/Provider/bagoodex.py +0 -145
  209. webscout/Provider/cerebras.py +0 -288
  210. webscout/Provider/chatglm.py +0 -215
  211. webscout/Provider/cleeai.py +0 -213
  212. webscout/Provider/copilot.py +0 -425
  213. webscout/Provider/elmo.py +0 -283
  214. webscout/Provider/freeaichat.py +0 -285
  215. webscout/Provider/geminiapi.py +0 -208
  216. webscout/Provider/geminiprorealtime.py +0 -160
  217. webscout/Provider/granite.py +0 -235
  218. webscout/Provider/hermes.py +0 -266
  219. webscout/Provider/julius.py +0 -223
  220. webscout/Provider/koala.py +0 -268
  221. webscout/Provider/learnfastai.py +0 -325
  222. webscout/Provider/llama3mitril.py +0 -215
  223. webscout/Provider/llmchat.py +0 -255
  224. webscout/Provider/llmchatco.py +0 -306
  225. webscout/Provider/meta.py +0 -798
  226. webscout/Provider/multichat.py +0 -364
  227. webscout/Provider/scira_chat.py +0 -297
  228. webscout/Provider/scnet.py +0 -243
  229. webscout/Provider/searchchat.py +0 -292
  230. webscout/Provider/sonus.py +0 -258
  231. webscout/Provider/talkai.py +0 -194
  232. webscout/Provider/toolbaz.py +0 -353
  233. webscout/Provider/turboseek.py +0 -266
  234. webscout/Provider/typefully.py +0 -330
  235. webscout/Provider/typegpt.py +0 -289
  236. webscout/Provider/uncovr.py +0 -368
  237. webscout/Provider/x0gpt.py +0 -299
  238. webscout/Provider/yep.py +0 -389
  239. webscout/litagent/__init__.py +0 -29
  240. webscout/litagent/agent.py +0 -455
  241. webscout/litagent/constants.py +0 -60
  242. webscout/litprinter/__init__.py +0 -59
  243. webscout/scout/__init__.py +0 -8
  244. webscout/scout/core/__init__.py +0 -7
  245. webscout/scout/core/crawler.py +0 -140
  246. webscout/scout/core/scout.py +0 -568
  247. webscout/scout/core/search_result.py +0 -96
  248. webscout/scout/core/text_analyzer.py +0 -63
  249. webscout/scout/core/text_utils.py +0 -277
  250. webscout/scout/core/web_analyzer.py +0 -52
  251. webscout/scout/core.py +0 -881
  252. webscout/scout/element.py +0 -460
  253. webscout/scout/parsers/__init__.py +0 -69
  254. webscout/scout/parsers/html5lib_parser.py +0 -172
  255. webscout/scout/parsers/html_parser.py +0 -236
  256. webscout/scout/parsers/lxml_parser.py +0 -178
  257. webscout/scout/utils.py +0 -37
  258. webscout/swiftcli/__init__.py +0 -95
  259. webscout/swiftcli/core/__init__.py +0 -7
  260. webscout/swiftcli/core/cli.py +0 -297
  261. webscout/swiftcli/core/context.py +0 -104
  262. webscout/swiftcli/core/group.py +0 -241
  263. webscout/swiftcli/decorators/__init__.py +0 -28
  264. webscout/swiftcli/decorators/command.py +0 -221
  265. webscout/swiftcli/decorators/options.py +0 -220
  266. webscout/swiftcli/decorators/output.py +0 -252
  267. webscout/swiftcli/exceptions.py +0 -21
  268. webscout/swiftcli/plugins/__init__.py +0 -9
  269. webscout/swiftcli/plugins/base.py +0 -135
  270. webscout/swiftcli/plugins/manager.py +0 -262
  271. webscout/swiftcli/utils/__init__.py +0 -59
  272. webscout/swiftcli/utils/formatting.py +0 -252
  273. webscout/swiftcli/utils/parsing.py +0 -267
  274. webscout/zeroart/__init__.py +0 -55
  275. webscout/zeroart/base.py +0 -60
  276. webscout/zeroart/effects.py +0 -99
  277. webscout/zeroart/fonts.py +0 -816
  278. webscout-8.2.6.dist-info/RECORD +0 -307
  279. webscout-8.2.6.dist-info/entry_points.txt +0 -3
  280. webscout-8.2.6.dist-info/top_level.txt +0 -2
  281. webstoken/__init__.py +0 -30
  282. webstoken/classifier.py +0 -189
  283. webstoken/keywords.py +0 -216
  284. webstoken/language.py +0 -128
  285. webstoken/ner.py +0 -164
  286. webstoken/normalizer.py +0 -35
  287. webstoken/processor.py +0 -77
  288. webstoken/sentiment.py +0 -206
  289. webstoken/stemmer.py +0 -73
  290. webstoken/tagger.py +0 -60
  291. webstoken/tokenizer.py +0 -158
  292. {webscout-8.2.6.dist-info → webscout-8.2.7.dist-info}/licenses/LICENSE.md +0 -0
@@ -1,447 +0,0 @@
1
- from curl_cffi.requests import Session
2
- from curl_cffi import CurlError
3
- import json
4
- import os
5
- from uuid import uuid4
6
- from typing import Any, Dict, Optional, Generator, Union
7
-
8
- from webscout.AIutel import Optimizers
9
- from webscout.AIutel import Conversation
10
- from webscout.AIutel import AwesomePrompts, sanitize_stream
11
- from webscout.AIbase import Provider, AsyncProvider
12
- from webscout import exceptions
13
- from webscout.litagent import LitAgent
14
-
15
- class AllenAI(Provider):
16
- """
17
- A class to interact with the AllenAI (Ai2 Playground) API.
18
- """
19
-
20
- AVAILABLE_MODELS = [
21
- 'OLMo-2-1124-13B-Instruct',
22
- 'Llama-3-1-Tulu-3-8B',
23
- 'olmo-2-0325-32b-instruct',
24
- 'Llama-3-1-Tulu-3-70B',
25
- 'OLMoE-1B-7B-0924-Instruct',
26
- 'tulu3-405b',
27
- 'olmo-2-0325-32b-instruct',
28
- 'tulu-3-1-8b',
29
- 'olmoe-0125'
30
- ]
31
-
32
- # Default model options from JS implementation
33
- DEFAULT_OPTIONS = {
34
- "max_tokens": 2048,
35
- "temperature": 0.7,
36
- "top_p": 1,
37
- "n": 1,
38
- "stop": None,
39
- "logprobs": None
40
- }
41
-
42
- # Host mapping for models - some models work best with specific hosts
43
- MODEL_HOST_MAP = {
44
- 'tulu3-405b': 'inferd',
45
- 'tulu2': 'inferd',
46
- 'olmo-7b-instruct': 'inferd'
47
- }
48
-
49
- def __init__(
50
- self,
51
- is_conversation: bool = True,
52
- max_tokens: int = 2048,
53
- timeout: int = 30,
54
- intro: str = None,
55
- filepath: str = None,
56
- update_file: bool = True,
57
- proxies: dict = {},
58
- history_offset: int = 10250,
59
- act: str = None,
60
- model: str = "OLMo-2-1124-13B-Instruct",
61
- host: str = None
62
- ):
63
- """Initializes the AllenAI API client."""
64
- if model not in self.AVAILABLE_MODELS:
65
- raise ValueError(f"Invalid model: {model}. Choose from: {self.AVAILABLE_MODELS}")
66
-
67
- self.url = "https://playground.allenai.org"
68
- self.api_endpoint = "https://olmo-api.allen.ai/v3/message/stream"
69
- self.whoami_endpoint = "https://olmo-api.allen.ai/v3/whoami"
70
-
71
- # Updated headers (remove those handled by impersonate)
72
- self.headers = {
73
- 'Accept': '*/*',
74
- 'Accept-Language': 'id-ID,id;q=0.9',
75
- 'Origin': self.url,
76
- 'Referer': f"{self.url}/",
77
- 'Cache-Control': 'no-cache',
78
- 'Pragma': 'no-cache',
79
- 'Priority': 'u=1, i',
80
- 'Sec-Fetch-Dest': 'empty',
81
- 'Sec-Fetch-Mode': 'cors',
82
- 'Sec-Fetch-Site': 'cross-site',
83
- 'Content-Type': 'application/json'
84
- }
85
-
86
- # Initialize curl_cffi Session
87
- self.session = Session()
88
- # Update curl_cffi session headers and proxies
89
- self.session.headers.update(self.headers)
90
- self.session.proxies = proxies
91
-
92
- self.model = model
93
-
94
- # Auto-detect host if not provided
95
- if not host:
96
- # Use the preferred host from the model-host map, or default to modal
97
- self.host = self.MODEL_HOST_MAP.get(model, 'modal')
98
- else:
99
- self.host = host
100
-
101
- self.is_conversation = is_conversation
102
- self.max_tokens_to_sample = max_tokens
103
- self.timeout = timeout
104
- self.last_response = {}
105
- # Generate user ID if needed
106
- self.x_anonymous_user_id = None
107
- self.parent = None
108
-
109
- # Default options
110
- self.options = self.DEFAULT_OPTIONS.copy()
111
- self.options["max_tokens"] = max_tokens
112
-
113
- self.__available_optimizers = (
114
- method
115
- for method in dir(Optimizers)
116
- if callable(getattr(Optimizers, method)) and not method.startswith("__")
117
- )
118
- Conversation.intro = (
119
- AwesomePrompts().get_act(
120
- act, raise_not_found=True, default=None, case_insensitive=True
121
- )
122
- if act
123
- else intro or Conversation.intro
124
- )
125
-
126
- self.conversation = Conversation(
127
- is_conversation, self.max_tokens_to_sample, filepath, update_file
128
- )
129
- self.conversation.history_offset = history_offset
130
-
131
- def whoami(self):
132
- """Gets or creates a user ID for authentication with Allen AI API"""
133
- temp_id = str(uuid4())
134
- request_headers = self.session.headers.copy() # Use session headers as base
135
- request_headers.update({"x-anonymous-user-id": temp_id})
136
-
137
- try:
138
- # Use curl_cffi session get with impersonate
139
- response = self.session.get(
140
- self.whoami_endpoint,
141
- headers=request_headers, # Pass updated headers
142
- timeout=self.timeout,
143
- impersonate="chrome110" # Use a common impersonation profile
144
- )
145
- response.raise_for_status() # Check for HTTP errors
146
-
147
- data = response.json()
148
- self.x_anonymous_user_id = data.get("client", temp_id)
149
- return data
150
-
151
- except CurlError as e: # Catch CurlError
152
- self.x_anonymous_user_id = temp_id
153
- return {"client": temp_id, "error": f"CurlError: {e}"}
154
- except Exception as e: # Catch other potential exceptions (like HTTPError, JSONDecodeError)
155
- self.x_anonymous_user_id = temp_id
156
- err_text = getattr(e, 'response', None) and getattr(e.response, 'text', '')
157
- return {"client": temp_id, "error": f"{type(e).__name__}: {e} - {err_text}"}
158
-
159
- @staticmethod
160
- def _allenai_extractor(chunk: Union[str, Dict[str, Any]]) -> Optional[str]:
161
- """Extracts content from AllenAI stream JSON objects."""
162
- if isinstance(chunk, dict):
163
- if chunk.get("message", "").startswith("msg_") and "content" in chunk:
164
- return chunk.get("content")
165
- elif "message" in chunk and chunk.get("content"): # Legacy handling
166
- return chunk.get("content")
167
- return None
168
-
169
- def ask(
170
- self,
171
- prompt: str,
172
- stream: bool = False, # API supports streaming
173
- raw: bool = False,
174
- optimizer: str = None,
175
- conversationally: bool = False,
176
- host: str = None,
177
- private: bool = False,
178
- top_p: float = None,
179
- temperature: float = None,
180
- options: dict = None,
181
- ) -> Union[Dict[str, Any], Generator]:
182
- conversation_prompt = self.conversation.gen_complete_prompt(prompt)
183
- if optimizer:
184
- if optimizer in self.__available_optimizers:
185
- conversation_prompt = getattr(Optimizers, optimizer)(conversation_prompt if conversationally else prompt)
186
- else:
187
- raise Exception(f"Optimizer is not one of {self.__available_optimizers}")
188
-
189
- # Ensure we have a user ID
190
- if not self.x_anonymous_user_id:
191
- self.whoami()
192
- # Check if whoami failed and we still don't have an ID
193
- if not self.x_anonymous_user_id:
194
- raise exceptions.AuthenticationError("Failed to obtain anonymous user ID.")
195
-
196
- # Prepare the API request headers for this specific request
197
- request_headers = self.session.headers.copy()
198
- request_headers.update({
199
- "x-anonymous-user-id": self.x_anonymous_user_id,
200
- "Content-Type": "application/json" # Ensure Content-Type is set
201
- })
202
-
203
- # Create options dictionary
204
- opts = self.options.copy()
205
- if temperature is not None:
206
- opts["temperature"] = temperature
207
- if top_p is not None:
208
- opts["top_p"] = top_p
209
- if options:
210
- opts.update(options)
211
-
212
- # Use the host param or the default host
213
- use_host = host or self.host
214
-
215
- # List of hosts to try - start with provided host, then try alternative hosts
216
- hosts_to_try = [use_host]
217
- if use_host == 'modal':
218
- hosts_to_try.append('inferd')
219
- else:
220
- hosts_to_try.append('modal')
221
-
222
- last_error = None
223
-
224
- # Try each host until one works
225
- for current_host in hosts_to_try:
226
- # Create the JSON payload as per the JS implementation
227
- payload = {
228
- "content": conversation_prompt,
229
- "private": private,
230
- "model": self.model,
231
- "host": current_host,
232
- "opts": opts
233
- }
234
- payload["host"] = current_host # Ensure host is updated in payload
235
-
236
- try:
237
- if stream:
238
- # Pass request_headers to the stream method
239
- return self._stream_request(payload, prompt, request_headers, raw)
240
- else:
241
- # Pass request_headers to the non-stream method
242
- return self._non_stream_request(payload, prompt, request_headers, raw)
243
- except (exceptions.FailedToGenerateResponseError, CurlError, Exception) as e:
244
- last_error = e
245
- # Log the error but continue to try other hosts
246
- print(f"Host '{current_host}' failed for model '{self.model}' ({type(e).__name__}), trying next host...")
247
- continue
248
-
249
- # If we've tried all hosts and none worked, raise the last error
250
- raise last_error or exceptions.FailedToGenerateResponseError("All hosts failed. Unable to complete request.")
251
-
252
- def _stream_request(self, payload, prompt, request_headers, raw=False):
253
- """Handle streaming requests with the given payload and headers"""
254
- streaming_text = "" # Initialize outside try block
255
- current_parent = None # Initialize outside try block
256
- try:
257
- # Use curl_cffi session post with impersonate
258
- response = self.session.post(
259
- self.api_endpoint,
260
- headers=request_headers, # Use headers passed to this method
261
- json=payload,
262
- stream=True,
263
- timeout=self.timeout,
264
- impersonate="chrome110" # Use a common impersonation profile
265
- )
266
- response.raise_for_status() # Check for HTTP errors
267
-
268
- # Use sanitize_stream
269
- processed_stream = sanitize_stream(
270
- data=response.iter_content(chunk_size=None), # Pass byte iterator
271
- intro_value=None, # No prefix
272
- to_json=True, # Stream sends JSON lines
273
- content_extractor=self._allenai_extractor, # Use the specific extractor
274
- yield_raw_on_error=False # Skip non-JSON lines or lines where extractor fails
275
- )
276
-
277
- for content_chunk in processed_stream:
278
- # content_chunk is the string extracted by _allenai_extractor
279
- if content_chunk and isinstance(content_chunk, str):
280
- streaming_text += content_chunk
281
- resp = dict(text=content_chunk)
282
- yield resp if not raw else content_chunk
283
-
284
- # Try to extract parent ID from the *last* raw line (less reliable than before)
285
- # This part is tricky as sanitize_stream consumes the raw lines.
286
- # We might need to re-fetch or adjust if parent ID is critical per stream.
287
- # For now, we'll rely on the non-stream request to update parent ID more reliably.
288
- # Example placeholder logic (might not work reliably):
289
- try:
290
- last_line_data = json.loads(response.text.splitlines()[-1]) # Get last line if possible
291
- if last_line_data.get("id"):
292
- current_parent = last_line_data.get("id")
293
- elif last_line_data.get("children"):
294
- for child in last_line_data["children"]: # Use last_line_data here
295
- if child.get("role") == "assistant":
296
- current_parent = child.get("id")
297
- break
298
-
299
- # Handle completion
300
- if last_line_data.get("final") or last_line_data.get("finish_reason") == "stop":
301
- if current_parent:
302
- self.parent = current_parent
303
-
304
- # Update conversation history
305
- self.conversation.update_chat_history(prompt, streaming_text)
306
- self.last_response = {"text": streaming_text} # Update last response here
307
- return # End the generator
308
- except Exception as e:
309
- # Log the error but continue with the rest of the function
310
- print(f"Error processing response data: {str(e)}")
311
-
312
- # If loop finishes without returning (e.g., no final message), update history
313
- if current_parent:
314
- self.parent = current_parent
315
- self.conversation.update_chat_history(prompt, streaming_text)
316
- self.last_response = {"text": streaming_text}
317
-
318
- except CurlError as e: # Catch CurlError
319
- raise exceptions.FailedToGenerateResponseError(f"Request failed (CurlError): {str(e)}") from e
320
- except Exception as e: # Catch other potential exceptions (like HTTPError)
321
- err_text = getattr(e, 'response', None) and getattr(e.response, 'text', '')
322
- raise exceptions.FailedToGenerateResponseError(f"Request failed ({type(e).__name__}): {str(e)} - {err_text}") from e
323
-
324
-
325
- def _non_stream_request(self, payload, prompt, request_headers, raw=False):
326
- """Handle non-streaming requests with the given payload and headers"""
327
- try:
328
- # Use curl_cffi session post with impersonate
329
- response = self.session.post(
330
- self.api_endpoint,
331
- headers=request_headers, # Use headers passed to this method
332
- json=payload,
333
- stream=False, # Explicitly set stream to False
334
- timeout=self.timeout,
335
- impersonate="chrome110" # Use a common impersonation profile
336
- )
337
- response.raise_for_status() # Check for HTTP errors
338
-
339
- raw_response = response.text # Get raw text
340
-
341
- # Process the full text using sanitize_stream line by line
342
- processed_stream = sanitize_stream(
343
- data=raw_response.splitlines(), # Split into lines
344
- intro_value=None,
345
- to_json=True,
346
- content_extractor=self._allenai_extractor,
347
- yield_raw_on_error=False
348
- )
349
- # Aggregate the results
350
- parsed_response = "".join(list(processed_stream))
351
-
352
- # Update parent ID from the full response if possible (might need adjustment based on actual non-stream response structure)
353
- # This part is speculative as the non-stream structure isn't fully clear from the stream logic
354
- try:
355
- lines = raw_response.splitlines()
356
- if lines:
357
- last_line_data = json.loads(lines[-1])
358
- if last_line_data.get("id"):
359
- self.parent = last_line_data.get("id")
360
- elif last_line_data.get("children"):
361
- for child in last_line_data["children"]:
362
- if child.get("role") == "assistant":
363
- self.parent = child.get("id")
364
- break
365
- except (json.JSONDecodeError, IndexError):
366
- pass # Ignore errors parsing parent ID from non-stream
367
-
368
- self.conversation.update_chat_history(prompt, parsed_response)
369
- self.last_response = {"text": parsed_response}
370
- return self.last_response if not raw else parsed_response # Return dict or raw string
371
-
372
- except CurlError as e: # Catch CurlError
373
- raise exceptions.FailedToGenerateResponseError(f"Request failed (CurlError): {str(e)}") from e
374
- except Exception as e: # Catch other potential exceptions (like HTTPError, JSONDecodeError)
375
- err_text = getattr(e, 'response', None) and getattr(e.response, 'text', '')
376
- raise exceptions.FailedToGenerateResponseError(f"Request failed ({type(e).__name__}): {str(e)} - {err_text}") from e
377
-
378
-
379
- def chat(
380
- self,
381
- prompt: str,
382
- stream: bool = False,
383
- optimizer: str = None,
384
- conversationally: bool = False,
385
- host: str = None,
386
- options: dict = None,
387
- ) -> Union[str, Generator[str, None, None]]: # Corrected return type hint
388
- def for_stream_chat(): # Renamed inner function
389
- # ask() yields dicts or strings when streaming
390
- gen = self.ask(
391
- prompt,
392
- stream=True,
393
- raw=False, # Ensure ask yields dicts
394
- optimizer=optimizer,
395
- conversationally=conversationally,
396
- host=host,
397
- options=options
398
- )
399
- for response_dict in gen:
400
- yield self.get_message(response_dict) # get_message expects dict
401
-
402
- def for_non_stream_chat(): # Renamed inner function
403
- # ask() returns dict or str when not streaming
404
- response_data = self.ask(
405
- prompt,
406
- stream=False,
407
- raw=False, # Ensure ask returns dict
408
- optimizer=optimizer,
409
- conversationally=conversationally,
410
- host=host,
411
- options=options
412
- )
413
- return self.get_message(response_data) # get_message expects dict
414
-
415
- return for_stream_chat() if stream else for_non_stream_chat() # Use renamed functions
416
-
417
- def get_message(self, response: dict) -> str:
418
- assert isinstance(response, dict), "Response should be of dict data-type only"
419
- return response["text"]
420
-
421
-
422
-
423
- if __name__ == "__main__":
424
- # Ensure curl_cffi is installed
425
- print("-" * 80)
426
- print(f"{'Model':<50} {'Status':<10} {'Response'}")
427
- print("-" * 80)
428
-
429
- for model in AllenAI.AVAILABLE_MODELS:
430
- try:
431
- # Auto-detect host
432
- test_ai = AllenAI(model=model, timeout=60)
433
- # Pass the host explicitly to display accurate error messages
434
- response = test_ai.chat("Say 'Hello' in one word")
435
- response_text = response
436
-
437
- if response_text and len(response_text.strip()) > 0:
438
- status = "✓"
439
- # Truncate response if too long
440
- display_text = response_text.strip()[:50] + "..." if len(response_text.strip()) > 50 else response_text.strip()
441
- print(f"{model:<50} {status:<10} {display_text} (host: {test_ai.host})")
442
- else:
443
- status = "✗"
444
- display_text = "Empty or invalid response"
445
- print(f"{model:<50} {status:<10} {display_text}")
446
- except Exception as e:
447
- print(f"{model:<50} {'✗':<10} {str(e)}")
webscout/Provider/Andi.py DELETED
@@ -1,228 +0,0 @@
1
- from uuid import uuid4
2
- import requests
3
- import json
4
- from webscout.AIutel import Optimizers
5
- from webscout.AIutel import Conversation
6
- from webscout.AIutel import AwesomePrompts, sanitize_stream
7
- from webscout.AIbase import Provider, AsyncProvider
8
- from webscout import exceptions
9
- from typing import Union, Any, AsyncGenerator, Dict
10
- from webscout import WEBS
11
- from webscout.litagent import LitAgent
12
-
13
class AndiSearch(Provider):
    """Provider that answers prompts through the Andi Search streaming endpoint.

    Every request first runs a web search for the prompt with ``WEBS`` and
    posts the formatted results to ``chat_endpoint``; the reply is read back
    line by line and accumulated into ``last_response["text"]``.
    """

    def __init__(
        self,
        is_conversation: bool = True,
        max_tokens: int = 600,
        timeout: int = 30,
        intro: str = None,
        filepath: str = None,
        update_file: bool = True,
        proxies: dict = None,
        history_offset: int = 10250,
        act: str = None,
    ):
        """Instantiates AndiSearch

        Args:
            is_conversation (bool, optional): Flag for chatting conversationally. Defaults to True.
            max_tokens (int, optional): Maximum number of tokens to be generated upon completion. Defaults to 600.
            timeout (int, optional): Http request timeout. Defaults to 30.
            intro (str, optional): Conversation introductory prompt. Defaults to None.
            filepath (str, optional): Path to file containing conversation history. Defaults to None.
            update_file (bool, optional): Add new prompts and responses to the file. Defaults to True.
            proxies (dict, optional): Http request proxies. Defaults to None (no proxies).
            history_offset (int, optional): Limit conversation history to this number of last texts. Defaults to 10250.
            act (str|int, optional): Awesome prompt key or index. (Used as intro). Defaults to None.
        """
        self.session = requests.Session()
        self.is_conversation = is_conversation
        self.max_tokens_to_sample = max_tokens
        self.chat_endpoint = "https://write.andisearch.com/v1/write_streaming"
        self.stream_chunk_size = 64
        self.timeout = timeout
        self.last_response = {}
        self.headers = {
            "accept": "text/event-stream",
            "accept-encoding": "gzip, deflate, br, zstd",
            "accept-language": "en-US,en;q=0.9,en-IN;q=0.8",
            "andi-auth-key": "andi-summarizer",
            "andi-origin": "x-andi-origin",
            "authorization": str(uuid4()),
            "content-type": "application/json",
            "dnt": "1",
            "origin": "https://andisearch.com",
            "priority": "u=1, i",
            "sec-ch-ua": '"Not)A;Brand";v="99", "Microsoft Edge";v="127", "Chromium";v="127"',
            "sec-ch-ua-mobile": "?0",
            "sec-ch-ua-platform": '"Windows"',
            "sec-fetch-dest": "empty",
            "sec-fetch-mode": "cors",
            "sec-fetch-site": "same-site",
            "user-agent": LitAgent().random(),
            "x-amz-date": "20240730T031106Z",
            "x-amz-security-token": str(uuid4()),
        }

        # Materialised as a tuple: a generator expression would be consumed by
        # the first membership test in ask(), making later checks fail.
        self.__available_optimizers = tuple(
            method
            for method in dir(Optimizers)
            if callable(getattr(Optimizers, method)) and not method.startswith("__")
        )
        self.session.headers.update(self.headers)
        # This assigns the class attribute on Conversation, not an instance one.
        Conversation.intro = (
            AwesomePrompts().get_act(
                act, raise_not_found=True, default=None, case_insensitive=True
            )
            if act
            else intro or Conversation.intro
        )
        self.conversation = Conversation(
            is_conversation, self.max_tokens_to_sample, filepath, update_file
        )
        self.conversation.history_offset = history_offset
        # A fresh dict per instance, so instances built without proxies never
        # share one mutable mapping.
        self.session.proxies = proxies if proxies is not None else {}

    @staticmethod
    def _domain_of(link: str) -> str:
        """Return the host part of ``link``, tolerating a missing scheme."""
        return link.split("//", 1)[-1].split("/", 1)[0]

    def ask(
        self,
        prompt: str,
        stream: bool = False,
        raw: bool = False,
        optimizer: str = None,
        conversationally: bool = False,
    ) -> dict:
        """Search the web for ``prompt`` and request a written answer.

        Args:
            prompt (str): Prompt to be send; also used as the search query.
            stream (bool, optional): Flag for streaming response. Defaults to False.
            raw (bool, optional): When streaming, yield each received line as-is
                instead of a ``{"text": ...}`` dict. Defaults to False.
            optimizer (str, optional): Prompt optimizer name. Defaults to None.
            conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.

        Returns:
            dict: ``{"text": ...}`` with the accumulated reply when ``stream`` is
            False; otherwise a generator yielding one item per received line.

        Raises:
            Exception: If ``optimizer`` is not an available optimizer name.
            exceptions.FailedToGenerateResponseError: If the endpoint returns a
                non-OK status (raised when the response is consumed).
        """
        conversation_prompt = self.conversation.gen_complete_prompt(prompt)
        if optimizer:
            if optimizer in self.__available_optimizers:
                conversation_prompt = getattr(Optimizers, optimizer)(
                    conversation_prompt if conversationally else prompt
                )
            else:
                raise Exception(
                    f"Optimizer is not one of {self.__available_optimizers}"
                )
        # NOTE(review): conversation_prompt is not part of the payload below;
        # only the raw prompt is sent. Confirm whether that is intended.

        # Initialize the webscout instance
        webs = WEBS()

        # Fetch search results
        search_query = prompt
        search_results = webs.text(search_query, max_results=7)

        # Format the search results into the required serp payload structure
        payload = {
            "query": search_query,
            "serp": {
                "results_type": "Search",
                "answer": "",
                "type": "navigation",
                "title": "",
                "description": "",
                "image": "",
                "link": "",
                "source": "liftndrift.com",
                "engine": "andi-b",
                "results": [
                    {
                        "title": result["title"],
                        "link": result["href"],
                        "desc": result["body"],
                        "image": "",
                        "type": "website",
                        "source": self._domain_of(result["href"]),
                    }
                    for result in search_results
                ],
            },
        }
        self.session.headers.update(self.headers)

        def for_stream():
            response = self.session.post(
                self.chat_endpoint, json=payload, stream=True, timeout=self.timeout
            )
            if not response.ok:
                raise exceptions.FailedToGenerateResponseError(
                    f"Failed to generate response - ({response.status_code}, {response.reason}) - {response.text}"
                )

            # Start from a fresh dict so a dict returned by an earlier call is
            # not mutated, and an empty stream still leaves a "text" entry.
            self.last_response = {"text": ""}
            streaming_text = ""
            for value in response.iter_lines(
                decode_unicode=True,
                chunk_size=self.stream_chunk_size,
                delimiter="\n",
            ):
                if not value:
                    continue
                streaming_text += value + ("\n" if stream else "")
                resp = dict(text=streaming_text)
                self.last_response.update(resp)
                yield value if raw else resp
            self.conversation.update_chat_history(
                prompt, self.get_message(self.last_response)
            )

        def for_non_stream():
            # Drain the stream; the accumulated text ends up in last_response.
            for _ in for_stream():
                pass
            return self.last_response

        return for_stream() if stream else for_non_stream()

    def chat(
        self,
        prompt: str,
        stream: bool = False,
        optimizer: str = None,
        conversationally: bool = False,
    ) -> str:
        """Generate response `str`
        Args:
            prompt (str): Prompt to be send.
            stream (bool, optional): Flag for streaming response. Defaults to False.
            optimizer (str, optional): Prompt optimizer name - `[code, shell_command]`. Defaults to None.
            conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.
        Returns:
            str: Response generated
        """

        def for_stream():
            for response in self.ask(
                prompt, True, optimizer=optimizer, conversationally=conversationally
            ):
                yield self.get_message(response)

        def for_non_stream():
            return self.get_message(
                self.ask(
                    prompt,
                    False,
                    optimizer=optimizer,
                    conversationally=conversationally,
                )
            )

        return for_stream() if stream else for_non_stream()

    def get_message(self, response: dict) -> str:
        """Retrieves message only from response

        Args:
            response (dict): Response generated by `self.ask`

        Returns:
            str: Message extracted
        """
        assert isinstance(response, dict), "Response should be of dict data-type only"
        return response["text"]
223
if __name__ == '__main__':
    # Manual demo: ask one question and echo the answer to the terminal.
    from rich import print

    searcher = AndiSearch()
    answer = searcher.chat("tell me about india")
    # chat() is called without stream, so `answer` is a plain string and this
    # loop emits it one character at a time.
    for piece in answer:
        print(piece, end="", flush=True)