webscout 8.2.2__py3-none-any.whl → 2026.1.19__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (483) hide show
  1. webscout/AIauto.py +524 -143
  2. webscout/AIbase.py +247 -123
  3. webscout/AIutel.py +68 -132
  4. webscout/Bard.py +1072 -535
  5. webscout/Extra/GitToolkit/__init__.py +2 -2
  6. webscout/Extra/GitToolkit/gitapi/__init__.py +20 -12
  7. webscout/Extra/GitToolkit/gitapi/gist.py +142 -0
  8. webscout/Extra/GitToolkit/gitapi/organization.py +91 -0
  9. webscout/Extra/GitToolkit/gitapi/repository.py +308 -195
  10. webscout/Extra/GitToolkit/gitapi/search.py +162 -0
  11. webscout/Extra/GitToolkit/gitapi/trending.py +236 -0
  12. webscout/Extra/GitToolkit/gitapi/user.py +128 -96
  13. webscout/Extra/GitToolkit/gitapi/utils.py +82 -62
  14. webscout/Extra/YTToolkit/README.md +443 -0
  15. webscout/Extra/YTToolkit/YTdownloader.py +953 -957
  16. webscout/Extra/YTToolkit/__init__.py +3 -3
  17. webscout/Extra/YTToolkit/transcriber.py +595 -476
  18. webscout/Extra/YTToolkit/ytapi/README.md +230 -0
  19. webscout/Extra/YTToolkit/ytapi/__init__.py +22 -6
  20. webscout/Extra/YTToolkit/ytapi/captions.py +190 -0
  21. webscout/Extra/YTToolkit/ytapi/channel.py +302 -307
  22. webscout/Extra/YTToolkit/ytapi/errors.py +13 -13
  23. webscout/Extra/YTToolkit/ytapi/extras.py +178 -45
  24. webscout/Extra/YTToolkit/ytapi/hashtag.py +120 -0
  25. webscout/Extra/YTToolkit/ytapi/https.py +89 -88
  26. webscout/Extra/YTToolkit/ytapi/patterns.py +61 -61
  27. webscout/Extra/YTToolkit/ytapi/playlist.py +59 -59
  28. webscout/Extra/YTToolkit/ytapi/pool.py +8 -8
  29. webscout/Extra/YTToolkit/ytapi/query.py +143 -40
  30. webscout/Extra/YTToolkit/ytapi/shorts.py +122 -0
  31. webscout/Extra/YTToolkit/ytapi/stream.py +68 -63
  32. webscout/Extra/YTToolkit/ytapi/suggestions.py +97 -0
  33. webscout/Extra/YTToolkit/ytapi/utils.py +66 -62
  34. webscout/Extra/YTToolkit/ytapi/video.py +189 -18
  35. webscout/Extra/__init__.py +2 -3
  36. webscout/Extra/gguf.py +1298 -682
  37. webscout/Extra/tempmail/README.md +488 -0
  38. webscout/Extra/tempmail/__init__.py +28 -28
  39. webscout/Extra/tempmail/async_utils.py +143 -141
  40. webscout/Extra/tempmail/base.py +172 -161
  41. webscout/Extra/tempmail/cli.py +191 -187
  42. webscout/Extra/tempmail/emailnator.py +88 -84
  43. webscout/Extra/tempmail/mail_tm.py +378 -361
  44. webscout/Extra/tempmail/temp_mail_io.py +304 -292
  45. webscout/Extra/weather.py +196 -194
  46. webscout/Extra/weather_ascii.py +17 -15
  47. webscout/Provider/AISEARCH/PERPLEXED_search.py +175 -0
  48. webscout/Provider/AISEARCH/Perplexity.py +237 -304
  49. webscout/Provider/AISEARCH/README.md +106 -0
  50. webscout/Provider/AISEARCH/__init__.py +16 -10
  51. webscout/Provider/AISEARCH/brave_search.py +298 -0
  52. webscout/Provider/AISEARCH/iask_search.py +130 -209
  53. webscout/Provider/AISEARCH/monica_search.py +200 -246
  54. webscout/Provider/AISEARCH/webpilotai_search.py +242 -281
  55. webscout/Provider/Algion.py +413 -0
  56. webscout/Provider/Andi.py +74 -69
  57. webscout/Provider/Apriel.py +313 -0
  58. webscout/Provider/Ayle.py +323 -0
  59. webscout/Provider/ChatSandbox.py +329 -0
  60. webscout/Provider/ClaudeOnline.py +365 -0
  61. webscout/Provider/Cohere.py +232 -208
  62. webscout/Provider/DeepAI.py +367 -0
  63. webscout/Provider/Deepinfra.py +343 -173
  64. webscout/Provider/EssentialAI.py +217 -0
  65. webscout/Provider/ExaAI.py +274 -261
  66. webscout/Provider/Gemini.py +60 -54
  67. webscout/Provider/GithubChat.py +385 -367
  68. webscout/Provider/Gradient.py +286 -0
  69. webscout/Provider/Groq.py +556 -670
  70. webscout/Provider/HadadXYZ.py +323 -0
  71. webscout/Provider/HeckAI.py +392 -233
  72. webscout/Provider/HuggingFace.py +387 -0
  73. webscout/Provider/IBM.py +340 -0
  74. webscout/Provider/Jadve.py +317 -266
  75. webscout/Provider/K2Think.py +306 -0
  76. webscout/Provider/Koboldai.py +221 -381
  77. webscout/Provider/Netwrck.py +273 -228
  78. webscout/Provider/Nvidia.py +310 -0
  79. webscout/Provider/OPENAI/DeepAI.py +489 -0
  80. webscout/Provider/OPENAI/K2Think.py +423 -0
  81. webscout/Provider/OPENAI/PI.py +463 -0
  82. webscout/Provider/OPENAI/README.md +890 -0
  83. webscout/Provider/OPENAI/TogetherAI.py +405 -0
  84. webscout/Provider/OPENAI/TwoAI.py +255 -0
  85. webscout/Provider/OPENAI/__init__.py +148 -25
  86. webscout/Provider/OPENAI/ai4chat.py +348 -0
  87. webscout/Provider/OPENAI/akashgpt.py +436 -0
  88. webscout/Provider/OPENAI/algion.py +303 -0
  89. webscout/Provider/OPENAI/ayle.py +365 -0
  90. webscout/Provider/OPENAI/base.py +253 -46
  91. webscout/Provider/OPENAI/cerebras.py +296 -0
  92. webscout/Provider/OPENAI/chatgpt.py +514 -193
  93. webscout/Provider/OPENAI/chatsandbox.py +233 -0
  94. webscout/Provider/OPENAI/deepinfra.py +403 -272
  95. webscout/Provider/OPENAI/e2b.py +2370 -1350
  96. webscout/Provider/OPENAI/elmo.py +278 -0
  97. webscout/Provider/OPENAI/exaai.py +186 -138
  98. webscout/Provider/OPENAI/freeassist.py +446 -0
  99. webscout/Provider/OPENAI/gradient.py +448 -0
  100. webscout/Provider/OPENAI/groq.py +380 -0
  101. webscout/Provider/OPENAI/hadadxyz.py +292 -0
  102. webscout/Provider/OPENAI/heckai.py +100 -104
  103. webscout/Provider/OPENAI/huggingface.py +321 -0
  104. webscout/Provider/OPENAI/ibm.py +425 -0
  105. webscout/Provider/OPENAI/llmchat.py +253 -0
  106. webscout/Provider/OPENAI/llmchatco.py +378 -327
  107. webscout/Provider/OPENAI/meta.py +541 -0
  108. webscout/Provider/OPENAI/netwrck.py +110 -84
  109. webscout/Provider/OPENAI/nvidia.py +317 -0
  110. webscout/Provider/OPENAI/oivscode.py +348 -0
  111. webscout/Provider/OPENAI/openrouter.py +328 -0
  112. webscout/Provider/OPENAI/pydantic_imports.py +1 -0
  113. webscout/Provider/OPENAI/sambanova.py +397 -0
  114. webscout/Provider/OPENAI/sonus.py +126 -115
  115. webscout/Provider/OPENAI/textpollinations.py +218 -133
  116. webscout/Provider/OPENAI/toolbaz.py +136 -166
  117. webscout/Provider/OPENAI/typefully.py +419 -0
  118. webscout/Provider/OPENAI/typliai.py +279 -0
  119. webscout/Provider/OPENAI/utils.py +314 -211
  120. webscout/Provider/OPENAI/wisecat.py +103 -125
  121. webscout/Provider/OPENAI/writecream.py +185 -156
  122. webscout/Provider/OPENAI/x0gpt.py +227 -136
  123. webscout/Provider/OPENAI/zenmux.py +380 -0
  124. webscout/Provider/OpenRouter.py +386 -0
  125. webscout/Provider/Openai.py +337 -496
  126. webscout/Provider/PI.py +443 -344
  127. webscout/Provider/QwenLM.py +346 -254
  128. webscout/Provider/STT/__init__.py +28 -0
  129. webscout/Provider/STT/base.py +303 -0
  130. webscout/Provider/STT/elevenlabs.py +264 -0
  131. webscout/Provider/Sambanova.py +317 -0
  132. webscout/Provider/TTI/README.md +69 -0
  133. webscout/Provider/TTI/__init__.py +37 -12
  134. webscout/Provider/TTI/base.py +147 -0
  135. webscout/Provider/TTI/claudeonline.py +393 -0
  136. webscout/Provider/TTI/magicstudio.py +292 -0
  137. webscout/Provider/TTI/miragic.py +180 -0
  138. webscout/Provider/TTI/pollinations.py +331 -0
  139. webscout/Provider/TTI/together.py +334 -0
  140. webscout/Provider/TTI/utils.py +14 -0
  141. webscout/Provider/TTS/README.md +186 -0
  142. webscout/Provider/TTS/__init__.py +43 -7
  143. webscout/Provider/TTS/base.py +523 -0
  144. webscout/Provider/TTS/deepgram.py +286 -156
  145. webscout/Provider/TTS/elevenlabs.py +189 -111
  146. webscout/Provider/TTS/freetts.py +218 -0
  147. webscout/Provider/TTS/murfai.py +288 -113
  148. webscout/Provider/TTS/openai_fm.py +364 -0
  149. webscout/Provider/TTS/parler.py +203 -111
  150. webscout/Provider/TTS/qwen.py +334 -0
  151. webscout/Provider/TTS/sherpa.py +286 -0
  152. webscout/Provider/TTS/speechma.py +693 -180
  153. webscout/Provider/TTS/streamElements.py +275 -333
  154. webscout/Provider/TTS/utils.py +280 -280
  155. webscout/Provider/TextPollinationsAI.py +221 -121
  156. webscout/Provider/TogetherAI.py +450 -0
  157. webscout/Provider/TwoAI.py +309 -199
  158. webscout/Provider/TypliAI.py +311 -0
  159. webscout/Provider/UNFINISHED/ChatHub.py +219 -0
  160. webscout/Provider/{OPENAI/glider.py → UNFINISHED/ChutesAI.py} +160 -145
  161. webscout/Provider/UNFINISHED/GizAI.py +300 -0
  162. webscout/Provider/UNFINISHED/Marcus.py +218 -0
  163. webscout/Provider/UNFINISHED/Qodo.py +481 -0
  164. webscout/Provider/UNFINISHED/XenAI.py +330 -0
  165. webscout/Provider/{Youchat.py → UNFINISHED/Youchat.py} +64 -47
  166. webscout/Provider/UNFINISHED/aihumanizer.py +41 -0
  167. webscout/Provider/UNFINISHED/grammerchecker.py +37 -0
  168. webscout/Provider/UNFINISHED/liner.py +342 -0
  169. webscout/Provider/UNFINISHED/liner_api_request.py +246 -0
  170. webscout/Provider/UNFINISHED/samurai.py +231 -0
  171. webscout/Provider/WiseCat.py +256 -196
  172. webscout/Provider/WrDoChat.py +390 -0
  173. webscout/Provider/__init__.py +115 -198
  174. webscout/Provider/ai4chat.py +181 -202
  175. webscout/Provider/akashgpt.py +330 -342
  176. webscout/Provider/cerebras.py +397 -242
  177. webscout/Provider/cleeai.py +236 -213
  178. webscout/Provider/elmo.py +291 -234
  179. webscout/Provider/geminiapi.py +343 -208
  180. webscout/Provider/julius.py +245 -223
  181. webscout/Provider/learnfastai.py +333 -266
  182. webscout/Provider/llama3mitril.py +230 -180
  183. webscout/Provider/llmchat.py +308 -213
  184. webscout/Provider/llmchatco.py +321 -311
  185. webscout/Provider/meta.py +996 -794
  186. webscout/Provider/oivscode.py +332 -0
  187. webscout/Provider/searchchat.py +316 -293
  188. webscout/Provider/sonus.py +264 -208
  189. webscout/Provider/toolbaz.py +359 -320
  190. webscout/Provider/turboseek.py +332 -219
  191. webscout/Provider/typefully.py +262 -280
  192. webscout/Provider/x0gpt.py +332 -256
  193. webscout/__init__.py +31 -38
  194. webscout/__main__.py +5 -5
  195. webscout/cli.py +585 -293
  196. webscout/client.py +1497 -0
  197. webscout/conversation.py +140 -565
  198. webscout/exceptions.py +383 -339
  199. webscout/litagent/__init__.py +29 -29
  200. webscout/litagent/agent.py +492 -455
  201. webscout/litagent/constants.py +60 -60
  202. webscout/models.py +505 -181
  203. webscout/optimizers.py +32 -378
  204. webscout/prompt_manager.py +376 -274
  205. webscout/sanitize.py +1514 -0
  206. webscout/scout/README.md +452 -0
  207. webscout/scout/__init__.py +8 -8
  208. webscout/scout/core/__init__.py +7 -7
  209. webscout/scout/core/crawler.py +330 -140
  210. webscout/scout/core/scout.py +800 -568
  211. webscout/scout/core/search_result.py +51 -96
  212. webscout/scout/core/text_analyzer.py +64 -63
  213. webscout/scout/core/text_utils.py +412 -277
  214. webscout/scout/core/web_analyzer.py +54 -52
  215. webscout/scout/element.py +872 -460
  216. webscout/scout/parsers/__init__.py +70 -69
  217. webscout/scout/parsers/html5lib_parser.py +182 -172
  218. webscout/scout/parsers/html_parser.py +238 -236
  219. webscout/scout/parsers/lxml_parser.py +203 -178
  220. webscout/scout/utils.py +38 -37
  221. webscout/search/__init__.py +47 -0
  222. webscout/search/base.py +201 -0
  223. webscout/search/bing_main.py +45 -0
  224. webscout/search/brave_main.py +92 -0
  225. webscout/search/duckduckgo_main.py +57 -0
  226. webscout/search/engines/__init__.py +127 -0
  227. webscout/search/engines/bing/__init__.py +15 -0
  228. webscout/search/engines/bing/base.py +35 -0
  229. webscout/search/engines/bing/images.py +114 -0
  230. webscout/search/engines/bing/news.py +96 -0
  231. webscout/search/engines/bing/suggestions.py +36 -0
  232. webscout/search/engines/bing/text.py +109 -0
  233. webscout/search/engines/brave/__init__.py +19 -0
  234. webscout/search/engines/brave/base.py +47 -0
  235. webscout/search/engines/brave/images.py +213 -0
  236. webscout/search/engines/brave/news.py +353 -0
  237. webscout/search/engines/brave/suggestions.py +318 -0
  238. webscout/search/engines/brave/text.py +167 -0
  239. webscout/search/engines/brave/videos.py +364 -0
  240. webscout/search/engines/duckduckgo/__init__.py +25 -0
  241. webscout/search/engines/duckduckgo/answers.py +80 -0
  242. webscout/search/engines/duckduckgo/base.py +189 -0
  243. webscout/search/engines/duckduckgo/images.py +100 -0
  244. webscout/search/engines/duckduckgo/maps.py +183 -0
  245. webscout/search/engines/duckduckgo/news.py +70 -0
  246. webscout/search/engines/duckduckgo/suggestions.py +22 -0
  247. webscout/search/engines/duckduckgo/text.py +221 -0
  248. webscout/search/engines/duckduckgo/translate.py +48 -0
  249. webscout/search/engines/duckduckgo/videos.py +80 -0
  250. webscout/search/engines/duckduckgo/weather.py +84 -0
  251. webscout/search/engines/mojeek.py +61 -0
  252. webscout/search/engines/wikipedia.py +77 -0
  253. webscout/search/engines/yahoo/__init__.py +41 -0
  254. webscout/search/engines/yahoo/answers.py +19 -0
  255. webscout/search/engines/yahoo/base.py +34 -0
  256. webscout/search/engines/yahoo/images.py +323 -0
  257. webscout/search/engines/yahoo/maps.py +19 -0
  258. webscout/search/engines/yahoo/news.py +258 -0
  259. webscout/search/engines/yahoo/suggestions.py +140 -0
  260. webscout/search/engines/yahoo/text.py +273 -0
  261. webscout/search/engines/yahoo/translate.py +19 -0
  262. webscout/search/engines/yahoo/videos.py +302 -0
  263. webscout/search/engines/yahoo/weather.py +220 -0
  264. webscout/search/engines/yandex.py +67 -0
  265. webscout/search/engines/yep/__init__.py +13 -0
  266. webscout/search/engines/yep/base.py +34 -0
  267. webscout/search/engines/yep/images.py +101 -0
  268. webscout/search/engines/yep/suggestions.py +38 -0
  269. webscout/search/engines/yep/text.py +99 -0
  270. webscout/search/http_client.py +172 -0
  271. webscout/search/results.py +141 -0
  272. webscout/search/yahoo_main.py +57 -0
  273. webscout/search/yep_main.py +48 -0
  274. webscout/server/__init__.py +48 -0
  275. webscout/server/config.py +78 -0
  276. webscout/server/exceptions.py +69 -0
  277. webscout/server/providers.py +286 -0
  278. webscout/server/request_models.py +131 -0
  279. webscout/server/request_processing.py +404 -0
  280. webscout/server/routes.py +642 -0
  281. webscout/server/server.py +351 -0
  282. webscout/server/ui_templates.py +1171 -0
  283. webscout/swiftcli/__init__.py +79 -809
  284. webscout/swiftcli/core/__init__.py +7 -0
  285. webscout/swiftcli/core/cli.py +574 -0
  286. webscout/swiftcli/core/context.py +98 -0
  287. webscout/swiftcli/core/group.py +268 -0
  288. webscout/swiftcli/decorators/__init__.py +28 -0
  289. webscout/swiftcli/decorators/command.py +243 -0
  290. webscout/swiftcli/decorators/options.py +247 -0
  291. webscout/swiftcli/decorators/output.py +392 -0
  292. webscout/swiftcli/exceptions.py +21 -0
  293. webscout/swiftcli/plugins/__init__.py +9 -0
  294. webscout/swiftcli/plugins/base.py +134 -0
  295. webscout/swiftcli/plugins/manager.py +269 -0
  296. webscout/swiftcli/utils/__init__.py +58 -0
  297. webscout/swiftcli/utils/formatting.py +251 -0
  298. webscout/swiftcli/utils/parsing.py +368 -0
  299. webscout/update_checker.py +280 -136
  300. webscout/utils.py +28 -14
  301. webscout/version.py +2 -1
  302. webscout/version.py.bak +3 -0
  303. webscout/zeroart/__init__.py +218 -55
  304. webscout/zeroart/base.py +70 -60
  305. webscout/zeroart/effects.py +155 -99
  306. webscout/zeroart/fonts.py +1799 -816
  307. webscout-2026.1.19.dist-info/METADATA +638 -0
  308. webscout-2026.1.19.dist-info/RECORD +312 -0
  309. {webscout-8.2.2.dist-info → webscout-2026.1.19.dist-info}/WHEEL +1 -1
  310. webscout-2026.1.19.dist-info/entry_points.txt +4 -0
  311. webscout-2026.1.19.dist-info/top_level.txt +1 -0
  312. inferno/__init__.py +0 -6
  313. inferno/__main__.py +0 -9
  314. inferno/cli.py +0 -6
  315. webscout/DWEBS.py +0 -477
  316. webscout/Extra/autocoder/__init__.py +0 -9
  317. webscout/Extra/autocoder/autocoder.py +0 -849
  318. webscout/Extra/autocoder/autocoder_utiles.py +0 -332
  319. webscout/LLM.py +0 -442
  320. webscout/Litlogger/__init__.py +0 -67
  321. webscout/Litlogger/core/__init__.py +0 -6
  322. webscout/Litlogger/core/level.py +0 -23
  323. webscout/Litlogger/core/logger.py +0 -165
  324. webscout/Litlogger/handlers/__init__.py +0 -12
  325. webscout/Litlogger/handlers/console.py +0 -33
  326. webscout/Litlogger/handlers/file.py +0 -143
  327. webscout/Litlogger/handlers/network.py +0 -173
  328. webscout/Litlogger/styles/__init__.py +0 -7
  329. webscout/Litlogger/styles/colors.py +0 -249
  330. webscout/Litlogger/styles/formats.py +0 -458
  331. webscout/Litlogger/styles/text.py +0 -87
  332. webscout/Litlogger/utils/__init__.py +0 -6
  333. webscout/Litlogger/utils/detectors.py +0 -153
  334. webscout/Litlogger/utils/formatters.py +0 -200
  335. webscout/Local/__init__.py +0 -12
  336. webscout/Local/__main__.py +0 -9
  337. webscout/Local/api.py +0 -576
  338. webscout/Local/cli.py +0 -516
  339. webscout/Local/config.py +0 -75
  340. webscout/Local/llm.py +0 -287
  341. webscout/Local/model_manager.py +0 -253
  342. webscout/Local/server.py +0 -721
  343. webscout/Local/utils.py +0 -93
  344. webscout/Provider/AI21.py +0 -177
  345. webscout/Provider/AISEARCH/DeepFind.py +0 -250
  346. webscout/Provider/AISEARCH/ISou.py +0 -256
  347. webscout/Provider/AISEARCH/felo_search.py +0 -228
  348. webscout/Provider/AISEARCH/genspark_search.py +0 -208
  349. webscout/Provider/AISEARCH/hika_search.py +0 -194
  350. webscout/Provider/AISEARCH/scira_search.py +0 -324
  351. webscout/Provider/Aitopia.py +0 -292
  352. webscout/Provider/AllenAI.py +0 -413
  353. webscout/Provider/Blackboxai.py +0 -229
  354. webscout/Provider/C4ai.py +0 -432
  355. webscout/Provider/ChatGPTClone.py +0 -226
  356. webscout/Provider/ChatGPTES.py +0 -237
  357. webscout/Provider/ChatGPTGratis.py +0 -194
  358. webscout/Provider/Chatify.py +0 -175
  359. webscout/Provider/Cloudflare.py +0 -273
  360. webscout/Provider/DeepSeek.py +0 -196
  361. webscout/Provider/ElectronHub.py +0 -709
  362. webscout/Provider/ExaChat.py +0 -342
  363. webscout/Provider/Free2GPT.py +0 -241
  364. webscout/Provider/GPTWeb.py +0 -193
  365. webscout/Provider/Glider.py +0 -211
  366. webscout/Provider/HF_space/__init__.py +0 -0
  367. webscout/Provider/HF_space/qwen_qwen2.py +0 -206
  368. webscout/Provider/HuggingFaceChat.py +0 -462
  369. webscout/Provider/Hunyuan.py +0 -272
  370. webscout/Provider/LambdaChat.py +0 -392
  371. webscout/Provider/Llama.py +0 -200
  372. webscout/Provider/Llama3.py +0 -204
  373. webscout/Provider/Marcus.py +0 -148
  374. webscout/Provider/OLLAMA.py +0 -396
  375. webscout/Provider/OPENAI/c4ai.py +0 -367
  376. webscout/Provider/OPENAI/chatgptclone.py +0 -460
  377. webscout/Provider/OPENAI/exachat.py +0 -433
  378. webscout/Provider/OPENAI/freeaichat.py +0 -352
  379. webscout/Provider/OPENAI/opkfc.py +0 -488
  380. webscout/Provider/OPENAI/scirachat.py +0 -463
  381. webscout/Provider/OPENAI/standardinput.py +0 -425
  382. webscout/Provider/OPENAI/typegpt.py +0 -346
  383. webscout/Provider/OPENAI/uncovrAI.py +0 -455
  384. webscout/Provider/OPENAI/venice.py +0 -413
  385. webscout/Provider/OPENAI/yep.py +0 -327
  386. webscout/Provider/OpenGPT.py +0 -199
  387. webscout/Provider/Perplexitylabs.py +0 -415
  388. webscout/Provider/Phind.py +0 -535
  389. webscout/Provider/PizzaGPT.py +0 -198
  390. webscout/Provider/Reka.py +0 -214
  391. webscout/Provider/StandardInput.py +0 -278
  392. webscout/Provider/TTI/AiForce/__init__.py +0 -22
  393. webscout/Provider/TTI/AiForce/async_aiforce.py +0 -224
  394. webscout/Provider/TTI/AiForce/sync_aiforce.py +0 -245
  395. webscout/Provider/TTI/FreeAIPlayground/__init__.py +0 -9
  396. webscout/Provider/TTI/FreeAIPlayground/async_freeaiplayground.py +0 -181
  397. webscout/Provider/TTI/FreeAIPlayground/sync_freeaiplayground.py +0 -180
  398. webscout/Provider/TTI/ImgSys/__init__.py +0 -23
  399. webscout/Provider/TTI/ImgSys/async_imgsys.py +0 -202
  400. webscout/Provider/TTI/ImgSys/sync_imgsys.py +0 -195
  401. webscout/Provider/TTI/MagicStudio/__init__.py +0 -2
  402. webscout/Provider/TTI/MagicStudio/async_magicstudio.py +0 -111
  403. webscout/Provider/TTI/MagicStudio/sync_magicstudio.py +0 -109
  404. webscout/Provider/TTI/Nexra/__init__.py +0 -22
  405. webscout/Provider/TTI/Nexra/async_nexra.py +0 -286
  406. webscout/Provider/TTI/Nexra/sync_nexra.py +0 -258
  407. webscout/Provider/TTI/PollinationsAI/__init__.py +0 -23
  408. webscout/Provider/TTI/PollinationsAI/async_pollinations.py +0 -311
  409. webscout/Provider/TTI/PollinationsAI/sync_pollinations.py +0 -265
  410. webscout/Provider/TTI/aiarta/__init__.py +0 -2
  411. webscout/Provider/TTI/aiarta/async_aiarta.py +0 -482
  412. webscout/Provider/TTI/aiarta/sync_aiarta.py +0 -440
  413. webscout/Provider/TTI/artbit/__init__.py +0 -22
  414. webscout/Provider/TTI/artbit/async_artbit.py +0 -155
  415. webscout/Provider/TTI/artbit/sync_artbit.py +0 -148
  416. webscout/Provider/TTI/fastflux/__init__.py +0 -22
  417. webscout/Provider/TTI/fastflux/async_fastflux.py +0 -261
  418. webscout/Provider/TTI/fastflux/sync_fastflux.py +0 -252
  419. webscout/Provider/TTI/huggingface/__init__.py +0 -22
  420. webscout/Provider/TTI/huggingface/async_huggingface.py +0 -199
  421. webscout/Provider/TTI/huggingface/sync_huggingface.py +0 -195
  422. webscout/Provider/TTI/piclumen/__init__.py +0 -23
  423. webscout/Provider/TTI/piclumen/async_piclumen.py +0 -268
  424. webscout/Provider/TTI/piclumen/sync_piclumen.py +0 -233
  425. webscout/Provider/TTI/pixelmuse/__init__.py +0 -4
  426. webscout/Provider/TTI/pixelmuse/async_pixelmuse.py +0 -249
  427. webscout/Provider/TTI/pixelmuse/sync_pixelmuse.py +0 -182
  428. webscout/Provider/TTI/talkai/__init__.py +0 -4
  429. webscout/Provider/TTI/talkai/async_talkai.py +0 -229
  430. webscout/Provider/TTI/talkai/sync_talkai.py +0 -207
  431. webscout/Provider/TTS/gesserit.py +0 -127
  432. webscout/Provider/TeachAnything.py +0 -187
  433. webscout/Provider/Venice.py +0 -219
  434. webscout/Provider/VercelAI.py +0 -234
  435. webscout/Provider/WebSim.py +0 -228
  436. webscout/Provider/Writecream.py +0 -211
  437. webscout/Provider/WritingMate.py +0 -197
  438. webscout/Provider/aimathgpt.py +0 -189
  439. webscout/Provider/askmyai.py +0 -158
  440. webscout/Provider/asksteve.py +0 -203
  441. webscout/Provider/bagoodex.py +0 -145
  442. webscout/Provider/chatglm.py +0 -205
  443. webscout/Provider/copilot.py +0 -428
  444. webscout/Provider/freeaichat.py +0 -271
  445. webscout/Provider/gaurish.py +0 -244
  446. webscout/Provider/geminiprorealtime.py +0 -160
  447. webscout/Provider/granite.py +0 -187
  448. webscout/Provider/hermes.py +0 -219
  449. webscout/Provider/koala.py +0 -268
  450. webscout/Provider/labyrinth.py +0 -340
  451. webscout/Provider/lepton.py +0 -194
  452. webscout/Provider/llamatutor.py +0 -192
  453. webscout/Provider/multichat.py +0 -325
  454. webscout/Provider/promptrefine.py +0 -193
  455. webscout/Provider/scira_chat.py +0 -277
  456. webscout/Provider/scnet.py +0 -187
  457. webscout/Provider/talkai.py +0 -194
  458. webscout/Provider/tutorai.py +0 -252
  459. webscout/Provider/typegpt.py +0 -232
  460. webscout/Provider/uncovr.py +0 -312
  461. webscout/Provider/yep.py +0 -376
  462. webscout/litprinter/__init__.py +0 -59
  463. webscout/scout/core.py +0 -881
  464. webscout/tempid.py +0 -128
  465. webscout/webscout_search.py +0 -1346
  466. webscout/webscout_search_async.py +0 -877
  467. webscout/yep_search.py +0 -297
  468. webscout-8.2.2.dist-info/METADATA +0 -734
  469. webscout-8.2.2.dist-info/RECORD +0 -309
  470. webscout-8.2.2.dist-info/entry_points.txt +0 -5
  471. webscout-8.2.2.dist-info/top_level.txt +0 -3
  472. webstoken/__init__.py +0 -30
  473. webstoken/classifier.py +0 -189
  474. webstoken/keywords.py +0 -216
  475. webstoken/language.py +0 -128
  476. webstoken/ner.py +0 -164
  477. webstoken/normalizer.py +0 -35
  478. webstoken/processor.py +0 -77
  479. webstoken/sentiment.py +0 -206
  480. webstoken/stemmer.py +0 -73
  481. webstoken/tagger.py +0 -60
  482. webstoken/tokenizer.py +0 -158
  483. {webscout-8.2.2.dist-info → webscout-2026.1.19.dist-info/licenses}/LICENSE.md +0 -0
@@ -1,1346 +0,0 @@
1
- from __future__ import annotations
2
-
3
- # import logging
4
- import json
5
- from urllib.parse import quote
6
- import warnings
7
- from concurrent.futures import ThreadPoolExecutor
8
- from datetime import datetime, timezone
9
- from decimal import Decimal
10
- from functools import cached_property
11
- from itertools import cycle, islice
12
- from random import choice, shuffle
13
- from threading import Event
14
- from time import sleep, time
15
- from types import TracebackType
16
- from typing import Any, cast
17
- import os
18
- from typing import Literal, Iterator
19
-
20
- import primp # type: ignore
21
-
22
- try:
23
- from lxml.etree import _Element
24
- from lxml.html import HTMLParser as LHTMLParser
25
- from lxml.html import document_fromstring
26
-
27
- LXML_AVAILABLE = True
28
- except ImportError:
29
- LXML_AVAILABLE = False
30
-
31
- from .exceptions import ConversationLimitException, WebscoutE, RatelimitE, TimeoutE
32
- from .utils import (
33
- _calculate_distance,
34
- _expand_proxy_tb_alias,
35
- _extract_vqd,
36
- _normalize,
37
- _normalize_url,
38
- _text_extract_json,
39
- json_loads,
40
- )
41
-
42
- # logger = logging.getLogger("webscout.WEBS")
43
-
44
-
45
- class WEBS:
46
- """webscout class to get search results from duckduckgo.com."""
47
-
48
- _executor: ThreadPoolExecutor = ThreadPoolExecutor()
49
- _impersonates = (
50
- "chrome_100", "chrome_101", "chrome_104", "chrome_105", "chrome_106", "chrome_107",
51
- "chrome_108", "chrome_109", "chrome_114", "chrome_116", "chrome_117", "chrome_118",
52
- "chrome_119", "chrome_120", "chrome_123", "chrome_124", "chrome_126", "chrome_127",
53
- "chrome_128", "chrome_129", "chrome_130", "chrome_131", "chrome_133",
54
- "safari_ios_16.5", "safari_ios_17.2", "safari_ios_17.4.1", "safari_ios_18.1.1",
55
- "safari_15.3", "safari_15.5", "safari_15.6.1", "safari_16", "safari_16.5",
56
- "safari_17.0", "safari_17.2.1", "safari_17.4.1", "safari_17.5",
57
- "safari_18", "safari_18.2",
58
- "safari_ipad_18",
59
- "edge_101", "edge_122", "edge_127", "edge_131",
60
- "firefox_109", "firefox_117", "firefox_128", "firefox_133", "firefox_135",
61
- ) # fmt: skip
62
- _impersonates_os = ("android", "ios", "linux", "macos", "windows")
63
- _chat_models = {
64
- "gpt-4o-mini": "gpt-4o-mini",
65
- "llama-3.3-70b": "meta-llama/Llama-3.3-70B-Instruct-Turbo",
66
- "claude-3-haiku": "claude-3-haiku-20240307",
67
- "o3-mini": "o3-mini",
68
- "mistral-small-3": "mistralai/Mistral-Small-24B-Instruct-2501",
69
- }
70
-
71
- def __init__(
72
- self,
73
- headers: dict[str, str] | None = None,
74
- proxy: str | None = None,
75
- proxies: dict[str, str] | str | None = None, # deprecated
76
- timeout: int | None = 10,
77
- verify: bool = True,
78
- ) -> None:
79
- """Initialize the WEBS object.
80
-
81
- Args:
82
- headers (dict, optional): Dictionary of headers for the HTTP client. Defaults to None.
83
- proxy (str, optional): proxy for the HTTP client, supports http/https/socks5 protocols.
84
- example: "http://user:pass@example.com:3128". Defaults to None.
85
- timeout (int, optional): Timeout value for the HTTP client. Defaults to 10.
86
- verify (bool): SSL verification when making the request. Defaults to True.
87
- """
88
- ddgs_proxy: str | None = os.environ.get("DDGS_PROXY")
89
- self.proxy: str | None = ddgs_proxy if ddgs_proxy else _expand_proxy_tb_alias(proxy)
90
- assert self.proxy is None or isinstance(self.proxy, str), "proxy must be a str"
91
- if not proxy and proxies:
92
- warnings.warn("'proxies' is deprecated, use 'proxy' instead.", stacklevel=1)
93
- self.proxy = proxies.get("http") or proxies.get("https") if isinstance(proxies, dict) else proxies
94
-
95
- default_headers = {
96
- "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8",
97
- "Accept-Language": "en-US,en;q=0.5",
98
- "Accept-Encoding": "gzip, deflate, br",
99
- "DNT": "1",
100
- "Connection": "keep-alive",
101
- "Upgrade-Insecure-Requests": "1",
102
- "Sec-Fetch-Dest": "document",
103
- "Sec-Fetch-Mode": "navigate",
104
- "Sec-Fetch-Site": "none",
105
- "Sec-Fetch-User": "?1",
106
- "Referer": "https://duckduckgo.com/",
107
- }
108
-
109
- self.headers = headers if headers else {}
110
- self.headers.update(default_headers)
111
-
112
- self.client = primp.Client(
113
- headers=self.headers,
114
- proxy=self.proxy,
115
- timeout=timeout,
116
- cookie_store=True,
117
- referer=True,
118
- impersonate=choice(self._impersonates),
119
- impersonate_os=choice(self._impersonates_os),
120
- follow_redirects=False,
121
- verify=verify,
122
- )
123
- self.timeout = timeout
124
- self.sleep_timestamp = 0.0
125
-
126
- self._exception_event = Event()
127
- self._chat_messages: list[dict[str, str]] = []
128
- self._chat_tokens_count = 0
129
- self._chat_vqd: str = ""
130
- self._chat_vqd_hash: str = ""
131
- self._chat_xfe: str = ""
132
-
133
- def __enter__(self) -> WEBS:
134
- return self
135
-
136
- def __exit__(
137
- self,
138
- exc_type: type[BaseException] | None = None,
139
- exc_val: BaseException | None = None,
140
- exc_tb: TracebackType | None = None,
141
- ) -> None:
142
- pass
143
-
144
- @cached_property
145
- def parser(self) -> LHTMLParser:
146
- """Get HTML parser."""
147
- return LHTMLParser(remove_blank_text=True, remove_comments=True, remove_pis=True, collect_ids=False)
148
-
149
- def _sleep(self, sleeptime: float = 0.75) -> None:
150
- """Sleep between API requests."""
151
- delay = 0.0 if not self.sleep_timestamp else 0.0 if time() - self.sleep_timestamp >= 20 else sleeptime
152
- self.sleep_timestamp = time()
153
- sleep(delay)
154
-
155
- def _get_url(
156
- self,
157
- method: Literal["GET", "HEAD", "OPTIONS", "DELETE", "POST", "PUT", "PATCH"],
158
- url: str,
159
- params: dict[str, str] | None = None,
160
- content: bytes | None = None,
161
- data: dict[str, str] | None = None,
162
- headers: dict[str, str] | None = None,
163
- cookies: dict[str, str] | None = None,
164
- json: Any = None,
165
- timeout: float | None = None,
166
- ) -> Any:
167
- self._sleep()
168
- try:
169
- resp = self.client.request(
170
- method,
171
- url,
172
- params=params,
173
- content=content,
174
- data=data,
175
- headers=headers,
176
- cookies=cookies,
177
- json=json,
178
- timeout=timeout or self.timeout,
179
- )
180
- except Exception as ex:
181
- if "time" in str(ex).lower():
182
- raise TimeoutE(f"{url} {type(ex).__name__}: {ex}") from ex
183
- raise WebscoutE(f"{url} {type(ex).__name__}: {ex}") from ex
184
- if resp.status_code == 200:
185
- return resp
186
- elif resp.status_code in (202, 301, 403, 400, 429, 418):
187
- raise RatelimitE(f"{resp.url} {resp.status_code} Ratelimit")
188
- raise WebscoutE(f"{resp.url} return None. {params=} {content=} {data=}")
189
-
190
- def _get_vqd(self, keywords: str) -> str:
191
- """Get vqd value for a search query."""
192
- resp_content = self._get_url("GET", "https://duckduckgo.com", params={"q": keywords}).content
193
- return _extract_vqd(resp_content, keywords)
194
-
195
def chat_yield(self, keywords: str, model: str = "gpt-4o-mini", timeout: int = 30, max_retries: int = 3) -> Iterator[str]:
    """Send a message to the DuckDuckGo AI chat endpoint and stream the reply.

    The user message is appended to ``self._chat_messages`` before the request
    is sent; the joined reply is appended as the assistant message once the
    stream has been consumed. ``self._chat_tokens_count`` is increased by an
    approximate token count (characters // 4, at least 1) for both messages.

    Args:
        keywords (str): The initial message or question to send to the AI.
        model (str): The model to use: "gpt-4o-mini", "llama-3.3-70b", "claude-3-haiku",
            "o3-mini", "mistral-small-3". Defaults to "gpt-4o-mini". A model that is
            not a key of ``self._chat_models`` triggers a warning and falls back to
            "gpt-4o-mini".
        timeout (int): Timeout value for the HTTP client. Defaults to 30.
        max_retries (int): Maximum number of retry attempts for rate limited requests. Defaults to 3.

    Yields:
        str: Chunks of the response from the AI.

    Raises:
        WebscoutE: The x-fe-version markers could not be parsed, the rate limit
            persisted after ``max_retries`` retries, or any other exception was
            raised while sending the chat request or parsing its stream (those
            are re-raised wrapped in WebscoutE).
    """
    chat_page_url = "https://duckduckgo.com/?q=DuckDuckGo+AI+Chat&ia=chat&duckai=1"

    def get_turnstile_token() -> str:
        """Return the Cloudflare Turnstile token found on the chat page, or "" (best effort)."""
        try:
            # Visit the DuckDuckGo chat page to get the Turnstile token
            resp_content = self._get_url(method="GET", url=chat_page_url).content

            # Extract the Turnstile token if available
            if b'cf-turnstile-response' in resp_content:
                token = resp_content.split(b'cf-turnstile-response="', maxsplit=1)[1].split(b'"', maxsplit=1)[0].decode()
                return token
            return ""
        except Exception:
            # Deliberate best effort: the chat request is still attempted without a token.
            return ""

    # x-fe-version
    if not self._chat_xfe:
        resp_content = self._get_url(method="GET", url=chat_page_url).content
        try:
            xfe1 = resp_content.split(b'__DDG_BE_VERSION__="', maxsplit=1)[1].split(b'"', maxsplit=1)[0].decode()
            xfe2 = resp_content.split(b'__DDG_FE_CHAT_HASH__="', maxsplit=1)[1].split(b'"', maxsplit=1)[0].decode()
            self._chat_xfe = f"{xfe1}-{xfe2}"
        except Exception as ex:
            raise WebscoutE(
                f"chat_yield() Error to get _chat_xfe: {type(ex).__name__}: {ex}"
            ) from ex
    # vqd
    if not self._chat_vqd:
        resp = self._get_url(
            method="GET", url="https://duckduckgo.com/duckchat/v1/status", headers={"x-vqd-accept": "1"}
        )
        self._chat_vqd = resp.headers.get("x-vqd-4", "")
        self._chat_vqd_hash = resp.headers.get("x-vqd-hash-1", "")

    self._chat_messages.append({"role": "user", "content": keywords})
    self._chat_tokens_count += max(len(keywords) // 4, 1)  # approximate number of tokens
    if model not in self._chat_models:
        warnings.warn(f"{model=} is unavailable. Using 'gpt-4o-mini'", stacklevel=1)
        model = "gpt-4o-mini"

    # Get Cloudflare Turnstile token
    turnstile_token = get_turnstile_token()

    json_data = {
        "model": self._chat_models[model],
        "messages": self._chat_messages,
    }

    # Add Turnstile token if available
    if turnstile_token:
        json_data["cf-turnstile-response"] = turnstile_token

    # Enhanced headers to better mimic a real browser
    chat_headers = {
        "x-fe-version": self._chat_xfe,
        "x-vqd-4": self._chat_vqd,
        "x-vqd-hash-1": "",
        "Accept": "text/event-stream",
        "Accept-Language": "en-US,en;q=0.9",
        "Cache-Control": "no-cache",
        "Content-Type": "application/json",
        "DNT": "1",
        "Origin": "https://duckduckgo.com",
        "Referer": "https://duckduckgo.com/",
        "Sec-Fetch-Dest": "empty",
        "Sec-Fetch-Mode": "cors",
        "Sec-Fetch-Site": "same-origin",
        "User-Agent": self.client.headers.get("User-Agent", ""),
    }

    # Retry logic for rate limited requests
    retry_count = 0
    while retry_count <= max_retries:
        try:
            resp = self._get_url(
                method="POST",
                url="https://duckduckgo.com/duckchat/v1/chat",
                headers=chat_headers,
                json=json_data,
                timeout=timeout,
            )

            self._chat_vqd = resp.headers.get("x-vqd-4", "")
            self._chat_vqd_hash = resp.headers.get("x-vqd-hash-1", "")
            chunks = []

            for chunk in resp.stream():
                lines = chunk.split(b"data:")
                for line in lines:
                    if line := line.strip():
                        if line == b"[DONE]":
                            break
                        if line == b"[DONE][LIMIT_CONVERSATION]":
                            raise ConversationLimitException("ERR_CONVERSATION_LIMIT")
                        x = json_loads(line)
                        if isinstance(x, dict):
                            if x.get("action") == "error":
                                err_message = x.get("type", "")
                                if x.get("status") == 429:
                                    raise (
                                        ConversationLimitException(err_message)
                                        if err_message == "ERR_CONVERSATION_LIMIT"
                                        else RatelimitE(err_message)
                                    )
                                raise WebscoutE(err_message)
                            elif message := x.get("message"):
                                chunks.append(message)
                                yield message

            # If we get here, the request was successful
            result = "".join(chunks)
            self._chat_messages.append({"role": "assistant", "content": result})
            # Same characters//4 approximation as for the user message above, so the
            # counter stays in one unit (the original added the raw character count).
            self._chat_tokens_count += max(len(result) // 4, 1)
            return

        except RatelimitE as ex:
            # NOTE(review): a rate-limit error raised mid-stream retries the whole
            # request, so already-yielded chunks may be repeated — confirm intent.
            retry_count += 1
            if retry_count > max_retries:
                raise WebscoutE(f"chat_yield() Rate limit exceeded after {max_retries} retries: {ex}") from ex

            # Get a fresh Turnstile token for the retry
            turnstile_token = get_turnstile_token()
            if turnstile_token:
                json_data["cf-turnstile-response"] = turnstile_token

            # Exponential backoff
            sleep_time = 2 ** retry_count
            sleep(sleep_time)

        except Exception as ex:
            raise WebscoutE(f"chat_yield() {type(ex).__name__}: {ex}") from ex
344
-
345
def chat(self, keywords: str, model: str = "gpt-4o-mini", timeout: int = 30, max_retries: int = 3) -> str:
    """Send a message to the AI chat and return the complete reply as one string.

    This drains ``self.chat_yield`` and concatenates every chunk it produces.

    Args:
        keywords (str): The initial message or question to send to the AI.
        model (str): The model to use: "gpt-4o-mini", "llama-3.3-70b", "claude-3-haiku",
            "o3-mini", "mistral-small-3". Defaults to "gpt-4o-mini".
        timeout (int): Timeout value for the HTTP client. Defaults to 30.
        max_retries (int): Maximum number of retry attempts for rate limited requests. Defaults to 3.

    Returns:
        str: The response from the AI.
    """
    pieces = list(self.chat_yield(keywords, model, timeout, max_retries))
    return "".join(pieces)
360
-
361
- def text(
362
- self,
363
- keywords: str,
364
- region: str = "wt-wt",
365
- safesearch: str = "moderate",
366
- timelimit: str | None = None,
367
- backend: str = "auto",
368
- max_results: int | None = None,
369
- ) -> list[dict[str, str]]:
370
- """webscout text search. Query params: https://duckduckgo.com/params.
371
-
372
- Args:
373
- keywords: keywords for query.
374
- region: wt-wt, us-en, uk-en, ru-ru, etc. Defaults to "wt-wt".
375
- safesearch: on, moderate, off. Defaults to "moderate".
376
- timelimit: d, w, m, y. Defaults to None.
377
- backend: auto, html, lite. Defaults to auto.
378
- auto - try all backends in random order,
379
- html - collect data from https://html.duckduckgo.com,
380
- lite - collect data from https://lite.duckduckgo.com.
381
- max_results: max number of results. If None, returns results only from the first response. Defaults to None.
382
-
383
- Returns:
384
- List of dictionaries with search results.
385
-
386
- Raises:
387
- WebscoutE: Base exception for webscout errors.
388
- RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
389
- TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
390
- """
391
- if backend in ("api", "ecosia"):
392
- warnings.warn(f"{backend=} is deprecated, using backend='auto'", stacklevel=2)
393
- backend = "auto"
394
- backends = ["html", "lite"] if backend == "auto" else [backend]
395
- shuffle(backends)
396
-
397
- results, err = [], None
398
- for b in backends:
399
- try:
400
- if b == "html":
401
- results = self._text_html(keywords, region, timelimit, max_results)
402
- elif b == "lite":
403
- results = self._text_lite(keywords, region, timelimit, max_results)
404
- return results
405
- except Exception as ex:
406
- err = ex
407
-
408
- raise WebscoutE(err)
409
-
410
def _text_api(
    self,
    keywords: str,
    region: str = "wt-wt",
    safesearch: str = "moderate",
    timelimit: str | None = None,
    max_results: int | None = None,
) -> list[dict[str, str]]:
    """webscout text search via https://links.duckduckgo.com/d.js. Query params: https://duckduckgo.com/params.

    Args:
        keywords: keywords for query.
        region: wt-wt, us-en, uk-en, ru-ru, etc. Defaults to "wt-wt".
        safesearch: on, moderate, off. Defaults to "moderate".
        timelimit: d, w, m, y. Defaults to None.
        max_results: max number of results (capped at 2023). If None, returns results only from the first response.
            Defaults to None.

    Returns:
        List of dictionaries with keys "title", "href" and "body"; rows with an
        empty body or an already seen href are dropped.

    Raises:
        AssertionError: keywords is empty.
        WebscoutE: Base exception for webscout errors.
        RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
        TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
    """
    assert keywords, "keywords is mandatory"

    vqd = self._get_vqd(keywords)

    payload = {
        "q": keywords,
        "kl": region,
        "l": region,
        "p": "",
        "s": "0",
        "df": "",
        "vqd": vqd,
        "bing_market": f"{region[3:]}-{region[:2].upper()}",
        "ex": "",
    }
    safesearch = safesearch.lower()
    if safesearch == "moderate":
        payload["ex"] = "-1"
    elif safesearch == "off":
        payload["ex"] = "-2"
    elif safesearch == "on":  # strict
        payload["p"] = "1"
    if timelimit:
        payload["df"] = timelimit

    cache = set()
    results: list[dict[str, str]] = []

    def _text_api_page(s: int) -> list[dict[str, str]]:
        """Fetch and parse the result page that starts at offset *s*."""
        # Per-page copy: pages are dispatched through self._executor.map and may
        # run concurrently, so the shared payload must not carry the offset.
        page_payload = {**payload, "s": f"{s}"}
        resp_content = self._get_url("GET", "https://links.duckduckgo.com/d.js", params=page_payload).content
        page_data = _text_extract_json(resp_content, keywords)
        page_results = []
        for row in page_data:
            href = row.get("u", None)
            if href and href not in cache and href != f"http://www.google.com/search?q={keywords}":
                cache.add(href)
                body = _normalize(row["a"])
                if body:
                    result = {
                        "title": _normalize(row["t"]),
                        "href": _normalize_url(href),
                        "body": body,
                    }
                    page_results.append(result)
        return page_results

    slist = [0]
    if max_results:
        max_results = min(max_results, 2023)
        slist.extend(range(23, max_results, 50))
    for r in self._executor.map(_text_api_page, slist):
        results.extend(r)

    return list(islice(results, max_results))
493
-
494
def _text_html(
    self,
    keywords: str,
    region: str = "wt-wt",
    timelimit: str | None = None,
    max_results: int | None = None,
) -> list[dict[str, str]]:
    """webscout text search via https://html.duckduckgo.com/html. Query params: https://duckduckgo.com/params.

    Args:
        keywords: keywords for query.
        region: wt-wt, us-en, uk-en, ru-ru, etc. Defaults to "wt-wt".
        timelimit: d, w, m, y. Defaults to None.
        max_results: max number of results (capped at 2023). If None, returns results only from the first response.
            Defaults to None. A vqd value is fetched only when more than 20 results are requested.

    Returns:
        List of dictionaries with keys "title", "href" and "body".

    Raises:
        AssertionError: keywords is empty.
        WebscoutE: Base exception for webscout errors.
        RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
        TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
    """
    assert keywords, "keywords is mandatory"

    payload = {
        "q": keywords,
        "s": "0",
        "o": "json",
        "api": "d.js",
        "vqd": "",
        "kl": region,
        "bing_market": region,
    }
    if timelimit:
        payload["df"] = timelimit
    if max_results and max_results > 20:
        vqd = self._get_vqd(keywords)
        payload["vqd"] = vqd

    cache = set()
    results: list[dict[str, str]] = []

    def _text_html_page(s: int) -> list[dict[str, str]]:
        """Fetch and parse the result page that starts at offset *s*."""
        # Per-page copy: pages are dispatched through self._executor.map and may
        # run concurrently, so the shared payload must not carry the offset.
        page_payload = {**payload, "s": f"{s}"}
        resp_content = self._get_url("POST", "https://html.duckduckgo.com/html", data=page_payload).content
        if b"No results." in resp_content:
            return []

        page_results = []
        tree = document_fromstring(resp_content, self.parser)
        elements = tree.xpath("//div[h2]")
        if not isinstance(elements, list):
            return []
        for e in elements:
            if isinstance(e, _Element):
                hrefxpath = e.xpath("./a/@href")
                href = str(hrefxpath[0]) if hrefxpath and isinstance(hrefxpath, list) else None
                # Skip duplicates, the Google fallback link and ad redirects.
                if (
                    href
                    and href not in cache
                    and not href.startswith(
                        ("http://www.google.com/search?q=", "https://duckduckgo.com/y.js?ad_domain")
                    )
                ):
                    cache.add(href)
                    titlexpath = e.xpath("./h2/a/text()")
                    title = str(titlexpath[0]) if titlexpath and isinstance(titlexpath, list) else ""
                    bodyxpath = e.xpath("./a//text()")
                    body = "".join(str(x) for x in bodyxpath) if bodyxpath and isinstance(bodyxpath, list) else ""
                    result = {
                        "title": _normalize(title),
                        "href": _normalize_url(href),
                        "body": _normalize(body),
                    }
                    page_results.append(result)
        return page_results

    slist = [0]
    if max_results:
        max_results = min(max_results, 2023)
        slist.extend(range(23, max_results, 50))
    for r in self._executor.map(_text_html_page, slist):
        results.extend(r)

    return list(islice(results, max_results))
583
-
584
def _text_lite(
    self,
    keywords: str,
    region: str = "wt-wt",
    timelimit: str | None = None,
    max_results: int | None = None,
) -> list[dict[str, str]]:
    """webscout text search via https://lite.duckduckgo.com/lite/. Query params: https://duckduckgo.com/params.

    Args:
        keywords: keywords for query.
        region: wt-wt, us-en, uk-en, ru-ru, etc. Defaults to "wt-wt".
        timelimit: d, w, m, y. Defaults to None.
        max_results: max number of results (capped at 2023). If None, returns results only from the first response.
            Defaults to None.

    Returns:
        List of dictionaries with keys "title", "href" and "body".

    Raises:
        AssertionError: keywords is empty.
        WebscoutE: Base exception for webscout errors.
        RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
        TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
    """
    assert keywords, "keywords is mandatory"

    payload = {
        "q": keywords,
        "s": "0",
        "o": "json",
        "api": "d.js",
        "vqd": "",
        "kl": region,
        "bing_market": region,
    }
    if timelimit:
        payload["df"] = timelimit

    cache = set()
    results: list[dict[str, str]] = []

    def _text_lite_page(s: int) -> list[dict[str, str]]:
        """Fetch and parse the result page that starts at offset *s*."""
        # Per-page copy: pages are dispatched through self._executor.map and may
        # run concurrently, so the shared payload must not carry the offset.
        page_payload = {**payload, "s": f"{s}"}
        resp_content = self._get_url("POST", "https://lite.duckduckgo.com/lite/", data=page_payload).content
        if b"No more results." in resp_content:
            return []

        page_results = []
        tree = document_fromstring(resp_content, self.parser)
        elements = tree.xpath("//table[last()]//tr")
        if not isinstance(elements, list):
            return []

        # Rows are consumed in groups of four: i == 1 carries the link/title,
        # i == 2 the snippet; i == 3 and i == 4 are not read.
        data = zip(cycle(range(1, 5)), elements)
        for i, e in data:
            if isinstance(e, _Element):
                if i == 1:
                    hrefxpath = e.xpath(".//a//@href")
                    href = str(hrefxpath[0]) if hrefxpath and isinstance(hrefxpath, list) else None
                    if (
                        href is None
                        or href in cache
                        or href.startswith(
                            ("http://www.google.com/search?q=", "https://duckduckgo.com/y.js?ad_domain")
                        )
                    ):
                        # skip block(i=1,2,3,4)
                        for _ in range(3):
                            next(data, None)
                    else:
                        cache.add(href)
                        titlexpath = e.xpath(".//a//text()")
                        title = str(titlexpath[0]) if titlexpath and isinstance(titlexpath, list) else ""
                elif i == 2:
                    bodyxpath = e.xpath(".//td[@class='result-snippet']//text()")
                    body = (
                        "".join(str(x) for x in bodyxpath).strip()
                        if bodyxpath and isinstance(bodyxpath, list)
                        else ""
                    )
                    if href:
                        result = {
                            "title": _normalize(title),
                            "href": _normalize_url(href),
                            "body": _normalize(body),
                        }
                        page_results.append(result)
        return page_results

    slist = [0]
    if max_results:
        max_results = min(max_results, 2023)
        slist.extend(range(23, max_results, 50))
    for r in self._executor.map(_text_lite_page, slist):
        results.extend(r)

    return list(islice(results, max_results))
681
-
682
def images(
    self,
    keywords: str,
    region: str = "wt-wt",
    safesearch: str = "moderate",
    timelimit: str | None = None,
    size: str | None = None,
    color: str | None = None,
    type_image: str | None = None,
    layout: str | None = None,
    license_image: str | None = None,
    max_results: int | None = None,
) -> list[dict[str, str]]:
    """webscout images search. Query params: https://duckduckgo.com/params.

    Args:
        keywords: keywords for query.
        region: wt-wt, us-en, uk-en, ru-ru, etc. Defaults to "wt-wt".
        safesearch: on, moderate, off. Defaults to "moderate".
        timelimit: Day, Week, Month, Year. Defaults to None.
        size: Small, Medium, Large, Wallpaper. Defaults to None.
        color: color, Monochrome, Red, Orange, Yellow, Green, Blue,
            Purple, Pink, Brown, Black, Gray, Teal, White. Defaults to None.
        type_image: photo, clipart, gif, transparent, line.
            Defaults to None.
        layout: Square, Tall, Wide. Defaults to None.
        license_image: any (All Creative Commons), Public (PublicDomain),
            Share (Free to Share and Use), ShareCommercially (Free to Share and Use Commercially),
            Modify (Free to Modify, Share, and Use), ModifyCommercially (Free to Modify, Share, and
            Use Commercially). Defaults to None.
        max_results: max number of results (capped at 500). If None, returns results only from the first response.
            Defaults to None.

    Returns:
        List of dictionaries with images search results.

    Raises:
        AssertionError: keywords is empty.
        KeyError: safesearch is not one of on, moderate, off.
        WebscoutE: Base exception for webscout errors.
        RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
        TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
    """
    assert keywords, "keywords is mandatory"

    vqd = self._get_vqd(keywords)

    safesearch_base = {"on": "1", "moderate": "1", "off": "-1"}
    timelimit = f"time:{timelimit}" if timelimit else ""
    size = f"size:{size}" if size else ""
    color = f"color:{color}" if color else ""
    type_image = f"type:{type_image}" if type_image else ""
    layout = f"layout:{layout}" if layout else ""
    license_image = f"license:{license_image}" if license_image else ""
    payload = {
        "l": region,
        "o": "json",
        "q": keywords,
        "vqd": vqd,
        "f": f"{timelimit},{size},{color},{type_image},{layout},{license_image}",
        "p": safesearch_base[safesearch.lower()],
    }

    cache = set()
    results: list[dict[str, str]] = []

    def _images_page(s: int) -> list[dict[str, str]]:
        """Fetch and parse the result page that starts at offset *s*."""
        # Per-page copy: pages are dispatched through self._executor.map and may
        # run concurrently, so the shared payload must not carry the offset.
        page_payload = {**payload, "s": f"{s}"}
        resp_content = self._get_url("GET", "https://duckduckgo.com/i.js", params=page_payload).content
        resp_json = json_loads(resp_content)

        page_data = resp_json.get("results", [])
        page_results = []
        for row in page_data:
            image_url = row.get("image")
            if image_url and image_url not in cache:
                cache.add(image_url)
                result = {
                    "title": row["title"],
                    "image": _normalize_url(image_url),
                    "thumbnail": _normalize_url(row["thumbnail"]),
                    "url": _normalize_url(row["url"]),
                    "height": row["height"],
                    "width": row["width"],
                    "source": row["source"],
                }
                page_results.append(result)
        return page_results

    slist = [0]
    if max_results:
        max_results = min(max_results, 500)
        slist.extend(range(100, max_results, 100))
    for r in self._executor.map(_images_page, slist):
        results.extend(r)

    return list(islice(results, max_results))
779
-
780
def videos(
    self,
    keywords: str,
    region: str = "wt-wt",
    safesearch: str = "moderate",
    timelimit: str | None = None,
    resolution: str | None = None,
    duration: str | None = None,
    license_videos: str | None = None,
    max_results: int | None = None,
) -> list[dict[str, str]]:
    """webscout videos search. Query params: https://duckduckgo.com/params.

    Args:
        keywords: keywords for query.
        region: wt-wt, us-en, uk-en, ru-ru, etc. Defaults to "wt-wt".
        safesearch: on, moderate, off. Defaults to "moderate".
        timelimit: d, w, m. Defaults to None.
        resolution: high, standart. Defaults to None.
        duration: short, medium, long. Defaults to None.
        license_videos: creativeCommon, youtube. Defaults to None.
        max_results: max number of results (capped at 400). If None, returns results only from the first response.
            Defaults to None.

    Returns:
        List of dictionaries with videos search results; rows are returned as
        received, de-duplicated on their "content" value.

    Raises:
        AssertionError: keywords is empty.
        KeyError: safesearch is not one of on, moderate, off.
        WebscoutE: Base exception for webscout errors.
        RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
        TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
    """
    assert keywords, "keywords is mandatory"

    vqd = self._get_vqd(keywords)

    safesearch_base = {"on": "1", "moderate": "-1", "off": "-2"}
    timelimit = f"publishedAfter:{timelimit}" if timelimit else ""
    resolution = f"videoDefinition:{resolution}" if resolution else ""
    duration = f"videoDuration:{duration}" if duration else ""
    license_videos = f"videoLicense:{license_videos}" if license_videos else ""
    payload = {
        "l": region,
        "o": "json",
        "q": keywords,
        "vqd": vqd,
        "f": f"{timelimit},{resolution},{duration},{license_videos}",
        "p": safesearch_base[safesearch.lower()],
    }

    cache = set()
    results: list[dict[str, str]] = []

    def _videos_page(s: int) -> list[dict[str, str]]:
        """Fetch and parse the result page that starts at offset *s*."""
        # Per-page copy: pages are dispatched through self._executor.map and may
        # run concurrently, so the shared payload must not carry the offset.
        page_payload = {**payload, "s": f"{s}"}
        resp_content = self._get_url("GET", "https://duckduckgo.com/v.js", params=page_payload).content
        resp_json = json_loads(resp_content)

        page_data = resp_json.get("results", [])
        page_results = []
        for row in page_data:
            if row["content"] not in cache:
                cache.add(row["content"])
                page_results.append(row)
        return page_results

    slist = [0]
    if max_results:
        max_results = min(max_results, 400)
        slist.extend(range(60, max_results, 60))
    for r in self._executor.map(_videos_page, slist):
        results.extend(r)

    return list(islice(results, max_results))
856
-
857
def news(
    self,
    keywords: str,
    region: str = "wt-wt",
    safesearch: str = "moderate",
    timelimit: str | None = None,
    max_results: int | None = None,
) -> list[dict[str, str]]:
    """webscout news search. Query params: https://duckduckgo.com/params.

    Args:
        keywords: keywords for query.
        region: wt-wt, us-en, uk-en, ru-ru, etc. Defaults to "wt-wt".
        safesearch: on, moderate, off. Defaults to "moderate".
        timelimit: d, w, m. Defaults to None.
        max_results: max number of results (capped at 120). If None, returns results only from the first response.
            Defaults to None.

    Returns:
        List of dictionaries with news search results; "date" is the row's
        timestamp rendered as a UTC ISO-8601 string.

    Raises:
        AssertionError: keywords is empty.
        KeyError: safesearch is not one of on, moderate, off.
        WebscoutE: Base exception for webscout errors.
        RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
        TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
    """
    assert keywords, "keywords is mandatory"

    vqd = self._get_vqd(keywords)

    safesearch_base = {"on": "1", "moderate": "-1", "off": "-2"}
    payload = {
        "l": region,
        "o": "json",
        "noamp": "1",
        "q": keywords,
        "vqd": vqd,
        "p": safesearch_base[safesearch.lower()],
    }
    if timelimit:
        payload["df"] = timelimit

    cache = set()
    results: list[dict[str, str]] = []

    def _news_page(s: int) -> list[dict[str, str]]:
        """Fetch and parse the result page that starts at offset *s*."""
        # Per-page copy: pages are dispatched through self._executor.map and may
        # run concurrently, so the shared payload must not carry the offset.
        page_payload = {**payload, "s": f"{s}"}
        resp_content = self._get_url("GET", "https://duckduckgo.com/news.js", params=page_payload).content
        resp_json = json_loads(resp_content)
        page_data = resp_json.get("results", [])
        page_results = []
        for row in page_data:
            if row["url"] not in cache:
                cache.add(row["url"])
                image_url = row.get("image", None)
                result = {
                    "date": datetime.fromtimestamp(row["date"], timezone.utc).isoformat(),
                    "title": row["title"],
                    "body": _normalize(row["excerpt"]),
                    "url": _normalize_url(row["url"]),
                    "image": _normalize_url(image_url),
                    "source": row["source"],
                }
                page_results.append(result)
        return page_results

    slist = [0]
    if max_results:
        max_results = min(max_results, 120)
        slist.extend(range(30, max_results, 30))
    for r in self._executor.map(_news_page, slist):
        results.extend(r)

    return list(islice(results, max_results))
933
-
934
def answers(self, keywords: str) -> list[dict[str, str]]:
    """webscout instant answers. Query params: https://duckduckgo.com/params.

    Two requests are made to https://api.duckduckgo.com/: one for
    "what is <keywords>" (its abstract, if any, becomes the first result) and
    one for the plain keywords (its related topics become the remaining results).

    Args:
        keywords: keywords for query,

    Returns:
        List of dictionaries with instant answers results.

    Raises:
        WebscoutE: Base exception for webscout errors.
        RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
        TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
    """
    assert keywords, "keywords is mandatory"

    def _related_entry(item, topic):
        """Build one result dict from a related-topic item."""
        icon = item["Icon"].get("URL")
        return {
            "icon": f"https://duckduckgo.com{icon}" if icon else "",
            "text": item["Text"],
            "topic": topic,
            "url": item["FirstURL"],
        }

    abstract_query = {
        "q": f"what is {keywords}",
        "format": "json",
    }
    abstract_raw = self._get_url("GET", "https://api.duckduckgo.com/", params=abstract_query).content
    abstract_json = json_loads(abstract_raw)

    results = []
    answer = abstract_json.get("AbstractText")
    url = abstract_json.get("AbstractURL")
    if answer:
        results.append({"icon": None, "text": answer, "topic": None, "url": url})

    # related
    related_query = {
        "q": f"{keywords}",
        "format": "json",
    }
    related_raw = self._get_url("GET", "https://api.duckduckgo.com/", params=related_query).content
    related_topics = json_loads(related_raw).get("RelatedTopics", [])

    for row in related_topics:
        topic = row.get("Name")
        if topic:
            # A named row is a group: emit each of its sub-topics under that name.
            for subrow in row["Topics"]:
                results.append(_related_entry(subrow, topic))
        else:
            results.append(_related_entry(row, None))

    return results
1004
-
1005
def suggestions(self, keywords: str, region: str = "wt-wt") -> list[dict[str, str]]:
    """webscout suggestions. Query params: https://duckduckgo.com/params.

    Queries https://duckduckgo.com/ac/ and returns the decoded JSON items as a list.

    Args:
        keywords: keywords for query.
        region: wt-wt, us-en, uk-en, ru-ru, etc. Defaults to "wt-wt".

    Returns:
        List of dictionaries with suggestions results.

    Raises:
        WebscoutE: Base exception for webscout errors.
        RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
        TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
    """
    assert keywords, "keywords is mandatory"

    query = {
        "q": keywords,
        "kl": region,
    }
    response = self._get_url("GET", "https://duckduckgo.com/ac/", params=query)
    return list(json_loads(response.content))
1029
-
1030
- def maps(
1031
- self,
1032
- keywords: str,
1033
- place: str | None = None,
1034
- street: str | None = None,
1035
- city: str | None = None,
1036
- county: str | None = None,
1037
- state: str | None = None,
1038
- country: str | None = None,
1039
- postalcode: str | None = None,
1040
- latitude: str | None = None,
1041
- longitude: str | None = None,
1042
- radius: int = 0,
1043
- max_results: int | None = None,
1044
- ) -> list[dict[str, str]]:
1045
- """webscout maps search. Query params: https://duckduckgo.com/params.
1046
-
1047
- Args:
1048
- keywords: keywords for query
1049
- place: if set, the other parameters are not used. Defaults to None.
1050
- street: house number/street. Defaults to None.
1051
- city: city of search. Defaults to None.
1052
- county: county of search. Defaults to None.
1053
- state: state of search. Defaults to None.
1054
- country: country of search. Defaults to None.
1055
- postalcode: postalcode of search. Defaults to None.
1056
- latitude: geographic coordinate (north-south position). Defaults to None.
1057
- longitude: geographic coordinate (east-west position); if latitude and
1058
- longitude are set, the other parameters are not used. Defaults to None.
1059
- radius: expand the search square by the distance in kilometers. Defaults to 0.
1060
- max_results: max number of results. If None, returns results only from the first response. Defaults to None.
1061
-
1062
- Returns:
1063
- List of dictionaries with maps search results, or None if there was an error.
1064
-
1065
- Raises:
1066
- WebscoutE: Base exception for webscout errors.
1067
- RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
1068
- TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
1069
- """
1070
- assert keywords, "keywords is mandatory"
1071
-
1072
- vqd = self._get_vqd(keywords)
1073
-
1074
- # if longitude and latitude are specified, skip the request about bbox to the nominatim api
1075
- if latitude and longitude:
1076
- lat_t = Decimal(latitude.replace(",", "."))
1077
- lat_b = Decimal(latitude.replace(",", "."))
1078
- lon_l = Decimal(longitude.replace(",", "."))
1079
- lon_r = Decimal(longitude.replace(",", "."))
1080
- if radius == 0:
1081
- radius = 1
1082
- # otherwise request about bbox to nominatim api
1083
- else:
1084
- if place:
1085
- params = {
1086
- "q": place,
1087
- "polygon_geojson": "0",
1088
- "format": "jsonv2",
1089
- }
1090
- else:
1091
- params = {
1092
- "polygon_geojson": "0",
1093
- "format": "jsonv2",
1094
- }
1095
- if street:
1096
- params["street"] = street
1097
- if city:
1098
- params["city"] = city
1099
- if county:
1100
- params["county"] = county
1101
- if state:
1102
- params["state"] = state
1103
- if country:
1104
- params["country"] = country
1105
- if postalcode:
1106
- params["postalcode"] = postalcode
1107
- # request nominatim api to get coordinates box
1108
- resp_content = self._get_url(
1109
- "GET",
1110
- "https://nominatim.openstreetmap.org/search.php",
1111
- params=params,
1112
- ).content
1113
- if resp_content == b"[]":
1114
- raise WebscoutE("maps() Coordinates are not found, check function parameters.")
1115
- resp_json = json_loads(resp_content)
1116
- coordinates = resp_json[0]["boundingbox"]
1117
- lat_t, lon_l = Decimal(coordinates[1]), Decimal(coordinates[2])
1118
- lat_b, lon_r = Decimal(coordinates[0]), Decimal(coordinates[3])
1119
-
1120
- # if a radius is specified, expand the search square
1121
- lat_t += Decimal(radius) * Decimal(0.008983)
1122
- lat_b -= Decimal(radius) * Decimal(0.008983)
1123
- lon_l -= Decimal(radius) * Decimal(0.008983)
1124
- lon_r += Decimal(radius) * Decimal(0.008983)
1125
- # logger.debug(f"bbox coordinates\n{lat_t} {lon_l}\n{lat_b} {lon_r}")
1126
-
1127
- cache = set()
1128
- results: list[dict[str, str]] = []
1129
-
1130
- def _maps_page(
1131
- bbox: tuple[Decimal, Decimal, Decimal, Decimal],
1132
- ) -> list[dict[str, str]] | None:
1133
- if max_results and len(results) >= max_results:
1134
- return None
1135
- lat_t, lon_l, lat_b, lon_r = bbox
1136
- params = {
1137
- "q": keywords,
1138
- "vqd": vqd,
1139
- "tg": "maps_places",
1140
- "rt": "D",
1141
- "mkexp": "b",
1142
- "wiki_info": "1",
1143
- "is_requery": "1",
1144
- "bbox_tl": f"{lat_t},{lon_l}",
1145
- "bbox_br": f"{lat_b},{lon_r}",
1146
- "strict_bbox": "1",
1147
- }
1148
- resp_content = self._get_url("GET", "https://duckduckgo.com/local.js", params=params).content
1149
- resp_json = json_loads(resp_content)
1150
- page_data = resp_json.get("results", [])
1151
-
1152
- page_results = []
1153
- for res in page_data:
1154
- r_name = f'{res["name"]} {res["address"]}'
1155
- if r_name in cache:
1156
- continue
1157
- else:
1158
- cache.add(r_name)
1159
- result = {
1160
- "title": res["name"],
1161
- "address": res["address"],
1162
- "country_code": res["country_code"],
1163
- "url": _normalize_url(res["website"]),
1164
- "phone": res["phone"] or "",
1165
- "latitude": res["coordinates"]["latitude"],
1166
- "longitude": res["coordinates"]["longitude"],
1167
- "source": _normalize_url(res["url"]),
1168
- "image": x.get("image", "") if (x := res["embed"]) else "",
1169
- "desc": x.get("description", "") if (x := res["embed"]) else "",
1170
- "hours": res["hours"] or "",
1171
- "category": res["ddg_category"] or "",
1172
- "facebook": f"www.facebook.com/profile.php?id={x}" if (x := res["facebook_id"]) else "",
1173
- "instagram": f"https://www.instagram.com/{x}" if (x := res["instagram_id"]) else "",
1174
- "twitter": f"https://twitter.com/{x}" if (x := res["twitter_id"]) else "",
1175
- }
1176
- page_results.append(result)
1177
- return page_results
1178
-
1179
- # search squares (bboxes)
1180
- start_bbox = (lat_t, lon_l, lat_b, lon_r)
1181
- work_bboxes = [start_bbox]
1182
- while work_bboxes:
1183
- queue_bboxes = [] # for next iteration, at the end of the iteration work_bboxes = queue_bboxes
1184
- tasks = []
1185
- for bbox in work_bboxes:
1186
- tasks.append(bbox)
1187
- # if distance between coordinates > 1, divide the square into 4 parts and save them in queue_bboxes
1188
- if _calculate_distance(lat_t, lon_l, lat_b, lon_r) > 1:
1189
- lat_t, lon_l, lat_b, lon_r = bbox
1190
- lat_middle = (lat_t + lat_b) / 2
1191
- lon_middle = (lon_l + lon_r) / 2
1192
- bbox1 = (lat_t, lon_l, lat_middle, lon_middle)
1193
- bbox2 = (lat_t, lon_middle, lat_middle, lon_r)
1194
- bbox3 = (lat_middle, lon_l, lat_b, lon_middle)
1195
- bbox4 = (lat_middle, lon_middle, lat_b, lon_r)
1196
- queue_bboxes.extend([bbox1, bbox2, bbox3, bbox4])
1197
-
1198
- # gather tasks using asyncio.wait_for and timeout
1199
- work_bboxes_results = []
1200
- try:
1201
- for r in self._executor.map(_maps_page, tasks):
1202
- if r:
1203
- work_bboxes_results.extend(r)
1204
- except Exception as e:
1205
- raise e
1206
-
1207
- for x in work_bboxes_results:
1208
- if isinstance(x, list):
1209
- results.extend(x)
1210
- elif isinstance(x, dict):
1211
- results.append(x)
1212
-
1213
- work_bboxes = queue_bboxes
1214
- if not max_results or len(results) >= max_results or len(work_bboxes_results) == 0:
1215
- break
1216
-
1217
- return list(islice(results, max_results))
1218
-
1219
- def translate(self, keywords: list[str] | str, from_: str | None = None, to: str = "en") -> list[dict[str, str]]:
1220
- """webscout translate.
1221
-
1222
- Args:
1223
- keywords: string or list of strings to translate.
1224
- from_: translate from (defaults automatically). Defaults to None.
1225
- to: what language to translate. Defaults to "en".
1226
-
1227
- Returns:
1228
- List od dictionaries with translated keywords.
1229
-
1230
- Raises:
1231
- WebscoutE: Base exception for webscout errors.
1232
- RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
1233
- TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
1234
- """
1235
- assert keywords, "keywords is mandatory"
1236
-
1237
- vqd = self._get_vqd("translate")
1238
-
1239
- payload = {
1240
- "vqd": vqd,
1241
- "query": "translate",
1242
- "to": to,
1243
- }
1244
- if from_:
1245
- payload["from"] = from_
1246
-
1247
- def _translate_keyword(keyword: str) -> dict[str, str]:
1248
- resp_content = self._get_url(
1249
- "POST",
1250
- "https://duckduckgo.com/translation.js",
1251
- params=payload,
1252
- content=keyword.encode(),
1253
- ).content
1254
- page_data: dict[str, str] = json_loads(resp_content)
1255
- page_data["original"] = keyword
1256
- return page_data
1257
-
1258
- if isinstance(keywords, str):
1259
- keywords = [keywords]
1260
-
1261
- results = []
1262
- try:
1263
- for r in self._executor.map(_translate_keyword, keywords):
1264
- results.append(r)
1265
- except Exception as e:
1266
- raise e
1267
-
1268
- return results
1269
-
1270
- def weather(
1271
- self,
1272
- location: str,
1273
- language: str = "en",
1274
- ) -> dict[str, Any]:
1275
- """Get weather information for a location from DuckDuckGo.
1276
-
1277
- Args:
1278
- location: Location to get weather for.
1279
- language: Language code (e.g. 'en', 'es'). Defaults to "en".
1280
-
1281
- Returns:
1282
- Dictionary containing weather data with structure described in docstring.
1283
-
1284
- Raises:
1285
- WebscoutE: Base exception for webscout errors.
1286
- RatelimitE: Inherits from WebscoutE, raised for exceeding API request rate limits.
1287
- TimeoutE: Inherits from WebscoutE, raised for API request timeouts.
1288
- """
1289
- assert location, "location is mandatory"
1290
- lang = language.split('-')[0]
1291
- url = f"https://duckduckgo.com/js/spice/forecast/{quote(location)}/{lang}"
1292
-
1293
- resp = self._get_url("GET", url).content
1294
- resp_text = resp.decode('utf-8')
1295
-
1296
- if "ddg_spice_forecast(" not in resp_text:
1297
- raise WebscoutE(f"No weather data found for {location}")
1298
-
1299
- json_text = resp_text[resp_text.find('(') + 1:resp_text.rfind(')')]
1300
- try:
1301
- result = json.loads(json_text)
1302
- except Exception as e:
1303
- raise WebscoutE(f"Error parsing weather JSON: {e}")
1304
-
1305
- if not result or 'currentWeather' not in result or 'forecastDaily' not in result:
1306
- raise WebscoutE(f"Invalid weather data format for {location}")
1307
-
1308
- formatted_data = {
1309
- "location": result["currentWeather"]["metadata"].get("ddg-location", "Unknown"),
1310
- "current": {
1311
- "condition": result["currentWeather"].get("conditionCode"),
1312
- "temperature_c": result["currentWeather"].get("temperature"),
1313
- "feels_like_c": result["currentWeather"].get("temperatureApparent"),
1314
- "humidity": result["currentWeather"].get("humidity"),
1315
- "wind_speed_ms": result["currentWeather"].get("windSpeed"),
1316
- "wind_direction": result["currentWeather"].get("windDirection"),
1317
- "visibility_m": result["currentWeather"].get("visibility"),
1318
- },
1319
- "daily_forecast": [],
1320
- "hourly_forecast": []
1321
- }
1322
-
1323
- for day in result["forecastDaily"]["days"]:
1324
- formatted_data["daily_forecast"].append({
1325
- "date": datetime.fromisoformat(day["forecastStart"].replace("Z", "+00:00")).strftime("%Y-%m-%d"),
1326
- "condition": day["daytimeForecast"].get("conditionCode"),
1327
- "max_temp_c": day["temperatureMax"],
1328
- "min_temp_c": day["temperatureMin"],
1329
- "sunrise": datetime.fromisoformat(day["sunrise"].replace("Z", "+00:00")).strftime("%H:%M"),
1330
- "sunset": datetime.fromisoformat(day["sunset"].replace("Z", "+00:00")).strftime("%H:%M"),
1331
- })
1332
-
1333
- if 'forecastHourly' in result and 'hours' in result['forecastHourly']:
1334
- for hour in result['forecastHourly']['hours']:
1335
- formatted_data["hourly_forecast"].append({
1336
- "time": datetime.fromisoformat(hour["forecastStart"].replace("Z", "+00:00")).strftime("%H:%M"),
1337
- "condition": hour.get("conditionCode"),
1338
- "temperature_c": hour.get("temperature"),
1339
- "feels_like_c": hour.get("temperatureApparent"),
1340
- "humidity": hour.get("humidity"),
1341
- "wind_speed_ms": hour.get("windSpeed"),
1342
- "wind_direction": hour.get("windDirection"),
1343
- "visibility_m": hour.get("visibility"),
1344
- })
1345
-
1346
- return formatted_data