webscout 8.2.7__py3-none-any.whl → 8.2.9__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- webscout/AIauto.py +33 -15
- webscout/AIbase.py +96 -37
- webscout/AIutel.py +703 -250
- webscout/Bard.py +441 -323
- webscout/Extra/Act.md +309 -0
- webscout/Extra/GitToolkit/__init__.py +10 -0
- webscout/Extra/GitToolkit/gitapi/README.md +110 -0
- webscout/Extra/GitToolkit/gitapi/__init__.py +12 -0
- webscout/Extra/GitToolkit/gitapi/repository.py +195 -0
- webscout/Extra/GitToolkit/gitapi/user.py +96 -0
- webscout/Extra/GitToolkit/gitapi/utils.py +62 -0
- webscout/Extra/YTToolkit/README.md +375 -0
- webscout/Extra/YTToolkit/YTdownloader.py +957 -0
- webscout/Extra/YTToolkit/__init__.py +3 -0
- webscout/Extra/YTToolkit/transcriber.py +476 -0
- webscout/Extra/YTToolkit/ytapi/README.md +44 -0
- webscout/Extra/YTToolkit/ytapi/__init__.py +6 -0
- webscout/Extra/YTToolkit/ytapi/channel.py +307 -0
- webscout/Extra/YTToolkit/ytapi/errors.py +13 -0
- webscout/Extra/YTToolkit/ytapi/extras.py +118 -0
- webscout/Extra/YTToolkit/ytapi/https.py +88 -0
- webscout/Extra/YTToolkit/ytapi/patterns.py +61 -0
- webscout/Extra/YTToolkit/ytapi/playlist.py +59 -0
- webscout/Extra/YTToolkit/ytapi/pool.py +8 -0
- webscout/Extra/YTToolkit/ytapi/query.py +40 -0
- webscout/Extra/YTToolkit/ytapi/stream.py +63 -0
- webscout/Extra/YTToolkit/ytapi/utils.py +62 -0
- webscout/Extra/YTToolkit/ytapi/video.py +232 -0
- webscout/Extra/__init__.py +7 -0
- webscout/Extra/autocoder/__init__.py +9 -0
- webscout/Extra/autocoder/autocoder.py +1105 -0
- webscout/Extra/autocoder/autocoder_utiles.py +332 -0
- webscout/Extra/gguf.md +430 -0
- webscout/Extra/gguf.py +684 -0
- webscout/Extra/tempmail/README.md +488 -0
- webscout/Extra/tempmail/__init__.py +28 -0
- webscout/Extra/tempmail/async_utils.py +141 -0
- webscout/Extra/tempmail/base.py +161 -0
- webscout/Extra/tempmail/cli.py +187 -0
- webscout/Extra/tempmail/emailnator.py +84 -0
- webscout/Extra/tempmail/mail_tm.py +361 -0
- webscout/Extra/tempmail/temp_mail_io.py +292 -0
- webscout/Extra/weather.md +281 -0
- webscout/Extra/weather.py +194 -0
- webscout/Extra/weather_ascii.py +76 -0
- webscout/Litlogger/README.md +10 -0
- webscout/Litlogger/__init__.py +15 -0
- webscout/Litlogger/formats.py +4 -0
- webscout/Litlogger/handlers.py +103 -0
- webscout/Litlogger/levels.py +13 -0
- webscout/Litlogger/logger.py +92 -0
- webscout/Provider/AI21.py +177 -0
- webscout/Provider/AISEARCH/DeepFind.py +254 -0
- webscout/Provider/AISEARCH/Perplexity.py +333 -0
- webscout/Provider/AISEARCH/README.md +279 -0
- webscout/Provider/AISEARCH/__init__.py +9 -0
- webscout/Provider/AISEARCH/felo_search.py +202 -0
- webscout/Provider/AISEARCH/genspark_search.py +324 -0
- webscout/Provider/AISEARCH/hika_search.py +186 -0
- webscout/Provider/AISEARCH/iask_search.py +410 -0
- webscout/Provider/AISEARCH/monica_search.py +220 -0
- webscout/Provider/AISEARCH/scira_search.py +298 -0
- webscout/Provider/AISEARCH/webpilotai_search.py +255 -0
- webscout/Provider/Aitopia.py +316 -0
- webscout/Provider/AllenAI.py +440 -0
- webscout/Provider/Andi.py +228 -0
- webscout/Provider/Blackboxai.py +791 -0
- webscout/Provider/ChatGPTClone.py +237 -0
- webscout/Provider/ChatGPTGratis.py +194 -0
- webscout/Provider/ChatSandbox.py +342 -0
- webscout/Provider/Cloudflare.py +324 -0
- webscout/Provider/Cohere.py +208 -0
- webscout/Provider/Deepinfra.py +340 -0
- webscout/Provider/ExaAI.py +261 -0
- webscout/Provider/ExaChat.py +358 -0
- webscout/Provider/Flowith.py +217 -0
- webscout/Provider/FreeGemini.py +250 -0
- webscout/Provider/Gemini.py +169 -0
- webscout/Provider/GithubChat.py +369 -0
- webscout/Provider/GizAI.py +295 -0
- webscout/Provider/Glider.py +225 -0
- webscout/Provider/Groq.py +801 -0
- webscout/Provider/HF_space/__init__.py +0 -0
- webscout/Provider/HF_space/qwen_qwen2.py +206 -0
- webscout/Provider/HeckAI.py +375 -0
- webscout/Provider/HuggingFaceChat.py +469 -0
- webscout/Provider/Hunyuan.py +283 -0
- webscout/Provider/Jadve.py +291 -0
- webscout/Provider/Koboldai.py +384 -0
- webscout/Provider/LambdaChat.py +411 -0
- webscout/Provider/Llama3.py +259 -0
- webscout/Provider/MCPCore.py +315 -0
- webscout/Provider/Marcus.py +198 -0
- webscout/Provider/Nemotron.py +218 -0
- webscout/Provider/Netwrck.py +270 -0
- webscout/Provider/OLLAMA.py +396 -0
- webscout/Provider/OPENAI/BLACKBOXAI.py +766 -0
- webscout/Provider/OPENAI/Cloudflare.py +378 -0
- webscout/Provider/OPENAI/FreeGemini.py +283 -0
- webscout/Provider/OPENAI/NEMOTRON.py +232 -0
- webscout/Provider/OPENAI/Qwen3.py +283 -0
- webscout/Provider/OPENAI/README.md +952 -0
- webscout/Provider/OPENAI/TwoAI.py +357 -0
- webscout/Provider/OPENAI/__init__.py +40 -0
- webscout/Provider/OPENAI/ai4chat.py +293 -0
- webscout/Provider/OPENAI/api.py +969 -0
- webscout/Provider/OPENAI/base.py +249 -0
- webscout/Provider/OPENAI/c4ai.py +373 -0
- webscout/Provider/OPENAI/chatgpt.py +556 -0
- webscout/Provider/OPENAI/chatgptclone.py +494 -0
- webscout/Provider/OPENAI/chatsandbox.py +173 -0
- webscout/Provider/OPENAI/copilot.py +242 -0
- webscout/Provider/OPENAI/deepinfra.py +322 -0
- webscout/Provider/OPENAI/e2b.py +1414 -0
- webscout/Provider/OPENAI/exaai.py +417 -0
- webscout/Provider/OPENAI/exachat.py +444 -0
- webscout/Provider/OPENAI/flowith.py +162 -0
- webscout/Provider/OPENAI/freeaichat.py +359 -0
- webscout/Provider/OPENAI/glider.py +326 -0
- webscout/Provider/OPENAI/groq.py +364 -0
- webscout/Provider/OPENAI/heckai.py +308 -0
- webscout/Provider/OPENAI/llmchatco.py +335 -0
- webscout/Provider/OPENAI/mcpcore.py +389 -0
- webscout/Provider/OPENAI/multichat.py +376 -0
- webscout/Provider/OPENAI/netwrck.py +357 -0
- webscout/Provider/OPENAI/oivscode.py +287 -0
- webscout/Provider/OPENAI/opkfc.py +496 -0
- webscout/Provider/OPENAI/pydantic_imports.py +172 -0
- webscout/Provider/OPENAI/scirachat.py +477 -0
- webscout/Provider/OPENAI/sonus.py +304 -0
- webscout/Provider/OPENAI/standardinput.py +433 -0
- webscout/Provider/OPENAI/textpollinations.py +339 -0
- webscout/Provider/OPENAI/toolbaz.py +413 -0
- webscout/Provider/OPENAI/typefully.py +355 -0
- webscout/Provider/OPENAI/typegpt.py +364 -0
- webscout/Provider/OPENAI/uncovrAI.py +463 -0
- webscout/Provider/OPENAI/utils.py +318 -0
- webscout/Provider/OPENAI/venice.py +431 -0
- webscout/Provider/OPENAI/wisecat.py +387 -0
- webscout/Provider/OPENAI/writecream.py +163 -0
- webscout/Provider/OPENAI/x0gpt.py +365 -0
- webscout/Provider/OPENAI/yep.py +382 -0
- webscout/Provider/OpenGPT.py +209 -0
- webscout/Provider/Openai.py +496 -0
- webscout/Provider/PI.py +429 -0
- webscout/Provider/Perplexitylabs.py +415 -0
- webscout/Provider/QwenLM.py +254 -0
- webscout/Provider/Reka.py +214 -0
- webscout/Provider/StandardInput.py +290 -0
- webscout/Provider/TTI/README.md +82 -0
- webscout/Provider/TTI/__init__.py +7 -0
- webscout/Provider/TTI/aiarta.py +365 -0
- webscout/Provider/TTI/artbit.py +0 -0
- webscout/Provider/TTI/base.py +64 -0
- webscout/Provider/TTI/fastflux.py +200 -0
- webscout/Provider/TTI/magicstudio.py +201 -0
- webscout/Provider/TTI/piclumen.py +203 -0
- webscout/Provider/TTI/pixelmuse.py +225 -0
- webscout/Provider/TTI/pollinations.py +221 -0
- webscout/Provider/TTI/utils.py +11 -0
- webscout/Provider/TTS/README.md +192 -0
- webscout/Provider/TTS/__init__.py +10 -0
- webscout/Provider/TTS/base.py +159 -0
- webscout/Provider/TTS/deepgram.py +156 -0
- webscout/Provider/TTS/elevenlabs.py +111 -0
- webscout/Provider/TTS/gesserit.py +128 -0
- webscout/Provider/TTS/murfai.py +113 -0
- webscout/Provider/TTS/openai_fm.py +129 -0
- webscout/Provider/TTS/parler.py +111 -0
- webscout/Provider/TTS/speechma.py +580 -0
- webscout/Provider/TTS/sthir.py +94 -0
- webscout/Provider/TTS/streamElements.py +333 -0
- webscout/Provider/TTS/utils.py +280 -0
- webscout/Provider/TeachAnything.py +229 -0
- webscout/Provider/TextPollinationsAI.py +308 -0
- webscout/Provider/TwoAI.py +475 -0
- webscout/Provider/TypliAI.py +305 -0
- webscout/Provider/UNFINISHED/ChatHub.py +209 -0
- webscout/Provider/UNFINISHED/Youchat.py +330 -0
- webscout/Provider/UNFINISHED/liner_api_request.py +263 -0
- webscout/Provider/UNFINISHED/puterjs.py +635 -0
- webscout/Provider/UNFINISHED/test_lmarena.py +119 -0
- webscout/Provider/Venice.py +258 -0
- webscout/Provider/VercelAI.py +253 -0
- webscout/Provider/WiseCat.py +233 -0
- webscout/Provider/WrDoChat.py +370 -0
- webscout/Provider/Writecream.py +246 -0
- webscout/Provider/WritingMate.py +269 -0
- webscout/Provider/__init__.py +174 -0
- webscout/Provider/ai4chat.py +174 -0
- webscout/Provider/akashgpt.py +335 -0
- webscout/Provider/asksteve.py +220 -0
- webscout/Provider/cerebras.py +290 -0
- webscout/Provider/chatglm.py +215 -0
- webscout/Provider/cleeai.py +213 -0
- webscout/Provider/copilot.py +425 -0
- webscout/Provider/elmo.py +283 -0
- webscout/Provider/freeaichat.py +285 -0
- webscout/Provider/geminiapi.py +208 -0
- webscout/Provider/granite.py +235 -0
- webscout/Provider/hermes.py +266 -0
- webscout/Provider/julius.py +223 -0
- webscout/Provider/koala.py +170 -0
- webscout/Provider/learnfastai.py +325 -0
- webscout/Provider/llama3mitril.py +215 -0
- webscout/Provider/llmchat.py +258 -0
- webscout/Provider/llmchatco.py +306 -0
- webscout/Provider/lmarena.py +198 -0
- webscout/Provider/meta.py +801 -0
- webscout/Provider/multichat.py +364 -0
- webscout/Provider/oivscode.py +309 -0
- webscout/Provider/samurai.py +224 -0
- webscout/Provider/scira_chat.py +299 -0
- webscout/Provider/scnet.py +243 -0
- webscout/Provider/searchchat.py +292 -0
- webscout/Provider/sonus.py +258 -0
- webscout/Provider/talkai.py +194 -0
- webscout/Provider/toolbaz.py +353 -0
- webscout/Provider/turboseek.py +266 -0
- webscout/Provider/typefully.py +202 -0
- webscout/Provider/typegpt.py +289 -0
- webscout/Provider/uncovr.py +368 -0
- webscout/Provider/x0gpt.py +299 -0
- webscout/Provider/yep.py +389 -0
- webscout/__init__.py +4 -2
- webscout/cli.py +3 -28
- webscout/client.py +70 -0
- webscout/conversation.py +35 -35
- webscout/litagent/Readme.md +276 -0
- webscout/litagent/__init__.py +29 -0
- webscout/litagent/agent.py +455 -0
- webscout/litagent/constants.py +60 -0
- webscout/litprinter/__init__.py +59 -0
- webscout/optimizers.py +419 -419
- webscout/scout/README.md +404 -0
- webscout/scout/__init__.py +8 -0
- webscout/scout/core/__init__.py +7 -0
- webscout/scout/core/crawler.py +210 -0
- webscout/scout/core/scout.py +607 -0
- webscout/scout/core/search_result.py +96 -0
- webscout/scout/core/text_analyzer.py +63 -0
- webscout/scout/core/text_utils.py +277 -0
- webscout/scout/core/web_analyzer.py +52 -0
- webscout/scout/element.py +478 -0
- webscout/scout/parsers/__init__.py +69 -0
- webscout/scout/parsers/html5lib_parser.py +172 -0
- webscout/scout/parsers/html_parser.py +236 -0
- webscout/scout/parsers/lxml_parser.py +178 -0
- webscout/scout/utils.py +37 -0
- webscout/swiftcli/Readme.md +323 -0
- webscout/swiftcli/__init__.py +95 -0
- webscout/swiftcli/core/__init__.py +7 -0
- webscout/swiftcli/core/cli.py +297 -0
- webscout/swiftcli/core/context.py +104 -0
- webscout/swiftcli/core/group.py +241 -0
- webscout/swiftcli/decorators/__init__.py +28 -0
- webscout/swiftcli/decorators/command.py +221 -0
- webscout/swiftcli/decorators/options.py +220 -0
- webscout/swiftcli/decorators/output.py +252 -0
- webscout/swiftcli/exceptions.py +21 -0
- webscout/swiftcli/plugins/__init__.py +9 -0
- webscout/swiftcli/plugins/base.py +135 -0
- webscout/swiftcli/plugins/manager.py +269 -0
- webscout/swiftcli/utils/__init__.py +59 -0
- webscout/swiftcli/utils/formatting.py +252 -0
- webscout/swiftcli/utils/parsing.py +267 -0
- webscout/version.py +1 -1
- webscout/webscout_search.py +2 -182
- webscout/webscout_search_async.py +1 -179
- webscout/zeroart/README.md +89 -0
- webscout/zeroart/__init__.py +135 -0
- webscout/zeroart/base.py +66 -0
- webscout/zeroart/effects.py +101 -0
- webscout/zeroart/fonts.py +1239 -0
- {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/METADATA +262 -83
- webscout-8.2.9.dist-info/RECORD +289 -0
- {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/WHEEL +1 -1
- {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/entry_points.txt +1 -0
- webscout-8.2.7.dist-info/RECORD +0 -26
- {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/licenses/LICENSE.md +0 -0
- {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,186 @@
|
|
|
1
|
+
import requests
|
|
2
|
+
import hashlib
|
|
3
|
+
import json
|
|
4
|
+
import random
|
|
5
|
+
import time
|
|
6
|
+
import re
|
|
7
|
+
from typing import Dict, Optional, Generator, Union, Any
|
|
8
|
+
|
|
9
|
+
from webscout.AIbase import AISearch, SearchResponse
|
|
10
|
+
from webscout import exceptions
|
|
11
|
+
from webscout.litagent import LitAgent
|
|
12
|
+
|
|
13
|
+
|
|
14
|
+
class Hika(AISearch):
    """Client for the Hika AI search API.

    Queries are POSTed to ``https://api.hika.fyi/api/kbase/web`` through a
    shared ``requests.Session``.  The answer is read back as ``data: ``-prefixed
    JSON lines, stripped of markup, and handed to the caller either chunk by
    chunk or as one assembled ``SearchResponse``.
    """

    def __init__(
        self,
        timeout: int = 60,
        proxies: Optional[dict] = None,
        language: str = "en",
        # model: str = "deepseek-r1",
    ):
        """Set up the HTTP session and the default request headers.

        Args:
            timeout: Timeout in seconds passed to every request.
            proxies: Optional proxy mapping passed to every request.
            language: Value sent as both ``language`` and ``search_language``
                in the request payload.
        """
        self.session = requests.Session()
        self.base_url = "https://api.hika.fyi/api/"
        self.endpoint = "kbase/web"
        self.timeout = timeout
        self.language = language
        # self.model = model
        self.last_response = {}

        self.headers = {
            "Content-Type": "application/json",
            "Origin": "https://hika.fyi",
            "Referer": "https://hika.fyi/",
            "User-Agent": LitAgent().random(),
        }

        self.session.headers.update(self.headers)
        self.proxies = proxies

    def generate_id(self):
        """Generate the per-request identifier pair.

        Returns:
            dict: ``{"uid": ..., "hashId": ...}`` where ``uid`` is ten random
            characters from ``[0-9a-z]`` followed by the current Unix time in
            hex, and ``hashId`` is the SHA-256 hex digest of ``"#<uid>*"``.
        """
        uid = ''.join(random.choice('0123456789abcdefghijklmnopqrstuvwxyz') for _ in range(10))
        uid += hex(int(time.time()))[2:]
        hash_id = hashlib.sha256(f"#{uid}*".encode()).hexdigest()
        return {"uid": uid, "hashId": hash_id}

    def clean_text(self, text):
        """Strip XML-style tags and the trailing ``[DONE]`` marker from text.

        Args:
            text (str): The text to clean. Falsy input yields ``""``.

        Returns:
            str: The text without tags or a trailing ``[DONE]`` marker.
        """
        if not text:
            return ""

        # Drop a leading "<r>" tag as a literal prefix.  str.lstrip("<r>")
        # would instead strip every leading '<', 'r' and '>' character and
        # eat the first letter of answers such as "return ...".
        if text.startswith("<r>"):
            text = text[len("<r>"):]

        # Remove any remaining XML tags
        text = re.sub(r'<[^>]+>', '', text)

        # Remove [DONE] marker at the end
        text = re.sub(r'\[DONE\]\s*$', '', text)

        return text

    def search(
        self,
        prompt: str,
        stream: bool = False,
        raw: bool = False,
    ) -> Union[SearchResponse, Generator[Union[Dict[str, str], SearchResponse], None, None]]:
        """Search using the Hika API and get AI-generated responses.

        Args:
            prompt: The search query; must be at least 2 characters long.
            stream: If True, return a generator that yields chunks as they
                arrive.
            raw: If True, chunks are plain dicts (``{"text": ...}`` and
                ``{"references": ...}``) instead of ``SearchResponse`` objects.

        Returns:
            * ``stream=False, raw=False``: one ``SearchResponse`` holding the
              complete formatted answer (also stored in ``last_response``).
            * otherwise: a generator of chunks (dicts when ``raw`` is True,
              ``SearchResponse`` objects when it is False).

        Raises:
            exceptions.APIConnectionError: If the prompt is too short, the
                server answers with a non-OK status, or the request fails.
        """
        if not prompt or len(prompt) < 2:
            raise exceptions.APIConnectionError("Search query must be at least 2 characters long")

        # Generate ID for this request
        id_data = self.generate_id()
        uid, hash_id = id_data["uid"], id_data["hashId"]

        # Update headers with request-specific values
        request_headers = {
            **self.headers,
            "x-hika": hash_id,
            "x-uid": uid,
        }

        payload = {
            "keyword": prompt,
            "language": self.language,
            "search_language": self.language,
            "stream": "true",  # Must be string, not boolean
        }

        def for_stream():
            try:
                with self.session.post(
                    f"{self.base_url}{self.endpoint}",
                    json=payload,
                    headers=request_headers,
                    stream=True,
                    timeout=self.timeout,
                    proxies=self.proxies,
                ) as response:
                    if not response.ok:
                        raise exceptions.APIConnectionError(
                            f"Failed to generate response - ({response.status_code}, {response.reason}) - {response.text}"
                        )

                    for line in response.iter_lines(decode_unicode=True):
                        # iter_lines only decodes when the response declares
                        # an encoding; otherwise it hands back bytes.
                        if isinstance(line, bytes):
                            line = line.decode("utf-8", errors="replace")
                        if not line or not line.startswith("data: "):
                            continue
                        try:
                            data = json.loads(line[6:])
                        except json.JSONDecodeError:
                            # Best effort: skip lines that are not valid JSON.
                            continue

                        # Handle chunk and references
                        if "chunk" in data:
                            chunk = data["chunk"]
                            if "[DONE]" in chunk:
                                continue
                            clean_chunk = self.clean_text(chunk)
                            if clean_chunk:
                                if raw:
                                    yield {"text": clean_chunk}
                                else:
                                    yield SearchResponse(clean_chunk)
                        elif "references" in data:
                            # References are only surfaced in raw mode
                            if raw:
                                yield {"references": data["references"]}

            except requests.exceptions.RequestException as e:
                raise exceptions.APIConnectionError(f"Request failed: {e}") from e

        def for_non_stream():
            # Deliberately a plain function (no ``yield``) so the caller gets
            # the SearchResponse itself rather than a generator wrapping it.
            full_response = "".join(str(chunk) for chunk in for_stream())
            cleaned_response = self.format_response(full_response)
            self.last_response = SearchResponse(cleaned_response)
            return self.last_response

        # Raw mode has always produced the individual chunk dicts, streaming
        # or not, so it keeps returning the chunk generator.
        if stream or raw:
            return for_stream()
        return for_non_stream()

    def format_response(self, text: str) -> str:
        """Format the response text for better readability.

        Args:
            text: Assembled answer text.

        Returns:
            str: The text with tags removed, runs of blank lines collapsed to
            a single blank line, and surrounding whitespace stripped.
        """
        if not text:
            return ""

        # First clean any tags or markers
        cleaned_text = self.clean_text(text)

        # Collapse runs of blank / whitespace-only lines into one blank line
        cleaned_text = re.sub(r'\n\s*\n', '\n\n', cleaned_text)

        # Remove leading and trailing whitespace
        cleaned_text = cleaned_text.strip()

        return cleaned_text
|
|
174
|
+
|
|
175
|
+
|
|
176
|
+
if __name__ == "__main__":
    # Interactive smoke test: read one query from stdin and stream the answer.
    from rich import print

    client = Hika()
    try:
        query = input(">>> ")
        for piece in client.search(query, stream=True, raw=False):
            print(piece, end="", flush=True)
    except KeyboardInterrupt:
        print("\nSearch interrupted by user.")
    except Exception as e:
        print(f"\nError: {e}")
|
|
@@ -0,0 +1,410 @@
|
|
|
1
|
+
import aiohttp
|
|
2
|
+
import asyncio
|
|
3
|
+
import lxml.html
|
|
4
|
+
import re
|
|
5
|
+
import urllib.parse
|
|
6
|
+
from markdownify import markdownify as md
|
|
7
|
+
from typing import Dict, Optional, Generator, Union, AsyncIterator, Literal
|
|
8
|
+
|
|
9
|
+
from webscout.AIbase import AISearch, SearchResponse
|
|
10
|
+
from webscout import exceptions
|
|
11
|
+
from webscout.scout import Scout
|
|
12
|
+
|
|
13
|
+
|
|
14
|
+
def cache_find(diff: Union[dict, list]) -> Optional[str]:
    """Locate the first HTML paragraph inside a nested dict/list structure.

    The structure is walked depth-first in iteration order.  The first string
    that contains a ``<p>...</p>`` element is converted with ``md`` and
    returned with surrounding whitespace stripped.

    Args:
        diff (Union[dict, list]): Nested structure to search; for a dict only
            the values are inspected.

    Returns:
        Optional[str]: The converted content, or None when no string matches.
    """
    items = diff.values() if not isinstance(diff, list) else diff
    for item in items:
        if isinstance(item, (list, dict)):
            # Descend first; an empty/None result means "keep looking".
            nested_hit = cache_find(item)
            if nested_hit:
                return nested_hit
            continue
        if isinstance(item, str) and re.search(r"<p>.+?</p>", item):
            return md(item).strip()

    return None
|
|
33
|
+
|
|
34
|
+
|
|
35
|
+
# Values accepted for the ``mode`` argument of IAsk (sent as the ``mode`` query parameter).
ModeType = Literal["question", "academic", "fast", "forums", "wiki", "advanced"]
|
|
36
|
+
# Values accepted for the ``detail_level`` argument of IAsk (sent as ``options[detail_level]``).
DetailLevelType = Literal["concise", "detailed", "comprehensive"]
|
|
37
|
+
|
|
38
|
+
|
|
39
|
+
class IAsk(AISearch):
|
|
40
|
+
"""A class to interact with the IAsk AI search API.
|
|
41
|
+
|
|
42
|
+
IAsk provides a powerful search interface that returns AI-generated responses
|
|
43
|
+
based on web content. It supports both streaming and non-streaming responses,
|
|
44
|
+
as well as different search modes and detail levels.
|
|
45
|
+
|
|
46
|
+
Basic Usage:
|
|
47
|
+
>>> from webscout import IAsk
|
|
48
|
+
>>> ai = IAsk()
|
|
49
|
+
>>> # Non-streaming example
|
|
50
|
+
>>> response = ai.search("What is Python?")
|
|
51
|
+
>>> print(response)
|
|
52
|
+
Python is a high-level programming language...
|
|
53
|
+
|
|
54
|
+
>>> # Streaming example
|
|
55
|
+
>>> for chunk in ai.search("Tell me about AI", stream=True):
|
|
56
|
+
... print(chunk, end="", flush=True)
|
|
57
|
+
Artificial Intelligence is...
|
|
58
|
+
|
|
59
|
+
>>> # With specific mode and detail level
|
|
60
|
+
>>> response = ai.search("Climate change", mode="academic", detail_level="detailed")
|
|
61
|
+
>>> print(response)
|
|
62
|
+
Climate change refers to...
|
|
63
|
+
|
|
64
|
+
Args:
|
|
65
|
+
timeout (int, optional): Request timeout in seconds. Defaults to 30.
|
|
66
|
+
proxies (dict, optional): Proxy configuration for requests. Defaults to None.
|
|
67
|
+
mode (ModeType, optional): Default search mode. Defaults to "question".
|
|
68
|
+
detail_level (DetailLevelType, optional): Default detail level. Defaults to None.
|
|
69
|
+
"""
|
|
70
|
+
|
|
71
|
+
def __init__(
    self,
    timeout: int = 30,
    proxies: Optional[dict] = None,
    mode: ModeType = "question",
    detail_level: Optional[DetailLevelType] = None,
):
    """Store the client configuration; no network traffic happens here.

    Args:
        timeout (int, optional): Request timeout in seconds. Defaults to 30.
        proxies (dict, optional): Proxy configuration for requests; a falsy
            value is stored as an empty dict. Defaults to None.
        mode (ModeType, optional): Search mode used when ``search`` is called
            without one. Defaults to "question".
        detail_level (DetailLevelType, optional): Detail level used when
            ``search`` is called without one. Defaults to None.
    """
    self.timeout = timeout
    self.proxies = proxies if proxies else {}
    self.default_mode, self.default_detail_level = mode, detail_level
    self.api_endpoint = "https://iask.ai/"
    self.last_response = {}
|
|
92
|
+
|
|
93
|
+
def create_url(self, query: str, mode: ModeType = "question", detail_level: Optional[DetailLevelType] = None) -> str:
    """Build the request URL for a query.

    Args:
        query (str): The search query.
        mode (ModeType, optional): Search mode. Defaults to "question".
        detail_level (DetailLevelType, optional): Detail level; omitted from
            the URL when falsy. Defaults to None.

    Returns:
        str: ``self.api_endpoint`` followed by the URL-encoded parameters.

    Example:
        >>> ai = IAsk()
        >>> print(ai.create_url("Climate change", mode="academic", detail_level="detailed"))
        https://iask.ai/?mode=academic&q=Climate+change&options%5Bdetail_level%5D=detailed
    """
    # Ordered pairs keep "mode" first and "q" second in the query string.
    pairs = [("mode", mode), ("q", query)]
    if detail_level:
        # Flattened form of the nested "options" parameter.
        pairs.append(("options[detail_level]", detail_level))

    return f"{self.api_endpoint}?{urllib.parse.urlencode(pairs)}"
|
|
125
|
+
|
|
126
|
+
def format_html(self, html_content: str) -> str:
    """Render an HTML fragment as lightly marked-up plain text.

    Headings become ``**bold**`` lines, paragraphs lose the iAsk attribution
    prefix and footnote markers, list items become ``- `` bullets, and a
    ``div`` with class ``footnotes`` is rendered as an
    "Authoritative Sources" list of link texts and hrefs.

    Args:
        html_content (str): The HTML content to format.

    Returns:
        str: The formatted text.
    """
    heading_tags = ("h1", "h2", "h3")
    list_tags = ("ol", "ul")

    document = Scout(html_content, features='html.parser')
    pieces = []

    for node in document.find_all(['h1', 'h2', 'h3', 'p', 'ol', 'ul', 'div']):
        tag = node.name

        if tag in heading_tags:
            pieces.append(f"\n**{node.get_text().strip()}**\n")
            continue

        if tag == "p":
            paragraph = node.get_text().strip()
            paragraph = re.sub(r"^According to Ask AI & Question AI www\.iAsk\.ai:\s*", "", paragraph).strip()
            # Remove footnote markers
            paragraph = re.sub(r'\[\d+\]\(#fn:\d+ \'see footnote\'\)', '', paragraph)
            pieces.append(paragraph + "\n")
            continue

        if tag in list_tags:
            for item in node.find_all("li"):
                pieces.append("- " + item.get_text().strip() + "\n")
            continue

        if tag == "div" and "footnotes" in node.get("class", []):
            pieces.append("\n**Authoritative Sources**\n")
            for item in node.find_all("li"):
                anchor = item.find("a")
                if anchor:
                    pieces.append(f"- {anchor.get_text().strip()} ({anchor.get('href')})\n")

    return "".join(pieces)
|
|
158
|
+
|
|
159
|
+
def search(
    self,
    prompt: str,
    stream: bool = False,
    raw: bool = False,
    mode: Optional[ModeType] = None,
    detail_level: Optional[DetailLevelType] = None,
) -> Union[SearchResponse, Generator[Union[Dict[str, str], SearchResponse], None, None]]:
    """Run a search synchronously on top of the async implementation.

    A private event loop is created for the call (and installed as the
    current loop) and ``_async_search`` is driven on it.

    Args:
        prompt (str): The search query or prompt to send to the API.
        stream (bool, optional): If True, return a generator that yields
            chunks as they arrive. If False, return the complete result.
            Defaults to False.
        raw (bool, optional): Forwarded to ``_async_search``. Defaults to
            False.
        mode (ModeType, optional): Search mode; falls back to the instance
            default when falsy.
        detail_level (DetailLevelType, optional): Detail level; falls back to
            the instance default when falsy.

    Returns:
        Union[SearchResponse, Generator[Union[Dict[str, str], SearchResponse], None, None]]:
            - If stream=False: whatever ``_async_search`` returns for the
              non-streaming case.
            - If stream=True: a generator of chunks. When it finishes,
              ``last_response`` is set to ``{"text": <all chunk text>}``.

    Note:
        In streaming mode, an exception raised while fetching a chunk is
        printed and ends the stream instead of propagating.

    Examples:
        >>> ai = IAsk()
        >>> print(ai.search("What is Python?"))
        Python is a programming language...

        >>> for chunk in ai.search("Tell me about AI", stream=True):
        ...     print(chunk, end="")
        Artificial Intelligence...
    """
    # Explicit arguments win; otherwise use the defaults from __init__.
    effective_mode = self.default_mode if not mode else mode
    effective_detail = self.default_detail_level if not detail_level else detail_level

    def chunk_text(piece):
        # Text contribution of one chunk, whatever shape it arrived in.
        if isinstance(piece, dict) and 'text' in piece:
            return piece['text']
        if isinstance(piece, SearchResponse):
            return piece.text
        return str(piece)

    def stream_chunks():
        collected = ""
        # One loop per generator; it stays open until the generator ends.
        event_loop = asyncio.new_event_loop()
        asyncio.set_event_loop(event_loop)

        try:
            chunk_source = event_loop.run_until_complete(
                self._async_search(prompt, True, raw, effective_mode, effective_detail)
            )

            running = True
            while running:
                try:
                    piece = event_loop.run_until_complete(chunk_source.__anext__())
                    collected += chunk_text(piece)
                    yield piece
                except StopAsyncIteration:
                    running = False
                except Exception as e:
                    print(f"Error in generator: {e}")
                    running = False
        finally:
            # Record what was streamed so far and release the loop.
            self.last_response = {"text": collected}
            event_loop.close()

    if stream:
        return stream_chunks()

    # Non-streaming: run the coroutine to completion on a throwaway loop.
    event_loop = asyncio.new_event_loop()
    asyncio.set_event_loop(event_loop)
    try:
        return event_loop.run_until_complete(
            self._async_search(prompt, False, raw, effective_mode, effective_detail)
        )
    finally:
        event_loop.close()
|
|
272
|
+
|
|
273
|
+
async def _async_search(
    self,
    prompt: str,
    stream: bool = False,
    raw: bool = False,
    mode: ModeType = "question",
    detail_level: Optional[DetailLevelType] = None,
) -> Union[SearchResponse, AsyncIterator[Union[Dict[str, str], SearchResponse]]]:
    """Internal async implementation of the search method.

    Fetches the search page at ``self.api_endpoint`` to obtain a CSRF token
    and the ``phx-*`` node, then opens the ``live/websocket`` endpoint and
    reads the answer from the JSON frames it sends.

    Args:
        prompt: Query text, sent as the ``q`` request parameter.
        stream: When False, the whole answer is collected and returned at
            once; when True, an async generator of chunks is returned.
        raw: When True, results are ``{"text": ...}`` dicts instead of
            ``SearchResponse`` objects.
        mode: Sent as the ``mode`` request parameter.
        detail_level: Sent as ``options[detail_level]`` when truthy.

    Returns:
        With ``stream=False``: ``SearchResponse(text)``, or ``{"text": text}``
        when ``raw`` is set. With ``stream=True``: an async generator that
        yields one ``SearchResponse`` (or ``{"text": chunk}``) per chunk.

    Raises:
        exceptions.APIConnectionError: If the page request, the HTML
            parsing or the websocket exchange fails.

    Side effects:
        Stores the accumulated text in ``self.last_response`` once the
        answer has been fully consumed.
    """

    async def stream_generator() -> AsyncIterator[str]:
        """Yield answer fragments as plain strings, in arrival order."""
        proxy = self.proxies.get('http') if self.proxies else None

        # Prepare parameters
        params = {"mode": mode, "q": prompt}
        if detail_level:
            params["options[detail_level]"] = detail_level

        async with aiohttp.ClientSession() as session:
            try:
                async with session.get(
                    self.api_endpoint,
                    params=params,
                    proxy=proxy,
                    timeout=self.timeout
                ) as response:
                    if not response.ok:
                        # aiohttp exposes the HTTP status as ``status``;
                        # ``status_code`` does not exist on ClientResponse.
                        raise exceptions.APIConnectionError(
                            f"Failed to generate response - ({response.status}, {response.reason}) - {await response.text()}"
                        )

                    etree = lxml.html.fromstring(await response.text())
                    phx_node = etree.xpath('//*[starts-with(@id, "phx-")]').pop()
                    csrf_token = (
                        etree.xpath('//*[@name="csrf-token"]').pop().get("content")
                    )
                    # Captured here so the join message below does not need
                    # the HTTP response object any more.
                    page_url = str(response.url)

                async with session.ws_connect(
                    f"{self.api_endpoint}live/websocket",
                    params={
                        "_csrf_token": csrf_token,
                        "vsn": "2.0.0",
                    },
                    proxy=proxy,
                    timeout=self.timeout
                ) as wsResponse:
                    # Join message — presumably the Phoenix LiveView channel
                    # join for the page that was just loaded (TODO confirm).
                    await wsResponse.send_json(
                        [
                            None,
                            None,
                            f"lv:{phx_node.get('id')}",
                            "phx_join",
                            {
                                "params": {"_csrf_token": csrf_token},
                                "url": page_url,
                                "session": phx_node.get("data-phx-session"),
                            },
                        ]
                    )
                    while True:
                        json_data = await wsResponse.receive_json()
                        if not json_data:
                            break
                        diff: dict = json_data[4]
                        try:
                            chunk: str = diff["e"][0][1]["data"]
                            # Check if the chunk contains HTML content
                            if re.search(r"<[^>]+>", chunk):
                                piece = self.format_html(chunk)
                            else:
                                piece = chunk.replace("<br/>", "\n")
                        except Exception:
                            # Best effort: a frame without a usable streamed
                            # fragment may carry the whole (cached) answer.
                            # ``Exception`` rather than a bare ``except`` so
                            # GeneratorExit / CancelledError are not
                            # intercepted.
                            cache = cache_find(diff)
                            if cache:
                                if diff.get("response", None):
                                    # Format the cache content if it contains HTML
                                    if re.search(r"<[^>]+>", cache):
                                        yield self.format_html(cache)
                                    else:
                                        yield cache
                                # NOTE(review): the stream ends at the first
                                # frame with cached content, emitted or not —
                                # confirm this nesting against the upstream file.
                                break
                        else:
                            # Yield outside the ``try`` body so closing the
                            # generator is never mistaken for a parse failure.
                            yield piece
            except Exception as e:
                raise exceptions.APIConnectionError(f"Error connecting to IAsk API: {str(e)}") from e

    # For non-streaming, collect all chunks and return a single response
    if not stream:
        buffer = "".join([chunk async for chunk in stream_generator()])
        self.last_response = {"text": buffer}
        return SearchResponse(buffer) if not raw else {"text": buffer}

    # For streaming, create an async generator that yields chunks
    async def process_stream():
        buffer = ""
        async for chunk in stream_generator():
            buffer += chunk
            if raw:
                yield {"text": chunk}
            else:
                yield SearchResponse(chunk)
        self.last_response = {"text": buffer}

    # Return the async generator
    return process_stream()
|
|
378
|
+
|
|
379
|
+
|
|
380
|
+
if __name__ == "__main__":
    from rich import print

    ai = IAsk()

    # Streaming demos, run in order: (banner, prompt, extra keyword arguments
    # passed to ``search`` on top of ``stream=True``).
    streaming_demos = (
        (
            "\n[bold cyan]Example 1: Simple search with default mode[/bold cyan]",
            "What is Python?",
            {},
        ),
        (
            "\n[bold cyan]Example 2: Search with academic mode[/bold cyan]",
            "Quantum computing applications",
            {"mode": "academic"},
        ),
        (
            "\n[bold cyan]Example 3: Search with advanced mode and detailed level[/bold cyan]",
            "Climate change solutions",
            {"mode": "advanced", "detail_level": "detailed"},
        ),
    )

    for banner, question, options in streaming_demos:
        print(banner)
        response = ai.search(question, stream=True, **options)
        for chunk in response:
            print(chunk, end="", flush=True)
        print("\n\n[bold green]Response complete.[/bold green]\n")

    # Example 4: Demonstrating the create_url method
    print("\n[bold cyan]Example 4: Generated URL for browser access[/bold cyan]")
    url = ai.create_url("Helpingai details", mode="question", detail_level="detailed")
    print(f"URL: {url}")
    print("This URL can be used directly in a browser or with other HTTP clients.")
|