webscout 8.2.2__py3-none-any.whl → 8.2.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of webscout might be problematic. Click here for more details.

Files changed (306) hide show
  1. webscout/AIauto.py +112 -22
  2. webscout/AIbase.py +144 -7
  3. webscout/AIutel.py +249 -131
  4. webscout/Bard.py +579 -206
  5. webscout/DWEBS.py +78 -35
  6. webscout/__init__.py +0 -1
  7. webscout/cli.py +256 -0
  8. webscout/conversation.py +307 -436
  9. webscout/exceptions.py +23 -0
  10. webscout/prompt_manager.py +56 -42
  11. webscout/version.py +1 -1
  12. webscout/webscout_search.py +65 -47
  13. webscout/webscout_search_async.py +81 -126
  14. webscout/yep_search.py +93 -43
  15. {webscout-8.2.2.dist-info → webscout-8.2.7.dist-info}/METADATA +172 -52
  16. webscout-8.2.7.dist-info/RECORD +26 -0
  17. {webscout-8.2.2.dist-info → webscout-8.2.7.dist-info}/WHEEL +1 -1
  18. webscout-8.2.7.dist-info/entry_points.txt +3 -0
  19. webscout-8.2.7.dist-info/top_level.txt +1 -0
  20. inferno/__init__.py +0 -6
  21. inferno/__main__.py +0 -9
  22. inferno/cli.py +0 -6
  23. webscout/Extra/GitToolkit/__init__.py +0 -10
  24. webscout/Extra/GitToolkit/gitapi/__init__.py +0 -12
  25. webscout/Extra/GitToolkit/gitapi/repository.py +0 -195
  26. webscout/Extra/GitToolkit/gitapi/user.py +0 -96
  27. webscout/Extra/GitToolkit/gitapi/utils.py +0 -62
  28. webscout/Extra/YTToolkit/YTdownloader.py +0 -957
  29. webscout/Extra/YTToolkit/__init__.py +0 -3
  30. webscout/Extra/YTToolkit/transcriber.py +0 -476
  31. webscout/Extra/YTToolkit/ytapi/__init__.py +0 -6
  32. webscout/Extra/YTToolkit/ytapi/channel.py +0 -307
  33. webscout/Extra/YTToolkit/ytapi/errors.py +0 -13
  34. webscout/Extra/YTToolkit/ytapi/extras.py +0 -45
  35. webscout/Extra/YTToolkit/ytapi/https.py +0 -88
  36. webscout/Extra/YTToolkit/ytapi/patterns.py +0 -61
  37. webscout/Extra/YTToolkit/ytapi/playlist.py +0 -59
  38. webscout/Extra/YTToolkit/ytapi/pool.py +0 -8
  39. webscout/Extra/YTToolkit/ytapi/query.py +0 -40
  40. webscout/Extra/YTToolkit/ytapi/stream.py +0 -63
  41. webscout/Extra/YTToolkit/ytapi/utils.py +0 -62
  42. webscout/Extra/YTToolkit/ytapi/video.py +0 -232
  43. webscout/Extra/__init__.py +0 -7
  44. webscout/Extra/autocoder/__init__.py +0 -9
  45. webscout/Extra/autocoder/autocoder.py +0 -849
  46. webscout/Extra/autocoder/autocoder_utiles.py +0 -332
  47. webscout/Extra/gguf.py +0 -682
  48. webscout/Extra/tempmail/__init__.py +0 -28
  49. webscout/Extra/tempmail/async_utils.py +0 -141
  50. webscout/Extra/tempmail/base.py +0 -161
  51. webscout/Extra/tempmail/cli.py +0 -187
  52. webscout/Extra/tempmail/emailnator.py +0 -84
  53. webscout/Extra/tempmail/mail_tm.py +0 -361
  54. webscout/Extra/tempmail/temp_mail_io.py +0 -292
  55. webscout/Extra/weather.py +0 -194
  56. webscout/Extra/weather_ascii.py +0 -76
  57. webscout/LLM.py +0 -442
  58. webscout/Litlogger/__init__.py +0 -67
  59. webscout/Litlogger/core/__init__.py +0 -6
  60. webscout/Litlogger/core/level.py +0 -23
  61. webscout/Litlogger/core/logger.py +0 -165
  62. webscout/Litlogger/handlers/__init__.py +0 -12
  63. webscout/Litlogger/handlers/console.py +0 -33
  64. webscout/Litlogger/handlers/file.py +0 -143
  65. webscout/Litlogger/handlers/network.py +0 -173
  66. webscout/Litlogger/styles/__init__.py +0 -7
  67. webscout/Litlogger/styles/colors.py +0 -249
  68. webscout/Litlogger/styles/formats.py +0 -458
  69. webscout/Litlogger/styles/text.py +0 -87
  70. webscout/Litlogger/utils/__init__.py +0 -6
  71. webscout/Litlogger/utils/detectors.py +0 -153
  72. webscout/Litlogger/utils/formatters.py +0 -200
  73. webscout/Local/__init__.py +0 -12
  74. webscout/Local/__main__.py +0 -9
  75. webscout/Local/api.py +0 -576
  76. webscout/Local/cli.py +0 -516
  77. webscout/Local/config.py +0 -75
  78. webscout/Local/llm.py +0 -287
  79. webscout/Local/model_manager.py +0 -253
  80. webscout/Local/server.py +0 -721
  81. webscout/Local/utils.py +0 -93
  82. webscout/Provider/AI21.py +0 -177
  83. webscout/Provider/AISEARCH/DeepFind.py +0 -250
  84. webscout/Provider/AISEARCH/ISou.py +0 -256
  85. webscout/Provider/AISEARCH/Perplexity.py +0 -359
  86. webscout/Provider/AISEARCH/__init__.py +0 -10
  87. webscout/Provider/AISEARCH/felo_search.py +0 -228
  88. webscout/Provider/AISEARCH/genspark_search.py +0 -208
  89. webscout/Provider/AISEARCH/hika_search.py +0 -194
  90. webscout/Provider/AISEARCH/iask_search.py +0 -436
  91. webscout/Provider/AISEARCH/monica_search.py +0 -246
  92. webscout/Provider/AISEARCH/scira_search.py +0 -324
  93. webscout/Provider/AISEARCH/webpilotai_search.py +0 -281
  94. webscout/Provider/Aitopia.py +0 -292
  95. webscout/Provider/AllenAI.py +0 -413
  96. webscout/Provider/Andi.py +0 -228
  97. webscout/Provider/Blackboxai.py +0 -229
  98. webscout/Provider/C4ai.py +0 -432
  99. webscout/Provider/ChatGPTClone.py +0 -226
  100. webscout/Provider/ChatGPTES.py +0 -237
  101. webscout/Provider/ChatGPTGratis.py +0 -194
  102. webscout/Provider/Chatify.py +0 -175
  103. webscout/Provider/Cloudflare.py +0 -273
  104. webscout/Provider/Cohere.py +0 -208
  105. webscout/Provider/DeepSeek.py +0 -196
  106. webscout/Provider/Deepinfra.py +0 -297
  107. webscout/Provider/ElectronHub.py +0 -709
  108. webscout/Provider/ExaAI.py +0 -261
  109. webscout/Provider/ExaChat.py +0 -342
  110. webscout/Provider/Free2GPT.py +0 -241
  111. webscout/Provider/GPTWeb.py +0 -193
  112. webscout/Provider/Gemini.py +0 -169
  113. webscout/Provider/GithubChat.py +0 -367
  114. webscout/Provider/Glider.py +0 -211
  115. webscout/Provider/Groq.py +0 -670
  116. webscout/Provider/HF_space/__init__.py +0 -0
  117. webscout/Provider/HF_space/qwen_qwen2.py +0 -206
  118. webscout/Provider/HeckAI.py +0 -233
  119. webscout/Provider/HuggingFaceChat.py +0 -462
  120. webscout/Provider/Hunyuan.py +0 -272
  121. webscout/Provider/Jadve.py +0 -266
  122. webscout/Provider/Koboldai.py +0 -381
  123. webscout/Provider/LambdaChat.py +0 -392
  124. webscout/Provider/Llama.py +0 -200
  125. webscout/Provider/Llama3.py +0 -204
  126. webscout/Provider/Marcus.py +0 -148
  127. webscout/Provider/Netwrck.py +0 -228
  128. webscout/Provider/OLLAMA.py +0 -396
  129. webscout/Provider/OPENAI/__init__.py +0 -25
  130. webscout/Provider/OPENAI/base.py +0 -46
  131. webscout/Provider/OPENAI/c4ai.py +0 -367
  132. webscout/Provider/OPENAI/chatgpt.py +0 -549
  133. webscout/Provider/OPENAI/chatgptclone.py +0 -460
  134. webscout/Provider/OPENAI/deepinfra.py +0 -272
  135. webscout/Provider/OPENAI/e2b.py +0 -1350
  136. webscout/Provider/OPENAI/exaai.py +0 -404
  137. webscout/Provider/OPENAI/exachat.py +0 -433
  138. webscout/Provider/OPENAI/freeaichat.py +0 -352
  139. webscout/Provider/OPENAI/glider.py +0 -316
  140. webscout/Provider/OPENAI/heckai.py +0 -337
  141. webscout/Provider/OPENAI/llmchatco.py +0 -327
  142. webscout/Provider/OPENAI/netwrck.py +0 -348
  143. webscout/Provider/OPENAI/opkfc.py +0 -488
  144. webscout/Provider/OPENAI/scirachat.py +0 -463
  145. webscout/Provider/OPENAI/sonus.py +0 -294
  146. webscout/Provider/OPENAI/standardinput.py +0 -425
  147. webscout/Provider/OPENAI/textpollinations.py +0 -285
  148. webscout/Provider/OPENAI/toolbaz.py +0 -405
  149. webscout/Provider/OPENAI/typegpt.py +0 -346
  150. webscout/Provider/OPENAI/uncovrAI.py +0 -455
  151. webscout/Provider/OPENAI/utils.py +0 -211
  152. webscout/Provider/OPENAI/venice.py +0 -413
  153. webscout/Provider/OPENAI/wisecat.py +0 -381
  154. webscout/Provider/OPENAI/writecream.py +0 -156
  155. webscout/Provider/OPENAI/x0gpt.py +0 -371
  156. webscout/Provider/OPENAI/yep.py +0 -327
  157. webscout/Provider/OpenGPT.py +0 -199
  158. webscout/Provider/Openai.py +0 -496
  159. webscout/Provider/PI.py +0 -344
  160. webscout/Provider/Perplexitylabs.py +0 -415
  161. webscout/Provider/Phind.py +0 -535
  162. webscout/Provider/PizzaGPT.py +0 -198
  163. webscout/Provider/QwenLM.py +0 -254
  164. webscout/Provider/Reka.py +0 -214
  165. webscout/Provider/StandardInput.py +0 -278
  166. webscout/Provider/TTI/AiForce/__init__.py +0 -22
  167. webscout/Provider/TTI/AiForce/async_aiforce.py +0 -224
  168. webscout/Provider/TTI/AiForce/sync_aiforce.py +0 -245
  169. webscout/Provider/TTI/FreeAIPlayground/__init__.py +0 -9
  170. webscout/Provider/TTI/FreeAIPlayground/async_freeaiplayground.py +0 -181
  171. webscout/Provider/TTI/FreeAIPlayground/sync_freeaiplayground.py +0 -180
  172. webscout/Provider/TTI/ImgSys/__init__.py +0 -23
  173. webscout/Provider/TTI/ImgSys/async_imgsys.py +0 -202
  174. webscout/Provider/TTI/ImgSys/sync_imgsys.py +0 -195
  175. webscout/Provider/TTI/MagicStudio/__init__.py +0 -2
  176. webscout/Provider/TTI/MagicStudio/async_magicstudio.py +0 -111
  177. webscout/Provider/TTI/MagicStudio/sync_magicstudio.py +0 -109
  178. webscout/Provider/TTI/Nexra/__init__.py +0 -22
  179. webscout/Provider/TTI/Nexra/async_nexra.py +0 -286
  180. webscout/Provider/TTI/Nexra/sync_nexra.py +0 -258
  181. webscout/Provider/TTI/PollinationsAI/__init__.py +0 -23
  182. webscout/Provider/TTI/PollinationsAI/async_pollinations.py +0 -311
  183. webscout/Provider/TTI/PollinationsAI/sync_pollinations.py +0 -265
  184. webscout/Provider/TTI/__init__.py +0 -12
  185. webscout/Provider/TTI/aiarta/__init__.py +0 -2
  186. webscout/Provider/TTI/aiarta/async_aiarta.py +0 -482
  187. webscout/Provider/TTI/aiarta/sync_aiarta.py +0 -440
  188. webscout/Provider/TTI/artbit/__init__.py +0 -22
  189. webscout/Provider/TTI/artbit/async_artbit.py +0 -155
  190. webscout/Provider/TTI/artbit/sync_artbit.py +0 -148
  191. webscout/Provider/TTI/fastflux/__init__.py +0 -22
  192. webscout/Provider/TTI/fastflux/async_fastflux.py +0 -261
  193. webscout/Provider/TTI/fastflux/sync_fastflux.py +0 -252
  194. webscout/Provider/TTI/huggingface/__init__.py +0 -22
  195. webscout/Provider/TTI/huggingface/async_huggingface.py +0 -199
  196. webscout/Provider/TTI/huggingface/sync_huggingface.py +0 -195
  197. webscout/Provider/TTI/piclumen/__init__.py +0 -23
  198. webscout/Provider/TTI/piclumen/async_piclumen.py +0 -268
  199. webscout/Provider/TTI/piclumen/sync_piclumen.py +0 -233
  200. webscout/Provider/TTI/pixelmuse/__init__.py +0 -4
  201. webscout/Provider/TTI/pixelmuse/async_pixelmuse.py +0 -249
  202. webscout/Provider/TTI/pixelmuse/sync_pixelmuse.py +0 -182
  203. webscout/Provider/TTI/talkai/__init__.py +0 -4
  204. webscout/Provider/TTI/talkai/async_talkai.py +0 -229
  205. webscout/Provider/TTI/talkai/sync_talkai.py +0 -207
  206. webscout/Provider/TTS/__init__.py +0 -7
  207. webscout/Provider/TTS/deepgram.py +0 -156
  208. webscout/Provider/TTS/elevenlabs.py +0 -111
  209. webscout/Provider/TTS/gesserit.py +0 -127
  210. webscout/Provider/TTS/murfai.py +0 -113
  211. webscout/Provider/TTS/parler.py +0 -111
  212. webscout/Provider/TTS/speechma.py +0 -180
  213. webscout/Provider/TTS/streamElements.py +0 -333
  214. webscout/Provider/TTS/utils.py +0 -280
  215. webscout/Provider/TeachAnything.py +0 -187
  216. webscout/Provider/TextPollinationsAI.py +0 -231
  217. webscout/Provider/TwoAI.py +0 -199
  218. webscout/Provider/Venice.py +0 -219
  219. webscout/Provider/VercelAI.py +0 -234
  220. webscout/Provider/WebSim.py +0 -228
  221. webscout/Provider/WiseCat.py +0 -196
  222. webscout/Provider/Writecream.py +0 -211
  223. webscout/Provider/WritingMate.py +0 -197
  224. webscout/Provider/Youchat.py +0 -330
  225. webscout/Provider/__init__.py +0 -198
  226. webscout/Provider/ai4chat.py +0 -202
  227. webscout/Provider/aimathgpt.py +0 -189
  228. webscout/Provider/akashgpt.py +0 -342
  229. webscout/Provider/askmyai.py +0 -158
  230. webscout/Provider/asksteve.py +0 -203
  231. webscout/Provider/bagoodex.py +0 -145
  232. webscout/Provider/cerebras.py +0 -242
  233. webscout/Provider/chatglm.py +0 -205
  234. webscout/Provider/cleeai.py +0 -213
  235. webscout/Provider/copilot.py +0 -428
  236. webscout/Provider/elmo.py +0 -234
  237. webscout/Provider/freeaichat.py +0 -271
  238. webscout/Provider/gaurish.py +0 -244
  239. webscout/Provider/geminiapi.py +0 -208
  240. webscout/Provider/geminiprorealtime.py +0 -160
  241. webscout/Provider/granite.py +0 -187
  242. webscout/Provider/hermes.py +0 -219
  243. webscout/Provider/julius.py +0 -223
  244. webscout/Provider/koala.py +0 -268
  245. webscout/Provider/labyrinth.py +0 -340
  246. webscout/Provider/learnfastai.py +0 -266
  247. webscout/Provider/lepton.py +0 -194
  248. webscout/Provider/llama3mitril.py +0 -180
  249. webscout/Provider/llamatutor.py +0 -192
  250. webscout/Provider/llmchat.py +0 -213
  251. webscout/Provider/llmchatco.py +0 -311
  252. webscout/Provider/meta.py +0 -794
  253. webscout/Provider/multichat.py +0 -325
  254. webscout/Provider/promptrefine.py +0 -193
  255. webscout/Provider/scira_chat.py +0 -277
  256. webscout/Provider/scnet.py +0 -187
  257. webscout/Provider/searchchat.py +0 -293
  258. webscout/Provider/sonus.py +0 -208
  259. webscout/Provider/talkai.py +0 -194
  260. webscout/Provider/toolbaz.py +0 -320
  261. webscout/Provider/turboseek.py +0 -219
  262. webscout/Provider/tutorai.py +0 -252
  263. webscout/Provider/typefully.py +0 -280
  264. webscout/Provider/typegpt.py +0 -232
  265. webscout/Provider/uncovr.py +0 -312
  266. webscout/Provider/x0gpt.py +0 -256
  267. webscout/Provider/yep.py +0 -376
  268. webscout/litagent/__init__.py +0 -29
  269. webscout/litagent/agent.py +0 -455
  270. webscout/litagent/constants.py +0 -60
  271. webscout/litprinter/__init__.py +0 -59
  272. webscout/scout/__init__.py +0 -8
  273. webscout/scout/core/__init__.py +0 -7
  274. webscout/scout/core/crawler.py +0 -140
  275. webscout/scout/core/scout.py +0 -568
  276. webscout/scout/core/search_result.py +0 -96
  277. webscout/scout/core/text_analyzer.py +0 -63
  278. webscout/scout/core/text_utils.py +0 -277
  279. webscout/scout/core/web_analyzer.py +0 -52
  280. webscout/scout/core.py +0 -881
  281. webscout/scout/element.py +0 -460
  282. webscout/scout/parsers/__init__.py +0 -69
  283. webscout/scout/parsers/html5lib_parser.py +0 -172
  284. webscout/scout/parsers/html_parser.py +0 -236
  285. webscout/scout/parsers/lxml_parser.py +0 -178
  286. webscout/scout/utils.py +0 -37
  287. webscout/swiftcli/__init__.py +0 -809
  288. webscout/zeroart/__init__.py +0 -55
  289. webscout/zeroart/base.py +0 -60
  290. webscout/zeroart/effects.py +0 -99
  291. webscout/zeroart/fonts.py +0 -816
  292. webscout-8.2.2.dist-info/RECORD +0 -309
  293. webscout-8.2.2.dist-info/entry_points.txt +0 -5
  294. webscout-8.2.2.dist-info/top_level.txt +0 -3
  295. webstoken/__init__.py +0 -30
  296. webstoken/classifier.py +0 -189
  297. webstoken/keywords.py +0 -216
  298. webstoken/language.py +0 -128
  299. webstoken/ner.py +0 -164
  300. webstoken/normalizer.py +0 -35
  301. webstoken/processor.py +0 -77
  302. webstoken/sentiment.py +0 -206
  303. webstoken/stemmer.py +0 -73
  304. webstoken/tagger.py +0 -60
  305. webstoken/tokenizer.py +0 -158
  306. {webscout-8.2.2.dist-info → webscout-8.2.7.dist-info/licenses}/LICENSE.md +0 -0
webscout/Local/api.py DELETED
@@ -1,576 +0,0 @@
1
- """
2
- API endpoints for webscout.Local
3
- """
4
-
5
- import time
6
- import json
7
- import logging
8
- from typing import Dict, List, Optional, Union, Any
9
- from datetime import datetime
10
- import base64
11
- from uuid import uuid4
12
-
13
- from fastapi import APIRouter, HTTPException, BackgroundTasks, Depends
14
- from fastapi.responses import StreamingResponse
15
- from pydantic import BaseModel
16
-
17
- from .llm import ModelManager
18
- from .config import Config
19
-
20
- logger = logging.getLogger(__name__)
21
-
22
- # API Models
23
# Request body for POST /api/generate.
# (Documented with comments rather than a class docstring so the generated
# schema description stays exactly as it was.)
class GenerateRequest(BaseModel):
    # Name of the model to load.
    model: str

    # Prompt text; an empty prompt only loads the model and returns.
    prompt: str = ""
    # Forwarded to the completion call as "suffix".
    suffix: Optional[str] = None
    # Base64 strings or data URIs; the endpoint currently uses only the first.
    images: Optional[List[str]] = None
    # Forwarded as "system_prompt" when set.
    system: Optional[str] = None
    # Accepted but not read by the endpoint in this module.
    template: Optional[str] = None
    # Forwarded as "context" when set.
    context: Optional[List[int]] = None

    # When true the reply is newline-delimited JSON chunks.
    stream: bool = True
    # Accepted but not read by the endpoint in this module.
    raw: bool = False
    # Forwarded as "response_format" when set.
    format: Optional[Union[str, Dict[str, Any]]] = None
    # Passed as keyword arguments to load_model; also the source of
    # num_predict / temperature / top_p.
    options: Optional[Dict[str, Any]] = None
    # Duration string such as "5m", "30s", "250ms" or "0".
    keep_alive: Optional[str] = "5m"
36
-
37
# One entry of a chat conversation as sent to POST /api/chat.
class ChatMessage(BaseModel):
    # Speaker role, forwarded unchanged to the model.
    role: str
    # Either plain text or a list of content parts (multimodal form).
    content: Union[str, List[Dict[str, Any]]]

    # NOTE(review): the chat endpoint in this module forwards only role and
    # content; the two fields below are accepted but not passed on.
    images: Optional[List[str]] = None
    tool_calls: Optional[List[Dict[str, Any]]] = None
42
-
43
# Request body for POST /api/chat.
class ChatRequest(BaseModel):
    # Name of the model to load.
    model: str
    # Conversation so far; an empty list only loads the model and returns.
    messages: List[ChatMessage]

    # When true the reply is newline-delimited JSON chunks.
    stream: bool = True
    # Forwarded as "tools" when set.
    tools: Optional[List[Dict[str, Any]]] = None
    # Forwarded as "response_format" when set.
    format: Optional[Union[str, Dict[str, Any]]] = None
    # Passed as keyword arguments to load_model; also the source of
    # temperature / top_p.
    options: Optional[Dict[str, Any]] = None
    # Duration string such as "5m", "30s", "250ms" or "0".
    keep_alive: Optional[str] = "5m"
51
-
52
# Request body for POST /api/embed.
class EmbeddingRequest(BaseModel):
    # Name of the model to load (it is loaded with embedding=True).
    model: str
    # A single text or a list of texts; one embedding is produced per text.
    input: Union[str, List[str]]

    # Accepted but not read by the endpoint in this module.
    truncate: bool = True
    # Extra keyword arguments for load_model.
    options: Optional[Dict[str, Any]] = None
    # Duration string such as "5m", "30s", "250ms" or "0".
    keep_alive: Optional[str] = "5m"
58
-
59
# Request body for POST /api/pull.
class PullModelRequest(BaseModel):
    # Identifier of the model to pull.
    model: str

    # Passed through as the second argument of ModelManager.pull_model.
    insecure: bool = False
    # When true, progress is reported as newline-delimited JSON chunks.
    stream: bool = True
63
-
64
# Request body for DELETE /api/delete.
class DeleteModelRequest(BaseModel):
    # Name of the model to remove.
    model: str
66
-
67
# One model entry in the GET /api/tags listing.
class ModelResponse(BaseModel):
    name: str
    # Copied as-is from the model manager's listing.
    modified_at: str
    size: int

    # Free-form metadata; the listing endpoint fills in format, family,
    # parameter_size and quantization_level.
    details: Optional[Dict[str, Any]] = None
72
-
73
# Envelope returned by GET /api/tags.
class ModelsResponse(BaseModel):
    # Every model reported by the model manager, in listing order.
    models: List[ModelResponse]
75
-
76
# Router that collects every endpoint declared in this module.
router = APIRouter()


# FastAPI dependency: builds a ModelManager from environment-derived config.
# The Config itself is resolved as a nested dependency via Config.from_env().
def get_model_manager(config: Config = Depends(lambda: Config.from_env())):
    manager = ModelManager(config)
    return manager
82
-
83
# Seconds a model stays loaded when the request gives no usable keep_alive.
_DEFAULT_KEEP_ALIVE_SECONDS = 300

# Multipliers for the single-letter duration suffixes accepted in keep_alive.
_KEEP_ALIVE_UNIT_SECONDS = {"s": 1, "m": 60, "h": 3600}


def _parse_keep_alive(keep_alive: Optional[str]) -> Union[int, float]:
    """Convert a keep_alive string ("5m", "30s", "250ms", "2h", "0") to seconds.

    A missing, empty or malformed value yields the 5-minute default. Malformed
    suffixed values such as "xs" used to raise ValueError and surface as an
    HTTP 500, while malformed bare values were silently defaulted; both now
    fall back to the default.
    """
    if not keep_alive:
        return _DEFAULT_KEEP_ALIVE_SECONDS
    try:
        # "ms" has to be tested before the generic "s" suffix.
        if keep_alive.endswith("ms"):
            return int(keep_alive[:-2]) / 1000
        multiplier = _KEEP_ALIVE_UNIT_SECONDS.get(keep_alive[-1])
        if multiplier is not None:
            return int(keep_alive[:-1]) * multiplier
        # No suffix: a bare number of seconds ("0" means unload right away).
        return int(keep_alive)
    except ValueError:
        return _DEFAULT_KEEP_ALIVE_SECONDS


def _schedule_unload(
    background_tasks: BackgroundTasks,
    model_manager: ModelManager,
    model_name: str,
    keep_alive_seconds: Union[int, float],
) -> None:
    """Queue an unload of *model_name* when keep_alive resolved to exactly 0."""
    if keep_alive_seconds == 0:
        background_tasks.add_task(model_manager.unload_model, model_name)


def _done_reason(keep_alive_seconds: Union[int, float]) -> str:
    """Return the done_reason for a load-only request.

    "unload" is reported only when an unload is actually scheduled (value 0);
    previously negative values were reported as "unload" as well.
    """
    return "unload" if keep_alive_seconds == 0 else "load"


def _completion_stats(completion: Dict[str, Any], start_time: float) -> Dict[str, int]:
    """Build the timing/usage fields shared by generate and chat replies.

    total_duration is wall-clock time since *start_time* in nanoseconds; the
    per-phase durations are not measured and are reported as 0.
    """
    total_duration = int((time.time() - start_time) * 1e9)
    usage = completion.get("usage", {})
    return {
        "total_duration": total_duration,
        "load_duration": 0,  # Not tracked separately
        "prompt_eval_count": usage.get("prompt_tokens", 0),
        "prompt_eval_duration": 0,  # Not tracked
        "eval_count": usage.get("completion_tokens", 0),
        "eval_duration": 0,  # Not tracked
    }


# POST /api/generate
#
# Loads request.model (request.options are passed as load keyword arguments)
# and produces a single completion for request.prompt.
#   * Empty prompt: only loads the model and returns a "done" stub.
#   * stream=True: replies with two newline-delimited JSON chunks (an empty
#     placeholder, then the full completion with stats). A failure during
#     generation is logged and reported as a final {"error": ...} chunk.
#   * stream=False: replies with one JSON object.
# Failures before the response starts become HTTP 500.
# The docstring is left untouched because FastAPI publishes it as the
# operation description.
@router.post("/api/generate")
async def generate(
    request: GenerateRequest,
    background_tasks: BackgroundTasks,
    model_manager: ModelManager = Depends(get_model_manager),
):
    """Generate a completion for a given prompt"""
    try:
        keep_alive_seconds = _parse_keep_alive(request.keep_alive)
        options = request.options or {}

        model = model_manager.load_model(request.model, **options)

        # If prompt is empty, just load the model and return
        if not request.prompt:
            _schedule_unload(background_tasks, model_manager, request.model, keep_alive_seconds)
            return {
                "model": request.model,
                "created_at": datetime.now().isoformat(),
                "response": "",
                "done": True,
                "done_reason": _done_reason(keep_alive_seconds),
            }

        # Process images if provided (for now only the first image is used)
        image_data = None
        if request.images:
            image_base64 = request.images[0]
            if image_base64.startswith("data:"):
                # Data URI: keep only the payload after the first comma
                image_base64 = image_base64.split(",", 1)[1]
            image_data = base64.b64decode(image_base64)

        generation_params = {
            "prompt": request.prompt,
            "suffix": request.suffix,
            "max_tokens": options.get("num_predict", 128),
            "temperature": options.get("temperature", 0.8),
            "top_p": options.get("top_p", 0.95),
            "echo": False,
        }

        # Optional parameters are only sent when the caller supplied them
        if request.system:
            generation_params["system_prompt"] = request.system
        if request.format:
            generation_params["response_format"] = request.format
        if image_data:
            generation_params["image_data"] = image_data
        if request.context:
            generation_params["context"] = request.context

        if request.stream:
            async def generate_stream():
                start_time = time.time()

                # Initial (empty) chunk
                yield json.dumps({
                    "model": request.model,
                    "created_at": datetime.now().isoformat(),
                    "response": "",
                    "done": False,
                }) + "\n"

                # This runs after the response has started, so the endpoint's
                # outer try/except cannot see failures; report them in-band.
                try:
                    completion = model.create_completion(**generation_params)
                    stats = _completion_stats(completion, start_time)
                    final_chunk = json.dumps({
                        "model": request.model,
                        "created_at": datetime.now().isoformat(),
                        "response": completion["choices"][0]["text"],
                        "done": True,
                        "context": completion.get("context", []),
                        **stats,
                    }) + "\n"
                except Exception as e:
                    logger.exception("Error while streaming generate")
                    final_chunk = json.dumps({"error": str(e)}) + "\n"

                yield final_chunk

                _schedule_unload(background_tasks, model_manager, request.model, keep_alive_seconds)

            return StreamingResponse(generate_stream(), media_type="application/json")

        # Non-streaming response
        start_time = time.time()
        completion = model.create_completion(**generation_params)
        stats = _completion_stats(completion, start_time)

        _schedule_unload(background_tasks, model_manager, request.model, keep_alive_seconds)

        return {
            "model": request.model,
            "created_at": datetime.now().isoformat(),
            "response": completion["choices"][0]["text"],
            "done": True,
            "context": completion.get("context", []),
            **stats,
        }

    except Exception as e:
        logger.error(f"Error in generate: {str(e)}")
        raise HTTPException(status_code=500, detail=str(e))


# POST /api/chat
#
# Same flow as /api/generate but for a list of chat messages: an empty
# message list only loads the model; otherwise role/content pairs are sent to
# model.create_chat_completion. Streaming replies consist of a placeholder
# chunk followed by the full assistant message (or an {"error": ...} chunk).
# NOTE(review): per-message images and tool_calls are not forwarded, which
# matches the previous behavior.
@router.post("/api/chat")
async def chat(
    request: ChatRequest,
    background_tasks: BackgroundTasks,
    model_manager: ModelManager = Depends(get_model_manager),
):
    """Generate a chat completion"""
    try:
        keep_alive_seconds = _parse_keep_alive(request.keep_alive)
        options = request.options or {}

        model = model_manager.load_model(request.model, **options)

        # If messages is empty, just load the model and return
        if not request.messages:
            _schedule_unload(background_tasks, model_manager, request.model, keep_alive_seconds)
            return {
                "model": request.model,
                "created_at": datetime.now().isoformat(),
                "message": {
                    "role": "assistant",
                    "content": "",
                },
                "done_reason": _done_reason(keep_alive_seconds),
                "done": True,
            }

        # Plain-text and multimodal (list) content are passed through alike
        messages = [
            {"role": msg.role, "content": msg.content}
            for msg in request.messages
        ]

        chat_params = {
            "messages": messages,
            "temperature": options.get("temperature", 0.8),
            "top_p": options.get("top_p", 0.95),
        }
        if request.tools:
            chat_params["tools"] = request.tools
        if request.format:
            chat_params["response_format"] = request.format

        if request.stream:
            async def generate_stream():
                start_time = time.time()

                # Initial (empty) chunk
                yield json.dumps({
                    "model": request.model,
                    "created_at": datetime.now().isoformat(),
                    "message": {
                        "role": "assistant",
                        "content": "",
                    },
                    "done": False,
                }) + "\n"

                # Failures here happen after the response has started, so
                # they are reported as a final chunk instead of an HTTP 500.
                try:
                    completion = model.create_chat_completion(**chat_params)
                    stats = _completion_stats(completion, start_time)
                    final_chunk = json.dumps({
                        "model": request.model,
                        "created_at": datetime.now().isoformat(),
                        "message": completion["choices"][0]["message"],
                        "done": True,
                        "done_reason": "stop",
                        **stats,
                    }) + "\n"
                except Exception as e:
                    logger.exception("Error while streaming chat")
                    final_chunk = json.dumps({"error": str(e)}) + "\n"

                yield final_chunk

                _schedule_unload(background_tasks, model_manager, request.model, keep_alive_seconds)

            return StreamingResponse(generate_stream(), media_type="application/json")

        # Non-streaming response
        start_time = time.time()
        completion = model.create_chat_completion(**chat_params)
        stats = _completion_stats(completion, start_time)

        _schedule_unload(background_tasks, model_manager, request.model, keep_alive_seconds)

        return {
            "model": request.model,
            "created_at": datetime.now().isoformat(),
            "message": completion["choices"][0]["message"],
            "done": True,
            "done_reason": "stop",
            **stats,
        }

    except Exception as e:
        logger.error(f"Error in chat: {str(e)}")
        raise HTTPException(status_code=500, detail=str(e))


# POST /api/embed
#
# Loads request.model with embedding=True and returns one embedding per input
# text (a single string is treated as a one-element list). Any failure
# becomes HTTP 500.
@router.post("/api/embed")
async def embed(
    request: EmbeddingRequest,
    background_tasks: BackgroundTasks,
    model_manager: ModelManager = Depends(get_model_manager),
):
    """Generate embeddings from a model"""
    try:
        keep_alive_seconds = _parse_keep_alive(request.keep_alive)

        # Load the model with embedding=True
        model_options = {**(request.options or {}), "embedding": True}
        model = model_manager.load_model(request.model, **model_options)

        start_time = time.time()

        texts = [request.input] if isinstance(request.input, str) else request.input
        embeddings = [model.create_embedding(text)["embedding"] for text in texts]

        total_duration = int((time.time() - start_time) * 1e9)  # nanoseconds

        _schedule_unload(background_tasks, model_manager, request.model, keep_alive_seconds)

        return {
            "model": request.model,
            "embeddings": embeddings,
            "total_duration": total_duration,
            "load_duration": 0,  # Not tracked separately
            "prompt_eval_count": 0,  # Not tracked
        }

    except Exception as e:
        logger.error(f"Error in embed: {str(e)}")
        raise HTTPException(status_code=500, detail=str(e))
484
-
485
# POST /api/pull
#
# Delegates to ModelManager.pull_model. In streaming mode a "pulling manifest"
# chunk is sent first; once the pull call returns, either an error chunk or
# the remaining status chunks are emitted in order. In non-streaming mode a
# single status object is returned. Exceptions raised before the response
# starts become HTTP 500.
@router.post("/api/pull")
async def pull_model(
    request: PullModelRequest,
    model_manager: ModelManager = Depends(get_model_manager),
):
    """Pull a model from Hugging Face Hub"""
    try:
        if not request.stream:
            # Non-streaming: one status object
            outcome = await model_manager.pull_model(request.model, request.insecure)
            if outcome["status"] == "error":
                return {"status": "error", "error": outcome["message"]}
            return {"status": "success"}

        async def pull_stream():
            yield json.dumps({"status": "pulling manifest"}) + "\n"

            outcome = await model_manager.pull_model(request.model, request.insecure)
            if outcome["status"] == "error":
                yield json.dumps({"status": "error", "error": outcome["message"]}) + "\n"
                return

            # The pull has already finished here; these chunks are emitted
            # back-to-back rather than tracking real progress.
            for stage in (
                "downloading model",
                "verifying sha256 digest",
                "writing manifest",
                "success",
            ):
                yield json.dumps({"status": stage}) + "\n"

        return StreamingResponse(pull_stream(), media_type="application/json")

    except Exception as e:
        logger.error(f"Error in pull_model: {str(e)}")
        raise HTTPException(status_code=500, detail=str(e))
523
-
524
# DELETE /api/delete
#
# Asks the model manager to delete request.model. A falsy result is reported
# as HTTP 404; any other exception becomes HTTP 500, while HTTPExceptions
# pass through untouched.
@router.delete("/api/delete")
async def delete_model(
    request: DeleteModelRequest,
    model_manager: ModelManager = Depends(get_model_manager),
):
    """Delete a model"""
    try:
        removed = model_manager.delete_model(request.model)
    except HTTPException:
        raise
    except Exception as e:
        logger.error(f"Error in delete_model: {str(e)}")
        raise HTTPException(status_code=500, detail=str(e))

    if removed:
        return {"status": "success"}

    raise HTTPException(status_code=404, detail=f"Model '{request.model}' not found")
543
-
544
# GET /api/tags
#
# Wraps every entry returned by ModelManager.list_models() in a ModelResponse.
# The "details" block is filled with fixed placeholder values; nothing is read
# from model metadata. Any failure becomes HTTP 500.
@router.get("/api/tags")
async def list_models(
    model_manager: ModelManager = Depends(get_model_manager),
):
    """List all available models"""
    try:
        entries = [
            ModelResponse(
                name=info["name"],
                modified_at=info["modified_at"],
                size=info["size"],
                details={
                    "format": "gguf",
                    "family": "llama",  # Default, could be improved with model metadata
                    "parameter_size": "Unknown",
                    "quantization_level": "Unknown",
                },
            )
            for info in model_manager.list_models()
        ]
        return ModelsResponse(models=entries)

    except Exception as e:
        logger.error(f"Error in list_models: {str(e)}")
        raise HTTPException(status_code=500, detail=str(e))
572
-
573
# GET /api/version
#
# Reports the hard-coded API version string.
@router.get("/api/version")
async def version():
    """Get the version of webscout.Local"""
    payload = {"version": "0.1.0"}
    return payload