webscout 8.2.7__py3-none-any.whl → 8.2.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (281) hide show
  1. webscout/AIauto.py +33 -15
  2. webscout/AIbase.py +96 -37
  3. webscout/AIutel.py +703 -250
  4. webscout/Bard.py +441 -323
  5. webscout/Extra/Act.md +309 -0
  6. webscout/Extra/GitToolkit/__init__.py +10 -0
  7. webscout/Extra/GitToolkit/gitapi/README.md +110 -0
  8. webscout/Extra/GitToolkit/gitapi/__init__.py +12 -0
  9. webscout/Extra/GitToolkit/gitapi/repository.py +195 -0
  10. webscout/Extra/GitToolkit/gitapi/user.py +96 -0
  11. webscout/Extra/GitToolkit/gitapi/utils.py +62 -0
  12. webscout/Extra/YTToolkit/README.md +375 -0
  13. webscout/Extra/YTToolkit/YTdownloader.py +957 -0
  14. webscout/Extra/YTToolkit/__init__.py +3 -0
  15. webscout/Extra/YTToolkit/transcriber.py +476 -0
  16. webscout/Extra/YTToolkit/ytapi/README.md +44 -0
  17. webscout/Extra/YTToolkit/ytapi/__init__.py +6 -0
  18. webscout/Extra/YTToolkit/ytapi/channel.py +307 -0
  19. webscout/Extra/YTToolkit/ytapi/errors.py +13 -0
  20. webscout/Extra/YTToolkit/ytapi/extras.py +118 -0
  21. webscout/Extra/YTToolkit/ytapi/https.py +88 -0
  22. webscout/Extra/YTToolkit/ytapi/patterns.py +61 -0
  23. webscout/Extra/YTToolkit/ytapi/playlist.py +59 -0
  24. webscout/Extra/YTToolkit/ytapi/pool.py +8 -0
  25. webscout/Extra/YTToolkit/ytapi/query.py +40 -0
  26. webscout/Extra/YTToolkit/ytapi/stream.py +63 -0
  27. webscout/Extra/YTToolkit/ytapi/utils.py +62 -0
  28. webscout/Extra/YTToolkit/ytapi/video.py +232 -0
  29. webscout/Extra/__init__.py +7 -0
  30. webscout/Extra/autocoder/__init__.py +9 -0
  31. webscout/Extra/autocoder/autocoder.py +1105 -0
  32. webscout/Extra/autocoder/autocoder_utiles.py +332 -0
  33. webscout/Extra/gguf.md +430 -0
  34. webscout/Extra/gguf.py +684 -0
  35. webscout/Extra/tempmail/README.md +488 -0
  36. webscout/Extra/tempmail/__init__.py +28 -0
  37. webscout/Extra/tempmail/async_utils.py +141 -0
  38. webscout/Extra/tempmail/base.py +161 -0
  39. webscout/Extra/tempmail/cli.py +187 -0
  40. webscout/Extra/tempmail/emailnator.py +84 -0
  41. webscout/Extra/tempmail/mail_tm.py +361 -0
  42. webscout/Extra/tempmail/temp_mail_io.py +292 -0
  43. webscout/Extra/weather.md +281 -0
  44. webscout/Extra/weather.py +194 -0
  45. webscout/Extra/weather_ascii.py +76 -0
  46. webscout/Litlogger/README.md +10 -0
  47. webscout/Litlogger/__init__.py +15 -0
  48. webscout/Litlogger/formats.py +4 -0
  49. webscout/Litlogger/handlers.py +103 -0
  50. webscout/Litlogger/levels.py +13 -0
  51. webscout/Litlogger/logger.py +92 -0
  52. webscout/Provider/AI21.py +177 -0
  53. webscout/Provider/AISEARCH/DeepFind.py +254 -0
  54. webscout/Provider/AISEARCH/Perplexity.py +333 -0
  55. webscout/Provider/AISEARCH/README.md +279 -0
  56. webscout/Provider/AISEARCH/__init__.py +9 -0
  57. webscout/Provider/AISEARCH/felo_search.py +202 -0
  58. webscout/Provider/AISEARCH/genspark_search.py +324 -0
  59. webscout/Provider/AISEARCH/hika_search.py +186 -0
  60. webscout/Provider/AISEARCH/iask_search.py +410 -0
  61. webscout/Provider/AISEARCH/monica_search.py +220 -0
  62. webscout/Provider/AISEARCH/scira_search.py +298 -0
  63. webscout/Provider/AISEARCH/webpilotai_search.py +255 -0
  64. webscout/Provider/Aitopia.py +316 -0
  65. webscout/Provider/AllenAI.py +440 -0
  66. webscout/Provider/Andi.py +228 -0
  67. webscout/Provider/Blackboxai.py +791 -0
  68. webscout/Provider/ChatGPTClone.py +237 -0
  69. webscout/Provider/ChatGPTGratis.py +194 -0
  70. webscout/Provider/ChatSandbox.py +342 -0
  71. webscout/Provider/Cloudflare.py +324 -0
  72. webscout/Provider/Cohere.py +208 -0
  73. webscout/Provider/Deepinfra.py +340 -0
  74. webscout/Provider/ExaAI.py +261 -0
  75. webscout/Provider/ExaChat.py +358 -0
  76. webscout/Provider/Flowith.py +217 -0
  77. webscout/Provider/FreeGemini.py +250 -0
  78. webscout/Provider/Gemini.py +169 -0
  79. webscout/Provider/GithubChat.py +369 -0
  80. webscout/Provider/GizAI.py +295 -0
  81. webscout/Provider/Glider.py +225 -0
  82. webscout/Provider/Groq.py +801 -0
  83. webscout/Provider/HF_space/__init__.py +0 -0
  84. webscout/Provider/HF_space/qwen_qwen2.py +206 -0
  85. webscout/Provider/HeckAI.py +375 -0
  86. webscout/Provider/HuggingFaceChat.py +469 -0
  87. webscout/Provider/Hunyuan.py +283 -0
  88. webscout/Provider/Jadve.py +291 -0
  89. webscout/Provider/Koboldai.py +384 -0
  90. webscout/Provider/LambdaChat.py +411 -0
  91. webscout/Provider/Llama3.py +259 -0
  92. webscout/Provider/MCPCore.py +315 -0
  93. webscout/Provider/Marcus.py +198 -0
  94. webscout/Provider/Nemotron.py +218 -0
  95. webscout/Provider/Netwrck.py +270 -0
  96. webscout/Provider/OLLAMA.py +396 -0
  97. webscout/Provider/OPENAI/BLACKBOXAI.py +766 -0
  98. webscout/Provider/OPENAI/Cloudflare.py +378 -0
  99. webscout/Provider/OPENAI/FreeGemini.py +283 -0
  100. webscout/Provider/OPENAI/NEMOTRON.py +232 -0
  101. webscout/Provider/OPENAI/Qwen3.py +283 -0
  102. webscout/Provider/OPENAI/README.md +952 -0
  103. webscout/Provider/OPENAI/TwoAI.py +357 -0
  104. webscout/Provider/OPENAI/__init__.py +40 -0
  105. webscout/Provider/OPENAI/ai4chat.py +293 -0
  106. webscout/Provider/OPENAI/api.py +969 -0
  107. webscout/Provider/OPENAI/base.py +249 -0
  108. webscout/Provider/OPENAI/c4ai.py +373 -0
  109. webscout/Provider/OPENAI/chatgpt.py +556 -0
  110. webscout/Provider/OPENAI/chatgptclone.py +494 -0
  111. webscout/Provider/OPENAI/chatsandbox.py +173 -0
  112. webscout/Provider/OPENAI/copilot.py +242 -0
  113. webscout/Provider/OPENAI/deepinfra.py +322 -0
  114. webscout/Provider/OPENAI/e2b.py +1414 -0
  115. webscout/Provider/OPENAI/exaai.py +417 -0
  116. webscout/Provider/OPENAI/exachat.py +444 -0
  117. webscout/Provider/OPENAI/flowith.py +162 -0
  118. webscout/Provider/OPENAI/freeaichat.py +359 -0
  119. webscout/Provider/OPENAI/glider.py +326 -0
  120. webscout/Provider/OPENAI/groq.py +364 -0
  121. webscout/Provider/OPENAI/heckai.py +308 -0
  122. webscout/Provider/OPENAI/llmchatco.py +335 -0
  123. webscout/Provider/OPENAI/mcpcore.py +389 -0
  124. webscout/Provider/OPENAI/multichat.py +376 -0
  125. webscout/Provider/OPENAI/netwrck.py +357 -0
  126. webscout/Provider/OPENAI/oivscode.py +287 -0
  127. webscout/Provider/OPENAI/opkfc.py +496 -0
  128. webscout/Provider/OPENAI/pydantic_imports.py +172 -0
  129. webscout/Provider/OPENAI/scirachat.py +477 -0
  130. webscout/Provider/OPENAI/sonus.py +304 -0
  131. webscout/Provider/OPENAI/standardinput.py +433 -0
  132. webscout/Provider/OPENAI/textpollinations.py +339 -0
  133. webscout/Provider/OPENAI/toolbaz.py +413 -0
  134. webscout/Provider/OPENAI/typefully.py +355 -0
  135. webscout/Provider/OPENAI/typegpt.py +364 -0
  136. webscout/Provider/OPENAI/uncovrAI.py +463 -0
  137. webscout/Provider/OPENAI/utils.py +318 -0
  138. webscout/Provider/OPENAI/venice.py +431 -0
  139. webscout/Provider/OPENAI/wisecat.py +387 -0
  140. webscout/Provider/OPENAI/writecream.py +163 -0
  141. webscout/Provider/OPENAI/x0gpt.py +365 -0
  142. webscout/Provider/OPENAI/yep.py +382 -0
  143. webscout/Provider/OpenGPT.py +209 -0
  144. webscout/Provider/Openai.py +496 -0
  145. webscout/Provider/PI.py +429 -0
  146. webscout/Provider/Perplexitylabs.py +415 -0
  147. webscout/Provider/QwenLM.py +254 -0
  148. webscout/Provider/Reka.py +214 -0
  149. webscout/Provider/StandardInput.py +290 -0
  150. webscout/Provider/TTI/README.md +82 -0
  151. webscout/Provider/TTI/__init__.py +7 -0
  152. webscout/Provider/TTI/aiarta.py +365 -0
  153. webscout/Provider/TTI/artbit.py +0 -0
  154. webscout/Provider/TTI/base.py +64 -0
  155. webscout/Provider/TTI/fastflux.py +200 -0
  156. webscout/Provider/TTI/magicstudio.py +201 -0
  157. webscout/Provider/TTI/piclumen.py +203 -0
  158. webscout/Provider/TTI/pixelmuse.py +225 -0
  159. webscout/Provider/TTI/pollinations.py +221 -0
  160. webscout/Provider/TTI/utils.py +11 -0
  161. webscout/Provider/TTS/README.md +192 -0
  162. webscout/Provider/TTS/__init__.py +10 -0
  163. webscout/Provider/TTS/base.py +159 -0
  164. webscout/Provider/TTS/deepgram.py +156 -0
  165. webscout/Provider/TTS/elevenlabs.py +111 -0
  166. webscout/Provider/TTS/gesserit.py +128 -0
  167. webscout/Provider/TTS/murfai.py +113 -0
  168. webscout/Provider/TTS/openai_fm.py +129 -0
  169. webscout/Provider/TTS/parler.py +111 -0
  170. webscout/Provider/TTS/speechma.py +580 -0
  171. webscout/Provider/TTS/sthir.py +94 -0
  172. webscout/Provider/TTS/streamElements.py +333 -0
  173. webscout/Provider/TTS/utils.py +280 -0
  174. webscout/Provider/TeachAnything.py +229 -0
  175. webscout/Provider/TextPollinationsAI.py +308 -0
  176. webscout/Provider/TwoAI.py +475 -0
  177. webscout/Provider/TypliAI.py +305 -0
  178. webscout/Provider/UNFINISHED/ChatHub.py +209 -0
  179. webscout/Provider/UNFINISHED/Youchat.py +330 -0
  180. webscout/Provider/UNFINISHED/liner_api_request.py +263 -0
  181. webscout/Provider/UNFINISHED/puterjs.py +635 -0
  182. webscout/Provider/UNFINISHED/test_lmarena.py +119 -0
  183. webscout/Provider/Venice.py +258 -0
  184. webscout/Provider/VercelAI.py +253 -0
  185. webscout/Provider/WiseCat.py +233 -0
  186. webscout/Provider/WrDoChat.py +370 -0
  187. webscout/Provider/Writecream.py +246 -0
  188. webscout/Provider/WritingMate.py +269 -0
  189. webscout/Provider/__init__.py +174 -0
  190. webscout/Provider/ai4chat.py +174 -0
  191. webscout/Provider/akashgpt.py +335 -0
  192. webscout/Provider/asksteve.py +220 -0
  193. webscout/Provider/cerebras.py +290 -0
  194. webscout/Provider/chatglm.py +215 -0
  195. webscout/Provider/cleeai.py +213 -0
  196. webscout/Provider/copilot.py +425 -0
  197. webscout/Provider/elmo.py +283 -0
  198. webscout/Provider/freeaichat.py +285 -0
  199. webscout/Provider/geminiapi.py +208 -0
  200. webscout/Provider/granite.py +235 -0
  201. webscout/Provider/hermes.py +266 -0
  202. webscout/Provider/julius.py +223 -0
  203. webscout/Provider/koala.py +170 -0
  204. webscout/Provider/learnfastai.py +325 -0
  205. webscout/Provider/llama3mitril.py +215 -0
  206. webscout/Provider/llmchat.py +258 -0
  207. webscout/Provider/llmchatco.py +306 -0
  208. webscout/Provider/lmarena.py +198 -0
  209. webscout/Provider/meta.py +801 -0
  210. webscout/Provider/multichat.py +364 -0
  211. webscout/Provider/oivscode.py +309 -0
  212. webscout/Provider/samurai.py +224 -0
  213. webscout/Provider/scira_chat.py +299 -0
  214. webscout/Provider/scnet.py +243 -0
  215. webscout/Provider/searchchat.py +292 -0
  216. webscout/Provider/sonus.py +258 -0
  217. webscout/Provider/talkai.py +194 -0
  218. webscout/Provider/toolbaz.py +353 -0
  219. webscout/Provider/turboseek.py +266 -0
  220. webscout/Provider/typefully.py +202 -0
  221. webscout/Provider/typegpt.py +289 -0
  222. webscout/Provider/uncovr.py +368 -0
  223. webscout/Provider/x0gpt.py +299 -0
  224. webscout/Provider/yep.py +389 -0
  225. webscout/__init__.py +4 -2
  226. webscout/cli.py +3 -28
  227. webscout/client.py +70 -0
  228. webscout/conversation.py +35 -35
  229. webscout/litagent/Readme.md +276 -0
  230. webscout/litagent/__init__.py +29 -0
  231. webscout/litagent/agent.py +455 -0
  232. webscout/litagent/constants.py +60 -0
  233. webscout/litprinter/__init__.py +59 -0
  234. webscout/optimizers.py +419 -419
  235. webscout/scout/README.md +404 -0
  236. webscout/scout/__init__.py +8 -0
  237. webscout/scout/core/__init__.py +7 -0
  238. webscout/scout/core/crawler.py +210 -0
  239. webscout/scout/core/scout.py +607 -0
  240. webscout/scout/core/search_result.py +96 -0
  241. webscout/scout/core/text_analyzer.py +63 -0
  242. webscout/scout/core/text_utils.py +277 -0
  243. webscout/scout/core/web_analyzer.py +52 -0
  244. webscout/scout/element.py +478 -0
  245. webscout/scout/parsers/__init__.py +69 -0
  246. webscout/scout/parsers/html5lib_parser.py +172 -0
  247. webscout/scout/parsers/html_parser.py +236 -0
  248. webscout/scout/parsers/lxml_parser.py +178 -0
  249. webscout/scout/utils.py +37 -0
  250. webscout/swiftcli/Readme.md +323 -0
  251. webscout/swiftcli/__init__.py +95 -0
  252. webscout/swiftcli/core/__init__.py +7 -0
  253. webscout/swiftcli/core/cli.py +297 -0
  254. webscout/swiftcli/core/context.py +104 -0
  255. webscout/swiftcli/core/group.py +241 -0
  256. webscout/swiftcli/decorators/__init__.py +28 -0
  257. webscout/swiftcli/decorators/command.py +221 -0
  258. webscout/swiftcli/decorators/options.py +220 -0
  259. webscout/swiftcli/decorators/output.py +252 -0
  260. webscout/swiftcli/exceptions.py +21 -0
  261. webscout/swiftcli/plugins/__init__.py +9 -0
  262. webscout/swiftcli/plugins/base.py +135 -0
  263. webscout/swiftcli/plugins/manager.py +269 -0
  264. webscout/swiftcli/utils/__init__.py +59 -0
  265. webscout/swiftcli/utils/formatting.py +252 -0
  266. webscout/swiftcli/utils/parsing.py +267 -0
  267. webscout/version.py +1 -1
  268. webscout/webscout_search.py +2 -182
  269. webscout/webscout_search_async.py +1 -179
  270. webscout/zeroart/README.md +89 -0
  271. webscout/zeroart/__init__.py +135 -0
  272. webscout/zeroart/base.py +66 -0
  273. webscout/zeroart/effects.py +101 -0
  274. webscout/zeroart/fonts.py +1239 -0
  275. {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/METADATA +262 -83
  276. webscout-8.2.9.dist-info/RECORD +289 -0
  277. {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/WHEEL +1 -1
  278. {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/entry_points.txt +1 -0
  279. webscout-8.2.7.dist-info/RECORD +0 -26
  280. {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/licenses/LICENSE.md +0 -0
  281. {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,318 @@
1
+ from typing import List, Dict, Optional, Any, Union, Literal
2
+ from enum import Enum
3
+ import time
4
+ import uuid
5
+ from webscout.Provider.OPENAI.pydantic_imports import (
6
+ BaseModel, Field, field_validator, model_validator, field_serializer, model_serializer,
7
+ StrictStr, StrictInt, StrictFloat, StrictBool
8
+ )
9
+
10
+ # --- OpenAI Response Structure Mimics ---
11
+ # Moved here for reusability across different OpenAI-compatible providers
12
+
13
class ToolCallType(str, Enum):
    """Enumerates the kinds of tool call; members are also plain ``str`` values."""

    # Only function-style tool calls are defined.
    FUNCTION = "function"
16
+
17
class FunctionCall(BaseModel):
    """A function invocation requested by the model: which function, and with what arguments."""

    # Identifier of the function to call (strictly typed: no coercion from other types).
    name: StrictStr
    # Arguments carried as one string; presumably JSON as in the OpenAI API (not validated here).
    arguments: StrictStr
21
+
22
class ToolFunction(BaseModel):
    """The function payload embedded inside a tool call."""

    # Identifier of the function the tool call targets.
    name: StrictStr
    # Arguments carried as one string; presumably JSON as in the OpenAI API (not validated here).
    arguments: StrictStr
26
+
27
class ToolCall(BaseModel):
    """A single tool invocation: its identifier, a type tag, and the function payload."""

    # Identifier of this tool call.
    id: StrictStr
    # Type tag stored as a free-form string; it is not constrained to ToolCallType.
    type: StrictStr
    # The function name/arguments pair being invoked.
    function: ToolFunction
32
+
33
class CompletionUsage(BaseModel):
    """Token accounting attached to a completion response."""

    # Tokens attributed to the prompt.
    prompt_tokens: StrictInt
    # Tokens attributed to the generated completion.
    completion_tokens: StrictInt
    # Reported total; the model does not check that it equals the sum of the two above.
    total_tokens: StrictInt
    # Optional free-form breakdown of the prompt token count.
    prompt_tokens_details: Optional[Dict[str, Any]] = None
39
+
40
class ChoiceDelta(BaseModel):
    """Incremental update carried by one streaming chunk; every field is optional."""

    # Text fragment for this chunk, if any.
    content: Optional[StrictStr] = None
    # Function call attached to this chunk, if any.
    function_call: Optional[FunctionCall] = None
    # Speaker role, if present on this chunk.
    role: Optional[StrictStr] = None
    # Tool calls attached to this chunk, if any.
    tool_calls: Optional[List[ToolCall]] = None
46
+
47
class ChatCompletionMessage(BaseModel):
    """A complete (non-streaming) message returned inside a completion choice."""

    # Speaker role; the only required field.
    role: StrictStr
    # Message text; may be absent.
    content: Optional[StrictStr] = None
    # Function call requested by the message, if any.
    function_call: Optional[FunctionCall] = None
    # Tool calls requested by the message, if any.
    tool_calls: Optional[List[ToolCall]] = None
53
+
54
class Choice(BaseModel):
    """One candidate answer; used by both full responses (`message`) and stream chunks (`delta`)."""

    # Position of this choice in the response's choice list.
    index: StrictInt
    # Full message; left as None when the choice carries a delta instead.
    message: Optional[ChatCompletionMessage] = None
    # Streaming delta; left as None when the choice carries a full message.
    delta: Optional[ChoiceDelta] = None
    # Why generation stopped, when known.
    finish_reason: Optional[StrictStr] = None
    # Optional free-form log-probability data.
    logprobs: Optional[Dict[str, Any]] = None
61
+
62
class ModelData(BaseModel):
    """Description of a single model, shaped like an entry of an OpenAI model listing."""

    # Model identifier; the only required field.
    id: StrictStr
    # Object tag, fixed to "model" by default.
    object: StrictStr = "model"
    # Creation timestamp in whole seconds. A default_factory is used so every
    # instance is stamped when it is built; a plain `int(time.time())` default
    # would be evaluated once at import and shared by all instances.
    created: StrictInt = Field(default_factory=lambda: int(time.time()))
    # Owner label reported for the model.
    owned_by: StrictStr = "webscout"
    # Optional permission entries, kept as free-form dictionaries.
    permission: Optional[List[Dict[str, Any]]] = None
    # Optional root model identifier.
    root: Optional[StrictStr] = None
    # Optional parent model identifier.
    parent: Optional[StrictStr] = None
71
+
72
class ModelList(BaseModel):
    """Container returned when listing models."""

    # The model entries themselves.
    data: List[ModelData]
    # Object tag, fixed to "list" by default.
    object: StrictStr = "list"
76
+
77
+
78
+ # @dataclass
79
+ # class EmbeddingData(BaseModel):
80
+ # """Single embedding data."""
81
+ # embedding: List[float]
82
+ # index: int
83
+ # object: str = "embedding"
84
+
85
+ # @dataclass
86
+ # class EmbeddingResponse(BaseModel):
87
+ # """OpenAI embeddings response."""
88
+ # data: List[EmbeddingData]
89
+ # model: str
90
+ # usage: CompletionUsage
91
+ # object: str = "list"
92
+
93
+ # @dataclass
94
+ # class FineTuningJob(BaseModel):
95
+ # """OpenAI fine-tuning job."""
96
+ # id: str
97
+ # model: str
98
+ # created_at: int
99
+ # status: str
100
+ # training_file: str
101
+ # hyperparameters: Dict[str, Any]
102
+ # object: str = "fine_tuning.job"
103
+ # finished_at: Optional[int] = None
104
+ # validation_file: Optional[str] = None
105
+ # trained_tokens: Optional[int] = None
106
+ # result_files: Optional[List[str]] = None
107
+ # organization_id: Optional[str] = None
108
+
109
+ # @dataclass
110
+ # class FineTuningJobList(BaseModel):
111
+ # """OpenAI fine-tuning job list response."""
112
+ # data: List[FineTuningJob]
113
+ # object: str = "list"
114
+ # has_more: bool = False
115
+
116
+ # @dataclass
117
+ # class File(BaseModel):
118
+ # """OpenAI file."""
119
+ # id: str
120
+ # bytes: int
121
+ # created_at: int
122
+ # filename: str
123
+ # purpose: str
124
+ # object: str = "file"
125
+ # status: str = "uploaded"
126
+ # status_details: Optional[str] = None
127
+
128
+ # @dataclass
129
+ # class FileList(BaseModel):
130
+ # """OpenAI file list response."""
131
+ # data: List[File]
132
+ # object: str = "list"
133
+
134
+ # @dataclass
135
+ # class DeletedObject(BaseModel):
136
+ # """OpenAI deleted object response."""
137
+ # id: str
138
+ # object: str = "deleted_object"
139
+ # deleted: bool = True
140
+
141
+ # @dataclass
142
+ # class ImageData(BaseModel):
143
+ # """OpenAI generated image."""
144
+ # url: Optional[str] = None
145
+ # b64_json: Optional[str] = None
146
+ # revised_prompt: Optional[str] = None
147
+
148
+ # @dataclass
149
+ # class ImageResponse(BaseModel):
150
+ # """OpenAI image generation response."""
151
+ # data: List[ImageData]
152
+ # created: int = int(time.time())
153
+
154
class ChatCompletion(BaseModel):
    """Complete (non-streaming) chat completion response."""

    # Name of the model that produced the response.
    model: StrictStr
    # Candidate answers.
    choices: List[Choice]
    # Response identifier; a fresh "chatcmpl-<uuid4>" is generated per instance.
    id: StrictStr = Field(default_factory=lambda: "chatcmpl-" + str(uuid.uuid4()))
    # Creation time in whole seconds, taken when the instance is built.
    created: StrictInt = Field(default_factory=lambda: int(time.time()))
    # Object tag identifying a full completion.
    object: StrictStr = "chat.completion"
    # Optional backend fingerprint.
    system_fingerprint: Optional[StrictStr] = None
    # Optional token accounting.
    usage: Optional[CompletionUsage] = None
163
+
164
class ChatCompletionChunk(BaseModel):
    """One chunk of a streamed chat completion response."""

    # Name of the model that produced the chunk.
    model: StrictStr
    # Choices carried by this chunk.
    choices: List[Choice]
    # Chunk identifier; a fresh "chatcmpl-<uuid4>" is generated unless one is supplied.
    id: StrictStr = Field(default_factory=lambda: "chatcmpl-" + str(uuid.uuid4()))
    # Creation time in whole seconds, taken when the instance is built.
    created: StrictInt = Field(default_factory=lambda: int(time.time()))
    # Object tag identifying a streaming chunk.
    object: StrictStr = "chat.completion.chunk"
    # Optional backend fingerprint.
    system_fingerprint: Optional[StrictStr] = None
    # Usage data for streaming chunks, kept as a free-form dictionary.
    usage: Optional[Dict[str, Any]] = None
173
+
174
+
175
+ # --- Helper Functions ---
176
+
177
def format_prompt(messages: List[Dict[str, Any]], add_special_tokens: bool = False,
                  do_continue: bool = False, include_system: bool = True) -> str:
    """
    Flatten a chat history into a single "Role: content" transcript.

    Args:
        messages: A list of message dictionaries, each containing 'role' and 'content'.
            Content may be a string, a dict with a 'text' key, a list of such
            parts, or None (treated as empty text).
        add_special_tokens: When False and there is at most one message, that
            message's content is returned bare, without a role prefix or the
            trailing "Assistant:". When True the transcript form is always
            produced. Despite the name, no tokenizer tokens are inserted.
        do_continue: If True, don't add the final "Assistant:" prompt.
        include_system: Whether to include system messages in the formatted
            output. The single-message shortcut does not apply this filter.

    Returns:
        A formatted string containing all messages. An empty message list with
        add_special_tokens=False yields an empty string.
    """
    def to_string(value) -> str:
        # None shows up for messages that carry no text (e.g. tool-call-only
        # turns); it must not be rendered as the literal word "None".
        if value is None:
            return ""
        if isinstance(value, str):
            return value
        if isinstance(value, dict):
            # Only the "text" entry of a part is kept; other parts contribute nothing.
            # Recursing guarantees a str even if "text" holds something else.
            return to_string(value["text"]) if "text" in value else ""
        if isinstance(value, list):
            return "".join(to_string(item) for item in value)
        return str(value)

    # Shortcut: zero or one message and no forced transcript formatting.
    if not add_special_tokens and len(messages) <= 1:
        # Guard the empty list so messages[0] cannot raise IndexError.
        return to_string(messages[0]["content"]) if messages else ""

    # Pair each kept message's role with its text, dropping system messages on request.
    processed_messages = [
        (message["role"], to_string(message["content"]))
        for message in messages
        if include_system or message.get("role") != "system"
    ]

    # One "Role: Content" line per message; messages with blank text are skipped.
    formatted = "\n".join(
        f'{role.capitalize()}: {content}'
        for role, content in processed_messages
        if content.strip()
    )

    # With do_continue the caller wants the transcript without the assistant cue.
    if do_continue:
        return formatted

    return f"{formatted}\nAssistant:"
226
+
227
+
228
def get_system_prompt(messages: List[Dict[str, Any]]) -> str:
    """
    Extract and concatenate all system messages.

    Args:
        messages: A list of message dictionaries. Messages without a 'role'
            are ignored. System content may be a string, a dict with a 'text'
            key, a list of such parts, or None / missing (treated as empty).

    Returns:
        A string containing all system messages concatenated with newlines,
        in their original order. Empty when there are no system messages.
    """
    def _as_text(content) -> str:
        # str.join only accepts strings, so structured or missing content is
        # flattened to text first instead of raising TypeError.
        if content is None:
            return ""
        if isinstance(content, str):
            return content
        if isinstance(content, dict):
            return _as_text(content["text"]) if "text" in content else ""
        if isinstance(content, list):
            return "".join(_as_text(part) for part in content)
        return str(content)

    return "\n".join(
        _as_text(message.get("content"))
        for message in messages
        if message.get("role") == "system"
    )
239
+
240
+
241
def get_last_user_message(messages: List[Dict[str, Any]]) -> str:
    """
    Return the text of the most recent user message.

    Messages are scanned from the end. A user message whose content is neither
    a string, a dict with a 'text' key, nor a list is passed over and the scan
    continues with earlier messages.

    Args:
        messages: A list of message dictionaries with 'role' and 'content'.

    Returns:
        The text of the matching user message, or an empty string when none
        is found.
    """
    for entry in reversed(messages):
        if entry["role"] != "user":
            continue

        body = entry["content"]
        if isinstance(body, str):
            return body

        # A single structured part: use its text directly.
        if isinstance(body, dict) and "text" in body:
            return body["text"]

        # A list of parts: keep bare strings and parts tagged type == "text".
        if isinstance(body, list):
            return "".join([
                piece if isinstance(piece, str) else piece.get("text", "")
                for piece in body
                if isinstance(piece, str)
                or (isinstance(piece, dict) and piece.get("type") == "text")
            ])

    return ""
267
+
268
+
269
+ # --- Token Counter ---
270
+
271
def count_tokens(text_or_messages: Any, model: str = "gpt-4o") -> int:
    """
    Count tokens in a string or a list of messages using tiktoken if available, else fallback to webstoken's WordTokenizer.

    Args:
        text_or_messages: A string or a list of messages. Non-string list
            items are converted with str() before counting, so a message dict
            is counted by its full textual representation.
        model: Model name used to pick the tiktoken encoding. If tiktoken does
            not know the model, the "cl100k_base" encoding is used so the
            count stays a best-effort estimate instead of raising.

    Returns:
        int: Number of tokens. 0 for unsupported input types, for an empty
        list, or when neither tokenizer package is installed.
    """
    # Normalise the input first so both tokenizer backends share one code path.
    if isinstance(text_or_messages, str):
        texts = [text_or_messages]
    elif isinstance(text_or_messages, list):
        texts = [item if isinstance(item, str) else str(item) for item in text_or_messages]
    else:
        return 0

    # Nothing to count: skip loading any tokenizer.
    if not texts:
        return 0

    try:
        import tiktoken
    except ImportError:
        tiktoken = None

    if tiktoken is not None:
        try:
            encoding = tiktoken.encoding_for_model(model)
        except KeyError:
            # Unknown model name (or an older tiktoken release).
            encoding = tiktoken.get_encoding("cl100k_base")
        # disallowed_special=() makes text that merely looks like a special
        # token (e.g. "<|endoftext|>") count as ordinary text rather than
        # raising ValueError.
        return sum(len(encoding.encode(text, disallowed_special=())) for text in texts)

    # Fallback to webstoken's WordTokenizer
    try:
        from webstoken import WordTokenizer
    except ImportError:
        return 0

    tokenizer = WordTokenizer()
    return sum(len(tokenizer.tokenize(text)) for text in texts)