PyPI - webscout - Versions diffs - 2.5__py3-none-any.whl → 2.7__py3-none-any.whl - Mend

webscout-2.5-py3-none-any.whl → webscout-2.7-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (20) [hide / show]

webscout/AIutel.py +20 -20
webscout/Local/_version.py +1 -1
webscout/Local/formats.py +141 -88
webscout/Local/model.py +4 -4
webscout/Local/thread.py +165 -155
webscout/Provider/BasedGPT.py +226 -0
webscout/Provider/Poe.py +208 -0
webscout/Provider/__init__.py +3 -1
webscout/__init__.py +5 -31
webscout/cli.py +39 -3
webscout/version.py +1 -1
webscout/webai.py +16 -0
webscout/webscout_search.py +1018 -40
webscout/webscout_search_async.py +151 -839
{webscout-2.5.dist-info → webscout-2.7.dist-info}/METADATA +56 -21
{webscout-2.5.dist-info → webscout-2.7.dist-info}/RECORD +20 -18
{webscout-2.5.dist-info → webscout-2.7.dist-info}/LICENSE.md +0 -0
{webscout-2.5.dist-info → webscout-2.7.dist-info}/WHEEL +0 -0
{webscout-2.5.dist-info → webscout-2.7.dist-info}/entry_points.txt +0 -0
{webscout-2.5.dist-info → webscout-2.7.dist-info}/top_level.txt +0 -0

webscout/AIutel.py CHANGED Viewed

@@ -26,27 +26,27 @@ default_path = appdir.user_cache_dir
 if not os.path.exists(default_path):
     os.makedirs(default_path)
 webai = [
-    "leo",
-    "openai",
-    "opengpt",
-    "koboldai",
-    "gemini",
-    "phind",
-    "blackboxai",
-    "g4fauto",
-    "perplexity",
-    "groq",
-    "reka",
-    "cohere",
-    "yepchat",
-    "you",
-    "xjai",
-    "thinkany",
-    "berlin4h",
-    "chatgptuk",
-    "auto",
+   "leo",
+   "openai",
+   "opengpt",
+   "koboldai",
+   "gemini",
+   "phind",
+   "blackboxai",
+   "g4fauto",
+   "perplexity",
+   "groq",
+   "reka",
+   "cohere",
+   "yepchat",
+   "you",
+   "xjai",
+   "thinkany",
+   "berlin4h",
+   "chatgptuk",
+   "auto",
+   "poe",
 ]
 gpt4free_providers = [
     provider.__name__ for provider in g4f.Provider.__providers__  # if provider.working
 ]

webscout/Local/_version.py CHANGED Viewed

@@ -1,3 +1,3 @@
 from llama_cpp import __version__ as __llama_cpp_version__
-__version__ = '2.3'
+__version__ = '2.7'

webscout/Local/formats.py CHANGED Viewed

@@ -1,6 +1,38 @@
 from ._version import __version__, __llama_cpp_version__
-from typing import Union
+from typing import Callable, Union, Any
+class AdvancedFormat:
+    def __init__(self, base_dict: dict[str, Union[str, list]]):
+        self._base_dict = base_dict
+        self.overrides = {}
+    def __getitem__(self, key: str) -> Any:
+        if key in self.overrides:
+            return str(self.overrides[key]())
+        else:
+            return self._base_dict[key]
+    def __repr__(self) -> str:
+        # NOTE: This method does not represent overrides
+        return repr(self._base_dict)
+    def keys(self):
+        return self._base_dict.keys()
+    def override(self, key: str, fn: Callable) -> None:
+        self.overrides[key] = fn
+    def wrap(self, prompt: str) -> str:
+        return self['system_prefix'] + \
+               self['system_content'] + \
+               self['system_suffix'] + \
+               self['user_prefix'] + \
+               prompt + \
+               self['user_suffix'] + \
+               self['bot_prefix']
 def wrap(
@@ -8,26 +40,25 @@ def wrap(
     format: dict[str, Union[str, list]]
 ) -> str:
     """Wrap a given string in any prompt format for single-turn completion"""
-    return (
-        format['system_prefix'] +
-        format['system_content'] +
-        format['system_postfix'] +
-        format['user_prefix'] +
-        prompt +
-        format['user_postfix'] +
-        format['bot_prefix']
-    )
+    return format['system_prefix'] + \
+           format['system_content'] + \
+           format['system_suffix'] + \
+           format['user_prefix'] + \
+           prompt + \
+           format['user_suffix'] + \
+           format['bot_prefix']
 blank: dict[str, Union[str, list]] = {
     "system_prefix": "",
     "system_content": "",
-    "system_postfix": "",
+    "system_suffix": "",
     "user_prefix": "",
     "user_content": "",
-    "user_postfix": "",
+    "user_suffix": "",
     "bot_prefix": "",
     "bot_content": "",
-    "bot_postfix": "",
+    "bot_suffix": "",
     "stops": []
 }
@@ -36,13 +67,13 @@ alpaca: dict[str, Union[str, list]] = {
     "system_prefix": "",
     "system_content": "Below is an instruction that describes a task. " + \
     "Write a response that appropriately completes the request.",
-    "system_postfix": "\n\n",
+    "system_suffix": "\n\n",
     "user_prefix": "### Instruction:\n",
     "user_content": "",
-    "user_postfix": "\n\n",
+    "user_suffix": "\n\n",
     "bot_prefix": "### Response:\n",
     "bot_content": "",
-    "bot_postfix": "\n\n",
+    "bot_suffix": "\n\n",
     "stops": ['###', 'Instruction:', '\n\n\n']
 }
@@ -61,13 +92,13 @@ alpaca: dict[str, Union[str, list]] = {
 mistral_instruct: dict[str, Union[str, list]] = {
     "system_prefix": "",
     "system_content": "",
-    "system_postfix": "",
+    "system_suffix": "",
     "user_prefix": " [INST] ",
     "user_content": "",
-    "user_postfix": " [/INST]",
+    "user_suffix": " [/INST]",
     "bot_prefix": "",
     "bot_content": "",
-    "bot_postfix": "",
+    "bot_suffix": "",
     "stops": []
 }
@@ -75,16 +106,16 @@ mistral_instruct: dict[str, Union[str, list]] = {
 mistral_instruct_safe: dict[str, Union[str, list]] = {
     "system_prefix": "",
     "system_content": "",
-    "system_postfix": "",
+    "system_suffix": "",
     "user_prefix": " [INST] Always assist with care, respect, and truth. " + \
     "Respond with utmost utility yet securely. Avoid harmful, unethical, " + \
     "prejudiced, or negative content. Ensure replies promote fairness and " + \
     "positivity. ",
     "user_content": "",
-    "user_postfix": " [/INST]",
+    "user_suffix": " [/INST]",
     "bot_prefix": "",
     "bot_content": "",
-    "bot_postfix": "",
+    "bot_suffix": "",
     "stops": []
 }
@@ -92,13 +123,13 @@ mistral_instruct_safe: dict[str, Union[str, list]] = {
 chatml: dict[str, Union[str, list]] = {
     "system_prefix": "<|im_start|>system\n",
     "system_content": "",
-    "system_postfix": "<|im_end|>\n",
+    "system_suffix": "<|im_end|>\n",
     "user_prefix": "<|im_start|>user\n",
     "user_content": "",
-    "user_postfix": "<|im_end|>\n",
+    "user_suffix": "<|im_end|>\n",
     "bot_prefix": "<|im_start|>assistant\n",
     "bot_content": "",
-    "bot_postfix": "<|im_end|>\n",
+    "bot_suffix": "<|im_end|>\n",
     "stops": ['<|im_start|>']
 }
@@ -107,28 +138,33 @@ chatml: dict[str, Union[str, list]] = {
 llama2chat: dict[str, Union[str, list]] = {
     "system_prefix": "[INST] <<SYS>>\n",
     "system_content": "You are a helpful AI assistant.",
-    "system_postfix": "\n<</SYS>>\n\n",
+    "system_suffix": "\n<</SYS>>\n\n",
     "user_prefix": "",
     "user_content": "",
-    "user_postfix": " [/INST]",
+    "user_suffix": " [/INST]",
     "bot_prefix": " ",
     "bot_content": "",
-    "bot_postfix": " [INST] ",
+    "bot_suffix": " [INST] ",
     "stops": ['[INST]', '[/INST]']
 }
-# https://github.com/ggerganov/llama.cpp/issues/6747#issuecomment-2065013606
-# TODO: better reference
+# https://llama.meta.com/docs/model-cards-and-prompt-formats/meta-llama-3/
+#
+# for llama 3 instruct models, use the following string for `-p` in llama.cpp,
+# along with `-e` to escape newlines correctly
+#
+# '<|start_header_id|>system<|end_header_id|>\n\nYou are a helpful AI assistant called "Llama 3".<|eot_id|>\n<|start_header_id|>user<|end_header_id|>\n\nhi<|eot_id|>\n<|start_header_id|>assistant<|end_header_id|>\n\n'
+#
 llama3: dict[str, Union[str, list]] = {
     "system_prefix": "<|start_header_id|>system<|end_header_id|>\n\n",
     "system_content": 'You are a helpful AI assistant called "Llama 3".',
-    "system_postfix": "<|eot_id|>\n",
+    "system_suffix": "<|eot_id|>\n",
     "user_prefix": "<|start_header_id|>user<|end_header_id|>\n\n",
     "user_content": "",
-    "user_postfix": "<|eot_id|>\n",
+    "user_suffix": "<|eot_id|>\n",
     "bot_prefix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
     "bot_content": "",
-    "bot_postfix": "<|eot_id|>\n",
+    "bot_suffix": "<|eot_id|>\n",
     "stops": [128001, 128009]
 }
@@ -137,13 +173,13 @@ alpaca: dict[str, Union[str, list]] = {
     "system_prefix": "",
     "system_content": "Below is an instruction that describes a task. " + \
     "Write a response that appropriately completes the request.",
-    "system_postfix": "\n\n",
+    "system_suffix": "\n\n",
     "user_prefix": "### Instruction:\n",
     "user_content": "",
-    "user_postfix": "\n\n",
+    "user_suffix": "\n\n",
     "bot_prefix": "### Response:\n",
     "bot_content": "",
-    "bot_postfix": "\n\n",
+    "bot_suffix": "\n\n",
     "stops": ['###', 'Instruction:', '\n\n\n']
 }
@@ -151,13 +187,13 @@ alpaca: dict[str, Union[str, list]] = {
 phi3: dict[str, Union[str, list]] = {
     "system_prefix": "",
     "system_content": "", # does not officially support system prompt
-    "system_postfix": "",
+    "system_suffix": "",
     "user_prefix": "<|user|>\n",
     "user_content": "",
-    "user_postfix": "<|end|>\n",
+    "user_suffix": "<|end|>\n",
     "bot_prefix": "<|assistant|>\n",
     "bot_content": "",
-    "bot_postfix": "<|end|>\n",
+    "bot_suffix": "<|end|>\n",
     "stops": []
 }
@@ -167,13 +203,13 @@ phi3: dict[str, Union[str, list]] = {
 vicuna_lmsys: dict[str, Union[str, list]] = {
     "system_prefix": "",
     "system_content": "",
-    "system_postfix": " ",
+    "system_suffix": " ",
     "user_prefix": "USER: ",
     "user_content": "",
-    "user_postfix": " ",
+    "user_suffix": " ",
     "bot_prefix": "ASSISTANT: ",
     "bot_content": "",
-    "bot_postfix": " ",
+    "bot_suffix": " ",
     "stops": ['USER:']
 }
@@ -184,29 +220,46 @@ vicuna_common: dict[str, Union[str, list]] = {
     "system_content": "A chat between a curious user and an artificial " + \
     "intelligence assistant. The assistant gives helpful, detailed, " + \
     "and polite answers to the user's questions.",
-    "system_postfix": "\n\n",
+    "system_suffix": "\n\n",
     "user_prefix": "USER: ",
     "user_content": "",
-    "user_postfix": "\n",
+    "user_suffix": "\n",
     "bot_prefix": "ASSISTANT: ",
     "bot_content": "",
-    "bot_postfix": "\n",
+    "bot_suffix": "\n",
     "stops": ['USER:', 'ASSISTANT:']
 }
+# an unofficial format that is easily "picked up" by most models
+# change the tag attributes to suit your use case
+# note the lack of newlines - they are not necessary, and might
+# actually make it harder for the model to follow along
+markup = {
+    "system_prefix": '<message from="system">',
+    "system_content": '',
+    "system_suffix": '</message>',
+    "user_prefix": '<message from="user">',
+    "user_content": '',
+    "user_suffix": '</message>',
+    "bot_prefix": '<message from="bot">',
+    "bot_content": '',
+    "bot_suffix": '</message>',
+    "stops": ['</message>']
+}
 # https://huggingface.co/timdettmers/guanaco-65b
 guanaco: dict[str, Union[str, list]] = {
     "system_prefix": "",
     "system_content": "A chat between a curious human and an artificial " + \
     "intelligence assistant. The assistant gives helpful, detailed, " + \
     "and polite answers to the user's questions.",
-    "system_postfix": "\n",
+    "system_suffix": "\n",
     "user_prefix": "### Human: ",
     "user_content": "",
-    "user_postfix": " ",
+    "user_suffix": " ",
     "bot_prefix": "### Assistant:",
     "bot_content": "",
-    "bot_postfix": " ",
+    "bot_suffix": " ",
     "stops": ['###', 'Human:']
 }
@@ -215,13 +268,13 @@ orca_mini: dict[str, Union[str, list]] = {
     "system_prefix": "### System:\n",
     "system_content": "You are an AI assistant that follows instruction " + \
     "extremely well. Help as much as you can.",
-    "system_postfix": "\n\n",
+    "system_suffix": "\n\n",
     "user_prefix": "### User:\n",
     "user_content": "",
-    "user_postfix": "\n\n",
+    "user_suffix": "\n\n",
     "bot_prefix": "### Assistant:\n",
     "bot_content": "",
-    "bot_postfix": "\n\n",
+    "bot_suffix": "\n\n",
     "stops": ['###', 'User:']
 }
@@ -229,13 +282,13 @@ orca_mini: dict[str, Union[str, list]] = {
 zephyr: dict[str, Union[str, list]] = {
     "system_prefix": "<|system|>\n",
     "system_content": "You are a friendly chatbot.",
-    "system_postfix": "</s>\n",
+    "system_suffix": "</s>\n",
     "user_prefix": "<|user|>\n",
     "user_content": "",
-    "user_postfix": "</s>\n",
+    "user_suffix": "</s>\n",
     "bot_prefix": "<|assistant|>\n",
     "bot_content": "",
-    "bot_postfix": "\n",
+    "bot_suffix": "\n",
     "stops": ['<|user|>']
 }
@@ -243,13 +296,13 @@ zephyr: dict[str, Union[str, list]] = {
 openchat: dict[str, Union[str, list]] = {
     "system_prefix": "",
     "system_content": "",
-    "system_postfix": "",
+    "system_suffix": "",
     "user_prefix": "GPT4 Correct User: ",
     "user_content": "",
-    "user_postfix": "<|end_of_turn|>",
+    "user_suffix": "<|end_of_turn|>",
     "bot_prefix": "GPT4 Correct Assistant:",
     "bot_content": "",
-    "bot_postfix": "<|end_of_turn|>",
+    "bot_suffix": "<|end_of_turn|>",
     "stops": ['<|end_of_turn|>']
 }
@@ -260,13 +313,13 @@ synthia: dict[str, Union[str, list]] = {
     "system_content": "Elaborate on the topic using a Tree of Thoughts and " + \
     "backtrack when necessary to construct a clear, cohesive Chain of " + \
     "Thought reasoning. Always answer without hesitation.",
-    "system_postfix": "\n",
+    "system_suffix": "\n",
     "user_prefix": "USER: ",
     "user_content": "",
-    "user_postfix": "\n",
+    "user_suffix": "\n",
     "bot_prefix": "ASSISTANT: ",
     "bot_content": "",
-    "bot_postfix": "\n",
+    "bot_suffix": "\n",
     "stops": ['USER:', 'ASSISTANT:', 'SYSTEM:', '\n\n\n']
 }
@@ -281,13 +334,13 @@ neural_chat: dict[str, Union[str, list]] = {
         "to do anything that could be considered harmful to the user.\n" + \
         "- You are more than just an information source, you are also " + \
         "able to write poetry, short stories, and make jokes.",
-    "system_postfix": "</s>\n\n",
+    "system_suffix": "</s>\n\n",
     "user_prefix": "### User:\n",
     "user_content": "",
-    "user_postfix": "</s>\n\n",
+    "user_suffix": "</s>\n\n",
     "bot_prefix": "### Assistant:\n",
     "bot_content": "",
-    "bot_postfix": "</s>\n\n",
+    "bot_suffix": "</s>\n\n",
     "stops": ['###']
 }
@@ -296,13 +349,13 @@ chatml_alpaca: dict[str, Union[str, list]] = {
     "system_prefix": "<|im_start|>system\n",
     "system_content": "Below is an instruction that describes a task. Write " + \
     "a response that appropriately completes the request.",
-    "system_postfix": "<|im_end|>\n",
+    "system_suffix": "<|im_end|>\n",
     "user_prefix": "<|im_start|>instruction\n",
     "user_content": "",
-    "user_postfix": "<|im_end|>\n",
+    "user_suffix": "<|im_end|>\n",
     "bot_prefix": "<|im_start|>response\n",
     "bot_content": "",
-    "bot_postfix": "<|im_end|>\n",
+    "bot_suffix": "<|im_end|>\n",
     "stops": ['<|im_end|>', '<|im_start|>']
 }
@@ -312,13 +365,13 @@ autocorrect: dict[str, Union[str, list]] = {
     "system_content": "Below is a word or phrase that might be misspelled. " + \
     "Output the corrected word or phrase without " + \
     "changing the style or capitalization.",
-    "system_postfix": "<|im_end|>\n",
+    "system_suffix": "<|im_end|>\n",
     "user_prefix": "<|im_start|>input\n",
     "user_content": "",
-    "user_postfix": "<|im_end|>\n",
+    "user_suffix": "<|im_end|>\n",
     "bot_prefix": "<|im_start|>output\n",
     "bot_content": "",
-    "bot_postfix": "<|im_end|>\n",
+    "bot_suffix": "<|im_end|>\n",
     "stops": ['<|im_end|>', '<|im_start|>']
 }
@@ -327,13 +380,13 @@ autocorrect: dict[str, Union[str, list]] = {
 bagel: dict[str, Union[str, list]] = {
     "system_prefix": "system\n",
     "system_content": "",
-    "system_postfix": "\n",
+    "system_suffix": "\n",
     "user_prefix": "user\n",
     "user_content": "",
-    "user_postfix": "\n",
+    "user_suffix": "\n",
     "bot_prefix": "assistant\n",
     "bot_content": "",
-    "bot_postfix": "\n",
+    "bot_suffix": "\n",
     "stops": ['user\n', 'assistant\n', 'system\n']
 }
@@ -341,13 +394,13 @@ bagel: dict[str, Union[str, list]] = {
 solar_instruct: dict[str, Union[str, list]] = {
     "system_prefix": "",
     "system_content": "",
-    "system_postfix": "",
+    "system_suffix": "",
     "user_prefix": "### User:\n",
     "user_content": "",
-    "user_postfix": "\n\n",
+    "user_suffix": "\n\n",
     "bot_prefix": "### Assistant:\n",
     "bot_content": "",
-    "bot_postfix": "\n\n",
+    "bot_suffix": "\n\n",
     "stops": ['### User:', '###', '### Assistant:']
 }
@@ -356,13 +409,13 @@ noromaid: dict[str, Union[str, list]] = {
     "system_prefix": "",
     "system_content": "Below is an instruction that describes a task. " + \
     "Write a response that appropriately completes the request.",
-    "system_postfix": "\n\n",
+    "system_suffix": "\n\n",
     "user_prefix": "### Instruction:\nBob: ",
     "user_content": "",
-    "user_postfix": "\n\n",
+    "user_suffix": "\n\n",
     "bot_prefix": "### Response:\nAlice:",
     "bot_content": "",
-    "bot_postfix": "\n\n",
+    "bot_suffix": "\n\n",
     "stops": ['###', 'Instruction:', '\n\n\n']
 }
@@ -370,13 +423,13 @@ noromaid: dict[str, Union[str, list]] = {
 nschatml: dict[str, Union[str, list]] = {
     "system_prefix": "<|im_start|>\n",
     "system_content": "",
-    "system_postfix": "<|im_end|>\n",
+    "system_suffix": "<|im_end|>\n",
     "user_prefix": "<|im_user|>\n",
     "user_content": "",
-    "user_postfix": "<|im_end|>\n",
+    "user_suffix": "<|im_end|>\n",
     "bot_prefix": "<|im_bot|>\n",
     "bot_content": "",
-    "bot_postfix": "<|im_end|>\n",
+    "bot_suffix": "<|im_end|>\n",
     "stops": []
 }
@@ -384,13 +437,13 @@ nschatml: dict[str, Union[str, list]] = {
 natural: dict[str, Union[str, list]] = {
     "system_prefix": "<<SYSTEM>> ",
     "system_content": "",
-    "system_postfix": "\n\n",
+    "system_suffix": "\n\n",
     "user_prefix": "<<USER>> ",
     "user_content": "",
-    "user_postfix": "\n\n",
+    "user_suffix": "\n\n",
     "bot_prefix": "<<ASSISTANT>>",
     "bot_content": "",
-    "bot_postfix": "\n\n",
+    "bot_suffix": "\n\n",
     "stops": ['\n\nNote:', '<<SYSTEM>>', '<<USER>>', '<<ASSISTANT>>', '\n\n<<']
 }
@@ -398,13 +451,13 @@ natural: dict[str, Union[str, list]] = {
 command: dict[str, Union[str, list]] = {
     "system_prefix": "<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|>",
     "system_content": "",
-    "system_postfix": "<|END_OF_TURN_TOKEN|>",
+    "system_suffix": "<|END_OF_TURN_TOKEN|>",
     "user_prefix": "<|START_OF_TURN_TOKEN|><|USER_TOKEN|>",
     "user_content": "",
-    "user_postfix": "<|END_OF_TURN_TOKEN|>",
+    "user_suffix": "<|END_OF_TURN_TOKEN|>",
     "bot_prefix": "<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>",
     "bot_content": "",
-    "bot_postfix": "<|END_OF_TURN_TOKEN|>",
+    "bot_suffix": "<|END_OF_TURN_TOKEN|>",
     "stops": []
 }
@@ -479,4 +532,4 @@ alpaca_strict['stops'] = [
     '\n\n\n',
     '### Instruction:',
     '### Response:'
-]
+]

webscout/Local/model.py CHANGED Viewed

@@ -612,7 +612,7 @@ class Model:
         self,
         prompt: str,
         k: int
-    ) -> list[tuple[str, np.float64]]:
+    ) -> list[tuple[str, np.floating]]:
         """
         Given prompt `str` and k `int`, return a sorted list of the
         top k candidates for most likely next token, along with their
@@ -639,11 +639,11 @@ class Model:
         # must normalize over all tokens in vocab, not just top k
         if self.verbose:
             print_verbose(f'calculating softmax over {len(scores)} values')
-        normalized_scores: list[np.float64] = list(softmax(scores))
+        normalized_scores: list[np.floating] = list(softmax(scores))
         # construct the final list
         i = 0
-        token_probs_list: list[tuple[str, np.float64]] = []
+        token_probs_list: list[tuple[str, np.floating]] = []
         for tok_str in self.tokens:
             token_probs_list.append((tok_str, normalized_scores[i]))
             i += 1
@@ -666,7 +666,7 @@ class Model:
         for _tuple in self.candidates(prompt, k):
             print(
-                f"token '{_tuple[0]}' has probability {_tuple[1]}",
+                f"token {repr(_tuple[0])} has probability {_tuple[1]}",
                 file=file,
                 flush=flush
             )

webscout 2.5__py3-none-any.whl → 2.7__py3-none-any.whl

webscout-2.5-py3-none-any.whl → webscout-2.7-py3-none-any.whl