PyPI - webscout - Versions diffs - 6.3__py3-none-any.whl → 6.5__py3-none-any.whl - Mend

webscout 6.3__py3-none-any.whl → 6.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of webscout might be problematic. Click here for more details.

Files changed (131) hide show

webscout/AIauto.py +191 -176
webscout/AIbase.py +0 -197
webscout/AIutel.py +441 -1130
webscout/DWEBS.py +189 -35
webscout/{YTdownloader.py → Extra/YTToolkit/YTdownloader.py} +990 -1103
webscout/Extra/YTToolkit/__init__.py +3 -0
webscout/{transcriber.py → Extra/YTToolkit/transcriber.py} +479 -551
webscout/Extra/YTToolkit/ytapi/__init__.py +6 -0
webscout/Extra/YTToolkit/ytapi/channel.py +307 -0
webscout/Extra/YTToolkit/ytapi/errors.py +13 -0
webscout/Extra/YTToolkit/ytapi/extras.py +45 -0
webscout/Extra/YTToolkit/ytapi/https.py +88 -0
webscout/Extra/YTToolkit/ytapi/patterns.py +61 -0
webscout/Extra/YTToolkit/ytapi/playlist.py +59 -0
webscout/Extra/YTToolkit/ytapi/pool.py +8 -0
webscout/Extra/YTToolkit/ytapi/query.py +37 -0
webscout/Extra/YTToolkit/ytapi/stream.py +60 -0
webscout/Extra/YTToolkit/ytapi/utils.py +62 -0
webscout/Extra/YTToolkit/ytapi/video.py +102 -0
webscout/Extra/__init__.py +3 -1
webscout/Extra/autocoder/__init__.py +9 -0
webscout/Extra/autocoder/autocoder_utiles.py +121 -0
webscout/Extra/autocoder/rawdog.py +680 -0
webscout/Extra/autollama.py +246 -195
webscout/Extra/gguf.py +81 -56
webscout/Extra/markdownlite/__init__.py +862 -0
webscout/Extra/weather_ascii.py +2 -2
webscout/LLM.py +206 -43
webscout/Litlogger/__init__.py +681 -0
webscout/Provider/DARKAI.py +1 -1
webscout/Provider/EDITEE.py +1 -1
webscout/Provider/NinjaChat.py +1 -1
webscout/Provider/PI.py +120 -35
webscout/Provider/Perplexity.py +590 -598
webscout/Provider/Reka.py +0 -1
webscout/Provider/RoboCoders.py +206 -0
webscout/Provider/TTI/AiForce/__init__.py +22 -0
webscout/Provider/TTI/AiForce/async_aiforce.py +257 -0
webscout/Provider/TTI/AiForce/sync_aiforce.py +242 -0
webscout/Provider/TTI/Nexra/__init__.py +22 -0
webscout/Provider/TTI/Nexra/async_nexra.py +286 -0
webscout/Provider/TTI/Nexra/sync_nexra.py +258 -0
webscout/Provider/TTI/PollinationsAI/__init__.py +23 -0
webscout/Provider/TTI/PollinationsAI/async_pollinations.py +330 -0
webscout/Provider/TTI/PollinationsAI/sync_pollinations.py +285 -0
webscout/Provider/TTI/__init__.py +2 -4
webscout/Provider/TTI/artbit/__init__.py +22 -0
webscout/Provider/TTI/artbit/async_artbit.py +184 -0
webscout/Provider/TTI/artbit/sync_artbit.py +176 -0
webscout/Provider/TTI/blackbox/__init__.py +4 -0
webscout/Provider/TTI/blackbox/async_blackbox.py +212 -0
webscout/Provider/TTI/{blackboximage.py → blackbox/sync_blackbox.py} +199 -153
webscout/Provider/TTI/deepinfra/__init__.py +4 -0
webscout/Provider/TTI/deepinfra/async_deepinfra.py +227 -0
webscout/Provider/TTI/deepinfra/sync_deepinfra.py +199 -0
webscout/Provider/TTI/huggingface/__init__.py +22 -0
webscout/Provider/TTI/huggingface/async_huggingface.py +199 -0
webscout/Provider/TTI/huggingface/sync_huggingface.py +195 -0
webscout/Provider/TTI/imgninza/__init__.py +4 -0
webscout/Provider/TTI/imgninza/async_ninza.py +214 -0
webscout/Provider/TTI/{imgninza.py → imgninza/sync_ninza.py} +209 -136
webscout/Provider/TTI/talkai/__init__.py +4 -0
webscout/Provider/TTI/talkai/async_talkai.py +229 -0
webscout/Provider/TTI/talkai/sync_talkai.py +207 -0
webscout/Provider/TTS/__init__.py +5 -1
webscout/Provider/TTS/deepgram.py +183 -0
webscout/Provider/TTS/elevenlabs.py +137 -0
webscout/Provider/TTS/gesserit.py +151 -0
webscout/Provider/TTS/murfai.py +139 -0
webscout/Provider/TTS/parler.py +134 -107
webscout/Provider/TTS/streamElements.py +360 -275
webscout/Provider/TTS/utils.py +280 -0
webscout/Provider/TTS/voicepod.py +116 -116
webscout/Provider/__init__.py +8 -1
webscout/Provider/askmyai.py +2 -2
webscout/Provider/cerebras.py +227 -219
webscout/Provider/llama3mitril.py +0 -1
webscout/Provider/meta.py +794 -779
webscout/Provider/mhystical.py +176 -0
webscout/Provider/perplexitylabs.py +265 -0
webscout/Provider/twitterclone.py +251 -245
webscout/Provider/typegpt.py +358 -0
webscout/__init__.py +9 -8
webscout/__main__.py +5 -5
webscout/cli.py +252 -280
webscout/conversation.py +227 -0
webscout/exceptions.py +161 -29
webscout/litagent/__init__.py +172 -0
webscout/litprinter/__init__.py +832 -0
webscout/optimizers.py +270 -0
webscout/prompt_manager.py +279 -0
webscout/scout/__init__.py +11 -0
webscout/scout/core.py +884 -0
webscout/scout/element.py +459 -0
webscout/scout/parsers/__init__.py +69 -0
webscout/scout/parsers/html5lib_parser.py +172 -0
webscout/scout/parsers/html_parser.py +236 -0
webscout/scout/parsers/lxml_parser.py +178 -0
webscout/scout/utils.py +38 -0
webscout/swiftcli/__init__.py +810 -0
webscout/update_checker.py +125 -0
webscout/version.py +1 -1
webscout/zeroart/__init__.py +55 -0
webscout/zeroart/base.py +61 -0
webscout/zeroart/effects.py +99 -0
webscout/zeroart/fonts.py +816 -0
webscout/zerodir/__init__.py +225 -0
{webscout-6.3.dist-info → webscout-6.5.dist-info}/METADATA +37 -112
webscout-6.5.dist-info/RECORD +179 -0
webscout/Agents/Onlinesearcher.py +0 -182
webscout/Agents/__init__.py +0 -2
webscout/Agents/functioncall.py +0 -248
webscout/Bing_search.py +0 -154
webscout/Provider/TTI/AIuncensoredimage.py +0 -103
webscout/Provider/TTI/Nexra.py +0 -120
webscout/Provider/TTI/PollinationsAI.py +0 -138
webscout/Provider/TTI/WebSimAI.py +0 -142
webscout/Provider/TTI/aiforce.py +0 -160
webscout/Provider/TTI/artbit.py +0 -141
webscout/Provider/TTI/deepinfra.py +0 -148
webscout/Provider/TTI/huggingface.py +0 -155
webscout/Provider/TTI/talkai.py +0 -116
webscout/g4f.py +0 -666
webscout/models.py +0 -23
webscout/requestsHTMLfix.py +0 -775
webscout/webai.py +0 -2590
webscout-6.3.dist-info/RECORD +0 -124
{webscout-6.3.dist-info → webscout-6.5.dist-info}/LICENSE.md +0 -0
{webscout-6.3.dist-info → webscout-6.5.dist-info}/WHEEL +0 -0
{webscout-6.3.dist-info → webscout-6.5.dist-info}/entry_points.txt +0 -0
{webscout-6.3.dist-info → webscout-6.5.dist-info}/top_level.txt +0 -0

webscout/DWEBS.py CHANGED Viewed

@@ -1,21 +1,99 @@
-from bs4 import BeautifulSoup
 import requests
 from typing import Dict, List, Optional, Union, Any
 from concurrent.futures import ThreadPoolExecutor, as_completed
+from webscout.scout import Scout
 from urllib.parse import quote, urljoin
-from termcolor import colored
+from webscout.litagent import LitAgent
 import time
 import random
 import json
 import os
 from datetime import datetime, timedelta
 from functools import lru_cache
-import logging
-from tenacity import retry, stop_after_attempt, wait_exponential
+from webscout.Litlogger import LitLogger, LogFormat, ColorScheme
 class GoogleS:
-    """
-    Enhanced Google Search class with support for web search, image search, and advanced filters.
+    """A Python interface for Google search with advanced features
+    The GoogleS class provides a powerful interface to perform web searches, image searches,
+    and advanced filtering on Google. Built with love by HAI to keep it
+    Basic Usage:
+        >>> from webscout.DWEBS import GoogleS
+        >>> searcher = GoogleS()
+        >>> # Simple web search
+        >>> results = searcher.search("Python programming")
+        >>> for result in results:
+        ...     print(f"Title: {result['title']}")
+        ...     print(f"URL: {result['href']}")
+        ...     print(f"Description: {result['abstract']}")
+    Advanced Web Search:
+        >>> # Search with filters
+        >>> results = searcher.search(
+        ...     query="Python tutorials",
+        ...     site="github.com",
+        ...     file_type="pdf",
+        ...     time_period="month",
+        ...     max_results=5
+        ... )
+        >>> # Example response format:
+        >>> {
+        ...     'title': 'Python Tutorial',
+        ...     'href': 'https://example.com/python-tutorial',
+        ...     'abstract': 'Comprehensive Python tutorial covering basics to advanced topics',
+        ...     'index': 0,
+        ...     'type': 'web',
+        ...     'visible_text': ''  # Optional: Contains webpage text if extract_text=True
+        ... }
+    Image Search:
+        >>> # Search for images
+        >>> images = searcher.search_images(
+        ...     query="cute puppies",
+        ...     size="large",
+        ...     color="color",
+        ...     type_filter="photo",
+        ...     max_results=5
+        ... )
+        >>> # Example response format:
+        >>> {
+        ...     'title': 'Cute Puppy Image',
+        ...     'thumbnail': 'https://example.com/puppy-thumb.jpg',
+        ...     'full_url': 'https://example.com/puppy-full.jpg',
+        ...     'type': 'image'
+        ... }
+    Features:
+        - Web Search: Get detailed web results with title, URL, and description
+        - Image Search: Find images with thumbnails and full-resolution URLs
+        - Advanced Filters: Site-specific search, file types, time periods
+        - Rate Limiting: Smart request handling to avoid blocks
+        - Caching: Save results for faster repeat searches
+        - Retry Logic: Automatic retry on temporary failures
+        - Logging: Optional LitLogger integration for beautiful console output
+        - Proxy Support: Use custom proxies for requests
+        - Concurrent Processing: Multi-threaded requests for better performance
+    Response Format:
+        Web Search Results:
+            {
+                'title': str,       # Title of the webpage
+                'href': str,        # URL of the webpage
+                'abstract': str,    # Brief description or snippet
+                'index': int,       # Result position
+                'type': 'web',      # Result type identifier
+                'visible_text': str # Full page text (if extract_text=True)
+            }
+        Image Search Results:
+            {
+                'title': str,       # Image title or description
+                'thumbnail': str,   # Thumbnail image URL
+                'full_url': str,    # Full resolution image URL
+                'type': 'image'     # Result type identifier
+            }
     """
     SEARCH_TYPES = {
@@ -31,7 +109,8 @@ class GoogleS:
         timeout: Optional[int] = 10,
         max_workers: int = 20,
         cache_dir: Optional[str] = None,
-        rate_limit: float = 0.01
+        rate_limit: float = 0.01,
+        use_litlogger: bool = False
     ):
         """
         Initialize the GoogleS object with enhanced features.
@@ -39,10 +118,11 @@ class GoogleS:
         Args:
             cache_dir: Directory to store search result cache
             rate_limit: Minimum time between requests in seconds
+            use_litlogger: Whether to use LitLogger for logging (default: False)
         """
         self.proxy = proxy
         self.headers = headers if headers else {
-            "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/111.0.0.0 Safari/537.36"
+            "User-Agent": LitAgent().random()  # Use LitAgent to generate user agent
         }
         self.headers["Referer"] = "https://www.google.com/"
         self.client = requests.Session()
@@ -56,10 +136,16 @@ class GoogleS:
             os.makedirs(cache_dir)
         self.last_request_time = 0
         self.rate_limit = rate_limit
+        self.use_litlogger = use_litlogger
-        # Setup logging
-        logging.basicConfig(level=logging.INFO)
-        self.logger = logging.getLogger(__name__)
+        # Setup enhanced logging with LitLogger if enabled
+        if self.use_litlogger:
+            self.logger = LitLogger(
+                name="GoogleS",
+                format=LogFormat.MODERN_EMOJI,
+                color_scheme=ColorScheme.CYBERPUNK,
+                console_output=True
+            )
     def _respect_rate_limit(self):
         """Ensure minimum time between requests"""
@@ -69,20 +155,46 @@ class GoogleS:
             time.sleep(self.rate_limit - time_since_last)
         self.last_request_time = time.time()
-    @retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=4, max=10))
     def _get_url(self, method: str, url: str, params: Optional[Dict[str, str]] = None,
-                  data: Optional[Union[Dict[str, str], bytes]] = None) -> bytes:
+                  data: Optional[Union[Dict[str, str], bytes]] = None, max_retries: int = 3) -> bytes:
         """
-        Makes an HTTP request with retry logic and rate limiting.
+        Makes an HTTP request with manual retry logic and rate limiting.
+        Args:
+            method (str): HTTP method (GET, POST, etc.)
+            url (str): Target URL
+            params (Optional[Dict[str, str]]): Query parameters
+            data (Optional[Union[Dict[str, str], bytes]]): Request payload
+            max_retries (int): Maximum number of retry attempts
+        Returns:
+            bytes: Response content
         """
         self._respect_rate_limit()
-        try:
-            resp = self.client.request(method, url, params=params, data=data, timeout=self.timeout)
-            resp.raise_for_status()
-            return resp.content
-        except requests.exceptions.RequestException as ex:
-            self.logger.error(f"Request failed: {url} - {str(ex)}")
-            raise
+        for attempt in range(max_retries):
+            try:
+                if self.use_litlogger:
+                    self.logger.debug(f"Making {method} request to {url} (Attempt {attempt + 1})")
+                resp = self.client.request(method, url, params=params, data=data, timeout=self.timeout)
+                resp.raise_for_status()
+                if self.use_litlogger:
+                    self.logger.success(f"Request successful: {resp.status_code}")
+                return resp.content
+            except requests.exceptions.RequestException as ex:
+                if self.use_litlogger:
+                    self.logger.error(f"Request failed: {url} - {str(ex)}")
+                # Exponential backoff
+                if attempt < max_retries - 1:
+                    wait_time = (2 ** attempt) + random.random()
+                    time.sleep(wait_time)
+                else:
+                    raise
     @lru_cache(maxsize=100)
     def _cache_key(self, query: str, **kwargs) -> str:
@@ -99,7 +211,11 @@ class GoogleS:
             with open(cache_file, 'r') as f:
                 cached_data = json.load(f)
                 if datetime.fromisoformat(cached_data['timestamp']) + timedelta(hours=24) > datetime.now():
+                    if self.use_litlogger:
+                        self.logger.info(f"Using cached results for: {cache_key}")
                     return cached_data['results']
+        if self.use_litlogger:
+            self.logger.debug(f"No valid cache found for: {cache_key}")
         return None
     def _cache_results(self, cache_key: str, results: List[Dict[str, Any]]):
@@ -117,18 +233,49 @@ class GoogleS:
         self,
         query: str,
         max_results: int = 10,
-        size: Optional[str] = None,  # large, medium, icon
-        color: Optional[str] = None,  # color, gray, transparent
-        type_filter: Optional[str] = None,  # face, photo, clipart, lineart
+        size: Optional[str] = None,
+        color: Optional[str] = None,
+        type_filter: Optional[str] = None,
         **kwargs
     ) -> List[Dict[str, str]]:
-        """
-        Perform an image search and return results.
+        """Search for images on Google with style!
         Args:
-            size: Filter by image size
-            color: Filter by color
-            type_filter: Filter by image type
+            query (str): What you're looking for fam
+            max_results (int): How many results you want (default: 10)
+            size (Optional[str]): Image size filter
+                - 'large': Big pics
+                - 'medium': Medium sized
+                - 'icon': Small icons
+            color (Optional[str]): Color filter
+                - 'color': Full color
+                - 'gray': Black and white
+                - 'transparent': Transparent background
+            type_filter (Optional[str]): Type of image
+                - 'face': Just faces
+                - 'photo': Real photos
+                - 'clipart': Vector art
+                - 'lineart': Line drawings
+        Returns:
+            List[Dict[str, str]]: List of image results with these keys:
+                - 'thumbnail': Small preview URL
+                - 'full_url': Full resolution image URL
+                - 'title': Image title/description
+                - 'type': Always 'image'
+        Example:
+            >>> searcher = GoogleS()
+            >>> # Find some cool nature pics
+            >>> images = searcher.search_images(
+            ...     query="beautiful landscapes",
+            ...     size="large",
+            ...     color="color",
+            ...     max_results=5
+            ... )
+            >>> for img in images:
+            ...     print(f"Found: {img['title']}")
+            ...     print(f"URL: {img['full_url']}")
         """
         params = {
             "q": query,
@@ -144,7 +291,7 @@ class GoogleS:
             params["tbs"] = f"itp:{type_filter}"
         content = self._get_url("GET", self.SEARCH_TYPES["image"], params=params)
-        soup = BeautifulSoup(content, 'lxml')
+        soup = Scout(content)  # Use Scout parser
         results = []
         for img in soup.find_all("img", class_="rg_i"):
@@ -192,6 +339,9 @@ class GoogleS:
             exclude_terms: List of terms to exclude from search
             exact_phrase: Exact phrase to match
         """
+        if self.use_litlogger:
+            self.logger.info(f"Starting search for: {query}")
         # Build advanced query
         advanced_query = query
         if site:
@@ -202,7 +352,10 @@ class GoogleS:
             advanced_query += " " + " ".join(f"-{term}" for term in exclude_terms)
         if exact_phrase:
             advanced_query = f'"{exact_phrase}"' + advanced_query
+        if self.use_litlogger:
+            self.logger.debug(f"Advanced query: {advanced_query}")
         # Check cache first
         cache_key = self._cache_key(advanced_query, region=region, language=language,
                                   safe=safe, time_period=time_period, sort_by=sort_by)
@@ -233,7 +386,8 @@ class GoogleS:
             for future in as_completed(futures):
                 try:
                     resp_content = future.result()
-                    soup = BeautifulSoup(resp_content, 'lxml')  # Use lxml parser
+                    soup = Scout(resp_content)  # Use Scout parser
                     result_blocks = soup.find_all("div", class_="g")
                     if not result_blocks:
@@ -297,9 +451,9 @@ class GoogleS:
     def _extract_text_from_webpage(self, html_content: bytes, max_characters: Optional[int] = None) -> str:
         """
-        Extracts visible text from HTML content using lxml parser.
+        Extracts visible text from HTML content using Scout parser.
         """
-        soup = BeautifulSoup(html_content, 'lxml')  # Use lxml parser
+        soup = Scout(html_content)  # Use Scout parser
         for tag in soup(["script", "style", "header", "footer", "nav"]):
             tag.extract()
         visible_text = soup.get_text(strip=True)

webscout 6.3__py3-none-any.whl → 6.5__py3-none-any.whl

Potentially problematic release.

webscout 6.3__py3-none-any.whl → 6.5__py3-none-any.whl