PyPI - webscout - Versions diffs - 8.2.8__py3-none-any.whl → 8.3__py3-none-any.whl - Mend

webscout 8.2.8__py3-none-any.whl → 8.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of webscout might be problematic. Click here for more details.

Files changed (197) hide show

webscout/AIauto.py +34 -16
webscout/AIbase.py +96 -37
webscout/AIutel.py +491 -87
webscout/Bard.py +441 -323
webscout/Extra/GitToolkit/__init__.py +10 -10
webscout/Extra/YTToolkit/ytapi/video.py +232 -232
webscout/Litlogger/README.md +10 -0
webscout/Litlogger/__init__.py +7 -59
webscout/Litlogger/formats.py +4 -0
webscout/Litlogger/handlers.py +103 -0
webscout/Litlogger/levels.py +13 -0
webscout/Litlogger/logger.py +92 -0
webscout/Provider/AISEARCH/Perplexity.py +332 -358
webscout/Provider/AISEARCH/felo_search.py +9 -35
webscout/Provider/AISEARCH/genspark_search.py +30 -56
webscout/Provider/AISEARCH/hika_search.py +4 -16
webscout/Provider/AISEARCH/iask_search.py +410 -436
webscout/Provider/AISEARCH/monica_search.py +4 -30
webscout/Provider/AISEARCH/scira_search.py +6 -32
webscout/Provider/AISEARCH/webpilotai_search.py +38 -64
webscout/Provider/Blackboxai.py +155 -35
webscout/Provider/ChatSandbox.py +2 -1
webscout/Provider/Deepinfra.py +339 -339
webscout/Provider/ExaChat.py +358 -358
webscout/Provider/Gemini.py +169 -169
webscout/Provider/GithubChat.py +1 -2
webscout/Provider/Glider.py +3 -3
webscout/Provider/HeckAI.py +172 -82
webscout/Provider/LambdaChat.py +1 -0
webscout/Provider/MCPCore.py +7 -3
webscout/Provider/OPENAI/BLACKBOXAI.py +421 -139
webscout/Provider/OPENAI/Cloudflare.py +38 -21
webscout/Provider/OPENAI/FalconH1.py +457 -0
webscout/Provider/OPENAI/FreeGemini.py +35 -18
webscout/Provider/OPENAI/NEMOTRON.py +34 -34
webscout/Provider/OPENAI/PI.py +427 -0
webscout/Provider/OPENAI/Qwen3.py +304 -0
webscout/Provider/OPENAI/README.md +952 -1253
webscout/Provider/OPENAI/TwoAI.py +374 -0
webscout/Provider/OPENAI/__init__.py +7 -1
webscout/Provider/OPENAI/ai4chat.py +73 -63
webscout/Provider/OPENAI/api.py +869 -644
webscout/Provider/OPENAI/base.py +2 -0
webscout/Provider/OPENAI/c4ai.py +34 -13
webscout/Provider/OPENAI/chatgpt.py +575 -556
webscout/Provider/OPENAI/chatgptclone.py +512 -487
webscout/Provider/OPENAI/chatsandbox.py +11 -6
webscout/Provider/OPENAI/copilot.py +258 -0
webscout/Provider/OPENAI/deepinfra.py +327 -318
webscout/Provider/OPENAI/e2b.py +140 -104
webscout/Provider/OPENAI/exaai.py +420 -411
webscout/Provider/OPENAI/exachat.py +448 -443
webscout/Provider/OPENAI/flowith.py +7 -3
webscout/Provider/OPENAI/freeaichat.py +12 -8
webscout/Provider/OPENAI/glider.py +15 -8
webscout/Provider/OPENAI/groq.py +5 -2
webscout/Provider/OPENAI/heckai.py +311 -307
webscout/Provider/OPENAI/llmchatco.py +9 -7
webscout/Provider/OPENAI/mcpcore.py +18 -9
webscout/Provider/OPENAI/multichat.py +7 -5
webscout/Provider/OPENAI/netwrck.py +16 -11
webscout/Provider/OPENAI/oivscode.py +290 -0
webscout/Provider/OPENAI/opkfc.py +507 -496
webscout/Provider/OPENAI/pydantic_imports.py +172 -0
webscout/Provider/OPENAI/scirachat.py +29 -17
webscout/Provider/OPENAI/sonus.py +308 -303
webscout/Provider/OPENAI/standardinput.py +442 -433
webscout/Provider/OPENAI/textpollinations.py +18 -11
webscout/Provider/OPENAI/toolbaz.py +419 -413
webscout/Provider/OPENAI/typefully.py +17 -10
webscout/Provider/OPENAI/typegpt.py +21 -11
webscout/Provider/OPENAI/uncovrAI.py +477 -462
webscout/Provider/OPENAI/utils.py +90 -79
webscout/Provider/OPENAI/venice.py +435 -425
webscout/Provider/OPENAI/wisecat.py +387 -381
webscout/Provider/OPENAI/writecream.py +166 -163
webscout/Provider/OPENAI/x0gpt.py +26 -37
webscout/Provider/OPENAI/yep.py +384 -356
webscout/Provider/PI.py +2 -1
webscout/Provider/TTI/README.md +55 -101
webscout/Provider/TTI/__init__.py +4 -9
webscout/Provider/TTI/aiarta.py +365 -0
webscout/Provider/TTI/artbit.py +0 -0
webscout/Provider/TTI/base.py +64 -0
webscout/Provider/TTI/fastflux.py +200 -0
webscout/Provider/TTI/magicstudio.py +201 -0
webscout/Provider/TTI/piclumen.py +203 -0
webscout/Provider/TTI/pixelmuse.py +225 -0
webscout/Provider/TTI/pollinations.py +221 -0
webscout/Provider/TTI/utils.py +11 -0
webscout/Provider/TTS/__init__.py +2 -1
webscout/Provider/TTS/base.py +159 -159
webscout/Provider/TTS/openai_fm.py +129 -0
webscout/Provider/TextPollinationsAI.py +308 -308
webscout/Provider/TwoAI.py +239 -44
webscout/Provider/UNFINISHED/Youchat.py +330 -330
webscout/Provider/UNFINISHED/puterjs.py +635 -0
webscout/Provider/UNFINISHED/test_lmarena.py +119 -119
webscout/Provider/Writecream.py +246 -246
webscout/Provider/__init__.py +2 -2
webscout/Provider/ai4chat.py +33 -8
webscout/Provider/granite.py +41 -6
webscout/Provider/koala.py +169 -169
webscout/Provider/oivscode.py +309 -0
webscout/Provider/samurai.py +3 -2
webscout/Provider/scnet.py +1 -0
webscout/Provider/typegpt.py +3 -3
webscout/Provider/uncovr.py +368 -368
webscout/client.py +70 -0
webscout/litprinter/__init__.py +58 -58
webscout/optimizers.py +419 -419
webscout/scout/README.md +3 -1
webscout/scout/core/crawler.py +134 -64
webscout/scout/core/scout.py +148 -109
webscout/scout/element.py +106 -88
webscout/swiftcli/Readme.md +323 -323
webscout/swiftcli/plugins/manager.py +9 -2
webscout/version.py +1 -1
webscout/zeroart/__init__.py +134 -134
webscout/zeroart/effects.py +100 -100
webscout/zeroart/fonts.py +1238 -1238
{webscout-8.2.8.dist-info → webscout-8.3.dist-info}/METADATA +160 -35
webscout-8.3.dist-info/RECORD +290 -0
{webscout-8.2.8.dist-info → webscout-8.3.dist-info}/WHEEL +1 -1
{webscout-8.2.8.dist-info → webscout-8.3.dist-info}/entry_points.txt +1 -0
webscout/Litlogger/Readme.md +0 -175
webscout/Litlogger/core/__init__.py +0 -6
webscout/Litlogger/core/level.py +0 -23
webscout/Litlogger/core/logger.py +0 -165
webscout/Litlogger/handlers/__init__.py +0 -12
webscout/Litlogger/handlers/console.py +0 -33
webscout/Litlogger/handlers/file.py +0 -143
webscout/Litlogger/handlers/network.py +0 -173
webscout/Litlogger/styles/__init__.py +0 -7
webscout/Litlogger/styles/colors.py +0 -249
webscout/Litlogger/styles/formats.py +0 -458
webscout/Litlogger/styles/text.py +0 -87
webscout/Litlogger/utils/__init__.py +0 -6
webscout/Litlogger/utils/detectors.py +0 -153
webscout/Litlogger/utils/formatters.py +0 -200
webscout/Provider/ChatGPTGratis.py +0 -194
webscout/Provider/TTI/AiForce/README.md +0 -159
webscout/Provider/TTI/AiForce/__init__.py +0 -22
webscout/Provider/TTI/AiForce/async_aiforce.py +0 -224
webscout/Provider/TTI/AiForce/sync_aiforce.py +0 -245
webscout/Provider/TTI/FreeAIPlayground/README.md +0 -99
webscout/Provider/TTI/FreeAIPlayground/__init__.py +0 -9
webscout/Provider/TTI/FreeAIPlayground/async_freeaiplayground.py +0 -181
webscout/Provider/TTI/FreeAIPlayground/sync_freeaiplayground.py +0 -180
webscout/Provider/TTI/ImgSys/README.md +0 -174
webscout/Provider/TTI/ImgSys/__init__.py +0 -23
webscout/Provider/TTI/ImgSys/async_imgsys.py +0 -202
webscout/Provider/TTI/ImgSys/sync_imgsys.py +0 -195
webscout/Provider/TTI/MagicStudio/README.md +0 -101
webscout/Provider/TTI/MagicStudio/__init__.py +0 -2
webscout/Provider/TTI/MagicStudio/async_magicstudio.py +0 -111
webscout/Provider/TTI/MagicStudio/sync_magicstudio.py +0 -109
webscout/Provider/TTI/Nexra/README.md +0 -155
webscout/Provider/TTI/Nexra/__init__.py +0 -22
webscout/Provider/TTI/Nexra/async_nexra.py +0 -286
webscout/Provider/TTI/Nexra/sync_nexra.py +0 -258
webscout/Provider/TTI/PollinationsAI/README.md +0 -146
webscout/Provider/TTI/PollinationsAI/__init__.py +0 -23
webscout/Provider/TTI/PollinationsAI/async_pollinations.py +0 -311
webscout/Provider/TTI/PollinationsAI/sync_pollinations.py +0 -265
webscout/Provider/TTI/aiarta/README.md +0 -134
webscout/Provider/TTI/aiarta/__init__.py +0 -2
webscout/Provider/TTI/aiarta/async_aiarta.py +0 -482
webscout/Provider/TTI/aiarta/sync_aiarta.py +0 -440
webscout/Provider/TTI/artbit/README.md +0 -100
webscout/Provider/TTI/artbit/__init__.py +0 -22
webscout/Provider/TTI/artbit/async_artbit.py +0 -155
webscout/Provider/TTI/artbit/sync_artbit.py +0 -148
webscout/Provider/TTI/fastflux/README.md +0 -129
webscout/Provider/TTI/fastflux/__init__.py +0 -22
webscout/Provider/TTI/fastflux/async_fastflux.py +0 -261
webscout/Provider/TTI/fastflux/sync_fastflux.py +0 -252
webscout/Provider/TTI/huggingface/README.md +0 -114
webscout/Provider/TTI/huggingface/__init__.py +0 -22
webscout/Provider/TTI/huggingface/async_huggingface.py +0 -199
webscout/Provider/TTI/huggingface/sync_huggingface.py +0 -195
webscout/Provider/TTI/piclumen/README.md +0 -161
webscout/Provider/TTI/piclumen/__init__.py +0 -23
webscout/Provider/TTI/piclumen/async_piclumen.py +0 -268
webscout/Provider/TTI/piclumen/sync_piclumen.py +0 -233
webscout/Provider/TTI/pixelmuse/README.md +0 -79
webscout/Provider/TTI/pixelmuse/__init__.py +0 -4
webscout/Provider/TTI/pixelmuse/async_pixelmuse.py +0 -249
webscout/Provider/TTI/pixelmuse/sync_pixelmuse.py +0 -182
webscout/Provider/TTI/talkai/README.md +0 -139
webscout/Provider/TTI/talkai/__init__.py +0 -4
webscout/Provider/TTI/talkai/async_talkai.py +0 -229
webscout/Provider/TTI/talkai/sync_talkai.py +0 -207
webscout/Provider/UNFINISHED/oivscode.py +0 -351
webscout-8.2.8.dist-info/RECORD +0 -334
{webscout-8.2.8.dist-info → webscout-8.3.dist-info}/licenses/LICENSE.md +0 -0
{webscout-8.2.8.dist-info → webscout-8.3.dist-info}/top_level.txt +0 -0

webscout/scout/core/scout.py CHANGED Viewed

@@ -1,20 +1,20 @@
 """
 Scout Main Module - HTML Parsing and Traversal
 """
-import re
-import json
 import hashlib
+import json
+import re
 import unicodedata
 import urllib.parse
-from typing import List, Dict, Optional, Any
+from typing import Any, Dict, List, Optional
+from ..element import NavigableString, Tag
 from ..parsers import ParserRegistry
-from ..element import Tag, NavigableString
 from ..utils import decode_markup
-from .text_analyzer import ScoutTextAnalyzer
-from .web_analyzer import ScoutWebAnalyzer
 from .search_result import ScoutSearchResult
+from .text_analyzer import ScoutTextAnalyzer
 from .text_utils import SentenceTokenizer
+from .web_analyzer import ScoutWebAnalyzer
 class Scout:
@@ -23,11 +23,11 @@ class Scout:
     A comprehensive HTML parsing and traversal library.
     Enhanced with advanced features and intelligent parsing.
     """
     def __init__(self, markup="", features='html.parser', from_encoding=None, **kwargs):
         """
         Initialize Scout with HTML content.
         Args:
             markup (str): HTML content to parse
             features (str): Parser to use ('html.parser', 'lxml', 'html5lib', 'lxml-xml')
@@ -38,50 +38,50 @@ class Scout:
         self.markup = self._preprocess_markup(markup, from_encoding)
         self.features = features
         self.from_encoding = from_encoding
         # Get the right parser for the job
         if features not in ParserRegistry.list_parsers():
             raise ValueError(
                 f"Invalid parser '{features}'! Choose from: {', '.join(ParserRegistry.list_parsers().keys())}"
             )
         parser_class = ParserRegistry.get_parser(features)
         self.parser = parser_class
         # Parse that HTML! 🎯
         self._soup = self.parser.parse(self.markup)
         # BeautifulSoup-like attributes
         self.name = self._soup.name if hasattr(self._soup, 'name') else None
         self.attrs = self._soup.attrs if hasattr(self._soup, 'attrs') else {}
         # Advanced parsing options
         self._cache = {}
         # Text and web analyzers
         self.text_analyzer = ScoutTextAnalyzer()
         self.web_analyzer = ScoutWebAnalyzer()
     def normalize_text(self, text: str, form='NFKD') -> str:
         """
         Apply Unicode normalization to a string.
         Args:
             text (str): String to normalize
             form (str, optional): Normalization form handed to
                 ``unicodedata.normalize`` (defaults to 'NFKD')
         Returns:
             str: The normalized string
         """
         normalized = unicodedata.normalize(form, text)
         return normalized
     def url_parse(self, url: str) -> Dict[str, str]:
         """
         Parse and analyze a URL.
         Args:
             url (str): URL to parse
         Returns:
             Dict[str, str]: Parsed URL components
         """
@@ -94,39 +94,39 @@ class Scout:
             'query': parsed.query,
             'fragment': parsed.fragment
         }
     def analyze_page_structure(self) -> Dict[str, Any]:
         """
         Analyze the structure of the parsed page.
         Returns:
             Dict[str, Any]: Page structure analysis
         """
         return self.web_analyzer.analyze_page_structure(self)
     def analyze_text(self, text: Optional[str] = None) -> Dict[str, Any]:
         """
         Perform advanced text analysis.
         Args:
             text (str, optional): Text to analyze. If None, uses page text.
         Returns:
             Dict[str, Any]: Text analysis results
         """
         if text is None:
             text = self.get_text()
         return {
             'word_count': self.text_analyzer.count_words(text),
             'entities': self.text_analyzer.extract_entities(text),
             'tokens': self.text_analyzer.tokenize(text)
         }
     def extract_semantic_info(self) -> Dict[str, Any]:
         """
         Extract semantic information from the document.
         Returns:
             Dict[str, Any]: Semantic information
         """
@@ -146,29 +146,29 @@ class Scout:
             }
         }
         return semantic_info
     def cache(self, key: str, value: Any = None) -> Any:
         """
         Manage a cache for parsed content.
         Args:
             key (str): Cache key
             value (Any, optional): Value to cache
         Returns:
             Any: Cached value or None
         """
         if value is not None:
             self._cache[key] = value
         return self._cache.get(key)
     def hash_content(self, method='md5') -> str:
         """
         Generate a hash of the parsed content.
         Args:
             method (str, optional): Hashing method
         Returns:
             str: Content hash
         """
@@ -177,21 +177,21 @@ class Scout:
             'sha1': hashlib.sha1,
             'sha256': hashlib.sha256
         }
         if method not in hash_methods:
             raise ValueError(f"Unsupported hash method: {method}")
         hasher = hash_methods[method]()
         hasher.update(str(self._soup).encode('utf-8'))
         return hasher.hexdigest()
     def extract_links(self, base_url: Optional[str] = None) -> List[Dict[str, str]]:
         """
         Extract all links from the document.
         Args:
             base_url (str, optional): Base URL for resolving relative links
         Returns:
             List[Dict[str, str]]: List of link dictionaries
         """
@@ -202,7 +202,7 @@ class Scout:
                 # Resolve relative URLs if base_url is provided
                 if base_url and not href.startswith(('http://', 'https://', '//')):
                     href = f"{base_url.rstrip('/')}/{href.lstrip('/')}"
                 links.append({
                     'href': href,
                     'text': link.get_text(strip=True),
@@ -210,11 +210,11 @@ class Scout:
                     'type': link.get('type')
                 })
         return links
     def extract_metadata(self) -> Dict[str, Any]:
         """
         Extract metadata from HTML document.
         Returns:
             Dict[str, Any]: Extracted metadata
         """
@@ -225,87 +225,87 @@ class Scout:
             'og_metadata': {},
             'twitter_metadata': {}
         }
         # Open Graph metadata
         for meta in self.find_all('meta', attrs={'property': re.compile(r'^og:')}):
             key = meta.attrs('property')[0][3:]
             metadata['og_metadata'][key] = meta.attrs('content')[0]
         # Twitter Card metadata
         for meta in self.find_all('meta', attrs={'name': re.compile(r'^twitter:')}):
             key = meta.attrs('name')[0][8:]
             metadata['twitter_metadata'][key] = meta.attrs('content')[0]
         return metadata
     def to_json(self, indent=2) -> str:
         """
         Serialize the parsed document tree to a JSON string.
         Args:
             indent (int, optional): Indentation passed to ``json.dumps``
         Returns:
             str: JSON text in which every tag becomes an object with 'name',
                 'attrs' and 'text' keys (plus 'children' when the tag has
                 contents) and every NavigableString becomes a plain string
         """
         def _serialize(node):
             # Text nodes are leaves and are emitted as bare strings
             if isinstance(node, NavigableString):
                 return str(node)
             payload = {
                 'name': node.name,
                 'attrs': node.attrs,
                 'text': node.get_text(strip=True)
             }
             # The 'children' key is omitted entirely for empty tags
             if node.contents:
                 payload['children'] = [_serialize(kid) for kid in node.contents]
             return payload
         tree = _serialize(self._soup)
         return json.dumps(tree, indent=indent)
     def find(self, name=None, attrs={}, recursive=True, text=None, **kwargs) -> ScoutSearchResult:
         """
         Locate the first element that satisfies the search criteria.
         Args:
             name (str, optional): Tag name to search for
             attrs (dict, optional): Attributes to match
             recursive (bool, optional): Search recursively
             text (str, optional): Text content to match
         Returns:
             ScoutSearchResult: Wrapper holding the single match, or an empty
                 wrapper when the underlying search yields a falsy result
         """
         match = self._soup.find(name, attrs, recursive, text, **kwargs)
         # Truthiness (not an ``is None`` check) decides whether there is a hit
         hits = [match] if match else []
         return ScoutSearchResult(hits)
     def find_all(self, name=None, attrs={}, recursive=True, text=None, limit=None, **kwargs) -> ScoutSearchResult:
         """
         Collect every element that satisfies the search criteria.
         Args:
             name (str, optional): Tag name to search for
             attrs (dict, optional): Attributes to match
             recursive (bool, optional): Search recursively
             text (str, optional): Text content to match
             limit (int, optional): Maximum number of results
         Returns:
             ScoutSearchResult: Wrapper around the matches returned by the
                 underlying parsed tree
         """
         return ScoutSearchResult(
             self._soup.find_all(name, attrs, recursive, text, limit, **kwargs)
         )
     def find_parent(self, name=None, attrs={}, **kwargs) -> Optional[Tag]:
         """
         Find the first parent matching given criteria.
         Args:
             name (str, optional): Tag name to search for
             attrs (dict, optional): Attributes to match
         Returns:
             Tag or None: First matching parent
         """
@@ -316,16 +316,16 @@ class Scout:
                 return current
             current = current.parent
         return None
     def find_parents(self, name=None, attrs={}, limit=None, **kwargs) -> List[Tag]:
         """
         Find all parents matching given criteria.
         Args:
             name (str, optional): Tag name to search for
             attrs (dict, optional): Attributes to match
             limit (int, optional): Maximum number of results
         Returns:
             List[Tag]: List of matching parents
         """
@@ -337,21 +337,21 @@ class Scout:
                 parents.append(current)
             current = current.parent
         return parents
     def find_next_sibling(self, name=None, attrs={}, **kwargs) -> Optional[Tag]:
         """
         Find the next sibling matching given criteria.
         Args:
             name (str, optional): Tag name to search for
             attrs (dict, optional): Attributes to match
         Returns:
             Tag or None: First matching next sibling
         """
         if not self._soup.parent:
             return None
         siblings = self._soup.parent.contents
         try:
             current_index = siblings.index(self._soup)
@@ -363,22 +363,22 @@ class Scout:
         except ValueError:
             pass
         return None
     def find_next_siblings(self, name=None, attrs={}, limit=None, **kwargs) -> List[Tag]:
         """
         Find all next siblings matching given criteria.
         Args:
             name (str, optional): Tag name to search for
             attrs (dict, optional): Attributes to match
             limit (int, optional): Maximum number of results
         Returns:
             List[Tag]: List of matching next siblings
         """
         if not self._soup.parent:
             return []
         siblings = []
         siblings_list = self._soup.parent.contents
         try:
@@ -393,40 +393,79 @@ class Scout:
         except ValueError:
             pass
         return siblings
+    def find_previous_sibling(self, name=None, attrs={}, **kwargs) -> Optional[Tag]:
+        """
+        Find the previous sibling matching given criteria.
+        Siblings that precede the root node are scanned from nearest to
+        farthest, and only Tag instances are considered.
+        Args:
+            name (str, optional): Tag name to match; None matches any tag
+            attrs (dict, optional): Attribute values that must all compare equal
+            **kwargs: Accepted but not consulted by this method
+        Returns:
+            Tag or None: Nearest matching previous sibling; None when the root
+                has no parent, is not found among its parent's contents, or
+                no sibling matches
+        """
+        if not self._soup.parent:
+            return None
+        siblings = self._soup.parent.contents
+        try:
+            current_index = siblings.index(self._soup)
+            for sibling in reversed(siblings[:current_index]):
+                if isinstance(sibling, Tag):
+                    if (name is None or sibling.name == name) and all(
+                        sibling.get(k) == v for k, v in attrs.items()
+                    ):
+                        return sibling
+        except ValueError:
+            pass
+        return None
+    def find_previous_siblings(self, name=None, attrs={}, limit=None, **kwargs) -> List[Tag]:
+        """
+        Find all previous siblings matching given criteria.
+        Siblings that precede the root node are scanned from nearest to
+        farthest, and only Tag instances are considered.
+        Args:
+            name (str, optional): Tag name to match; None matches any tag
+            attrs (dict, optional): Attribute values that must all compare equal
+            limit (int, optional): Stop once this many matches are collected;
+                a falsy value (None or 0) means no cap
+            **kwargs: Accepted but not consulted by this method
+        Returns:
+            List[Tag]: Matching previous siblings, nearest first; empty when
+                the root has no parent, is not found among its parent's
+                contents, or no sibling matches
+        """
+        if not self._soup.parent:
+            return []
+        siblings = []
+        siblings_list = self._soup.parent.contents
+        try:
+            current_index = siblings_list.index(self._soup)
+            for sibling in reversed(siblings_list[:current_index]):
+                if isinstance(sibling, Tag):
+                    if (name is None or sibling.name == name) and all(
+                        sibling.get(k) == v for k, v in attrs.items()
+                    ):
+                        siblings.append(sibling)
+                        if limit and len(siblings) == limit:
+                            break
+        except ValueError:
+            pass
+        return siblings
     def select(self, selector: str) -> List[Tag]:
         """
         Select elements using CSS selector.
         Args:
             selector (str): CSS selector string
         Returns:
             List[Tag]: List of matching elements
         """
         return self._soup.select(selector)
     def select_one(self, selector: str) -> Optional[Tag]:
         """
         Select the first element matching the CSS selector.
         Args:
             selector (str): CSS selector string
         Returns:
             Tag or None: First matching element
         """
         return self._soup.select_one(selector)
     def get_text(self, separator=' ', strip=False, types=None) -> str:
         """
         Extract all text from the parsed document.
         Args:
             separator (str, optional): Text separator
             strip (bool, optional): Strip whitespace
             types (list, optional): Types of content to extract
         Returns:
             str: Extracted text
         """
@@ -434,113 +473,113 @@ class Scout:
         text = self._soup.get_text(separator, strip, types)
         sentences = tokenizer.tokenize(text)
         return "\n\n".join(sentences)
     def remove_tags(self, tags: List[str]) -> None:
         """
         Remove specified tags and their contents from the document.
         Args:
             tags (List[str]): List of tag names to remove
         """
         for tag_name in tags:
             for tag in self._soup.find_all(tag_name):
                 tag.decompose()
     def prettify(self, formatter='minimal') -> str:
         """
         Return a formatted, pretty-printed version of the HTML.
         Args:
             formatter (str, optional): Formatting style
         Returns:
             str: Prettified HTML
         """
         return self._soup.prettify(formatter)
     def decompose(self, tag: Tag = None) -> None:
         """
         Remove a tag and its contents from the document.
         Args:
             tag (Tag, optional): Tag to remove. If None, removes the root tag.
         """
         if tag is None:
             tag = self._soup
         tag.decompose()
     def extract(self, tag: Tag = None) -> Tag:
         """
         Remove a tag from the document and return it.
         Args:
             tag (Tag, optional): Tag to extract. If None, extracts the root tag.
         Returns:
             Tag: Extracted tag
         """
         if tag is None:
             tag = self._soup
         return tag.extract()
     def clear(self, tag: Tag = None) -> None:
         """
         Remove a tag's contents while keeping the tag itself.
         Args:
             tag (Tag, optional): Tag to clear. If None, clears the root tag.
         """
         if tag is None:
             tag = self._soup
         tag.clear()
     def replace_with(self, old_tag: Tag, new_tag: Tag) -> None:
         """
         Replace one tag with another.
         Args:
             old_tag (Tag): Tag to replace
             new_tag (Tag): Replacement tag
         """
         old_tag.replace_with(new_tag)
     def encode(self, encoding='utf-8') -> bytes:
         """
         Encode the document to a specific encoding.
         Args:
             encoding (str, optional): Encoding to use
         Returns:
             bytes: Encoded document
         """
         return str(self._soup).encode(encoding)
     def decode(self, encoding='utf-8') -> str:
         """
         Decode the document from a specific encoding.
         Args:
             encoding (str, optional): Encoding to use
         Returns:
             str: Decoded document
         """
         return str(self._soup)
     def __str__(self) -> str:
         """
         String representation of the parsed document.
         Returns:
             str: HTML content
         """
         return str(self._soup)
     def __repr__(self) -> str:
         """
         Detailed representation of the Scout object.
         Returns:
             str: Scout object description
         """
@@ -549,20 +588,20 @@ class Scout:
     def _preprocess_markup(self, markup: str, encoding: Optional[str] = None) -> str:
         """
         Clean up raw markup before it reaches the parser.
         Args:
             markup (str): Input markup
             encoding (str, optional): Encoding passed on to ``decode_markup``
         Returns:
             str: Decoded markup with HTML comments removed and every run of
                 whitespace collapsed to a single space
         """
         text = decode_markup(markup, encoding)
         # DOTALL lets a comment span several lines; the match is non-greedy
         without_comments = re.sub(r'<!--.*?-->', '', text, flags=re.DOTALL)
         # Collapse whitespace only after the comments are gone
         return re.sub(r'\s+', ' ', without_comments)

webscout 8.2.8__py3-none-any.whl → 8.3__py3-none-any.whl

Potentially problematic release.

webscout 8.2.8__py3-none-any.whl → 8.3__py3-none-any.whl