PyPI - webscout - Versions diffs - 7.0__py3-none-any.whl → 7.2__py3-none-any.whl - Mend

webscout 7.0 py3-none-any.whl → 7.2 py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of webscout might be problematic. Click here for more details.

Files changed (147)

webscout/AIauto.py +191 -191
webscout/AIbase.py +122 -122
webscout/AIutel.py +440 -440
webscout/Bard.py +343 -161
webscout/DWEBS.py +489 -492
webscout/Extra/YTToolkit/YTdownloader.py +995 -995
webscout/Extra/YTToolkit/__init__.py +2 -2
webscout/Extra/YTToolkit/transcriber.py +476 -479
webscout/Extra/YTToolkit/ytapi/channel.py +307 -307
webscout/Extra/YTToolkit/ytapi/playlist.py +58 -58
webscout/Extra/YTToolkit/ytapi/pool.py +7 -7
webscout/Extra/YTToolkit/ytapi/utils.py +62 -62
webscout/Extra/YTToolkit/ytapi/video.py +103 -103
webscout/Extra/autocoder/__init__.py +9 -9
webscout/Extra/autocoder/autocoder_utiles.py +199 -199
webscout/Extra/autocoder/rawdog.py +5 -7
webscout/Extra/autollama.py +230 -230
webscout/Extra/gguf.py +3 -3
webscout/Extra/weather.py +171 -171
webscout/LLM.py +442 -442
webscout/Litlogger/__init__.py +67 -681
webscout/Litlogger/core/__init__.py +6 -0
webscout/Litlogger/core/level.py +20 -0
webscout/Litlogger/core/logger.py +123 -0
webscout/Litlogger/handlers/__init__.py +12 -0
webscout/Litlogger/handlers/console.py +50 -0
webscout/Litlogger/handlers/file.py +143 -0
webscout/Litlogger/handlers/network.py +174 -0
webscout/Litlogger/styles/__init__.py +7 -0
webscout/Litlogger/styles/colors.py +231 -0
webscout/Litlogger/styles/formats.py +377 -0
webscout/Litlogger/styles/text.py +87 -0
webscout/Litlogger/utils/__init__.py +6 -0
webscout/Litlogger/utils/detectors.py +154 -0
webscout/Litlogger/utils/formatters.py +200 -0
webscout/Provider/AISEARCH/DeepFind.py +250 -250
webscout/Provider/Blackboxai.py +136 -137
webscout/Provider/ChatGPTGratis.py +226 -0
webscout/Provider/Cloudflare.py +91 -78
webscout/Provider/DeepSeek.py +218 -0
webscout/Provider/Deepinfra.py +59 -35
webscout/Provider/Free2GPT.py +131 -124
webscout/Provider/Gemini.py +100 -115
webscout/Provider/Glider.py +74 -59
webscout/Provider/Groq.py +30 -18
webscout/Provider/Jadve.py +108 -77
webscout/Provider/Llama3.py +117 -94
webscout/Provider/Marcus.py +191 -137
webscout/Provider/Netwrck.py +62 -50
webscout/Provider/PI.py +79 -124
webscout/Provider/PizzaGPT.py +129 -83
webscout/Provider/QwenLM.py +311 -0
webscout/Provider/TTI/AiForce/__init__.py +22 -22
webscout/Provider/TTI/AiForce/async_aiforce.py +257 -257
webscout/Provider/TTI/AiForce/sync_aiforce.py +242 -242
webscout/Provider/TTI/Nexra/__init__.py +22 -22
webscout/Provider/TTI/Nexra/async_nexra.py +286 -286
webscout/Provider/TTI/Nexra/sync_nexra.py +258 -258
webscout/Provider/TTI/PollinationsAI/__init__.py +23 -23
webscout/Provider/TTI/PollinationsAI/async_pollinations.py +330 -330
webscout/Provider/TTI/PollinationsAI/sync_pollinations.py +285 -285
webscout/Provider/TTI/artbit/__init__.py +22 -22
webscout/Provider/TTI/artbit/async_artbit.py +184 -184
webscout/Provider/TTI/artbit/sync_artbit.py +176 -176
webscout/Provider/TTI/blackbox/__init__.py +4 -4
webscout/Provider/TTI/blackbox/async_blackbox.py +212 -212
webscout/Provider/TTI/blackbox/sync_blackbox.py +199 -199
webscout/Provider/TTI/deepinfra/__init__.py +4 -4
webscout/Provider/TTI/deepinfra/async_deepinfra.py +227 -227
webscout/Provider/TTI/deepinfra/sync_deepinfra.py +199 -199
webscout/Provider/TTI/huggingface/__init__.py +22 -22
webscout/Provider/TTI/huggingface/async_huggingface.py +199 -199
webscout/Provider/TTI/huggingface/sync_huggingface.py +195 -195
webscout/Provider/TTI/imgninza/__init__.py +4 -4
webscout/Provider/TTI/imgninza/async_ninza.py +214 -214
webscout/Provider/TTI/imgninza/sync_ninza.py +209 -209
webscout/Provider/TTI/talkai/__init__.py +4 -4
webscout/Provider/TTI/talkai/async_talkai.py +229 -229
webscout/Provider/TTI/talkai/sync_talkai.py +207 -207
webscout/Provider/TTS/deepgram.py +182 -182
webscout/Provider/TTS/elevenlabs.py +136 -136
webscout/Provider/TTS/gesserit.py +150 -150
webscout/Provider/TTS/murfai.py +138 -138
webscout/Provider/TTS/parler.py +133 -134
webscout/Provider/TTS/streamElements.py +360 -360
webscout/Provider/TTS/utils.py +280 -280
webscout/Provider/TTS/voicepod.py +116 -116
webscout/Provider/TextPollinationsAI.py +74 -47
webscout/Provider/WiseCat.py +193 -0
webscout/Provider/__init__.py +144 -136
webscout/Provider/cerebras.py +242 -227
webscout/Provider/chatglm.py +204 -204
webscout/Provider/dgaf.py +67 -39
webscout/Provider/gaurish.py +105 -66
webscout/Provider/geminiapi.py +208 -208
webscout/Provider/granite.py +223 -0
webscout/Provider/hermes.py +218 -218
webscout/Provider/llama3mitril.py +179 -179
webscout/Provider/llamatutor.py +72 -62
webscout/Provider/llmchat.py +60 -35
webscout/Provider/meta.py +794 -794
webscout/Provider/multichat.py +331 -230
webscout/Provider/typegpt.py +359 -356
webscout/Provider/yep.py +5 -5
webscout/__main__.py +5 -5
webscout/cli.py +319 -319
webscout/conversation.py +241 -242
webscout/exceptions.py +328 -328
webscout/litagent/__init__.py +28 -28
webscout/litagent/agent.py +2 -3
webscout/litprinter/__init__.py +0 -58
webscout/scout/__init__.py +8 -8
webscout/scout/core.py +884 -884
webscout/scout/element.py +459 -459
webscout/scout/parsers/__init__.py +69 -69
webscout/scout/parsers/html5lib_parser.py +172 -172
webscout/scout/parsers/html_parser.py +236 -236
webscout/scout/parsers/lxml_parser.py +178 -178
webscout/scout/utils.py +38 -38
webscout/swiftcli/__init__.py +811 -811
webscout/update_checker.py +2 -12
webscout/version.py +1 -1
webscout/webscout_search.py +1142 -1140
webscout/webscout_search_async.py +635 -635
webscout/zeroart/__init__.py +54 -54
webscout/zeroart/base.py +60 -60
webscout/zeroart/effects.py +99 -99
webscout/zeroart/fonts.py +816 -816
{webscout-7.0.dist-info → webscout-7.2.dist-info}/METADATA +21 -28
webscout-7.2.dist-info/RECORD +217 -0
webstoken/__init__.py +30 -30
webstoken/classifier.py +189 -189
webstoken/keywords.py +216 -216
webstoken/language.py +128 -128
webstoken/ner.py +164 -164
webstoken/normalizer.py +35 -35
webstoken/processor.py +77 -77
webstoken/sentiment.py +206 -206
webstoken/stemmer.py +73 -73
webstoken/tagger.py +60 -60
webstoken/tokenizer.py +158 -158
webscout/Provider/RUBIKSAI.py +0 -272
webscout-7.0.dist-info/RECORD +0 -199
{webscout-7.0.dist-info → webscout-7.2.dist-info}/LICENSE.md +0 -0
{webscout-7.0.dist-info → webscout-7.2.dist-info}/WHEEL +0 -0
{webscout-7.0.dist-info → webscout-7.2.dist-info}/entry_points.txt +0 -0
{webscout-7.0.dist-info → webscout-7.2.dist-info}/top_level.txt +0 -0

webscout/scout/element.py (changed)

@@ -1,460 +1,460 @@
-"""
-Scout Element Module - Advanced HTML Element Representation
-"""
-import re
-from typing import Optional, List, Dict, Union, Any, Callable, Iterable
-class NavigableString(str):
-    """
-    A string that knows its place in the document tree.
-    Mimics BeautifulSoup's NavigableString for better compatibility.
-    """
-    def __new__(cls, text: str):
-        """
-        Create a new NavigableString instance.
-        Args:
-            text (str): String content
-        """
-        return str.__new__(cls, text)
-    def __init__(self, text: str):
-        """
-        Initialize a navigable string.
-        Args:
-            text (str): String content
-        """
-        self.parent = None
-    def __repr__(self):
-        """String representation."""
-        return f"NavigableString({super().__repr__()})"
-    def __add__(self, other):
-        """
-        Allow concatenation of NavigableString with other strings.
-        Args:
-            other (str): String to concatenate
-        Returns:
-            str: Concatenated string
-        """
-        return str(self) + str(other)
-    def strip(self, chars=None):
-        """
-        Strip whitespace or specified characters.
-        Args:
-            chars (str, optional): Characters to strip
-        Returns:
-            str: Stripped string
-        """
-        return NavigableString(super().strip(chars))
-class Tag:
-    """
-    Represents an HTML tag with advanced traversal and manipulation capabilities.
-    Enhanced to closely mimic BeautifulSoup's Tag class.
-    """
-    def __init__(self, name: str, attrs: Dict[str, str] = None):
-        """
-        Initialize a Tag with name and attributes.
-        Args:
-            name (str): Tag name
-            attrs (dict, optional): Tag attributes
-        """
-        self.name = name
-        self.attrs = attrs or {}
-        self.contents = []
-        self.parent = None
-        self.string = None  # For single string content
-    def __str__(self):
-        """String representation of the tag."""
-        return self.decode_contents()
-    def __repr__(self):
-        """Detailed representation of the tag."""
-        return f"<{self.name} {self.attrs}>"
-    def __call__(self, *args, **kwargs):
-        """
-        Allows calling find_all directly on the tag.
-        Mimics BeautifulSoup's behavior.
-        """
-        return self.find_all(*args, **kwargs)
-    def __contains__(self, item):
-        """
-        Check if an item is in the tag's contents.
-        Args:
-            item: Item to search for
-        Returns:
-            bool: True if item is in contents, False otherwise
-        """
-        return item in self.contents
-    def __getitem__(self, key):
-        """
-        Get an attribute value using dictionary-like access.
-        Args:
-            key (str): Attribute name
-        Returns:
-            Any: Attribute value
-        """
-        return self.attrs[key]
-    def __iter__(self):
-        """
-        Iterate through tag's contents.
-        Returns:
-            Iterator: Contents of the tag
-        """
-        return iter(self.contents)
-    def __eq__(self, other):
-        """
-        Compare tags based on name and attributes.
-        Args:
-            other (Tag): Tag to compare
-        Returns:
-            bool: True if tags are equivalent
-        """
-        if not isinstance(other, Tag):
-            return False
-        return (
-            self.name == other.name and
-            self.attrs == other.attrs and
-            str(self) == str(other)
-        )
-    def __hash__(self):
-        """
-        Generate a hash for the tag.
-        Returns:
-            int: Hash value
-        """
-        return hash((self.name, frozenset(self.attrs.items()), str(self)))
-    def find(self, name=None, attrs={}, recursive=True, text=None, **kwargs) -> Optional['Tag']:
-        """
-        Find the first matching child element.
-        Enhanced with more flexible matching.
-        Args:
-            name (str, optional): Tag name to search for
-            attrs (dict, optional): Attributes to match
-            recursive (bool, optional): Search recursively
-            text (str, optional): Text content to match
-        Returns:
-            Tag or None: First matching element
-        """
-        results = self.find_all(name, attrs, recursive, text, limit=1, **kwargs)
-        return results[0] if results else None
-    def find_all(self, name=None, attrs={}, recursive=True, text=None, limit=None, **kwargs) -> List['Tag']:
-        """
-        Find all matching child elements.
-        Enhanced with more flexible matching and BeautifulSoup-like features.
-        Args:
-            name (str, optional): Tag name to search for
-            attrs (dict, optional): Attributes to match
-            recursive (bool, optional): Search recursively
-            text (str, optional): Text content to match
-            limit (int, optional): Maximum number of results
-        Returns:
-            List[Tag]: List of matching elements
-        """
-        results = []
-        def _match(tag):
-            # Check tag name with case-insensitive and regex support
-            if name:
-                if isinstance(name, str):
-                    if tag.name.lower() != name.lower():
-                        return False
-                elif isinstance(name, re.Pattern):
-                    if not name.search(tag.name):
-                        return False
-            # Check attributes with more flexible matching
-            for k, v in attrs.items():
-                # Handle special attribute matching
-                if k == 'class':
-                    tag_classes = tag.get('class', [])
-                    if isinstance(v, str) and v not in tag_classes:
-                        return False
-                    elif isinstance(v, list) and not all(cls in tag_classes for cls in v):
-                        return False
-                elif k == 'id':
-                    if tag.get('id') != v:
-                        return False
-                else:
-                    # Regex or exact match for other attributes
-                    tag_attr = tag.attrs.get(k)
-                    if isinstance(v, re.Pattern):
-                        if not v.search(str(tag_attr)):
-                            return False
-                    elif tag_attr != v:
-                        return False
-            # Check text content
-            if text:
-                tag_text = tag.get_text(strip=True)
-                if isinstance(text, str) and text.lower() not in tag_text.lower():
-                    return False
-                elif isinstance(text, re.Pattern) and not text.search(tag_text):
-                    return False
-            return True
-        def _search(element):
-            if _match(element):
-                results.append(element)
-                if limit and len(results) == limit:
-                    return
-            if recursive:
-                for child in element.contents:
-                    if isinstance(child, Tag):
-                        _search(child)
-        _search(self)
-        return results
-    def select(self, selector: str) -> List['Tag']:
-        """
-        Select elements using CSS selector.
-        Enhanced to support more complex selectors.
-        Args:
-            selector (str): CSS selector string
-        Returns:
-            List[Tag]: List of matching elements
-        """
-        # More advanced CSS selector parsing
-        # This is a simplified implementation and might need more robust parsing
-        parts = re.split(r'\s+', selector.strip())
-        results = []
-        def _match_selector(tag, selector_part):
-            # Support more complex selectors
-            if selector_part.startswith('.'):
-                # Class selector
-                return selector_part[1:] in tag.get('class', [])
-            elif selector_part.startswith('#'):
-                # ID selector
-                return tag.get('id') == selector_part[1:]
-            elif '[' in selector_part and ']' in selector_part:
-                # Attribute selector
-                attr_match = re.match(r'(\w+)\[([^=]+)(?:=(.+))?\]', selector_part)
-                if attr_match:
-                    tag_name, attr, value = attr_match.groups()
-                    if tag_name and tag.name != tag_name:
-                        return False
-                    if value:
-                        return tag.get(attr) == value.strip("'\"")
-                    return attr in tag.attrs
-            else:
-                # Tag selector
-                return tag.name == selector_part
-        def _recursive_select(element, selector_parts):
-            if not selector_parts:
-                results.append(element)
-                return
-            current_selector = selector_parts[0]
-            remaining_selectors = selector_parts[1:]
-            if _match_selector(element, current_selector):
-                if not remaining_selectors:
-                    results.append(element)
-                else:
-                    for child in element.contents:
-                        if isinstance(child, Tag):
-                            _recursive_select(child, remaining_selectors)
-        for child in self.contents:
-            if isinstance(child, Tag):
-                _recursive_select(child, parts)
-        return results
-    def select_one(self, selector: str) -> Optional['Tag']:
-        """
-        Select the first element matching the CSS selector.
-        Args:
-            selector (str): CSS selector string
-        Returns:
-            Tag or None: First matching element
-        """
-        results = self.select(selector)
-        return results[0] if results else None
-    def get_text(self, separator=' ', strip=False, types=None) -> str:
-        """
-        Extract text from the tag and its descendants.
-        Enhanced to support more flexible text extraction.
-        Args:
-            separator (str, optional): Text separator
-            strip (bool, optional): Strip whitespace
-            types (list, optional): Types of content to extract
-        Returns:
-            str: Extracted text
-        """
-        texts = []
-        for content in self.contents:
-            # Support filtering by content type
-            if types is None or type(content) in types:
-                if isinstance(content, NavigableString):
-                    texts.append(str(content))
-                elif isinstance(content, Tag):
-                    texts.append(content.get_text(separator, strip))
-        text = separator.join(texts)
-        text = re.sub(r'\n\n+', '\n', text) # Replace multiple newlines with single newlines
-        return text.strip() if strip else text
-    def find_text(self, pattern: Union[str, re.Pattern], **kwargs) -> Optional[str]:
-        """
-        Find the first text matching a pattern.
-        Args:
-            pattern (str or re.Pattern): Pattern to match
-            **kwargs: Additional arguments for get_text()
-        Returns:
-            str or None: First matching text
-        """
-        text = self.get_text(**kwargs)
-        if isinstance(pattern, str):
-            return pattern if pattern in text else None
-        elif isinstance(pattern, re.Pattern):
-            match = pattern.search(text)
-            return match.group(0) if match else None
-    def replace_text(self, old: Union[str, re.Pattern], new: str, **kwargs) -> str:
-        """
-        Replace text matching a pattern.
-        Args:
-            old (str or re.Pattern): Pattern to replace
-            new (str): Replacement text
-            **kwargs: Additional arguments for get_text()
-        Returns:
-            str: Modified text
-        """
-        text = self.get_text(**kwargs)
-        if isinstance(old, str):
-            return text.replace(old, new)
-        elif isinstance(old, re.Pattern):
-            return old.sub(new, text)
-    def get(self, key: str, default: Any = None) -> Any:
-        """
-        Get an attribute value.
-        Args:
-            key (str): Attribute name
-            default (Any, optional): Default value if attribute not found
-        Returns:
-            Any: Attribute value or default
-        """
-        return self.attrs.get(key, default)
-    def decompose(self) -> None:
-        """Remove the tag and its contents from the document."""
-        if self.parent:
-            self.parent.contents.remove(self)
-    def extract(self) -> 'Tag':
-        """
-        Remove the tag from the document and return it.
-        Returns:
-            Tag: Extracted tag
-        """
-        self.decompose()
-        return self
-    def clear(self) -> None:
-        """Remove all contents of the tag."""
-        self.contents.clear()
-    def replace_with(self, new_tag: 'Tag') -> None:
-        """
-        Replace this tag with another tag.
-        Args:
-            new_tag (Tag): Tag to replace the current tag
-        """
-        if self.parent:
-            index = self.parent.contents.index(self)
-            self.parent.contents[index] = new_tag
-            new_tag.parent = self.parent
-    def decode_contents(self, eventual_encoding='utf-8') -> str:
-        """
-        Decode the contents of the tag to a string.
-        Args:
-            eventual_encoding (str, optional): Encoding to use
-        Returns:
-            str: Decoded contents
-        """
-        return ''.join(str(content) for content in self.contents)
-    def prettify(self, formatter='minimal') -> str:
-        """
-        Return a nicely formatted representation of the tag.
-        Args:
-            formatter (str, optional): Formatting style
-        Returns:
-            str: Prettified tag representation
-        """
-        def _prettify(tag, indent=0):
-            result = ' ' * indent + f'<{tag.name}'
-            for k, v in tag.attrs.items():
-                result += f' {k}="{v}"'
-            result += '>\n'
-            for content in tag.contents:
-                if isinstance(content, Tag):
-                    result += _prettify(content, indent + 2)
-                else:
-                    result += ' ' * (indent + 2) + str(content) + '\n'
-            result += ' ' * indent + f'</{tag.name}>\n'
-            return result
+"""
+Scout Element Module - Advanced HTML Element Representation
+"""
+import re
+from typing import Optional, List, Dict, Union, Any, Callable, Iterable
+class NavigableString(str):
+    """
+    A string that knows its place in the document tree.
+    Mimics BeautifulSoup's NavigableString for better compatibility.
+    """
+    def __new__(cls, text: str):
+        """
+        Create a new NavigableString instance.
+        Args:
+            text (str): String content
+        """
+        return str.__new__(cls, text)
+    def __init__(self, text: str):
+        """
+        Initialize a navigable string.
+        Args:
+            text (str): String content
+        """
+        self.parent = None
+    def __repr__(self):
+        """String representation."""
+        return f"NavigableString({super().__repr__()})"
+    def __add__(self, other):
+        """
+        Allow concatenation of NavigableString with other strings.
+        Args:
+            other (str): String to concatenate
+        Returns:
+            str: Concatenated string
+        """
+        return str(self) + str(other)
+    def strip(self, chars=None):
+        """
+        Strip whitespace or specified characters.
+        Args:
+            chars (str, optional): Characters to strip
+        Returns:
+            str: Stripped string
+        """
+        return NavigableString(super().strip(chars))
+class Tag:
+    """
+    Represents an HTML tag with advanced traversal and manipulation capabilities.
+    Enhanced to closely mimic BeautifulSoup's Tag class.
+    """
+    def __init__(self, name: str, attrs: Dict[str, str] = None):
+        """
+        Initialize a Tag with name and attributes.
+        Args:
+            name (str): Tag name
+            attrs (dict, optional): Tag attributes
+        """
+        self.name = name
+        self.attrs = attrs or {}
+        self.contents = []
+        self.parent = None
+        self.string = None  # For single string content
+    def __str__(self):
+        """String representation of the tag."""
+        return self.decode_contents()
+    def __repr__(self):
+        """Detailed representation of the tag."""
+        return f"<{self.name} {self.attrs}>"
+    def __call__(self, *args, **kwargs):
+        """
+        Allows calling find_all directly on the tag.
+        Mimics BeautifulSoup's behavior.
+        """
+        return self.find_all(*args, **kwargs)
+    def __contains__(self, item):
+        """
+        Check if an item is in the tag's contents.
+        Args:
+            item: Item to search for
+        Returns:
+            bool: True if item is in contents, False otherwise
+        """
+        return item in self.contents
+    def __getitem__(self, key):
+        """
+        Get an attribute value using dictionary-like access.
+        Args:
+            key (str): Attribute name
+        Returns:
+            Any: Attribute value
+        """
+        return self.attrs[key]
+    def __iter__(self):
+        """
+        Iterate through tag's contents.
+        Returns:
+            Iterator: Contents of the tag
+        """
+        return iter(self.contents)
+    def __eq__(self, other):
+        """
+        Compare tags based on name and attributes.
+        Args:
+            other (Tag): Tag to compare
+        Returns:
+            bool: True if tags are equivalent
+        """
+        if not isinstance(other, Tag):
+            return False
+        return (
+            self.name == other.name and
+            self.attrs == other.attrs and
+            str(self) == str(other)
+        )
+    def __hash__(self):
+        """
+        Generate a hash for the tag.
+        Returns:
+            int: Hash value
+        """
+        return hash((self.name, frozenset(self.attrs.items()), str(self)))
+    def find(self, name=None, attrs={}, recursive=True, text=None, **kwargs) -> Optional['Tag']:
+        """
+        Find the first matching child element.
+        Enhanced with more flexible matching.
+        Args:
+            name (str, optional): Tag name to search for
+            attrs (dict, optional): Attributes to match
+            recursive (bool, optional): Search recursively
+            text (str, optional): Text content to match
+        Returns:
+            Tag or None: First matching element
+        """
+        results = self.find_all(name, attrs, recursive, text, limit=1, **kwargs)
+        return results[0] if results else None
+    def find_all(self, name=None, attrs={}, recursive=True, text=None, limit=None, **kwargs) -> List['Tag']:
+        """
+        Find all matching child elements.
+        Enhanced with more flexible matching and BeautifulSoup-like features.
+        Args:
+            name (str, optional): Tag name to search for
+            attrs (dict, optional): Attributes to match
+            recursive (bool, optional): Search recursively
+            text (str, optional): Text content to match
+            limit (int, optional): Maximum number of results
+        Returns:
+            List[Tag]: List of matching elements
+        """
+        results = []
+        def _match(tag):
+            # Check tag name with case-insensitive and regex support
+            if name:
+                if isinstance(name, str):
+                    if tag.name.lower() != name.lower():
+                        return False
+                elif isinstance(name, re.Pattern):
+                    if not name.search(tag.name):
+                        return False
+            # Check attributes with more flexible matching
+            for k, v in attrs.items():
+                # Handle special attribute matching
+                if k == 'class':
+                    tag_classes = tag.get('class', [])
+                    if isinstance(v, str) and v not in tag_classes:
+                        return False
+                    elif isinstance(v, list) and not all(cls in tag_classes for cls in v):
+                        return False
+                elif k == 'id':
+                    if tag.get('id') != v:
+                        return False
+                else:
+                    # Regex or exact match for other attributes
+                    tag_attr = tag.attrs.get(k)
+                    if isinstance(v, re.Pattern):
+                        if not v.search(str(tag_attr)):
+                            return False
+                    elif tag_attr != v:
+                        return False
+            # Check text content
+            if text:
+                tag_text = tag.get_text(strip=True)
+                if isinstance(text, str) and text.lower() not in tag_text.lower():
+                    return False
+                elif isinstance(text, re.Pattern) and not text.search(tag_text):
+                    return False
+            return True
+        def _search(element):
+            if _match(element):
+                results.append(element)
+                if limit and len(results) == limit:
+                    return
+            if recursive:
+                for child in element.contents:
+                    if isinstance(child, Tag):
+                        _search(child)
+        _search(self)
+        return results
+    def select(self, selector: str) -> List['Tag']:
+        """
+        Select elements using CSS selector.
+        Enhanced to support more complex selectors.
+        Args:
+            selector (str): CSS selector string
+        Returns:
+            List[Tag]: List of matching elements
+        """
+        # More advanced CSS selector parsing
+        # This is a simplified implementation and might need more robust parsing
+        parts = re.split(r'\s+', selector.strip())
+        results = []
+        def _match_selector(tag, selector_part):
+            # Support more complex selectors
+            if selector_part.startswith('.'):
+                # Class selector
+                return selector_part[1:] in tag.get('class', [])
+            elif selector_part.startswith('#'):
+                # ID selector
+                return tag.get('id') == selector_part[1:]
+            elif '[' in selector_part and ']' in selector_part:
+                # Attribute selector
+                attr_match = re.match(r'(\w+)\[([^=]+)(?:=(.+))?\]', selector_part)
+                if attr_match:
+                    tag_name, attr, value = attr_match.groups()
+                    if tag_name and tag.name != tag_name:
+                        return False
+                    if value:
+                        return tag.get(attr) == value.strip("'\"")
+                    return attr in tag.attrs
+            else:
+                # Tag selector
+                return tag.name == selector_part
+        def _recursive_select(element, selector_parts):
+            if not selector_parts:
+                results.append(element)
+                return
+            current_selector = selector_parts[0]
+            remaining_selectors = selector_parts[1:]
+            if _match_selector(element, current_selector):
+                if not remaining_selectors:
+                    results.append(element)
+                else:
+                    for child in element.contents:
+                        if isinstance(child, Tag):
+                            _recursive_select(child, remaining_selectors)
+        for child in self.contents:
+            if isinstance(child, Tag):
+                _recursive_select(child, parts)
+        return results
+    def select_one(self, selector: str) -> Optional['Tag']:
+        """
+        Select the first element matching the CSS selector.
+        Args:
+            selector (str): CSS selector string
+        Returns:
+            Tag or None: First matching element
+        """
+        results = self.select(selector)
+        return results[0] if results else None
+    def get_text(self, separator=' ', strip=False, types=None) -> str:
+        """
+        Extract text from the tag and its descendants.
+        Enhanced to support more flexible text extraction.
+        Args:
+            separator (str, optional): Text separator
+            strip (bool, optional): Strip whitespace
+            types (list, optional): Types of content to extract
+        Returns:
+            str: Extracted text
+        """
+        texts = []
+        for content in self.contents:
+            # Support filtering by content type
+            if types is None or type(content) in types:
+                if isinstance(content, NavigableString):
+                    texts.append(str(content))
+                elif isinstance(content, Tag):
+                    texts.append(content.get_text(separator, strip))
+        text = separator.join(texts)
+        text = re.sub(r'\n\n+', '\n', text) # Replace multiple newlines with single newlines
+        return text.strip() if strip else text
+    def find_text(self, pattern: Union[str, re.Pattern], **kwargs) -> Optional[str]:
+        """
+        Find the first text matching a pattern.
+        Args:
+            pattern (str or re.Pattern): Pattern to match
+            **kwargs: Additional arguments for get_text()
+        Returns:
+            str or None: First matching text
+        """
+        text = self.get_text(**kwargs)
+        if isinstance(pattern, str):
+            return pattern if pattern in text else None
+        elif isinstance(pattern, re.Pattern):
+            match = pattern.search(text)
+            return match.group(0) if match else None
+    def replace_text(self, old: Union[str, re.Pattern], new: str, **kwargs) -> str:
+        """
+        Replace text matching a pattern.
+        Args:
+            old (str or re.Pattern): Pattern to replace
+            new (str): Replacement text
+            **kwargs: Additional arguments for get_text()
+        Returns:
+            str: Modified text
+        """
+        text = self.get_text(**kwargs)
+        if isinstance(old, str):
+            return text.replace(old, new)
+        elif isinstance(old, re.Pattern):
+            return old.sub(new, text)
+    def get(self, key: str, default: Any = None) -> Any:
+        """
+        Get an attribute value.
+        Args:
+            key (str): Attribute name
+            default (Any, optional): Default value if attribute not found
+        Returns:
+            Any: Attribute value or default
+        """
+        return self.attrs.get(key, default)
+    def decompose(self) -> None:
+        """Remove the tag and its contents from the document."""
+        if self.parent:
+            self.parent.contents.remove(self)
+    def extract(self) -> 'Tag':
+        """
+        Remove the tag from the document and return it.
+        Returns:
+            Tag: Extracted tag
+        """
+        self.decompose()
+        return self
+    def clear(self) -> None:
+        """Remove all contents of the tag."""
+        self.contents.clear()
+    def replace_with(self, new_tag: 'Tag') -> None:
+        """
+        Replace this tag with another tag.
+        Args:
+            new_tag (Tag): Tag to replace the current tag
+        """
+        if self.parent:
+            index = self.parent.contents.index(self)
+            self.parent.contents[index] = new_tag
+            new_tag.parent = self.parent
+    def decode_contents(self, eventual_encoding='utf-8') -> str:
+        """
+        Decode the contents of the tag to a string.
+        Args:
+            eventual_encoding (str, optional): Encoding to use
+        Returns:
+            str: Decoded contents
+        """
+        return ''.join(str(content) for content in self.contents)
+    def prettify(self, formatter='minimal') -> str:
+        """
+        Return a nicely formatted representation of the tag.
+        Args:
+            formatter (str, optional): Formatting style
+        Returns:
+            str: Prettified tag representation
+        """
+        def _prettify(tag, indent=0):
+            result = ' ' * indent + f'<{tag.name}'
+            for k, v in tag.attrs.items():
+                result += f' {k}="{v}"'
+            result += '>\n'
+            for content in tag.contents:
+                if isinstance(content, Tag):
+                    result += _prettify(content, indent + 2)
+                else:
+                    result += ' ' * (indent + 2) + str(content) + '\n'
+            result += ' ' * indent + f'</{tag.name}>\n'
+            return result
         return _prettify(self)

webscout 7.0__py3-none-any.whl → 7.2__py3-none-any.whl

Potentially problematic release.

webscout 7.0__py3-none-any.whl → 7.2__py3-none-any.whl