tldextract 5.1.2__py3-none-any.whl → 5.2.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- tldextract/.tld_set_snapshot +5247 -3232
- tldextract/__init__.py +4 -2
- tldextract/_version.py +9 -4
- tldextract/cache.py +5 -16
- tldextract/remote.py +1 -1
- tldextract/suffix_list.py +3 -1
- tldextract/tldextract.py +99 -42
- {tldextract-5.1.2.dist-info → tldextract-5.2.0.dist-info}/METADATA +58 -44
- tldextract-5.2.0.dist-info/RECORD +16 -0
- {tldextract-5.1.2.dist-info → tldextract-5.2.0.dist-info}/WHEEL +1 -1
- {tldextract-5.1.2.dist-info → tldextract-5.2.0.dist-info/licenses}/LICENSE +1 -1
- tldextract-5.1.2.dist-info/RECORD +0 -16
- {tldextract-5.1.2.dist-info → tldextract-5.2.0.dist-info}/entry_points.txt +0 -0
- {tldextract-5.1.2.dist-info → tldextract-5.2.0.dist-info}/top_level.txt +0 -0
tldextract/__init__.py
CHANGED
@@ -1,12 +1,14 @@
 """Export tldextract's public interface."""
 
 from . import _version
-from .tldextract import TLDExtract, extract
+from .tldextract import ExtractResult, TLDExtract, extract, update
 
 __version__: str = _version.version
 
 __all__ = [
+    "__version__",
     "extract",
+    "ExtractResult",
     "TLDExtract",
-    "__version__",
+    "update",
 ]
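The upshot of the widened export list: `ExtractResult` and `update` are now importable straight from the package root. A minimal usage sketch (not shown in the diff itself; `update()` is called with its defaults, which invalidate the cached suffix-list state so it is re-fetched on next use):

```python
from tldextract import ExtractResult, TLDExtract, extract, update

result: ExtractResult = extract("http://forums.bbc.co.uk")
print(result.registered_domain)  # bbc.co.uk

update()  # invalidate/refresh the cached Public Suffix List data
```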
tldextract/_version.py
CHANGED
@@ -1,8 +1,13 @@
-# file generated by setuptools_scm
+# file generated by setuptools-scm
 # don't change, don't track in version control
+
+__all__ = ["__version__", "__version_tuple__", "version", "version_tuple"]
+
 TYPE_CHECKING = False
 if TYPE_CHECKING:
-    from typing import Tuple, Union
+    from typing import Tuple
+    from typing import Union
+
     VERSION_TUPLE = Tuple[Union[int, str], ...]
 else:
     VERSION_TUPLE = object
@@ -12,5 +17,5 @@ __version__: str
 __version_tuple__: VERSION_TUPLE
 version_tuple: VERSION_TUPLE
 
-__version__ = version = '5.1.2'
-__version_tuple__ = version_tuple = (5, 1, 2)
+__version__ = version = '5.2.0'
+__version_tuple__ = version_tuple = (5, 2, 0)
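Nothing functional changed here beyond the regenerated setuptools-scm template and the version bump, but this is the file that makes the release introspectable. For instance (assuming a 5.2.0 install):

```python
import tldextract

print(tldextract.__version__)             # "5.2.0", re-exported by __init__.py above
print(tldextract._version.version_tuple)  # (5, 2, 0)
```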
tldextract/cache.py
CHANGED
@@ -24,18 +24,6 @@ _DID_LOG_UNABLE_TO_CACHE = False
 
 T = TypeVar("T")
 
-if sys.version_info >= (3, 9):
-
-    def md5(*args: bytes) -> hashlib._Hash:
-        """Use argument only available in newer Python.
-
-        In this file, MD5 is only used for cache location, not security.
-        """
-        return hashlib.md5(*args, usedforsecurity=False)
-
-else:
-    md5 = hashlib.md5
-
 
 def get_pkg_unique_identifier() -> str:
     """Generate an identifier unique to the python version, tldextract version, and python instance.
@@ -51,7 +39,9 @@ def get_pkg_unique_identifier() -> str:
     tldextract_version = "tldextract-" + version
     python_env_name = os.path.basename(sys.prefix)
     # just to handle the edge case of two identically named python environments
-    python_binary_path_short_hash = md5(sys.prefix.encode("utf-8")).hexdigest()[:6]
+    python_binary_path_short_hash = hashlib.md5(
+        sys.prefix.encode("utf-8"), usedforsecurity=False
+    ).hexdigest()[:6]
     python_version = ".".join([str(v) for v in sys.version_info[:-1]])
     identifier_parts = [
         python_version,
@@ -113,8 +103,7 @@ class DiskCache:
             with open(cache_filepath) as cache_file:
                 return json.load(cache_file)
         except (OSError, ValueError) as exc:
-
-            raise KeyError("namespace: " + namespace + " key: " + repr(key)) from None
+            raise KeyError("namespace: " + namespace + " key: " + repr(key)) from exc
 
     def set(  # noqa: A003
         self, namespace: str, key: str | dict[str, Hashable], value: object
@@ -238,7 +227,7 @@ def _fetch_url(session: requests.Session, url: str, timeout: int | None) -> str:
 
 def _make_cache_key(inputs: str | dict[str, Hashable]) -> str:
     key = repr(inputs)
-    return md5(key.encode("utf8")).hexdigest()
+    return hashlib.md5(key.encode("utf8"), usedforsecurity=False).hexdigest()
 
 
 def _make_dir(filename: str) -> None:
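Both hashing call sites collapse the old Python 3.8 shim into direct `hashlib.md5(..., usedforsecurity=False)` calls, possible because the `usedforsecurity` flag exists on Python >= 3.9 and this release drops 3.8 (see the METADATA diff below). A standalone sketch of the same non-cryptographic cache-key hashing:

```python
import hashlib

def make_cache_key(inputs: str) -> str:
    # usedforsecurity=False flags this MD5 as a stable identifier, not a
    # security primitive, mirroring the calls in cache.py above.
    return hashlib.md5(repr(inputs).encode("utf8"), usedforsecurity=False).hexdigest()

print(make_cache_key("https://publicsuffix.org/list/public_suffix_list.dat"))
```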
tldextract/remote.py
CHANGED
@@ -46,7 +46,7 @@ def _schemeless_url(url: str) -> str:
         return url[2:]
     if (
         double_slashes_start < 2
-        or not url[double_slashes_start - 1] == ":"
+        or url[double_slashes_start - 1] != ":"
         or set(url[: double_slashes_start - 1]) - scheme_chars_set
     ):
         return url
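The one-line change rewrites `not x == y` as the idiomatic `x != y`; behavior is identical. A self-contained sketch of the surrounding check, reconstructed from the context lines (`scheme_chars_set` and the leading `url.find("//")` handling are assumptions about the unshown parts of `remote.py`):

```python
scheme_chars_set = set("abcdefghijklmnopqrstuvwxyz0123456789+-.")  # assumed contents

def schemeless_url(url: str) -> str:
    double_slashes_start = url.find("//")
    if double_slashes_start == 0:
        return url[2:]
    if (
        double_slashes_start < 2
        or url[double_slashes_start - 1] != ":"
        or set(url[: double_slashes_start - 1]) - scheme_chars_set
    ):
        return url
    return url[double_slashes_start + 2 :]

print(schemeless_url("http://example.com/"))      # example.com/
print(schemeless_url("mailto:user@example.com"))  # unchanged: no "//"
```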
tldextract/suffix_list.py
CHANGED
@@ -47,7 +47,9 @@ def find_first_response(
                 session=session, url=url, timeout=cache_fetch_timeout
             )
         except requests.exceptions.RequestException:
-            LOG.exception("Exception reading Public Suffix List url %s", url)
+            LOG.warning(
+                "Exception reading Public Suffix List url %s", url, exc_info=True
+            )
     finally:
         # Ensure the session is always closed if it's constructed in the method
         if session_created:
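The effect is to demote a failed suffix-list fetch from ERROR to WARNING severity while `exc_info=True` keeps the traceback (assuming the truncated minus line was `LOG.exception`, which logs at ERROR). A runnable sketch of the two styles:

```python
import logging

logging.basicConfig(level=logging.DEBUG)
LOG = logging.getLogger("tldextract")

try:
    raise OSError("connection refused")  # stand-in for a failed HTTP fetch
except OSError:
    # Old style: ERROR record with traceback.
    LOG.exception("Exception reading Public Suffix List url %s", "https://example.invalid")
    # New style: WARNING record, traceback preserved.
    LOG.warning(
        "Exception reading Public Suffix List url %s", "https://example.invalid", exc_info=True
    )
```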
tldextract/tldextract.py
CHANGED
@@ -4,30 +4,30 @@ It does this via the Public Suffix List (PSL).
 
 >>> import tldextract
 
->>> tldextract.extract('http://forums.news.cnn.com/')
+>>> tldextract.extract("http://forums.news.cnn.com/")
 ExtractResult(subdomain='forums.news', domain='cnn', suffix='com', is_private=False)
 
->>> tldextract.extract('http://forums.bbc.co.uk/') # United Kingdom
+>>> tldextract.extract("http://forums.bbc.co.uk/") # United Kingdom
 ExtractResult(subdomain='forums', domain='bbc', suffix='co.uk', is_private=False)
 
->>> tldextract.extract('http://www.worldbank.org.kg/') # Kyrgyzstan
+>>> tldextract.extract("http://www.worldbank.org.kg/") # Kyrgyzstan
 ExtractResult(subdomain='www', domain='worldbank', suffix='org.kg', is_private=False)
 
 Note subdomain and suffix are _optional_. Not all URL-like inputs have a
 subdomain or a valid suffix.
 
->>> tldextract.extract('google.com')
+>>> tldextract.extract("google.com")
 ExtractResult(subdomain='', domain='google', suffix='com', is_private=False)
 
->>> tldextract.extract('google.notavalidsuffix')
+>>> tldextract.extract("google.notavalidsuffix")
 ExtractResult(subdomain='google', domain='notavalidsuffix', suffix='', is_private=False)
 
->>> tldextract.extract('http://127.0.0.1:8080/deployed/')
+>>> tldextract.extract("http://127.0.0.1:8080/deployed/")
 ExtractResult(subdomain='', domain='127.0.0.1', suffix='', is_private=False)
 
 To rejoin the original hostname, if it was indeed a valid, registered hostname:
 
->>> ext = tldextract.extract('http://forums.bbc.co.uk')
+>>> ext = tldextract.extract("http://forums.bbc.co.uk")
 >>> ext.registered_domain
 'bbc.co.uk'
 >>> ext.fqdn
@@ -36,7 +36,6 @@ To rejoin the original hostname, if it was indeed a valid, registered hostname:
 
 from __future__ import annotations
 
-import logging
 import os
 import urllib.parse
 from collections.abc import Collection, Sequence
@@ -50,9 +49,6 @@ from .cache import DiskCache, get_cache_dir
 from .remote import lenient_netloc, looks_like_ip, looks_like_ipv6
 from .suffix_list import get_suffix_lists
 
-LOG = logging.getLogger("tldextract")
-
-
 CACHE_TIMEOUT = os.environ.get("TLDEXTRACT_CACHE_TIMEOUT")
 
 PUBLIC_SUFFIX_LIST_URLS = (
@@ -65,21 +61,48 @@ PUBLIC_SUFFIX_LIST_URLS = (
 class ExtractResult:
     """A URL's extracted subdomain, domain, and suffix.
 
-
+    These first 3 fields are what most users of this library will care about.
+    They are the split, non-overlapping hostname components of the input URL.
+    They can be used to rebuild the original URL's hostname.
+
+    Beyond the first 3 fields, the class contains metadata fields, like a flag
+    that indicates if the input URL's suffix is from a private domain.
     """
 
     subdomain: str
+    """All subdomains beneath the domain of the input URL, if it contained any such subdomains, or else the empty string."""
+
     domain: str
+    """The topmost domain of the input URL, if it contained a domain name, or else everything hostname-like in the input.
+
+    If the input URL didn't contain a real domain name, the `suffix` field will
+    be empty, and this field will catch values like an IP address, or
+    private network hostnames like "localhost".
+    """
+
     suffix: str
+    """The public suffix of the input URL, if it contained one, or else the empty string.
+
+    If `include_psl_private_domains` was set to `False`, this field is the same
+    as `registry_suffix`, i.e. a domain under which people can register
+    subdomains through a registrar. If `include_psl_private_domains` was set to
+    `True`, this field may be a PSL private domain, like "blogspot.com".
+    """
+
     is_private: bool
+    """Whether the input URL belongs in the Public Suffix List's private domains.
+
+    If `include_psl_private_domains` was set to `False`, this field is always
+    `False`.
+    """
 
     @property
     def registered_domain(self) -> str:
-        """
+        """The `domain` and `suffix` fields joined with a dot, if they're both set, or else the empty string.
 
-        >>> extract('http://forums.bbc.co.uk').registered_domain
+        >>> extract("http://forums.bbc.co.uk").registered_domain
         'bbc.co.uk'
-        >>> extract('http://localhost:8080').registered_domain
+        >>> extract("http://localhost:8080").registered_domain
         ''
         """
         if self.suffix and self.domain:
@@ -88,11 +111,11 @@ class ExtractResult:
 
     @property
     def fqdn(self) -> str:
-        """
+        """The Fully Qualified Domain Name (FQDN), if there is a proper `domain` and `suffix`, or else the empty string.
 
-        >>> extract('http://forums.bbc.co.uk/path/to/file').fqdn
+        >>> extract("http://forums.bbc.co.uk/path/to/file").fqdn
         'forums.bbc.co.uk'
-        >>> extract('http://localhost:8080').fqdn
+        >>> extract("http://localhost:8080").fqdn
         ''
         """
         if self.suffix and (self.domain or self.is_private):
@@ -101,13 +124,13 @@ class ExtractResult:
 
     @property
     def ipv4(self) -> str:
-        """
+        """The IPv4 address, if that is what the input domain/URL was, or else the empty string.
 
-        >>> extract('http://127.0.0.1/path/to/file').ipv4
+        >>> extract("http://127.0.0.1/path/to/file").ipv4
         '127.0.0.1'
-        >>> extract('http://127.0.0.1.1/path/to/file').ipv4
+        >>> extract("http://127.0.0.1.1/path/to/file").ipv4
         ''
-        >>> extract('http://256.1.1.1').ipv4
+        >>> extract("http://256.1.1.1").ipv4
         ''
         """
         if (
@@ -120,13 +143,17 @@ class ExtractResult:
 
     @property
     def ipv6(self) -> str:
-        """
+        """The IPv6 address, if that is what the input domain/URL was, or else the empty string.
 
-        >>> extract('http://[aBcD:ef01:2345:6789:aBcD:ef01:127.0.0.1]/path/to/file').ipv6
+        >>> extract(
+        ...     "http://[aBcD:ef01:2345:6789:aBcD:ef01:127.0.0.1]/path/to/file"
+        ... ).ipv6
         'aBcD:ef01:2345:6789:aBcD:ef01:127.0.0.1'
-        >>> extract('http://[aBcD:ef01:2345:6789:aBcD:ef01:127.0.0.1.1]/path/to/file').ipv6
+        >>> extract(
+        ...     "http://[aBcD:ef01:2345:6789:aBcD:ef01:127.0.0.1.1]/path/to/file"
+        ... ).ipv6
         ''
-        >>> extract('http://[aBcD:ef01:2345:6789:aBcD:ef01:256.0.0.1]').ipv6
+        >>> extract("http://[aBcD:ef01:2345:6789:aBcD:ef01:256.0.0.1]").ipv6
         ''
         """
         min_num_ipv6_chars = 4
@@ -141,6 +168,31 @@ class ExtractResult:
             return debracketed
         return ""
 
+    @property
+    def reverse_domain_name(self) -> str:
+        """The domain name in Reverse Domain Name Notation.
+
+        Joins extracted components of the input URL in reverse domain name
+        notation. The suffix is used as the leftmost component, followed by the
+        domain, then followed by the subdomain with its parts reversed.
+
+        Reverse Domain Name Notation is typically used to organize namespaces
+        for packages and plugins. Technically, a full reversal would reverse
+        the parts of the suffix, e.g. "co.uk" would become "uk.co", but this is
+        not done in practice when Reverse Domain Name Notation is called for.
+        So this property leaves the `suffix` part in its original order.
+
+        >>> extract("login.example.com").reverse_domain_name
+        'com.example.login'
+
+        >>> extract("login.example.co.uk").reverse_domain_name
+        'co.uk.example.login'
+        """
+        stack = [self.suffix, self.domain]
+        if self.subdomain:
+            stack.extend(reversed(self.subdomain.split(".")))
+        return ".".join(stack)
+
 
 class TLDExtract:
     """A callable for extracting, subdomain, domain, and suffix components from a URL."""
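A quick usage sketch of the new `reverse_domain_name` property, alongside an equivalent hand-rolled join (the equivalence assumes a non-empty subdomain, the case the property itself guards):

```python
import tldextract

ext = tldextract.extract("login.example.co.uk")
print(ext.reverse_domain_name)  # co.uk.example.login

# Same result by hand: suffix first, then domain, then reversed subdomain parts.
parts = [ext.suffix, ext.domain, *reversed(ext.subdomain.split("."))]
print(".".join(parts))          # co.uk.example.login
```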
@@ -161,13 +213,14 @@ class TLDExtract:
         the `cache_dir` will live in the tldextract directory. You can disable
         the caching functionality of this module by setting `cache_dir` to `None`.
 
-        If the cached version does not exist […]
-        […] `suffix_list_urls` in order, […]
-        […]
-        […]
-        […]
-        […]
-        […]
+        If the cached version does not exist, such as on the first run, HTTP
+        request the URLs in `suffix_list_urls` in order, and use the first
+        successful response for public suffix definitions. Subsequent, untried
+        URLs are ignored. The default URLs are the latest version of the
+        Mozilla Public Suffix List and its mirror, but any similar document URL
+        could be specified. Local files can be specified by using the `file://`
+        protocol (see `urllib2` documentation). To disable HTTP requests, set
+        this to an empty sequence.
 
         If there is no cached version loaded and no data is found from the `suffix_list_urls`,
         the module will fall back to the included TLD set snapshot. If you do not want
@@ -179,7 +232,9 @@ class TLDExtract:
         suffix, so these domains are excluded by default. If you'd like them
         included instead, set `include_psl_private_domains` to True.
 
-        You can […]
+        You can specify additional suffixes in the `extra_suffixes` argument.
+        These will be merged into whatever public suffix definitions are
+        already in use by `tldextract`, above.
 
         cache_fetch_timeout is passed unmodified to the underlying request object
         per the requests documentation here:
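Pulling the restored docstring together, a hedged sketch of a constructor call exercising the documented parameters (the paths and the extra suffix are illustrative only):

```python
import tldextract

extractor = tldextract.TLDExtract(
    cache_dir="/tmp/tldextract-cache",    # or None to disable caching
    include_psl_private_domains=True,     # opt in to PSL private domains
    extra_suffixes=["internal.example"],  # hypothetical additional suffix
)
print(extractor("service.team.internal.example"))
```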
@@ -237,9 +292,9 @@
         I.e. its effective TLD, gTLD, ccTLD, etc. components.
 
         >>> extractor = TLDExtract()
-        >>> extractor.extract_str('http://forums.news.cnn.com/')
+        >>> extractor.extract_str("http://forums.news.cnn.com/")
         ExtractResult(subdomain='forums.news', domain='cnn', suffix='com', is_private=False)
-        >>> extractor.extract_str('http://forums.bbc.co.uk/')
+        >>> extractor.extract_str("http://forums.bbc.co.uk/")
         ExtractResult(subdomain='forums', domain='bbc', suffix='co.uk', is_private=False)
 
         Allows configuring the HTTP request via the optional `session`
@@ -272,9 +327,11 @@
         name has already been parsed.
 
         >>> extractor = TLDExtract()
-        >>> extractor.extract_urllib(urllib.parse.urlsplit('http://forums.news.cnn.com/'))
+        >>> extractor.extract_urllib(
+        ...     urllib.parse.urlsplit("http://forums.news.cnn.com/")
+        ... )
         ExtractResult(subdomain='forums.news', domain='cnn', suffix='com', is_private=False)
-        >>> extractor.extract_urllib(urllib.parse.urlsplit('http://forums.bbc.co.uk/'))
+        >>> extractor.extract_urllib(urllib.parse.urlsplit("http://forums.bbc.co.uk/"))
         ExtractResult(subdomain='forums', domain='bbc', suffix='co.uk', is_private=False)
         """
         return self._extract_netloc(
@@ -298,9 +355,9 @@
             len(netloc_with_ascii_dots) >= min_num_ipv6_chars
             and netloc_with_ascii_dots[0] == "["
             and netloc_with_ascii_dots[-1] == "]"
+            and looks_like_ipv6(netloc_with_ascii_dots[1:-1])
         ):
-            if looks_like_ipv6(netloc_with_ascii_dots[1:-1]):
-                return ExtractResult("", netloc_with_ascii_dots, "", is_private=False)
+            return ExtractResult("", netloc_with_ascii_dots, "", is_private=False)
 
         labels = netloc_with_ascii_dots.split(".")
 
@@ -330,9 +387,9 @@
 
     @property
     def tlds(self, session: requests.Session | None = None) -> list[str]:
-        """
+        """The list of TLDs used by default.
 
-        This will vary based on `include_psl_private_domains` and `extra_suffixes
+        This will vary based on `include_psl_private_domains` and `extra_suffixes`.
         """
         return list(self._get_tld_extractor(session=session).tlds())
{tldextract-5.1.2.dist-info → tldextract-5.2.0.dist-info}/METADATA
CHANGED
@@ -1,6 +1,6 @@
-Metadata-Version: 2.1
+Metadata-Version: 2.4
 Name: tldextract
-Version: 5.1.2
+Version: 5.2.0
 Summary: Accurately separates a URL's subdomain, domain, and public suffix, using the Public Suffix List (PSL). By default, this includes the public ICANN TLDs and their exceptions. You can optionally support the Public Suffix List's private domains as well.
 Author-email: John Kurkowski <john.kurkowski@gmail.com>
 License: BSD-3-Clause
@@ -10,33 +10,34 @@ Classifier: Development Status :: 5 - Production/Stable
 Classifier: Topic :: Utilities
 Classifier: License :: OSI Approved :: BSD License
 Classifier: Programming Language :: Python :: 3
-Classifier: Programming Language :: Python :: 3.8
 Classifier: Programming Language :: Python :: 3.9
 Classifier: Programming Language :: Python :: 3.10
 Classifier: Programming Language :: Python :: 3.11
 Classifier: Programming Language :: Python :: 3.12
-Requires-Python: >=3.8
+Classifier: Programming Language :: Python :: 3.13
+Requires-Python: >=3.9
 Description-Content-Type: text/markdown
 License-File: LICENSE
 Requires-Dist: idna
-Requires-Dist: requests >=2.1.0
-Requires-Dist: requests-file >=1.4
-Requires-Dist: filelock >=3.0.8
+Requires-Dist: requests>=2.1.0
+Requires-Dist: requests-file>=1.4
+Requires-Dist: filelock>=3.0.8
 Provides-Extra: release
-Requires-Dist: build ; extra == 'release'
-Requires-Dist: twine ; extra == 'release'
+Requires-Dist: build; extra == "release"
+Requires-Dist: twine; extra == "release"
 Provides-Extra: testing
-Requires-Dist: black ; extra == 'testing'
-Requires-Dist: mypy ; extra == 'testing'
-Requires-Dist: pytest ; extra == 'testing'
-Requires-Dist: pytest-gitignore ; extra == 'testing'
-Requires-Dist: pytest-mock ; extra == 'testing'
-Requires-Dist: responses ; extra == 'testing'
-Requires-Dist: ruff ; extra == 'testing'
-Requires-Dist: syrupy ; extra == 'testing'
-Requires-Dist: tox ; extra == 'testing'
-Requires-Dist: types-filelock ; extra == 'testing'
-Requires-Dist: types-requests ; extra == 'testing'
+Requires-Dist: mypy; extra == "testing"
+Requires-Dist: pytest; extra == "testing"
+Requires-Dist: pytest-gitignore; extra == "testing"
+Requires-Dist: pytest-mock; extra == "testing"
+Requires-Dist: responses; extra == "testing"
+Requires-Dist: ruff; extra == "testing"
+Requires-Dist: syrupy; extra == "testing"
+Requires-Dist: tox; extra == "testing"
+Requires-Dist: tox-uv; extra == "testing"
+Requires-Dist: types-filelock; extra == "testing"
+Requires-Dist: types-requests; extra == "testing"
+Dynamic: license-file
 
 # tldextract [![PyPI version](https://badge.fury.io/py/tldextract.svg)](https://badge.fury.io/py/tldextract) [![Build Status](https://github.com/john-kurkowski/tldextract/actions/workflows/ci.yml/badge.svg)](https://github.com/john-kurkowski/tldextract/actions/workflows/ci.yml)
 
@@ -95,8 +96,17 @@ To rejoin the original hostname, if it was indeed a valid, registered hostname:
 'forums.bbc.co.uk'
 ```
 
+In addition to the Python interface, there is a command-line interface. Split
+the URL components by space:
+
+```zsh
+$ tldextract 'http://forums.bbc.co.uk'
+forums bbc co.uk
+```
+
 By default, this package supports the public ICANN TLDs and their exceptions.
-You can optionally support the Public Suffix List's private domains as well.
+You can optionally support the Public Suffix List's [private
+domains](#public-vs-private-domains) as well.
 
 This package started by implementing the chosen answer from [this StackOverflow question on
 getting the "domain name" from a URL](http://stackoverflow.com/questions/569137/how-to-get-domain-name-from-url/569219#569219).
@@ -118,19 +128,12 @@ Or the latest dev version:
 pip install -e 'git://github.com/john-kurkowski/tldextract.git#egg=tldextract'
 ```
 
-Command-line usage, splits the URL components by space:
-
-```zsh
-tldextract http://forums.bbc.co.uk
-# forums bbc co.uk
-```
-
 ## Note about caching
 
 Beware when first calling `tldextract`, it updates its TLD list with a live HTTP
 request. This updated TLD set is usually cached indefinitely in `$HOME/.cache/python-tldextract`.
-To control the cache's location, set TLDEXTRACT_CACHE environment variable or set the
-cache_dir path […]
+To control the cache's location, set the `TLDEXTRACT_CACHE` environment variable or set the
+`cache_dir` path when constructing a `TLDExtract`.
 
 (Arguably runtime bootstrapping like that shouldn't be the default behavior,
 like for production systems. But I want you to have the latest TLDs, especially
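A short sketch of the two cache controls the note above describes (the path is illustrative; the environment variable can equally be set outside Python):

```python
import os
import tldextract

os.environ["TLDEXTRACT_CACHE"] = "/var/cache/tldextract"            # option 1: env var
extract = tldextract.TLDExtract(cache_dir="/var/cache/tldextract")  # option 2: constructor
```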
@@ -188,15 +191,17 @@ ExtractResult(subdomain='waiterrant', domain='blogspot', suffix='com', is_privat
|
|
188
191
|
```
|
189
192
|
|
190
193
|
The following overrides this.
|
194
|
+
|
191
195
|
```python
|
192
196
|
>>> extract = tldextract.TLDExtract()
|
193
197
|
>>> extract('waiterrant.blogspot.com', include_psl_private_domains=True)
|
194
198
|
ExtractResult(subdomain='', domain='waiterrant', suffix='blogspot.com', is_private=True)
|
195
199
|
```
|
196
200
|
|
197
|
-
|
201
|
+
To change the default for all extract calls:
|
202
|
+
|
198
203
|
```python
|
199
|
-
>>> extract = tldextract.TLDExtract(
|
204
|
+
>>> extract = tldextract.TLDExtract(include_psl_private_domains=True)
|
200
205
|
>>> extract('waiterrant.blogspot.com')
|
201
206
|
ExtractResult(subdomain='', domain='waiterrant', suffix='blogspot.com', is_private=True)
|
202
207
|
```
|
@@ -219,10 +224,12 @@ extract = tldextract.TLDExtract(
|
|
219
224
|
fallback_to_snapshot=False)
|
220
225
|
```
|
221
226
|
|
222
|
-
|
223
|
-
|
227
|
+
If the cached version of public suffix definitions doesn't exist, such as on
|
228
|
+
the first run, the above snippet will request the URLs you specified in order,
|
229
|
+
and use the first successful response.
|
224
230
|
|
225
|
-
If you want to use input data from your local filesystem,
|
231
|
+
If you want to use input data from your local filesystem, use the `file://`
|
232
|
+
protocol with an absolute path:
|
226
233
|
|
227
234
|
```python
|
228
235
|
extract = tldextract.TLDExtract(
|
@@ -231,17 +238,24 @@ extract = tldextract.TLDExtract(
|
|
231
238
|
fallback_to_snapshot=False)
|
232
239
|
```
|
233
240
|
|
234
|
-
|
235
|
-
`os.path` is your friend.
|
236
|
-
|
237
|
-
The command line update command can be used with a URL or local file you specify:
|
241
|
+
This also works via command line update:
|
238
242
|
|
239
243
|
```zsh
|
240
244
|
tldextract --update --suffix_list_url "http://foo.bar.baz"
|
241
245
|
```
|
242
246
|
|
243
|
-
|
244
|
-
list on first use, or if you are behind a complex
|
247
|
+
Using your own URLs could be useful in production when you don't want the delay
|
248
|
+
with updating the suffix list on first use, or if you are behind a complex
|
249
|
+
firewall.
|
250
|
+
|
251
|
+
You can also specify additional suffixes in the `extra_suffixes` param. These
|
252
|
+
will be merged into whatever public suffix definitions are already in use by
|
253
|
+
`tldextract`.
|
254
|
+
|
255
|
+
```python
|
256
|
+
extract = tldextract.TLDExtract(
|
257
|
+
extra_suffixes=["foo", "bar", "baz"])
|
258
|
+
```
|
245
259
|
|
246
260
|
## FAQ
|
247
261
|
|
@@ -250,9 +264,9 @@ list on first use, or if you are behind a complex firewall that prevents a simpl
|
|
250
264
|
This project doesn't contain an actual list of public suffixes. That comes from
|
251
265
|
[the Public Suffix List (PSL)](https://publicsuffix.org/). Submit amendments there.
|
252
266
|
|
253
|
-
|
267
|
+
In the meantime, you can tell tldextract about your exception by either
|
254
268
|
forking the PSL and using your fork in the `suffix_list_urls` param, or adding
|
255
|
-
your suffix piecemeal with the `extra_suffixes` param.
|
269
|
+
your suffix piecemeal with the `extra_suffixes` param.
|
256
270
|
|
257
271
|
### I see my suffix in [the Public Suffix List (PSL)](https://publicsuffix.org/), but this library doesn't extract it.
|
258
272
|
|
@@ -309,5 +323,5 @@ tox -e py311
|
|
309
323
|
Automatically format all code:
|
310
324
|
|
311
325
|
```zsh
|
312
|
-
|
326
|
+
ruff format .
|
313
327
|
```
|
tldextract-5.2.0.dist-info/RECORD
ADDED
@@ -0,0 +1,16 @@
+tldextract/.tld_set_snapshot,sha256=tpMVwIXVOXJyS48t8RH_wymwyE_gpH1iyMkWVcx3Sjg,318581
+tldextract/__init__.py,sha256=1n2QxAmFCFp3X1A5O46wJOTZqWM2ukshNkkG-TrOaLQ,274
+tldextract/__main__.py,sha256=oiZ5EW_lxRLH6Khk6MdzXf7a1Ld5-A3k4wOFRmNNk2o,89
+tldextract/_version.py,sha256=1-tO6tx4p9okXz3ScGW6YFdQDbS8ruoK2_y0riYBx7M,511
+tldextract/cache.py,sha256=nrT9VuLmrjHHFxj-Cai97IyUXXenCX6KbHi07mPkzMc,8289
+tldextract/cli.py,sha256=nCzBAFrgAopTK1t5eBRQgeveSgWheUx4LAlAHE_8mzQ,3010
+tldextract/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+tldextract/remote.py,sha256=rovbxR73G8To-QRrA_cgSfk0S3k0_B2SyYefXiLHrQg,1940
+tldextract/suffix_list.py,sha256=ePH6iOIUBe0JE_mc07a34Nd7tFyfmHgP_mJkFhxzr7c,3947
+tldextract/tldextract.py,sha256=tM2Lrj0yclAulBueRxAK40bzhMl86Ftz4FHaFGyec7k,21454
+tldextract-5.2.0.dist-info/licenses/LICENSE,sha256=ZUrmz9cSprvhQmqmUdHIWbD51Cytv6PDTMlJLruTLuI,1527
+tldextract-5.2.0.dist-info/METADATA,sha256=LNhqdHD4eMtqA1DaxoVw0YpFq-XqW4_dtqc53bUAriM,11709
+tldextract-5.2.0.dist-info/WHEEL,sha256=CmyFI0kx5cdEMTLiONQRbGQwjIoR1aIYB7eCAQ4KPJ0,91
+tldextract-5.2.0.dist-info/entry_points.txt,sha256=EStkXC80BetCMp1UDhU3kWuXBo3qDpgKltZTJ1x4x1U,51
+tldextract-5.2.0.dist-info/top_level.txt,sha256=DWZIjV49WP30tyC1KOEP7t-EaS4IRCXQzc0KXAOn_bk,11
+tldextract-5.2.0.dist-info/RECORD,,
tldextract-5.1.2.dist-info/RECORD
REMOVED
@@ -1,16 +0,0 @@
-tldextract/.tld_set_snapshot,sha256=TVya0bCcmRKl_16oPKPIlNmWS09rXrjOKGgYjhvAGLE,238022
-tldextract/__init__.py,sha256=rZg3DKzS9CTARuF4Tuq50ViILwUktDED89Av8nStNuM,216
-tldextract/__main__.py,sha256=oiZ5EW_lxRLH6Khk6MdzXf7a1Ld5-A3k4wOFRmNNk2o,89
-tldextract/_version.py,sha256=iJQJoAO8HGnLsPBpH1rkF4KPbrYxIqs4qAXfUgzhRqQ,411
-tldextract/cache.py,sha256=vsr4ERgNxmBO_mYwXLCMbRRKq1s-IDZZLXoaGIYXmBM,8601
-tldextract/cli.py,sha256=nCzBAFrgAopTK1t5eBRQgeveSgWheUx4LAlAHE_8mzQ,3010
-tldextract/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-tldextract/remote.py,sha256=sklRFbATwPs_S33-KeIu9ixuSWP5w7QXO8jnhi_lgJs,1944
-tldextract/suffix_list.py,sha256=TcUpMTZwsicZn6_eHKqA4bjurQrKYde14P-4HT4s4yE,3896
-tldextract/tldextract.py,sha256=oUYLJcgWmeika0teDq2nNI5UCSbAR0c3eosYslVJPUY,18731
-tldextract-5.1.2.dist-info/LICENSE,sha256=dKIruBYZ9wJFoTWv8hvg2bhDv9TXDQ82u-0EERuGJYg,1527
-tldextract-5.1.2.dist-info/METADATA,sha256=dkiY2wl_8M2guJ0MGhGi0YQ9OgZI4vGpJ0I9LMLSGyQ,11464
-tldextract-5.1.2.dist-info/WHEEL,sha256=GJ7t_kWBFywbagK5eo9IoUwLW6oyOeTKmQ-9iHFVNxQ,92
-tldextract-5.1.2.dist-info/entry_points.txt,sha256=EStkXC80BetCMp1UDhU3kWuXBo3qDpgKltZTJ1x4x1U,51
-tldextract-5.1.2.dist-info/top_level.txt,sha256=DWZIjV49WP30tyC1KOEP7t-EaS4IRCXQzc0KXAOn_bk,11
-tldextract-5.1.2.dist-info/RECORD,,
{tldextract-5.1.2.dist-info → tldextract-5.2.0.dist-info}/entry_points.txt
File without changes

{tldextract-5.1.2.dist-info → tldextract-5.2.0.dist-info}/top_level.txt
File without changes