ultralytics-actions 0.0.45__tar.gz → 0.0.46__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/PKG-INFO +1 -1
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/__init__.py +1 -1
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/utils/common_utils.py +40 -34
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/tests/test_urls.py +16 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/PKG-INFO +1 -1
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/LICENSE +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/README.md +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/first_interaction.py +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/summarize_pr.py +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/summarize_release.py +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/update_markdown_code_blocks.py +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/utils/__init__.py +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/utils/github_utils.py +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/utils/openai_utils.py +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/pyproject.toml +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/setup.cfg +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/SOURCES.txt +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/dependency_links.txt +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/entry_points.txt +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/requires.txt +0 -0
- {ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/top_level.txt +0 -0
{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/PKG-INFO
@@ -1,6 +1,6 @@
 Metadata-Version: 2.2
 Name: ultralytics-actions
-Version: 0.0.45
+Version: 0.0.46
 Summary: Ultralytics Actions for GitHub automation and PR management.
 Author-email: Glenn Jocher <glenn.jocher@ultralytics.com>
 Maintainer-email: Ultralytics <hello@ultralytics.com>
{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/utils/common_utils.py
@@ -23,22 +23,8 @@ REQUESTS_HEADERS = {
     "Origin": "https://www.google.com/",
 }
 
-
-def remove_html_comments(body: str) -> str:
-    """Removes HTML comments from a string using regex pattern matching."""
-    return re.sub(r"<!--.*?-->", "", body, flags=re.DOTALL).strip()
-
-
-def clean_url(url):
-    """Remove extra characters from URL strings."""
-    for _ in range(3):
-        url = str(url).strip('"').strip("'").rstrip(".,:;!?`\\").replace(".git@main", "").replace("git+", "")
-    return url
-
-
-def is_url(url, session=None, check=True, max_attempts=3, timeout=2):
-    """Check if string is URL and optionally verify it exists."""
-    allow_list = (
+URL_IGNORE_LIST = frozenset(
+    {
         "localhost",
         "127.0.0",
         ":5000",
@@ -56,10 +42,39 @@ def is_url(url, session=None, check=True, max_attempts=3, timeout=2):
         "twitter.com",
         "x.com",
         "storage.googleapis.com",  # private GCS buckets
-    )
+    }
+)
+
+URL_PATTERN = re.compile(
+    r"\[([^]]+)]\((.*?)(?=\)(?:\s|$))\)"  # Markdown links with lookahead for space/end
+    r"|"
+    r"("  # Start capturing group for plaintext URLs
+    r"(?:https?://)?"  # Optional http:// or https://
+    r"(?:www\.)?"  # Optional www.
+    r"(?:[\w.-]+)?"  # Optional domain name and subdomains
+    r"\.[a-zA-Z]{2,}"  # TLD
+    r"(?:/[^\s\"'\]]*)?"  # Optional path
+    r")"
+)
+
+
+def remove_html_comments(body: str) -> str:
+    """Removes HTML comments from a string using regex pattern matching."""
+    return re.sub(r"<!--.*?-->", "", body, flags=re.DOTALL).strip()
+
+
+def clean_url(url):
+    """Remove extra characters from URL strings."""
+    for _ in range(3):
+        url = str(url).strip('"').strip("'").rstrip(".,:;!?`\\").replace(".git@main", "").replace("git+", "")
+    return url
+
+
+def is_url(url, session=None, check=True, max_attempts=3, timeout=2):
+    """Check if string is URL and optionally verify it exists."""
     try:
         # Check allow list
-        if any(x in url for x in allow_list):
+        if any(x in url for x in URL_IGNORE_LIST):
             return True
 
         # Check structure
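Note: a minimal sketch of how the new module-level URL_PATTERN behaves once this hunk is applied (the import assumes the installed 0.0.46 package; the sample text is illustrative). findall() yields (md_text, md_url, plain_url) tuples, and the lookahead on the Markdown branch is what keeps trailing parentheses in URLs intact, as exercised by the Wikipedia link added to the tests further down:

from actions.utils.common_utils import URL_PATTERN  # module-level pattern added in this diff

text = (
    "See [docs](https://en.wikipedia.org/wiki/Active_learning_(machine_learning)) "
    "and https://ultralytics.com/images/bus.jpg"
)
for md_text, md_url, plain_url in URL_PATTERN.findall(text):
    print(md_url or plain_url)
# -> https://en.wikipedia.org/wiki/Active_learning_(machine_learning)
# -> https://ultralytics.com/images/bus.jpg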
@@ -69,7 +84,7 @@ def is_url(url, session=None, check=True, max_attempts=3, timeout=2):
             return False
 
         if check:
-            requester = session
+            requester = session or requests
             bad_codes = {404, 410, 500, 502, 503, 504}
             kwargs = {"timeout": timeout, "allow_redirects": True}
             if not session:
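Note: the `session or requests` fallback means the check still works when no shared Session is supplied, since the requests module exposes the same head()/get() calls. A small illustration of the idiom (the head() helper here is hypothetical, not part of the package):

import requests

def head(url, session=None, timeout=2):
    # Same fallback idiom as the hunk above: use the Session if given, else the requests module.
    requester = session or requests
    return requester.head(url, timeout=timeout, allow_redirects=True)

print(head("https://ultralytics.com").status_code)  # standalone call, no Session
with requests.Session() as s:
    print(head("https://ultralytics.com", session=s).status_code)  # pooled connections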
@@ -94,26 +109,13 @@ def is_url(url, session=None, check=True, max_attempts=3, timeout=2):
 
 def check_links_in_string(text, verbose=True, return_bad=False):
     """Process a given text, find unique URLs within it, and check for any 404 errors."""
-    pattern = (
-        r"\[([^\]]+)\]\(([^)]+)\)"  # Matches Markdown links [text](url)
-        r"|"
-        r"("  # Start capturing group for plaintext URLs
-        r"(?:https?://)?"  # Optional http:// or https://
-        r"(?:www\.)?"  # Optional www.
-        r"(?:[\w.-]+)?"  # Optional domain name and subdomains
-        r"\.[a-zA-Z]{2,}"  # TLD
-        r"(?:/[^\s\"')\]]*)?"  # Optional path
-        r")"
-    )
-    # all_urls.extend([url for url in match if url and parse.urlparse(url).scheme])
     all_urls = []
-    for md_text, md_url, plain_url in re.findall(pattern, text):
+    for md_text, md_url, plain_url in URL_PATTERN.findall(text):
        url = md_url or plain_url
         if url and parse.urlparse(url).scheme:
             all_urls.append(url)
 
     urls = set(map(clean_url, all_urls))  # remove extra characters and make unique
-    # bad_urls = [x for x in urls if not is_url(x, check=True)]  # single-thread
     with requests.Session() as session, ThreadPoolExecutor(max_workers=16) as executor:
         session.headers.update(REQUESTS_HEADERS)
         bad_urls = [url for url, valid in zip(urls, executor.map(lambda x: not is_url(x, session), urls)) if valid]
@@ -126,4 +128,8 @@ def check_links_in_string(text, verbose=True, return_bad=False):
 
 
 if __name__ == "__main__":
-
+    url = "https://ultralytics.com/images/bus.jpg"
+    string = f"This is a string with a [Markdown link]({url}) inside it."
+
+    print(f"is_url(): {is_url(url)}")
+    print(f"check_links_in_string(): {check_links_in_string(string)}")
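Note: the context lines above show the existing Session + ThreadPoolExecutor fan-out that the URL_PATTERN refactor plugs into. A minimal standalone sketch of that pattern, with illustrative URLs and the real code's worker count (the ok() helper stands in for is_url):

from concurrent.futures import ThreadPoolExecutor

import requests

urls = {"https://ultralytics.com", "https://github.com/ultralytics"}  # illustrative set

def ok(url, session):
    try:
        return session.head(url, timeout=2, allow_redirects=True).status_code < 400
    except requests.RequestException:
        return False

with requests.Session() as session, ThreadPoolExecutor(max_workers=16) as executor:
    bad_urls = [u for u, good in zip(urls, executor.map(lambda u: ok(u, session), urls)) if not good]
print(bad_urls)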
{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/tests/test_urls.py
@@ -23,6 +23,7 @@ URLS = [
     "https://www.reddit.com/r/Ultralytics/comments/1fw3605/release_megathread/",
     "https://www.kaggle.com/models/ultralytics/yolo11",
     "https://apps.apple.com/xk/app/ultralytics/id1583935240",
+    "https://en.wikipedia.org/wiki/Active_learning_(machine_learning)",  # parentheses in link
 ]
 
 
@@ -38,6 +39,21 @@ def test_is_url():
         assert is_url(url), f"URL check failed: {url}"
 
 
+def test_links_in_string_func():
+    """Test URLs in strings function."""
+    assert check_links_in_string(" abc ".join(url for url in URLS))
+
+
+def test_markdown_links_in_string_func():
+    """Test Markdown links in strings function."""
+    assert check_links_in_string(" abc ".join(f"[text]({url})" for url in URLS))
+
+
+def test_html_links_in_string_func():
+    """Test HTML links in strings function."""
+    assert check_links_in_string(" abc ".join(f'<a href="{url}">text</a>' for url in URLS))
+
+
 def test_html_links(verbose):
     """Tests the validity of URLs within HTML anchor tags and returns any invalid URLs found."""
     text = "Visit <a href='https://err.com'>our site</a> or <a href=\"http://test.org\">test site</a>"
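Note: for clarity, the " abc ".join(...) construction in the new tests builds one space-separated string of links for check_links_in_string to scan. With two of the URLS entries above (list truncated here for illustration), the Markdown variant produces:

URLS = [
    "https://www.kaggle.com/models/ultralytics/yolo11",
    "https://en.wikipedia.org/wiki/Active_learning_(machine_learning)",
]
print(" abc ".join(f"[text]({url})" for url in URLS))
# [text](https://www.kaggle.com/models/ultralytics/yolo11) abc [text](https://en.wikipedia.org/wiki/Active_learning_(machine_learning))

The second entry is the new test case for parentheses inside a link, which relies on the lookahead in URL_PATTERN shown earlier.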
{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/PKG-INFO
RENAMED
@@ -1,6 +1,6 @@
 Metadata-Version: 2.2
 Name: ultralytics-actions
-Version: 0.0.45
+Version: 0.0.46
 Summary: Ultralytics Actions for GitHub automation and PR management.
 Author-email: Glenn Jocher <glenn.jocher@ultralytics.com>
 Maintainer-email: Ultralytics <hello@ultralytics.com>
{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/LICENSE
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/README.md
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/first_interaction.py
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/summarize_pr.py
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/summarize_release.py
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/update_markdown_code_blocks.py
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/utils/__init__.py
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/utils/github_utils.py
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/actions/utils/openai_utils.py
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/pyproject.toml
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/setup.cfg
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/SOURCES.txt
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/dependency_links.txt
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/entry_points.txt
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/requires.txt
RENAMED
File without changes

{ultralytics_actions-0.0.45 → ultralytics_actions-0.0.46}/ultralytics_actions.egg-info/top_level.txt
RENAMED
File without changes