PyPI - flask-Humanify - Versions diffs - 0.1.4__py3-none-any.whl → 0.2.1__py3-none-any.whl - Mend

flask-Humanify 0.1.4__py3-none-any.whl → 0.2.1__py3-none-any.whl

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (19)

flask_humanify/__init__.py +1 -1
flask_humanify/datasets/ai_dogs.pkl +0 -0
flask_humanify/datasets/animals.pkl +0 -0
flask_humanify/datasets/characters.pkl +0 -0
flask_humanify/datasets/keys.pkl +0 -0
flask_humanify/features/rate_limiter.py +1 -1
flask_humanify/humanify.py +559 -20
flask_humanify/memory_server.py +838 -0
flask_humanify/templates/audio_challenge.html +208 -0
flask_humanify/templates/grid_challenge.html +232 -0
flask_humanify/templates/{oneclick_captcha.html → one_click_challenge.html} +4 -9
flask_humanify/utils.py +488 -2
{flask_humanify-0.1.4.dist-info → flask_humanify-0.2.1.dist-info}/METADATA +42 -4
flask_humanify-0.2.1.dist-info/RECORD +20 -0
flask_humanify/ipset.py +0 -315
flask_humanify-0.1.4.dist-info/RECORD +0 -14
{flask_humanify-0.1.4.dist-info → flask_humanify-0.2.1.dist-info}/WHEEL +0 -0
{flask_humanify-0.1.4.dist-info → flask_humanify-0.2.1.dist-info}/licenses/LICENSE +0 -0
{flask_humanify-0.1.4.dist-info → flask_humanify-0.2.1.dist-info}/top_level.txt +0 -0

flask_humanify/__init__.py CHANGED Viewed

@@ -4,7 +4,7 @@ Flask-Humanify
 A Flask extension that protects against bots and DDoS attacks.
 """
-__version__ = "0.1.4"
+__version__ = "0.2.1"
 from . import utils
 from .humanify import Humanify

flask_humanify/datasets/ai_dogs.pkl ADDED Viewed

Binary file

flask_humanify/datasets/animals.pkl ADDED Viewed

Binary file

flask_humanify/datasets/characters.pkl ADDED Viewed

Binary file

flask_humanify/datasets/keys.pkl ADDED Viewed

Binary file

flask_humanify/features/rate_limiter.py CHANGED Viewed

@@ -11,7 +11,7 @@ class RateLimiter:
     Rate limiter.
     """
-    def __init__(self, app=None, max_requests: int = 2, time_window: int = 10):
+    def __init__(self, app=None, max_requests: int = 10, time_window: int = 10):
         """
         Initialize the rate limiter.
         """

flask_humanify/humanify.py CHANGED Viewed

@@ -1,11 +1,35 @@
 from dataclasses import dataclass
 import logging
-from typing import List, Optional
+import random
+from typing import List, Optional, Union, Dict, Any, Pattern
+import re
+import fnmatch
 from werkzeug.wrappers import Response
-from flask import Blueprint, request, render_template, redirect, url_for, current_app
-from .ipset import IPSetClient, ensure_server_running
-from .utils import get_client_ip, get_return_url
+from flask import (
+    Blueprint,
+    request,
+    render_template,
+    redirect,
+    url_for,
+    current_app,
+    g,
+    abort,
+)
+from .memory_server import MemoryClient, ensure_server_running
+from .utils import (
+    get_client_ip,
+    get_return_url,
+    validate_clearance_token,
+    generate_user_hash,
+    manipulate_image_bytes,
+    image_bytes_to_data_url,
+    generate_captcha_token,
+    validate_captcha_token,
+    generate_clearance_token,
+    combine_audio_files,
+    audio_bytes_to_data_url,
+)
 VPN_PROVIDERS = [
@@ -19,6 +43,26 @@ VPN_PROVIDERS = [
     "Mullvad",
 ]
+IMAGE_CAPTCHA_MAPPING = {
+    "grid": {
+        "num_correct": (2, 3),
+        "num_images": 9,
+        "preview_image": False,
+        "hardness_range": (1, 3),
+    },
+    "one_click": {
+        "num_correct": 1,
+        "num_images": 6,
+        "preview_image": True,
+        "hardness_range": (1, 3),
+    },
+}
+AUDIO_CAPTCHA_CONFIG = {
+    "num_chars": 6,
+    "language": "en",
+}
 logger = logging.getLogger(__name__)
@@ -84,8 +128,17 @@ class Humanify:
     Protect against bots and DDoS attacks.
     """
-    def __init__(self, app=None):
+    def __init__(
+        self,
+        app=None,
+        challenge_type: str = "one_click",
+        image_dataset: Optional[str] = "ai_dogs",
+        audio_dataset: Optional[str] = None,
+    ):
         self.app = app
+        self.challenge_type = challenge_type
+        self.image_dataset = image_dataset
+        self.audio_dataset = audio_dataset
         if app is not None:
             self.init_app(app)
@@ -95,9 +148,13 @@ class Humanify:
         """
         self.app = app
-        ensure_server_running()
-        self.ipset_client = IPSetClient()
-        self.ipset_client.connect()
+        ensure_server_running(
+            image_dataset=self.image_dataset,
+            audio_dataset=self.audio_dataset,
+        )
+        self.memory_client = MemoryClient()
+        self.memory_client.connect()
+        self._secret_key = self.memory_client.get_secret_key()
         self.blueprint = Blueprint(
             "humanify", __name__, template_folder="templates", static_folder=None
@@ -108,6 +165,48 @@ class Humanify:
     def _register_routes(self) -> None:
         """Register the humanify routes."""
+        @self.blueprint.route("/humanify/challenge", methods=["GET"])
+        def challenge():
+            """
+            Challenge route.
+            """
+            if self.image_dataset is None:
+                return self._render_challenge(is_audio=True)
+            return self._render_challenge()
+        @self.blueprint.route("/humanify/audio_challenge", methods=["GET"])
+        def audio_challenge():
+            """
+            Audio challenge route.
+            """
+            if self.audio_dataset is None:
+                return redirect(
+                    url_for("humanify.challenge", return_url=request.full_path)
+                )
+            return self._render_challenge(is_audio=True)
+        @self.blueprint.route("/humanify/verify", methods=["POST"])
+        def verify():
+            """
+            Verify route.
+            """
+            if self.image_dataset is None:
+                abort(404)
+            return self._verify_captcha()
+        @self.blueprint.route("/humanify/verify_audio", methods=["POST"])
+        def verify_audio():
+            """
+            Verify audio route.
+            """
+            if self.audio_dataset is None:
+                abort(404)
+            return self._verify_audio_captcha()
         @self.blueprint.route("/humanify/access_denied", methods=["GET"])
         def access_denied():
             """
@@ -121,38 +220,478 @@ class Humanify:
                 {"Cache-Control": "public, max-age=15552000"},
             )
-    def register_middleware(self, action: str = "deny_access"):
-        """
-        Register the middleware.
+    def register_middleware(
+        self,
+        action: str = "challenge",
+        endpoint_patterns: Union[str, List[str], None] = None,
+        url_patterns: Union[str, List[str], None] = None,
+        exclude_patterns: Union[str, List[str], None] = None,
+        request_filters: Optional[Dict[str, Any]] = None,
+    ):
         """
+        Register the middleware with advanced filtering options.
+        Args:
+            action: The action to take when a bot is detected ('challenge' or 'deny_access')
+            endpoint_patterns: Endpoint patterns to match (regex or glob patterns)
+            url_patterns: URL patterns to match (regex or glob patterns)
+            exclude_patterns: Patterns to exclude from protection (regex or glob patterns)
+            request_filters: Dict of request attributes and values to filter by
+        """
         self.app = self.app or current_app
+        if isinstance(endpoint_patterns, str):
+            endpoint_patterns = [endpoint_patterns]
+        if isinstance(url_patterns, str):
+            url_patterns = [url_patterns]
+        if isinstance(exclude_patterns, str):
+            exclude_patterns = [exclude_patterns]
+        compiled_endpoint_patterns = (
+            self._compile_patterns(endpoint_patterns) if endpoint_patterns else None
+        )
+        compiled_url_patterns = (
+            self._compile_patterns(url_patterns) if url_patterns else None
+        )
+        compiled_exclude_patterns = (
+            self._compile_patterns(exclude_patterns) if exclude_patterns else None
+        )
         @self.app.before_request
         def before_request():
             """
-            Before request hook.
+            Before request hook with advanced filtering.
             """
-            if request.endpoint in ["humanify.rate_limited", "humanify.access_denied"]:
+            if request.endpoint and request.endpoint.startswith("humanify."):
+                return
+            current_endpoint = request.endpoint or ""
+            current_path = request.path
+            if compiled_exclude_patterns and self._matches_any_pattern(
+                current_endpoint, current_path, compiled_exclude_patterns
+            ):
                 return
-            if self.is_bot:
+            patterns_specified = (
+                compiled_endpoint_patterns is not None
+                or compiled_url_patterns is not None
+            )
+            matches_endpoint = not patterns_specified or (
+                compiled_endpoint_patterns
+                and self._matches_any_pattern(
+                    current_endpoint, None, compiled_endpoint_patterns
+                )
+            )
+            matches_url = not patterns_specified or (
+                compiled_url_patterns
+                and self._matches_any_pattern(None, current_path, compiled_url_patterns)
+            )
+            matches_request_filters = (
+                not request_filters or self._matches_request_filters(request_filters)
+            )
+            if (
+                (matches_endpoint or matches_url)
+                and matches_request_filters
+                and self.is_bot
+            ):
+                if action == "challenge":
+                    return self.challenge()
                 if action == "deny_access":
                     return self.deny_access()
+    def _compile_patterns(self, patterns):
+        """
+        Compile a list of patterns into regex patterns.
+        Handles glob patterns like * and ? by converting them to regex.
+        """
+        compiled = []
+        for pattern in patterns:
+            if pattern is None:
+                continue
+            if "*" in pattern or "?" in pattern:
+                regex_pattern = fnmatch.translate(pattern)
+                compiled.append(re.compile(regex_pattern))
+            else:
+                try:
+                    compiled.append(re.compile(pattern))
+                except re.error:
+                    compiled.append(re.compile(re.escape(pattern)))
+        return compiled
+    def _matches_any_pattern(
+        self,
+        endpoint: Optional[str],
+        path: Optional[str],
+        compiled_patterns: List[Pattern],
+    ):
+        """
+        Check if the current endpoint or path matches any of the compiled patterns.
+        """
+        for pattern in compiled_patterns:
+            if endpoint is not None and pattern.search(endpoint):
+                return True
+            if path is not None and pattern.search(path):
+                return True
+        return False
+    def _matches_request_filters(self, request_filters: Dict[str, Any]) -> bool:
+        """
+        Check if the current request matches all the specified filters.
+        Filters can target any attribute of the request object or its nested properties.
+        """
+        for key, value in request_filters.items():
+            parts = key.split(".")
+            obj = request
+            for part in parts[:-1]:
+                if hasattr(obj, part):
+                    obj = getattr(obj, part)
+                elif isinstance(obj, dict) and part in obj:
+                    obj = obj[part]
+                else:
+                    return False
+            final_attr = parts[-1]
+            if hasattr(obj, final_attr):
+                attr_value = getattr(obj, final_attr)
+            elif isinstance(obj, dict) and final_attr in obj:
+                attr_value = obj[final_attr]
+            else:
+                return False
+            if isinstance(value, str) and value.startswith("regex:"):
+                regex_pattern = value[6:]
+                try:
+                    if not re.search(regex_pattern, str(attr_value)):
+                        return False
+                except (re.error, TypeError):
+                    return False
+            elif isinstance(value, list):
+                if attr_value not in value:
+                    return False
+            elif attr_value != value:
+                return False
+        return True
+    @property
+    def client_ip(self) -> Optional[str]:
+        """Get the client IP address."""
+        if hasattr(g, "humanify_client_ip"):
+            return g.humanify_client_ip
+        client_ip = get_client_ip(request)
+        g.humanify_client_ip = client_ip
+        return client_ip
     @property
-    def is_bot(self) -> HumanifyResult:
+    def check_result(self) -> HumanifyResult:
         """
         Check if the IP is a bot.
         """
-        ip = get_client_ip(request)
-        if ip is None:
-            return HumanifyResult(ip=ip, is_invalid_ip=True)
-        ip_groups = self.ipset_client.lookup_ip(ip)
-        return HumanifyResult.from_ip_groups(ip, ip_groups)
+        if self.client_ip is None:
+            return HumanifyResult(ip=self.client_ip, is_invalid_ip=True)
+        if hasattr(g, "humanify_ip_groups"):
+            humanify_ip_groups = g.humanify_ip_groups
+            if isinstance(humanify_ip_groups, list):
+                return HumanifyResult.from_ip_groups(self.client_ip, humanify_ip_groups)
+        ip_groups = self.memory_client.lookup_ip(self.client_ip)
+        g.humanify_ip_groups = ip_groups
+        return HumanifyResult.from_ip_groups(self.client_ip, ip_groups)
+    @property
+    def has_valid_clearance_token(self) -> bool:
+        """Check if the current client has a valid clearance token."""
+        return validate_clearance_token(
+            request.cookies.get("clearance_token", ""),
+            self._secret_key,
+            generate_user_hash(
+                self.client_ip or "127.0.0.1",
+                request.user_agent.string or "",
+            ),
+        )
+    @property
+    def is_bot(self) -> bool:
+        """Check if the current client is a bot."""
+        return not self.has_valid_clearance_token and self.check_result.is_bot
     def deny_access(self) -> Response:
         """
         Redirect to the access denied page.
         """
         return redirect(url_for("humanify.access_denied", return_url=request.full_path))
+    def challenge(self) -> Response:
+        """
+        Challenge the client.
+        """
+        return redirect(url_for("humanify.challenge", return_url=request.full_path))
+    def _render_challenge(self, is_audio: bool = False) -> Response:
+        return_url = get_return_url(request)
+        if self.has_valid_clearance_token:
+            return redirect(return_url)
+        error = request.args.get("error", None)
+        if error not in [
+            "Invalid captcha token",
+            "Wrong selection. Try again.",
+            "Wrong response. Try again.",
+        ]:
+            error = None
+        if is_audio:
+            return self._render_audio_challenge(return_url, error)
+        if self.challenge_type in ["grid", "one_click"]:
+            return self._render_image_challenge(return_url, error)
+        abort(404, "Invalid challenge type")
+    def _render_image_challenge(
+        self, return_url: str, error: Optional[str]
+    ) -> Response:
+        """
+        Render the image challenge.
+        """
+        captcha_config = IMAGE_CAPTCHA_MAPPING[self.challenge_type]
+        use_preview_image = captcha_config["preview_image"]
+        images_bytes, correct_indexes, subject = self.memory_client.get_captcha_images(
+            num_correct=captcha_config["num_correct"],
+            num_images=captcha_config["num_images"],
+            preview_image=use_preview_image,
+            dataset_name=self.image_dataset,
+        )
+        if not images_bytes:
+            abort(500, "Could not load captcha images")
+        processed_images = []
+        for i, img_bytes in enumerate(images_bytes):
+            try:
+                distorted_img_bytes = manipulate_image_bytes(
+                    img_bytes,
+                    is_small=not (i == 0 and use_preview_image),
+                    hardness=random.randint(
+                        captcha_config["hardness_range"][0],
+                        captcha_config["hardness_range"][1],
+                    ),
+                )
+                processed_images.append(image_bytes_to_data_url(distorted_img_bytes))
+            except Exception as e:
+                current_app.logger.error(f"Error processing image: {e}")
+                processed_images.append(
+                    (
+                        "data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAAB"
+                        "CAQAAAC1HAwCAAAAC0lEQVR42mNk+A8AAQUBAScY42YAAAAASUVORK5CYII="
+                    )
+                )
+        preview_image = None
+        if use_preview_image:
+            preview_image = processed_images[0]
+            processed_images = processed_images[1:]
+        user_hash = generate_user_hash(
+            self.client_ip or "127.0.0.1", request.user_agent.string or ""
+        )
+        captcha_data = generate_captcha_token(
+            user_hash, correct_indexes, self._secret_key
+        )
+        return Response(
+            render_template(
+                f"{self.challenge_type}_challenge.html",
+                images=processed_images,
+                preview_image=preview_image,
+                subject=subject,
+                captcha_data=captcha_data,
+                return_url=return_url or "/",
+                error=error,
+                audio_challenge_available=self.audio_dataset is not None,
+            ),
+            mimetype="text/html",
+        )
+    def _render_audio_challenge(
+        self, return_url: str, error: Optional[str]
+    ) -> Response:
+        """
+        Render the audio challenge.
+        """
+        num_chars = AUDIO_CAPTCHA_CONFIG["num_chars"]
+        language = AUDIO_CAPTCHA_CONFIG["language"]
+        audio_files, correct_chars = self.memory_client.get_captcha_audio(
+            num_chars=num_chars, language=language
+        )
+        if not audio_files:
+            abort(500, "Could not load captcha audio")
+        combined_audio = combine_audio_files(audio_files)
+        if not combined_audio:
+            abort(500, "Could not process audio files")
+        audio_data_url = audio_bytes_to_data_url(combined_audio, "mp3")
+        user_hash = generate_user_hash(
+            self.client_ip or "127.0.0.1", request.user_agent.string or ""
+        )
+        captcha_data = generate_captcha_token(
+            user_hash, correct_chars, self._secret_key
+        )
+        return Response(
+            render_template(
+                "audio_challenge.html",
+                audio_file=audio_data_url,
+                captcha_data=captcha_data,
+                return_url=return_url or "/",
+                error=error,
+                image_challenge_available=self.image_dataset is not None,
+            ),
+            mimetype="text/html",
+        )
+    def _verify_captcha(self) -> Response:
+        """Verify the captcha solution."""
+        return_url = get_return_url(request)
+        if self.has_valid_clearance_token:
+            return redirect(return_url)
+        captcha_data = request.form.get("captcha_data", "")
+        if not captcha_data:
+            return redirect(
+                url_for(
+                    "humanify.challenge",
+                    error="Invalid captcha token",
+                    return_url=return_url,
+                )
+            )
+        user_hash = generate_user_hash(
+            self.client_ip or "127.0.0.1", request.user_agent.string or ""
+        )
+        decrypted_data = validate_captcha_token(
+            captcha_data, self._secret_key, user_hash
+        )
+        if decrypted_data is None:
+            return redirect(
+                url_for(
+                    "humanify.challenge",
+                    error="Invalid captcha token",
+                    return_url=return_url,
+                )
+            )
+        verify_functions = {
+            "grid": self._verify_image_captcha,
+            "one_click": self._verify_image_captcha,
+        }
+        verify_function = verify_functions[self.challenge_type]
+        if not verify_function(decrypted_data):
+            return redirect(
+                url_for(
+                    "humanify.challenge",
+                    error="Wrong selection. Try again.",
+                    return_url=return_url,
+                )
+            )
+        clearance_token = generate_clearance_token(user_hash, self._secret_key)
+        response = redirect(return_url or "/")
+        response.set_cookie(
+            "clearance_token",
+            clearance_token,
+            max_age=14400,
+            httponly=True,
+            samesite="Strict",
+        )
+        return response
+    def _verify_audio_captcha(self) -> Response:
+        """Verify the audio captcha solution."""
+        return_url = get_return_url(request)
+        if self.has_valid_clearance_token:
+            return redirect(return_url)
+        captcha_data = request.form.get("captcha_data", "")
+        if not captcha_data:
+            return redirect(
+                url_for(
+                    "humanify.audio_challenge",
+                    error="Invalid captcha token",
+                    return_url=return_url,
+                )
+            )
+        user_hash = generate_user_hash(
+            self.client_ip or "127.0.0.1", request.user_agent.string or ""
+        )
+        correct_chars = validate_captcha_token(
+            captcha_data, self._secret_key, user_hash, valid_lengths=[197]
+        )
+        if correct_chars is None:
+            return redirect(
+                url_for(
+                    "humanify.audio_challenge",
+                    error="Invalid captcha token",
+                    return_url=return_url,
+                )
+            )
+        audio_response = request.form.get("audio_response", "").lower().strip()
+        if not audio_response or audio_response != correct_chars:
+            return redirect(
+                url_for(
+                    "humanify.audio_challenge",
+                    error="Wrong response. Try again.",
+                    return_url=return_url,
+                )
+            )
+        clearance_token = generate_clearance_token(user_hash, self._secret_key)
+        response = redirect(return_url or "/")
+        response.set_cookie(
+            "clearance_token",
+            clearance_token,
+            max_age=14400,
+            httponly=True,
+            samesite="Strict",
+        )
+        return response
+    def _verify_image_captcha(self, decrypted_data: str) -> bool:
+        """Verify the image captcha."""
+        captcha_config = IMAGE_CAPTCHA_MAPPING[self.challenge_type]
+        selected_indexes = []
+        for i in range(1, captcha_config["num_images"] + 1):
+            if request.form.get(str(i), None) == "1":
+                selected_indexes.append(str(i - 1))
+        selected_str = "".join(sorted(selected_indexes))
+        correct_str = "".join(sorted(list(decrypted_data)))
+        return selected_str == correct_str

flask-Humanify 0.1.4__py3-none-any.whl → 0.2.1__py3-none-any.whl

flask-Humanify 0.1.4__py3-none-any.whl → 0.2.1__py3-none-any.whl