PyPI - tamar-file-hub-client - Versions diffs - 0.1.3__py3-none-any.whl → 0.1.4__py3-none-any.whl - Mend

tamar-file-hub-client 0.1.3__py3-none-any.whl → 0.1.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (20) hide show

file_hub_client/client.py +24 -4
file_hub_client/rpc/async_client.py +31 -4
file_hub_client/rpc/gen/file_service_pb2.py +23 -5
file_hub_client/rpc/gen/file_service_pb2_grpc.py +173 -0
file_hub_client/rpc/protos/file_service.proto +66 -0
file_hub_client/rpc/sync_client.py +31 -4
file_hub_client/schemas/__init__.py +10 -0
file_hub_client/schemas/context.py +171 -160
file_hub_client/schemas/file.py +44 -0
file_hub_client/services/file/async_blob_service.py +259 -8
file_hub_client/services/file/async_file_service.py +217 -0
file_hub_client/services/file/sync_blob_service.py +260 -8
file_hub_client/services/file/sync_file_service.py +217 -0
file_hub_client/utils/__init__.py +14 -0
file_hub_client/utils/file_utils.py +186 -153
file_hub_client/utils/ip_detector.py +226 -0
{tamar_file_hub_client-0.1.3.dist-info → tamar_file_hub_client-0.1.4.dist-info}/METADATA +162 -1
{tamar_file_hub_client-0.1.3.dist-info → tamar_file_hub_client-0.1.4.dist-info}/RECORD +20 -19
{tamar_file_hub_client-0.1.3.dist-info → tamar_file_hub_client-0.1.4.dist-info}/WHEEL +0 -0
{tamar_file_hub_client-0.1.3.dist-info → tamar_file_hub_client-0.1.4.dist-info}/top_level.txt +0 -0

file_hub_client/utils/file_utils.py CHANGED Viewed

@@ -1,153 +1,186 @@
-"""
-文件工具函数
-"""
-import hashlib
-import mimetypes
-from pathlib import Path
-from typing import Generator, Optional, BinaryIO, Union
-def get_file_mime_type(file_path: Union[str, Path]) -> str:
-    """
-    获取文件的MIME类型
-    Args:
-        file_path: 文件路径
-    Returns:
-        MIME类型
-    """
-    file_path = Path(file_path)
-    # 定义常见文件扩展名到MIME类型的映射，确保跨平台一致性
-    extension_mime_map = {
-        '.csv': 'text/csv',
-        '.txt': 'text/plain',
-        '.json': 'application/json',
-        '.xml': 'application/xml',
-        '.html': 'text/html',
-        '.htm': 'text/html',
-        '.pdf': 'application/pdf',
-        '.doc': 'application/msword',
-        '.docx': 'application/vnd.openxmlformats-officedocument.wordprocessingml.document',
-        '.xls': 'application/vnd.ms-excel',
-        '.xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
-        '.ppt': 'application/vnd.ms-powerpoint',
-        '.pptx': 'application/vnd.openxmlformats-officedocument.presentationml.presentation',
-        '.jpg': 'image/jpeg',
-        '.jpeg': 'image/jpeg',
-        '.png': 'image/png',
-        '.gif': 'image/gif',
-        '.bmp': 'image/bmp',
-        '.webp': 'image/webp',
-        '.mp3': 'audio/mpeg',
-        '.wav': 'audio/wav',
-        '.mp4': 'video/mp4',
-        '.avi': 'video/x-msvideo',
-        '.mov': 'video/quicktime',
-        '.zip': 'application/zip',
-        '.rar': 'application/vnd.rar',
-        '.7z': 'application/x-7z-compressed',
-        '.tar': 'application/x-tar',
-        '.gz': 'application/gzip',
-    }
-    # 获取文件扩展名（转为小写）
-    extension = file_path.suffix.lower()
-    # 优先使用自定义映射，确保常见文件类型的一致性
-    if extension in extension_mime_map:
-        return extension_mime_map[extension]
-    # 如果自定义映射中没有，尝试使用magic进行内容检测
-    try:
-        import magic
-        mime = magic.Magic(mime=True)
-        return mime.from_file(str(file_path))
-    except ImportError:
-        # 如果magic不可用，使用mimetypes作为fallback
-        mime_type, _ = mimetypes.guess_type(str(file_path))
-        return mime_type or "application/octet-stream"
-def get_file_extension(file_name: str) -> str:
-    """
-    获取文件扩展名
-    Args:
-        file_name: 文件名
-    Returns:
-        文件扩展名（包含点号）
-    """
-    return Path(file_name).suffix.lower()
-def humanize_file_size(size_bytes: int) -> str:
-    """
-    将文件大小转换为人类可读的格式
-    Args:
-        size_bytes: 文件大小（字节）
-    Returns:
-        人类可读的文件大小
-    """
-    for unit in ["B", "KB", "MB", "GB", "TB"]:
-        if size_bytes < 1024.0:
-            return f"{size_bytes:.2f} {unit}"
-        size_bytes /= 1024.0
-    return f"{size_bytes:.2f} PB"
-def calculate_file_hash(file_path: Union[str, Path], algorithm: str = "sha256") -> str:
-    """
-    计算文件哈希值
-    Args:
-        file_path: 文件路径
-        algorithm: 哈希算法（md5, sha1, sha256等）
-    Returns:
-        文件哈希值（十六进制）
-    """
-    file_path = Path(file_path)
-    hash_obj = hashlib.new(algorithm)
-    with open(file_path, "rb") as f:
-        while chunk := f.read(8192):
-            hash_obj.update(chunk)
-    return hash_obj.hexdigest()
-def split_file_chunks(
-        file_obj: BinaryIO,
-        chunk_size: int = 1024 * 1024,  # 默认1MB
-        start_offset: int = 0
-) -> Generator[tuple[bytes, int, bool], None, None]:
-    """
-    将文件分割成块
-    Args:
-        file_obj: 文件对象
-        chunk_size: 块大小（字节）
-        start_offset: 起始偏移量
-    Yields:
-        (块数据, 偏移量, 是否最后一块)
-    """
-    file_obj.seek(start_offset)
-    offset = start_offset
-    while True:
-        chunk = file_obj.read(chunk_size)
-        if not chunk:
-            break
-        is_last = len(chunk) < chunk_size
-        yield chunk, offset, is_last
-        offset += len(chunk)
-        if is_last:
-            break
+"""
+文件工具函数
+"""
+import hashlib
+import mimetypes
+from pathlib import Path
+from typing import Generator, Optional, BinaryIO, Union
+# Extension -> MIME type table for common formats. It is consulted before any
+# content sniffing so the answer is the same on every platform.
+_EXTENSION_MIME_MAP = {
+    '.csv': 'text/csv',
+    '.txt': 'text/plain',
+    '.json': 'application/json',
+    '.xml': 'application/xml',
+    '.html': 'text/html',
+    '.htm': 'text/html',
+    '.pdf': 'application/pdf',
+    '.doc': 'application/msword',
+    '.docx': 'application/vnd.openxmlformats-officedocument.wordprocessingml.document',
+    '.xls': 'application/vnd.ms-excel',
+    '.xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
+    '.ppt': 'application/vnd.ms-powerpoint',
+    '.pptx': 'application/vnd.openxmlformats-officedocument.presentationml.presentation',
+    '.jpg': 'image/jpeg',
+    '.jpeg': 'image/jpeg',
+    '.png': 'image/png',
+    '.gif': 'image/gif',
+    '.bmp': 'image/bmp',
+    '.webp': 'image/webp',
+    '.mp3': 'audio/mpeg',
+    '.wav': 'audio/wav',
+    '.mp4': 'video/mp4',
+    '.avi': 'video/x-msvideo',
+    '.mov': 'video/quicktime',
+    '.zip': 'application/zip',
+    '.rar': 'application/vnd.rar',
+    '.7z': 'application/x-7z-compressed',
+    '.tar': 'application/x-tar',
+    '.gz': 'application/gzip',
+}
+def _json_file_mime_type(file_path: Path) -> str:
+    """
+    Classify an existing ``.json`` path by whether its content parses as JSON
+    Args:
+        file_path: Path that exists on disk
+    Returns:
+        'application/json' for valid JSON or an empty/whitespace-only file,
+        'text/plain' when the path cannot be read or the content does not parse
+    """
+    import json
+    try:
+        # Read once as bytes instead of reopening the file per candidate encoding
+        raw = file_path.read_bytes()
+    except OSError:
+        # Unreadable (permissions, directory named *.json, ...): do not claim JSON
+        return 'text/plain'
+    try:
+        # utf-8-sig accepts UTF-8 both with and without a BOM
+        content = raw.decode('utf-8-sig')
+    except UnicodeDecodeError:
+        # latin-1 maps every byte to a code point, so this fallback cannot fail
+        content = raw.decode('latin-1')
+    content = content.strip()
+    if not content:
+        # Empty file: nothing to validate, trust the extension
+        return _EXTENSION_MIME_MAP['.json']
+    try:
+        json.loads(content)
+    except (json.JSONDecodeError, RecursionError):
+        # Malformed (or pathologically nested) content: report text/plain so the
+        # declared type does not contradict the actual payload
+        return 'text/plain'
+    return 'application/json'
+def get_file_mime_type(file_path: Union[str, Path]) -> str:
+    """
+    Return the MIME type for a file
+    Resolution order:
+    1. An existing ``.json`` file is validated by parsing its content
+    2. Known extensions are looked up in a fixed table (case-insensitive)
+    3. Otherwise the ``magic`` module sniffs the file content, if importable
+    4. Otherwise ``mimetypes`` guesses from the name, defaulting to
+       "application/octet-stream"
+    Args:
+        file_path: Path to the file
+    Returns:
+        The MIME type string
+    """
+    file_path = Path(file_path)
+    extension = file_path.suffix.lower()
+    # A .json path that does not exist cannot be validated and falls through
+    # to the extension table below
+    if extension == '.json' and file_path.exists():
+        return _json_file_mime_type(file_path)
+    if extension in _EXTENSION_MIME_MAP:
+        return _EXTENSION_MIME_MAP[extension]
+    # Unknown extension: prefer content detection via magic when it is installed
+    try:
+        import magic
+        mime = magic.Magic(mime=True)
+        return mime.from_file(str(file_path))
+    except ImportError:
+        # magic is unavailable: fall back to a name-based guess
+        mime_type, _ = mimetypes.guess_type(str(file_path))
+        return mime_type or "application/octet-stream"
+def get_file_extension(file_name: str) -> str:
+    """
+    Return the lower-cased extension of a file name
+    Args:
+        file_name: File name or path
+    Returns:
+        The final suffix including its leading dot, or "" when there is none
+    """
+    suffix = Path(file_name).suffix
+    return suffix.lower()
+def humanize_file_size(size_bytes: int) -> str:
+    """
+    Format a byte count as a human-readable string
+    Args:
+        size_bytes: Size in bytes
+    Returns:
+        The size with two decimals and a unit from B to PB, e.g. "1.50 KB"
+    """
+    labels = ("B", "KB", "MB", "GB", "TB")
+    scaled = size_bytes
+    for label in labels:
+        if scaled < 1024.0:
+            return f"{scaled:.2f} {label}"
+        scaled = scaled / 1024.0
+    # Anything of 1024 TB or more is reported in PB, without further scaling
+    return f"{scaled:.2f} PB"
+def calculate_file_hash(file_path: Union[str, Path], algorithm: str = "sha256") -> str:
+    """
+    Compute the hex digest of a file's content
+    Args:
+        file_path: Path to the file
+        algorithm: Any algorithm name accepted by hashlib.new (md5, sha1, sha256, ...)
+    Returns:
+        The digest as a hexadecimal string
+    """
+    path = Path(file_path)
+    digest = hashlib.new(algorithm)
+    with path.open("rb") as stream:
+        # Feed the hash in 8 KiB blocks so large files are never fully loaded
+        for block in iter(lambda: stream.read(8192), b""):
+            digest.update(block)
+    return digest.hexdigest()
+def split_file_chunks(
+        file_obj: BinaryIO,
+        chunk_size: int = 1024 * 1024,  # default: 1 MiB
+        start_offset: int = 0
+) -> Generator[tuple[bytes, int, bool], None, None]:
+    """
+    Split a binary file object into consecutive chunks
+    Args:
+        file_obj: Seekable binary file object
+        chunk_size: Maximum number of bytes per chunk
+        start_offset: Absolute position at which reading starts
+    Yields:
+        (chunk data, offset of the chunk, whether this is the last chunk).
+        Nothing is yielded when there is no data at or after start_offset.
+    """
+    file_obj.seek(start_offset)
+    offset = start_offset
+    chunk = file_obj.read(chunk_size)
+    while chunk:
+        # Read one chunk ahead: only an empty follow-up read proves the current
+        # chunk is the last one. Inferring it from a short read misses the final
+        # chunk of a file whose size is an exact multiple of chunk_size, and
+        # stops too early on streams that return short reads before EOF.
+        next_chunk = file_obj.read(chunk_size)
+        yield chunk, offset, not next_chunk
+        offset += len(chunk)
+        chunk = next_chunk

file_hub_client/utils/ip_detector.py ADDED Viewed

@@ -0,0 +1,226 @@
+"""
+用户真实IP自动检测模块
+从当前HTTP请求上下文中自动获取真实用户IP地址
+"""
+import os
+import threading
+from typing import Optional, Dict, Any, Callable
+from contextvars import ContextVar
+# 使用ContextVar存储当前请求的用户IP
+current_user_ip: ContextVar[Optional[str]] = ContextVar('current_user_ip', default=None)
+# 存储自定义IP提取器
+_custom_ip_extractor: Optional[Callable[[], Optional[str]]] = None
+# 线程本地存储（fallback）
+_thread_local = threading.local()
+def set_user_ip_extractor(extractor: Callable[[], Optional[str]]) -> None:
+    """
+    Register a custom user-IP extractor
+    The callable is stored in the module-level _custom_ip_extractor and
+    replaces any extractor registered earlier.
+    Args:
+        extractor: Zero-argument function returning the user IP, or None when it cannot be determined
+    """
+    global _custom_ip_extractor
+    _custom_ip_extractor = extractor
+def set_current_user_ip(ip: str):
+    """
+    Record the user IP for the current request (typically called when a request starts)
+    Args:
+        ip: The user's real IP address
+    """
+    # Thread-local copy, kept as a fallback alongside the ContextVar
+    _thread_local.user_ip = ip
+    # Primary storage, read first by get_current_user_ip
+    current_user_ip.set(ip)
+def get_current_user_ip() -> Optional[str]:
+    """
+    Resolve the current user's real IP address
+    Sources are tried in this order and the first non-empty value wins:
+    1. The current_user_ip ContextVar
+    2. The custom extractor registered with set_user_ip_extractor
+    3. Automatic detection from a supported web framework
+    4. The USER_IP, then CLIENT_IP, environment variables
+    5. The thread-local fallback written by set_current_user_ip
+    Returns:
+        The user's IP address, or None when no source provides one
+    """
+    # 1. ContextVar set for the current context
+    ip = current_user_ip.get(None)
+    if ip:
+        return ip
+    # 2. Custom extractor. It is user code, so a failure must not break the
+    #    caller; catch Exception (not a bare except) so KeyboardInterrupt and
+    #    SystemExit still propagate, and leave a trace for debugging.
+    if _custom_ip_extractor:
+        try:
+            ip = _custom_ip_extractor()
+        except Exception:
+            import logging
+            logging.getLogger(__name__).debug("custom user IP extractor failed", exc_info=True)
+            ip = None
+        if ip:
+            return ip
+    # 3. Web framework request context
+    ip = _auto_detect_from_web_frameworks()
+    if ip:
+        return ip
+    # 4. Environment variables
+    ip = os.environ.get('USER_IP') or os.environ.get('CLIENT_IP')
+    if ip:
+        return ip
+    # 5. Thread-local fallback; getattr with a default cannot raise here
+    return getattr(_thread_local, 'user_ip', None)
+def _auto_detect_from_web_frameworks() -> Optional[str]:
+    """
+    Try to read the user IP from a web framework's active request
+    Only Flask is probed, because it exposes the active request through a
+    global proxy. Django, FastAPI/Starlette and Tornado pass the request to the
+    view or handler instead, so there is nothing to inspect from here; with
+    those frameworks call set_current_user_ip() in middleware or register an
+    extractor with set_user_ip_extractor().
+    Returns:
+        The detected IP, or None when Flask is not installed, no request is
+        active, or the request carries no usable address
+    """
+    try:
+        from flask import has_request_context, request
+        # Outside a request the proxy is unbound; check before touching it
+        if has_request_context():
+            return _extract_ip_from_headers(request.environ)
+    except (ImportError, RuntimeError):
+        # Flask is not installed, or the request context vanished mid-call
+        pass
+    return None
+def _extract_ip_from_headers(environ: Dict[str, Any]) -> Optional[str]:
+    """
+    Extract the user's IP from WSGI-style request variables
+    Args:
+        environ: WSGI environ dict, or a mapping that uses the same keys
+    Returns:
+        The first non-empty value found, in the priority order
+        X-Forwarded-For > X-Real-IP > CF-Connecting-IP > REMOTE_ADDR,
+        or None when none of them carries a value
+    """
+    # NOTE(review): the three forwarding headers are supplied by the client
+    # unless a trusted proxy overwrites them, so the result can be spoofed; do
+    # not rely on it for access control without confirming the proxy setup.
+    forwarded_for = environ.get('HTTP_X_FORWARDED_FOR')
+    if forwarded_for:
+        # The left-most entry is the original client; later entries are proxies.
+        # Skip blank entries so a malformed header never yields "".
+        for candidate in forwarded_for.split(','):
+            candidate = candidate.strip()
+            if candidate:
+                return candidate
+    # X-Real-IP (commonly set by Nginx), CF-Connecting-IP (Cloudflare), then the
+    # directly connected peer, which may itself be a proxy
+    for key in ('HTTP_X_REAL_IP', 'HTTP_CF_CONNECTING_IP', 'REMOTE_ADDR'):
+        value = environ.get(key)
+        if value:
+            value = value.strip()
+            if value:
+                return value
+    return None
+def clear_current_user_ip():
+    """Forget the current request's user IP (typically called when a request ends)"""
+    current_user_ip.set(None)
+    # Drop the thread-local fallback too, if this thread ever stored one
+    if hasattr(_thread_local, 'user_ip'):
+        del _thread_local.user_ip
+# Flask integration
+def flask_auto_user_ip(app=None):
+    """
+    Install request hooks on a Flask app that track the user IP automatically
+    Usage:
+        from flask import Flask
+        from file_hub_client.utils.ip_detector import flask_auto_user_ip
+        app = Flask(__name__)
+        flask_auto_user_ip(app)
+    Args:
+        app: The Flask application; when omitted, a function that takes the
+            application is returned instead
+    Returns:
+        The application that was passed in, or the installer function when app is None
+    """
+    def decorator(app_instance):
+        @app_instance.before_request
+        def extract_user_ip():
+            from flask import request
+            ip = _extract_ip_from_headers(request.environ)
+            if ip:
+                set_current_user_ip(ip)
+            else:
+                # Worker threads are reused: never let a previous request's IP
+                # stand in for a request that carries none
+                clear_current_user_ip()
+        # teardown_request runs even when the view raised; after_request
+        # handlers are skipped on unhandled exceptions, which would leave the
+        # thread-local IP behind for the next request on this thread
+        @app_instance.teardown_request
+        def clear_user_ip(exc=None):
+            clear_current_user_ip()
+        return app_instance
+    if app is None:
+        return decorator
+    return decorator(app)
+# Context manager
+class UserIPContext:
+    """
+    Context manager that sets the user IP for the duration of a block
+    On entry the IP is stored in the current_user_ip ContextVar; on exit the
+    ContextVar is restored to the value it had before entry. Exceptions raised
+    inside the block are not suppressed.
+    Usage:
+        with UserIPContext("192.168.1.100"):
+            # within this block the SDK picks up this IP automatically
+            client.upload_file(...)
+    """
+    def __init__(self, user_ip: str):
+        self.user_ip = user_ip
+        # Token returned by ContextVar.set; None while the context is not active
+        self.token = None
+    def __enter__(self):
+        self.token = current_user_ip.set(self.user_ip)
+        return self
+    def __exit__(self, exc_type, exc_val, exc_tb):
+        if self.token is not None:
+            current_user_ip.reset(self.token)
+            # A token can be used only once; drop it so a repeated exit is a no-op
+            self.token = None

tamar-file-hub-client 0.1.3__py3-none-any.whl → 0.1.4__py3-none-any.whl

tamar-file-hub-client 0.1.3__py3-none-any.whl → 0.1.4__py3-none-any.whl