televault-0.1.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
televault/crypto.py ADDED
@@ -0,0 +1,170 @@
1
+ """Encryption utilities for TeleVault - AES-256-GCM with Argon2id."""
2
+
3
+ import os
4
+ import struct
5
+ from typing import BinaryIO, Iterator
6
+ from dataclasses import dataclass
7
+
8
+ from cryptography.hazmat.primitives.ciphers.aead import AESGCM
9
+ from cryptography.hazmat.primitives.kdf.scrypt import Scrypt
10
+ from cryptography.hazmat.backends import default_backend
11
+
12
# Constants for the on-disk/on-wire encrypted format
SALT_SIZE = 16    # random salt bytes fed to the KDF (per chunk)
NONCE_SIZE = 12   # AES-GCM standard 96-bit nonce
TAG_SIZE = 16     # GCM auth tag appended to ciphertext by AESGCM.encrypt
KEY_SIZE = 32     # 256-bit AES key
HEADER_SIZE = SALT_SIZE + NONCE_SIZE  # 28 bytes prepended to each chunk

# For streaming, we encrypt in blocks
BLOCK_SIZE = 64 * 1024  # 64KB blocks for streaming encryption
21
+
22
+
23
@dataclass
class EncryptionHeader:
    """Fixed-size header (salt then nonce) prepended to encrypted data."""

    salt: bytes   # KDF salt, SALT_SIZE bytes
    nonce: bytes  # AES-GCM nonce, NONCE_SIZE bytes

    def to_bytes(self) -> bytes:
        """Serialize as salt || nonce (HEADER_SIZE bytes total)."""
        return b"".join((self.salt, self.nonce))

    @classmethod
    def from_bytes(cls, data: bytes) -> "EncryptionHeader":
        """Parse a header from the first HEADER_SIZE bytes of *data*.

        Raises:
            ValueError: if fewer than HEADER_SIZE bytes are supplied.
        """
        if len(data) < HEADER_SIZE:
            raise ValueError(f"Header too short: {len(data)} < {HEADER_SIZE}")
        salt, nonce = data[:SALT_SIZE], data[SALT_SIZE:HEADER_SIZE]
        return cls(salt=salt, nonce=nonce)

    @classmethod
    def generate(cls) -> "EncryptionHeader":
        """Create a header with a fresh random salt and nonce."""
        return cls(salt=os.urandom(SALT_SIZE), nonce=os.urandom(NONCE_SIZE))
48
+
49
+
50
def derive_key(password: str, salt: bytes) -> bytes:
    """Derive a 256-bit AES key from *password* and *salt* via Scrypt.

    Scrypt is used instead of Argon2id for broader library compatibility;
    the cost parameters target roughly 100ms on modern hardware.
    """
    params = dict(
        salt=salt,
        length=KEY_SIZE,
        n=2**17,  # CPU/memory cost factor
        r=8,      # block size
        p=1,      # parallelization
        backend=default_backend(),
    )
    return Scrypt(**params).derive(password.encode("utf-8"))
66
+
67
+
68
def encrypt_chunk(data: bytes, password: str) -> bytes:
    """Encrypt one chunk of data.

    Returns: header (28 bytes: salt + nonce) + ciphertext + GCM tag (16 bytes).
    A fresh salt/nonce pair is generated per chunk, so equal plaintexts
    produce different ciphertexts.
    """
    hdr = EncryptionHeader.generate()
    aead = AESGCM(derive_key(password, hdr.salt))
    return hdr.to_bytes() + aead.encrypt(hdr.nonce, data, None)
80
+
81
+
82
def decrypt_chunk(encrypted_data: bytes, password: str) -> bytes:
    """Decrypt one chunk produced by encrypt_chunk.

    Expects: header (28 bytes) + ciphertext + tag (16 bytes). Raises if
    the password is wrong or the data was tampered with (GCM tag check).
    """
    hdr = EncryptionHeader.from_bytes(encrypted_data)
    aead = AESGCM(derive_key(password, hdr.salt))
    body = encrypted_data[HEADER_SIZE:]
    return aead.decrypt(hdr.nonce, body, None)
94
+
95
+
96
class StreamingEncryptor:
    """
    Streaming encryptor for large files.

    All blocks are encrypted under a single key derived once from the
    password and header salt; each block gets a unique nonce by XORing a
    big-endian block counter into the first 8 bytes of the random base
    nonce, so nonce reuse cannot occur for fewer than 2**64 blocks.

    NOTE(review): blocks are authenticated individually, so a tampering
    party could reorder, drop, or truncate blocks without a GCM failure —
    confirm callers verify whole-file integrity (e.g. the stored hash).
    """

    def __init__(self, password: str):
        self.password = password
        # Fresh random salt + base nonce for this stream.
        self.header = EncryptionHeader.generate()
        # Key is derived once; only nonces vary per block.
        self.key = derive_key(password, self.header.salt)
        self.cipher = AESGCM(self.key)
        self._counter = 0  # incremented per block by _get_nonce()

    def get_header(self) -> bytes:
        """Get the header to prepend to encrypted output."""
        return self.header.to_bytes()

    def _get_nonce(self) -> bytes:
        """Generate unique nonce for each block using counter mode."""
        # Use base nonce + counter to ensure uniqueness
        counter_bytes = struct.pack(">Q", self._counter)  # 8 bytes
        self._counter += 1
        # XOR with base nonce (take first 8 bytes of nonce, keep last 4)
        nonce = bytearray(self.header.nonce)
        for i in range(8):
            nonce[i] ^= counter_bytes[i]
        return bytes(nonce)

    def encrypt_block(self, data: bytes, is_last: bool = False) -> bytes:
        """Encrypt a block of data.

        Returns nonce (12 bytes) + ciphertext + tag so each block can be
        decrypted independently. *is_last* is currently unused.
        """
        nonce = self._get_nonce()
        # Prepend nonce to each block for independent decryption
        ciphertext = self.cipher.encrypt(nonce, data, None)
        return nonce + ciphertext
132
+
133
+
134
class StreamingDecryptor:
    """Streaming decryptor for blocks produced by StreamingEncryptor."""

    def __init__(self, password: str, header: EncryptionHeader):
        self.password = password
        self.header = header
        # Derive the stream key once from the header's salt.
        self.key = derive_key(password, header.salt)
        self.cipher = AESGCM(self.key)

    def decrypt_block(self, encrypted_block: bytes) -> bytes:
        """Decrypt one block: leading 12-byte nonce, then ciphertext + tag."""
        nonce, body = encrypted_block[:NONCE_SIZE], encrypted_block[NONCE_SIZE:]
        return self.cipher.decrypt(nonce, body, None)
149
+
150
+
151
def encrypt_file_simple(input_path: str, output_path: str, password: str) -> None:
    """Encrypt a whole file in one shot (reads the entire file into memory)."""
    with open(input_path, "rb") as src:
        plaintext = src.read()
    with open(output_path, "wb") as dst:
        dst.write(encrypt_chunk(plaintext, password))
160
+
161
+
162
def decrypt_file_simple(input_path: str, output_path: str, password: str) -> None:
    """Decrypt a whole file in one shot (reads the entire file into memory)."""
    with open(input_path, "rb") as src:
        ciphertext = src.read()
    with open(output_path, "wb") as dst:
        dst.write(decrypt_chunk(ciphertext, password))
televault/models.py ADDED
@@ -0,0 +1,149 @@
1
+ """Data models for TeleVault - stored as JSON on Telegram."""
2
+
3
+ from dataclasses import dataclass, field, asdict
4
+ from datetime import datetime
5
+ from typing import Optional
6
+ import json
7
+
8
+
9
@dataclass
class ChunkInfo:
    """Information about a single chunk stored on Telegram."""

    index: int       # chunk order (0-based)
    message_id: int  # Telegram message ID holding this chunk
    size: int        # chunk size in bytes
    hash: str        # BLAKE3 hash for verification

    def to_dict(self) -> dict:
        """Plain-dict form, suitable for JSON serialization."""
        return asdict(self)

    @classmethod
    def from_dict(cls, data: dict) -> "ChunkInfo":
        """Rebuild a ChunkInfo from a dict produced by to_dict()."""
        return cls(**data)
24
+
25
+
26
@dataclass
class FileMetadata:
    """
    Metadata for a file stored on Telegram.
    This is stored as a JSON text message, with chunks replying to it.
    """

    id: str    # Unique file ID (short hash)
    name: str  # Original filename
    size: int  # Original file size in bytes
    hash: str  # BLAKE3 hash of original file
    chunks: list[ChunkInfo] = field(default_factory=list)

    # Optional fields
    encrypted: bool = True
    compressed: bool = False
    compression_ratio: Optional[float] = None
    mime_type: Optional[str] = None

    # Timestamps
    created_at: float = field(default_factory=lambda: datetime.now().timestamp())
    modified_at: Optional[float] = None

    # Telegram reference
    message_id: Optional[int] = None  # Message ID of this metadata message

    def to_json(self) -> str:
        """Serialize to compact JSON for storage on Telegram.

        asdict() converts nested ChunkInfo dataclasses to dicts recursively,
        so no per-chunk handling is needed.
        """
        return json.dumps(asdict(self), separators=(",", ":"))  # Compact JSON

    @classmethod
    def from_json(cls, text: str) -> "FileMetadata":
        """Deserialize from JSON stored on Telegram.

        Unknown keys are ignored (matching VaultIndex.from_json) so older
        clients can still read metadata written by newer versions; the
        previous cls(**data) raised TypeError on any extra key.
        """
        data = json.loads(text)
        known = set(cls.__dataclass_fields__)
        kwargs = {k: v for k, v in data.items() if k in known}
        kwargs["chunks"] = [ChunkInfo.from_dict(c) for c in data.get("chunks", [])]
        return cls(**kwargs)

    @property
    def chunk_count(self) -> int:
        """Number of chunks recorded in this metadata."""
        return len(self.chunks)

    @property
    def total_stored_size(self) -> int:
        """Total size of all chunks (after compression/encryption)."""
        return sum(c.size for c in self.chunks)

    def is_complete(self) -> bool:
        """Check if all chunks are present (indices form exactly 0..n-1)."""
        if not self.chunks:
            return False
        indices = {c.index for c in self.chunks}
        expected = set(range(len(self.chunks)))
        return indices == expected
82
+
83
+
84
@dataclass
class VaultIndex:
    """
    Master index of all files in the vault.
    Stored as pinned message in the channel.

    Maps file_id -> message ID of that file's metadata message.
    """

    version: int = 1
    files: dict[str, int] = field(default_factory=dict)  # file_id -> metadata_message_id
    updated_at: float = field(default_factory=lambda: datetime.now().timestamp())

    def to_json(self) -> str:
        """Serialize to compact JSON for storage as the pinned message."""
        return json.dumps(asdict(self), separators=(",", ":"))

    @classmethod
    def from_json(cls, text: str) -> "VaultIndex":
        """Deserialize, taking only known fields so extras are ignored."""
        data = json.loads(text)
        # Only take known fields, ignore extras
        return cls(
            version=data.get("version", 1),
            files=data.get("files", {}),
            updated_at=data.get("updated_at", datetime.now().timestamp()),
        )

    def add_file(self, file_id: str, message_id: int) -> None:
        """Register (or overwrite) a file's metadata message ID."""
        self.files[file_id] = message_id
        self.updated_at = datetime.now().timestamp()

    def remove_file(self, file_id: str) -> Optional[int]:
        """Remove a file entry; return its metadata message ID, or None.

        Uses an explicit None check: the previous truthiness test skipped
        the updated_at refresh when the stored message ID was 0.
        """
        msg_id = self.files.pop(file_id, None)
        if msg_id is not None:
            self.updated_at = datetime.now().timestamp()
        return msg_id
117
+
118
+
119
@dataclass
class TransferProgress:
    """
    Progress tracking for resumable transfers.
    Stored as a temporary message, deleted on completion.
    """

    operation: str  # "upload" or "download"
    file_id: str
    file_name: str
    total_chunks: int
    completed_chunks: list[int] = field(default_factory=list)  # completed chunk indices
    started_at: float = field(default_factory=lambda: datetime.now().timestamp())

    def to_json(self) -> str:
        """Compact JSON form for storage on Telegram."""
        return json.dumps(asdict(self), separators=(",", ":"))

    @classmethod
    def from_json(cls, text: str) -> "TransferProgress":
        """Rebuild from the JSON produced by to_json()."""
        return cls(**json.loads(text))

    @property
    def pending_chunks(self) -> list[int]:
        """Chunk indices not yet transferred, in ascending order."""
        done = set(self.completed_chunks)
        return [idx for idx in range(self.total_chunks) if idx not in done]

    @property
    def progress_percent(self) -> float:
        """Completion percentage; a zero-chunk transfer counts as 100%."""
        if not self.total_chunks:
            return 100.0
        return (len(self.completed_chunks) / self.total_chunks) * 100
televault/telegram.py ADDED
@@ -0,0 +1,375 @@
1
+ """Telegram MTProto client wrapper for TeleVault."""
2
+
3
+ import asyncio
4
+ import json
5
+ from pathlib import Path
6
+ from typing import Optional, AsyncIterator
7
+ from dataclasses import dataclass
8
+ import io
9
+
10
+ from telethon import TelegramClient
11
+ from telethon.sessions import StringSession
12
+ from telethon.tl.types import (
13
+ Channel,
14
+ Message,
15
+ DocumentAttributeFilename,
16
+ InputPeerChannel,
17
+ )
18
+ from telethon.tl.functions.messages import GetPinnedDialogsRequest
19
+ from telethon.errors import FloodWaitError
20
+
21
+ from .models import FileMetadata, VaultIndex, ChunkInfo, TransferProgress
22
+ from .config import Config, get_config_dir
23
+
24
+
25
# TeleVault Telegram app credentials
# NOTE(review): API ID/hash are hard-coded in a published package. They
# identify the *application* (not a user account), and from_env() lets
# TELEGRAM_API_ID / TELEGRAM_API_HASH override them — but consider
# requiring users to supply their own credentials instead of shipping these.
API_ID = 22399403
API_HASH = "9bf0e01ba1d63bc048172b8eb53d957b"
28
+
29
+
30
@dataclass
class TelegramConfig:
    """Telegram connection configuration (API credentials + saved session)."""

    api_id: int
    api_hash: str
    session_string: Optional[str] = None

    @classmethod
    def from_env(cls) -> "TelegramConfig":
        """Load from the config file if present, else from the environment.

        Falls back to the module-level API_ID/API_HASH constants when the
        TELEGRAM_API_ID / TELEGRAM_API_HASH variables are unset.
        """
        import os

        config_path = get_config_dir() / "telegram.json"

        # A saved config file takes precedence over environment variables.
        if config_path.exists():
            with open(config_path) as fh:
                return cls(**json.load(fh))

        env = os.environ
        return cls(
            api_id=int(env.get("TELEGRAM_API_ID", API_ID)),
            api_hash=env.get("TELEGRAM_API_HASH", API_HASH),
            session_string=env.get("TELEGRAM_SESSION"),
        )

    def save(self) -> None:
        """Persist credentials and session string to the config directory."""
        config_path = get_config_dir() / "telegram.json"
        config_path.parent.mkdir(parents=True, exist_ok=True)

        payload = {
            "api_id": self.api_id,
            "api_hash": self.api_hash,
            "session_string": self.session_string,
        }
        with open(config_path, "w") as fh:
            json.dump(payload, fh, indent=2)
67
+
68
+
69
class TelegramVault:
    """
    Telegram MTProto client for TeleVault operations.

    Handles:
    - Authentication (interactive login, session persistence)
    - Channel management (create / select the storage channel)
    - File upload/download (metadata text messages + chunk documents)
    - Index management (pinned JSON message mapping file_id -> metadata msg)

    Most methods require connect() and set_channel() first; they raise
    ValueError when no channel is configured.
    """

    def __init__(self, config: Optional[TelegramConfig] = None):
        # Fall back to file/env-based configuration when none is injected.
        self.config = config or TelegramConfig.from_env()
        self._client: Optional[TelegramClient] = None
        self._channel: Optional[Channel] = None
        self._channel_id: Optional[int] = None

    async def connect(self) -> None:
        """Connect to Telegram, reusing a saved session string when available."""
        if self.config.session_string:
            session = StringSession(self.config.session_string)
        else:
            session = StringSession()  # fresh, not-yet-authorized session

        self._client = TelegramClient(
            session,
            self.config.api_id,
            self.config.api_hash,
        )

        await self._client.connect()

    async def disconnect(self) -> None:
        """Disconnect from Telegram (no-op if connect() was never called)."""
        if self._client:
            await self._client.disconnect()

    async def login(self, phone: Optional[str] = None) -> str:
        """
        Interactive login flow (prompts on stdin for phone, code, 2FA).

        Returns the session string, which is also persisted via
        TelegramConfig.save() for future non-interactive use.
        """
        if not self._client:
            await self.connect()

        if not await self._client.is_user_authorized():
            if phone is None:
                phone = input("Enter phone number: ")

            await self._client.send_code_request(phone)
            code = input("Enter the code you received: ")

            try:
                await self._client.sign_in(phone, code)
            except Exception:
                # 2FA required
                # NOTE(review): ANY sign_in failure (e.g. wrong code) lands
                # here and is treated as "2FA required" — confirm this should
                # catch telethon's SessionPasswordNeededError specifically.
                password = input("Enter 2FA password: ")
                await self._client.sign_in(password=password)

        # Save session
        session_string = self._client.session.save()
        self.config.session_string = session_string
        self.config.save()

        return session_string

    async def set_channel(self, channel_id: int) -> None:
        """Set the storage channel by ID (resolves the entity eagerly)."""
        self._channel_id = channel_id
        self._channel = await self._client.get_entity(channel_id)

    async def create_channel(self, name: str = "TeleVault Storage") -> int:
        """Create a new private channel for storage; returns its full ID."""
        from telethon.tl.functions.channels import CreateChannelRequest

        result = await self._client(CreateChannelRequest(
            title=name,
            about="TeleVault encrypted storage",
            megagroup=False,  # Regular channel, not supergroup
        ))

        channel = result.chats[0]
        self._channel = channel
        self._channel_id = channel.id

        # Return full channel ID format (negative with -100 prefix)
        # Telegram channels need -100 prefix for MTProto
        full_channel_id = int(f"-100{channel.id}")
        return full_channel_id

    # === Index Operations ===

    async def get_index(self) -> VaultIndex:
        """Get the vault index from pinned message, or an empty index.

        NOTE(review): only the 10 most recent messages are scanned
        (iter_messages yields newest-first) — confirm the pinned index
        message always stays within that window.
        """
        if not self._channel_id:
            raise ValueError("No channel set")

        # Get pinned messages
        async for msg in self._client.iter_messages(
            self._channel_id,
            filter=None,
            limit=10,
        ):
            if msg.pinned and msg.text:
                try:
                    data = json.loads(msg.text)
                    # Check if it looks like our index (has 'files' key)
                    if "files" in data:
                        return VaultIndex.from_json(msg.text)
                except json.JSONDecodeError:
                    continue

        # No valid index found, create empty one
        return VaultIndex()

    async def save_index(self, index: VaultIndex) -> int:
        """Save the vault index, editing the existing pinned message if found.

        Returns the message ID holding the index.

        NOTE(review): unlike get_index, this accepts any pinned JSON message
        (VaultIndex.from_json fills missing keys with defaults), so an
        unrelated pinned JSON message could be overwritten — verify.
        """
        if not self._channel_id:
            raise ValueError("No channel set")

        # Find existing pinned index message
        existing_msg_id = None
        async for msg in self._client.iter_messages(
            self._channel_id,
            filter=None,
            limit=10,
        ):
            if msg.pinned and msg.text:
                try:
                    VaultIndex.from_json(msg.text)
                    existing_msg_id = msg.id
                    break
                except json.JSONDecodeError:
                    continue

        if existing_msg_id:
            # Edit existing
            await self._client.edit_message(
                self._channel_id,
                existing_msg_id,
                index.to_json(),
            )
            return existing_msg_id
        else:
            # Create new and pin
            msg = await self._client.send_message(
                self._channel_id,
                index.to_json(),
            )
            await self._client.pin_message(self._channel_id, msg.id)
            return msg.id

    # === File Operations ===

    async def upload_metadata(self, metadata: FileMetadata) -> int:
        """Upload file metadata as a text message; returns its message ID."""
        if not self._channel_id:
            raise ValueError("No channel set")

        msg = await self._client.send_message(
            self._channel_id,
            metadata.to_json(),
        )
        return msg.id

    async def get_metadata(self, message_id: int) -> FileMetadata:
        """Fetch and parse the metadata message with the given ID.

        Raises:
            ValueError: if no channel is set or the message is missing/empty.
        """
        if not self._channel_id:
            raise ValueError("No channel set")

        msg = await self._client.get_messages(self._channel_id, ids=message_id)
        if not msg or not msg.text:
            raise ValueError(f"Metadata message {message_id} not found")

        return FileMetadata.from_json(msg.text)

    async def update_metadata(self, message_id: int, metadata: FileMetadata) -> None:
        """Overwrite an existing metadata message with new JSON."""
        if not self._channel_id:
            raise ValueError("No channel set")

        await self._client.edit_message(
            self._channel_id,
            message_id,
            metadata.to_json(),
        )

    async def upload_chunk(
        self,
        data: bytes,
        filename: str,
        reply_to: int,
        progress_callback=None,
    ) -> int:
        """
        Upload a chunk as a file message.

        Args:
            data: Chunk data
            filename: Chunk filename (e.g., "0001.chunk")
            reply_to: Metadata message ID to reply to
            progress_callback: Optional progress callback

        Returns:
            Message ID of uploaded chunk
        """
        if not self._channel_id:
            raise ValueError("No channel set")

        # Create file-like object
        file = io.BytesIO(data)
        file.name = filename

        try:
            msg = await self._client.send_file(
                self._channel_id,
                file,
                reply_to=reply_to,
                progress_callback=progress_callback,
                attributes=[DocumentAttributeFilename(filename)],
            )
            return msg.id
        except FloodWaitError as e:
            # Rate limited, wait and retry
            # NOTE(review): retries recursively with no depth bound —
            # repeated flood waits grow the call stack; confirm acceptable.
            await asyncio.sleep(e.seconds + 1)
            return await self.upload_chunk(data, filename, reply_to, progress_callback)

    async def download_chunk(
        self,
        message_id: int,
        progress_callback=None,
    ) -> bytes:
        """Download a chunk by message ID; returns the raw document bytes."""
        if not self._channel_id:
            raise ValueError("No channel set")

        msg = await self._client.get_messages(self._channel_id, ids=message_id)
        if not msg or not msg.file:
            raise ValueError(f"Chunk message {message_id} not found")

        return await self._client.download_media(msg, file=bytes, progress_callback=progress_callback)

    async def iter_file_chunks(self, metadata_msg_id: int) -> AsyncIterator[Message]:
        """Iterate over chunk messages that reply to a metadata message."""
        if not self._channel_id:
            raise ValueError("No channel set")

        async for msg in self._client.iter_messages(
            self._channel_id,
            reply_to=metadata_msg_id,
        ):
            if msg.file:  # skip non-document replies
                yield msg

    async def delete_file(self, file_id: str) -> bool:
        """Delete a file's metadata and all its chunks; update the index.

        Returns False when the file_id is not present in the index.
        """
        if not self._channel_id:
            raise ValueError("No channel set")

        # Get index
        index = await self.get_index()

        if file_id not in index.files:
            return False

        metadata_msg_id = index.files[file_id]

        # Collect all message IDs to delete
        msg_ids = [metadata_msg_id]

        async for chunk_msg in self.iter_file_chunks(metadata_msg_id):
            msg_ids.append(chunk_msg.id)

        # Delete messages
        await self._client.delete_messages(self._channel_id, msg_ids)

        # Update index
        index.remove_file(file_id)
        await self.save_index(index)

        return True

    # === Listing ===

    async def list_files(self) -> list[FileMetadata]:
        """List all files in the vault, skipping unreadable metadata entries."""
        index = await self.get_index()
        files = []

        for file_id, msg_id in index.files.items():
            try:
                metadata = await self.get_metadata(msg_id)
                metadata.message_id = msg_id
                files.append(metadata)
            except Exception:
                # Skip corrupted entries
                continue

        return files

    async def search_files(self, query: str) -> list[FileMetadata]:
        """Search files by case-insensitive substring match on the name."""
        files = await self.list_files()
        query_lower = query.lower()

        return [f for f in files if query_lower in f.name.lower()]