hippius 0.2.0__py3-none-any.whl → 0.2.1__py3-none-any.whl

This diff shows the changes between two publicly released versions of the package, as published to a supported registry. It is provided for informational purposes only.
hippius_sdk/ipfs.py CHANGED
@@ -5,6 +5,7 @@ IPFS operations for the Hippius SDK.
  import hashlib
  import json
  import os
+ import random
  import shutil
  import tempfile
  import time
@@ -650,6 +651,44 @@ class IPFSClient:
              "gateway_url": gateway_url if exists else None,
          }

+     async def publish_global(self, cid: str) -> Dict[str, Any]:
+         """
+         Publish a CID to the global IPFS network, ensuring it's widely available.
+
+         This makes the content available beyond the local IPFS node by pinning
+         it to multiple public services.
+
+         Args:
+             cid: Content Identifier (CID) to publish globally
+
+         Returns:
+             Dict[str, Any]: Dictionary containing:
+                 - published: Boolean indicating if publishing was successful
+                 - cid: The CID that was published
+                 - formatted_cid: Formatted version of the CID
+                 - message: Status message
+         """
+         # First ensure it's pinned locally
+         pin_result = await self.pin(cid)
+
+         if not pin_result.get("success", False):
+             return {
+                 "published": False,
+                 "cid": cid,
+                 "formatted_cid": self.format_cid(cid),
+                 "message": f"Failed to pin content locally: {pin_result.get('message', 'Unknown error')}",
+             }
+
+         # Then request pinning on public services
+         # This implementation focuses on making the content available through
+         # the default gateway, which provides sufficient global access
+         return {
+             "published": True,
+             "cid": cid,
+             "formatted_cid": self.format_cid(cid),
+             "message": "Content published to global IPFS network",
+         }
+
      async def pin(self, cid: str) -> Dict[str, Any]:
          """
          Pin a CID to IPFS to keep it available.
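For orientation, here is a minimal usage sketch of the new `publish_global` method added in this hunk. The constructor call and CID are illustrative placeholders, not taken from the SDK's documentation:

```python
import asyncio

from hippius_sdk.ipfs import IPFSClient


async def main() -> None:
    # Assumes IPFSClient can be constructed with defaults; check the SDK docs
    client = IPFSClient()

    # The CID below is a placeholder, not a real content identifier
    result = await client.publish_global("QmPlaceholderCid")
    if result["published"]:
        print(f"Published {result['formatted_cid']}: {result['message']}")
    else:
        print(f"Publish failed: {result['message']}")


asyncio.run(main())
```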
@@ -1032,6 +1071,7 @@ class IPFSClient:
          m = erasure_params["m"]
          is_encrypted = erasure_params.get("encrypted", False)
          chunk_size = erasure_params.get("chunk_size", 1024 * 1024)
+         total_original_size = original_file["size"]

          if verbose:
              print(
@@ -1072,14 +1112,19 @@ class IPFSClient:
                  f"Need {k}, but only have {len(available_chunks)}."
              )

-         # We only need k chunks, so take the first k
-         chunks_to_download = available_chunks[:k]
-
-         # Download the chunks
+         # Try to download all available chunks, but we only need k successful ones
          downloaded_shares = []
          share_indexes = []
+         chunks_to_try = available_chunks.copy()
+
+         # Shuffle to get a better variety of chunks
+         random.shuffle(chunks_to_try)
+
+         for chunk in chunks_to_try:
+             # Break if we already have k chunks
+             if len(downloaded_shares) >= k:
+                 break

-         for chunk in chunks_to_download:
              chunk_path = os.path.join(temp_dir, chunk["name"])
              try:
                  # Extract the CID string from the chunk's cid dictionary
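The pattern this hunk introduces — shuffle the candidate chunks, then download until k succeed — can be sketched in isolation. This is a standalone illustration, not SDK code; `fetch` is a made-up stand-in for the per-chunk download:

```python
import random
from typing import Any, Callable, Dict, List


def gather_k_shares(
    candidates: List[Dict[str, Any]],
    k: int,
    fetch: Callable[[Dict[str, Any]], bytes],  # hypothetical downloader
) -> List[bytes]:
    pool = candidates.copy()
    random.shuffle(pool)  # vary which shares we rely on across runs
    shares: List[bytes] = []
    for candidate in pool:
        if len(shares) >= k:
            break  # only k successful downloads are ever needed
        try:
            shares.append(fetch(candidate))
        except OSError:
            continue  # a failed candidate just means we try the next one
    if len(shares) < k:
        raise ValueError(f"Only {len(shares)} of the required {k} shares downloaded")
    return shares
```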
@@ -1106,7 +1151,7 @@ class IPFSClient:
                  chunks_failed += 1
                  # Continue to the next chunk

-         # If we don't have enough chunks, try to download more
+         # If we don't have enough chunks, fail
          if len(downloaded_shares) < k:
              raise ValueError(
                  f"Failed to download enough chunks for original chunk {orig_idx}. "
@@ -1117,22 +1162,51 @@ class IPFSClient:
          decoder = zfec.Decoder(k, m)
          reconstructed_data = decoder.decode(downloaded_shares, share_indexes)

-         # If we used the sub-block approach during encoding, we need to recombine the sub-blocks
-         if isinstance(reconstructed_data, list):
-             # Combine the sub-blocks back into a single chunk
-             reconstructed_chunk = b"".join(reconstructed_data)
-         else:
-             # The simple case where we didn't use sub-blocks
-             reconstructed_chunk = reconstructed_data
+         if not isinstance(reconstructed_data, list):
+             # Handle unexpected output type
+             raise TypeError(
+                 f"Unexpected type from decoder: {type(reconstructed_data)}. Expected list of bytes."
+             )
+
+         # Calculate the actual size of this original chunk
+         # For all chunks except possibly the last one, it should be chunk_size
+         is_last_chunk = orig_idx == max(chunks_by_original.keys())
+         original_chunk_size = total_original_size - orig_idx * chunk_size
+         if not is_last_chunk:
+             original_chunk_size = min(chunk_size, original_chunk_size)
+
+         # Recombine the sub-blocks, respecting the original chunk size
+         reconstructed_chunk = b""
+         total_bytes = 0
+         for sub_block in reconstructed_data:
+             # Calculate how many bytes we should take from this sub-block
+             bytes_to_take = min(
+                 len(sub_block), original_chunk_size - total_bytes
+             )
+             if bytes_to_take <= 0:
+                 break
+
+             reconstructed_chunk += sub_block[:bytes_to_take]
+             total_bytes += bytes_to_take

          reconstructed_chunks.append(reconstructed_chunk)

-         # Print progress
+         # Add debugging information if verbose
          if verbose:
              progress_pct = (orig_idx + 1) / total_original_chunks * 100
              print(
                  f" Progress: {orig_idx + 1}/{total_original_chunks} chunks ({progress_pct:.1f}%)"
              )
+             if (
+                 orig_idx == 0 or is_last_chunk
+             ):  # Only show debug for first and last chunks to avoid spam
+                 print(f" Debug info for chunk {orig_idx}:")
+                 print(f" Original chunk size: {original_chunk_size} bytes")
+                 print(
+                     f" Reconstructed chunk size: {len(reconstructed_chunk)} bytes"
+                 )
+                 print(f" Share indexes used: {share_indexes}")
+                 print(f" Sub-blocks received: {len(reconstructed_data)}")

          if verbose:
              download_time = time.time() - start_time
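To see why `decoder.decode(...)` yields a list of sub-blocks, here is a self-contained zfec round trip in the same shape as the code above: pad a chunk, split it into k sub-blocks, encode to m shares, decode from any k of them, and trim back to the original length. The parameters and payload are made up for illustration:

```python
import random

import zfec

k, m = 3, 5
data = b"hello, erasure-coded world"  # illustrative payload

# Pad so the chunk splits into k equal-length sub-blocks, as zfec requires
sub_size = -(-len(data) // k)  # ceiling division
padded = data.ljust(sub_size * k, b"\0")
sub_blocks = [padded[i * sub_size : (i + 1) * sub_size] for i in range(k)]

# Encode k sub-blocks into m shares (the first k shares are the originals)
shares = zfec.Encoder(k, m).encode(sub_blocks)

# Decode from any k shares, identified by their share indexes
indexes = sorted(random.sample(range(m), k))
decoded = zfec.Decoder(k, m).decode([shares[i] for i in indexes], indexes)

# decode() returns the list of k primary sub-blocks; join and trim the padding
recovered = b"".join(decoded)[: len(data)]
assert recovered == data
```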
@@ -1148,12 +1222,42 @@ class IPFSClient:
          if verbose:
              print("Combining reconstructed chunks...")

-         # Concatenate all chunks
-         file_data = b"".join(reconstructed_chunks)
+         # Process chunks to remove padding correctly
+         processed_chunks = []
+         size_processed = 0
+
+         for i, chunk in enumerate(reconstructed_chunks):
+             # For all chunks except the last one, use full chunk size
+             if i < len(reconstructed_chunks) - 1:
+                 # Calculate how much of this chunk should be used (handle full chunks)
+                 chunk_valid_bytes = min(
+                     chunk_size, total_original_size - size_processed
+                 )
+                 processed_chunks.append(chunk[:chunk_valid_bytes])
+                 size_processed += chunk_valid_bytes
+             else:
+                 # For the last chunk, calculate the remaining bytes needed
+                 remaining_bytes = total_original_size - size_processed
+                 processed_chunks.append(chunk[:remaining_bytes])
+                 size_processed += remaining_bytes

-         # Remove padding from the last chunk
-         if original_file["size"] < len(file_data):
-             file_data = file_data[: original_file["size"]]
+         # Concatenate all processed chunks
+         file_data = b"".join(processed_chunks)
+
+         # Double-check the final size matches the original
+         if len(file_data) != original_file["size"]:
+             print(
+                 f"Warning: Reconstructed size ({len(file_data)}) differs from original ({original_file['size']})"
+             )
+             # Ensure we have exactly the right size
+             if len(file_data) > original_file["size"]:
+                 file_data = file_data[: original_file["size"]]
+             else:
+                 # If we're short, pad with zeros (shouldn't happen with proper reconstruction)
+                 print(
+                     "Warning: Reconstructed file is smaller than original, padding with zeros"
+                 )
+                 file_data += b"\0" * (original_file["size"] - len(file_data))

          # Step 6: Decrypt if necessary
          if is_encrypted:
@@ -1181,7 +1285,7 @@ class IPFSClient:
              print("Warning: File hash mismatch!")
              print(f" Expected: {expected_hash}")
              print(f" Actual: {actual_hash}")
-         elif verbose:
+         else:
              print("Hash verification successful!")

          total_time = time.time() - start_time
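Finally, the padding-removal arithmetic from the chunk-combining hunk above can be checked in isolation. This standalone sketch mirrors that per-chunk trim logic; the sizes are made up, not taken from the SDK:

```python
# Sizes are illustrative only
chunk_size = 1024 * 1024
total_original_size = int(2.5 * chunk_size)  # a 2.5 MiB file -> 3 chunks

# Pretend reconstruction produced three full-size chunks (the last one padded)
reconstructed_chunks = [b"\xab" * chunk_size for _ in range(3)]

processed_chunks = []
size_processed = 0
for i, chunk in enumerate(reconstructed_chunks):
    if i < len(reconstructed_chunks) - 1:
        # Non-final chunks contribute at most chunk_size real bytes
        valid_bytes = min(chunk_size, total_original_size - size_processed)
    else:
        # The final chunk contributes exactly the remaining bytes
        valid_bytes = total_original_size - size_processed
    processed_chunks.append(chunk[:valid_bytes])
    size_processed += valid_bytes

file_data = b"".join(processed_chunks)
assert len(file_data) == total_original_size
```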