PyPI - dgen-py - Versions diffs - 0.1.2__cp310-cp310-manylinux_2_24_x86_64.whl - Mend

dgen-py 0.1.2__cp310-cp310-manylinux_2_24_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14) hide show

dgen_py/__init__.py +167 -0
dgen_py/__init__.pyi +61 -0
dgen_py/_dgen_rs.cpython-310-x86_64-linux-gnu.so +0 -0
dgen_py/docs/PERFORMANCE.md +241 -0
dgen_py/examples/README.md +201 -0
dgen_py/examples/benchmark_cpu_numa.py +299 -0
dgen_py/examples/benchmark_vs_numpy.py +146 -0
dgen_py/examples/demo.py +107 -0
dgen_py/examples/quick_perf_test.py +107 -0
dgen_py/examples/zero_copy_demo.py +97 -0
dgen_py-0.1.2.dist-info/METADATA +271 -0
dgen_py-0.1.2.dist-info/RECORD +14 -0
dgen_py-0.1.2.dist-info/WHEEL +4 -0
dgen_py-0.1.2.dist-info/licenses/LICENSE +39 -0

dgen_py/examples/zero_copy_demo.py ADDED Viewed

@@ -0,0 +1,97 @@
+#!/usr/bin/env python3
+"""
+Zero-Copy Demo
+==============
+Demonstrates TRUE zero-copy data generation and access.
+"""
+import dgen_py
+import numpy as np
+import time
+def main():
+    print("=" * 60)
+    print("dgen-py ZERO-COPY DEMONSTRATION")
+    print("=" * 60)
+    size = 100 * 1024 * 1024  # 100 MiB
+    print(f"\nGenerating {size // (1024*1024)} MiB of data...\n")
+    # =========================================================================
+    # Step 1: Generate data (Rust allocation)
+    # =========================================================================
+    start = time.perf_counter()
+    data = dgen_py.generate_data(size)
+    gen_time = time.perf_counter() - start
+    throughput = size / gen_time / 1e9
+    print(f"✓ Generation: {throughput:.2f} GB/s ({gen_time*1000:.1f} ms)")
+    print(f"  Type: {type(data).__name__}")
+    print(f"  Size: {len(data):,} bytes")
+    # =========================================================================
+    # Step 2: Create memoryview (ZERO COPY - just pointer!)
+    # =========================================================================
+    start = time.perf_counter()
+    view = memoryview(data)
+    view_time = time.perf_counter() - start
+    print(f"\n✓ Memoryview: {view_time * 1e6:.1f} µs (ZERO COPY)")
+    print(f"  Readonly: {view.readonly}")
+    print(f"  Format: '{view.format}' (unsigned byte)")
+    print(f"  Size: {len(view):,} bytes")
+    # =========================================================================
+    # Step 3: Create numpy array (ZERO COPY - same memory!)
+    # =========================================================================
+    start = time.perf_counter()
+    arr = np.frombuffer(view, dtype=np.uint8)
+    arr_time = time.perf_counter() - start
+    print(f"\n✓ Numpy array: {arr_time * 1e6:.1f} µs (ZERO COPY)")
+    print(f"  Shape: {arr.shape}")
+    print(f"  Dtype: {arr.dtype}")
+    print(f"  Size: {arr.nbytes:,} bytes")
+    # =========================================================================
+    # Verification: All share same memory
+    # =========================================================================
+    print("\n" + "=" * 60)
+    print("VERIFICATION: All three share the SAME memory location")
+    print("=" * 60)
+    # Sample first 10 bytes
+    print(f"\nFirst 10 bytes:")
+    print(f"  Memoryview: {bytes(view[:10]).hex()}")
+    print(f"  Numpy: {arr[:10].tobytes().hex()}")
+    print(f"  ✓ Identical!")
+    # Total time breakdown
+    total_copy_time = view_time + arr_time
+    print(f"\n" + "=" * 60)
+    print(f"PERFORMANCE SUMMARY")
+    print(f"=" * 60)
+    print(f"Generation: {gen_time*1000:6.1f} ms  ({throughput:.2f} GB/s)")
+    print(f"Memoryview: {view_time*1e6:6.1f} µs  (zero-copy)")
+    print(f"Numpy:      {arr_time*1e6:6.1f} µs  (zero-copy)")
+    print(f"            {'-'*20}")
+    print(f"Total copy: {total_copy_time*1e6:6.1f} µs  (<< 1% overhead)")
+    # Memory efficiency
+    print(f"\n" + "=" * 60)
+    print(f"MEMORY EFFICIENCY")
+    print(f"=" * 60)
+    print(f"Without zero-copy: {size * 3 / (1024**2):.1f} MiB (3 copies)")
+    print(f"With zero-copy:    {size / (1024**2):.1f} MiB (1 allocation)")
+    print(f"Savings:           {size * 2 / (1024**2):.1f} MiB (66% reduction)")
+    print(f"\n" + "=" * 60)
+    print("✓ TRUE ZERO-COPY: Same performance as Rust!")
+    print("=" * 60)
+if __name__ == "__main__":
+    main()

dgen_py-0.1.2.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,271 @@
+Metadata-Version: 2.4
+Name: dgen-py
+Version: 0.1.2
+Classifier: Development Status :: 4 - Beta
+Classifier: Intended Audience :: Developers
+Classifier: License :: OSI Approved :: MIT License
+Classifier: License :: OSI Approved :: Apache Software License
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Rust
+Classifier: Topic :: Software Development :: Libraries
+Classifier: Topic :: System :: Benchmark
+Requires-Dist: numpy>=1.21.0
+Requires-Dist: zstandard>=0.25.0
+Requires-Dist: pytest>=8.0.0 ; extra == 'dev'
+Requires-Dist: pytest-benchmark>=4.0.0 ; extra == 'dev'
+Requires-Dist: maturin>=1.0.0 ; extra == 'dev'
+Requires-Dist: numpy>=2.0.0 ; extra == 'numpy'
+Provides-Extra: dev
+Provides-Extra: numpy
+License-File: LICENSE
+Summary: High-performance random data generation with NUMA optimization and zero-copy Python interface
+Keywords: data-generation,benchmark,numa,performance,zero-copy
+Author-email: Russ Fellows <russ.fellows@gmail.com>
+License: MIT OR Apache-2.0
+Requires-Python: >=3.10
+Description-Content-Type: text/markdown; charset=UTF-8; variant=GFM
+# dgen-rs / dgen-py
+**High-performance random data generation with controllable deduplication, compression, and NUMA optimization**
+[![License: MIT OR Apache-2.0](https://img.shields.io/badge/license-MIT%20OR%20Apache--2.0-blue)](LICENSE)
+[![Rust Version](https://img.shields.io/badge/rust-1.90+-orange.svg)](https://www.rust-lang.org)
+[![Python Version](https://img.shields.io/badge/python-3.10+-blue.svg)](https://www.python.org)
+[![Tests](https://img.shields.io/badge/tests-14%20passing-brightgreen.svg)](#testing)
+## Features
+- 🚀 **Blazing Fast**: 5-15 GB/s per core using Xoshiro256++ RNG
+- 🎯 **Controllable Characteristics**:
+  - Deduplication ratios (1:1 to N:1)
+  - Compression ratios (1:1 to N:1)
+- 🔬 **NUMA-Aware**: Automatic topology detection and optimization on multi-socket systems
+- 🐍 **Zero-Copy Python API**: Direct buffer writes, no unnecessary copies
+- 📦 **Both Simple and Streaming**: Single-call or incremental generation
+- 🛠️ **Built with Rust**: Memory-safe, production-quality code
+## Quick Start
+### Python Installation
+```bash
+# Install from PyPI (when published)
+pip install dgen-py
+# Or build from source
+cd dgen-rs
+maturin develop --release
+```
+### Python Usage
+**Simple API** (generate all at once):
+```python
+import dgen_py
+# Generate 100 MiB incompressible data
+data = dgen_py.generate_data(100 * 1024 * 1024)
+print(f"Generated {len(data)} bytes")
+# Generate with 2:1 dedup and 3:1 compression
+data = dgen_py.generate_data(
+    size=100 * 1024 * 1024,
+    dedup_ratio=2.0,
+    compress_ratio=3.0
+)
+```
+**Zero-Copy API** (write into existing buffer):
+```python
+import dgen_py
+import numpy as np
+# Pre-allocate buffer
+buf = bytearray(1024 * 1024)
+# Generate directly into buffer (zero-copy!)
+nbytes = dgen_py.fill_buffer(buf, compress_ratio=2.0)
+print(f"Wrote {nbytes} bytes")
+# Works with NumPy arrays
+arr = np.zeros(100 * 1024 * 1024, dtype=np.uint8)
+dgen_py.fill_buffer(arr, dedup_ratio=2.0, compress_ratio=3.0)
+```
+**Streaming API** (incremental generation):
+```python
+import dgen_py
+# Create generator for 1 GiB
+gen = dgen_py.Generator(
+    size=1024 * 1024 * 1024,
+    dedup_ratio=2.0,
+    compress_ratio=3.0,
+    numa_aware=True  # Auto-detected by default
+)
+# Generate in chunks
+chunk_size = 8192
+buf = bytearray(chunk_size)
+total = 0
+while not gen.is_complete():
+    nbytes = gen.fill_chunk(buf)
+    if nbytes == 0:
+        break
+    total += nbytes
+    # Process chunk (write to file, network, etc.)
+    # ...
+print(f"Generated {total} bytes")
+```
+**NUMA Information**:
+```python
+import dgen_py
+info = dgen_py.get_system_info()
+if info:
+    print(f"NUMA nodes: {info['num_nodes']}")
+    print(f"Physical cores: {info['physical_cores']}")
+    print(f"Deployment: {info['deployment_type']}")
+```
+### Rust Usage
+```rust
+use dgen_rs::{generate_data_simple, GeneratorConfig, DataGenerator};
+// Simple API
+let data = generate_data_simple(100 * 1024 * 1024, 1, 1);
+// Full configuration
+let config = GeneratorConfig {
+    size: 100 * 1024 * 1024,
+    dedup_factor: 2,
+    compress_factor: 3,
+    numa_aware: true,
+};
+let data = dgen_rs::generate_data(config);
+// Streaming
+let mut gen = DataGenerator::new(config);
+let mut chunk = vec![0u8; 8192];
+while !gen.is_complete() {
+    let written = gen.fill_chunk(&mut chunk);
+    if written == 0 {
+        break;
+    }
+    // Process chunk...
+}
+```
+## How It Works
+### Deduplication
+Deduplication ratio `N` means:
+- Generate `total_blocks / N` unique blocks
+- Reuse blocks in round-robin fashion
+- Example: 100 blocks, dedup=2 → 50 unique blocks, repeated 2x each
+### Compression
+Compression ratio `N` means:
+- Fill block with high-entropy Xoshiro256++ keystream
+- Add local back-references to achieve N:1 compressibility
+- Example: compress=3 → zstd will compress to ~33% of original size
+**compress=1**: Truly incompressible (zstd ratio ~1.00-1.02)
+**compress>1**: Target ratio via local back-refs, evenly distributed
+### NUMA Optimization
+On multi-socket systems (NUMA nodes > 1):
+- Detects topology via `/sys/devices/system/node` (Linux)
+- Can pin rayon threads to specific NUMA nodes (optional)
+- Ensures memory locality for maximum bandwidth
+## Performance
+Typical throughput on modern CPUs:
+- **Incompressible** (compress=1): 5-15 GB/s per core
+- **Compressible** (compress=3): 1-4 GB/s per core
+- **Multi-core**: Near-linear scaling with rayon
+Benchmark on AMD EPYC 7742 (64 cores):
+```
+Incompressible:  ~500 GB/s (all cores)
+Compress 3:1:    ~150 GB/s (all cores)
+```
+## Algorithm Details
+Based on s3dlio's `data_gen_alt.rs`:
+1. **Block-level generation**: 4 MiB blocks processed in parallel
+2. **Xoshiro256++**: 5-10x faster than ChaCha20, cryptographically strong
+3. **Integer error accumulation**: Even compression distribution
+4. **No cross-block compression**: Realistic compressor behavior
+5. **Per-call entropy**: Unique data across distributed nodes
+## Use Cases
+- **Storage benchmarking**: Generate realistic test data
+- **Network testing**: High-throughput data sources
+- **AI/ML profiling**: Simulate data loading pipelines
+- **Compression testing**: Validate compressor behavior
+- **Deduplication testing**: Test dedup ratios
+## Building from Source
+```bash
+# Clone repository
+git clone https://github.com/russfellows/dgen-rs.git
+cd dgen-rs
+# Build Rust library
+cargo build --release
+# Build Python wheel
+maturin build --release
+# Install locally
+maturin develop --release
+# Run tests
+cargo test
+python -m pytest python/tests/
+```
+## Requirements
+- **Rust**: 1.90+ (edition 2021)
+- **Python**: 3.10+ (for Python bindings)
+- **Platform**: Linux (NUMA detection required)
+## License
+Dual-licensed under MIT OR Apache-2.0
+## Credits
+- Data generation algorithm ported from [s3dlio](https://github.com/russfellows/s3dlio)
+- Built with [PyO3](https://pyo3.rs/) and [Maturin](https://www.maturin.rs/)
+## See Also
+- **s3dlio**: High-performance multi-protocol storage I/O
+- **sai3-bench**: Multi-protocol I/O benchmarking suite
+- **kv-cache-bench**: LLM KV cache storage benchmarking

dgen_py-0.1.2.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,14 @@
+dgen_py/__init__.py,sha256=79ZYgtU8WmD_mBKvnJ5iFS4jWgr-4kwHy2ZkN1EyQsA,5168
+dgen_py/__init__.pyi,sha256=gkd3mNrCwYd2I1eLB7SlsqcJCVTfxV04VH2ZlgFSZXQ,1359
+dgen_py/_dgen_rs.cpython-310-x86_64-linux-gnu.so,sha256=9Zh6z6rd0H041R04cx-sX4faLpeuzvrwqZIP3d8rn9Y,850000
+dgen_py/docs/PERFORMANCE.md,sha256=4iBLdr40G_9WVgOV05fyh8is4d4oYhY9MMlUU4trezo,7615
+dgen_py/examples/README.md,sha256=ds1pNjwAZnL0LXhe0EVMDuCsFxezt5N9qpMlvvjNJXQ,5033
+dgen_py/examples/benchmark_cpu_numa.py,sha256=N0Z6h-lf8GxdN9fKv782i2eg65385kNGOPDB2dsvnyw,11500
+dgen_py/examples/benchmark_vs_numpy.py,sha256=rTuN93XpUv_STzTn1HYkmP_dw1YYjUxd1bhUre_LDnQ,4711
+dgen_py/examples/demo.py,sha256=_YlWxqVZockT3Lv6aWcYZ5WIr3KZLoCd9e4hQ_Lujwg,3161
+dgen_py/examples/quick_perf_test.py,sha256=o2GFu74gPKhEEldTeEI6CLgBeXRuZPJDfeb_g-mDzik,3360
+dgen_py/examples/zero_copy_demo.py,sha256=WTrg8o5t5HGYgoy4I2UxbUi5POQ2K8iyPz7wPlopSo4,3473
+dgen_py-0.1.2.dist-info/METADATA,sha256=poGy_DeXvtGuU2bkFq3qj_aNXJee9IU7nlboud7U_cc,7276
+dgen_py-0.1.2.dist-info/WHEEL,sha256=eoKEw9I9Gn4nu_ZUo2vZXZfzt_PDszeNEndfEj9KkmQ,109
+dgen_py-0.1.2.dist-info/licenses/LICENSE,sha256=ZG2WWfkEUQMV0SWnn4DKVsF-2BRjQjmuCxIA9hxmJzY,1648
+dgen_py-0.1.2.dist-info/RECORD,,

dgen_py-0.1.2.dist-info/WHEEL ADDED Viewed

@@ -0,0 +1,4 @@
+Wheel-Version: 1.0
+Generator: maturin (1.11.2)
+Root-Is-Purelib: false
+Tag: cp310-cp310-manylinux_2_24_x86_64

dgen_py-0.1.2.dist-info/licenses/LICENSE ADDED Viewed

@@ -0,0 +1,39 @@
+MIT License
+Copyright (c) 2026 Russ Fellows
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+---
+Apache License 2.0
+Copyright 2026 Russ Fellows
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+    http://www.apache.org/licenses/LICENSE-2.0
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.