masster 0.5.20-py3-none-any.whl → 0.5.22-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of masster might be problematic.
- masster/_version.py +1 -1
- masster/wizard/wizard.py +18 -17
- {masster-0.5.20.dist-info → masster-0.5.22.dist-info}/METADATA +1 -1
- {masster-0.5.20.dist-info → masster-0.5.22.dist-info}/RECORD +7 -9
- masster/wizard/README.md +0 -373
- masster/wizard/example.py +0 -223
- {masster-0.5.20.dist-info → masster-0.5.22.dist-info}/WHEEL +0 -0
- {masster-0.5.20.dist-info → masster-0.5.22.dist-info}/entry_points.txt +0 -0
- {masster-0.5.20.dist-info → masster-0.5.22.dist-info}/licenses/LICENSE +0 -0
masster/_version.py
CHANGED
masster/wizard/wizard.py
CHANGED
@@ -818,7 +818,8 @@ class Wizard:
 '',
 '@app.cell',
 'def __(masster):',
-' study = masster.Study(folder=
+f' study = masster.Study(folder={str(self.folder_path)!r})',
+' study.load()',
 ' return (study,)',
 '',
 '@app.cell',
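The first hunk changes the study-loading cell that the wizard writes into the generated marimo notebook: the folder is now interpolated with `!r`, and a `study.load()` call is added. A minimal sketch of what the emitted line looks like, assuming a hypothetical Windows study folder (the `!r` conversion repr-quotes the path so backslashes survive in the generated source):

```python
# Sketch only: reproduces the f-string from the new line in the diff.
# folder_path is a hypothetical value; wizard.py uses self.folder_path.
from pathlib import Path

folder_path = Path(r"D:\Data\processed_study")
emitted = f"    study = masster.Study(folder={str(folder_path)!r})"
print(emitted)
# ->     study = masster.Study(folder='D:\\Data\\processed_study')
```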
@@ -838,7 +839,7 @@ class Wizard:
 f"Polarity detected: {source_info.get('polarity', 'unknown')}",
 "Files created:"]
 for file_path in files_created:
-instructions.append(f"
+instructions.append(f" [OK] {str(Path(file_path).resolve())}")

 # Find the workflow script name from created files
 workflow_script_name = "1_masster_workflow.py"
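The second hunk makes the "Files created:" instructions list report absolute paths with an `[OK]` tag. A small illustration of the appended string, using a made-up relative file path:

```python
# Illustration of the new instructions line; file_path is a hypothetical example.
from pathlib import Path

file_path = "1_masster_workflow.py"
print(f" [OK] {str(Path(file_path).resolve())}")
# e.g.  [OK] /home/user/study/1_masster_workflow.py
```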
@@ -877,7 +878,7 @@ class Wizard:
 # Add test mode print after the masster version line
 if 'print("masster' in line and 'Automated MS Data Analysis")' in line:
 lines.insert(i + 1, ' if TEST_MODE:')
-lines.insert(i + 2, ' print("
+lines.insert(i + 2, ' print("[TEST] TEST MODE: Processing single file only")')
 break

 # Add mode info after num_cores print
@@ -894,7 +895,7 @@ class Wizard:
 lines.insert(i + 2, ' # Limit to first file in test mode')
 lines.insert(i + 3, ' if TEST_MODE:')
 lines.insert(i + 4, ' raw_files = raw_files[:1]')
-lines.insert(i + 5, ' print(f"\\n
+lines.insert(i + 5, ' print(f"\\n[TEST] TEST MODE: Processing only first file: {raw_files[0].name}")')
 break

 # Modify num_cores for test mode
@@ -909,7 +910,7 @@ class Wizard:
 lines.insert(i + 1, ' ')
 lines.insert(i + 2, ' # Stop here if test-only mode')
 lines.insert(i + 3, ' if TEST_ONLY:')
-lines.insert(i + 4, ' print("\\n
+lines.insert(i + 4, ' print("\\n[TEST] TEST ONLY mode: Stopping after successful single file processing")')
 lines.insert(i + 5, ' print(f"Test file created: {sample5_files[0]}")')
 lines.insert(i + 6, ' print("\\nTo run full batch, use: wizard.run()")')
 lines.insert(i + 7, ' total_time = time.time() - start_time')
@@ -985,7 +986,7 @@ class Wizard:
 "status": "error",
 "message": "Workflow script not found. Please run create_scripts() first.",
 "instructions": [
-"
+"[ERROR] Missing 1_masster_workflow.py",
 "Run: wizard.create_scripts()",
 "Then: wizard.run()"
 ]
@@ -1008,8 +1009,8 @@ class Wizard:
 env['MASSTER_TEST_ONLY'] = '1'

 # Execute the workflow script
-print(f"
-print(f"
+print(f">> Executing {mode_label} processing workflow...")
+print(f"[SCRIPT] Running: {workflow_script_path.name}")
 print("=" * 60)

 import subprocess
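This hunk sits where the wizard launches the generated workflow script after exporting the `MASSTER_TEST_ONLY` flag; only the two banner `print` calls change. The actual invocation is not shown in the hunk, so the following is a hedged sketch of the general pattern (script name, working directory, and the exact `subprocess` call are assumptions):

```python
# Hedged sketch of running a generated workflow script in a child process
# with test-mode flags passed through the environment. Not the literal
# wizard.py code; paths are illustrative.
import os
import subprocess
import sys

env = os.environ.copy()
env["MASSTER_TEST_ONLY"] = "1"

print(">> Executing test-only processing workflow...")
print("[SCRIPT] Running: 1_masster_workflow.py")
result = subprocess.run([sys.executable, "1_masster_workflow.py"], env=env)
success = result.returncode == 0
```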
@@ -1022,16 +1023,16 @@ class Wizard:
 if success:
 print("=" * 60)
 if test_only:
-print("
-print("
+print("[OK] Test-only processing completed successfully!")
+print("[INFO] Single file validated - ready for full batch")
 print(" wizard.run()")
 elif test_mode:
-print("
-print("
+print("[OK] Test processing completed successfully!")
+print("[INFO] Next step: Run full batch")
 print(" wizard.run()")
 else:
-print("
-print("
+print("[OK] Sample processing completed successfully!")
+print("[INFO] Next step: Run interactive analysis")
 print(" uv run marimo edit 2_interactive_analysis.py")
 print("=" * 60)

@@ -1042,7 +1043,7 @@ class Wizard:
 "status": "success",
 "message": f"{mode_label.capitalize()} processing completed successfully",
 "instructions": [
-f"
+f"[OK] {mode_label.capitalize()} processing completed",
 next_step
 ]
 }
@@ -1051,7 +1052,7 @@ class Wizard:
 "status": "error",
 "message": f"Workflow execution failed with return code {result.returncode}",
 "instructions": [
-"
+"[ERROR] Check the error messages above",
 "Review parameters in 1_masster_workflow.py",
 f"Try running manually: python {workflow_script_path.name}"
 ]
@@ -1062,7 +1063,7 @@ class Wizard:
 "status": "error",
 "message": f"Failed to execute workflow: {e}",
 "instructions": [
-"
+"[ERROR] Execution failed",
 "Check that source files exist and are accessible",
 "Verify folder permissions"
 ]
{masster-0.5.20.dist-info → masster-0.5.22.dist-info}/RECORD
CHANGED

@@ -1,5 +1,5 @@
 masster/__init__.py,sha256=B7zftzdElF2Wb5B7KvkD6TONnMIY-Jxeen3s49dgmzs,1029
-masster/_version.py,sha256=
+masster/_version.py,sha256=4HOjpCuCuNY78DZ2P_GWL7HWMcoGK_P8IwMz9LKoTq0,257
 masster/chromatogram.py,sha256=iYpdv8C17zVnlWvOFgAn9ns2uFGiF-GgoYf5QVVAbHs,19319
 masster/logger.py,sha256=XT2gUcUIct8LWzTp9n484g5MaB89toT76CGA41oBvfA,18375
 masster/spectrum.py,sha256=TWIgDcl0lveG40cLVZTWGp8-FxMolu-P8EjZyRBtXL4,49850
@@ -59,12 +59,10 @@ masster/study/defaults/integrate_chrom_def.py,sha256=0MNIWGTjty-Zu-NTQsIweuj3UVq
 masster/study/defaults/integrate_def.py,sha256=Vf4SAzdBfnsSZ3IRaF0qZvWu3gMDPHdgPfMYoPKeWv8,7246
 masster/study/defaults/merge_def.py,sha256=krR099IkENLlJVxpSjdje3E6h-_qtlc3Ep6Hpy6inrU,12978
 masster/study/defaults/study_def.py,sha256=h8dYbi9xv0sesCSQik49Z53IkskMmNtW6ixl7it5pL0,16033
-masster/wizard/README.md,sha256=RX3uxT1qD5i9iDSznZUbnukixonqr96JlUE4TwssAgY,14111
 masster/wizard/__init__.py,sha256=L9G_datyGSFJjrBVklEVpZVLGXzUhDiWobtiygBH8vQ,669
-masster/wizard/
-masster/
-masster-0.5.
-masster-0.5.
-masster-0.5.
-masster-0.5.
-masster-0.5.20.dist-info/RECORD,,
+masster/wizard/wizard.py,sha256=aTNVhYoMK5B1uR2zrdbwEyZX-Zd86e4sUGhkQ2bgiDo,65352
+masster-0.5.22.dist-info/METADATA,sha256=tLbIWPgMewKVqyz7MSbwLZZY5JOPUaEfYMx-q5w4rkk,45153
+masster-0.5.22.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+masster-0.5.22.dist-info/entry_points.txt,sha256=ZHguQ_vPmdbpqq2uGtmEOLJfgP-DQ1T0c07Lxh30wc8,58
+masster-0.5.22.dist-info/licenses/LICENSE,sha256=bx5iLIKjgAdYQ7sISn7DsfHRKkoCUm1154sJJKhgqnU,35184
+masster-0.5.22.dist-info/RECORD,,
masster/wizard/README.md
DELETED
@@ -1,373 +0,0 @@
# Wizard Class Documentation

The `Wizard` class provides comprehensive automation for mass spectrometry data processing, from raw files to final study results. It handles the complete workflow with minimal user intervention while providing intelligent resume capabilities, parallel processing optimization, and adaptive output formats.

## Quick Start

### Basic Usage

```python
from masster import Wizard

# Create wizard with minimal configuration
wizard = Wizard(
    data_source="./raw_data",    # Directory with raw files
    study_folder="./processed",  # Output directory
    polarity="positive",         # or "negative"
    num_cores=4                  # CPU cores to use
)

# Run complete pipeline
success = wizard.run_full_pipeline()

if success:
    wizard.info()  # Print summary
```

### Advanced Configuration

```python
from masster import Wizard, wizard_def

# Create custom parameters
params = wizard_def(
    data_source="./raw_data",
    study_folder="./processed_advanced",
    polarity="negative",
    num_cores=8,

    # File discovery
    file_extensions=[".wiff", ".raw", ".mzML"],
    search_subfolders=True,
    skip_patterns=["blank", "QC", "test"],

    # Processing parameters
    adducts=["H-1:-:0.95", "Cl:-:0.05", "CH2O2:0:0.2"],
    chrom_fwhm=0.15,
    noise_threshold=5e4,

    # Study assembly
    rt_tolerance=1.0,
    mz_tolerance=0.008,
    min_samples_for_merge=30,

    # Output options
    export_formats=["csv", "xlsx", "mgf", "parquet"],
    generate_plots=True,
    compress_output=True,
)

wizard = Wizard(params=params)
wizard.run_full_pipeline()
```

## Key Features

### 🔄 Automated Pipeline
- **Raw Data Discovery**: Automatically finds and validates raw MS files
- **Batch Conversion**: Parallel conversion to sample5 format with optimized parameters
- **Study Assembly**: Creates study from processed samples with quality filtering
- **Feature Alignment**: Cross-sample alignment using configurable algorithms
- **Consensus Generation**: Merges aligned features with statistical validation
- **Results Export**: Multiple output formats for downstream analysis

### 💾 Intelligent Resume
- **Checkpoint System**: Automatically saves progress at key points
- **File Tracking**: Remembers which files have been processed successfully
- **Smart Recovery**: Resumes from last successful step after interruption
- **Validation**: Verifies existing outputs before skipping

A minimal resume sketch appears at the end of this section.

### ⚡ Performance Optimization
- **Parallel Processing**: Utilizes multiple CPU cores efficiently
- **Memory Management**: Adaptive batch sizing based on available memory
- **Process Isolation**: Prevents memory leaks in long-running jobs
- **Adaptive Compression**: Optimizes output format based on study size

### 📊 Comprehensive Logging
- **Progress Tracking**: Real-time status updates with time estimates
- **Detailed Logs**: Complete processing history saved to files
- **Error Reporting**: Clear error messages with recovery suggestions
- **Performance Metrics**: Processing times and resource usage statistics

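The resume behaviour described under Intelligent Resume amounts to re-creating the wizard with the same parameters. A minimal sketch, assuming the same folders as the Quick Start example:

```python
# Minimal resume sketch (assumed paths). With resume_enabled=True (the
# default), the wizard reloads its checkpoint and skips completed work.
from masster import Wizard

wizard = Wizard(
    data_source="./raw_data",
    study_folder="./processed",
    polarity="positive",
    num_cores=4,
    resume_enabled=True,
)
wizard.info()               # report which steps the checkpoint marks as done
wizard.run_full_pipeline()  # continue from the last successful step
```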
## Pipeline Steps

### 1. File Discovery
- Searches for raw MS files (`.wiff`, `.raw`, `.mzML`, `.d`)
- Applies skip patterns to exclude unwanted files
- Validates file integrity and accessibility
- Reports file sizes and estimates processing time

### 2. Sample5 Conversion
- **Feature Detection**: Two-pass algorithm with configurable parameters
- **Adduct Detection**: Automated adduct grouping based on polarity
- **MS2 Linking**: Associates fragmentation spectra with features
- **Quality Control**: Validates outputs and reports statistics
- **Parallel Processing**: Utilizes multiple CPU cores with batch optimization

### 3. Study Assembly
- **Sample Loading**: Imports all processed sample5 files
- **Quality Filtering**: Removes low-quality features based on coherence/prominence
- **Metadata Organization**: Organizes sample information and experimental design
- **Memory Optimization**: Efficient data structures for large studies

### 4. Feature Alignment
- **RT Alignment**: Corrects retention time shifts between samples
- **Mass Alignment**: Accounts for mass calibration differences
- **Algorithm Selection**: Supports KD-tree, QT-clustering, and chunked methods
- **Validation**: Reports alignment statistics and quality metrics

### 5. Consensus Generation
- **Feature Merging**: Groups aligned features into consensus features
- **Statistical Validation**: Applies minimum sample requirements
- **Gap Filling**: Extracts chromatograms for missing values
- **MS2 Integration**: Links consensus features to MS2 spectra

### 6. Visualization & Export
- **Interactive Plots**: 2D feature maps, PCA plots, alignment visualizations
- **Multiple Formats**: CSV, Excel, MGF, Parquet exports
- **Study Archival**: Compressed study5 format for long-term storage
- **Metadata Export**: Complete processing parameters and statistics

## Configuration Options

### Core Parameters

| Parameter | Type | Default | Description |
|-----------|------|---------|-------------|
| `data_source` | str | **required** | Directory containing raw data files |
| `study_folder` | str | **required** | Output directory for processed study |
| `polarity` | str | `"positive"` | Ion polarity mode (`"positive"` or `"negative"`) |
| `num_cores` | int | `4` | Number of CPU cores for parallel processing |
| `adducts` | List[str] | auto-set | Adduct specifications (set based on polarity) |

### File Discovery

| Parameter | Type | Default | Description |
|-----------|------|---------|-------------|
| `file_extensions` | List[str] | `[".wiff", ".raw", ".mzML", ".d"]` | File types to search for |
| `search_subfolders` | bool | `True` | Search subdirectories recursively |
| `skip_patterns` | List[str] | `["blank", "QC", "test"]` | Filename patterns to skip |
| `max_file_size_gb` | float | `4.0` | Maximum file size warning threshold |

### Processing Parameters

| Parameter | Type | Default | Description |
|-----------|------|---------|-------------|
| `batch_size` | int | `8` | Files processed per batch |
| `memory_limit_gb` | float | `16.0` | Memory usage limit |
| `chrom_fwhm` | float | `0.2` | Expected chromatographic peak width (s) |
| `noise_threshold` | float | `1e5` | Intensity threshold for peak detection |
| `chrom_peak_snr` | float | `5.0` | Signal-to-noise ratio requirement |
| `tol_ppm` | float | `10.0` | Mass tolerance (ppm) |

### Study Assembly

| Parameter | Type | Default | Description |
|-----------|------|---------|-------------|
| `rt_tolerance` | float | `1.5` | RT tolerance for alignment (seconds) |
| `mz_tolerance` | float | `0.01` | m/z tolerance for alignment (Da) |
| `alignment_algorithm` | str | `"kd"` | Alignment algorithm (`"kd"`, `"qt"`, `"chunked"`) |
| `merge_method` | str | `"chunked"` | Merge algorithm for consensus generation |
| `min_samples_for_merge` | int | `50` | Minimum samples required for consensus |

### Output & Logging

| Parameter | Type | Default | Description |
|-----------|------|---------|-------------|
| `generate_plots` | bool | `True` | Generate visualization plots |
| `export_formats` | List[str] | `["csv", "mgf", "xlsx"]` | Output formats to generate |
| `compress_output` | bool | `True` | Compress final study file |
| `adaptive_compression` | bool | `True` | Adapt compression based on study size |
| `log_level` | str | `"INFO"` | Logging detail level |
| `log_to_file` | bool | `True` | Save logs to file |

### Resume & Recovery

| Parameter | Type | Default | Description |
|-----------|------|---------|-------------|
| `resume_enabled` | bool | `True` | Enable automatic resume capability |
| `force_reprocess` | bool | `False` | Force reprocessing of existing files |
| `backup_enabled` | bool | `True` | Create backups of intermediate results |
| `checkpoint_interval` | int | `10` | Save progress every N files |
| `cleanup_temp_files` | bool | `True` | Remove temporary files after completion |

## Methods

### Pipeline Control

#### `run_full_pipeline() -> bool`
Executes the complete processing pipeline in sequence. Returns `True` if successful.

#### Individual Steps
- `discover_files() -> List[Path]` - Find raw data files
- `convert_to_sample5(file_list=None) -> bool` - Convert to sample5 format
- `assemble_study() -> bool` - Create study from sample5 files
- `align_and_merge() -> bool` - Perform feature alignment and merging
- `generate_plots() -> bool` - Create visualization plots
- `export_results() -> bool` - Export in requested formats
- `save_study() -> bool` - Save final study file
- `cleanup_temp_files() -> bool` - Remove temporary files

### Status & Information

#### `info()`
Prints comprehensive wizard status including progress, timings, and results.

#### `get_status() -> Dict[str, Any]`
Returns detailed status dictionary with current step, processed files, timing, and parameters.

## Error Handling & Recovery

### Common Issues and Solutions

**Memory Errors**
- Reduce `batch_size` parameter
- Increase `memory_limit_gb` if available
- Use `merge_method="chunked"` for large studies
- Enable `cleanup_temp_files=True`

**File Access Errors**
- Check file permissions on source and destination folders
- Verify network connectivity for remote file systems
- Ensure sufficient disk space in output directory
- Close any applications that might lock files

**Processing Failures**
- Check individual file integrity
- Review `skip_patterns` to exclude problematic files
- Examine detailed logs in `wizard.log` and `processing.log`
- Try processing failed files individually for debugging

**Resume Issues**
- Delete `wizard_checkpoint.json` to force fresh start
- Verify output directory permissions
- Check for corrupted intermediate files

A snippet that clears the checkpoint appears at the end of this section.

### Validation and Quality Control

The Wizard includes built-in validation at each step:

- **File Validation**: Checks file accessibility and format compatibility
- **Processing Validation**: Verifies sample5 outputs can be loaded
- **Study Validation**: Ensures study assembly completed successfully
- **Alignment Validation**: Reports alignment statistics and warnings
- **Export Validation**: Confirms all requested outputs were created

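For the Resume Issues case above, forcing a fresh start is a one-liner; a sketch, assuming the checkpoint file lives in the study folder (its exact location is an assumption):

```python
# Remove the checkpoint so the next run reprocesses everything.
# "./processed" is a placeholder study folder.
from pathlib import Path

checkpoint = Path("./processed") / "wizard_checkpoint.json"
if checkpoint.exists():
    checkpoint.unlink()
    print("Checkpoint removed - next run starts fresh")
```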
## Performance Guidelines

### System Requirements
- **Minimum**: 4 CPU cores, 8 GB RAM
- **Recommended**: 8+ CPU cores, 16+ GB RAM
- **Large Studies**: 16+ CPU cores, 32+ GB RAM
- **Storage**: SSD recommended, ~2-3x raw data size free space

### Optimization Tips

A sketch mapping the large-study tips onto `wizard_def` appears at the end of this section.

**For Small Studies (< 50 samples)**
- Use `num_cores = 4-6`
- Set `batch_size = 4-8`
- Use `merge_method = "kd"`
- Enable all export formats

**For Large Studies (100+ samples)**
- Use `num_cores = 8-16`
- Set `batch_size = 16-32`
- Use `merge_method = "chunked"`
- Enable `adaptive_compression = True`
- Consider processing in polarity-specific batches

**For Very Large Studies (500+ samples)**
- Process positive/negative modes separately
- Use `memory_limit_gb = 64+`
- Set `checkpoint_interval = 50`
- Enable `cleanup_temp_files = True`
- Consider cluster/cloud processing

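The large-study tips above map directly onto `wizard_def` parameters; a sketch with assumed paths and the values suggested in the lists:

```python
# Example settings for a 100+ sample study; folder paths are placeholders.
from masster import Wizard, wizard_def

params = wizard_def(
    data_source="./raw_data",
    study_folder="./processed_large",
    polarity="positive",
    num_cores=16,
    batch_size=32,
    merge_method="chunked",
    adaptive_compression=True,
    checkpoint_interval=50,
    cleanup_temp_files=True,
)
Wizard(params=params).run_full_pipeline()
```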
## Integration Examples

### With Existing Workflows

```python
# Integration with custom preprocessing
wizard = Wizard(data_source="./preprocessed", ...)

# Skip conversion if already done
if not wizard.study_folder_path.glob("*.sample5"):
    wizard.convert_to_sample5()

# Continue with study-level processing
wizard.assemble_study()
wizard.align_and_merge()
wizard.export_results()
```

### Batch Processing Multiple Studies

```python
studies = [
    {"source": "./batch1", "output": "./results/batch1", "polarity": "pos"},
    {"source": "./batch2", "output": "./results/batch2", "polarity": "neg"},
]

for study_config in studies:
    wizard = Wizard(**study_config, num_cores=8)
    success = wizard.run_full_pipeline()

    if success:
        print(f"✅ {study_config['output']} completed")
    else:
        print(f"❌ {study_config['output']} failed")
```

### Custom Processing Steps

```python
wizard = Wizard(...)

# Standard conversion
wizard.convert_to_sample5()

# Custom study assembly with specific parameters
wizard.assemble_study()

# Custom filtering before alignment
if hasattr(wizard.study, 'features_filter'):
    selection = wizard.study.features_select(
        chrom_coherence=0.5,  # Higher quality threshold
        chrom_prominence_scaled=2.0
    )
    wizard.study.features_filter(selection)

# Continue with standard pipeline
wizard.align_and_merge()
wizard.generate_plots()
```

## Output Files

The Wizard generates several types of output files:

### Primary Results
- `final_study.study5` - Complete study in masster native format
- `consensus_features.csv` - Feature table with RT, m/z, intensity data
- `study_results.xlsx` - Multi-sheet Excel workbook with results and metadata
- `consensus_ms2.mgf` - MS2 spectra for database searching

### Visualizations
- `alignment_plot.html` - Interactive alignment visualization
- `consensus_2d.html` - 2D feature map of consensus features
- `pca_plot.html` - Principal component analysis plot
- `consensus_stats.html` - Study statistics and quality metrics

### Processing Logs
- `wizard.log` - Detailed processing log with debug information
- `processing.log` - Simple progress log with timestamps
- `study_metadata.txt` - Study summary with parameters and statistics

### Individual Sample Outputs (if enabled)
- `sample_name.sample5` - Processed sample in masster format
- `sample_name.features.csv` - Individual sample feature table
- `sample_name.mgf` - Individual sample MS2 spectra
- `sample_name_2d.html` - Individual sample 2D plot

The Wizard provides a complete, automated solution for mass spectrometry data processing while maintaining flexibility for custom workflows and providing robust error handling and recovery capabilities.
masster/wizard/example.py
DELETED
@@ -1,223 +0,0 @@
#!/usr/bin/env python3
"""
Example script demonstrating the Wizard class for automated study processing.

This script shows how to use the Wizard class to automatically process
mass spectrometry data from raw files to final study results.
"""

from pathlib import Path
from masster import Wizard, wizard_def

def main():
    """Main example function."""

    # =================================================================
    # EXAMPLE 1: Basic Usage with Minimal Configuration
    # =================================================================
    print("=== Example 1: Basic Wizard Usage ===\n")

    # Set up paths (adjust these for your data)
    data_source = r"D:\Data\raw_files"         # Directory with .wiff, .raw, .mzML files
    study_folder = r"D:\Data\processed_study"  # Output directory

    # Create wizard with basic settings
    wizard = Wizard(
        data_source=data_source,
        study_folder=study_folder,
        polarity="positive",  # or "negative"
        num_cores=4
    )

    # Run the complete pipeline
    success = wizard.run_full_pipeline()

    if success:
        print("✅ Processing completed successfully!")
        wizard.info()  # Print status summary
    else:
        print("❌ Processing failed. Check logs for details.")

    print("\n" + "="*60 + "\n")

    # =================================================================
    # EXAMPLE 2: Advanced Configuration with Custom Parameters
    # =================================================================
    print("=== Example 2: Advanced Wizard Configuration ===\n")

    # Create custom parameters
    params = wizard_def(
        # Core settings
        data_source=data_source,
        study_folder=study_folder + "_advanced",
        polarity="negative",
        num_cores=8,

        # File discovery settings
        file_extensions=[".wiff", ".raw", ".mzML"],
        search_subfolders=True,
        skip_patterns=["blank", "QC", "test", "solvent"],

        # Processing parameters
        adducts=["H-1:-:0.95", "Cl:-:0.05", "CH2O2:0:0.2"],
        batch_size=4,          # Process 4 files at once
        memory_limit_gb=32.0,

        # Feature detection parameters
        chrom_fwhm=0.15,       # Narrower peaks for UHPLC
        noise_threshold=5e4,   # Lower noise threshold
        chrom_peak_snr=7.0,    # Higher S/N requirement
        tol_ppm=8.0,           # Tighter mass tolerance

        # Study assembly parameters
        rt_tolerance=1.0,           # Tighter RT tolerance
        mz_tolerance=0.008,         # Tighter m/z tolerance
        min_samples_for_merge=30,   # Require feature in at least 30 samples
        merge_method="chunked",     # Memory-efficient merging

        # Output options
        generate_plots=True,
        generate_interactive=True,
        export_formats=["csv", "xlsx", "mgf", "parquet"],
        compress_output=True,
        adaptive_compression=True,

        # Advanced options
        resume_enabled=True,     # Can resume if interrupted
        force_reprocess=False,   # Skip already processed files
        backup_enabled=True,
        cleanup_temp_files=True,
        log_level="INFO",
        verbose_progress=True,
    )

    # Create wizard with custom parameters
    wizard_advanced = Wizard(params=params)

    # You can also run individual steps for more control
    print("Running step-by-step processing...")

    # Step 1: Discover files
    files = wizard_advanced.discover_files()
    print(f"Found {len(files)} files for processing")

    # Step 2: Convert to sample5 (can be resumed if interrupted)
    if wizard_advanced.convert_to_sample5():
        print("✅ Sample5 conversion completed")

    # Step 3: Assemble study
    if wizard_advanced.assemble_study():
        print("✅ Study assembly completed")

    # Step 4: Align and merge
    if wizard_advanced.align_and_merge():
        print("✅ Alignment and merging completed")

    # Step 5: Generate plots
    if wizard_advanced.generate_plots():
        print("✅ Plot generation completed")

    # Step 6: Export results
    if wizard_advanced.export_results():
        print("✅ Results exported")

    # Step 7: Save final study
    if wizard_advanced.save_study():
        print("✅ Study saved")

    # Optional cleanup
    wizard_advanced.cleanup_temp_files()
    print("✅ Cleanup completed")

    # Print final status
    wizard_advanced.info()

    print("\n" + "="*60 + "\n")

    # =================================================================
    # EXAMPLE 3: Resume Interrupted Processing
    # =================================================================
    print("=== Example 3: Resume Capability ===\n")

    # If processing was interrupted, you can resume by creating a new wizard
    # with the same parameters. It will automatically detect and skip
    # already processed files.

    resume_wizard = Wizard(
        data_source=data_source,
        study_folder=study_folder + "_resume",
        polarity="positive",
        num_cores=4,
        resume_enabled=True  # This is the default
    )

    # The wizard will automatically load checkpoint and continue from where it left off
    print("Status after loading checkpoint:")
    resume_wizard.info()

    print("\n" + "="*60 + "\n")

    # =================================================================
    # EXAMPLE 4: Monitoring and Status
    # =================================================================
    print("=== Example 4: Status Monitoring ===\n")

    # You can check wizard status at any time
    status = wizard.get_status()
    print("Wizard Status:")
    for key, value in status.items():
        print(f" {key}: {value}")

    # The wizard maintains comprehensive logs
    log_file = Path(study_folder) / "wizard.log"
    if log_file.exists():
        print(f"\nDetailed logs available at: {log_file}")

    processing_log = Path(study_folder) / "processing.log"
    if processing_log.exists():
        print(f"Processing summary at: {processing_log}")


def example_batch_different_polarities():
    """Example of processing positive and negative mode data separately."""

    print("=== Processing Both Polarities ===\n")

    base_data_source = r"D:\Data\raw_files"
    base_output = r"D:\Data\processed_studies"

    # Process positive mode
    pos_wizard = Wizard(
        data_source=base_data_source + r"\positive",
        study_folder=base_output + r"\positive_study",
        polarity="positive",
        adducts=["H:+:0.8", "Na:+:0.1", "NH4:+:0.1"],
        num_cores=6
    )

    print("Processing positive mode data...")
    pos_success = pos_wizard.run_full_pipeline()

    # Process negative mode
    neg_wizard = Wizard(
        data_source=base_data_source + r"\negative",
        study_folder=base_output + r"\negative_study",
        polarity="negative",
        adducts=["H-1:-:0.95", "Cl:-:0.05"],
        num_cores=6
    )

    print("Processing negative mode data...")
    neg_success = neg_wizard.run_full_pipeline()

    print("\nResults:")
    print(f"Positive mode: {'✅ Success' if pos_success else '❌ Failed'}")
    print(f"Negative mode: {'✅ Success' if neg_success else '❌ Failed'}")


if __name__ == "__main__":
    # Run basic examples
    main()

    # Uncomment to run polarity-specific processing
    # example_batch_different_polarities()

File without changes
File without changes
File without changes