omnizip 0.3.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/.rspec +3 -0
- data/.rubocop.yml +32 -0
- data/.rubocop_todo.yml +754 -0
- data/COPYING +502 -0
- data/Gemfile +17 -0
- data/LICENSE +12 -0
- data/README.adoc +1045 -0
- data/Rakefile +12 -0
- data/benchmark/README.md +260 -0
- data/benchmark/benchmark_suite.rb +125 -0
- data/benchmark/compression_bench.rb +181 -0
- data/benchmark/filter_bench.rb +180 -0
- data/benchmark/models/benchmark_result.rb +59 -0
- data/benchmark/models/comparison_result.rb +69 -0
- data/benchmark/profile_suite.rb +167 -0
- data/benchmark/reporter.rb +150 -0
- data/benchmark/run_benchmarks.rb +66 -0
- data/benchmark/test_data.rb +137 -0
- data/config/formats/rar3_spec.yml +91 -0
- data/config/formats/rar5_spec.yml +102 -0
- data/docs/.github/workflows/docs.yml +142 -0
- data/docs/.gitignore +21 -0
- data/docs/.lychee.toml +67 -0
- data/docs/Gemfile +13 -0
- data/docs/RAR_WRITE_SUPPORT.md +26 -0
- data/docs/README.md +101 -0
- data/docs/_config.yml +112 -0
- data/docs/assets/logo.svg +1 -0
- data/docs/assets/omnizip-logo.pdf +1540 -11
- data/docs/comparison/feature-matrix.adoc +694 -0
- data/docs/comparison/index.adoc +113 -0
- data/docs/comparison/vs-7zip.adoc +309 -0
- data/docs/comparison/vs-peazip.adoc +77 -0
- data/docs/comparison/vs-rubyzip.adoc +342 -0
- data/docs/comparison/vs-winrar.adoc +100 -0
- data/docs/compatibility.adoc +579 -0
- data/docs/concepts/index.adoc +129 -0
- data/docs/developer/architecture.adoc +256 -0
- data/docs/developer/contributing.adoc +158 -0
- data/docs/developer/index.adoc +25 -0
- data/docs/developer/testing.adoc +212 -0
- data/docs/getting-started/basic-usage.adoc +271 -0
- data/docs/getting-started/index.adoc +42 -0
- data/docs/getting-started/installation.adoc +138 -0
- data/docs/getting-started/quick-start.adoc +185 -0
- data/docs/getting-started/your-first-archive.adoc +218 -0
- data/docs/guides/advanced-features/encryption.adoc +300 -0
- data/docs/guides/advanced-features/index.adoc +49 -0
- data/docs/guides/advanced-features/parallel-processing.adoc +246 -0
- data/docs/guides/advanced-features/progress-tracking.adoc +320 -0
- data/docs/guides/advanced-features/streaming.adoc +212 -0
- data/docs/guides/archive-formats/gzip-format.adoc +107 -0
- data/docs/guides/archive-formats/index.adoc +130 -0
- data/docs/guides/archive-formats/rar-format.adoc +104 -0
- data/docs/guides/archive-formats/rar5.adoc +521 -0
- data/docs/guides/archive-formats/seven-zip-format.adoc +35 -0
- data/docs/guides/archive-formats/tar-format.adoc +106 -0
- data/docs/guides/archive-formats/xz-format.adoc +118 -0
- data/docs/guides/archive-formats/zip-format.adoc +35 -0
- data/docs/guides/compression-algorithms/bzip2.adoc +113 -0
- data/docs/guides/compression-algorithms/deflate.adoc +319 -0
- data/docs/guides/compression-algorithms/index.adoc +190 -0
- data/docs/guides/compression-algorithms/lzma.adoc +398 -0
- data/docs/guides/compression-algorithms/lzma2.adoc +327 -0
- data/docs/guides/compression-algorithms/ppmd.adoc +316 -0
- data/docs/guides/compression-algorithms/zstandard.adoc +361 -0
- data/docs/guides/creating-archives.adoc +354 -0
- data/docs/guides/extracting-archives.adoc +53 -0
- data/docs/guides/format-conversion.adoc +64 -0
- data/docs/guides/index.adoc +49 -0
- data/docs/guides/migration-rubyzip.adoc +217 -0
- data/docs/guides/parity-archives.adoc +605 -0
- data/docs/guides/performance-tuning.adoc +88 -0
- data/docs/index.adoc +218 -0
- data/docs/lychee.toml +67 -0
- data/docs/reference/api/overview.adoc +188 -0
- data/docs/reference/cli/compress-command.adoc +114 -0
- data/docs/reference/cli/overview.adoc +140 -0
- data/docs/reference/index.adoc +26 -0
- data/docs/resources/faq.adoc +185 -0
- data/docs/resources/quick-reference.adoc +222 -0
- data/docs/troubleshooting/index.adoc +208 -0
- data/examples/api_comparison.rb +205 -0
- data/examples/deflate64_example.rb +96 -0
- data/examples/par2_demo.rb +121 -0
- data/examples/quick_start_native.rb +150 -0
- data/examples/quick_start_rubyzip.rb +115 -0
- data/examples/rubyzip_compatibility_demo.rb +194 -0
- data/exe/omnizip +27 -0
- data/lib/omnizip/algorithm.rb +130 -0
- data/lib/omnizip/algorithm_registry.rb +86 -0
- data/lib/omnizip/algorithms/.keep +0 -0
- data/lib/omnizip/algorithms/bzip2/bwt.rb +225 -0
- data/lib/omnizip/algorithms/bzip2/decoder.rb +193 -0
- data/lib/omnizip/algorithms/bzip2/encoder.rb +237 -0
- data/lib/omnizip/algorithms/bzip2/huffman.rb +206 -0
- data/lib/omnizip/algorithms/bzip2/mtf.rb +101 -0
- data/lib/omnizip/algorithms/bzip2/rle.rb +151 -0
- data/lib/omnizip/algorithms/bzip2.rb +130 -0
- data/lib/omnizip/algorithms/deflate/constants.rb +28 -0
- data/lib/omnizip/algorithms/deflate/decoder.rb +38 -0
- data/lib/omnizip/algorithms/deflate/encoder.rb +46 -0
- data/lib/omnizip/algorithms/deflate.rb +128 -0
- data/lib/omnizip/algorithms/deflate64/constants.rb +45 -0
- data/lib/omnizip/algorithms/deflate64/decoder.rb +153 -0
- data/lib/omnizip/algorithms/deflate64/encoder.rb +98 -0
- data/lib/omnizip/algorithms/deflate64/huffman_coder.rb +354 -0
- data/lib/omnizip/algorithms/deflate64/lz77_encoder.rb +142 -0
- data/lib/omnizip/algorithms/deflate64.rb +109 -0
- data/lib/omnizip/algorithms/lzma/bit_model.rb +120 -0
- data/lib/omnizip/algorithms/lzma/constants.rb +112 -0
- data/lib/omnizip/algorithms/lzma/decoder.rb +148 -0
- data/lib/omnizip/algorithms/lzma/dictionary.rb +69 -0
- data/lib/omnizip/algorithms/lzma/distance_coder.rb +415 -0
- data/lib/omnizip/algorithms/lzma/encoder.rb +142 -0
- data/lib/omnizip/algorithms/lzma/length_coder.rb +260 -0
- data/lib/omnizip/algorithms/lzma/literal_decoder.rb +320 -0
- data/lib/omnizip/algorithms/lzma/literal_encoder.rb +210 -0
- data/lib/omnizip/algorithms/lzma/lzip_decoder.rb +341 -0
- data/lib/omnizip/algorithms/lzma/lzma_alone_decoder.rb +192 -0
- data/lib/omnizip/algorithms/lzma/lzma_state.rb +128 -0
- data/lib/omnizip/algorithms/lzma/match.rb +32 -0
- data/lib/omnizip/algorithms/lzma/match_finder.rb +205 -0
- data/lib/omnizip/algorithms/lzma/match_finder_config.rb +142 -0
- data/lib/omnizip/algorithms/lzma/match_finder_factory.rb +88 -0
- data/lib/omnizip/algorithms/lzma/optimal_encoder.rb +130 -0
- data/lib/omnizip/algorithms/lzma/probability_models.rb +72 -0
- data/lib/omnizip/algorithms/lzma/range_coder.rb +85 -0
- data/lib/omnizip/algorithms/lzma/range_decoder.rb +434 -0
- data/lib/omnizip/algorithms/lzma/range_encoder.rb +194 -0
- data/lib/omnizip/algorithms/lzma/state.rb +127 -0
- data/lib/omnizip/algorithms/lzma/xz_buffered_range_encoder.rb +325 -0
- data/lib/omnizip/algorithms/lzma/xz_encoder.rb +426 -0
- data/lib/omnizip/algorithms/lzma/xz_encoder_fast.rb +645 -0
- data/lib/omnizip/algorithms/lzma/xz_match_finder_adapter.rb +227 -0
- data/lib/omnizip/algorithms/lzma/xz_price_calculator.rb +169 -0
- data/lib/omnizip/algorithms/lzma/xz_probability_models.rb +261 -0
- data/lib/omnizip/algorithms/lzma/xz_range_encoder.rb +223 -0
- data/lib/omnizip/algorithms/lzma/xz_range_encoder_exact.rb +331 -0
- data/lib/omnizip/algorithms/lzma/xz_state.rb +116 -0
- data/lib/omnizip/algorithms/lzma/xz_utils_decoder.rb +2055 -0
- data/lib/omnizip/algorithms/lzma.rb +238 -0
- data/lib/omnizip/algorithms/lzma2/chunk_manager.rb +182 -0
- data/lib/omnizip/algorithms/lzma2/constants.rb +41 -0
- data/lib/omnizip/algorithms/lzma2/encoder.rb +147 -0
- data/lib/omnizip/algorithms/lzma2/lzma2_chunk.rb +161 -0
- data/lib/omnizip/algorithms/lzma2/properties.rb +179 -0
- data/lib/omnizip/algorithms/lzma2/simple_lzma2_encoder.rb +127 -0
- data/lib/omnizip/algorithms/lzma2/xz_encoder_adapter.rb +85 -0
- data/lib/omnizip/algorithms/lzma2.rb +141 -0
- data/lib/omnizip/algorithms/ppmd7/constants.rb +74 -0
- data/lib/omnizip/algorithms/ppmd7/context.rb +154 -0
- data/lib/omnizip/algorithms/ppmd7/decoder.rb +126 -0
- data/lib/omnizip/algorithms/ppmd7/encoder.rb +163 -0
- data/lib/omnizip/algorithms/ppmd7/model.rb +248 -0
- data/lib/omnizip/algorithms/ppmd7/symbol_state.rb +57 -0
- data/lib/omnizip/algorithms/ppmd7.rb +116 -0
- data/lib/omnizip/algorithms/ppmd8/constants.rb +61 -0
- data/lib/omnizip/algorithms/ppmd8/context.rb +34 -0
- data/lib/omnizip/algorithms/ppmd8/decoder.rb +107 -0
- data/lib/omnizip/algorithms/ppmd8/encoder.rb +138 -0
- data/lib/omnizip/algorithms/ppmd8/model.rb +250 -0
- data/lib/omnizip/algorithms/ppmd8/restoration_method.rb +78 -0
- data/lib/omnizip/algorithms/ppmd8.rb +82 -0
- data/lib/omnizip/algorithms/ppmd_base.rb +138 -0
- data/lib/omnizip/algorithms/sevenzip_lzma2.rb +123 -0
- data/lib/omnizip/algorithms/xz_lzma2.rb +118 -0
- data/lib/omnizip/algorithms/zstandard/constants.rb +25 -0
- data/lib/omnizip/algorithms/zstandard/decoder.rb +46 -0
- data/lib/omnizip/algorithms/zstandard/encoder.rb +51 -0
- data/lib/omnizip/algorithms/zstandard.rb +138 -0
- data/lib/omnizip/buffer/memory_archive.rb +251 -0
- data/lib/omnizip/buffer/memory_extractor.rb +224 -0
- data/lib/omnizip/buffer.rb +176 -0
- data/lib/omnizip/checksum_registry.rb +114 -0
- data/lib/omnizip/checksums/crc32.rb +100 -0
- data/lib/omnizip/checksums/crc64.rb +101 -0
- data/lib/omnizip/checksums/crc_base.rb +158 -0
- data/lib/omnizip/checksums/verifier.rb +131 -0
- data/lib/omnizip/chunked/memory_manager.rb +194 -0
- data/lib/omnizip/chunked/reader.rb +78 -0
- data/lib/omnizip/chunked/writer.rb +120 -0
- data/lib/omnizip/chunked.rb +129 -0
- data/lib/omnizip/cli/output_formatter.rb +104 -0
- data/lib/omnizip/cli.rb +572 -0
- data/lib/omnizip/commands/.keep +0 -0
- data/lib/omnizip/commands/archive_create_command.rb +427 -0
- data/lib/omnizip/commands/archive_extract_command.rb +272 -0
- data/lib/omnizip/commands/archive_list_command.rb +218 -0
- data/lib/omnizip/commands/archive_repair_command.rb +131 -0
- data/lib/omnizip/commands/archive_verify_command.rb +117 -0
- data/lib/omnizip/commands/compress_command.rb +117 -0
- data/lib/omnizip/commands/decompress_command.rb +120 -0
- data/lib/omnizip/commands/list_command.rb +53 -0
- data/lib/omnizip/commands/metadata_command.rb +153 -0
- data/lib/omnizip/commands/parity_create_command.rb +122 -0
- data/lib/omnizip/commands/parity_repair_command.rb +122 -0
- data/lib/omnizip/commands/parity_verify_command.rb +124 -0
- data/lib/omnizip/commands/profile_list_command.rb +56 -0
- data/lib/omnizip/commands/profile_show_command.rb +44 -0
- data/lib/omnizip/convenience.rb +359 -0
- data/lib/omnizip/converter/conversion_registry.rb +49 -0
- data/lib/omnizip/converter/conversion_strategy.rb +121 -0
- data/lib/omnizip/converter/seven_zip_to_zip_strategy.rb +97 -0
- data/lib/omnizip/converter/zip_to_seven_zip_strategy.rb +112 -0
- data/lib/omnizip/converter.rb +105 -0
- data/lib/omnizip/crypto/aes256/cipher.rb +100 -0
- data/lib/omnizip/crypto/aes256/constants.rb +28 -0
- data/lib/omnizip/crypto/aes256/key_derivation.rb +101 -0
- data/lib/omnizip/crypto/aes256.rb +102 -0
- data/lib/omnizip/error.rb +106 -0
- data/lib/omnizip/eta/exponential_smoothing_estimator.rb +98 -0
- data/lib/omnizip/eta/moving_average_estimator.rb +99 -0
- data/lib/omnizip/eta/rate_calculator.rb +104 -0
- data/lib/omnizip/eta/sample_history.rb +143 -0
- data/lib/omnizip/eta/time_estimator.rb +106 -0
- data/lib/omnizip/eta.rb +63 -0
- data/lib/omnizip/extraction/filter_chain.rb +177 -0
- data/lib/omnizip/extraction/glob_pattern.rb +140 -0
- data/lib/omnizip/extraction/pattern_matcher.rb +70 -0
- data/lib/omnizip/extraction/predicate_pattern.rb +52 -0
- data/lib/omnizip/extraction/regex_pattern.rb +50 -0
- data/lib/omnizip/extraction/selective_extractor.rb +240 -0
- data/lib/omnizip/extraction.rb +111 -0
- data/lib/omnizip/file_type/mime_classifier.rb +144 -0
- data/lib/omnizip/file_type.rb +113 -0
- data/lib/omnizip/filter.rb +139 -0
- data/lib/omnizip/filter_pipeline.rb +108 -0
- data/lib/omnizip/filter_registry.rb +166 -0
- data/lib/omnizip/filters/bcj.rb +279 -0
- data/lib/omnizip/filters/bcj2/constants.rb +53 -0
- data/lib/omnizip/filters/bcj2/decoder.rb +200 -0
- data/lib/omnizip/filters/bcj2/encoder.rb +61 -0
- data/lib/omnizip/filters/bcj2/stream_data.rb +93 -0
- data/lib/omnizip/filters/bcj2.rb +99 -0
- data/lib/omnizip/filters/bcj_arm.rb +176 -0
- data/lib/omnizip/filters/bcj_arm64.rb +244 -0
- data/lib/omnizip/filters/bcj_ia64.rb +196 -0
- data/lib/omnizip/filters/bcj_ppc.rb +190 -0
- data/lib/omnizip/filters/bcj_sparc.rb +176 -0
- data/lib/omnizip/filters/bcj_x86.rb +193 -0
- data/lib/omnizip/filters/delta.rb +196 -0
- data/lib/omnizip/filters/filter_base.rb +72 -0
- data/lib/omnizip/filters/registry.rb +123 -0
- data/lib/omnizip/filters/xz_delta.rb +258 -0
- data/lib/omnizip/format_detector.rb +162 -0
- data/lib/omnizip/format_registry.rb +59 -0
- data/lib/omnizip/formats/.keep +0 -0
- data/lib/omnizip/formats/bzip2_file.rb +172 -0
- data/lib/omnizip/formats/cpio/constants.rb +55 -0
- data/lib/omnizip/formats/cpio/entry.rb +385 -0
- data/lib/omnizip/formats/cpio/reader.rb +196 -0
- data/lib/omnizip/formats/cpio/writer.rb +234 -0
- data/lib/omnizip/formats/cpio.rb +140 -0
- data/lib/omnizip/formats/format_spec_loader.rb +230 -0
- data/lib/omnizip/formats/gzip.rb +238 -0
- data/lib/omnizip/formats/iso/directory_builder.rb +297 -0
- data/lib/omnizip/formats/iso/directory_record.rb +152 -0
- data/lib/omnizip/formats/iso/joliet.rb +204 -0
- data/lib/omnizip/formats/iso/path_table.rb +125 -0
- data/lib/omnizip/formats/iso/reader.rb +197 -0
- data/lib/omnizip/formats/iso/rock_ridge.rb +349 -0
- data/lib/omnizip/formats/iso/volume_builder.rb +320 -0
- data/lib/omnizip/formats/iso/volume_descriptor.rb +168 -0
- data/lib/omnizip/formats/iso/writer.rb +530 -0
- data/lib/omnizip/formats/iso.rb +140 -0
- data/lib/omnizip/formats/lzip.rb +175 -0
- data/lib/omnizip/formats/lzma_alone.rb +171 -0
- data/lib/omnizip/formats/rar/archive_repairer.rb +243 -0
- data/lib/omnizip/formats/rar/archive_verifier.rb +195 -0
- data/lib/omnizip/formats/rar/block_parser.rb +243 -0
- data/lib/omnizip/formats/rar/compression/bit_stream.rb +180 -0
- data/lib/omnizip/formats/rar/compression/dispatcher.rb +217 -0
- data/lib/omnizip/formats/rar/compression/lz77_huffman/decoder.rb +216 -0
- data/lib/omnizip/formats/rar/compression/lz77_huffman/encoder.rb +158 -0
- data/lib/omnizip/formats/rar/compression/lz77_huffman/huffman_builder.rb +217 -0
- data/lib/omnizip/formats/rar/compression/lz77_huffman/huffman_coder.rb +189 -0
- data/lib/omnizip/formats/rar/compression/lz77_huffman/match_finder.rb +135 -0
- data/lib/omnizip/formats/rar/compression/lz77_huffman/sliding_window.rb +165 -0
- data/lib/omnizip/formats/rar/compression/ppmd/context.rb +105 -0
- data/lib/omnizip/formats/rar/compression/ppmd/decoder.rb +219 -0
- data/lib/omnizip/formats/rar/compression/ppmd/encoder.rb +262 -0
- data/lib/omnizip/formats/rar/compression_method_registry.rb +106 -0
- data/lib/omnizip/formats/rar/constants.rb +82 -0
- data/lib/omnizip/formats/rar/decompressor.rb +238 -0
- data/lib/omnizip/formats/rar/external_writer.rb +312 -0
- data/lib/omnizip/formats/rar/header.rb +192 -0
- data/lib/omnizip/formats/rar/license_validator.rb +109 -0
- data/lib/omnizip/formats/rar/models/rar_archive.rb +77 -0
- data/lib/omnizip/formats/rar/models/rar_entry.rb +65 -0
- data/lib/omnizip/formats/rar/models/rar_volume.rb +56 -0
- data/lib/omnizip/formats/rar/parity_handler.rb +292 -0
- data/lib/omnizip/formats/rar/rar5/compression/lzma.rb +202 -0
- data/lib/omnizip/formats/rar/rar5/compression/lzss.rb +578 -0
- data/lib/omnizip/formats/rar/rar5/compression/store.rb +60 -0
- data/lib/omnizip/formats/rar/rar5/crc32.rb +39 -0
- data/lib/omnizip/formats/rar/rar5/encryption/aes256_cbc.rb +97 -0
- data/lib/omnizip/formats/rar/rar5/encryption/encryption_header.rb +114 -0
- data/lib/omnizip/formats/rar/rar5/encryption/encryption_manager.rb +166 -0
- data/lib/omnizip/formats/rar/rar5/encryption/key_derivation.rb +97 -0
- data/lib/omnizip/formats/rar/rar5/header.rb +187 -0
- data/lib/omnizip/formats/rar/rar5/models/encryption_options.rb +74 -0
- data/lib/omnizip/formats/rar/rar5/models/recovery_options.rb +63 -0
- data/lib/omnizip/formats/rar/rar5/models/solid_options.rb +63 -0
- data/lib/omnizip/formats/rar/rar5/models/volume_options.rb +74 -0
- data/lib/omnizip/formats/rar/rar5/multi_volume/ARCHITECTURE.md +290 -0
- data/lib/omnizip/formats/rar/rar5/multi_volume/volume_manager.rb +264 -0
- data/lib/omnizip/formats/rar/rar5/multi_volume/volume_splitter.rb +155 -0
- data/lib/omnizip/formats/rar/rar5/multi_volume/volume_writer.rb +194 -0
- data/lib/omnizip/formats/rar/rar5/solid/solid_encoder.rb +109 -0
- data/lib/omnizip/formats/rar/rar5/solid/solid_manager.rb +142 -0
- data/lib/omnizip/formats/rar/rar5/solid/solid_stream.rb +121 -0
- data/lib/omnizip/formats/rar/rar5/vint.rb +65 -0
- data/lib/omnizip/formats/rar/rar5/writer.rb +466 -0
- data/lib/omnizip/formats/rar/rar_format_base.rb +241 -0
- data/lib/omnizip/formats/rar/reader.rb +366 -0
- data/lib/omnizip/formats/rar/recovery_record.rb +245 -0
- data/lib/omnizip/formats/rar/volume_manager.rb +168 -0
- data/lib/omnizip/formats/rar/writer.rb +431 -0
- data/lib/omnizip/formats/rar.rb +205 -0
- data/lib/omnizip/formats/rar3/compressor.rb +73 -0
- data/lib/omnizip/formats/rar3/decompressor.rb +66 -0
- data/lib/omnizip/formats/rar3/reader.rb +386 -0
- data/lib/omnizip/formats/rar3/writer.rb +219 -0
- data/lib/omnizip/formats/rar5/compressor.rb +73 -0
- data/lib/omnizip/formats/rar5/decompressor.rb +66 -0
- data/lib/omnizip/formats/rar5/reader.rb +342 -0
- data/lib/omnizip/formats/rar5/writer.rb +214 -0
- data/lib/omnizip/formats/seven_zip/coder_chain.rb +150 -0
- data/lib/omnizip/formats/seven_zip/constants.rb +126 -0
- data/lib/omnizip/formats/seven_zip/encoded_header.rb +114 -0
- data/lib/omnizip/formats/seven_zip/encrypted_header.rb +142 -0
- data/lib/omnizip/formats/seven_zip/file_collector.rb +144 -0
- data/lib/omnizip/formats/seven_zip/header.rb +106 -0
- data/lib/omnizip/formats/seven_zip/header_encryptor.rb +134 -0
- data/lib/omnizip/formats/seven_zip/header_writer.rb +466 -0
- data/lib/omnizip/formats/seven_zip/models/coder_info.rb +30 -0
- data/lib/omnizip/formats/seven_zip/models/file_entry.rb +58 -0
- data/lib/omnizip/formats/seven_zip/models/folder.rb +69 -0
- data/lib/omnizip/formats/seven_zip/models/stream_info.rb +42 -0
- data/lib/omnizip/formats/seven_zip/parser.rb +660 -0
- data/lib/omnizip/formats/seven_zip/reader.rb +458 -0
- data/lib/omnizip/formats/seven_zip/split_archive_reader.rb +632 -0
- data/lib/omnizip/formats/seven_zip/split_archive_writer.rb +315 -0
- data/lib/omnizip/formats/seven_zip/stream_compressor.rb +151 -0
- data/lib/omnizip/formats/seven_zip/stream_decompressor.rb +162 -0
- data/lib/omnizip/formats/seven_zip/writer.rb +740 -0
- data/lib/omnizip/formats/seven_zip.rb +93 -0
- data/lib/omnizip/formats/tar/constants.rb +73 -0
- data/lib/omnizip/formats/tar/entry.rb +94 -0
- data/lib/omnizip/formats/tar/header.rb +168 -0
- data/lib/omnizip/formats/tar/reader.rb +121 -0
- data/lib/omnizip/formats/tar/writer.rb +216 -0
- data/lib/omnizip/formats/tar.rb +84 -0
- data/lib/omnizip/formats/xz/reader.rb +116 -0
- data/lib/omnizip/formats/xz.rb +237 -0
- data/lib/omnizip/formats/xz_impl/block_decoder.rb +754 -0
- data/lib/omnizip/formats/xz_impl/block_encoder.rb +306 -0
- data/lib/omnizip/formats/xz_impl/block_header.rb +210 -0
- data/lib/omnizip/formats/xz_impl/block_header_parser.rb +186 -0
- data/lib/omnizip/formats/xz_impl/constants.rb +49 -0
- data/lib/omnizip/formats/xz_impl/index_decoder.rb +174 -0
- data/lib/omnizip/formats/xz_impl/index_encoder.rb +122 -0
- data/lib/omnizip/formats/xz_impl/stream_decoder.rb +468 -0
- data/lib/omnizip/formats/xz_impl/stream_encoder.rb +99 -0
- data/lib/omnizip/formats/xz_impl/stream_footer.rb +81 -0
- data/lib/omnizip/formats/xz_impl/stream_footer_parser.rb +117 -0
- data/lib/omnizip/formats/xz_impl/stream_header.rb +55 -0
- data/lib/omnizip/formats/xz_impl/stream_header_parser.rb +108 -0
- data/lib/omnizip/formats/xz_impl/vli.rb +128 -0
- data/lib/omnizip/formats/xz_impl/writer.rb +421 -0
- data/lib/omnizip/formats/zip/central_directory_header.rb +195 -0
- data/lib/omnizip/formats/zip/constants.rb +69 -0
- data/lib/omnizip/formats/zip/end_of_central_directory.rb +133 -0
- data/lib/omnizip/formats/zip/local_file_header.rb +138 -0
- data/lib/omnizip/formats/zip/reader.rb +250 -0
- data/lib/omnizip/formats/zip/unix_extra_field.rb +153 -0
- data/lib/omnizip/formats/zip/writer.rb +375 -0
- data/lib/omnizip/formats/zip/zip64_end_of_central_directory.rb +104 -0
- data/lib/omnizip/formats/zip/zip64_end_of_central_directory_locator.rb +66 -0
- data/lib/omnizip/formats/zip/zip64_extra_field.rb +114 -0
- data/lib/omnizip/formats/zip.rb +50 -0
- data/lib/omnizip/implementations/base/lzma2_decoder_base.rb +75 -0
- data/lib/omnizip/implementations/base/lzma2_encoder_base.rb +128 -0
- data/lib/omnizip/implementations/base/lzma_decoder_base.rb +83 -0
- data/lib/omnizip/implementations/base/lzma_encoder_base.rb +108 -0
- data/lib/omnizip/implementations/base/state_machine_base.rb +182 -0
- data/lib/omnizip/implementations/seven_zip/lzma/decoder.rb +421 -0
- data/lib/omnizip/implementations/seven_zip/lzma/encoder.rb +465 -0
- data/lib/omnizip/implementations/seven_zip/lzma/match_finder.rb +288 -0
- data/lib/omnizip/implementations/seven_zip/lzma/range_decoder.rb +200 -0
- data/lib/omnizip/implementations/seven_zip/lzma/range_encoder.rb +197 -0
- data/lib/omnizip/implementations/seven_zip/lzma/state_machine.rb +141 -0
- data/lib/omnizip/implementations/seven_zip/lzma2/encoder.rb +519 -0
- data/lib/omnizip/implementations/xz_utils/lzma2/decoder.rb +723 -0
- data/lib/omnizip/implementations/xz_utils/lzma2/encoder.rb +750 -0
- data/lib/omnizip/io/buffered_input.rb +146 -0
- data/lib/omnizip/io/buffered_output.rb +105 -0
- data/lib/omnizip/io/stream_manager.rb +115 -0
- data/lib/omnizip/link_handler/hard_link.rb +79 -0
- data/lib/omnizip/link_handler/symbolic_link.rb +74 -0
- data/lib/omnizip/link_handler.rb +124 -0
- data/lib/omnizip/metadata/archive_metadata.rb +114 -0
- data/lib/omnizip/metadata/entry_metadata.rb +146 -0
- data/lib/omnizip/metadata/metadata_editor.rb +171 -0
- data/lib/omnizip/metadata/metadata_registry.rb +64 -0
- data/lib/omnizip/metadata/metadata_validator.rb +99 -0
- data/lib/omnizip/metadata.rb +57 -0
- data/lib/omnizip/models/.keep +0 -0
- data/lib/omnizip/models/algorithm_metadata.rb +73 -0
- data/lib/omnizip/models/compression_options.rb +71 -0
- data/lib/omnizip/models/conversion_options.rb +87 -0
- data/lib/omnizip/models/conversion_result.rb +135 -0
- data/lib/omnizip/models/eta_result.rb +46 -0
- data/lib/omnizip/models/extraction_rule.rb +115 -0
- data/lib/omnizip/models/filter_chain.rb +144 -0
- data/lib/omnizip/models/filter_config.rb +183 -0
- data/lib/omnizip/models/match_result.rb +124 -0
- data/lib/omnizip/models/optimization_suggestion.rb +91 -0
- data/lib/omnizip/models/parallel_options.rb +104 -0
- data/lib/omnizip/models/performance_result.rb +79 -0
- data/lib/omnizip/models/profile_report.rb +82 -0
- data/lib/omnizip/models/progress_options.rb +38 -0
- data/lib/omnizip/models/split_options.rb +116 -0
- data/lib/omnizip/optimization_registry.rb +81 -0
- data/lib/omnizip/parallel/job_queue.rb +209 -0
- data/lib/omnizip/parallel/job_scheduler.rb +203 -0
- data/lib/omnizip/parallel/parallel_compressor.rb +347 -0
- data/lib/omnizip/parallel/parallel_extractor.rb +329 -0
- data/lib/omnizip/parallel/worker_pool.rb +223 -0
- data/lib/omnizip/parallel.rb +149 -0
- data/lib/omnizip/parity/chunked_block_processor.rb +196 -0
- data/lib/omnizip/parity/galois16.rb +145 -0
- data/lib/omnizip/parity/models/creator_packet.rb +73 -0
- data/lib/omnizip/parity/models/file_description_packet.rb +133 -0
- data/lib/omnizip/parity/models/ifsc_packet.rb +123 -0
- data/lib/omnizip/parity/models/main_packet.rb +128 -0
- data/lib/omnizip/parity/models/packet.rb +156 -0
- data/lib/omnizip/parity/models/packet_registry.rb +109 -0
- data/lib/omnizip/parity/models/recovery_slice_packet.rb +78 -0
- data/lib/omnizip/parity/par2_creator.rb +531 -0
- data/lib/omnizip/parity/par2_repairer.rb +407 -0
- data/lib/omnizip/parity/par2_verifier.rb +364 -0
- data/lib/omnizip/parity/par2cmdline_algorithm.rb +110 -0
- data/lib/omnizip/parity/par2cmdline_coefficients.rb +78 -0
- data/lib/omnizip/parity/reed_solomon_decoder.rb +266 -0
- data/lib/omnizip/parity/reed_solomon_encoder.rb +111 -0
- data/lib/omnizip/parity/reed_solomon_matrix.rb +342 -0
- data/lib/omnizip/parity.rb +186 -0
- data/lib/omnizip/password/encryption_registry.rb +65 -0
- data/lib/omnizip/password/encryption_strategy.rb +96 -0
- data/lib/omnizip/password/password_validator.rb +129 -0
- data/lib/omnizip/password/winzip_aes_strategy.rb +192 -0
- data/lib/omnizip/password/zip_crypto_strategy.rb +141 -0
- data/lib/omnizip/password.rb +87 -0
- data/lib/omnizip/pipe/stream_compressor.rb +124 -0
- data/lib/omnizip/pipe/stream_decompressor.rb +174 -0
- data/lib/omnizip/pipe.rb +121 -0
- data/lib/omnizip/platform/ntfs_streams.rb +201 -0
- data/lib/omnizip/platform.rb +189 -0
- data/lib/omnizip/profile/archive_profile.rb +39 -0
- data/lib/omnizip/profile/balanced_profile.rb +33 -0
- data/lib/omnizip/profile/binary_profile.rb +36 -0
- data/lib/omnizip/profile/compression_profile.rb +158 -0
- data/lib/omnizip/profile/custom_profile.rb +157 -0
- data/lib/omnizip/profile/fast_profile.rb +33 -0
- data/lib/omnizip/profile/maximum_profile.rb +33 -0
- data/lib/omnizip/profile/profile_detector.rb +110 -0
- data/lib/omnizip/profile/profile_registry.rb +161 -0
- data/lib/omnizip/profile/text_profile.rb +36 -0
- data/lib/omnizip/profile.rb +190 -0
- data/lib/omnizip/profiler/memory_profiler.rb +66 -0
- data/lib/omnizip/profiler/method_profiler.rb +49 -0
- data/lib/omnizip/profiler/report_generator.rb +169 -0
- data/lib/omnizip/profiler.rb +204 -0
- data/lib/omnizip/progress/callback_reporter.rb +36 -0
- data/lib/omnizip/progress/console_reporter.rb +62 -0
- data/lib/omnizip/progress/log_reporter.rb +91 -0
- data/lib/omnizip/progress/operation_progress.rb +118 -0
- data/lib/omnizip/progress/progress_bar.rb +156 -0
- data/lib/omnizip/progress/progress_reporter.rb +40 -0
- data/lib/omnizip/progress/progress_tracker.rb +190 -0
- data/lib/omnizip/progress/silent_reporter.rb +24 -0
- data/lib/omnizip/progress.rb +127 -0
- data/lib/omnizip/rubyzip_compat.rb +63 -0
- data/lib/omnizip/temp/safe_extract.rb +168 -0
- data/lib/omnizip/temp/temp_file.rb +124 -0
- data/lib/omnizip/temp/temp_file_pool.rb +109 -0
- data/lib/omnizip/temp.rb +181 -0
- data/lib/omnizip/version.rb +5 -0
- data/lib/omnizip/zip/entry.rb +156 -0
- data/lib/omnizip/zip/file.rb +485 -0
- data/lib/omnizip/zip/input_stream.rb +273 -0
- data/lib/omnizip/zip/output_stream.rb +324 -0
- data/lib/omnizip.rb +156 -0
- data/readme-docs/advanced-features.adoc +515 -0
- data/readme-docs/api-usage.adoc +444 -0
- data/readme-docs/architecture.adoc +449 -0
- data/readme-docs/archive-formats.adoc +479 -0
- data/readme-docs/cli-usage.adoc +222 -0
- data/readme-docs/compression-algorithms.adoc +442 -0
- data/readme-docs/compression-profiles.adoc +247 -0
- data/readme-docs/encryption-checksums.adoc +328 -0
- data/readme-docs/format-converter.adoc +325 -0
- data/readme-docs/installation.adoc +228 -0
- data/readme-docs/par2-archives.adoc +608 -0
- data/readme-docs/performance-profiler.adoc +389 -0
- data/readme-docs/preprocessing-filters.adoc +280 -0
- data/xz-file-format-1.2.1.txt +1174 -0
- metadata +617 -0
|
@@ -0,0 +1,407 @@
|
|
|
1
|
+
# frozen_string_literal: true
|
|
2
|
+
|
|
3
|
+
require "digest"
|
|
4
|
+
require "fileutils"
|
|
5
|
+
require_relative "par2_verifier"
|
|
6
|
+
require_relative "reed_solomon_matrix"
|
|
7
|
+
require_relative "chunked_block_processor"
|
|
8
|
+
|
|
9
|
+
module Omnizip
|
|
10
|
+
module Parity
|
|
11
|
+
# PAR2 archive repairer
|
|
12
|
+
#
|
|
13
|
+
# Repairs damaged or missing files using PAR2 recovery blocks
|
|
14
|
+
# and Reed-Solomon error correction.
|
|
15
|
+
#
|
|
16
|
+
# @example Repair damaged files
|
|
17
|
+
# repairer = Par2Repairer.new('backup.par2')
|
|
18
|
+
# result = repairer.repair
|
|
19
|
+
# puts "Repaired #{result.recovered_blocks} blocks"
|
|
20
|
+
class Par2Repairer
|
|
21
|
+
# Repair result
|
|
22
|
+
RepairResult = Struct.new(
  :success,          # Repair successful?
  :recovered_files,  # Array of recovered file names
  :recovered_blocks, # Number of blocks recovered
  :unrecoverable,    # Array of unrecoverable file names
  :error_message,    # Error message if failed
  keyword_init: true,
) do
  # Check if repair was successful
  #
  # @return [Boolean] the value stored in +success+
  def success?
    success
  end

  # Check if any files remain unrecoverable
  #
  # Members omitted at construction are nil (keyword_init Struct), so the
  # list is coerced with Array() first; a result built without an
  # +unrecoverable+ list reports false instead of raising NoMethodError.
  #
  # @return [Boolean] true if some files couldn't be recovered
  def has_unrecoverable?
    !Array(unrecoverable).empty?
  end
end
|
|
44
|
+
|
|
45
|
+
# @return [String] Path to PAR2 index file
|
|
46
|
+
attr_reader :par2_file
|
|
47
|
+
|
|
48
|
+
# @return [Par2Verifier] Verifier instance
|
|
49
|
+
attr_reader :verifier
|
|
50
|
+
|
|
51
|
+
# @return [Proc, nil] Progress callback
|
|
52
|
+
attr_reader :progress_callback
|
|
53
|
+
|
|
54
|
+
# Initialize repairer
|
|
55
|
+
#
|
|
56
|
+
# @param par2_file [String] Path to .par2 index file
|
|
57
|
+
# @param progress [Proc, nil] Progress callback
|
|
58
|
+
# @raise [ArgumentError] if file doesn't exist
|
|
59
|
+
def initialize(par2_file, progress: nil)
  # Fail fast, before any state is assigned, when the index file is absent.
  unless File.exist?(par2_file)
    raise ArgumentError, "PAR2 file not found: #{par2_file}"
  end

  @par2_file = par2_file
  @progress_callback = progress
  # The verifier is built from the same index file; repair delegates
  # damage detection to it.
  @verifier = Par2Verifier.new(par2_file)
end
|
|
67
|
+
|
|
68
|
+
# Repair damaged files
|
|
69
|
+
#
|
|
70
|
+
# @param output_dir [String, nil] Output directory (default: same as source)
|
|
71
|
+
# @return [RepairResult] Repair results
|
|
72
|
+
def repair(output_dir: nil)
  report_progress(0, "Verifying files")

  # Verification tells us which files are damaged or missing and whether
  # the available recovery data is enough to repair them.
  verification = @verifier.verify

  # Nothing to repair: report success without loading or writing anything.
  if verification.all_ok?
    return RepairResult.new(
      success: true,
      recovered_files: [],
      recovered_blocks: 0,
      unrecoverable: [],
      error_message: nil,
    )
  end

  # Builds the result for every failure path. No file is written before a
  # failure is returned, so damaged AND missing files are both reported as
  # unrecoverable, whichever step failed.
  failure = lambda do |message|
    RepairResult.new(
      success: false,
      recovered_files: [],
      recovered_blocks: 0,
      unrecoverable: verification.damaged_files + verification.missing_files,
      error_message: message,
    )
  end

  unless verification.repairable?
    return failure.call("Insufficient recovery blocks to repair damage")
  end

  report_progress(10, "Loading recovery blocks")

  data_blocks = load_data_blocks(verification)
  parity_blocks_by_exp = load_parity_blocks_by_exponent

  report_progress(30, "Calculating repairs")

  # Erasures are the indices of the damaged/missing data blocks.
  erasures = identify_erasures(verification)

  report_progress(50, "Recovering damaged blocks")

  # Any error raised while decoding is converted into a failed result
  # rather than propagated to the caller.
  begin
    recovered_data = perform_recovery(
      data_blocks,
      parity_blocks_by_exp,
      erasures,
      @verifier.metadata[:block_size],
    )
  rescue StandardError => e
    return failure.call("Recovery failed: #{e.message}")
  end

  # Keep intact blocks as loaded; substitute recovered data at each
  # erased position.
  repaired_blocks = data_blocks.each_with_index.map do |block, idx|
    erasures.include?(idx) ? recovered_data[idx] : block
  end

  report_progress(80, "Writing repaired files")

  recovered_files = write_recovered_files(
    repaired_blocks,
    erasures,
    output_dir,
  )

  report_progress(100, "Repair complete")

  RepairResult.new(
    success: true,
    recovered_files: recovered_files,
    recovered_blocks: erasures.size,
    unrecoverable: [],
    error_message: nil,
  )
end
|
|
157
|
+
|
|
158
|
+
private
|
|
159
|
+
|
|
160
|
+
# Load all data blocks from files
|
|
161
|
+
#
|
|
162
|
+
# @param verification [VerificationResult] Verification results
|
|
163
|
+
# @return [Array<String, nil>] Data blocks in file-list order (nil for every block of a damaged, missing, or unreadable file)
|
|
164
|
+
def load_data_blocks(verification)
  block_size = @verifier.metadata[:block_size]
  # The verifier exposes no reader for its file list, hence the ivar access.
  file_list = @verifier.instance_variable_get(:@file_list)

  damaged_files = verification.damaged_files
  missing_files = verification.missing_files

  file_list.each_with_object([]) do |file_info, blocks|
    filename = file_info[:filename]
    file_path = @verifier.send(:find_file_path, filename)

    # Content is only trusted when the file was not flagged by verification
    # and can actually be found on disk; corrupted data is never read.
    readable = !damaged_files.include?(filename) &&
               !missing_files.include?(filename) &&
               file_path && File.exist?(file_path)

    unless readable
      # Reserve one nil slot per expected block so later indices stay aligned
      # with the numbering used when erasures are identified.
      num_blocks = (file_info[:size].to_f / block_size).ceil
      blocks.concat([nil] * num_blocks)
      next
    end

    File.open(file_path, "rb") do |io|
      while (data = io.read(block_size))
        # Zero-pad a short final block up to the full block size.
        shortfall = block_size - data.bytesize
        data << ("\x00" * shortfall) if shortfall.positive?
        blocks << data
      end
    end
  end
end
|
|
210
|
+
|
|
211
|
+
# Load parity blocks indexed by exponent
|
|
212
|
+
#
|
|
213
|
+
# Returns one recovery block per exponent, keyed in the order exponents are first seen (not sorted).
|
|
214
|
+
# When several blocks share an exponent, only the first one is kept.
|
|
215
|
+
#
|
|
216
|
+
# @return [Hash] Map of exponent => recovery_block_data
|
|
217
|
+
def load_parity_blocks_by_exponent
  # Read straight from the verifier's @recovery_blocks instance variable.
  entries = @verifier.instance_variable_get(:@recovery_blocks)

  # First payload seen for an exponent wins; later duplicates are ignored.
  entries.each_with_object({}) do |entry, by_exponent|
    exponent = entry[:exponent]
    by_exponent[exponent] ||= entry[:data]
  end
end
|
|
230
|
+
|
|
231
|
+
# Identify erasure locations
|
|
232
|
+
#
|
|
233
|
+
# @param verification [VerificationResult] Verification results
|
|
234
|
+
# @return [Array<Integer>] Block indices that need recovery
|
|
235
|
+
def identify_erasures(verification)
  # The file list is read from the verifier's @file_list instance variable.
  files = @verifier.instance_variable_get(:@file_list)
  bytes_per_block = @verifier.metadata[:block_size]

  raise "Internal error: file_list not populated in verifier" if files.nil? || files.empty?

  # Blocks are numbered consecutively across files in file-list order.
  next_index = 0
  indices_by_name = files.each_with_object({}) do |entry, map|
    count = (entry[:size].to_f / bytes_per_block).ceil
    map[entry[:filename]] = (next_index...(next_index + count)).to_a
    next_index += count
  end

  # Every block of a damaged or missing file is an erasure; names that are
  # not in the file list contribute nothing.
  flagged = []
  verification.damaged_files.each do |name|
    indices = indices_by_name[name]
    flagged.concat(indices) if indices
  end
  verification.missing_files.each do |name|
    indices = indices_by_name[name]
    flagged.concat(indices) if indices
  end

  flagged.sort.uniq
end
|
|
273
|
+
|
|
274
|
+
# Write recovered files to disk
|
|
275
|
+
#
|
|
276
|
+
# @param recovered_blocks [Array<String>] Complete set of data blocks (recovered + original)
|
|
277
|
+
# @param erasures [Array<Integer>] Block indices that were recovered
|
|
278
|
+
# @param output_dir [String, nil] Output directory
|
|
279
|
+
# @return [Array<String>] Recovered file names
|
|
280
|
+
def write_recovered_files(recovered_blocks, erasures, output_dir)
  # Raises ArgumentError when a file name from the PAR2 set would resolve to
  # a path outside the output directory (e.g. via "../" components).
  output_dir ||= File.dirname(@par2_file)
  FileUtils.mkdir_p(output_dir)

  block_size = @verifier.metadata[:block_size]

  # Normalised output root, with a trailing separator so that "/out" does
  # not accidentally match "/outside".
  root = File.absolute_path(output_dir)
  root_prefix = root.end_with?(File::SEPARATOR) ? root : root + File::SEPARATOR

  # Hash lookup instead of intersecting arrays once per file.
  erased = erasures.each_with_object({}) { |idx, seen| seen[idx] = true }

  recovered_files = []
  block_idx = 0

  @verifier.instance_variable_get(:@file_list).each do |file_info|
    num_blocks = (file_info[:size].to_f / block_size).ceil
    first_block = block_idx
    # Advance up front so every early `next` keeps the numbering aligned.
    block_idx += num_blocks

    # Only files that had at least one erased block are rewritten.
    next unless (first_block...(first_block + num_blocks)).any? { |idx| erased.key?(idx) }

    # recovered_blocks holds ALL blocks (original + recovered). Skip the file
    # unless its complete, fully populated run of blocks is available.
    file_blocks = recovered_blocks[first_block, num_blocks]
    next unless file_blocks && file_blocks.size == num_blocks && file_blocks.all?

    output_path = File.join(output_dir, file_info[:filename])
    unless File.absolute_path(output_path).start_with?(root_prefix)
      raise ArgumentError,
            "Refusing to write outside output directory: #{file_info[:filename]}"
    end

    write_recovered_file(output_path, file_blocks, file_info[:size])
    recovered_files << file_info[:filename]
  end

  recovered_files
end
|
|
316
|
+
|
|
317
|
+
# Write single recovered file
|
|
318
|
+
#
|
|
319
|
+
# @param output_path [String] Output file path
|
|
320
|
+
# @param blocks [Array<String>] File blocks
|
|
321
|
+
# @param file_size [Integer] Original file size
|
|
322
|
+
def write_recovered_file(output_path, blocks, file_size)
  # The target may live in a sub-directory that does not exist yet.
  parent_dir = File.dirname(output_path)
  FileUtils.mkdir_p(parent_dir)

  File.open(output_path, "wb") do |out|
    blocks.each { |chunk| out.write(chunk) }

    # Resize to the recorded file size, which drops the final block's padding.
    out.truncate(file_size)
  end
end
|
|
334
|
+
|
|
335
|
+
# Perform Reed-Solomon recovery using chunked processing
|
|
336
|
+
#
|
|
337
|
+
# Implements par2cmdline's incremental approach:
|
|
338
|
+
# 1. Compute matrix coefficients once
|
|
339
|
+
# 2. Process data in chunks (memory-efficient)
|
|
340
|
+
# 3. Incrementally build recovered blocks
|
|
341
|
+
#
|
|
342
|
+
# @param data_blocks [Array<String, nil>] Data blocks (nil for missing/damaged)
|
|
343
|
+
# @param parity_blocks_by_exp [Hash] Map of exponent => parity_block
|
|
344
|
+
# @param erasures [Array<Integer>] Block indices to recover
|
|
345
|
+
# @param block_size [Integer] Block size in bytes
|
|
346
|
+
# @return [Hash<Integer, String>] Map of block_index => recovered_block
|
|
347
|
+
def perform_recovery(data_blocks, parity_blocks_by_exp, erasures,
                     block_size)
  # Raises RuntimeError when there are fewer distinct recovery exponents
  # than erased blocks.
  sorted_erasures = erasures.sort
  erased = sorted_erasures.each_with_object({}) { |idx, seen| seen[idx] = true }

  # Usable inputs: blocks we actually hold that are not marked for recovery.
  # Built in index order, so the keys are already ascending.
  present_blocks = {}
  data_blocks.each_with_index do |block, idx|
    present_blocks[idx] = block unless block.nil? || erased.key?(idx)
  end

  # One recovery block per erased block, lowest exponents first.
  recovery_exponents = parity_blocks_by_exp.keys.sort.take(sorted_erasures.size)

  # Fewer recovery blocks than erasures cannot be solved; fail with a clear
  # message instead of handing an undersized system to the matrix.
  if recovery_exponents.size < sorted_erasures.size
    raise "Insufficient recovery blocks: need #{sorted_erasures.size}, " \
          "have #{recovery_exponents.size}"
  end

  matrix = ReedSolomonMatrix.new(
    present_blocks.keys,
    sorted_erasures,
    recovery_exponents,
    data_blocks.size, # total_inputs
    block_size,
  )

  # Coefficients are computed once up front and reused by the processor.
  matrix.compute!

  # Hand the processor only the recovery blocks that were selected above.
  used_recovery_blocks = recovery_exponents.each_with_object({}) do |exp, used|
    used[exp] = parity_blocks_by_exp[exp]
  end

  processor = ChunkedBlockProcessor.new(
    matrix,
    present_blocks,
    used_recovery_blocks,
    sorted_erasures.dup, # separate array, as the matrix received its own
    block_size,
  )

  # Hash of block_index => recovered block data.
  processor.process_all
end
|
|
397
|
+
|
|
398
|
+
# Report progress if callback provided
|
|
399
|
+
#
|
|
400
|
+
# @param percent [Integer] Completion percentage
|
|
401
|
+
# @param message [String] Progress message
|
|
402
|
+
def report_progress(percent, message)
  # Progress reporting is optional: with no callback configured this is a no-op.
  callback = @progress_callback
  return if callback.nil?

  callback.call(percent, message)
end
|
|
405
|
+
end
|
|
406
|
+
end
|
|
407
|
+
end
|