react-native-quick-crypto 1.0.19 → 1.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/QuickCrypto.podspec +12 -38
- package/README.md +2 -0
- package/android/CMakeLists.txt +3 -0
- package/cpp/utils/HybridUtils.cpp +39 -77
- package/deps/simdutf/.clang-format +4 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/bug_report.md +62 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/config.yml +1 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/feature_request.md +35 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/standard-issue-template.md +29 -0
- package/deps/simdutf/.github/pull_request_template.md +51 -0
- package/deps/simdutf/.github/workflows/aarch64.yml +39 -0
- package/deps/simdutf/.github/workflows/alpine.yml +27 -0
- package/deps/simdutf/.github/workflows/amalgamation_demos.yml +34 -0
- package/deps/simdutf/.github/workflows/armv7.yml +32 -0
- package/deps/simdutf/.github/workflows/atomic_fuzz.yml +25 -0
- package/deps/simdutf/.github/workflows/cifuzz.yml +37 -0
- package/deps/simdutf/.github/workflows/clangformat.yml +36 -0
- package/deps/simdutf/.github/workflows/debian-latestcxxstandards.yml +40 -0
- package/deps/simdutf/.github/workflows/debian.yml +33 -0
- package/deps/simdutf/.github/workflows/documentation.yml +36 -0
- package/deps/simdutf/.github/workflows/emscripten.yml +19 -0
- package/deps/simdutf/.github/workflows/loongarch64-gcc-14.2.yml +39 -0
- package/deps/simdutf/.github/workflows/macos-latest.yml +29 -0
- package/deps/simdutf/.github/workflows/msys2-clang.yml +48 -0
- package/deps/simdutf/.github/workflows/msys2.yml +50 -0
- package/deps/simdutf/.github/workflows/ppc64le.yml +29 -0
- package/deps/simdutf/.github/workflows/rvv-1024-clang-18.yml +35 -0
- package/deps/simdutf/.github/workflows/rvv-128-clang-17.yml +35 -0
- package/deps/simdutf/.github/workflows/rvv-256-gcc-14.yml +31 -0
- package/deps/simdutf/.github/workflows/s390x.yml +29 -0
- package/deps/simdutf/.github/workflows/selective-amalgamation.yml +29 -0
- package/deps/simdutf/.github/workflows/typos.yml +19 -0
- package/deps/simdutf/.github/workflows/ubuntu22-cxx20.yml +30 -0
- package/deps/simdutf/.github/workflows/ubuntu22.yml +32 -0
- package/deps/simdutf/.github/workflows/ubuntu22_gcc12.yml +27 -0
- package/deps/simdutf/.github/workflows/ubuntu22sani.yml +29 -0
- package/deps/simdutf/.github/workflows/ubuntu24-cxxstandards.yml +34 -0
- package/deps/simdutf/.github/workflows/ubuntu24-unsignedchar.yml +34 -0
- package/deps/simdutf/.github/workflows/ubuntu24.yml +32 -0
- package/deps/simdutf/.github/workflows/ubuntu24sani.yml +36 -0
- package/deps/simdutf/.github/workflows/ubuntu24sani_clang.yml +29 -0
- package/deps/simdutf/.github/workflows/vs17-arm-ci.yml +21 -0
- package/deps/simdutf/.github/workflows/vs17-ci-cxx20.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-ci.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-clang-ci.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-cxxstandards.yml +36 -0
- package/deps/simdutf/AI_USAGE_POLICY.md +56 -0
- package/deps/simdutf/AUTHORS +6 -0
- package/deps/simdutf/CMakeLists.txt +231 -0
- package/deps/simdutf/CONTRIBUTING.md +214 -0
- package/deps/simdutf/CONTRIBUTORS +1 -0
- package/deps/simdutf/Doxyfile +2584 -0
- package/deps/simdutf/LICENSE-APACHE +201 -0
- package/deps/simdutf/LICENSE-MIT +18 -0
- package/deps/simdutf/Makefile.crosscompile +54 -0
- package/deps/simdutf/README-RVV.md +16 -0
- package/deps/simdutf/README.md +2782 -0
- package/deps/simdutf/SECURITY.md +8 -0
- package/deps/simdutf/benchmarks/CMakeLists.txt +101 -0
- package/deps/simdutf/benchmarks/alignment.cpp +150 -0
- package/deps/simdutf/benchmarks/base64/CMakeLists.txt +30 -0
- package/deps/simdutf/benchmarks/base64/benchmark_base64.cpp +875 -0
- package/deps/simdutf/benchmarks/base64/libbase64_spaces.h +49 -0
- package/deps/simdutf/benchmarks/base64/node_base64.h +227 -0
- package/deps/simdutf/benchmarks/base64/openssl3_base64.h +334 -0
- package/deps/simdutf/benchmarks/benchmark.cpp +65 -0
- package/deps/simdutf/benchmarks/benchmark_to_well_formed_utf16.cpp +347 -0
- package/deps/simdutf/benchmarks/competition/.clang-format-ignore +5 -0
- package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.cpp +1276 -0
- package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.h +595 -0
- package/deps/simdutf/benchmarks/competition/README.md +7 -0
- package/deps/simdutf/benchmarks/competition/hoehrmann/hoehrmann.h +91 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16.h +444 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16_tables.h +13183 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/script.py +73 -0
- package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.cpp +738 -0
- package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.h +293 -0
- package/deps/simdutf/benchmarks/competition/u8u16/COPYRIGHT +8 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Makefile +44 -0
- package/deps/simdutf/benchmarks/competition/u8u16/OSL3.0.txt +169 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/BOM_Profiler.h +148 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/i386_timer.h +45 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/ppc_timer.c +34 -0
- package/deps/simdutf/benchmarks/competition/u8u16/README +56 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/config_defs.h +43 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/g4_config.h +27 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/mmx_config.h +16 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/p4_config.h +18 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/p4_ideal_config.h +16 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/spu_config.h +28 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/ssse3_config.h +20 -0
- package/deps/simdutf/benchmarks/competition/u8u16/iconv_u8u16.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/altivec_simd.h +440 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_basic_ops.py +121 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_half_operand_versions.py +158 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_test.py +270 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd.h +141 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_basic.h +216 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_built_in.h +119 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_modified.h +2430 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/outline.txt +39 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/spu_simd.h +421 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/sse_simd.h +836 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/stdint.h +222 -0
- package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_BE.c +4 -0
- package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_LE.c +5 -0
- package/deps/simdutf/benchmarks/competition/u8u16/proto/u8u16.py +390 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/Makefile +18 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/bytelex.h +448 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/charsets/ASCII_EBCDIC.h +284 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.c +1975 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.pdf +0 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.w +2263 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/multiliteral.h +239 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/u8u16.c +232 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/x8x16.c +194 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.c +193 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.h +167 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.c +288 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.h +117 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_g4.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_mmx.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4.c +3 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4_ideal.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_spu.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_ssse3.c +3 -0
- package/deps/simdutf/benchmarks/competition/u8u16/x8x16_p4.c +2 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/LICENSE +23 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/data/test_minimal.txt +44 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/readme.md +106 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_corr_tests.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_example.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_file_conv.sh +14 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_lib.sh +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_sample.sh +8 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_corr_tests.cmd +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_example.cmd +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_file_conv.cmd +14 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_lib.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_sample.cmd +8 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_corr_tests.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_example.cmd +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_file_conv.cmd +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_lib.cmd +10 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_sample.cmd +9 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/html_table.py +25 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/measure.py +94 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/resize.py +20 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_all.cmd +2 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_interm.cmd +1 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/CustomMemcpy.h +75 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/PerfDefs.h +47 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.cpp +17 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.h +76 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/AllProcessors.cpp +35 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.cpp +117 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.h +210 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferDecoder.h +158 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferEncoder.h +104 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorPlugins.h +334 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorSelector.h +186 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.cpp +140 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.h +42 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderProcess.h +100 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/Dfa.h +57 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.cpp +85 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.h +27 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderProcess.h +126 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/ProcessTrivial.h +108 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.cpp +139 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.h +74 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.cpp +65 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.h +91 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/CorrectnessTests.cpp +772 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/Example.cpp +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/FileConverter.cpp +486 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/iconv_sample.c +162 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/utf8lut.h +15 -0
- package/deps/simdutf/benchmarks/competition/utf8sse4/fromutf8-sse.cpp +292 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/LICENSE +23 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/README.md +1503 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/checked.h +335 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/core.h +338 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp11.h +103 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp17.h +103 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/unchecked.h +274 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8.h +34 -0
- package/deps/simdutf/benchmarks/dataset/README.md +155 -0
- package/deps/simdutf/benchmarks/dataset/emoji.txt +204 -0
- package/deps/simdutf/benchmarks/dataset/scripts/utf8type.py +40 -0
- package/deps/simdutf/benchmarks/dataset/wikipedia_mars/Makefile +80 -0
- package/deps/simdutf/benchmarks/dataset/wikipedia_mars/convert_to_utf6.py +20 -0
- package/deps/simdutf/benchmarks/find/CMakeLists.txt +6 -0
- package/deps/simdutf/benchmarks/find/findbenchmark.cpp +63 -0
- package/deps/simdutf/benchmarks/find/findbenchmarker.h +46 -0
- package/deps/simdutf/benchmarks/shortbench.cpp +555 -0
- package/deps/simdutf/benchmarks/src/CMakeLists.txt +52 -0
- package/deps/simdutf/benchmarks/src/apple_arm_events.h +1104 -0
- package/deps/simdutf/benchmarks/src/benchmark.cpp +3899 -0
- package/deps/simdutf/benchmarks/src/benchmark.h +317 -0
- package/deps/simdutf/benchmarks/src/benchmark_base.cpp +144 -0
- package/deps/simdutf/benchmarks/src/benchmark_base.h +98 -0
- package/deps/simdutf/benchmarks/src/cmdline.cpp +176 -0
- package/deps/simdutf/benchmarks/src/cmdline.h +35 -0
- package/deps/simdutf/benchmarks/src/event_counter.h +162 -0
- package/deps/simdutf/benchmarks/src/linux-perf-events.h +104 -0
- package/deps/simdutf/benchmarks/stream.cpp +209 -0
- package/deps/simdutf/benchmarks/threaded.cpp +123 -0
- package/deps/simdutf/cmake/CPM.cmake +1363 -0
- package/deps/simdutf/cmake/JoinPaths.cmake +23 -0
- package/deps/simdutf/cmake/add_cpp_test.cmake +68 -0
- package/deps/simdutf/cmake/simdutf-config.cmake.in +2 -0
- package/deps/simdutf/cmake/simdutf-flags.cmake +26 -0
- package/deps/simdutf/cmake/toolchains-ci/riscv64-linux-gnu.cmake +4 -0
- package/deps/simdutf/cmake/toolchains-dev/README.md +32 -0
- package/deps/simdutf/cmake/toolchains-dev/aarch64.cmake +14 -0
- package/deps/simdutf/cmake/toolchains-dev/loongarch64.cmake +22 -0
- package/deps/simdutf/cmake/toolchains-dev/powerpc64.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/powerpc64le.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/riscv64.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/rvv-spike.cmake +38 -0
- package/deps/simdutf/doc/avx512.png +0 -0
- package/deps/simdutf/doc/logo.png +0 -0
- package/deps/simdutf/doc/logo.svg +165 -0
- package/deps/simdutf/doc/node2023.png +0 -0
- package/deps/simdutf/doc/shortinput.md +78 -0
- package/deps/simdutf/doc/utf16utf8.png +0 -0
- package/deps/simdutf/doc/utf8utf16.png +0 -0
- package/deps/simdutf/doc/widelogo.png +0 -0
- package/deps/simdutf/doxygen.py +50 -0
- package/deps/simdutf/fuzz/.clang-format +9 -0
- package/deps/simdutf/fuzz/CMakeLists.txt +45 -0
- package/deps/simdutf/fuzz/README.md +168 -0
- package/deps/simdutf/fuzz/atomic_base64.cpp +448 -0
- package/deps/simdutf/fuzz/base64.cpp +278 -0
- package/deps/simdutf/fuzz/build.sh +83 -0
- package/deps/simdutf/fuzz/conversion.cpp +669 -0
- package/deps/simdutf/fuzz/helpers/.clang-format-ignore +1 -0
- package/deps/simdutf/fuzz/helpers/common.h +135 -0
- package/deps/simdutf/fuzz/helpers/nameof.hpp +1258 -0
- package/deps/simdutf/fuzz/main.cpp +72 -0
- package/deps/simdutf/fuzz/minimize_and_cleanse.sh +87 -0
- package/deps/simdutf/fuzz/misc.cpp +216 -0
- package/deps/simdutf/fuzz/random_fuzz.sh +154 -0
- package/deps/simdutf/fuzz/roundtrip.cpp +588 -0
- package/deps/simdutf/fuzz/safe_conversion.cpp +104 -0
- package/deps/simdutf/include/simdutf/avx512.h +79 -0
- package/deps/simdutf/include/simdutf/base64_implementation.h +158 -0
- package/deps/simdutf/include/simdutf/base64_tables.h +887 -0
- package/deps/simdutf/include/simdutf/common_defs.h +186 -0
- package/deps/simdutf/include/simdutf/compiler_check.h +50 -0
- package/deps/simdutf/include/simdutf/constexpr_ptr.h +138 -0
- package/deps/simdutf/include/simdutf/encoding_types.h +189 -0
- package/deps/simdutf/include/simdutf/error.h +126 -0
- package/deps/simdutf/include/simdutf/implementation.h +7081 -0
- package/deps/simdutf/include/simdutf/internal/isadetection.h +325 -0
- package/deps/simdutf/include/simdutf/portability.h +285 -0
- package/deps/simdutf/include/simdutf/scalar/ascii.h +86 -0
- package/deps/simdutf/include/simdutf/scalar/atomic_util.h +105 -0
- package/deps/simdutf/include/simdutf/scalar/base64.h +911 -0
- package/deps/simdutf/include/simdutf/scalar/latin1.h +26 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf16/latin1_to_utf16.h +52 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf32/latin1_to_utf32.h +27 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf8/latin1_to_utf8.h +191 -0
- package/deps/simdutf/include/simdutf/scalar/swap_bytes.h +35 -0
- package/deps/simdutf/include/simdutf/scalar/utf16.h +226 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/utf16_to_latin1.h +108 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/valid_utf16_to_latin1.h +40 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/utf16_to_utf32.h +86 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/valid_utf16_to_utf32.h +44 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/utf16_to_utf8.h +295 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/valid_utf16_to_utf8.h +91 -0
- package/deps/simdutf/include/simdutf/scalar/utf32.h +82 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/utf32_to_latin1.h +68 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/valid_utf32_to_latin1.h +67 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/utf32_to_utf16.h +84 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/valid_utf32_to_utf16.h +44 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/utf32_to_utf8.h +142 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/valid_utf32_to_utf8.h +72 -0
- package/deps/simdutf/include/simdutf/scalar/utf8.h +326 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/utf8_to_latin1.h +225 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/valid_utf8_to_latin1.h +87 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/utf8_to_utf16.h +342 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/valid_utf8_to_utf16.h +106 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/utf8_to_utf32.h +299 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/valid_utf8_to_utf32.h +83 -0
- package/deps/simdutf/include/simdutf/simdutf_version.h +26 -0
- package/deps/simdutf/include/simdutf.h +26 -0
- package/deps/simdutf/include/simdutf_c.h +342 -0
- package/deps/simdutf/riscv/Dockerfile +16 -0
- package/deps/simdutf/riscv/README.md +24 -0
- package/deps/simdutf/riscv/remove-docker-station +8 -0
- package/deps/simdutf/riscv/run-docker-station +31 -0
- package/deps/simdutf/scripts/.flake8 +2 -0
- package/deps/simdutf/scripts/Makefile +2 -0
- package/deps/simdutf/scripts/README_ADD_FUNCTION.md +49 -0
- package/deps/simdutf/scripts/add_function.py +330 -0
- package/deps/simdutf/scripts/amalgamation_tests.py +156 -0
- package/deps/simdutf/scripts/base64/Makefile +2 -0
- package/deps/simdutf/scripts/base64/README.md +2 -0
- package/deps/simdutf/scripts/base64/avx512.py +76 -0
- package/deps/simdutf/scripts/base64/neon_decode.py +143 -0
- package/deps/simdutf/scripts/base64/neon_generate_lut.py +101 -0
- package/deps/simdutf/scripts/base64/sse.py +252 -0
- package/deps/simdutf/scripts/base64/sseregular.py +160 -0
- package/deps/simdutf/scripts/base64/sseurl.py +283 -0
- package/deps/simdutf/scripts/base64/table.py +59 -0
- package/deps/simdutf/scripts/base64bench_print.py +145 -0
- package/deps/simdutf/scripts/benchmark-all.py +119 -0
- package/deps/simdutf/scripts/benchmark_print.py +324 -0
- package/deps/simdutf/scripts/check_feature_macros.py +156 -0
- package/deps/simdutf/scripts/check_typos.sh +13 -0
- package/deps/simdutf/scripts/clang_format.sh +35 -0
- package/deps/simdutf/scripts/clang_format_docker.sh +38 -0
- package/deps/simdutf/scripts/common.py +24 -0
- package/deps/simdutf/scripts/compilation_benchmark.py +55 -0
- package/deps/simdutf/scripts/compile_many_variations.sh +64 -0
- package/deps/simdutf/scripts/create_latex_table.py +62 -0
- package/deps/simdutf/scripts/docker/Dockerfile +14 -0
- package/deps/simdutf/scripts/docker/Makefile +9 -0
- package/deps/simdutf/scripts/docker/README.md +30 -0
- package/deps/simdutf/scripts/docker/llvm.gpg +0 -0
- package/deps/simdutf/scripts/ppc64_convert_utf16_to_utf8.py +155 -0
- package/deps/simdutf/scripts/prepare_doxygen.sh +21 -0
- package/deps/simdutf/scripts/release.py +197 -0
- package/deps/simdutf/scripts/shortinputplots.py +97 -0
- package/deps/simdutf/scripts/sse_convert_utf16_to_utf8.py +422 -0
- package/deps/simdutf/scripts/sse_convert_utf32_to_utf16.py +105 -0
- package/deps/simdutf/scripts/sse_utf8_utf16_decode.py +186 -0
- package/deps/simdutf/scripts/sse_validate_utf16le_proof.py +137 -0
- package/deps/simdutf/scripts/sse_validate_utf16le_testcases.py +129 -0
- package/deps/simdutf/scripts/table.py +207 -0
- package/deps/simdutf/scripts/tests/new.txt +33 -0
- package/deps/simdutf/scripts/tests/old.txt +33 -0
- package/deps/simdutf/scripts/tests/results.txt +272 -0
- package/deps/simdutf/simdutf.pc.in +11 -0
- package/deps/simdutf/singleheader/.flake8 +2 -0
- package/deps/simdutf/singleheader/CMakeLists.txt +64 -0
- package/deps/simdutf/singleheader/README-dev.md +81 -0
- package/deps/simdutf/singleheader/README.md +19 -0
- package/deps/simdutf/singleheader/amalgamate.py +513 -0
- package/deps/simdutf/singleheader/amalgamation_demo.c +59 -0
- package/deps/simdutf/singleheader/amalgamation_demo.cpp +54 -0
- package/deps/simdutf/singleheader/test-features.py +262 -0
- package/deps/simdutf/src/CMakeLists.txt +78 -0
- package/deps/simdutf/src/arm64/arm_base64.cpp +791 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf16.cpp +24 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf32.cpp +24 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf8.cpp +70 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_latin1.cpp +61 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf32.cpp +185 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf8.cpp +780 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_latin1.cpp +60 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf16.cpp +208 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf8.cpp +505 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_latin1.cpp +69 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf16.cpp +313 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf32.cpp +179 -0
- package/deps/simdutf/src/arm64/arm_find.cpp +199 -0
- package/deps/simdutf/src/arm64/arm_utf16fix.cpp +185 -0
- package/deps/simdutf/src/arm64/arm_validate_utf16.cpp +165 -0
- package/deps/simdutf/src/arm64/arm_validate_utf32le.cpp +65 -0
- package/deps/simdutf/src/arm64/implementation.cpp +1442 -0
- package/deps/simdutf/src/encoding_types.cpp +67 -0
- package/deps/simdutf/src/error.cpp +3 -0
- package/deps/simdutf/src/fallback/implementation.cpp +589 -0
- package/deps/simdutf/src/generic/ascii_validation.h +50 -0
- package/deps/simdutf/src/generic/base64.h +233 -0
- package/deps/simdutf/src/generic/base64lengths.h +63 -0
- package/deps/simdutf/src/generic/buf_block_reader.h +109 -0
- package/deps/simdutf/src/generic/find.h +75 -0
- package/deps/simdutf/src/generic/utf16/change_endianness.h +24 -0
- package/deps/simdutf/src/generic/utf16/count_code_points_bytemask.h +58 -0
- package/deps/simdutf/src/generic/utf16/to_well_formed.h +93 -0
- package/deps/simdutf/src/generic/utf16/utf32_length_from_utf16.h +15 -0
- package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16.h +35 -0
- package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16_bytemask.h +199 -0
- package/deps/simdutf/src/generic/utf16.h +73 -0
- package/deps/simdutf/src/generic/utf32.h +136 -0
- package/deps/simdutf/src/generic/utf8/utf16_length_from_utf8_bytemask.h +53 -0
- package/deps/simdutf/src/generic/utf8.h +92 -0
- package/deps/simdutf/src/generic/utf8_to_latin1/utf8_to_latin1.h +316 -0
- package/deps/simdutf/src/generic/utf8_to_latin1/valid_utf8_to_latin1.h +78 -0
- package/deps/simdutf/src/generic/utf8_to_utf16/utf8_to_utf16.h +332 -0
- package/deps/simdutf/src/generic/utf8_to_utf16/valid_utf8_to_utf16.h +74 -0
- package/deps/simdutf/src/generic/utf8_to_utf32/utf8_to_utf32.h +318 -0
- package/deps/simdutf/src/generic/utf8_to_utf32/valid_utf8_to_utf32.h +42 -0
- package/deps/simdutf/src/generic/utf8_validation/utf8_lookup4_algorithm.h +223 -0
- package/deps/simdutf/src/generic/utf8_validation/utf8_validator.h +84 -0
- package/deps/simdutf/src/generic/validate_utf16.h +164 -0
- package/deps/simdutf/src/generic/validate_utf32.h +99 -0
- package/deps/simdutf/src/haswell/avx2_base64.cpp +837 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf16.cpp +28 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf32.cpp +20 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf8.cpp +83 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_latin1.cpp +83 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf32.cpp +210 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf8.cpp +602 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_latin1.cpp +116 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf16.cpp +164 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf8.cpp +569 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_latin1.cpp +60 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf16.cpp +195 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf32.cpp +135 -0
- package/deps/simdutf/src/haswell/avx2_utf16fix.cpp +173 -0
- package/deps/simdutf/src/haswell/avx2_validate_utf16.cpp +17 -0
- package/deps/simdutf/src/haswell/implementation.cpp +1447 -0
- package/deps/simdutf/src/icelake/icelake_ascii_validation.inl.cpp +19 -0
- package/deps/simdutf/src/icelake/icelake_base64.inl.cpp +630 -0
- package/deps/simdutf/src/icelake/icelake_common.inl.cpp +37 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf16.inl.cpp +36 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf32.inl.cpp +23 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf8.inl.cpp +107 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_latin1.inl.cpp +103 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf32.inl.cpp +136 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf8.inl.cpp +206 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_latin1.inl.cpp +74 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf16.inl.cpp +338 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf8.inl.cpp +574 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf8_to_latin1.inl.cpp +104 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf8_to_utf16.inl.cpp +75 -0
- package/deps/simdutf/src/icelake/icelake_convert_valid_utf8_to_latin1.inl.cpp +69 -0
- package/deps/simdutf/src/icelake/icelake_find.inl.cpp +146 -0
- package/deps/simdutf/src/icelake/icelake_from_utf8.inl.cpp +266 -0
- package/deps/simdutf/src/icelake/icelake_from_valid_utf8.inl.cpp +136 -0
- package/deps/simdutf/src/icelake/icelake_macros.inl.cpp +143 -0
- package/deps/simdutf/src/icelake/icelake_utf16fix.cpp +138 -0
- package/deps/simdutf/src/icelake/icelake_utf32_validation.inl.cpp +63 -0
- package/deps/simdutf/src/icelake/icelake_utf8_common.inl.cpp +753 -0
- package/deps/simdutf/src/icelake/icelake_utf8_length_from_utf16.inl.cpp +269 -0
- package/deps/simdutf/src/icelake/icelake_utf8_validation.inl.cpp +116 -0
- package/deps/simdutf/src/icelake/implementation.cpp +1903 -0
- package/deps/simdutf/src/implementation.cpp +2526 -0
- package/deps/simdutf/src/lasx/implementation.cpp +1531 -0
- package/deps/simdutf/src/lasx/lasx_base64.cpp +695 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf16.cpp +76 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf32.cpp +55 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf8.cpp +65 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_latin1.cpp +64 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf32.cpp +183 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf8.cpp +550 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_latin1.cpp +73 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf16.cpp +218 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf8.cpp +589 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_latin1.cpp +72 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf16.cpp +296 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf32.cpp +190 -0
- package/deps/simdutf/src/lasx/lasx_find.cpp +64 -0
- package/deps/simdutf/src/lasx/lasx_validate_utf16.cpp +13 -0
- package/deps/simdutf/src/lasx/lasx_validate_utf32le.cpp +84 -0
- package/deps/simdutf/src/lsx/implementation.cpp +1417 -0
- package/deps/simdutf/src/lsx/lsx_base64.cpp +675 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf16.cpp +39 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf32.cpp +27 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf8.cpp +56 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_latin1.cpp +64 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf32.cpp +133 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf8.cpp +518 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_latin1.cpp +66 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf16.cpp +155 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf8.cpp +459 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_latin1.cpp +75 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf16.cpp +291 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf32.cpp +179 -0
- package/deps/simdutf/src/lsx/lsx_find.cpp +60 -0
- package/deps/simdutf/src/lsx/lsx_validate_utf16.cpp +13 -0
- package/deps/simdutf/src/lsx/lsx_validate_utf32le.cpp +68 -0
- package/deps/simdutf/src/ppc64/implementation.cpp +992 -0
- package/deps/simdutf/src/ppc64/ppc64_base64.cpp +480 -0
- package/deps/simdutf/src/ppc64/ppc64_base64_internal_tests.cpp +401 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf16.cpp +12 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf32.cpp +12 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf8.cpp +149 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_latin1.cpp +67 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf32.cpp +87 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf8.cpp +296 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_latin1.cpp +57 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf16.cpp +117 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf8.cpp +166 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_latin1.cpp +69 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf16.cpp +211 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf32.cpp +153 -0
- package/deps/simdutf/src/ppc64/ppc64_utf16_to_utf8_tables.h +1011 -0
- package/deps/simdutf/src/ppc64/ppc64_utf8_length_from_latin1.cpp +37 -0
- package/deps/simdutf/src/ppc64/ppc64_validate_utf16.cpp +19 -0
- package/deps/simdutf/src/ppc64/templates.cpp +91 -0
- package/deps/simdutf/src/rvv/implementation.cpp +138 -0
- package/deps/simdutf/src/rvv/rvv_find.cpp +27 -0
- package/deps/simdutf/src/rvv/rvv_helpers.inl.cpp +23 -0
- package/deps/simdutf/src/rvv/rvv_latin1_to.inl.cpp +71 -0
- package/deps/simdutf/src/rvv/rvv_length_from.inl.cpp +164 -0
- package/deps/simdutf/src/rvv/rvv_utf16_to.inl.cpp +399 -0
- package/deps/simdutf/src/rvv/rvv_utf16fix.cpp +110 -0
- package/deps/simdutf/src/rvv/rvv_utf32_to.inl.cpp +307 -0
- package/deps/simdutf/src/rvv/rvv_utf8_to.inl.cpp +435 -0
- package/deps/simdutf/src/rvv/rvv_validate.inl.cpp +275 -0
- package/deps/simdutf/src/simdutf/arm64/begin.h +2 -0
- package/deps/simdutf/src/simdutf/arm64/bitmanipulation.h +34 -0
- package/deps/simdutf/src/simdutf/arm64/end.h +2 -0
- package/deps/simdutf/src/simdutf/arm64/implementation.h +307 -0
- package/deps/simdutf/src/simdutf/arm64/intrinsics.h +10 -0
- package/deps/simdutf/src/simdutf/arm64/simd.h +547 -0
- package/deps/simdutf/src/simdutf/arm64/simd16-inl.h +403 -0
- package/deps/simdutf/src/simdutf/arm64/simd32-inl.h +129 -0
- package/deps/simdutf/src/simdutf/arm64/simd64-inl.h +28 -0
- package/deps/simdutf/src/simdutf/arm64.h +43 -0
- package/deps/simdutf/src/simdutf/fallback/begin.h +1 -0
- package/deps/simdutf/src/simdutf/fallback/bitmanipulation.h +13 -0
- package/deps/simdutf/src/simdutf/fallback/end.h +1 -0
- package/deps/simdutf/src/simdutf/fallback/implementation.h +331 -0
- package/deps/simdutf/src/simdutf/fallback.h +42 -0
- package/deps/simdutf/src/simdutf/haswell/begin.h +15 -0
- package/deps/simdutf/src/simdutf/haswell/bitmanipulation.h +35 -0
- package/deps/simdutf/src/simdutf/haswell/end.h +13 -0
- package/deps/simdutf/src/simdutf/haswell/implementation.h +338 -0
- package/deps/simdutf/src/simdutf/haswell/intrinsics.h +67 -0
- package/deps/simdutf/src/simdutf/haswell/simd.h +363 -0
- package/deps/simdutf/src/simdutf/haswell/simd16-inl.h +261 -0
- package/deps/simdutf/src/simdutf/haswell/simd32-inl.h +111 -0
- package/deps/simdutf/src/simdutf/haswell/simd64-inl.h +34 -0
- package/deps/simdutf/src/simdutf/haswell.h +63 -0
- package/deps/simdutf/src/simdutf/icelake/begin.h +14 -0
- package/deps/simdutf/src/simdutf/icelake/bitmanipulation.h +44 -0
- package/deps/simdutf/src/simdutf/icelake/end.h +12 -0
- package/deps/simdutf/src/simdutf/icelake/implementation.h +346 -0
- package/deps/simdutf/src/simdutf/icelake/intrinsics.h +138 -0
- package/deps/simdutf/src/simdutf/icelake/simd.h +17 -0
- package/deps/simdutf/src/simdutf/icelake/simd16-inl.h +90 -0
- package/deps/simdutf/src/simdutf/icelake/simd32-inl.h +47 -0
- package/deps/simdutf/src/simdutf/icelake.h +81 -0
- package/deps/simdutf/src/simdutf/lasx/begin.h +8 -0
- package/deps/simdutf/src/simdutf/lasx/bitmanipulation.h +25 -0
- package/deps/simdutf/src/simdutf/lasx/end.h +8 -0
- package/deps/simdutf/src/simdutf/lasx/implementation.h +310 -0
- package/deps/simdutf/src/simdutf/lasx/intrinsics.h +319 -0
- package/deps/simdutf/src/simdutf/lasx/simd.h +551 -0
- package/deps/simdutf/src/simdutf/lasx/simd16-inl.h +234 -0
- package/deps/simdutf/src/simdutf/lasx/simd32-inl.h +74 -0
- package/deps/simdutf/src/simdutf/lasx/simd64-inl.h +52 -0
- package/deps/simdutf/src/simdutf/lasx.h +49 -0
- package/deps/simdutf/src/simdutf/lsx/begin.h +2 -0
- package/deps/simdutf/src/simdutf/lsx/bitmanipulation.h +25 -0
- package/deps/simdutf/src/simdutf/lsx/end.h +2 -0
- package/deps/simdutf/src/simdutf/lsx/implementation.h +309 -0
- package/deps/simdutf/src/simdutf/lsx/intrinsics.h +196 -0
- package/deps/simdutf/src/simdutf/lsx/simd.h +421 -0
- package/deps/simdutf/src/simdutf/lsx/simd16-inl.h +242 -0
- package/deps/simdutf/src/simdutf/lsx/simd32-inl.h +69 -0
- package/deps/simdutf/src/simdutf/lsx/simd64-inl.h +50 -0
- package/deps/simdutf/src/simdutf/lsx.h +52 -0
- package/deps/simdutf/src/simdutf/ppc64/begin.h +1 -0
- package/deps/simdutf/src/simdutf/ppc64/bitmanipulation.h +29 -0
- package/deps/simdutf/src/simdutf/ppc64/end.h +1 -0
- package/deps/simdutf/src/simdutf/ppc64/implementation.h +348 -0
- package/deps/simdutf/src/simdutf/ppc64/intrinsics.h +19 -0
- package/deps/simdutf/src/simdutf/ppc64/simd.h +177 -0
- package/deps/simdutf/src/simdutf/ppc64/simd16-inl.h +327 -0
- package/deps/simdutf/src/simdutf/ppc64/simd32-inl.h +247 -0
- package/deps/simdutf/src/simdutf/ppc64/simd8-inl.h +618 -0
- package/deps/simdutf/src/simdutf/ppc64.h +40 -0
- package/deps/simdutf/src/simdutf/rvv/begin.h +7 -0
- package/deps/simdutf/src/simdutf/rvv/end.h +7 -0
- package/deps/simdutf/src/simdutf/rvv/implementation.h +321 -0
- package/deps/simdutf/src/simdutf/rvv/intrinsics.h +131 -0
- package/deps/simdutf/src/simdutf/rvv.h +41 -0
- package/deps/simdutf/src/simdutf/westmere/begin.h +8 -0
- package/deps/simdutf/src/simdutf/westmere/bitmanipulation.h +37 -0
- package/deps/simdutf/src/simdutf/westmere/end.h +8 -0
- package/deps/simdutf/src/simdutf/westmere/implementation.h +338 -0
- package/deps/simdutf/src/simdutf/westmere/intrinsics.h +38 -0
- package/deps/simdutf/src/simdutf/westmere/simd.h +379 -0
- package/deps/simdutf/src/simdutf/westmere/simd16-inl.h +242 -0
- package/deps/simdutf/src/simdutf/westmere/simd32-inl.h +151 -0
- package/deps/simdutf/src/simdutf/westmere/simd64-inl.h +33 -0
- package/deps/simdutf/src/simdutf/westmere.h +59 -0
- package/deps/simdutf/src/simdutf.cpp +152 -0
- package/deps/simdutf/src/simdutf_c.cpp +525 -0
- package/deps/simdutf/src/tables/utf16_to_utf8_tables.h +768 -0
- package/deps/simdutf/src/tables/utf32_to_utf16_tables.h +53 -0
- package/deps/simdutf/src/tables/utf8_to_utf16_tables.h +826 -0
- package/deps/simdutf/src/westmere/implementation.cpp +1479 -0
- package/deps/simdutf/src/westmere/internal/loader.cpp +7 -0
- package/deps/simdutf/src/westmere/internal/write_v_u16_11bits_to_utf8.cpp +66 -0
- package/deps/simdutf/src/westmere/sse_base64.cpp +672 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf16.cpp +21 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf32.cpp +31 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf8.cpp +71 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_latin1.cpp +70 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf32.cpp +206 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf8.cpp +504 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_latin1.cpp +82 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf16.cpp +209 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf8.cpp +589 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_latin1.cpp +58 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf16.cpp +197 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf32.cpp +141 -0
- package/deps/simdutf/src/westmere/sse_utf16fix.cpp +82 -0
- package/deps/simdutf/src/westmere/sse_validate_utf16.cpp +17 -0
- package/deps/simdutf/tests/CMakeLists.txt +483 -0
- package/deps/simdutf/tests/atomic_base64_tests.cpp +2845 -0
- package/deps/simdutf/tests/base64_tests.cpp +3617 -0
- package/deps/simdutf/tests/basic_fuzzer.cpp +805 -0
- package/deps/simdutf/tests/bele_tests.cpp +182 -0
- package/deps/simdutf/tests/constexpr_base64_tests.cpp +387 -0
- package/deps/simdutf/tests/convert_latin1_to_utf16be_tests.cpp +52 -0
- package/deps/simdutf/tests/convert_latin1_to_utf16le_tests.cpp +80 -0
- package/deps/simdutf/tests/convert_latin1_to_utf32_tests.cpp +66 -0
- package/deps/simdutf/tests/convert_latin1_to_utf8_tests.cpp +120 -0
- package/deps/simdutf/tests/convert_utf16_to_utf8_safe_tests.cpp +203 -0
- package/deps/simdutf/tests/convert_utf16_to_utf8_with_replacement_tests.cpp +276 -0
- package/deps/simdutf/tests/convert_utf16be_to_latin1_tests.cpp +109 -0
- package/deps/simdutf/tests/convert_utf16be_to_latin1_tests_with_errors.cpp +136 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf32_tests.cpp +193 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf32_with_errors_tests.cpp +381 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf8_tests.cpp +259 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf8_with_errors_tests.cpp +266 -0
- package/deps/simdutf/tests/convert_utf16le_to_latin1_tests.cpp +148 -0
- package/deps/simdutf/tests/convert_utf16le_to_latin1_tests_with_errors.cpp +176 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf32_tests.cpp +213 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf32_with_errors_tests.cpp +318 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf8_tests.cpp +343 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf8_with_errors_tests.cpp +271 -0
- package/deps/simdutf/tests/convert_utf32_to_latin1_tests.cpp +111 -0
- package/deps/simdutf/tests/convert_utf32_to_latin1_with_errors_tests.cpp +96 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16be_tests.cpp +148 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16be_with_errors_tests.cpp +192 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16le_tests.cpp +166 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16le_with_errors_tests.cpp +215 -0
- package/deps/simdutf/tests/convert_utf32_to_utf8_tests.cpp +181 -0
- package/deps/simdutf/tests/convert_utf32_to_utf8_with_errors_tests.cpp +261 -0
- package/deps/simdutf/tests/convert_utf8_to_latin1_tests.cpp +516 -0
- package/deps/simdutf/tests/convert_utf8_to_latin1_with_errors_tests.cpp +579 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16be_tests.cpp +412 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16be_with_errors_tests.cpp +480 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16le_tests.cpp +671 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16le_with_errors_tests.cpp +455 -0
- package/deps/simdutf/tests/convert_utf8_to_utf32_tests.cpp +1204 -0
- package/deps/simdutf/tests/convert_utf8_to_utf32_with_errors_tests.cpp +337 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_latin1_tests.cpp +37 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_utf32_tests.cpp +97 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_utf8_tests.cpp +126 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_latin1_tests.cpp +71 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_utf32_tests.cpp +122 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_utf8_tests.cpp +244 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_latin1_tests.cpp +49 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf16be_tests.cpp +92 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf16le_tests.cpp +114 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf8_tests.cpp +109 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_latin1_tests.cpp +84 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf16be_tests.cpp +124 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf16le_tests.cpp +221 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf32_tests.cpp +155 -0
- package/deps/simdutf/tests/count_utf16be.cpp +64 -0
- package/deps/simdutf/tests/count_utf16le.cpp +61 -0
- package/deps/simdutf/tests/count_utf8.cpp +87 -0
- package/deps/simdutf/tests/detect_encodings_tests.cpp +312 -0
- package/deps/simdutf/tests/embed/valid_utf8.txt +1 -0
- package/deps/simdutf/tests/embed_tests.cpp +22 -0
- package/deps/simdutf/tests/find_tests.cpp +77 -0
- package/deps/simdutf/tests/fixed_string_tests.cpp +153 -0
- package/deps/simdutf/tests/helpers/CMakeLists.txt +25 -0
- package/deps/simdutf/tests/helpers/compiletime_conversions.h +222 -0
- package/deps/simdutf/tests/helpers/fixed_string.h +267 -0
- package/deps/simdutf/tests/helpers/random_int.cpp +30 -0
- package/deps/simdutf/tests/helpers/random_int.h +39 -0
- package/deps/simdutf/tests/helpers/random_utf16.cpp +123 -0
- package/deps/simdutf/tests/helpers/random_utf16.h +52 -0
- package/deps/simdutf/tests/helpers/random_utf32.cpp +41 -0
- package/deps/simdutf/tests/helpers/random_utf32.h +40 -0
- package/deps/simdutf/tests/helpers/random_utf8.cpp +93 -0
- package/deps/simdutf/tests/helpers/random_utf8.h +36 -0
- package/deps/simdutf/tests/helpers/test.cpp +231 -0
- package/deps/simdutf/tests/helpers/test.h +193 -0
- package/deps/simdutf/tests/helpers/transcode_test_base.cpp +1257 -0
- package/deps/simdutf/tests/helpers/transcode_test_base.h +683 -0
- package/deps/simdutf/tests/helpers/utf16.h +27 -0
- package/deps/simdutf/tests/installation_tests/find/CMakeLists.txt +43 -0
- package/deps/simdutf/tests/installation_tests/from_fetch/CMakeLists.txt +47 -0
- package/deps/simdutf/tests/internal_tests.cpp +27 -0
- package/deps/simdutf/tests/null_safety_tests.cpp +94 -0
- package/deps/simdutf/tests/random_fuzzer.cpp +779 -0
- package/deps/simdutf/tests/readme_tests.cpp +274 -0
- package/deps/simdutf/tests/reference/CMakeLists.txt +23 -0
- package/deps/simdutf/tests/reference/decode_utf16.h +81 -0
- package/deps/simdutf/tests/reference/decode_utf32.h +47 -0
- package/deps/simdutf/tests/reference/encode_latin1.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_latin1.h +32 -0
- package/deps/simdutf/tests/reference/encode_utf16.cpp +49 -0
- package/deps/simdutf/tests/reference/encode_utf16.h +20 -0
- package/deps/simdutf/tests/reference/encode_utf32.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_utf32.h +36 -0
- package/deps/simdutf/tests/reference/encode_utf8.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_utf8.h +40 -0
- package/deps/simdutf/tests/reference/validate_utf16.cpp +60 -0
- package/deps/simdutf/tests/reference/validate_utf16.h +14 -0
- package/deps/simdutf/tests/reference/validate_utf16_to_latin1.cpp +35 -0
- package/deps/simdutf/tests/reference/validate_utf16_to_latin1.h +13 -0
- package/deps/simdutf/tests/reference/validate_utf32.cpp +27 -0
- package/deps/simdutf/tests/reference/validate_utf32.h +12 -0
- package/deps/simdutf/tests/reference/validate_utf32_to_latin1.cpp +27 -0
- package/deps/simdutf/tests/reference/validate_utf32_to_latin1.h +12 -0
- package/deps/simdutf/tests/reference/validate_utf8.cpp +82 -0
- package/deps/simdutf/tests/reference/validate_utf8.h +11 -0
- package/deps/simdutf/tests/reference/validate_utf8_to_latin1.cpp +43 -0
- package/deps/simdutf/tests/reference/validate_utf8_to_latin1.h +12 -0
- package/deps/simdutf/tests/select_implementation.cpp +43 -0
- package/deps/simdutf/tests/simdutf_c_tests.cpp +244 -0
- package/deps/simdutf/tests/span_tests.cpp +401 -0
- package/deps/simdutf/tests/special_tests.cpp +559 -0
- package/deps/simdutf/tests/straight_c_test.c +187 -0
- package/deps/simdutf/tests/text_encoding_tests.cpp +77 -0
- package/deps/simdutf/tests/to_well_formed_utf16_tests.cpp +377 -0
- package/deps/simdutf/tests/utf8_length_from_utf16_tests.cpp +202 -0
- package/deps/simdutf/tests/validate_ascii_basic_tests.cpp +165 -0
- package/deps/simdutf/tests/validate_ascii_with_errors_tests.cpp +77 -0
- package/deps/simdutf/tests/validate_utf16be_basic_tests.cpp +175 -0
- package/deps/simdutf/tests/validate_utf16be_with_errors_tests.cpp +188 -0
- package/deps/simdutf/tests/validate_utf16le_basic_tests.cpp +268 -0
- package/deps/simdutf/tests/validate_utf16le_with_errors_tests.cpp +274 -0
- package/deps/simdutf/tests/validate_utf32_basic_tests.cpp +92 -0
- package/deps/simdutf/tests/validate_utf32_with_errors_tests.cpp +114 -0
- package/deps/simdutf/tests/validate_utf8_basic_tests.cpp +178 -0
- package/deps/simdutf/tests/validate_utf8_brute_force_tests.cpp +88 -0
- package/deps/simdutf/tests/validate_utf8_puzzler_tests.cpp +33 -0
- package/deps/simdutf/tests/validate_utf8_with_errors_tests.cpp +228 -0
- package/deps/simdutf/tools/CMakeLists.txt +85 -0
- package/deps/simdutf/tools/fastbase64.cpp +250 -0
- package/deps/simdutf/tools/sutf.cpp +556 -0
- package/deps/simdutf/tools/sutf.h +40 -0
- package/package.json +2 -2
|
@@ -0,0 +1,836 @@
|
|
|
1
|
+
/* Idealized SIMD Operations with SSE versions
|
|
2
|
+
Copyright (C) 2006, 2007, 2008, Robert D. Cameron
|
|
3
|
+
Licensed to the public under the Open Software License 3.0.
|
|
4
|
+
Licensed to International Characters Inc.
|
|
5
|
+
under the Academic Free License version 3.0.
|
|
6
|
+
*/
|
|
7
|
+
#ifndef SSE_SIMD_H
|
|
8
|
+
#define SSE_SIMD_H
|
|
9
|
+
|
|
10
|
+
/*------------------------------------------------------------*/
|
|
11
|
+
#ifndef _MSC_VER
|
|
12
|
+
#include <stdint.h>
|
|
13
|
+
#endif
|
|
14
|
+
#ifdef _MSC_VER
|
|
15
|
+
// Daniel Lemire (2022-05-17): the next few lines were slightly modified to get it to build under clangcl
|
|
16
|
+
#ifdef __clang__
|
|
17
|
+
#include <stdint.h>
|
|
18
|
+
#else
|
|
19
|
+
#include "stdint.h"
|
|
20
|
+
#endif
|
|
21
|
+
|
|
22
|
+
#ifndef LITTLE_ENDIAN
|
|
23
|
+
#define LITTLE_ENDIAN 1234
|
|
24
|
+
#endif
|
|
25
|
+
|
|
26
|
+
#ifndef BIG_ENDIAN
|
|
27
|
+
#define BIG_ENDIAN 4321
|
|
28
|
+
#endif
|
|
29
|
+
|
|
30
|
+
#ifndef BYTE_ORDER
|
|
31
|
+
#define BYTE_ORDER LITTLE_ENDIAN
|
|
32
|
+
#endif
|
|
33
|
+
|
|
34
|
+
#endif
|
|
35
|
+
#include <limits.h>
|
|
36
|
+
|
|
37
|
+
#ifndef LONG_BIT
|
|
38
|
+
#if ULONG_MAX == 0xFFFFFFFF
|
|
39
|
+
#define LONG_BIT 32
|
|
40
|
+
#endif
|
|
41
|
+
#if ULONG_MAX == 0xFFFFFFFFFFFFFFFF
|
|
42
|
+
#define LONG_BIT 64
|
|
43
|
+
#endif
|
|
44
|
+
#endif
|
|
45
|
+
|
|
46
|
+
#include <emmintrin.h>
|
|
47
|
+
#ifdef USE_LDDQU
|
|
48
|
+
#include <pmmintrin.h>
|
|
49
|
+
#endif
|
|
50
|
+
typedef __m128i SIMD_type;
|
|
51
|
+
|
|
52
|
+
|
|
53
|
+
|
|
54
|
+
#ifdef SSSE3
|
|
55
|
+
#include <tmmintrin.h>
|
|
56
|
+
|
|
57
|
+
#define simd_permute(bytepack, indexes) _mm_shuffle_epi8(bytepack, indexes)
|
|
58
|
+
#endif
|
|
59
|
+
|
|
60
|
+
/*------------------------------------------------------------*/
|
|
61
|
+
/* I. SIMD bitwise logical operations */
|
|
62
|
+
|
|
63
|
+
#define simd_or(b1, b2) _mm_or_si128(b1, b2)
|
|
64
|
+
#define simd_and(b1, b2) _mm_and_si128(b1, b2)
|
|
65
|
+
#define simd_xor(b1, b2) _mm_xor_si128(b1, b2)
|
|
66
|
+
#define simd_andc(b1, b2) _mm_andnot_si128(b2, b1)
|
|
67
|
+
#define simd_if(cond, then_val, else_val) \
|
|
68
|
+
simd_or(simd_and(then_val, cond), simd_andc(else_val, cond))
|
|
69
|
+
#define simd_not(b) (simd_xor(b, _mm_set1_epi32(0xFFFFFFFF)))
|
|
70
|
+
#define simd_nor(a,b) (simd_not(simd_or(a,b)))
|
|
71
|
+
|
|
72
|
+
|
|
73
|
+
/* Specific constants. */
|
|
74
|
+
#define simd_himask_2 _mm_set1_epi32(0xAAAAAAAA)
|
|
75
|
+
#define simd_himask_4 _mm_set1_epi32(0xCCCCCCCC)
|
|
76
|
+
#define simd_himask_8 _mm_set1_epi32(0xF0F0F0F0)
|
|
77
|
+
/* Little-endian */
|
|
78
|
+
#define simd_himask_16 _mm_set1_epi32(0xFF00FF00)
|
|
79
|
+
#define simd_himask_32 _mm_set1_epi32(0xFFFF0000)
|
|
80
|
+
#define simd_himask_64 _mm_set_epi32(-1,0,-1,0)
|
|
81
|
+
#define simd_himask_128 _mm_set_epi32(-1,-1,0,0)
|
|
82
|
+
|
|
83
|
+
/* Idealized operations with direct implementation by built-in
|
|
84
|
+
operations for various target architectures. */
|
|
85
|
+
|
|
86
|
+
#define simd_add_8(a, b) _mm_add_epi8(a, b)
|
|
87
|
+
#define simd_add_16(a, b) _mm_add_epi16(a, b)
|
|
88
|
+
#define simd_add_32(a, b) _mm_add_epi32(a, b)
|
|
89
|
+
#define simd_add_64(a, b) _mm_add_epi64(a, b)
|
|
90
|
+
#define simd_sub_8(a, b) _mm_sub_epi8(a, b)
|
|
91
|
+
#define simd_sub_16(a, b) _mm_sub_epi16(a, b)
|
|
92
|
+
#define simd_sub_32(a, b) _mm_sub_epi32(a, b)
|
|
93
|
+
#define simd_sub_64(a, b) _mm_sub_epi64(a, b)
|
|
94
|
+
#define simd_mult_16(a, b) _mm_mullo_epi16(a, b)
|
|
95
|
+
#define simd_slli_16(r, shft) _mm_slli_epi16(r, shft)
|
|
96
|
+
#define simd_srli_16(r, shft) _mm_srli_epi16(r, shft)
|
|
97
|
+
#define simd_srai_16(r, shft) _mm_srai_epi16(r, shft)
|
|
98
|
+
#define simd_slli_32(r, shft) _mm_slli_epi32(r, shft)
|
|
99
|
+
#define simd_srli_32(r, shft) _mm_srli_epi32(r, shft)
|
|
100
|
+
#define simd_srai_32(r, shft) _mm_srai_epi32(r, shft)
|
|
101
|
+
#define simd_slli_64(r, shft) _mm_slli_epi64(r, shft)
|
|
102
|
+
#define simd_srli_64(r, shft) _mm_srli_epi64(r, shft)
|
|
103
|
+
#define simd_sll_64(r, shft_reg) _mm_sll_epi64(r, shft_reg)
|
|
104
|
+
#define simd_srl_64(r, shft_reg) _mm_srl_epi64(r, shft_reg)
|
|
105
|
+
#define simd_packus_16(a, b) _mm_packus_epi16(b, a)
|
|
106
|
+
#define simd_pack_16(a, b) \
|
|
107
|
+
_mm_packus_epi16(simd_andc(b, simd_himask_16), simd_andc(a, simd_himask_16))
|
|
108
|
+
#define simd_mergeh_8(a, b) _mm_unpackhi_epi8(b, a)
|
|
109
|
+
#define simd_mergeh_16(a, b) _mm_unpackhi_epi16(b, a)
|
|
110
|
+
#define simd_mergeh_32(a, b) _mm_unpackhi_epi32(b, a)
|
|
111
|
+
#define simd_mergeh_64(a, b) _mm_unpackhi_epi64(b, a)
|
|
112
|
+
#define simd_mergel_8(a, b) _mm_unpacklo_epi8(b, a)
|
|
113
|
+
#define simd_mergel_16(a, b) _mm_unpacklo_epi16(b, a)
|
|
114
|
+
#define simd_mergel_32(a, b) _mm_unpacklo_epi32(b, a)
|
|
115
|
+
#define simd_mergel_64(a, b) _mm_unpacklo_epi64(b, a)
|
|
116
|
+
#define simd_eq_8(a, b) _mm_cmpeq_epi8(a, b)
|
|
117
|
+
#define simd_eq_16(a, b) _mm_cmpeq_epi16(a, b)
|
|
118
|
+
#define simd_eq_32(a, b) _mm_cmpeq_epi32(a, b)
|
|
119
|
+
|
|
120
|
+
#define simd_max_8(a, b) _mm_max_epu8(a, b)
|
|
121
|
+
|
|
122
|
+
#define simd_slli_128(r, shft) \
|
|
123
|
+
((shft) % 8 == 0 ? _mm_slli_si128(r, (shft)/8) : \
|
|
124
|
+
(shft) >= 64 ? simd_slli_64(_mm_slli_si128(r, 8), (shft) - 64) : \
|
|
125
|
+
simd_or(simd_slli_64(r, shft), _mm_slli_si128(simd_srli_64(r, 64-(shft)), 8)))
|
|
126
|
+
|
|
127
|
+
#define simd_srli_128(r, shft) \
|
|
128
|
+
((shft) % 8 == 0 ? _mm_srli_si128(r, (shft)/8) : \
|
|
129
|
+
(shft) >= 64 ? simd_srli_64(_mm_srli_si128(r, 8), (shft) - 64) : \
|
|
130
|
+
simd_or(simd_srli_64(r, shft), _mm_srli_si128(simd_slli_64(r, 64-(shft)), 8)))
|
|
131
|
+
|
|
132
|
+
#define simd_sll_128(r, shft) \
|
|
133
|
+
simd_or(simd_sll_64(r, shft), \
|
|
134
|
+
simd_or(_mm_slli_si128(simd_sll_64(r, simd_sub_32(shft, sisd_from_int(64))), 8), \
|
|
135
|
+
_mm_slli_si128(simd_srl_64(r, simd_sub_32(sisd_from_int(64), shft)), 8)))
|
|
136
|
+
|
|
137
|
+
#define simd_srl_128(r, shft) \
|
|
138
|
+
simd_or(simd_srl_64(r, shft), \
|
|
139
|
+
simd_or(_mm_srli_si128(simd_srl_64(r, simd_sub_32(shft, sisd_from_int(64))), 8), \
|
|
140
|
+
_mm_srli_si128(simd_sll_64(r, simd_sub_32(sisd_from_int(64), shft)), 8)))
|
|
141
|
+
|
|
142
|
+
#define sisd_sll(r, shft) simd_sll_128(r, shft)
|
|
143
|
+
#define sisd_srl(r, shft) simd_srl_128(r, shft)
|
|
144
|
+
#define sisd_slli(r, shft) simd_slli_128(r, shft)
|
|
145
|
+
#define sisd_srli(r, shft) simd_srli_128(r, shft)
|
|
146
|
+
#define sisd_add(a, b) simd_add_128(a, b)
|
|
147
|
+
#define sisd_sub(a, b) simd_sub_128(a, b)
|
|
148
|
+
|
|
149
|
+
#define sisd_store_aligned(r, addr) _mm_store_si128(addr, r)
|
|
150
|
+
#define sisd_store_unaligned(r, addr) _mm_storeu_si128(addr, r)
|
|
151
|
+
#define sisd_load_aligned(addr) _mm_load_si128(addr)
|
|
152
|
+
#ifndef USE_LDDQU
|
|
153
|
+
#define sisd_load_unaligned(addr) _mm_loadu_si128(addr)
|
|
154
|
+
#endif
|
|
155
|
+
#ifdef USE_LDDQU
|
|
156
|
+
#define sisd_load_unaligned(addr) _mm_lddqu_si128(addr)
|
|
157
|
+
#endif
|
|
158
|
+
|
|
159
|
+
|
|
160
|
+
|
|
161
|
+
#define simd_const_32(n) _mm_set1_epi32(n)
|
|
162
|
+
#define simd_const_16(n) _mm_set1_epi16(n)
|
|
163
|
+
#define simd_const_8(n) _mm_set1_epi8(n)
|
|
164
|
+
#define simd_const_4(n) _mm_set1_epi8((n)<<4|(n))
|
|
165
|
+
#define simd_const_2(n) simd_const_4((n)<<2|n)
|
|
166
|
+
#define simd_const_1(n) \
|
|
167
|
+
(n==0 ? simd_const_8(0): simd_const_8(-1))
|
|
168
|
+
|
|
169
|
+
#define simd_pack_16_ll(a, b) simd_pack_16(a, b)
|
|
170
|
+
#define simd_pack_16_hh(a, b) \
|
|
171
|
+
simd_pack_16(simd_srli_16(a, 8), simd_srli_16(b, 8))
|
|
172
|
+
|
|
173
|
+
|
|
174
|
+
static inline
|
|
175
|
+
SIMD_type simd_add_2(SIMD_type a, SIMD_type b)
|
|
176
|
+
{
|
|
177
|
+
SIMD_type c1 = simd_xor(a,b);
|
|
178
|
+
SIMD_type borrow = simd_and(a,b);
|
|
179
|
+
SIMD_type c2 = simd_xor(c1,(sisd_slli(borrow,1)));
|
|
180
|
+
return simd_if(simd_himask_2,c2,c1);
|
|
181
|
+
}
|
|
182
|
+
#define simd_add_4(a, b)\
|
|
183
|
+
simd_if(simd_himask_8, simd_add_8(simd_and(a,simd_himask_8),simd_and(b,simd_himask_8))\
|
|
184
|
+
,simd_add_8(simd_andc(a,simd_himask_8),simd_andc(b,simd_himask_8)))
|
|
185
|
+
|
|
186
|
+
#define simd_srli_2(r, sh)\
|
|
187
|
+
simd_and(simd_srli_32(r,sh),simd_const_2(3>>sh))
|
|
188
|
+
|
|
189
|
+
#define simd_srli_4(r, sh)\
|
|
190
|
+
simd_and(simd_srli_32(r,sh),simd_const_4(15>>sh))
|
|
191
|
+
#define simd_srli_8(r, sh)\
|
|
192
|
+
simd_and(simd_srli_32(r,sh),simd_const_8(255>>sh))
|
|
193
|
+
|
|
194
|
+
#define simd_slli_2(r, sh)\
|
|
195
|
+
simd_and(simd_slli_32(r,sh),simd_const_2((3<<sh)&3))
|
|
196
|
+
|
|
197
|
+
#define simd_slli_4(r, sh)\
|
|
198
|
+
simd_and(simd_slli_32(r,sh),simd_const_4((15<<sh)&15))
|
|
199
|
+
#define simd_slli_8(r, sh)\
|
|
200
|
+
(sh == 1 ? simd_add_8(r,r):\
|
|
201
|
+
simd_and(simd_slli_32(r,sh),simd_const_8(char((255<<sh) &255))))
|
|
202
|
+
|
|
203
|
+
|
|
204
|
+
|
|
205
|
+
|
|
206
|
+
#define simd_mergeh_4(a,b)\
|
|
207
|
+
simd_mergeh_8(simd_if(simd_himask_8,a,simd_srli_8(b,4)),\
|
|
208
|
+
simd_if(simd_himask_8,simd_slli_8(a,4),b))
|
|
209
|
+
#define simd_mergel_4(a,b)\
|
|
210
|
+
simd_mergel_8(simd_if(simd_himask_8,a,simd_srli_8(b,4)),\
|
|
211
|
+
simd_if(simd_himask_8,simd_slli_8(a,4),b))
|
|
212
|
+
#define simd_mergeh_2(a,b)\
|
|
213
|
+
simd_mergeh_4(simd_if(simd_himask_4,a,simd_srli_4(b,2)),\
|
|
214
|
+
simd_if(simd_himask_4,simd_slli_4(a,2),b))
|
|
215
|
+
#define simd_mergel_2(a,b)\
|
|
216
|
+
simd_mergel_4(simd_if(simd_himask_4,a,simd_srli_4(b,2)),\
|
|
217
|
+
simd_if(simd_himask_4,simd_slli_4(a,2),b))
|
|
218
|
+
#define simd_mergeh_1(a,b)\
|
|
219
|
+
simd_mergeh_2(simd_if(simd_himask_2,a,simd_srli_2(b,1)),\
|
|
220
|
+
simd_if(simd_himask_2,simd_slli_2(a,1),b))
|
|
221
|
+
#define simd_mergel_1(a,b)\
|
|
222
|
+
simd_mergel_2(simd_if(simd_himask_2,a,simd_srli_2(b,1)),\
|
|
223
|
+
simd_if(simd_himask_2,simd_slli_2(a,1),b))
|
|
224
|
+
|
|
225
|
+
#define sisd_to_int(x) _mm_cvtsi128_si32(x)
|
|
226
|
+
|
|
227
|
+
#define sisd_from_int(n) _mm_cvtsi32_si128(n)
|
|
228
|
+
|
|
229
|
+
static inline int simd_all_true_8(SIMD_type v) {
|
|
230
|
+
return _mm_movemask_epi8(v) == 0xFFFF;
|
|
231
|
+
}
|
|
232
|
+
|
|
233
|
+
static inline int simd_any_true_8(SIMD_type v) {
|
|
234
|
+
return _mm_movemask_epi8(v) != 0;
|
|
235
|
+
}
|
|
236
|
+
|
|
237
|
+
static inline int simd_any_sign_bit_8(SIMD_type v) {
|
|
238
|
+
return _mm_movemask_epi8(v) != 0;
|
|
239
|
+
}
|
|
240
|
+
|
|
241
|
+
#define simd_all_eq_8(v1, v2) simd_all_true_8(_mm_cmpeq_epi8(v1, v2))
|
|
242
|
+
#define simd_all_le_8(v1, v2) \
|
|
243
|
+
simd_all_eq_8(simd_max_8(v1, v2), v2)
|
|
244
|
+
|
|
245
|
+
#define simd_all_signed_gt_8(v1, v2) simd_all_true_8(_mm_cmpgt_epi8(v1, v2))
|
|
246
|
+
|
|
247
|
+
#define simd_cmpgt_8(v1,v2) _mm_cmpgt_epi8(v1, v2)
|
|
248
|
+
|
|
249
|
+
static inline int bitblock_has_bit(SIMD_type v) {
|
|
250
|
+
return !simd_all_true_8(simd_eq_8(v, simd_const_8(0)));
|
|
251
|
+
}
|
|
252
|
+
|
|
253
|
+
/* Packed test operation of SSE4. */
|
|
254
|
+
static inline int sisd_ptest(SIMD_type v, SIMD_type mask) {
|
|
255
|
+
return !simd_all_true_8(simd_eq_8(simd_and(v, mask), simd_const_8(0)));
|
|
256
|
+
}
|
|
257
|
+
|
|
258
|
+
|
|
259
|
+
|
|
260
|
+
#define bitblock_test_bit(blk, n) \
|
|
261
|
+
sisd_to_int(sisd_srli(sisd_slli(blk, ((BLOCKSIZE-1)-(n))), BLOCKSIZE-1))
|
|
262
|
+
|
|
263
|
+
#define simd_pack_2(a,b)\
|
|
264
|
+
simd_pack_4(simd_if(simd_himask_2,sisd_srli(a,1),a),\
|
|
265
|
+
simd_if(simd_himask_2,sisd_srli(b,1),b))
|
|
266
|
+
#define simd_pack_4(a,b)\
|
|
267
|
+
simd_pack_8(simd_if(simd_himask_4,sisd_srli(a,2),a),\
|
|
268
|
+
simd_if(simd_himask_4,sisd_srli(b,2),b))
|
|
269
|
+
#define simd_pack_8(a,b)\
|
|
270
|
+
simd_pack_16(simd_if(simd_himask_8,sisd_srli(a,4),a),\
|
|
271
|
+
simd_if(simd_himask_8,sisd_srli(b,4),b))
|
|
272
|
+
|
|
273
|
+
#ifndef simd_add_2_xx
|
|
274
|
+
#define simd_add_2_xx(v1, v2) simd_add_2(v1, v2)
|
|
275
|
+
#endif
|
|
276
|
+
|
|
277
|
+
#ifndef simd_add_2_xl
|
|
278
|
+
#define simd_add_2_xl(v1, v2) simd_add_2(v1, simd_andc(v2, simd_himask_2))
|
|
279
|
+
#endif
|
|
280
|
+
|
|
281
|
+
#ifndef simd_add_2_xh
|
|
282
|
+
#define simd_add_2_xh(v1, v2) simd_add_2(v1, simd_srli_2(v2, 1))
|
|
283
|
+
#endif
|
|
284
|
+
|
|
285
|
+
#ifndef simd_add_2_lx
|
|
286
|
+
#define simd_add_2_lx(v1, v2) simd_add_2(simd_andc(v1, simd_himask_2), v2)
|
|
287
|
+
#endif
|
|
288
|
+
|
|
289
|
+
#ifndef simd_add_2_ll
|
|
290
|
+
#define simd_add_2_ll(v1, v2) simd_add_8(simd_andc(v1, simd_himask_2), simd_andc(v2, simd_himask_2))
|
|
291
|
+
#endif
|
|
292
|
+
|
|
293
|
+
#ifndef simd_add_2_lh
|
|
294
|
+
#define simd_add_2_lh(v1, v2) simd_add_8(simd_andc(v1, simd_himask_2), simd_srli_2(v2, 1))
|
|
295
|
+
#endif
|
|
296
|
+
|
|
297
|
+
#ifndef simd_add_2_hx
|
|
298
|
+
#define simd_add_2_hx(v1, v2) simd_add_2(simd_srli_2(v1, 1), v2)
|
|
299
|
+
#endif
|
|
300
|
+
|
|
301
|
+
#ifndef simd_add_2_hl
|
|
302
|
+
#define simd_add_2_hl(v1, v2) simd_add_8(simd_srli_2(v1, 1), simd_andc(v2, simd_himask_2))
|
|
303
|
+
#endif
|
|
304
|
+
|
|
305
|
+
#ifndef simd_add_2_hh
|
|
306
|
+
#define simd_add_2_hh(v1, v2) simd_add_8(simd_srli_2(v1, 1), simd_srli_2(v2, 1))
|
|
307
|
+
#endif
|
|
308
|
+
|
|
309
|
+
#ifndef simd_add_4_xx
|
|
310
|
+
#define simd_add_4_xx(v1, v2) simd_add_4(v1, v2)
|
|
311
|
+
#endif
|
|
312
|
+
|
|
313
|
+
#ifndef simd_add_4_xl
|
|
314
|
+
#define simd_add_4_xl(v1, v2) simd_add_4(v1, simd_andc(v2, simd_himask_4))
|
|
315
|
+
#endif
|
|
316
|
+
|
|
317
|
+
#ifndef simd_add_4_xh
|
|
318
|
+
#define simd_add_4_xh(v1, v2) simd_add_4(v1, simd_srli_4(v2, 2))
|
|
319
|
+
#endif
|
|
320
|
+
|
|
321
|
+
#ifndef simd_add_4_lx
|
|
322
|
+
#define simd_add_4_lx(v1, v2) simd_add_4(simd_andc(v1, simd_himask_4), v2)
|
|
323
|
+
#endif
|
|
324
|
+
|
|
325
|
+
#ifndef simd_add_4_ll
|
|
326
|
+
#define simd_add_4_ll(v1, v2) simd_add_8(simd_andc(v1, simd_himask_4), simd_andc(v2, simd_himask_4))
|
|
327
|
+
#endif
|
|
328
|
+
|
|
329
|
+
#ifndef simd_add_4_lh
|
|
330
|
+
#define simd_add_4_lh(v1, v2) simd_add_8(simd_andc(v1, simd_himask_4), simd_srli_4(v2, 2))
|
|
331
|
+
#endif
|
|
332
|
+
|
|
333
|
+
#ifndef simd_add_4_hx
|
|
334
|
+
#define simd_add_4_hx(v1, v2) simd_add_4(simd_srli_4(v1, 2), v2)
|
|
335
|
+
#endif
|
|
336
|
+
|
|
337
|
+
#ifndef simd_add_4_hl
|
|
338
|
+
#define simd_add_4_hl(v1, v2) simd_add_8(simd_srli_4(v1, 2), simd_andc(v2, simd_himask_4))
|
|
339
|
+
#endif
|
|
340
|
+
|
|
341
|
+
#ifndef simd_add_4_hh
|
|
342
|
+
#define simd_add_4_hh(v1, v2) simd_add_8(simd_srli_4(v1, 2), simd_srli_4(v2, 2))
|
|
343
|
+
#endif
|
|
344
|
+
|
|
345
|
+
#ifndef simd_add_8_xx
|
|
346
|
+
#define simd_add_8_xx(v1, v2) simd_add_8(v1, v2)
|
|
347
|
+
#endif
|
|
348
|
+
|
|
349
|
+
#ifndef simd_add_8_xl
|
|
350
|
+
#define simd_add_8_xl(v1, v2) simd_add_8(v1, simd_andc(v2, simd_himask_8))
|
|
351
|
+
#endif
|
|
352
|
+
|
|
353
|
+
#ifndef simd_add_8_xh
|
|
354
|
+
#define simd_add_8_xh(v1, v2) simd_add_8(v1, simd_srli_8(v2, 4))
|
|
355
|
+
#endif
|
|
356
|
+
|
|
357
|
+
#ifndef simd_add_8_lx
|
|
358
|
+
#define simd_add_8_lx(v1, v2) simd_add_8(simd_andc(v1, simd_himask_8), v2)
|
|
359
|
+
#endif
|
|
360
|
+
|
|
361
|
+
#ifndef simd_add_8_ll
|
|
362
|
+
#define simd_add_8_ll(v1, v2) simd_add_8(simd_andc(v1, simd_himask_8), simd_andc(v2, simd_himask_8))
|
|
363
|
+
#endif
|
|
364
|
+
|
|
365
|
+
#ifndef simd_add_8_lh
|
|
366
|
+
#define simd_add_8_lh(v1, v2) simd_add_8(simd_andc(v1, simd_himask_8), simd_srli_8(v2, 4))
|
|
367
|
+
#endif
|
|
368
|
+
|
|
369
|
+
#ifndef simd_add_8_hx
|
|
370
|
+
#define simd_add_8_hx(v1, v2) simd_add_8(simd_srli_8(v1, 4), v2)
|
|
371
|
+
#endif
|
|
372
|
+
|
|
373
|
+
#ifndef simd_add_8_hl
|
|
374
|
+
#define simd_add_8_hl(v1, v2) simd_add_8(simd_srli_8(v1, 4), simd_andc(v2, simd_himask_8))
|
|
375
|
+
#endif
|
|
376
|
+
|
|
377
|
+
#ifndef simd_add_8_hh
|
|
378
|
+
#define simd_add_8_hh(v1, v2) simd_add_8(simd_srli_8(v1, 4), simd_srli_8(v2, 4))
|
|
379
|
+
#endif
|
|
380
|
+
|
|
381
|
+
#ifndef simd_add_16_xx
|
|
382
|
+
#define simd_add_16_xx(v1, v2) simd_add_16(v1, v2)
|
|
383
|
+
#endif
|
|
384
|
+
|
|
385
|
+
#ifndef simd_add_16_xl
|
|
386
|
+
#define simd_add_16_xl(v1, v2) simd_add_16(v1, simd_andc(v2, simd_himask_16))
|
|
387
|
+
#endif
|
|
388
|
+
|
|
389
|
+
#ifndef simd_add_16_xh
|
|
390
|
+
#define simd_add_16_xh(v1, v2) simd_add_16(v1, simd_srli_16(v2, 8))
|
|
391
|
+
#endif
|
|
392
|
+
|
|
393
|
+
#ifndef simd_add_16_lx
|
|
394
|
+
#define simd_add_16_lx(v1, v2) simd_add_16(simd_andc(v1, simd_himask_16), v2)
|
|
395
|
+
#endif
|
|
396
|
+
|
|
397
|
+
#ifndef simd_add_16_ll
|
|
398
|
+
#define simd_add_16_ll(v1, v2) simd_add_16(simd_andc(v1, simd_himask_16), simd_andc(v2, simd_himask_16))
|
|
399
|
+
#endif
|
|
400
|
+
|
|
401
|
+
#ifndef simd_add_16_lh
|
|
402
|
+
#define simd_add_16_lh(v1, v2) simd_add_16(simd_andc(v1, simd_himask_16), simd_srli_16(v2, 8))
|
|
403
|
+
#endif
|
|
404
|
+
|
|
405
|
+
#ifndef simd_add_16_hx
|
|
406
|
+
#define simd_add_16_hx(v1, v2) simd_add_16(simd_srli_16(v1, 8), v2)
|
|
407
|
+
#endif
|
|
408
|
+
|
|
409
|
+
#ifndef simd_add_16_hl
|
|
410
|
+
#define simd_add_16_hl(v1, v2) simd_add_16(simd_srli_16(v1, 8), simd_andc(v2, simd_himask_16))
|
|
411
|
+
#endif
|
|
412
|
+
|
|
413
|
+
#ifndef simd_add_16_hh
|
|
414
|
+
#define simd_add_16_hh(v1, v2) simd_add_16(simd_srli_16(v1, 8), simd_srli_16(v2, 8))
|
|
415
|
+
#endif
|
|
416
|
+
|
|
417
|
+
#ifndef simd_add_32_xx
|
|
418
|
+
#define simd_add_32_xx(v1, v2) simd_add_32(v1, v2)
|
|
419
|
+
#endif
|
|
420
|
+
|
|
421
|
+
#ifndef simd_add_32_xl
|
|
422
|
+
#define simd_add_32_xl(v1, v2) simd_add_32(v1, simd_andc(v2, simd_himask_32))
|
|
423
|
+
#endif
|
|
424
|
+
|
|
425
|
+
#ifndef simd_add_32_xh
|
|
426
|
+
#define simd_add_32_xh(v1, v2) simd_add_32(v1, simd_srli_32(v2, 16))
|
|
427
|
+
#endif
|
|
428
|
+
|
|
429
|
+
#ifndef simd_add_32_lx
|
|
430
|
+
#define simd_add_32_lx(v1, v2) simd_add_32(simd_andc(v1, simd_himask_32), v2)
|
|
431
|
+
#endif
|
|
432
|
+
|
|
433
|
+
#ifndef simd_add_32_ll
|
|
434
|
+
#define simd_add_32_ll(v1, v2) simd_add_32(simd_andc(v1, simd_himask_32), simd_andc(v2, simd_himask_32))
|
|
435
|
+
#endif
|
|
436
|
+
|
|
437
|
+
#ifndef simd_add_32_lh
|
|
438
|
+
#define simd_add_32_lh(v1, v2) simd_add_32(simd_andc(v1, simd_himask_32), simd_srli_32(v2, 16))
|
|
439
|
+
#endif
|
|
440
|
+
|
|
441
|
+
#ifndef simd_add_32_hx
|
|
442
|
+
#define simd_add_32_hx(v1, v2) simd_add_32(simd_srli_32(v1, 16), v2)
|
|
443
|
+
#endif
|
|
444
|
+
|
|
445
|
+
#ifndef simd_add_32_hl
|
|
446
|
+
#define simd_add_32_hl(v1, v2) simd_add_32(simd_srli_32(v1, 16), simd_andc(v2, simd_himask_32))
|
|
447
|
+
#endif
|
|
448
|
+
|
|
449
|
+
#ifndef simd_add_32_hh
|
|
450
|
+
#define simd_add_32_hh(v1, v2) simd_add_32(simd_srli_32(v1, 16), simd_srli_32(v2, 16))
|
|
451
|
+
#endif
|
|
452
|
+
|
|
453
|
+
#ifndef simd_add_64_xx
|
|
454
|
+
#define simd_add_64_xx(v1, v2) simd_add_64(v1, v2)
|
|
455
|
+
#endif
|
|
456
|
+
|
|
457
|
+
#ifndef simd_add_64_xl
|
|
458
|
+
#define simd_add_64_xl(v1, v2) simd_add_64(v1, simd_andc(v2, simd_himask_64))
|
|
459
|
+
#endif
|
|
460
|
+
|
|
461
|
+
#ifndef simd_add_64_xh
|
|
462
|
+
#define simd_add_64_xh(v1, v2) simd_add_64(v1, simd_srli_64(v2, 32))
|
|
463
|
+
#endif
|
|
464
|
+
|
|
465
|
+
#ifndef simd_add_64_lx
|
|
466
|
+
#define simd_add_64_lx(v1, v2) simd_add_64(simd_andc(v1, simd_himask_64), v2)
|
|
467
|
+
#endif
|
|
468
|
+
|
|
469
|
+
#ifndef simd_add_64_ll
|
|
470
|
+
#define simd_add_64_ll(v1, v2) simd_add_64(simd_andc(v1, simd_himask_64), simd_andc(v2, simd_himask_64))
|
|
471
|
+
#endif
|
|
472
|
+
|
|
473
|
+
#ifndef simd_add_64_lh
|
|
474
|
+
#define simd_add_64_lh(v1, v2) simd_add_64(simd_andc(v1, simd_himask_64), simd_srli_64(v2, 32))
|
|
475
|
+
#endif
|
|
476
|
+
|
|
477
|
+
#ifndef simd_add_64_hx
|
|
478
|
+
#define simd_add_64_hx(v1, v2) simd_add_64(simd_srli_64(v1, 32), v2)
|
|
479
|
+
#endif
|
|
480
|
+
|
|
481
|
+
#ifndef simd_add_64_hl
|
|
482
|
+
#define simd_add_64_hl(v1, v2) simd_add_64(simd_srli_64(v1, 32), simd_andc(v2, simd_himask_64))
|
|
483
|
+
#endif
|
|
484
|
+
|
|
485
|
+
#ifndef simd_add_64_hh
|
|
486
|
+
#define simd_add_64_hh(v1, v2) simd_add_64(simd_srli_64(v1, 32), simd_srli_64(v2, 32))
|
|
487
|
+
#endif
|
|
488
|
+
|
|
489
|
+
#ifndef simd_add_128_xx
|
|
490
|
+
#define simd_add_128_xx(v1, v2) simd_add_128(v1, v2)
|
|
491
|
+
#endif
|
|
492
|
+
|
|
493
|
+
#ifndef simd_add_128_xl
|
|
494
|
+
#define simd_add_128_xl(v1, v2) simd_add_128(v1, simd_andc(v2, simd_himask_128))
|
|
495
|
+
#endif
|
|
496
|
+
|
|
497
|
+
#ifndef simd_add_128_xh
|
|
498
|
+
#define simd_add_128_xh(v1, v2) simd_add_128(v1, simd_srli_128(v2, 64))
|
|
499
|
+
#endif
|
|
500
|
+
|
|
501
|
+
#ifndef simd_add_128_lx
|
|
502
|
+
#define simd_add_128_lx(v1, v2) simd_add_128(simd_andc(v1, simd_himask_128), v2)
|
|
503
|
+
#endif
|
|
504
|
+
|
|
505
|
+
#ifndef simd_add_128_ll
|
|
506
|
+
#define simd_add_128_ll(v1, v2) simd_add_128(simd_andc(v1, simd_himask_128), simd_andc(v2, simd_himask_128))
|
|
507
|
+
#endif
|
|
508
|
+
|
|
509
|
+
#ifndef simd_add_128_lh
|
|
510
|
+
#define simd_add_128_lh(v1, v2) simd_add_128(simd_andc(v1, simd_himask_128), simd_srli_128(v2, 64))
|
|
511
|
+
#endif
|
|
512
|
+
|
|
513
|
+
#ifndef simd_add_128_hx
|
|
514
|
+
#define simd_add_128_hx(v1, v2) simd_add_128(simd_srli_128(v1, 64), v2)
|
|
515
|
+
#endif
|
|
516
|
+
|
|
517
|
+
#ifndef simd_add_128_hl
|
|
518
|
+
#define simd_add_128_hl(v1, v2) simd_add_128(simd_srli_128(v1, 64), simd_andc(v2, simd_himask_128))
|
|
519
|
+
#endif
|
|
520
|
+
|
|
521
|
+
#ifndef simd_add_128_hh
|
|
522
|
+
#define simd_add_128_hh(v1, v2) simd_add_128(simd_srli_128(v1, 64), simd_srli_128(v2, 64))
|
|
523
|
+
#endif
|
|
524
|
+
|
|
525
|
+
#ifndef simd_pack_2_xx
|
|
526
|
+
#define simd_pack_2_xx(v1, v2) simd_pack_2(v1, v2)
|
|
527
|
+
#endif
|
|
528
|
+
|
|
529
|
+
#ifndef simd_pack_2_xl
|
|
530
|
+
#define simd_pack_2_xl(v1, v2) simd_pack_2(v1, v2)
|
|
531
|
+
#endif
|
|
532
|
+
|
|
533
|
+
#ifndef simd_pack_2_xh
|
|
534
|
+
#define simd_pack_2_xh(v1, v2) simd_pack_2(v1, simd_srli_16(v2, 1))
|
|
535
|
+
#endif
|
|
536
|
+
|
|
537
|
+
#ifndef simd_pack_2_lx
|
|
538
|
+
#define simd_pack_2_lx(v1, v2) simd_pack_2(v1, v2)
|
|
539
|
+
#endif
|
|
540
|
+
|
|
541
|
+
#ifndef simd_pack_2_ll
|
|
542
|
+
#define simd_pack_2_ll(v1, v2) simd_pack_2(v1, v2)
|
|
543
|
+
#endif
|
|
544
|
+
|
|
545
|
+
#ifndef simd_pack_2_lh
|
|
546
|
+
#define simd_pack_2_lh(v1, v2) simd_pack_2(v1, simd_srli_16(v2, 1))
|
|
547
|
+
#endif
|
|
548
|
+
|
|
549
|
+
#ifndef simd_pack_2_hx
|
|
550
|
+
#define simd_pack_2_hx(v1, v2) simd_pack_2(simd_srli_16(v1, 1), v2)
|
|
551
|
+
#endif
|
|
552
|
+
|
|
553
|
+
#ifndef simd_pack_2_hl
|
|
554
|
+
#define simd_pack_2_hl(v1, v2) simd_pack_2(simd_srli_16(v1, 1), v2)
|
|
555
|
+
#endif
|
|
556
|
+
|
|
557
|
+
#ifndef simd_pack_2_hh
|
|
558
|
+
#define simd_pack_2_hh(v1, v2) simd_pack_2(simd_srli_16(v1, 1), simd_srli_16(v2, 1))
|
|
559
|
+
#endif
|
|
560
|
+
|
|
561
|
+
#ifndef simd_pack_4_xx
|
|
562
|
+
#define simd_pack_4_xx(v1, v2) simd_pack_4(v1, v2)
|
|
563
|
+
#endif
|
|
564
|
+
|
|
565
|
+
#ifndef simd_pack_4_xl
|
|
566
|
+
#define simd_pack_4_xl(v1, v2) simd_pack_4(v1, v2)
|
|
567
|
+
#endif
|
|
568
|
+
|
|
569
|
+
#ifndef simd_pack_4_xh
|
|
570
|
+
#define simd_pack_4_xh(v1, v2) simd_pack_4(v1, simd_srli_16(v2, 2))
|
|
571
|
+
#endif
|
|
572
|
+
|
|
573
|
+
#ifndef simd_pack_4_lx
|
|
574
|
+
#define simd_pack_4_lx(v1, v2) simd_pack_4(v1, v2)
|
|
575
|
+
#endif
|
|
576
|
+
|
|
577
|
+
#ifndef simd_pack_4_ll
|
|
578
|
+
#define simd_pack_4_ll(v1, v2) simd_pack_4(v1, v2)
|
|
579
|
+
#endif
|
|
580
|
+
|
|
581
|
+
#ifndef simd_pack_4_lh
|
|
582
|
+
#define simd_pack_4_lh(v1, v2) simd_pack_4(v1, simd_srli_16(v2, 2))
|
|
583
|
+
#endif
|
|
584
|
+
|
|
585
|
+
#ifndef simd_pack_4_hx
|
|
586
|
+
#define simd_pack_4_hx(v1, v2) simd_pack_4(simd_srli_16(v1, 2), v2)
|
|
587
|
+
#endif
|
|
588
|
+
|
|
589
|
+
#ifndef simd_pack_4_hl
|
|
590
|
+
#define simd_pack_4_hl(v1, v2) simd_pack_4(simd_srli_16(v1, 2), v2)
|
|
591
|
+
#endif
|
|
592
|
+
|
|
593
|
+
#ifndef simd_pack_4_hh
|
|
594
|
+
#define simd_pack_4_hh(v1, v2) simd_pack_4(simd_srli_16(v1, 2), simd_srli_16(v2, 2))
|
|
595
|
+
#endif
|
|
596
|
+
|
|
597
|
+
#ifndef simd_pack_8_xx
|
|
598
|
+
#define simd_pack_8_xx(v1, v2) simd_pack_8(v1, v2)
|
|
599
|
+
#endif
|
|
600
|
+
|
|
601
|
+
#ifndef simd_pack_8_xl
|
|
602
|
+
#define simd_pack_8_xl(v1, v2) simd_pack_8(v1, v2)
|
|
603
|
+
#endif
|
|
604
|
+
|
|
605
|
+
#ifndef simd_pack_8_xh
|
|
606
|
+
#define simd_pack_8_xh(v1, v2) simd_pack_8(v1, simd_srli_16(v2, 4))
|
|
607
|
+
#endif
|
|
608
|
+
|
|
609
|
+
#ifndef simd_pack_8_lx
|
|
610
|
+
#define simd_pack_8_lx(v1, v2) simd_pack_8(v1, v2)
|
|
611
|
+
#endif
|
|
612
|
+
|
|
613
|
+
#ifndef simd_pack_8_ll
|
|
614
|
+
#define simd_pack_8_ll(v1, v2) simd_pack_8(v1, v2)
|
|
615
|
+
#endif
|
|
616
|
+
|
|
617
|
+
#ifndef simd_pack_8_lh
|
|
618
|
+
#define simd_pack_8_lh(v1, v2) simd_pack_8(v1, simd_srli_16(v2, 4))
|
|
619
|
+
#endif
|
|
620
|
+
|
|
621
|
+
#ifndef simd_pack_8_hx
|
|
622
|
+
#define simd_pack_8_hx(v1, v2) simd_pack_8(simd_srli_16(v1, 4), v2)
|
|
623
|
+
#endif
|
|
624
|
+
|
|
625
|
+
#ifndef simd_pack_8_hl
|
|
626
|
+
#define simd_pack_8_hl(v1, v2) simd_pack_8(simd_srli_16(v1, 4), v2)
|
|
627
|
+
#endif
|
|
628
|
+
|
|
629
|
+
#ifndef simd_pack_8_hh
|
|
630
|
+
#define simd_pack_8_hh(v1, v2) simd_pack_8(simd_srli_16(v1, 4), simd_srli_16(v2, 4))
|
|
631
|
+
#endif
|
|
632
|
+
|
|
633
|
+
#ifndef simd_pack_16_xx
|
|
634
|
+
#define simd_pack_16_xx(v1, v2) simd_pack_16(v1, v2)
|
|
635
|
+
#endif
|
|
636
|
+
|
|
637
|
+
#ifndef simd_pack_16_xl
|
|
638
|
+
#define simd_pack_16_xl(v1, v2) simd_pack_16(v1, v2)
|
|
639
|
+
#endif
|
|
640
|
+
|
|
641
|
+
#ifndef simd_pack_16_xh
|
|
642
|
+
#define simd_pack_16_xh(v1, v2) simd_pack_16(v1, simd_srli_16(v2, 8))
|
|
643
|
+
#endif
|
|
644
|
+
|
|
645
|
+
#ifndef simd_pack_16_lx
|
|
646
|
+
#define simd_pack_16_lx(v1, v2) simd_pack_16(v1, v2)
|
|
647
|
+
#endif
|
|
648
|
+
|
|
649
|
+
#ifndef simd_pack_16_ll
|
|
650
|
+
#define simd_pack_16_ll(v1, v2) simd_pack_16(v1, v2)
|
|
651
|
+
#endif
|
|
652
|
+
|
|
653
|
+
#ifndef simd_pack_16_lh
|
|
654
|
+
#define simd_pack_16_lh(v1, v2) simd_pack_16(v1, simd_srli_16(v2, 8))
|
|
655
|
+
#endif
|
|
656
|
+
|
|
657
|
+
#ifndef simd_pack_16_hx
|
|
658
|
+
#define simd_pack_16_hx(v1, v2) simd_pack_16(simd_srli_16(v1, 8), v2)
|
|
659
|
+
#endif
|
|
660
|
+
|
|
661
|
+
#ifndef simd_pack_16_hl
|
|
662
|
+
#define simd_pack_16_hl(v1, v2) simd_pack_16(simd_srli_16(v1, 8), v2)
|
|
663
|
+
#endif
|
|
664
|
+
|
|
665
|
+
#ifndef simd_pack_16_hh
|
|
666
|
+
//#define simd_pack_16_hh(v1, v2) simd_pack_16(simd_srli_16(v1, 8), simd_srli_16(v2, 8))
|
|
667
|
+
//Masking performned by simd_pack_16 is unnecessary.
|
|
668
|
+
#define simd_pack_16_hh(v1, v2) _mm_packus_epi16(simd_srli_16(v1, 8), simd_srli_16(v2, 8))
|
|
669
|
+
#endif
|
|
670
|
+
|
|
671
|
+
|
|
672
|
+
// Splat the first 16-bit int into all positions.
|
|
673
|
+
static inline SIMD_type simd_splat_16(SIMD_type x) {
|
|
674
|
+
SIMD_type t = _mm_shufflelo_epi16(x,0);
|
|
675
|
+
return _mm_shuffle_epi32(t,0);
|
|
676
|
+
}
|
|
677
|
+
|
|
678
|
+
// Splat the first 32-bit int into all positions.
|
|
679
|
+
static inline SIMD_type simd_splat_32(SIMD_type x) {
|
|
680
|
+
return _mm_shuffle_epi32(x,0);
|
|
681
|
+
}
|
|
682
|
+
|
|
683
|
+
|
|
684
|
+
void print_bit_block(char * var_name, SIMD_type v) {
|
|
685
|
+
union {SIMD_type vec; unsigned char elems[8];} x;
|
|
686
|
+
x.vec = v;
|
|
687
|
+
unsigned char c;//, bit_reversed;
|
|
688
|
+
size_t i;
|
|
689
|
+
printf("%20s = ", var_name);
|
|
690
|
+
for (i = 0; i < sizeof(SIMD_type); i++) {
|
|
691
|
+
c = x.elems[i];
|
|
692
|
+
printf("%02X ", c);
|
|
693
|
+
}
|
|
694
|
+
printf("\n");
|
|
695
|
+
}
|
|
696
|
+
|
|
697
|
+
static inline int bitblock_bit_count(SIMD_type v) {
|
|
698
|
+
//int bit_count = 0;
|
|
699
|
+
SIMD_type cts_2 = simd_add_2_lh(v, v);
|
|
700
|
+
SIMD_type cts_4 = simd_add_4_lh(cts_2, cts_2);
|
|
701
|
+
SIMD_type cts_8 = simd_add_8_lh(cts_4, cts_4);
|
|
702
|
+
SIMD_type cts_64 = _mm_sad_epu8(cts_8, simd_const_8(0));
|
|
703
|
+
/* SIMD_type cts_128 = simd_add_128_lh(cts_64, cts_64) */;
|
|
704
|
+
SIMD_type cts_128 = simd_add_64(cts_64, sisd_srli(cts_64,64));
|
|
705
|
+
return (int) sisd_to_int(cts_128);
|
|
706
|
+
}
|
|
707
|
+
|
|
708
|
+
#define sb_op(x, n) ((x)>>(n))
|
|
709
|
+
#define sf_op(x, n) ((x)<<(n))
|
|
710
|
+
#ifdef __GNUC__
|
|
711
|
+
#define cfzl __builtin_ctzl
|
|
712
|
+
#endif
|
|
713
|
+
#ifdef _MSC_VER
|
|
714
|
+
#include <intrin.h>
|
|
715
|
+
#pragma intrinsic(_BitScanForward)
|
|
716
|
+
// precondition: x > 0
|
|
717
|
+
static inline unsigned long cfzl(unsigned long x) {
|
|
718
|
+
unsigned long zeroes;
|
|
719
|
+
_BitScanForward(&zeroes, x);
|
|
720
|
+
return zeroes;
|
|
721
|
+
}
|
|
722
|
+
#endif
|
|
723
|
+
|
|
724
|
+
static inline int count_forward_zeroes(SIMD_type bits) {
|
|
725
|
+
union {SIMD_type vec; unsigned long elems[sizeof(SIMD_type)/sizeof(long)];} v;
|
|
726
|
+
v.vec = bits;
|
|
727
|
+
if (v.elems[0] != 0) return cfzl(v.elems[0]);
|
|
728
|
+
else if (v.elems[1] != 0) return LONG_BIT + cfzl(v.elems[1]);
|
|
729
|
+
#ifdef _MSC_VER
|
|
730
|
+
else if (v.elems[2] != 0) return 2*LONG_BIT + cfzl(v.elems[2]);
|
|
731
|
+
else if (v.elems[3] != 0) return 3*LONG_BIT + cfzl(v.elems[3]);
|
|
732
|
+
#endif
|
|
733
|
+
#ifndef _MSC_VER
|
|
734
|
+
#if LONG_BIT < 64
|
|
735
|
+
else if (v.elems[2] != 0) return 2*LONG_BIT + cfzl(v.elems[2]);
|
|
736
|
+
else if (v.elems[3] != 0) return 3*LONG_BIT + cfzl(v.elems[3]);
|
|
737
|
+
#endif
|
|
738
|
+
#endif
|
|
739
|
+
else return 8*sizeof(SIMD_type);
|
|
740
|
+
}
|
|
741
|
+
|
|
742
|
+
#ifdef ADC_128_VIA_GEN_REG
|
|
743
|
+
// 128-bit add with carry
|
|
744
|
+
// (rslt, carryout) = x + y + carryin
|
|
745
|
+
// where x = (x2, x1), y = (y2, y1), rslt = (rslt2, rslt1)
|
|
746
|
+
#define double_int64_adc(x1, x2, y1, y2, rslt1, rslt2, carry) \
|
|
747
|
+
__asm__ ("sahf\n\t" \
|
|
748
|
+
"adc %[e1], %[z1]\n\t" \
|
|
749
|
+
"adc %[e2], %[z2]\n\t" \
|
|
750
|
+
"lahf\n\t" \
|
|
751
|
+
: [z1] "=r" (rslt1), [z2] "=r" (rslt2), [carry] "=a" (carry) \
|
|
752
|
+
: "[z1]" (x1), "[z2]" (x2), \
|
|
753
|
+
[e1] "r" (y1), [e2] "r" (y2), \
|
|
754
|
+
"[carry]" (carry) \
|
|
755
|
+
: "cc")
|
|
756
|
+
|
|
757
|
+
static inline SIMD_type adc128(SIMD_type first, SIMD_type second, int &carry)
|
|
758
|
+
{
|
|
759
|
+
union {__m128i bitblock;
|
|
760
|
+
uint64_t int64[2];} rslt;
|
|
761
|
+
|
|
762
|
+
union {__m128i bitblock;
|
|
763
|
+
uint64_t int64[2];} x;
|
|
764
|
+
|
|
765
|
+
union {__m128i bitblock;
|
|
766
|
+
uint64_t int64[2];} y;
|
|
767
|
+
|
|
768
|
+
x.bitblock = first;
|
|
769
|
+
y.bitblock = second;
|
|
770
|
+
|
|
771
|
+
double_int64_adc(x.int64[0], x.int64[1], y.int64[0], y.int64[1],
|
|
772
|
+
rslt.int64[0], rslt.int64[1], carry);
|
|
773
|
+
|
|
774
|
+
return rslt.bitblock;
|
|
775
|
+
}
|
|
776
|
+
#endif
|
|
777
|
+
|
|
778
|
+
#ifndef ADC_128_VIA_GEN_REG
|
|
779
|
+
static inline void adc128(SIMD_type x, SIMD_type y, SIMD_type * carry, SIMD_type *sum)
|
|
780
|
+
{
|
|
781
|
+
/* Carries are always generated if both high bits are 1. */
|
|
782
|
+
SIMD_type gen = simd_and(x, y);
|
|
783
|
+
|
|
784
|
+
/* Carries may propagate if either high bit is 1. */
|
|
785
|
+
SIMD_type prop = simd_or(x, y);
|
|
786
|
+
|
|
787
|
+
/* Partial add without carry for high 64. */
|
|
788
|
+
SIMD_type partial = simd_add_64(simd_add_64(x, y), *carry);
|
|
789
|
+
|
|
790
|
+
/* Carry for high 64 */
|
|
791
|
+
SIMD_type c1 = sisd_slli(simd_srli_64(simd_or(gen, simd_andc(prop, partial)), 63), 64);
|
|
792
|
+
|
|
793
|
+
/* Final sum */
|
|
794
|
+
*sum = simd_add_64(c1, partial);
|
|
795
|
+
|
|
796
|
+
/* Carry out */
|
|
797
|
+
*carry = sisd_srli(simd_or(gen, simd_andc(prop, *sum)), 127);
|
|
798
|
+
|
|
799
|
+
}
|
|
800
|
+
|
|
801
|
+
static inline void sbb128(SIMD_type x, SIMD_type y, SIMD_type *borrow, SIMD_type *difference)
|
|
802
|
+
{
|
|
803
|
+
/* Borrows are always generated if the high bit of x is 0 and the high bit of y is 1. */
|
|
804
|
+
SIMD_type gen = simd_andc(y, x);
|
|
805
|
+
|
|
806
|
+
/* Borrows may propagate if the high bits of both x and y are 0 or if the high bits of both x and y are 1 . */
|
|
807
|
+
SIMD_type prop = simd_not(simd_xor(x, y));
|
|
808
|
+
|
|
809
|
+
/* Partial sub with borrow for high 64. */
|
|
810
|
+
SIMD_type partial = simd_sub_64(simd_sub_64(x, y), *borrow);
|
|
811
|
+
|
|
812
|
+
/* Borrow for high 64 */
|
|
813
|
+
SIMD_type b1 = sisd_slli(simd_srli_64(simd_or(gen, simd_and(prop, partial)), 63), 64);
|
|
814
|
+
|
|
815
|
+
/* Final difference */
|
|
816
|
+
*difference = simd_sub_64(partial, b1);
|
|
817
|
+
|
|
818
|
+
/* Borrow out */
|
|
819
|
+
*borrow = sisd_srli(simd_or(gen, simd_and(prop, *difference)), 127);
|
|
820
|
+
|
|
821
|
+
}
|
|
822
|
+
#endif
|
|
823
|
+
|
|
824
|
+
static inline SIMD_type advance_with_carry(SIMD_type cursor, SIMD_type &carry)
|
|
825
|
+
{
|
|
826
|
+
SIMD_type shift_out = simd_srli_64(cursor, 63);
|
|
827
|
+
SIMD_type low_bits = simd_mergel_64(shift_out, carry);
|
|
828
|
+
carry = sisd_srli(shift_out, 64);
|
|
829
|
+
return simd_or(simd_add_64(cursor, cursor), low_bits);
|
|
830
|
+
}
|
|
831
|
+
|
|
832
|
+
|
|
833
|
+
|
|
834
|
+
|
|
835
|
+
#endif
|
|
836
|
+
|