react-native-quick-crypto 1.0.19 → 1.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/QuickCrypto.podspec +12 -38
- package/README.md +2 -0
- package/android/CMakeLists.txt +3 -0
- package/cpp/utils/HybridUtils.cpp +39 -77
- package/deps/simdutf/.clang-format +4 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/bug_report.md +62 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/config.yml +1 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/feature_request.md +35 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/standard-issue-template.md +29 -0
- package/deps/simdutf/.github/pull_request_template.md +51 -0
- package/deps/simdutf/.github/workflows/aarch64.yml +39 -0
- package/deps/simdutf/.github/workflows/alpine.yml +27 -0
- package/deps/simdutf/.github/workflows/amalgamation_demos.yml +34 -0
- package/deps/simdutf/.github/workflows/armv7.yml +32 -0
- package/deps/simdutf/.github/workflows/atomic_fuzz.yml +25 -0
- package/deps/simdutf/.github/workflows/cifuzz.yml +37 -0
- package/deps/simdutf/.github/workflows/clangformat.yml +36 -0
- package/deps/simdutf/.github/workflows/debian-latestcxxstandards.yml +40 -0
- package/deps/simdutf/.github/workflows/debian.yml +33 -0
- package/deps/simdutf/.github/workflows/documentation.yml +36 -0
- package/deps/simdutf/.github/workflows/emscripten.yml +19 -0
- package/deps/simdutf/.github/workflows/loongarch64-gcc-14.2.yml +39 -0
- package/deps/simdutf/.github/workflows/macos-latest.yml +29 -0
- package/deps/simdutf/.github/workflows/msys2-clang.yml +48 -0
- package/deps/simdutf/.github/workflows/msys2.yml +50 -0
- package/deps/simdutf/.github/workflows/ppc64le.yml +29 -0
- package/deps/simdutf/.github/workflows/rvv-1024-clang-18.yml +35 -0
- package/deps/simdutf/.github/workflows/rvv-128-clang-17.yml +35 -0
- package/deps/simdutf/.github/workflows/rvv-256-gcc-14.yml +31 -0
- package/deps/simdutf/.github/workflows/s390x.yml +29 -0
- package/deps/simdutf/.github/workflows/selective-amalgamation.yml +29 -0
- package/deps/simdutf/.github/workflows/typos.yml +19 -0
- package/deps/simdutf/.github/workflows/ubuntu22-cxx20.yml +30 -0
- package/deps/simdutf/.github/workflows/ubuntu22.yml +32 -0
- package/deps/simdutf/.github/workflows/ubuntu22_gcc12.yml +27 -0
- package/deps/simdutf/.github/workflows/ubuntu22sani.yml +29 -0
- package/deps/simdutf/.github/workflows/ubuntu24-cxxstandards.yml +34 -0
- package/deps/simdutf/.github/workflows/ubuntu24-unsignedchar.yml +34 -0
- package/deps/simdutf/.github/workflows/ubuntu24.yml +32 -0
- package/deps/simdutf/.github/workflows/ubuntu24sani.yml +36 -0
- package/deps/simdutf/.github/workflows/ubuntu24sani_clang.yml +29 -0
- package/deps/simdutf/.github/workflows/vs17-arm-ci.yml +21 -0
- package/deps/simdutf/.github/workflows/vs17-ci-cxx20.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-ci.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-clang-ci.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-cxxstandards.yml +36 -0
- package/deps/simdutf/AI_USAGE_POLICY.md +56 -0
- package/deps/simdutf/AUTHORS +6 -0
- package/deps/simdutf/CMakeLists.txt +231 -0
- package/deps/simdutf/CONTRIBUTING.md +214 -0
- package/deps/simdutf/CONTRIBUTORS +1 -0
- package/deps/simdutf/Doxyfile +2584 -0
- package/deps/simdutf/LICENSE-APACHE +201 -0
- package/deps/simdutf/LICENSE-MIT +18 -0
- package/deps/simdutf/Makefile.crosscompile +54 -0
- package/deps/simdutf/README-RVV.md +16 -0
- package/deps/simdutf/README.md +2782 -0
- package/deps/simdutf/SECURITY.md +8 -0
- package/deps/simdutf/benchmarks/CMakeLists.txt +101 -0
- package/deps/simdutf/benchmarks/alignment.cpp +150 -0
- package/deps/simdutf/benchmarks/base64/CMakeLists.txt +30 -0
- package/deps/simdutf/benchmarks/base64/benchmark_base64.cpp +875 -0
- package/deps/simdutf/benchmarks/base64/libbase64_spaces.h +49 -0
- package/deps/simdutf/benchmarks/base64/node_base64.h +227 -0
- package/deps/simdutf/benchmarks/base64/openssl3_base64.h +334 -0
- package/deps/simdutf/benchmarks/benchmark.cpp +65 -0
- package/deps/simdutf/benchmarks/benchmark_to_well_formed_utf16.cpp +347 -0
- package/deps/simdutf/benchmarks/competition/.clang-format-ignore +5 -0
- package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.cpp +1276 -0
- package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.h +595 -0
- package/deps/simdutf/benchmarks/competition/README.md +7 -0
- package/deps/simdutf/benchmarks/competition/hoehrmann/hoehrmann.h +91 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16.h +444 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16_tables.h +13183 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/script.py +73 -0
- package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.cpp +738 -0
- package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.h +293 -0
- package/deps/simdutf/benchmarks/competition/u8u16/COPYRIGHT +8 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Makefile +44 -0
- package/deps/simdutf/benchmarks/competition/u8u16/OSL3.0.txt +169 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/BOM_Profiler.h +148 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/i386_timer.h +45 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/ppc_timer.c +34 -0
- package/deps/simdutf/benchmarks/competition/u8u16/README +56 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/config_defs.h +43 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/g4_config.h +27 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/mmx_config.h +16 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/p4_config.h +18 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/p4_ideal_config.h +16 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/spu_config.h +28 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/ssse3_config.h +20 -0
- package/deps/simdutf/benchmarks/competition/u8u16/iconv_u8u16.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/altivec_simd.h +440 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_basic_ops.py +121 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_half_operand_versions.py +158 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_test.py +270 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd.h +141 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_basic.h +216 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_built_in.h +119 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_modified.h +2430 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/outline.txt +39 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/spu_simd.h +421 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/sse_simd.h +836 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/stdint.h +222 -0
- package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_BE.c +4 -0
- package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_LE.c +5 -0
- package/deps/simdutf/benchmarks/competition/u8u16/proto/u8u16.py +390 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/Makefile +18 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/bytelex.h +448 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/charsets/ASCII_EBCDIC.h +284 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.c +1975 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.pdf +0 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.w +2263 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/multiliteral.h +239 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/u8u16.c +232 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/x8x16.c +194 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.c +193 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.h +167 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.c +288 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.h +117 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_g4.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_mmx.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4.c +3 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4_ideal.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_spu.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_ssse3.c +3 -0
- package/deps/simdutf/benchmarks/competition/u8u16/x8x16_p4.c +2 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/LICENSE +23 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/data/test_minimal.txt +44 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/readme.md +106 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_corr_tests.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_example.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_file_conv.sh +14 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_lib.sh +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_sample.sh +8 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_corr_tests.cmd +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_example.cmd +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_file_conv.cmd +14 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_lib.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_sample.cmd +8 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_corr_tests.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_example.cmd +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_file_conv.cmd +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_lib.cmd +10 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_sample.cmd +9 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/html_table.py +25 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/measure.py +94 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/resize.py +20 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_all.cmd +2 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_interm.cmd +1 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/CustomMemcpy.h +75 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/PerfDefs.h +47 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.cpp +17 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.h +76 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/AllProcessors.cpp +35 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.cpp +117 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.h +210 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferDecoder.h +158 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferEncoder.h +104 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorPlugins.h +334 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorSelector.h +186 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.cpp +140 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.h +42 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderProcess.h +100 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/Dfa.h +57 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.cpp +85 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.h +27 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderProcess.h +126 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/ProcessTrivial.h +108 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.cpp +139 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.h +74 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.cpp +65 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.h +91 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/CorrectnessTests.cpp +772 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/Example.cpp +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/FileConverter.cpp +486 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/iconv_sample.c +162 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/utf8lut.h +15 -0
- package/deps/simdutf/benchmarks/competition/utf8sse4/fromutf8-sse.cpp +292 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/LICENSE +23 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/README.md +1503 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/checked.h +335 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/core.h +338 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp11.h +103 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp17.h +103 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/unchecked.h +274 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8.h +34 -0
- package/deps/simdutf/benchmarks/dataset/README.md +155 -0
- package/deps/simdutf/benchmarks/dataset/emoji.txt +204 -0
- package/deps/simdutf/benchmarks/dataset/scripts/utf8type.py +40 -0
- package/deps/simdutf/benchmarks/dataset/wikipedia_mars/Makefile +80 -0
- package/deps/simdutf/benchmarks/dataset/wikipedia_mars/convert_to_utf6.py +20 -0
- package/deps/simdutf/benchmarks/find/CMakeLists.txt +6 -0
- package/deps/simdutf/benchmarks/find/findbenchmark.cpp +63 -0
- package/deps/simdutf/benchmarks/find/findbenchmarker.h +46 -0
- package/deps/simdutf/benchmarks/shortbench.cpp +555 -0
- package/deps/simdutf/benchmarks/src/CMakeLists.txt +52 -0
- package/deps/simdutf/benchmarks/src/apple_arm_events.h +1104 -0
- package/deps/simdutf/benchmarks/src/benchmark.cpp +3899 -0
- package/deps/simdutf/benchmarks/src/benchmark.h +317 -0
- package/deps/simdutf/benchmarks/src/benchmark_base.cpp +144 -0
- package/deps/simdutf/benchmarks/src/benchmark_base.h +98 -0
- package/deps/simdutf/benchmarks/src/cmdline.cpp +176 -0
- package/deps/simdutf/benchmarks/src/cmdline.h +35 -0
- package/deps/simdutf/benchmarks/src/event_counter.h +162 -0
- package/deps/simdutf/benchmarks/src/linux-perf-events.h +104 -0
- package/deps/simdutf/benchmarks/stream.cpp +209 -0
- package/deps/simdutf/benchmarks/threaded.cpp +123 -0
- package/deps/simdutf/cmake/CPM.cmake +1363 -0
- package/deps/simdutf/cmake/JoinPaths.cmake +23 -0
- package/deps/simdutf/cmake/add_cpp_test.cmake +68 -0
- package/deps/simdutf/cmake/simdutf-config.cmake.in +2 -0
- package/deps/simdutf/cmake/simdutf-flags.cmake +26 -0
- package/deps/simdutf/cmake/toolchains-ci/riscv64-linux-gnu.cmake +4 -0
- package/deps/simdutf/cmake/toolchains-dev/README.md +32 -0
- package/deps/simdutf/cmake/toolchains-dev/aarch64.cmake +14 -0
- package/deps/simdutf/cmake/toolchains-dev/loongarch64.cmake +22 -0
- package/deps/simdutf/cmake/toolchains-dev/powerpc64.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/powerpc64le.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/riscv64.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/rvv-spike.cmake +38 -0
- package/deps/simdutf/doc/avx512.png +0 -0
- package/deps/simdutf/doc/logo.png +0 -0
- package/deps/simdutf/doc/logo.svg +165 -0
- package/deps/simdutf/doc/node2023.png +0 -0
- package/deps/simdutf/doc/shortinput.md +78 -0
- package/deps/simdutf/doc/utf16utf8.png +0 -0
- package/deps/simdutf/doc/utf8utf16.png +0 -0
- package/deps/simdutf/doc/widelogo.png +0 -0
- package/deps/simdutf/doxygen.py +50 -0
- package/deps/simdutf/fuzz/.clang-format +9 -0
- package/deps/simdutf/fuzz/CMakeLists.txt +45 -0
- package/deps/simdutf/fuzz/README.md +168 -0
- package/deps/simdutf/fuzz/atomic_base64.cpp +448 -0
- package/deps/simdutf/fuzz/base64.cpp +278 -0
- package/deps/simdutf/fuzz/build.sh +83 -0
- package/deps/simdutf/fuzz/conversion.cpp +669 -0
- package/deps/simdutf/fuzz/helpers/.clang-format-ignore +1 -0
- package/deps/simdutf/fuzz/helpers/common.h +135 -0
- package/deps/simdutf/fuzz/helpers/nameof.hpp +1258 -0
- package/deps/simdutf/fuzz/main.cpp +72 -0
- package/deps/simdutf/fuzz/minimize_and_cleanse.sh +87 -0
- package/deps/simdutf/fuzz/misc.cpp +216 -0
- package/deps/simdutf/fuzz/random_fuzz.sh +154 -0
- package/deps/simdutf/fuzz/roundtrip.cpp +588 -0
- package/deps/simdutf/fuzz/safe_conversion.cpp +104 -0
- package/deps/simdutf/include/simdutf/avx512.h +79 -0
- package/deps/simdutf/include/simdutf/base64_implementation.h +158 -0
- package/deps/simdutf/include/simdutf/base64_tables.h +887 -0
- package/deps/simdutf/include/simdutf/common_defs.h +186 -0
- package/deps/simdutf/include/simdutf/compiler_check.h +50 -0
- package/deps/simdutf/include/simdutf/constexpr_ptr.h +138 -0
- package/deps/simdutf/include/simdutf/encoding_types.h +189 -0
- package/deps/simdutf/include/simdutf/error.h +126 -0
- package/deps/simdutf/include/simdutf/implementation.h +7081 -0
- package/deps/simdutf/include/simdutf/internal/isadetection.h +325 -0
- package/deps/simdutf/include/simdutf/portability.h +285 -0
- package/deps/simdutf/include/simdutf/scalar/ascii.h +86 -0
- package/deps/simdutf/include/simdutf/scalar/atomic_util.h +105 -0
- package/deps/simdutf/include/simdutf/scalar/base64.h +911 -0
- package/deps/simdutf/include/simdutf/scalar/latin1.h +26 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf16/latin1_to_utf16.h +52 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf32/latin1_to_utf32.h +27 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf8/latin1_to_utf8.h +191 -0
- package/deps/simdutf/include/simdutf/scalar/swap_bytes.h +35 -0
- package/deps/simdutf/include/simdutf/scalar/utf16.h +226 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/utf16_to_latin1.h +108 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/valid_utf16_to_latin1.h +40 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/utf16_to_utf32.h +86 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/valid_utf16_to_utf32.h +44 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/utf16_to_utf8.h +295 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/valid_utf16_to_utf8.h +91 -0
- package/deps/simdutf/include/simdutf/scalar/utf32.h +82 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/utf32_to_latin1.h +68 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/valid_utf32_to_latin1.h +67 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/utf32_to_utf16.h +84 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/valid_utf32_to_utf16.h +44 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/utf32_to_utf8.h +142 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/valid_utf32_to_utf8.h +72 -0
- package/deps/simdutf/include/simdutf/scalar/utf8.h +326 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/utf8_to_latin1.h +225 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/valid_utf8_to_latin1.h +87 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/utf8_to_utf16.h +342 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/valid_utf8_to_utf16.h +106 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/utf8_to_utf32.h +299 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/valid_utf8_to_utf32.h +83 -0
- package/deps/simdutf/include/simdutf/simdutf_version.h +26 -0
- package/deps/simdutf/include/simdutf.h +26 -0
- package/deps/simdutf/include/simdutf_c.h +342 -0
- package/deps/simdutf/riscv/Dockerfile +16 -0
- package/deps/simdutf/riscv/README.md +24 -0
- package/deps/simdutf/riscv/remove-docker-station +8 -0
- package/deps/simdutf/riscv/run-docker-station +31 -0
- package/deps/simdutf/scripts/.flake8 +2 -0
- package/deps/simdutf/scripts/Makefile +2 -0
- package/deps/simdutf/scripts/README_ADD_FUNCTION.md +49 -0
- package/deps/simdutf/scripts/add_function.py +330 -0
- package/deps/simdutf/scripts/amalgamation_tests.py +156 -0
- package/deps/simdutf/scripts/base64/Makefile +2 -0
- package/deps/simdutf/scripts/base64/README.md +2 -0
- package/deps/simdutf/scripts/base64/avx512.py +76 -0
- package/deps/simdutf/scripts/base64/neon_decode.py +143 -0
- package/deps/simdutf/scripts/base64/neon_generate_lut.py +101 -0
- package/deps/simdutf/scripts/base64/sse.py +252 -0
- package/deps/simdutf/scripts/base64/sseregular.py +160 -0
- package/deps/simdutf/scripts/base64/sseurl.py +283 -0
- package/deps/simdutf/scripts/base64/table.py +59 -0
- package/deps/simdutf/scripts/base64bench_print.py +145 -0
- package/deps/simdutf/scripts/benchmark-all.py +119 -0
- package/deps/simdutf/scripts/benchmark_print.py +324 -0
- package/deps/simdutf/scripts/check_feature_macros.py +156 -0
- package/deps/simdutf/scripts/check_typos.sh +13 -0
- package/deps/simdutf/scripts/clang_format.sh +35 -0
- package/deps/simdutf/scripts/clang_format_docker.sh +38 -0
- package/deps/simdutf/scripts/common.py +24 -0
- package/deps/simdutf/scripts/compilation_benchmark.py +55 -0
- package/deps/simdutf/scripts/compile_many_variations.sh +64 -0
- package/deps/simdutf/scripts/create_latex_table.py +62 -0
- package/deps/simdutf/scripts/docker/Dockerfile +14 -0
- package/deps/simdutf/scripts/docker/Makefile +9 -0
- package/deps/simdutf/scripts/docker/README.md +30 -0
- package/deps/simdutf/scripts/docker/llvm.gpg +0 -0
- package/deps/simdutf/scripts/ppc64_convert_utf16_to_utf8.py +155 -0
- package/deps/simdutf/scripts/prepare_doxygen.sh +21 -0
- package/deps/simdutf/scripts/release.py +197 -0
- package/deps/simdutf/scripts/shortinputplots.py +97 -0
- package/deps/simdutf/scripts/sse_convert_utf16_to_utf8.py +422 -0
- package/deps/simdutf/scripts/sse_convert_utf32_to_utf16.py +105 -0
- package/deps/simdutf/scripts/sse_utf8_utf16_decode.py +186 -0
- package/deps/simdutf/scripts/sse_validate_utf16le_proof.py +137 -0
- package/deps/simdutf/scripts/sse_validate_utf16le_testcases.py +129 -0
- package/deps/simdutf/scripts/table.py +207 -0
- package/deps/simdutf/scripts/tests/new.txt +33 -0
- package/deps/simdutf/scripts/tests/old.txt +33 -0
- package/deps/simdutf/scripts/tests/results.txt +272 -0
- package/deps/simdutf/simdutf.pc.in +11 -0
- package/deps/simdutf/singleheader/.flake8 +2 -0
- package/deps/simdutf/singleheader/CMakeLists.txt +64 -0
- package/deps/simdutf/singleheader/README-dev.md +81 -0
- package/deps/simdutf/singleheader/README.md +19 -0
- package/deps/simdutf/singleheader/amalgamate.py +513 -0
- package/deps/simdutf/singleheader/amalgamation_demo.c +59 -0
- package/deps/simdutf/singleheader/amalgamation_demo.cpp +54 -0
- package/deps/simdutf/singleheader/test-features.py +262 -0
- package/deps/simdutf/src/CMakeLists.txt +78 -0
- package/deps/simdutf/src/arm64/arm_base64.cpp +791 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf16.cpp +24 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf32.cpp +24 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf8.cpp +70 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_latin1.cpp +61 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf32.cpp +185 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf8.cpp +780 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_latin1.cpp +60 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf16.cpp +208 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf8.cpp +505 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_latin1.cpp +69 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf16.cpp +313 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf32.cpp +179 -0
- package/deps/simdutf/src/arm64/arm_find.cpp +199 -0
- package/deps/simdutf/src/arm64/arm_utf16fix.cpp +185 -0
- package/deps/simdutf/src/arm64/arm_validate_utf16.cpp +165 -0
- package/deps/simdutf/src/arm64/arm_validate_utf32le.cpp +65 -0
- package/deps/simdutf/src/arm64/implementation.cpp +1442 -0
- package/deps/simdutf/src/encoding_types.cpp +67 -0
- package/deps/simdutf/src/error.cpp +3 -0
- package/deps/simdutf/src/fallback/implementation.cpp +589 -0
- package/deps/simdutf/src/generic/ascii_validation.h +50 -0
- package/deps/simdutf/src/generic/base64.h +233 -0
- package/deps/simdutf/src/generic/base64lengths.h +63 -0
- package/deps/simdutf/src/generic/buf_block_reader.h +109 -0
- package/deps/simdutf/src/generic/find.h +75 -0
- package/deps/simdutf/src/generic/utf16/change_endianness.h +24 -0
- package/deps/simdutf/src/generic/utf16/count_code_points_bytemask.h +58 -0
- package/deps/simdutf/src/generic/utf16/to_well_formed.h +93 -0
- package/deps/simdutf/src/generic/utf16/utf32_length_from_utf16.h +15 -0
- package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16.h +35 -0
- package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16_bytemask.h +199 -0
- package/deps/simdutf/src/generic/utf16.h +73 -0
- package/deps/simdutf/src/generic/utf32.h +136 -0
- package/deps/simdutf/src/generic/utf8/utf16_length_from_utf8_bytemask.h +53 -0
- package/deps/simdutf/src/generic/utf8.h +92 -0
- package/deps/simdutf/src/generic/utf8_to_latin1/utf8_to_latin1.h +316 -0
- package/deps/simdutf/src/generic/utf8_to_latin1/valid_utf8_to_latin1.h +78 -0
- package/deps/simdutf/src/generic/utf8_to_utf16/utf8_to_utf16.h +332 -0
- package/deps/simdutf/src/generic/utf8_to_utf16/valid_utf8_to_utf16.h +74 -0
- package/deps/simdutf/src/generic/utf8_to_utf32/utf8_to_utf32.h +318 -0
- package/deps/simdutf/src/generic/utf8_to_utf32/valid_utf8_to_utf32.h +42 -0
- package/deps/simdutf/src/generic/utf8_validation/utf8_lookup4_algorithm.h +223 -0
- package/deps/simdutf/src/generic/utf8_validation/utf8_validator.h +84 -0
- package/deps/simdutf/src/generic/validate_utf16.h +164 -0
- package/deps/simdutf/src/generic/validate_utf32.h +99 -0
- package/deps/simdutf/src/haswell/avx2_base64.cpp +837 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf16.cpp +28 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf32.cpp +20 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf8.cpp +83 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_latin1.cpp +83 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf32.cpp +210 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf8.cpp +602 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_latin1.cpp +116 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf16.cpp +164 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf8.cpp +569 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_latin1.cpp +60 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf16.cpp +195 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf32.cpp +135 -0
- package/deps/simdutf/src/haswell/avx2_utf16fix.cpp +173 -0
- package/deps/simdutf/src/haswell/avx2_validate_utf16.cpp +17 -0
- package/deps/simdutf/src/haswell/implementation.cpp +1447 -0
- package/deps/simdutf/src/icelake/icelake_ascii_validation.inl.cpp +19 -0
- package/deps/simdutf/src/icelake/icelake_base64.inl.cpp +630 -0
- package/deps/simdutf/src/icelake/icelake_common.inl.cpp +37 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf16.inl.cpp +36 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf32.inl.cpp +23 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf8.inl.cpp +107 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_latin1.inl.cpp +103 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf32.inl.cpp +136 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf8.inl.cpp +206 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_latin1.inl.cpp +74 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf16.inl.cpp +338 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf8.inl.cpp +574 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf8_to_latin1.inl.cpp +104 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf8_to_utf16.inl.cpp +75 -0
- package/deps/simdutf/src/icelake/icelake_convert_valid_utf8_to_latin1.inl.cpp +69 -0
- package/deps/simdutf/src/icelake/icelake_find.inl.cpp +146 -0
- package/deps/simdutf/src/icelake/icelake_from_utf8.inl.cpp +266 -0
- package/deps/simdutf/src/icelake/icelake_from_valid_utf8.inl.cpp +136 -0
- package/deps/simdutf/src/icelake/icelake_macros.inl.cpp +143 -0
- package/deps/simdutf/src/icelake/icelake_utf16fix.cpp +138 -0
- package/deps/simdutf/src/icelake/icelake_utf32_validation.inl.cpp +63 -0
- package/deps/simdutf/src/icelake/icelake_utf8_common.inl.cpp +753 -0
- package/deps/simdutf/src/icelake/icelake_utf8_length_from_utf16.inl.cpp +269 -0
- package/deps/simdutf/src/icelake/icelake_utf8_validation.inl.cpp +116 -0
- package/deps/simdutf/src/icelake/implementation.cpp +1903 -0
- package/deps/simdutf/src/implementation.cpp +2526 -0
- package/deps/simdutf/src/lasx/implementation.cpp +1531 -0
- package/deps/simdutf/src/lasx/lasx_base64.cpp +695 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf16.cpp +76 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf32.cpp +55 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf8.cpp +65 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_latin1.cpp +64 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf32.cpp +183 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf8.cpp +550 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_latin1.cpp +73 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf16.cpp +218 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf8.cpp +589 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_latin1.cpp +72 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf16.cpp +296 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf32.cpp +190 -0
- package/deps/simdutf/src/lasx/lasx_find.cpp +64 -0
- package/deps/simdutf/src/lasx/lasx_validate_utf16.cpp +13 -0
- package/deps/simdutf/src/lasx/lasx_validate_utf32le.cpp +84 -0
- package/deps/simdutf/src/lsx/implementation.cpp +1417 -0
- package/deps/simdutf/src/lsx/lsx_base64.cpp +675 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf16.cpp +39 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf32.cpp +27 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf8.cpp +56 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_latin1.cpp +64 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf32.cpp +133 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf8.cpp +518 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_latin1.cpp +66 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf16.cpp +155 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf8.cpp +459 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_latin1.cpp +75 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf16.cpp +291 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf32.cpp +179 -0
- package/deps/simdutf/src/lsx/lsx_find.cpp +60 -0
- package/deps/simdutf/src/lsx/lsx_validate_utf16.cpp +13 -0
- package/deps/simdutf/src/lsx/lsx_validate_utf32le.cpp +68 -0
- package/deps/simdutf/src/ppc64/implementation.cpp +992 -0
- package/deps/simdutf/src/ppc64/ppc64_base64.cpp +480 -0
- package/deps/simdutf/src/ppc64/ppc64_base64_internal_tests.cpp +401 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf16.cpp +12 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf32.cpp +12 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf8.cpp +149 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_latin1.cpp +67 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf32.cpp +87 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf8.cpp +296 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_latin1.cpp +57 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf16.cpp +117 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf8.cpp +166 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_latin1.cpp +69 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf16.cpp +211 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf32.cpp +153 -0
- package/deps/simdutf/src/ppc64/ppc64_utf16_to_utf8_tables.h +1011 -0
- package/deps/simdutf/src/ppc64/ppc64_utf8_length_from_latin1.cpp +37 -0
- package/deps/simdutf/src/ppc64/ppc64_validate_utf16.cpp +19 -0
- package/deps/simdutf/src/ppc64/templates.cpp +91 -0
- package/deps/simdutf/src/rvv/implementation.cpp +138 -0
- package/deps/simdutf/src/rvv/rvv_find.cpp +27 -0
- package/deps/simdutf/src/rvv/rvv_helpers.inl.cpp +23 -0
- package/deps/simdutf/src/rvv/rvv_latin1_to.inl.cpp +71 -0
- package/deps/simdutf/src/rvv/rvv_length_from.inl.cpp +164 -0
- package/deps/simdutf/src/rvv/rvv_utf16_to.inl.cpp +399 -0
- package/deps/simdutf/src/rvv/rvv_utf16fix.cpp +110 -0
- package/deps/simdutf/src/rvv/rvv_utf32_to.inl.cpp +307 -0
- package/deps/simdutf/src/rvv/rvv_utf8_to.inl.cpp +435 -0
- package/deps/simdutf/src/rvv/rvv_validate.inl.cpp +275 -0
- package/deps/simdutf/src/simdutf/arm64/begin.h +2 -0
- package/deps/simdutf/src/simdutf/arm64/bitmanipulation.h +34 -0
- package/deps/simdutf/src/simdutf/arm64/end.h +2 -0
- package/deps/simdutf/src/simdutf/arm64/implementation.h +307 -0
- package/deps/simdutf/src/simdutf/arm64/intrinsics.h +10 -0
- package/deps/simdutf/src/simdutf/arm64/simd.h +547 -0
- package/deps/simdutf/src/simdutf/arm64/simd16-inl.h +403 -0
- package/deps/simdutf/src/simdutf/arm64/simd32-inl.h +129 -0
- package/deps/simdutf/src/simdutf/arm64/simd64-inl.h +28 -0
- package/deps/simdutf/src/simdutf/arm64.h +43 -0
- package/deps/simdutf/src/simdutf/fallback/begin.h +1 -0
- package/deps/simdutf/src/simdutf/fallback/bitmanipulation.h +13 -0
- package/deps/simdutf/src/simdutf/fallback/end.h +1 -0
- package/deps/simdutf/src/simdutf/fallback/implementation.h +331 -0
- package/deps/simdutf/src/simdutf/fallback.h +42 -0
- package/deps/simdutf/src/simdutf/haswell/begin.h +15 -0
- package/deps/simdutf/src/simdutf/haswell/bitmanipulation.h +35 -0
- package/deps/simdutf/src/simdutf/haswell/end.h +13 -0
- package/deps/simdutf/src/simdutf/haswell/implementation.h +338 -0
- package/deps/simdutf/src/simdutf/haswell/intrinsics.h +67 -0
- package/deps/simdutf/src/simdutf/haswell/simd.h +363 -0
- package/deps/simdutf/src/simdutf/haswell/simd16-inl.h +261 -0
- package/deps/simdutf/src/simdutf/haswell/simd32-inl.h +111 -0
- package/deps/simdutf/src/simdutf/haswell/simd64-inl.h +34 -0
- package/deps/simdutf/src/simdutf/haswell.h +63 -0
- package/deps/simdutf/src/simdutf/icelake/begin.h +14 -0
- package/deps/simdutf/src/simdutf/icelake/bitmanipulation.h +44 -0
- package/deps/simdutf/src/simdutf/icelake/end.h +12 -0
- package/deps/simdutf/src/simdutf/icelake/implementation.h +346 -0
- package/deps/simdutf/src/simdutf/icelake/intrinsics.h +138 -0
- package/deps/simdutf/src/simdutf/icelake/simd.h +17 -0
- package/deps/simdutf/src/simdutf/icelake/simd16-inl.h +90 -0
- package/deps/simdutf/src/simdutf/icelake/simd32-inl.h +47 -0
- package/deps/simdutf/src/simdutf/icelake.h +81 -0
- package/deps/simdutf/src/simdutf/lasx/begin.h +8 -0
- package/deps/simdutf/src/simdutf/lasx/bitmanipulation.h +25 -0
- package/deps/simdutf/src/simdutf/lasx/end.h +8 -0
- package/deps/simdutf/src/simdutf/lasx/implementation.h +310 -0
- package/deps/simdutf/src/simdutf/lasx/intrinsics.h +319 -0
- package/deps/simdutf/src/simdutf/lasx/simd.h +551 -0
- package/deps/simdutf/src/simdutf/lasx/simd16-inl.h +234 -0
- package/deps/simdutf/src/simdutf/lasx/simd32-inl.h +74 -0
- package/deps/simdutf/src/simdutf/lasx/simd64-inl.h +52 -0
- package/deps/simdutf/src/simdutf/lasx.h +49 -0
- package/deps/simdutf/src/simdutf/lsx/begin.h +2 -0
- package/deps/simdutf/src/simdutf/lsx/bitmanipulation.h +25 -0
- package/deps/simdutf/src/simdutf/lsx/end.h +2 -0
- package/deps/simdutf/src/simdutf/lsx/implementation.h +309 -0
- package/deps/simdutf/src/simdutf/lsx/intrinsics.h +196 -0
- package/deps/simdutf/src/simdutf/lsx/simd.h +421 -0
- package/deps/simdutf/src/simdutf/lsx/simd16-inl.h +242 -0
- package/deps/simdutf/src/simdutf/lsx/simd32-inl.h +69 -0
- package/deps/simdutf/src/simdutf/lsx/simd64-inl.h +50 -0
- package/deps/simdutf/src/simdutf/lsx.h +52 -0
- package/deps/simdutf/src/simdutf/ppc64/begin.h +1 -0
- package/deps/simdutf/src/simdutf/ppc64/bitmanipulation.h +29 -0
- package/deps/simdutf/src/simdutf/ppc64/end.h +1 -0
- package/deps/simdutf/src/simdutf/ppc64/implementation.h +348 -0
- package/deps/simdutf/src/simdutf/ppc64/intrinsics.h +19 -0
- package/deps/simdutf/src/simdutf/ppc64/simd.h +177 -0
- package/deps/simdutf/src/simdutf/ppc64/simd16-inl.h +327 -0
- package/deps/simdutf/src/simdutf/ppc64/simd32-inl.h +247 -0
- package/deps/simdutf/src/simdutf/ppc64/simd8-inl.h +618 -0
- package/deps/simdutf/src/simdutf/ppc64.h +40 -0
- package/deps/simdutf/src/simdutf/rvv/begin.h +7 -0
- package/deps/simdutf/src/simdutf/rvv/end.h +7 -0
- package/deps/simdutf/src/simdutf/rvv/implementation.h +321 -0
- package/deps/simdutf/src/simdutf/rvv/intrinsics.h +131 -0
- package/deps/simdutf/src/simdutf/rvv.h +41 -0
- package/deps/simdutf/src/simdutf/westmere/begin.h +8 -0
- package/deps/simdutf/src/simdutf/westmere/bitmanipulation.h +37 -0
- package/deps/simdutf/src/simdutf/westmere/end.h +8 -0
- package/deps/simdutf/src/simdutf/westmere/implementation.h +338 -0
- package/deps/simdutf/src/simdutf/westmere/intrinsics.h +38 -0
- package/deps/simdutf/src/simdutf/westmere/simd.h +379 -0
- package/deps/simdutf/src/simdutf/westmere/simd16-inl.h +242 -0
- package/deps/simdutf/src/simdutf/westmere/simd32-inl.h +151 -0
- package/deps/simdutf/src/simdutf/westmere/simd64-inl.h +33 -0
- package/deps/simdutf/src/simdutf/westmere.h +59 -0
- package/deps/simdutf/src/simdutf.cpp +152 -0
- package/deps/simdutf/src/simdutf_c.cpp +525 -0
- package/deps/simdutf/src/tables/utf16_to_utf8_tables.h +768 -0
- package/deps/simdutf/src/tables/utf32_to_utf16_tables.h +53 -0
- package/deps/simdutf/src/tables/utf8_to_utf16_tables.h +826 -0
- package/deps/simdutf/src/westmere/implementation.cpp +1479 -0
- package/deps/simdutf/src/westmere/internal/loader.cpp +7 -0
- package/deps/simdutf/src/westmere/internal/write_v_u16_11bits_to_utf8.cpp +66 -0
- package/deps/simdutf/src/westmere/sse_base64.cpp +672 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf16.cpp +21 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf32.cpp +31 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf8.cpp +71 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_latin1.cpp +70 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf32.cpp +206 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf8.cpp +504 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_latin1.cpp +82 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf16.cpp +209 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf8.cpp +589 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_latin1.cpp +58 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf16.cpp +197 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf32.cpp +141 -0
- package/deps/simdutf/src/westmere/sse_utf16fix.cpp +82 -0
- package/deps/simdutf/src/westmere/sse_validate_utf16.cpp +17 -0
- package/deps/simdutf/tests/CMakeLists.txt +483 -0
- package/deps/simdutf/tests/atomic_base64_tests.cpp +2845 -0
- package/deps/simdutf/tests/base64_tests.cpp +3617 -0
- package/deps/simdutf/tests/basic_fuzzer.cpp +805 -0
- package/deps/simdutf/tests/bele_tests.cpp +182 -0
- package/deps/simdutf/tests/constexpr_base64_tests.cpp +387 -0
- package/deps/simdutf/tests/convert_latin1_to_utf16be_tests.cpp +52 -0
- package/deps/simdutf/tests/convert_latin1_to_utf16le_tests.cpp +80 -0
- package/deps/simdutf/tests/convert_latin1_to_utf32_tests.cpp +66 -0
- package/deps/simdutf/tests/convert_latin1_to_utf8_tests.cpp +120 -0
- package/deps/simdutf/tests/convert_utf16_to_utf8_safe_tests.cpp +203 -0
- package/deps/simdutf/tests/convert_utf16_to_utf8_with_replacement_tests.cpp +276 -0
- package/deps/simdutf/tests/convert_utf16be_to_latin1_tests.cpp +109 -0
- package/deps/simdutf/tests/convert_utf16be_to_latin1_tests_with_errors.cpp +136 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf32_tests.cpp +193 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf32_with_errors_tests.cpp +381 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf8_tests.cpp +259 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf8_with_errors_tests.cpp +266 -0
- package/deps/simdutf/tests/convert_utf16le_to_latin1_tests.cpp +148 -0
- package/deps/simdutf/tests/convert_utf16le_to_latin1_tests_with_errors.cpp +176 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf32_tests.cpp +213 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf32_with_errors_tests.cpp +318 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf8_tests.cpp +343 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf8_with_errors_tests.cpp +271 -0
- package/deps/simdutf/tests/convert_utf32_to_latin1_tests.cpp +111 -0
- package/deps/simdutf/tests/convert_utf32_to_latin1_with_errors_tests.cpp +96 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16be_tests.cpp +148 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16be_with_errors_tests.cpp +192 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16le_tests.cpp +166 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16le_with_errors_tests.cpp +215 -0
- package/deps/simdutf/tests/convert_utf32_to_utf8_tests.cpp +181 -0
- package/deps/simdutf/tests/convert_utf32_to_utf8_with_errors_tests.cpp +261 -0
- package/deps/simdutf/tests/convert_utf8_to_latin1_tests.cpp +516 -0
- package/deps/simdutf/tests/convert_utf8_to_latin1_with_errors_tests.cpp +579 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16be_tests.cpp +412 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16be_with_errors_tests.cpp +480 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16le_tests.cpp +671 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16le_with_errors_tests.cpp +455 -0
- package/deps/simdutf/tests/convert_utf8_to_utf32_tests.cpp +1204 -0
- package/deps/simdutf/tests/convert_utf8_to_utf32_with_errors_tests.cpp +337 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_latin1_tests.cpp +37 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_utf32_tests.cpp +97 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_utf8_tests.cpp +126 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_latin1_tests.cpp +71 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_utf32_tests.cpp +122 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_utf8_tests.cpp +244 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_latin1_tests.cpp +49 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf16be_tests.cpp +92 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf16le_tests.cpp +114 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf8_tests.cpp +109 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_latin1_tests.cpp +84 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf16be_tests.cpp +124 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf16le_tests.cpp +221 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf32_tests.cpp +155 -0
- package/deps/simdutf/tests/count_utf16be.cpp +64 -0
- package/deps/simdutf/tests/count_utf16le.cpp +61 -0
- package/deps/simdutf/tests/count_utf8.cpp +87 -0
- package/deps/simdutf/tests/detect_encodings_tests.cpp +312 -0
- package/deps/simdutf/tests/embed/valid_utf8.txt +1 -0
- package/deps/simdutf/tests/embed_tests.cpp +22 -0
- package/deps/simdutf/tests/find_tests.cpp +77 -0
- package/deps/simdutf/tests/fixed_string_tests.cpp +153 -0
- package/deps/simdutf/tests/helpers/CMakeLists.txt +25 -0
- package/deps/simdutf/tests/helpers/compiletime_conversions.h +222 -0
- package/deps/simdutf/tests/helpers/fixed_string.h +267 -0
- package/deps/simdutf/tests/helpers/random_int.cpp +30 -0
- package/deps/simdutf/tests/helpers/random_int.h +39 -0
- package/deps/simdutf/tests/helpers/random_utf16.cpp +123 -0
- package/deps/simdutf/tests/helpers/random_utf16.h +52 -0
- package/deps/simdutf/tests/helpers/random_utf32.cpp +41 -0
- package/deps/simdutf/tests/helpers/random_utf32.h +40 -0
- package/deps/simdutf/tests/helpers/random_utf8.cpp +93 -0
- package/deps/simdutf/tests/helpers/random_utf8.h +36 -0
- package/deps/simdutf/tests/helpers/test.cpp +231 -0
- package/deps/simdutf/tests/helpers/test.h +193 -0
- package/deps/simdutf/tests/helpers/transcode_test_base.cpp +1257 -0
- package/deps/simdutf/tests/helpers/transcode_test_base.h +683 -0
- package/deps/simdutf/tests/helpers/utf16.h +27 -0
- package/deps/simdutf/tests/installation_tests/find/CMakeLists.txt +43 -0
- package/deps/simdutf/tests/installation_tests/from_fetch/CMakeLists.txt +47 -0
- package/deps/simdutf/tests/internal_tests.cpp +27 -0
- package/deps/simdutf/tests/null_safety_tests.cpp +94 -0
- package/deps/simdutf/tests/random_fuzzer.cpp +779 -0
- package/deps/simdutf/tests/readme_tests.cpp +274 -0
- package/deps/simdutf/tests/reference/CMakeLists.txt +23 -0
- package/deps/simdutf/tests/reference/decode_utf16.h +81 -0
- package/deps/simdutf/tests/reference/decode_utf32.h +47 -0
- package/deps/simdutf/tests/reference/encode_latin1.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_latin1.h +32 -0
- package/deps/simdutf/tests/reference/encode_utf16.cpp +49 -0
- package/deps/simdutf/tests/reference/encode_utf16.h +20 -0
- package/deps/simdutf/tests/reference/encode_utf32.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_utf32.h +36 -0
- package/deps/simdutf/tests/reference/encode_utf8.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_utf8.h +40 -0
- package/deps/simdutf/tests/reference/validate_utf16.cpp +60 -0
- package/deps/simdutf/tests/reference/validate_utf16.h +14 -0
- package/deps/simdutf/tests/reference/validate_utf16_to_latin1.cpp +35 -0
- package/deps/simdutf/tests/reference/validate_utf16_to_latin1.h +13 -0
- package/deps/simdutf/tests/reference/validate_utf32.cpp +27 -0
- package/deps/simdutf/tests/reference/validate_utf32.h +12 -0
- package/deps/simdutf/tests/reference/validate_utf32_to_latin1.cpp +27 -0
- package/deps/simdutf/tests/reference/validate_utf32_to_latin1.h +12 -0
- package/deps/simdutf/tests/reference/validate_utf8.cpp +82 -0
- package/deps/simdutf/tests/reference/validate_utf8.h +11 -0
- package/deps/simdutf/tests/reference/validate_utf8_to_latin1.cpp +43 -0
- package/deps/simdutf/tests/reference/validate_utf8_to_latin1.h +12 -0
- package/deps/simdutf/tests/select_implementation.cpp +43 -0
- package/deps/simdutf/tests/simdutf_c_tests.cpp +244 -0
- package/deps/simdutf/tests/span_tests.cpp +401 -0
- package/deps/simdutf/tests/special_tests.cpp +559 -0
- package/deps/simdutf/tests/straight_c_test.c +187 -0
- package/deps/simdutf/tests/text_encoding_tests.cpp +77 -0
- package/deps/simdutf/tests/to_well_formed_utf16_tests.cpp +377 -0
- package/deps/simdutf/tests/utf8_length_from_utf16_tests.cpp +202 -0
- package/deps/simdutf/tests/validate_ascii_basic_tests.cpp +165 -0
- package/deps/simdutf/tests/validate_ascii_with_errors_tests.cpp +77 -0
- package/deps/simdutf/tests/validate_utf16be_basic_tests.cpp +175 -0
- package/deps/simdutf/tests/validate_utf16be_with_errors_tests.cpp +188 -0
- package/deps/simdutf/tests/validate_utf16le_basic_tests.cpp +268 -0
- package/deps/simdutf/tests/validate_utf16le_with_errors_tests.cpp +274 -0
- package/deps/simdutf/tests/validate_utf32_basic_tests.cpp +92 -0
- package/deps/simdutf/tests/validate_utf32_with_errors_tests.cpp +114 -0
- package/deps/simdutf/tests/validate_utf8_basic_tests.cpp +178 -0
- package/deps/simdutf/tests/validate_utf8_brute_force_tests.cpp +88 -0
- package/deps/simdutf/tests/validate_utf8_puzzler_tests.cpp +33 -0
- package/deps/simdutf/tests/validate_utf8_with_errors_tests.cpp +228 -0
- package/deps/simdutf/tools/CMakeLists.txt +85 -0
- package/deps/simdutf/tools/fastbase64.cpp +250 -0
- package/deps/simdutf/tools/sutf.cpp +556 -0
- package/deps/simdutf/tools/sutf.h +40 -0
- package/package.json +2 -2
|
@@ -0,0 +1,440 @@
|
|
|
1
|
+
/* Idealized SIMD Operations with Altivec, SSE and MMX versions
|
|
2
|
+
Copyright (C) 2006, Robert D. Cameron
|
|
3
|
+
Licensed to International Characters Inc.
|
|
4
|
+
under the Academic Free License version 3.0.
|
|
5
|
+
October 30, 2006 */
|
|
6
|
+
|
|
7
|
+
/*------------------------------------------------------------*/
|
|
8
|
+
|
|
9
|
+
#include <limits.h>
|
|
10
|
+
|
|
11
|
+
typedef vector unsigned short vUInt16;
|
|
12
|
+
typedef vector unsigned int vUInt32;
|
|
13
|
+
typedef vector unsigned char SIMD_type;
|
|
14
|
+
|
|
15
|
+
|
|
16
|
+
#define vec_lvsl1(x) vec_lvsl(x, (unsigned char *) 0)
|
|
17
|
+
#define vec_lvsr1(x) vec_lvsr(x, (unsigned char *) 0)
|
|
18
|
+
|
|
19
|
+
|
|
20
|
+
/*------------------------------------------------------------*/
|
|
21
|
+
/* I. SIMD bitwise logical operations */
|
|
22
|
+
|
|
23
|
+
#define simd_or(b1, b2) vec_or(b1, b2)
|
|
24
|
+
#define simd_and(b1, b2) vec_and(b1, b2)
|
|
25
|
+
#define simd_xor(b1, b2) vec_xor(b1, b2)
|
|
26
|
+
#define simd_nor(b1, b2) vec_nor(b1, b2)
|
|
27
|
+
#define simd_andc(b1, b2) vec_andc(b1, b2)
|
|
28
|
+
#define simd_if(cond, then_val, else_val) vec_sel(else_val, then_val, cond)
|
|
29
|
+
#define simd_not(x) vec_nor(x, x)
|
|
30
|
+
|
|
31
|
+
|
|
32
|
+
/* Idealized operations with direct implementation by built-in
|
|
33
|
+
operations for Altivec. */
|
|
34
|
+
|
|
35
|
+
#define simd_add_8(a, b) vec_vaddubm(a, b)
|
|
36
|
+
#define simd_add_16(a, b) (SIMD_type) vec_vadduhw((vUInt16) a, (vUInt16) b)
|
|
37
|
+
#define simd_add_32(a, b) (SIMD_type) vec_vadduwm((vUInt32) a, (vUInt32) b)
|
|
38
|
+
#define simd_sub_8(a, b) vec_vsububm(a, b)
|
|
39
|
+
#define simd_sub_16(a, b) (SIMD_type) vec_vsubuhm((vUInt16) a, (vUInt16) b)
|
|
40
|
+
#define simd_sub_32(a, b) (SIMD_type) vec_vsubuwm((vUInt32) a, (vUInt32) b)
|
|
41
|
+
#define simd_mult_16(a, b) (SIMD_type) vec_mladd((vUInt16) a, (vUInt16) b, (vUInt16) vec_splat_u8(0))
|
|
42
|
+
#define simd_mergeh_8(v1, v2) vec_vmrghb(v1, v2)
|
|
43
|
+
#define simd_mergeh_16(v1, v2) (SIMD_type) vec_vmrghh((vUInt16) v1, (vUInt16) v2)
|
|
44
|
+
#define simd_mergeh_32(v1, v2) (SIMD_type) vec_vmrghw((vUInt32) v1, (vUInt32) v2)
|
|
45
|
+
#define simd_mergel_8(v1, v2) vec_vmrglb(v1, v2)
|
|
46
|
+
#define simd_mergel_16(v1, v2) (SIMD_type) vec_vmrglh((vUInt16) v1, (vUInt16) v2)
|
|
47
|
+
#define simd_mergel_32(v1, v2) (SIMD_type) vec_vmrglw((vUInt32) v1, (vUInt32) v2)
|
|
48
|
+
#define simd_pack_16(v1, v2) vec_vpkuhum((vUInt16) v1, (vUInt16) v2)
|
|
49
|
+
#define simd_pack_32(v1, v2) (SIMD_type) vec_vpkuwum((vUInt32) v1, (vUInt32) v2)
|
|
50
|
+
#define simd_sll_8(r, shft) vec_vslb(r, shft)
|
|
51
|
+
#define simd_srl_8(r, shft) vec_vsrb(r, shft)
|
|
52
|
+
#define simd_sra_8(r, shft) vec_vsrab(r, shft)
|
|
53
|
+
#define simd_rotl_8(r, shft) vec_vrlb(r, shft)
|
|
54
|
+
#define simd_sll_16(r, shft) (SIMD_type) vec_vslh((vUInt16) r, (vUInt16) shft)
|
|
55
|
+
#define simd_srl_16(r, shft) (SIMD_type) vec_vsrh((vUInt16) r, (vUInt16) shft)
|
|
56
|
+
#define simd_sra_16(r, shft) (SIMD_type) vec_vsrah((vUInt16) r, (vUInt16) shft)
|
|
57
|
+
#define simd_rotl_16(r, shft) (SIMD_type) vec_vrlh((vUInt16) r, (vUInt16) shft)
|
|
58
|
+
#define simd_sll_32(r, shft) (SIMD_type) vec_vslw((vUInt32) r, (vUInt32) shft)
|
|
59
|
+
#define simd_srl_32(r, shft) (SIMD_type) vec_vsrw((vUInt32) r, (vUInt32) shft)
|
|
60
|
+
#define simd_sra_32(r, shft) (SIMD_type) vec_vsraw((vUInt32) r, (vUInt32) shft)
|
|
61
|
+
#define simd_rotl_32(r, shft) (SIMD_type) vec_vrlw((vUInt32) r, (vUInt32) shft)
|
|
62
|
+
#define simd_slli_8(r, shft) vec_vslb(r, vec_splat_u8(shft))
|
|
63
|
+
#define simd_srli_8(r, shft) vec_vsrb(r, vec_splat_u8(shft))
|
|
64
|
+
#define simd_srai_8(r, shft) vec_vsrab(r, vec_splat_u8(shft))
|
|
65
|
+
#define simd_rotli_8(r, shft) vec_vrlb(r, vec_splat_u8(shft))
|
|
66
|
+
/* For shifts of 16 or 32, the shift values could be loaded by
|
|
67
|
+
vec_splat_u16 or vec_splat_32. However, using vec_splat_u8
|
|
68
|
+
works as well, as only the low 4 or 5 bits are used. The
|
|
69
|
+
vec_splat_u8 is used to increase the chance that the
|
|
70
|
+
optimizer will find this value already in a register. */
|
|
71
|
+
#define simd_slli_16(r, shft) (SIMD_type) vec_vslh((vUInt16) r, (vUInt16) vec_splat_u8(shft))
|
|
72
|
+
#define simd_srli_16(r, shft) (SIMD_type) vec_vsrh((vUInt16) r, (vUInt16) vec_splat_u8(shft))
|
|
73
|
+
#define simd_srai_16(r, shft) (SIMD_type) vec_vsrah((vUInt16) r, (vUInt16) vec_splat_u8(shft))
|
|
74
|
+
#define simd_rotli_16(r, shft) (SIMD_type) vec_vrlh((vUInt16) r, (vUInt16) vec_splat_u8(shft))
|
|
75
|
+
/* Because only the least significant 5 bits are used in 32 bit
|
|
76
|
+
shifts, shifts of 16 to 31 are equivalent to shifts of -16 to -1.
|
|
77
|
+
Translating to the negative values allows the shift constant to be
|
|
78
|
+
loaded with a single vec_splat_u8. */
|
|
79
|
+
#define splat_shft(shft) vec_splat_u8((shft) >= 16 ? (shft)-32 : (shft))
|
|
80
|
+
#define simd_slli_32(r, shft) (SIMD_type) vec_vslw((vUInt32) r, (vUInt32) splat_shft(shft))
|
|
81
|
+
#define simd_srli_32(r, shft) (SIMD_type) vec_vsrw((vUInt32) r, (vUInt32) splat_shft(shft))
|
|
82
|
+
#define simd_srai_32(r, shft) (SIMD_type) vec_vsraw((vUInt32) r, (vUInt32) splat_shft(shft))
|
|
83
|
+
#define simd_rotli_32(r, shft) (SIMD_type) vec_vrlw((vUInt32) r, (vUInt32) splat_shft(shft))
|
|
84
|
+
#define simd_eq_8(a, b) (SIMD_type) vec_vcmpequb(a, b)
|
|
85
|
+
#define simd_eq_16(a, b) (SIMD_type) vec_vcmpequh((vUInt16) a, (vUInt16) b)
|
|
86
|
+
#define simd_eq_32(a, b) (SIMD_type) vec_vcmpequw((vUInt32) a, (vUInt32) b)
|
|
87
|
+
|
|
88
|
+
#define simd_max_8(a, b) vec_vmaxub(a, b)
|
|
89
|
+
|
|
90
|
+
|
|
91
|
+
#define simd_permute(a, b, c) vec_perm(a, b, c)
|
|
92
|
+
|
|
93
|
+
/* 64-bit and 128-bit add/sub */
|
|
94
|
+
|
|
95
|
+
#define simd_add_64(a, b) \
|
|
96
|
+
(SIMD_type) vec_add(vec_add((vUInt32) a, (vUInt32) b), \
|
|
97
|
+
vec_andc(vec_sld(vec_addc((vUInt32) a, (vUInt32) b), vec_0, 4), \
|
|
98
|
+
(vUInt32) alt_words))
|
|
99
|
+
#define simd_sub_64(a, b) \
|
|
100
|
+
(SIMD_type) vec_sub(vec_sub((vUInt32) a, (vUInt32) b), \
|
|
101
|
+
vec_add(vec_sld(vec_sub((vUInt32) vec_0, vec_subc((vUInt32) a, (vUInt32) b)), vec_0, 4), \
|
|
102
|
+
(vUInt32) alt_words))
|
|
103
|
+
|
|
104
|
+
static inline SIMD_type simd_add_128(SIMD_type a, SIMD_type b) {
|
|
105
|
+
vUInt32 sum1 = vec_add((vUInt32) a, (vUInt32) b);
|
|
106
|
+
vUInt32 carry1 = vec_sld(vec_addc((vUInt32) a, (vUInt32) b), (vUInt32) vec_splat_u8(0), 4);
|
|
107
|
+
vUInt32 sum2 = vec_add(sum1, carry1);
|
|
108
|
+
vUInt32 carry2 = vec_sld(vec_addc(sum1, carry1), (vUInt32) vec_splat_u8(0), 4);
|
|
109
|
+
vUInt32 sum3 = vec_add(sum2, carry2);
|
|
110
|
+
vUInt32 carry3 = vec_sld(vec_addc(sum2, carry2), (vUInt32) vec_splat_u8(0), 4);
|
|
111
|
+
return vec_add(sum3, carry3);
|
|
112
|
+
}
|
|
113
|
+
|
|
114
|
+
|
|
115
|
+
/* Altivec has separate full register shift instructions for
|
|
116
|
+
small shifts < 8 (vec_sll, vec_srl) and for shifts in
|
|
117
|
+
multiples of 8 (vec_slo, vec_sro, vec_sld). The bytealign
|
|
118
|
+
macros handle the mod 8 shift, while vec_sld is used for
|
|
119
|
+
to complete the shift. */
|
|
120
|
+
#define sl_bytealign(r, shft) \
|
|
121
|
+
((shft) % 8 == 0 ? r : vec_sll(r, vec_splat_u8(shft)))
|
|
122
|
+
#define sr_bytealign(r, shft) \
|
|
123
|
+
((shft) % 8 == 0 ? r : vec_srl(r, vec_splat_u8(shft)))
|
|
124
|
+
#define simd_slli_128(r, shft) \
|
|
125
|
+
((shft) < 8 ? sl_bytealign(r, shft):\
|
|
126
|
+
(shft) < 16 ? vec_slo(sl_bytealign(r, shft), vec_splat_u8(shft)) :\
|
|
127
|
+
(shft) >= 112 ? vec_slo(sl_bytealign(r, (shft)-128), vec_splat_u8((shft)-128)):\
|
|
128
|
+
vec_sld(sl_bytealign(r, (shft) % 8), vec_splat_u8(0), (shft) >> 3))
|
|
129
|
+
#define simd_srli_128(r, shft) \
|
|
130
|
+
((shft) < 8 ? sr_bytealign(r, shft):\
|
|
131
|
+
(shft) < 16 ? vec_sro(sr_bytealign(r, shft), vec_splat_u8(shft)) :\
|
|
132
|
+
(shft) >= 112 ? vec_sro(sr_bytealign(r, (shft)-128), vec_splat_u8((shft)-128)):\
|
|
133
|
+
vec_sld(vec_splat_u8(0), sr_bytealign(r, (shft) % 8), 16 - ((shft) >> 3)))
|
|
134
|
+
|
|
135
|
+
/* The vec_splat(r2, 15) ensures that the shift constant is duplicated
|
|
136
|
+
in all bytes prior to vec_sll or vec_srl. */
|
|
137
|
+
#define simd_sll_128(r1, r2) vec_sll(vec_slo(r1, r2), vec_splat(r2, 15))
|
|
138
|
+
#define simd_srl_128(r1, r2) vec_srl(vec_sro(r1, r2), vec_splat(r2, 15))
|
|
139
|
+
|
|
140
|
+
|
|
141
|
+
|
|
142
|
+
#define sisd_store_aligned(r, addr) *((SIMD_type *) (addr)) = r
|
|
143
|
+
#define sisd_load_aligned(addr) ((SIMD_type) *((SIMD_type *) (addr)))
|
|
144
|
+
|
|
145
|
+
|
|
146
|
+
#define simd_pack_16_ll(a, b) simd_pack_16(a, b)
|
|
147
|
+
|
|
148
|
+
#ifndef ALTIVEC_USE_EVEN_INDICES
|
|
149
|
+
#define simd_pack_16_hh(a, b) \
|
|
150
|
+
simd_pack_16(simd_srli_16(a, 8), simd_srli_16(b, 8))
|
|
151
|
+
#endif
|
|
152
|
+
|
|
153
|
+
|
|
154
|
+
#ifdef ALTIVEC_USE_EVEN_INDICES
|
|
155
|
+
#define even_byte_indices vec_add(vec_lvsl1(0), vec_lvsl1(0))
|
|
156
|
+
#define simd_pack_16_hh(a, b) vec_perm(a, b, even_byte_indices)
|
|
157
|
+
#endif
|
|
158
|
+
|
|
159
|
+
|
|
160
|
+
#define sisd_sll(r, shft) simd_sll_128(r, shft)
|
|
161
|
+
#define sisd_srl(r, shft) simd_srl_128(r, shft)
|
|
162
|
+
#define sisd_slli(r, shft) simd_slli_128(r, shft)
|
|
163
|
+
#define sisd_srli(r, shft) simd_srli_128(r, shft)
|
|
164
|
+
#define sisd_add(a, b) simd_add_128(a, b)
|
|
165
|
+
#define sisd_sub(a, b) simd_sub_128(a, b)
|
|
166
|
+
|
|
167
|
+
|
|
168
|
+
|
|
169
|
+
|
|
170
|
+
|
|
171
|
+
#define simd_himask_2 vec_or(vec_splat_u8(10), vec_sl(vec_splat_u8(10), vec_splat_u8(4)))
|
|
172
|
+
#define simd_himask_4 vec_or(vec_splat_u8(12), vec_sl(vec_splat_u8(12), vec_splat_u8(4)))
|
|
173
|
+
#define simd_himask_8 vec_splat_u8(-16)
|
|
174
|
+
|
|
175
|
+
|
|
176
|
+
|
|
177
|
+
#define simd_const_8(n) \
|
|
178
|
+
((n) >= -16 && (n) < 15 ? vec_splat_u8(n):\
|
|
179
|
+
vec_or(vec_sl(vec_splat_u8((n)>>4), vec_splat_u8(4), vec_splat_u8((n)&15))))
|
|
180
|
+
|
|
181
|
+
#define simd_const_16(n) \
|
|
182
|
+
((SIMD_type) vec_splat_u16(n))
|
|
183
|
+
|
|
184
|
+
#define simd_const_32(n) \
|
|
185
|
+
(SIMD_type) ((n) >= -16 && (n) < 15 ? vec_splat_u32(n):\
|
|
186
|
+
vec_or(vec_sl(vec_splat_u32((n)>>4), vec_splat_u32(4), vec_splat_u32((n)&15))))
|
|
187
|
+
|
|
188
|
+
#define simd_const_4(n) \
|
|
189
|
+
vec_or(vec_sl(vec_splat_u8(n), vec_splat_u8(4)), vec_splat_u8(n))
|
|
190
|
+
|
|
191
|
+
#define simd_const_2(n) \
|
|
192
|
+
vec_or(vec_sl(vec_splat_u8(5*(n)), vec_splat_u8(4)), vec_splat_u8(5*(n)))
|
|
193
|
+
|
|
194
|
+
#define simd_const_1(n) \
|
|
195
|
+
(n==0 ? simd_const_8(0): simd_const_8(-1))
|
|
196
|
+
|
|
197
|
+
#define sisd_const(n) vec_sld(vec_splat_u8(0), simd_const_8(n))
|
|
198
|
+
|
|
199
|
+
|
|
200
|
+
static inline int sisd_to_int(SIMD_type x) {
|
|
201
|
+
union {vector signed int vec; signed int elems[4];} xunion;
|
|
202
|
+
xunion.vec = (vector signed int) x;
|
|
203
|
+
return xunion.elems[3];
|
|
204
|
+
}
|
|
205
|
+
|
|
206
|
+
static inline SIMD_type sisd_from_int(unsigned int x) {
|
|
207
|
+
union {SIMD_type vec; unsigned int elems[4];} y;
|
|
208
|
+
y.elems[0] = 0;
|
|
209
|
+
y.elems[1] = 0;
|
|
210
|
+
y.elems[2] = 0;
|
|
211
|
+
y.elems[3] = x;
|
|
212
|
+
return y.vec;
|
|
213
|
+
}
|
|
214
|
+
|
|
215
|
+
#define bitblock_has_bit(blk) vec_any_ne(blk, vec_splat_u8(0))
|
|
216
|
+
|
|
217
|
+
#define simd_all_le_8(v1, v2) vec_vcmpleub(v1, v2)
|
|
218
|
+
static inline int simd_all_signed_gt_8(SIMD_type v1, SIMD_type v2) {
|
|
219
|
+
//#define simd_all_signed_gt_8(v1, v2) \
|
|
220
|
+
return vec_all_gt((vector signed char) v1, (vector signed char) v2);
|
|
221
|
+
}
|
|
222
|
+
|
|
223
|
+
|
|
224
|
+
#define simd_any_sign_bit_8(v) \
|
|
225
|
+
vec_any_lt((vector signed char) v, (vector signed char) vec_splat_u8(0))
|
|
226
|
+
|
|
227
|
+
static inline vector unsigned char bits_per_nybble_table() {
|
|
228
|
+
vector unsigned char zeroes = vec_splat_u8(0);
|
|
229
|
+
vector unsigned char ones = vec_splat_u8(1);
|
|
230
|
+
return simd_add_8
|
|
231
|
+
(simd_add_8(simd_pack_16(zeroes, ones), // 0000000011111111
|
|
232
|
+
simd_mergeh_32(zeroes, ones)), // 0000111100001111
|
|
233
|
+
simd_add_8(simd_mergeh_16(zeroes, ones), // 0011001100110011
|
|
234
|
+
simd_mergeh_8(zeroes, ones))); // 0101010101010101
|
|
235
|
+
// ----------------
|
|
236
|
+
// 0112122312232334
|
|
237
|
+
}
|
|
238
|
+
static inline int bitblock_bit_count(SIMD_type v) {
|
|
239
|
+
union {vector signed int vec; signed int elems[4];} result_count;
|
|
240
|
+
SIMD_type bit_count_tbl = bits_per_nybble_table();
|
|
241
|
+
/* SIMD_type bit_count_tbl = u8u16_control_vector[bits_per_nybble_tbl]; */
|
|
242
|
+
SIMD_type byte_counts;
|
|
243
|
+
byte_counts = vec_add(vec_perm(bit_count_tbl, bit_count_tbl, vec_sr(v, vec_splat_u8(4))),
|
|
244
|
+
vec_perm(bit_count_tbl, bit_count_tbl, v));
|
|
245
|
+
vector unsigned int acc = vec_sum4s(byte_counts, vec_splat_u32(0));
|
|
246
|
+
result_count.vec = vec_sums((vector signed int) acc, vec_splat_s32(0));
|
|
247
|
+
return result_count.elems[3];
|
|
248
|
+
}
|
|
249
|
+
|
|
250
|
+
#define bitblock_test_bit(blk, n) \
|
|
251
|
+
sisd_to_int(sisd_srli(sisd_slli(blk, (n)), BLOCKSIZE-1))
|
|
252
|
+
|
|
253
|
+
|
|
254
|
+
|
|
255
|
+
static inline int count_fwd_zeroes(SIMD_type v) {
|
|
256
|
+
int zeroes;
|
|
257
|
+
union {SIMD_type vec; signed int elems[4];} vu;
|
|
258
|
+
vu.vec = v;
|
|
259
|
+
asm volatile("cntlzw %0, %1\n" : "=r" (zeroes) : "r" (vu.elems[0]));
|
|
260
|
+
if (zeroes < 32) return zeroes;
|
|
261
|
+
asm volatile("cntlzw %0, %1\n" : "=r" (zeroes) : "r" (vu.elems[1]));
|
|
262
|
+
if (zeroes < 32) return zeroes+32;
|
|
263
|
+
asm volatile("cntlzw %0, %1\n" : "=r" (zeroes) : "r" (vu.elems[2]));
|
|
264
|
+
if (zeroes < 32) return zeroes+64;
|
|
265
|
+
asm volatile("cntlzw %0, %1\n" : "=r" (zeroes) : "r" (vu.elems[3]));
|
|
266
|
+
return zeroes+96;
|
|
267
|
+
}
|
|
268
|
+
|
|
269
|
+
|
|
270
|
+
static inline int count_forward_zeroes(SIMD_type bits) {
|
|
271
|
+
union {SIMD_type vec; unsigned long elems[sizeof(SIMD_type)/LONG_BIT];} v;
|
|
272
|
+
v.vec = bits;
|
|
273
|
+
if (v.elems[0] != 0) return __builtin_clzl(v.elems[0]);
|
|
274
|
+
else if (v.elems[1] != 0) return LONG_BIT + __builtin_clzl(v.elems[1]);
|
|
275
|
+
#if LONG_BIT < 64
|
|
276
|
+
else if (v.elems[2] != 0) return 2*LONG_BIT + __builtin_clzl(v.elems[2]);
|
|
277
|
+
else if (v.elems[3] != 0) return 3*LONG_BIT + __builtin_clzl(v.elems[3]);
|
|
278
|
+
#endif
|
|
279
|
+
else return 8*sizeof(SIMD_type);
|
|
280
|
+
}
|
|
281
|
+
|
|
282
|
+
|
|
283
|
+
|
|
284
|
+
|
|
285
|
+
void print_bit_block(char * var_name, SIMD_type v) {
|
|
286
|
+
union {SIMD_type vec; unsigned char elems[16];} x;
|
|
287
|
+
x.vec = v;
|
|
288
|
+
int i;
|
|
289
|
+
printf("%20s = ", var_name);
|
|
290
|
+
for (i = 0; i < 16; i++) {
|
|
291
|
+
printf("%02X ", x.elems[i]);
|
|
292
|
+
}
|
|
293
|
+
printf("\n");
|
|
294
|
+
}
|
|
295
|
+
|
|
296
|
+
|
|
297
|
+
static inline SIMD_type simd_add_2(SIMD_type a, SIMD_type b)
|
|
298
|
+
{
|
|
299
|
+
SIMD_type c1 = simd_xor(a,b);
|
|
300
|
+
SIMD_type borrow = simd_and(a,b);
|
|
301
|
+
SIMD_type c2 = simd_xor(c1,(sisd_slli(borrow,1)));
|
|
302
|
+
return simd_if(simd_himask_2,c2,c1);
|
|
303
|
+
}
|
|
304
|
+
#define simd_add_4(a, b)\
|
|
305
|
+
simd_if(simd_himask_8, simd_add_8(simd_and(a,simd_himask_8),simd_and(b,simd_himask_8))\
|
|
306
|
+
,simd_add_8(simd_andc(a,simd_himask_8),simd_andc(b,simd_himask_8)))
|
|
307
|
+
|
|
308
|
+
#define simd_srli_2(r, sh)\
|
|
309
|
+
simd_and(sisd_srli(r,sh),simd_const_2(3>>sh))
|
|
310
|
+
|
|
311
|
+
#define simd_srli_4(r, sh)\
|
|
312
|
+
simd_and(sisd_srli(r,sh),simd_const_4(15>>sh))
|
|
313
|
+
|
|
314
|
+
|
|
315
|
+
#define simd_add_2_xx(a, b) simd_add_2(a, b)
|
|
316
|
+
#define simd_add_2_xl(a, b) simd_add_2(a, simd_andc(b, simd_himask_2))
|
|
317
|
+
#define simd_add_2_xh(a, b) simd_add_2(a, simd_srli_2(b, 1))
|
|
318
|
+
#define simd_add_2_lx(a, b) simd_add_2(simd_andc(a, simd_himask_2), b)
|
|
319
|
+
#define simd_add_2_ll(a, b) simd_add_2(simd_andc(a, simd_himask_2), simd_andc(b, simd_himask_2))
|
|
320
|
+
#define simd_add_2_lh(a, b) simd_add_2(simd_andc(a, simd_himask_2), simd_srli_2(b, 1))
|
|
321
|
+
#define simd_add_2_hx(a, b) simd_add_2(simd_srli_2(a, 1), b)
|
|
322
|
+
#define simd_add_2_hl(a, b) simd_add_2(simd_srli_2(a, 1), simd_andc(b, simd_himask_2))
|
|
323
|
+
#define simd_add_2_hh(a, b) simd_add_2(simd_srli_2(a, 1), simd_srli_2(b, 1))
|
|
324
|
+
#define simd_add_4_xx(a, b) simd_add_4(a, b)
|
|
325
|
+
#define simd_add_4_xl(a, b) simd_add_4(a, simd_andc(b, simd_himask_4))
|
|
326
|
+
#define simd_add_4_xh(a, b) simd_add_4(a, simd_srli_4(b, 2))
|
|
327
|
+
#define simd_add_4_lx(a, b) simd_add_4(simd_andc(a, simd_himask_4), b)
|
|
328
|
+
#define simd_add_4_ll(a, b) simd_add_4(simd_andc(a, simd_himask_4), simd_andc(b, simd_himask_4))
|
|
329
|
+
#define simd_add_4_lh(a, b) simd_add_4(simd_andc(a, simd_himask_4), simd_srli_4(b, 2))
|
|
330
|
+
#define simd_add_4_hx(a, b) simd_add_4(simd_srli_4(a, 2), b)
|
|
331
|
+
#define simd_add_4_hl(a, b) simd_add_4(simd_srli_4(a, 2), simd_andc(b, simd_himask_4))
|
|
332
|
+
#define simd_add_4_hh(a, b) simd_add_4(simd_srli_4(a, 2), simd_srli_4(b, 2))
|
|
333
|
+
#define simd_add_8_xx(a, b) simd_add_8(a, b)
|
|
334
|
+
#define simd_add_8_xl(a, b) simd_add_8(a, simd_andc(b, simd_himask_8))
|
|
335
|
+
#define simd_add_8_xh(a, b) simd_add_8(a, simd_srli_8(b, 4))
|
|
336
|
+
#define simd_add_8_lx(a, b) simd_add_8(simd_andc(a, simd_himask_8), b)
|
|
337
|
+
#define simd_add_8_ll(a, b) simd_add_8(simd_andc(a, simd_himask_8), simd_andc(b, simd_himask_8))
|
|
338
|
+
#define simd_add_8_lh(a, b) simd_add_8(simd_andc(a, simd_himask_8), simd_srli_8(b, 4))
|
|
339
|
+
#define simd_add_8_hx(a, b) simd_add_8(simd_srli_8(a, 4), b)
|
|
340
|
+
#define simd_add_8_hl(a, b) simd_add_8(simd_srli_8(a, 4), simd_andc(b, simd_himask_8))
|
|
341
|
+
#define simd_add_8_hh(a, b) simd_add_8(simd_srli_8(a, 4), simd_srli_8(b, 4))
|
|
342
|
+
|
|
343
|
+
#define simd_pack_2(a,b)\
|
|
344
|
+
simd_pack_4(simd_if(simd_himask_2,a,sisd_srli(a,1)),\
|
|
345
|
+
simd_if(simd_himask_2,b,sisd_srli(b,1)))
|
|
346
|
+
#define simd_pack_4(a,b)\
|
|
347
|
+
simd_pack_8(simd_if(simd_himask_4,a,sisd_srli(a,2)),\
|
|
348
|
+
simd_if(simd_himask_4,b,sisd_srli(b,2)))
|
|
349
|
+
#define simd_pack_8(a,b)\
|
|
350
|
+
simd_pack_16(simd_if(simd_himask_8,a,sisd_srli(a,4)),\
|
|
351
|
+
simd_if(simd_himask_8,b,sisd_srli(b,4)))
|
|
352
|
+
#define simd_pack_2_xx(a, b) simd_pack_2(a, b)
|
|
353
|
+
#define simd_pack_2_xl(a, b) simd_pack_2(a, b)
|
|
354
|
+
#define simd_pack_2_xh(a, b) simd_pack_2(a, simd_srli_2(b, 1))
|
|
355
|
+
#define simd_pack_2_lx(a, b) simd_pack_2(a, b)
|
|
356
|
+
#define simd_pack_2_ll(a, b) simd_pack_2(a, b)
|
|
357
|
+
#define simd_pack_2_lh(a, b) simd_pack_2(a, simd_srli_2(b, 1))
|
|
358
|
+
#define simd_pack_2_hx(a, b) simd_pack_2(simd_srli_2(a, 1), b)
|
|
359
|
+
#define simd_pack_2_hl(a, b) simd_pack_2(simd_srli_2(a, 1), b)
|
|
360
|
+
#define simd_pack_2_hh(a, b) simd_pack_2(simd_srli_2(a, 1), simd_srli_2(b, 1))
|
|
361
|
+
#define simd_pack_4_xx(a, b) simd_pack_4(a, b)
|
|
362
|
+
#define simd_pack_4_xl(a, b) simd_pack_4(a, b)
|
|
363
|
+
#define simd_pack_4_xh(a, b) simd_pack_4(a, simd_srli_4(b, 2))
|
|
364
|
+
#define simd_pack_4_lx(a, b) simd_pack_4(a, b)
|
|
365
|
+
#define simd_pack_4_ll(a, b) simd_pack_4(a, b)
|
|
366
|
+
#define simd_pack_4_lh(a, b) simd_pack_4(a, simd_srli_4(b, 2))
|
|
367
|
+
#define simd_pack_4_hx(a, b) simd_pack_4(simd_srli_4(a, 2), b)
|
|
368
|
+
#define simd_pack_4_hl(a, b) simd_pack_4(simd_srli_4(a, 2), b)
|
|
369
|
+
#define simd_pack_4_hh(a, b) simd_pack_4(simd_srli_4(a, 2), simd_srli_4(b, 2))
|
|
370
|
+
#define simd_pack_8_xx(a, b) simd_pack_8(a, b)
|
|
371
|
+
#define simd_pack_8_xl(a, b) simd_pack_8(a, b)
|
|
372
|
+
#define simd_pack_8_xh(a, b) simd_pack_8(a, simd_srli_8(b, 4))
|
|
373
|
+
#define simd_pack_8_lx(a, b) simd_pack_8(a, b)
|
|
374
|
+
#define simd_pack_8_ll(a, b) simd_pack_8(a, b)
|
|
375
|
+
#define simd_pack_8_lh(a, b) simd_pack_8(a, simd_srli_8(b, 4))
|
|
376
|
+
#define simd_pack_8_hx(a, b) simd_pack_8(simd_srli_8(a, 4), b)
|
|
377
|
+
#define simd_pack_8_hl(a, b) simd_pack_8(simd_srli_8(a, 4), b)
|
|
378
|
+
#define simd_pack_8_hh(a, b) simd_pack_8(simd_srli_8(a, 4), simd_srli_8(b, 4))
|
|
379
|
+
|
|
380
|
+
static inline
|
|
381
|
+
SIMD_type simd_sub_2(SIMD_type a, SIMD_type b)
|
|
382
|
+
{
|
|
383
|
+
SIMD_type c1 = simd_xor(a,b);
|
|
384
|
+
SIMD_type borrow = simd_andc(b,a);
|
|
385
|
+
SIMD_type c2 = simd_xor(c1,(sisd_slli(borrow,1)));
|
|
386
|
+
return simd_if(simd_himask_2,c2,c1);
|
|
387
|
+
}
|
|
388
|
+
static inline
|
|
389
|
+
SIMD_type simd_srl_2(SIMD_type a, SIMD_type b)
|
|
390
|
+
{
|
|
391
|
+
SIMD_type c1 = simd_or((simd_andc(a,b)),(simd_and(b,sisd_srli(a,1))));
|
|
392
|
+
SIMD_type c2 = simd_andc(a,sisd_slli(b,1));
|
|
393
|
+
return simd_if(simd_himask_2,c2,c1);
|
|
394
|
+
}
|
|
395
|
+
static inline
|
|
396
|
+
SIMD_type simd_sra_2(SIMD_type a, SIMD_type b)
|
|
397
|
+
{
|
|
398
|
+
SIMD_type c1 = simd_or((simd_andc(a,b)),(simd_and(b,sisd_srli(a,1))));
|
|
399
|
+
return simd_if(simd_himask_2,a,c1);
|
|
400
|
+
}
|
|
401
|
+
static inline
|
|
402
|
+
SIMD_type simd_sll_2(SIMD_type a, SIMD_type b)
|
|
403
|
+
{
|
|
404
|
+
SIMD_type c1 = simd_andc(a,b);
|
|
405
|
+
SIMD_type c2 = simd_or((simd_andc(a,(sisd_slli(b,1)))),(simd_and((sisd_slli(b,1)),(sisd_slli(a,1)))));
|
|
406
|
+
return simd_if(simd_himask_2,c2,c1);
|
|
407
|
+
}
|
|
408
|
+
static inline
|
|
409
|
+
SIMD_type simd_rotl_2(SIMD_type a, SIMD_type b)
|
|
410
|
+
{
|
|
411
|
+
SIMD_type c1 = simd_or((simd_andc(a,b)),(simd_and(b,sisd_srli(a,1))));
|
|
412
|
+
SIMD_type c2 = simd_or((simd_andc(a,(sisd_slli(b,1)))),(simd_and((sisd_slli(b,1)),(sisd_slli(a,1)))));
|
|
413
|
+
return simd_if(simd_himask_2,c2,c1);
|
|
414
|
+
}
|
|
415
|
+
|
|
416
|
+
#ifndef simd_sub_4
|
|
417
|
+
inline SIMD_type simd_sub_4(SIMD_type a,SIMD_type b){
|
|
418
|
+
return simd_if(simd_himask_8, simd_sub_8(simd_and(a,simd_himask_8),simd_and(b,simd_himask_8))
|
|
419
|
+
,simd_sub_8(simd_andc(a,simd_himask_8),simd_andc(b,simd_himask_8)));}
|
|
420
|
+
#endif
|
|
421
|
+
|
|
422
|
+
#ifndef simd_sll_4
|
|
423
|
+
inline SIMD_type simd_sll_4(SIMD_type a,SIMD_type b){
|
|
424
|
+
return simd_if(simd_himask_8, simd_sll_8(simd_and(a,simd_himask_8),simd_and(simd_const_4(3),simd_srli_8(b,4)))
|
|
425
|
+
,simd_sll_8(a,simd_and(b,simd_const_8(3))));}
|
|
426
|
+
#endif
|
|
427
|
+
|
|
428
|
+
#ifndef simd_srl_4
|
|
429
|
+
inline SIMD_type simd_srl_4(SIMD_type a,SIMD_type b){
|
|
430
|
+
return simd_if(simd_himask_8, simd_srl_8(a,simd_and(simd_const_4(3),simd_srli_8(b,4)))
|
|
431
|
+
,simd_srl_8(simd_andc(a,simd_himask_8),simd_and(b,simd_const_8(3))));}
|
|
432
|
+
#endif
|
|
433
|
+
|
|
434
|
+
#ifndef simd_rotl_4
|
|
435
|
+
inline SIMD_type simd_rotl_4(SIMD_type a,SIMD_type b){
|
|
436
|
+
return simd_or(simd_sll_4(a,b),simd_srl_4(a,simd_sub_4(simd_const_4(4),b)));}
|
|
437
|
+
#endif
|
|
438
|
+
|
|
439
|
+
|
|
440
|
+
|
|
@@ -0,0 +1,121 @@
|
|
|
1
|
+
#
|
|
2
|
+
# make_basic_ops.py
|
|
3
|
+
#
|
|
4
|
+
# Copyright (C) 2007 Dan Lin, Robert D. Cameron
|
|
5
|
+
# Licensed to International Characters Inc. and Simon Fraser University
|
|
6
|
+
# under the Academic Free License version 3.0
|
|
7
|
+
# Licensed to the public under the Open Software License version 3.0.
|
|
8
|
+
|
|
9
|
+
# make_basic_ops.py generates inline definitions for
|
|
10
|
+
# idealized basic SIMD operations that are not included
|
|
11
|
+
# in the built-in functions.
|
|
12
|
+
ops = ["sub", "add", "sll", "srl", "sra", "pack", "mergeh", "mergel", "rotl"]
|
|
13
|
+
|
|
14
|
+
# 1 for "add" and "sub"
|
|
15
|
+
# 2 for "sll", "srl" and "sra"
|
|
16
|
+
# 3 for "pack"
|
|
17
|
+
# 4 for "mergel" and "mergeh"
|
|
18
|
+
# Note: For new operations added into this file,
|
|
19
|
+
# if different fieldwidths are needed, add more to the following list
|
|
20
|
+
# otherwise share with the operations above
|
|
21
|
+
fws = { 1: [4], 2: [32,16,8,4], 3: [8,4,2], 4: [4,2,1]}
|
|
22
|
+
|
|
23
|
+
ops_immediateshift= ["sll","srl"]
|
|
24
|
+
fws_immediateshift = [2,4,8]
|
|
25
|
+
|
|
26
|
+
|
|
27
|
+
# make the structure of a inline function
|
|
28
|
+
|
|
29
|
+
def make_inline(op,fw,body):
|
|
30
|
+
operation = "simd_%s_%i" % (op,fw)
|
|
31
|
+
return "#ifndef %s\ninline SIMD_type %s(SIMD_type a,SIMD_type b){\n\treturn %s;}\n#endif\n\n" % (operation,operation,body)
|
|
32
|
+
|
|
33
|
+
# this is the main function that generate simd operations in n bit field
|
|
34
|
+
# by using simd operations in 2n bit field
|
|
35
|
+
#
|
|
36
|
+
# Considering that simd_const_64() is not included in simd_built_in operations
|
|
37
|
+
# we use _mm_cvtsi32_si64() as the mask for shift operations in 32 bit field
|
|
38
|
+
# instead of masking the operand twice with simd_himask_32 and smid_const_32()
|
|
39
|
+
#
|
|
40
|
+
# Note: "rotl" has not been tested
|
|
41
|
+
# "srl", "sll" and "sra" in 4 bit field might not be efficient
|
|
42
|
+
# by using 8 bit field operations
|
|
43
|
+
def make_halfsize_defn(op,fw):
|
|
44
|
+
template = "simd_if(simd_himask_"+str(fw*2)+", simd_"+op+"_%i(%s,%s)\n\t,"+"simd_"+op+"_%i(%s,%s))"
|
|
45
|
+
if (op == "add") or (op == "sub"):
|
|
46
|
+
return template % (fw*2, "simd_and(a,simd_himask_"+str(fw*2)+")",
|
|
47
|
+
"simd_and(b,simd_himask_"+str(fw*2)+")",
|
|
48
|
+
fw*2,"simd_andc(a,simd_himask_"+str(fw*2)+")",
|
|
49
|
+
"simd_andc(b,simd_himask_"+str(fw*2)+")")
|
|
50
|
+
elif op == "srl":
|
|
51
|
+
common_part = template % (fw*2,"a","simd_and(simd_const_"+str(fw)+"("+str(fw-1)+"),simd_srli_"+str(fw*2)+"(b,"+str(fw)+"))",
|
|
52
|
+
fw*2,"simd_andc(a,simd_himask_"+str(fw*2)+")","simd_and(%s)")
|
|
53
|
+
if fw == 32:
|
|
54
|
+
return common_part % "_mm_cvtsi32_si64(31),b"
|
|
55
|
+
else:
|
|
56
|
+
return common_part % ("b,simd_const_"+str(fw*2)+"("+str(fw-1)+")")
|
|
57
|
+
elif op == "sll":
|
|
58
|
+
common_part = template % (fw*2, "simd_and(a,simd_himask_"+str(fw*2)+")",
|
|
59
|
+
"simd_and(simd_const_"+str(fw)+"("+str(fw-1)+"),simd_srli_"+str(fw*2)+"(b,"+str(fw)+"))",
|
|
60
|
+
fw*2,"a", "simd_and(%s)")
|
|
61
|
+
if fw == 32:
|
|
62
|
+
return common_part % "_mm_cvtsi32_si64(31),b"
|
|
63
|
+
else:
|
|
64
|
+
return common_part % ("b,simd_const_"+str(fw*2)+"("+str(fw-1)+")")
|
|
65
|
+
elif op == "sra":
|
|
66
|
+
if fw == 32:
|
|
67
|
+
return """simd_if(simd_himask_64(),
|
|
68
|
+
_mm_sra_pi32(a, simd_and(simd_const_32(31),simd_srli_64(b,32))),
|
|
69
|
+
_mm_sra_pi32(a, simd_and(_mm_cvtsi32_si64(31), b)))"""
|
|
70
|
+
else:
|
|
71
|
+
return template % (fw*2,"simd_and(a,simd_himask_"+str(fw*2)+")",
|
|
72
|
+
"simd_and(sisd_srli(b,"+str(fw)+"),simd_const_"+str(fw*2)+"("+str(fw-1)+"))",
|
|
73
|
+
fw*2,"simd_srai_"+str(fw*2)+"(sisd_slli(a,"+str(fw)+"),"+str(fw)+")",
|
|
74
|
+
"simd_and(b,simd_const_"+str(fw*2)+"("+str(fw-1)+"))")
|
|
75
|
+
elif op == "rotl":
|
|
76
|
+
return "simd_or(simd_sll_"+str(fw)+"(a,b),simd_srl_"+str(fw)+"(a,simd_sub_"+str(fw)+"(simd_const_"+str(fw)+"("+str(fw)+"),b)))"
|
|
77
|
+
elif op == "pack":
|
|
78
|
+
return "simd_pack_"+str(fw*2)+"(%s,\n\t%s)" % ("simd_if(simd_himask_"+str(fw)+",sisd_srli(a,"+str(fw/2)+"),a)",
|
|
79
|
+
"simd_if(simd_himask_"+str(fw)+",sisd_srli(b,"+str(fw/2)+"),b)")
|
|
80
|
+
elif op == "mergeh" or op == "mergel":
|
|
81
|
+
return "simd_"+op+"_"+str(fw*2)+"(%s,\n\t%s)" % ("simd_if(simd_himask_"+str(fw*2)+",a,sisd_srli(b,"+str(fw)+"))",
|
|
82
|
+
"simd_if(simd_himask_"+str(fw*2)+",sisd_slli(a,"+str(fw)+"),b)")
|
|
83
|
+
else:
|
|
84
|
+
raise Exception("Bad operator %s" % op)
|
|
85
|
+
|
|
86
|
+
def make_immediateshift_defn(op,fw):
|
|
87
|
+
template = "inline SIMD_type simd_"+op+"i_"+str(fw)+"(SIMD_type r, int sh){\n\t return %s"
|
|
88
|
+
if op== "sll":
|
|
89
|
+
return template % "simd_and(sisd_"+op+"i(r,sh),simd_const_"+str(fw)+"(("+str(2**fw-1)+"<<sh)&"+str(2**fw-1)+"));}\n"
|
|
90
|
+
else:
|
|
91
|
+
return template % "simd_and(sisd_"+op+"i(r,sh),simd_const_"+str(fw)+"("+str(2**fw-1)+">>sh));}\n"
|
|
92
|
+
|
|
93
|
+
def make_all_half_fieldwidth_versions (ops, fws):
|
|
94
|
+
defn_list = ''
|
|
95
|
+
for op in ops_immediateshift:
|
|
96
|
+
for fw in fws_immediateshift:
|
|
97
|
+
defn_list += make_immediateshift_defn(op, fw)
|
|
98
|
+
for op in ops:
|
|
99
|
+
if (op=="add" or op=="sub"):
|
|
100
|
+
for fw in fws[1]:
|
|
101
|
+
defn_list += make_inline(op, fw, make_halfsize_defn(op,fw))
|
|
102
|
+
elif (op=="sll" or op=="srl" or op=="sra" or op=="rotl"):
|
|
103
|
+
for fw in fws[2]:
|
|
104
|
+
defn_list += make_inline(op, fw, make_halfsize_defn(op,fw))
|
|
105
|
+
elif (op=="pack"):
|
|
106
|
+
for fw in fws[3]:
|
|
107
|
+
defn_list += make_inline(op, fw, make_halfsize_defn(op,fw))
|
|
108
|
+
elif (op=="mergeh" or op=="mergel"):
|
|
109
|
+
for fw in fws[4]:
|
|
110
|
+
defn_list += make_inline(op, fw, make_halfsize_defn(op,fw))
|
|
111
|
+
else: raise Exception("Bad operator %s" % op)
|
|
112
|
+
return defn_list
|
|
113
|
+
|
|
114
|
+
def generate_and_write_versions(filename, ops, fws):
|
|
115
|
+
defn_list = make_all_half_fieldwidth_versions (ops, fws)
|
|
116
|
+
file = open(filename, 'w')
|
|
117
|
+
file.write(defn_list)
|
|
118
|
+
file.close()
|
|
119
|
+
|
|
120
|
+
if __name__ == "__main__":
|
|
121
|
+
generate_and_write_versions("mmx_simd_basic.h", ops, fws)
|