react-native-quick-crypto 1.0.19 → 1.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/QuickCrypto.podspec +12 -38
- package/README.md +2 -0
- package/android/CMakeLists.txt +3 -0
- package/cpp/utils/HybridUtils.cpp +39 -77
- package/deps/simdutf/.clang-format +4 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/bug_report.md +62 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/config.yml +1 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/feature_request.md +35 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/standard-issue-template.md +29 -0
- package/deps/simdutf/.github/pull_request_template.md +51 -0
- package/deps/simdutf/.github/workflows/aarch64.yml +39 -0
- package/deps/simdutf/.github/workflows/alpine.yml +27 -0
- package/deps/simdutf/.github/workflows/amalgamation_demos.yml +34 -0
- package/deps/simdutf/.github/workflows/armv7.yml +32 -0
- package/deps/simdutf/.github/workflows/atomic_fuzz.yml +25 -0
- package/deps/simdutf/.github/workflows/cifuzz.yml +37 -0
- package/deps/simdutf/.github/workflows/clangformat.yml +36 -0
- package/deps/simdutf/.github/workflows/debian-latestcxxstandards.yml +40 -0
- package/deps/simdutf/.github/workflows/debian.yml +33 -0
- package/deps/simdutf/.github/workflows/documentation.yml +36 -0
- package/deps/simdutf/.github/workflows/emscripten.yml +19 -0
- package/deps/simdutf/.github/workflows/loongarch64-gcc-14.2.yml +39 -0
- package/deps/simdutf/.github/workflows/macos-latest.yml +29 -0
- package/deps/simdutf/.github/workflows/msys2-clang.yml +48 -0
- package/deps/simdutf/.github/workflows/msys2.yml +50 -0
- package/deps/simdutf/.github/workflows/ppc64le.yml +29 -0
- package/deps/simdutf/.github/workflows/rvv-1024-clang-18.yml +35 -0
- package/deps/simdutf/.github/workflows/rvv-128-clang-17.yml +35 -0
- package/deps/simdutf/.github/workflows/rvv-256-gcc-14.yml +31 -0
- package/deps/simdutf/.github/workflows/s390x.yml +29 -0
- package/deps/simdutf/.github/workflows/selective-amalgamation.yml +29 -0
- package/deps/simdutf/.github/workflows/typos.yml +19 -0
- package/deps/simdutf/.github/workflows/ubuntu22-cxx20.yml +30 -0
- package/deps/simdutf/.github/workflows/ubuntu22.yml +32 -0
- package/deps/simdutf/.github/workflows/ubuntu22_gcc12.yml +27 -0
- package/deps/simdutf/.github/workflows/ubuntu22sani.yml +29 -0
- package/deps/simdutf/.github/workflows/ubuntu24-cxxstandards.yml +34 -0
- package/deps/simdutf/.github/workflows/ubuntu24-unsignedchar.yml +34 -0
- package/deps/simdutf/.github/workflows/ubuntu24.yml +32 -0
- package/deps/simdutf/.github/workflows/ubuntu24sani.yml +36 -0
- package/deps/simdutf/.github/workflows/ubuntu24sani_clang.yml +29 -0
- package/deps/simdutf/.github/workflows/vs17-arm-ci.yml +21 -0
- package/deps/simdutf/.github/workflows/vs17-ci-cxx20.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-ci.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-clang-ci.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-cxxstandards.yml +36 -0
- package/deps/simdutf/AI_USAGE_POLICY.md +56 -0
- package/deps/simdutf/AUTHORS +6 -0
- package/deps/simdutf/CMakeLists.txt +231 -0
- package/deps/simdutf/CONTRIBUTING.md +214 -0
- package/deps/simdutf/CONTRIBUTORS +1 -0
- package/deps/simdutf/Doxyfile +2584 -0
- package/deps/simdutf/LICENSE-APACHE +201 -0
- package/deps/simdutf/LICENSE-MIT +18 -0
- package/deps/simdutf/Makefile.crosscompile +54 -0
- package/deps/simdutf/README-RVV.md +16 -0
- package/deps/simdutf/README.md +2782 -0
- package/deps/simdutf/SECURITY.md +8 -0
- package/deps/simdutf/benchmarks/CMakeLists.txt +101 -0
- package/deps/simdutf/benchmarks/alignment.cpp +150 -0
- package/deps/simdutf/benchmarks/base64/CMakeLists.txt +30 -0
- package/deps/simdutf/benchmarks/base64/benchmark_base64.cpp +875 -0
- package/deps/simdutf/benchmarks/base64/libbase64_spaces.h +49 -0
- package/deps/simdutf/benchmarks/base64/node_base64.h +227 -0
- package/deps/simdutf/benchmarks/base64/openssl3_base64.h +334 -0
- package/deps/simdutf/benchmarks/benchmark.cpp +65 -0
- package/deps/simdutf/benchmarks/benchmark_to_well_formed_utf16.cpp +347 -0
- package/deps/simdutf/benchmarks/competition/.clang-format-ignore +5 -0
- package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.cpp +1276 -0
- package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.h +595 -0
- package/deps/simdutf/benchmarks/competition/README.md +7 -0
- package/deps/simdutf/benchmarks/competition/hoehrmann/hoehrmann.h +91 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16.h +444 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16_tables.h +13183 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/script.py +73 -0
- package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.cpp +738 -0
- package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.h +293 -0
- package/deps/simdutf/benchmarks/competition/u8u16/COPYRIGHT +8 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Makefile +44 -0
- package/deps/simdutf/benchmarks/competition/u8u16/OSL3.0.txt +169 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/BOM_Profiler.h +148 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/i386_timer.h +45 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/ppc_timer.c +34 -0
- package/deps/simdutf/benchmarks/competition/u8u16/README +56 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/config_defs.h +43 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/g4_config.h +27 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/mmx_config.h +16 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/p4_config.h +18 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/p4_ideal_config.h +16 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/spu_config.h +28 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/ssse3_config.h +20 -0
- package/deps/simdutf/benchmarks/competition/u8u16/iconv_u8u16.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/altivec_simd.h +440 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_basic_ops.py +121 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_half_operand_versions.py +158 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_test.py +270 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd.h +141 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_basic.h +216 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_built_in.h +119 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_modified.h +2430 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/outline.txt +39 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/spu_simd.h +421 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/sse_simd.h +836 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/stdint.h +222 -0
- package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_BE.c +4 -0
- package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_LE.c +5 -0
- package/deps/simdutf/benchmarks/competition/u8u16/proto/u8u16.py +390 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/Makefile +18 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/bytelex.h +448 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/charsets/ASCII_EBCDIC.h +284 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.c +1975 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.pdf +0 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.w +2263 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/multiliteral.h +239 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/u8u16.c +232 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/x8x16.c +194 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.c +193 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.h +167 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.c +288 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.h +117 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_g4.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_mmx.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4.c +3 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4_ideal.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_spu.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_ssse3.c +3 -0
- package/deps/simdutf/benchmarks/competition/u8u16/x8x16_p4.c +2 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/LICENSE +23 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/data/test_minimal.txt +44 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/readme.md +106 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_corr_tests.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_example.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_file_conv.sh +14 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_lib.sh +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_sample.sh +8 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_corr_tests.cmd +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_example.cmd +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_file_conv.cmd +14 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_lib.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_sample.cmd +8 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_corr_tests.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_example.cmd +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_file_conv.cmd +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_lib.cmd +10 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_sample.cmd +9 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/html_table.py +25 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/measure.py +94 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/resize.py +20 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_all.cmd +2 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_interm.cmd +1 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/CustomMemcpy.h +75 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/PerfDefs.h +47 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.cpp +17 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.h +76 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/AllProcessors.cpp +35 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.cpp +117 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.h +210 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferDecoder.h +158 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferEncoder.h +104 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorPlugins.h +334 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorSelector.h +186 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.cpp +140 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.h +42 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderProcess.h +100 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/Dfa.h +57 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.cpp +85 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.h +27 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderProcess.h +126 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/ProcessTrivial.h +108 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.cpp +139 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.h +74 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.cpp +65 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.h +91 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/CorrectnessTests.cpp +772 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/Example.cpp +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/FileConverter.cpp +486 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/iconv_sample.c +162 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/utf8lut.h +15 -0
- package/deps/simdutf/benchmarks/competition/utf8sse4/fromutf8-sse.cpp +292 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/LICENSE +23 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/README.md +1503 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/checked.h +335 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/core.h +338 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp11.h +103 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp17.h +103 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/unchecked.h +274 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8.h +34 -0
- package/deps/simdutf/benchmarks/dataset/README.md +155 -0
- package/deps/simdutf/benchmarks/dataset/emoji.txt +204 -0
- package/deps/simdutf/benchmarks/dataset/scripts/utf8type.py +40 -0
- package/deps/simdutf/benchmarks/dataset/wikipedia_mars/Makefile +80 -0
- package/deps/simdutf/benchmarks/dataset/wikipedia_mars/convert_to_utf6.py +20 -0
- package/deps/simdutf/benchmarks/find/CMakeLists.txt +6 -0
- package/deps/simdutf/benchmarks/find/findbenchmark.cpp +63 -0
- package/deps/simdutf/benchmarks/find/findbenchmarker.h +46 -0
- package/deps/simdutf/benchmarks/shortbench.cpp +555 -0
- package/deps/simdutf/benchmarks/src/CMakeLists.txt +52 -0
- package/deps/simdutf/benchmarks/src/apple_arm_events.h +1104 -0
- package/deps/simdutf/benchmarks/src/benchmark.cpp +3899 -0
- package/deps/simdutf/benchmarks/src/benchmark.h +317 -0
- package/deps/simdutf/benchmarks/src/benchmark_base.cpp +144 -0
- package/deps/simdutf/benchmarks/src/benchmark_base.h +98 -0
- package/deps/simdutf/benchmarks/src/cmdline.cpp +176 -0
- package/deps/simdutf/benchmarks/src/cmdline.h +35 -0
- package/deps/simdutf/benchmarks/src/event_counter.h +162 -0
- package/deps/simdutf/benchmarks/src/linux-perf-events.h +104 -0
- package/deps/simdutf/benchmarks/stream.cpp +209 -0
- package/deps/simdutf/benchmarks/threaded.cpp +123 -0
- package/deps/simdutf/cmake/CPM.cmake +1363 -0
- package/deps/simdutf/cmake/JoinPaths.cmake +23 -0
- package/deps/simdutf/cmake/add_cpp_test.cmake +68 -0
- package/deps/simdutf/cmake/simdutf-config.cmake.in +2 -0
- package/deps/simdutf/cmake/simdutf-flags.cmake +26 -0
- package/deps/simdutf/cmake/toolchains-ci/riscv64-linux-gnu.cmake +4 -0
- package/deps/simdutf/cmake/toolchains-dev/README.md +32 -0
- package/deps/simdutf/cmake/toolchains-dev/aarch64.cmake +14 -0
- package/deps/simdutf/cmake/toolchains-dev/loongarch64.cmake +22 -0
- package/deps/simdutf/cmake/toolchains-dev/powerpc64.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/powerpc64le.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/riscv64.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/rvv-spike.cmake +38 -0
- package/deps/simdutf/doc/avx512.png +0 -0
- package/deps/simdutf/doc/logo.png +0 -0
- package/deps/simdutf/doc/logo.svg +165 -0
- package/deps/simdutf/doc/node2023.png +0 -0
- package/deps/simdutf/doc/shortinput.md +78 -0
- package/deps/simdutf/doc/utf16utf8.png +0 -0
- package/deps/simdutf/doc/utf8utf16.png +0 -0
- package/deps/simdutf/doc/widelogo.png +0 -0
- package/deps/simdutf/doxygen.py +50 -0
- package/deps/simdutf/fuzz/.clang-format +9 -0
- package/deps/simdutf/fuzz/CMakeLists.txt +45 -0
- package/deps/simdutf/fuzz/README.md +168 -0
- package/deps/simdutf/fuzz/atomic_base64.cpp +448 -0
- package/deps/simdutf/fuzz/base64.cpp +278 -0
- package/deps/simdutf/fuzz/build.sh +83 -0
- package/deps/simdutf/fuzz/conversion.cpp +669 -0
- package/deps/simdutf/fuzz/helpers/.clang-format-ignore +1 -0
- package/deps/simdutf/fuzz/helpers/common.h +135 -0
- package/deps/simdutf/fuzz/helpers/nameof.hpp +1258 -0
- package/deps/simdutf/fuzz/main.cpp +72 -0
- package/deps/simdutf/fuzz/minimize_and_cleanse.sh +87 -0
- package/deps/simdutf/fuzz/misc.cpp +216 -0
- package/deps/simdutf/fuzz/random_fuzz.sh +154 -0
- package/deps/simdutf/fuzz/roundtrip.cpp +588 -0
- package/deps/simdutf/fuzz/safe_conversion.cpp +104 -0
- package/deps/simdutf/include/simdutf/avx512.h +79 -0
- package/deps/simdutf/include/simdutf/base64_implementation.h +158 -0
- package/deps/simdutf/include/simdutf/base64_tables.h +887 -0
- package/deps/simdutf/include/simdutf/common_defs.h +186 -0
- package/deps/simdutf/include/simdutf/compiler_check.h +50 -0
- package/deps/simdutf/include/simdutf/constexpr_ptr.h +138 -0
- package/deps/simdutf/include/simdutf/encoding_types.h +189 -0
- package/deps/simdutf/include/simdutf/error.h +126 -0
- package/deps/simdutf/include/simdutf/implementation.h +7081 -0
- package/deps/simdutf/include/simdutf/internal/isadetection.h +325 -0
- package/deps/simdutf/include/simdutf/portability.h +285 -0
- package/deps/simdutf/include/simdutf/scalar/ascii.h +86 -0
- package/deps/simdutf/include/simdutf/scalar/atomic_util.h +105 -0
- package/deps/simdutf/include/simdutf/scalar/base64.h +911 -0
- package/deps/simdutf/include/simdutf/scalar/latin1.h +26 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf16/latin1_to_utf16.h +52 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf32/latin1_to_utf32.h +27 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf8/latin1_to_utf8.h +191 -0
- package/deps/simdutf/include/simdutf/scalar/swap_bytes.h +35 -0
- package/deps/simdutf/include/simdutf/scalar/utf16.h +226 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/utf16_to_latin1.h +108 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/valid_utf16_to_latin1.h +40 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/utf16_to_utf32.h +86 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/valid_utf16_to_utf32.h +44 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/utf16_to_utf8.h +295 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/valid_utf16_to_utf8.h +91 -0
- package/deps/simdutf/include/simdutf/scalar/utf32.h +82 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/utf32_to_latin1.h +68 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/valid_utf32_to_latin1.h +67 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/utf32_to_utf16.h +84 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/valid_utf32_to_utf16.h +44 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/utf32_to_utf8.h +142 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/valid_utf32_to_utf8.h +72 -0
- package/deps/simdutf/include/simdutf/scalar/utf8.h +326 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/utf8_to_latin1.h +225 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/valid_utf8_to_latin1.h +87 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/utf8_to_utf16.h +342 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/valid_utf8_to_utf16.h +106 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/utf8_to_utf32.h +299 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/valid_utf8_to_utf32.h +83 -0
- package/deps/simdutf/include/simdutf/simdutf_version.h +26 -0
- package/deps/simdutf/include/simdutf.h +26 -0
- package/deps/simdutf/include/simdutf_c.h +342 -0
- package/deps/simdutf/riscv/Dockerfile +16 -0
- package/deps/simdutf/riscv/README.md +24 -0
- package/deps/simdutf/riscv/remove-docker-station +8 -0
- package/deps/simdutf/riscv/run-docker-station +31 -0
- package/deps/simdutf/scripts/.flake8 +2 -0
- package/deps/simdutf/scripts/Makefile +2 -0
- package/deps/simdutf/scripts/README_ADD_FUNCTION.md +49 -0
- package/deps/simdutf/scripts/add_function.py +330 -0
- package/deps/simdutf/scripts/amalgamation_tests.py +156 -0
- package/deps/simdutf/scripts/base64/Makefile +2 -0
- package/deps/simdutf/scripts/base64/README.md +2 -0
- package/deps/simdutf/scripts/base64/avx512.py +76 -0
- package/deps/simdutf/scripts/base64/neon_decode.py +143 -0
- package/deps/simdutf/scripts/base64/neon_generate_lut.py +101 -0
- package/deps/simdutf/scripts/base64/sse.py +252 -0
- package/deps/simdutf/scripts/base64/sseregular.py +160 -0
- package/deps/simdutf/scripts/base64/sseurl.py +283 -0
- package/deps/simdutf/scripts/base64/table.py +59 -0
- package/deps/simdutf/scripts/base64bench_print.py +145 -0
- package/deps/simdutf/scripts/benchmark-all.py +119 -0
- package/deps/simdutf/scripts/benchmark_print.py +324 -0
- package/deps/simdutf/scripts/check_feature_macros.py +156 -0
- package/deps/simdutf/scripts/check_typos.sh +13 -0
- package/deps/simdutf/scripts/clang_format.sh +35 -0
- package/deps/simdutf/scripts/clang_format_docker.sh +38 -0
- package/deps/simdutf/scripts/common.py +24 -0
- package/deps/simdutf/scripts/compilation_benchmark.py +55 -0
- package/deps/simdutf/scripts/compile_many_variations.sh +64 -0
- package/deps/simdutf/scripts/create_latex_table.py +62 -0
- package/deps/simdutf/scripts/docker/Dockerfile +14 -0
- package/deps/simdutf/scripts/docker/Makefile +9 -0
- package/deps/simdutf/scripts/docker/README.md +30 -0
- package/deps/simdutf/scripts/docker/llvm.gpg +0 -0
- package/deps/simdutf/scripts/ppc64_convert_utf16_to_utf8.py +155 -0
- package/deps/simdutf/scripts/prepare_doxygen.sh +21 -0
- package/deps/simdutf/scripts/release.py +197 -0
- package/deps/simdutf/scripts/shortinputplots.py +97 -0
- package/deps/simdutf/scripts/sse_convert_utf16_to_utf8.py +422 -0
- package/deps/simdutf/scripts/sse_convert_utf32_to_utf16.py +105 -0
- package/deps/simdutf/scripts/sse_utf8_utf16_decode.py +186 -0
- package/deps/simdutf/scripts/sse_validate_utf16le_proof.py +137 -0
- package/deps/simdutf/scripts/sse_validate_utf16le_testcases.py +129 -0
- package/deps/simdutf/scripts/table.py +207 -0
- package/deps/simdutf/scripts/tests/new.txt +33 -0
- package/deps/simdutf/scripts/tests/old.txt +33 -0
- package/deps/simdutf/scripts/tests/results.txt +272 -0
- package/deps/simdutf/simdutf.pc.in +11 -0
- package/deps/simdutf/singleheader/.flake8 +2 -0
- package/deps/simdutf/singleheader/CMakeLists.txt +64 -0
- package/deps/simdutf/singleheader/README-dev.md +81 -0
- package/deps/simdutf/singleheader/README.md +19 -0
- package/deps/simdutf/singleheader/amalgamate.py +513 -0
- package/deps/simdutf/singleheader/amalgamation_demo.c +59 -0
- package/deps/simdutf/singleheader/amalgamation_demo.cpp +54 -0
- package/deps/simdutf/singleheader/test-features.py +262 -0
- package/deps/simdutf/src/CMakeLists.txt +78 -0
- package/deps/simdutf/src/arm64/arm_base64.cpp +791 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf16.cpp +24 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf32.cpp +24 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf8.cpp +70 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_latin1.cpp +61 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf32.cpp +185 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf8.cpp +780 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_latin1.cpp +60 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf16.cpp +208 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf8.cpp +505 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_latin1.cpp +69 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf16.cpp +313 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf32.cpp +179 -0
- package/deps/simdutf/src/arm64/arm_find.cpp +199 -0
- package/deps/simdutf/src/arm64/arm_utf16fix.cpp +185 -0
- package/deps/simdutf/src/arm64/arm_validate_utf16.cpp +165 -0
- package/deps/simdutf/src/arm64/arm_validate_utf32le.cpp +65 -0
- package/deps/simdutf/src/arm64/implementation.cpp +1442 -0
- package/deps/simdutf/src/encoding_types.cpp +67 -0
- package/deps/simdutf/src/error.cpp +3 -0
- package/deps/simdutf/src/fallback/implementation.cpp +589 -0
- package/deps/simdutf/src/generic/ascii_validation.h +50 -0
- package/deps/simdutf/src/generic/base64.h +233 -0
- package/deps/simdutf/src/generic/base64lengths.h +63 -0
- package/deps/simdutf/src/generic/buf_block_reader.h +109 -0
- package/deps/simdutf/src/generic/find.h +75 -0
- package/deps/simdutf/src/generic/utf16/change_endianness.h +24 -0
- package/deps/simdutf/src/generic/utf16/count_code_points_bytemask.h +58 -0
- package/deps/simdutf/src/generic/utf16/to_well_formed.h +93 -0
- package/deps/simdutf/src/generic/utf16/utf32_length_from_utf16.h +15 -0
- package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16.h +35 -0
- package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16_bytemask.h +199 -0
- package/deps/simdutf/src/generic/utf16.h +73 -0
- package/deps/simdutf/src/generic/utf32.h +136 -0
- package/deps/simdutf/src/generic/utf8/utf16_length_from_utf8_bytemask.h +53 -0
- package/deps/simdutf/src/generic/utf8.h +92 -0
- package/deps/simdutf/src/generic/utf8_to_latin1/utf8_to_latin1.h +316 -0
- package/deps/simdutf/src/generic/utf8_to_latin1/valid_utf8_to_latin1.h +78 -0
- package/deps/simdutf/src/generic/utf8_to_utf16/utf8_to_utf16.h +332 -0
- package/deps/simdutf/src/generic/utf8_to_utf16/valid_utf8_to_utf16.h +74 -0
- package/deps/simdutf/src/generic/utf8_to_utf32/utf8_to_utf32.h +318 -0
- package/deps/simdutf/src/generic/utf8_to_utf32/valid_utf8_to_utf32.h +42 -0
- package/deps/simdutf/src/generic/utf8_validation/utf8_lookup4_algorithm.h +223 -0
- package/deps/simdutf/src/generic/utf8_validation/utf8_validator.h +84 -0
- package/deps/simdutf/src/generic/validate_utf16.h +164 -0
- package/deps/simdutf/src/generic/validate_utf32.h +99 -0
- package/deps/simdutf/src/haswell/avx2_base64.cpp +837 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf16.cpp +28 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf32.cpp +20 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf8.cpp +83 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_latin1.cpp +83 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf32.cpp +210 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf8.cpp +602 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_latin1.cpp +116 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf16.cpp +164 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf8.cpp +569 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_latin1.cpp +60 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf16.cpp +195 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf32.cpp +135 -0
- package/deps/simdutf/src/haswell/avx2_utf16fix.cpp +173 -0
- package/deps/simdutf/src/haswell/avx2_validate_utf16.cpp +17 -0
- package/deps/simdutf/src/haswell/implementation.cpp +1447 -0
- package/deps/simdutf/src/icelake/icelake_ascii_validation.inl.cpp +19 -0
- package/deps/simdutf/src/icelake/icelake_base64.inl.cpp +630 -0
- package/deps/simdutf/src/icelake/icelake_common.inl.cpp +37 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf16.inl.cpp +36 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf32.inl.cpp +23 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf8.inl.cpp +107 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_latin1.inl.cpp +103 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf32.inl.cpp +136 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf8.inl.cpp +206 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_latin1.inl.cpp +74 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf16.inl.cpp +338 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf8.inl.cpp +574 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf8_to_latin1.inl.cpp +104 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf8_to_utf16.inl.cpp +75 -0
- package/deps/simdutf/src/icelake/icelake_convert_valid_utf8_to_latin1.inl.cpp +69 -0
- package/deps/simdutf/src/icelake/icelake_find.inl.cpp +146 -0
- package/deps/simdutf/src/icelake/icelake_from_utf8.inl.cpp +266 -0
- package/deps/simdutf/src/icelake/icelake_from_valid_utf8.inl.cpp +136 -0
- package/deps/simdutf/src/icelake/icelake_macros.inl.cpp +143 -0
- package/deps/simdutf/src/icelake/icelake_utf16fix.cpp +138 -0
- package/deps/simdutf/src/icelake/icelake_utf32_validation.inl.cpp +63 -0
- package/deps/simdutf/src/icelake/icelake_utf8_common.inl.cpp +753 -0
- package/deps/simdutf/src/icelake/icelake_utf8_length_from_utf16.inl.cpp +269 -0
- package/deps/simdutf/src/icelake/icelake_utf8_validation.inl.cpp +116 -0
- package/deps/simdutf/src/icelake/implementation.cpp +1903 -0
- package/deps/simdutf/src/implementation.cpp +2526 -0
- package/deps/simdutf/src/lasx/implementation.cpp +1531 -0
- package/deps/simdutf/src/lasx/lasx_base64.cpp +695 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf16.cpp +76 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf32.cpp +55 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf8.cpp +65 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_latin1.cpp +64 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf32.cpp +183 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf8.cpp +550 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_latin1.cpp +73 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf16.cpp +218 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf8.cpp +589 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_latin1.cpp +72 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf16.cpp +296 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf32.cpp +190 -0
- package/deps/simdutf/src/lasx/lasx_find.cpp +64 -0
- package/deps/simdutf/src/lasx/lasx_validate_utf16.cpp +13 -0
- package/deps/simdutf/src/lasx/lasx_validate_utf32le.cpp +84 -0
- package/deps/simdutf/src/lsx/implementation.cpp +1417 -0
- package/deps/simdutf/src/lsx/lsx_base64.cpp +675 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf16.cpp +39 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf32.cpp +27 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf8.cpp +56 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_latin1.cpp +64 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf32.cpp +133 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf8.cpp +518 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_latin1.cpp +66 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf16.cpp +155 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf8.cpp +459 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_latin1.cpp +75 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf16.cpp +291 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf32.cpp +179 -0
- package/deps/simdutf/src/lsx/lsx_find.cpp +60 -0
- package/deps/simdutf/src/lsx/lsx_validate_utf16.cpp +13 -0
- package/deps/simdutf/src/lsx/lsx_validate_utf32le.cpp +68 -0
- package/deps/simdutf/src/ppc64/implementation.cpp +992 -0
- package/deps/simdutf/src/ppc64/ppc64_base64.cpp +480 -0
- package/deps/simdutf/src/ppc64/ppc64_base64_internal_tests.cpp +401 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf16.cpp +12 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf32.cpp +12 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf8.cpp +149 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_latin1.cpp +67 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf32.cpp +87 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf8.cpp +296 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_latin1.cpp +57 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf16.cpp +117 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf8.cpp +166 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_latin1.cpp +69 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf16.cpp +211 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf32.cpp +153 -0
- package/deps/simdutf/src/ppc64/ppc64_utf16_to_utf8_tables.h +1011 -0
- package/deps/simdutf/src/ppc64/ppc64_utf8_length_from_latin1.cpp +37 -0
- package/deps/simdutf/src/ppc64/ppc64_validate_utf16.cpp +19 -0
- package/deps/simdutf/src/ppc64/templates.cpp +91 -0
- package/deps/simdutf/src/rvv/implementation.cpp +138 -0
- package/deps/simdutf/src/rvv/rvv_find.cpp +27 -0
- package/deps/simdutf/src/rvv/rvv_helpers.inl.cpp +23 -0
- package/deps/simdutf/src/rvv/rvv_latin1_to.inl.cpp +71 -0
- package/deps/simdutf/src/rvv/rvv_length_from.inl.cpp +164 -0
- package/deps/simdutf/src/rvv/rvv_utf16_to.inl.cpp +399 -0
- package/deps/simdutf/src/rvv/rvv_utf16fix.cpp +110 -0
- package/deps/simdutf/src/rvv/rvv_utf32_to.inl.cpp +307 -0
- package/deps/simdutf/src/rvv/rvv_utf8_to.inl.cpp +435 -0
- package/deps/simdutf/src/rvv/rvv_validate.inl.cpp +275 -0
- package/deps/simdutf/src/simdutf/arm64/begin.h +2 -0
- package/deps/simdutf/src/simdutf/arm64/bitmanipulation.h +34 -0
- package/deps/simdutf/src/simdutf/arm64/end.h +2 -0
- package/deps/simdutf/src/simdutf/arm64/implementation.h +307 -0
- package/deps/simdutf/src/simdutf/arm64/intrinsics.h +10 -0
- package/deps/simdutf/src/simdutf/arm64/simd.h +547 -0
- package/deps/simdutf/src/simdutf/arm64/simd16-inl.h +403 -0
- package/deps/simdutf/src/simdutf/arm64/simd32-inl.h +129 -0
- package/deps/simdutf/src/simdutf/arm64/simd64-inl.h +28 -0
- package/deps/simdutf/src/simdutf/arm64.h +43 -0
- package/deps/simdutf/src/simdutf/fallback/begin.h +1 -0
- package/deps/simdutf/src/simdutf/fallback/bitmanipulation.h +13 -0
- package/deps/simdutf/src/simdutf/fallback/end.h +1 -0
- package/deps/simdutf/src/simdutf/fallback/implementation.h +331 -0
- package/deps/simdutf/src/simdutf/fallback.h +42 -0
- package/deps/simdutf/src/simdutf/haswell/begin.h +15 -0
- package/deps/simdutf/src/simdutf/haswell/bitmanipulation.h +35 -0
- package/deps/simdutf/src/simdutf/haswell/end.h +13 -0
- package/deps/simdutf/src/simdutf/haswell/implementation.h +338 -0
- package/deps/simdutf/src/simdutf/haswell/intrinsics.h +67 -0
- package/deps/simdutf/src/simdutf/haswell/simd.h +363 -0
- package/deps/simdutf/src/simdutf/haswell/simd16-inl.h +261 -0
- package/deps/simdutf/src/simdutf/haswell/simd32-inl.h +111 -0
- package/deps/simdutf/src/simdutf/haswell/simd64-inl.h +34 -0
- package/deps/simdutf/src/simdutf/haswell.h +63 -0
- package/deps/simdutf/src/simdutf/icelake/begin.h +14 -0
- package/deps/simdutf/src/simdutf/icelake/bitmanipulation.h +44 -0
- package/deps/simdutf/src/simdutf/icelake/end.h +12 -0
- package/deps/simdutf/src/simdutf/icelake/implementation.h +346 -0
- package/deps/simdutf/src/simdutf/icelake/intrinsics.h +138 -0
- package/deps/simdutf/src/simdutf/icelake/simd.h +17 -0
- package/deps/simdutf/src/simdutf/icelake/simd16-inl.h +90 -0
- package/deps/simdutf/src/simdutf/icelake/simd32-inl.h +47 -0
- package/deps/simdutf/src/simdutf/icelake.h +81 -0
- package/deps/simdutf/src/simdutf/lasx/begin.h +8 -0
- package/deps/simdutf/src/simdutf/lasx/bitmanipulation.h +25 -0
- package/deps/simdutf/src/simdutf/lasx/end.h +8 -0
- package/deps/simdutf/src/simdutf/lasx/implementation.h +310 -0
- package/deps/simdutf/src/simdutf/lasx/intrinsics.h +319 -0
- package/deps/simdutf/src/simdutf/lasx/simd.h +551 -0
- package/deps/simdutf/src/simdutf/lasx/simd16-inl.h +234 -0
- package/deps/simdutf/src/simdutf/lasx/simd32-inl.h +74 -0
- package/deps/simdutf/src/simdutf/lasx/simd64-inl.h +52 -0
- package/deps/simdutf/src/simdutf/lasx.h +49 -0
- package/deps/simdutf/src/simdutf/lsx/begin.h +2 -0
- package/deps/simdutf/src/simdutf/lsx/bitmanipulation.h +25 -0
- package/deps/simdutf/src/simdutf/lsx/end.h +2 -0
- package/deps/simdutf/src/simdutf/lsx/implementation.h +309 -0
- package/deps/simdutf/src/simdutf/lsx/intrinsics.h +196 -0
- package/deps/simdutf/src/simdutf/lsx/simd.h +421 -0
- package/deps/simdutf/src/simdutf/lsx/simd16-inl.h +242 -0
- package/deps/simdutf/src/simdutf/lsx/simd32-inl.h +69 -0
- package/deps/simdutf/src/simdutf/lsx/simd64-inl.h +50 -0
- package/deps/simdutf/src/simdutf/lsx.h +52 -0
- package/deps/simdutf/src/simdutf/ppc64/begin.h +1 -0
- package/deps/simdutf/src/simdutf/ppc64/bitmanipulation.h +29 -0
- package/deps/simdutf/src/simdutf/ppc64/end.h +1 -0
- package/deps/simdutf/src/simdutf/ppc64/implementation.h +348 -0
- package/deps/simdutf/src/simdutf/ppc64/intrinsics.h +19 -0
- package/deps/simdutf/src/simdutf/ppc64/simd.h +177 -0
- package/deps/simdutf/src/simdutf/ppc64/simd16-inl.h +327 -0
- package/deps/simdutf/src/simdutf/ppc64/simd32-inl.h +247 -0
- package/deps/simdutf/src/simdutf/ppc64/simd8-inl.h +618 -0
- package/deps/simdutf/src/simdutf/ppc64.h +40 -0
- package/deps/simdutf/src/simdutf/rvv/begin.h +7 -0
- package/deps/simdutf/src/simdutf/rvv/end.h +7 -0
- package/deps/simdutf/src/simdutf/rvv/implementation.h +321 -0
- package/deps/simdutf/src/simdutf/rvv/intrinsics.h +131 -0
- package/deps/simdutf/src/simdutf/rvv.h +41 -0
- package/deps/simdutf/src/simdutf/westmere/begin.h +8 -0
- package/deps/simdutf/src/simdutf/westmere/bitmanipulation.h +37 -0
- package/deps/simdutf/src/simdutf/westmere/end.h +8 -0
- package/deps/simdutf/src/simdutf/westmere/implementation.h +338 -0
- package/deps/simdutf/src/simdutf/westmere/intrinsics.h +38 -0
- package/deps/simdutf/src/simdutf/westmere/simd.h +379 -0
- package/deps/simdutf/src/simdutf/westmere/simd16-inl.h +242 -0
- package/deps/simdutf/src/simdutf/westmere/simd32-inl.h +151 -0
- package/deps/simdutf/src/simdutf/westmere/simd64-inl.h +33 -0
- package/deps/simdutf/src/simdutf/westmere.h +59 -0
- package/deps/simdutf/src/simdutf.cpp +152 -0
- package/deps/simdutf/src/simdutf_c.cpp +525 -0
- package/deps/simdutf/src/tables/utf16_to_utf8_tables.h +768 -0
- package/deps/simdutf/src/tables/utf32_to_utf16_tables.h +53 -0
- package/deps/simdutf/src/tables/utf8_to_utf16_tables.h +826 -0
- package/deps/simdutf/src/westmere/implementation.cpp +1479 -0
- package/deps/simdutf/src/westmere/internal/loader.cpp +7 -0
- package/deps/simdutf/src/westmere/internal/write_v_u16_11bits_to_utf8.cpp +66 -0
- package/deps/simdutf/src/westmere/sse_base64.cpp +672 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf16.cpp +21 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf32.cpp +31 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf8.cpp +71 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_latin1.cpp +70 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf32.cpp +206 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf8.cpp +504 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_latin1.cpp +82 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf16.cpp +209 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf8.cpp +589 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_latin1.cpp +58 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf16.cpp +197 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf32.cpp +141 -0
- package/deps/simdutf/src/westmere/sse_utf16fix.cpp +82 -0
- package/deps/simdutf/src/westmere/sse_validate_utf16.cpp +17 -0
- package/deps/simdutf/tests/CMakeLists.txt +483 -0
- package/deps/simdutf/tests/atomic_base64_tests.cpp +2845 -0
- package/deps/simdutf/tests/base64_tests.cpp +3617 -0
- package/deps/simdutf/tests/basic_fuzzer.cpp +805 -0
- package/deps/simdutf/tests/bele_tests.cpp +182 -0
- package/deps/simdutf/tests/constexpr_base64_tests.cpp +387 -0
- package/deps/simdutf/tests/convert_latin1_to_utf16be_tests.cpp +52 -0
- package/deps/simdutf/tests/convert_latin1_to_utf16le_tests.cpp +80 -0
- package/deps/simdutf/tests/convert_latin1_to_utf32_tests.cpp +66 -0
- package/deps/simdutf/tests/convert_latin1_to_utf8_tests.cpp +120 -0
- package/deps/simdutf/tests/convert_utf16_to_utf8_safe_tests.cpp +203 -0
- package/deps/simdutf/tests/convert_utf16_to_utf8_with_replacement_tests.cpp +276 -0
- package/deps/simdutf/tests/convert_utf16be_to_latin1_tests.cpp +109 -0
- package/deps/simdutf/tests/convert_utf16be_to_latin1_tests_with_errors.cpp +136 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf32_tests.cpp +193 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf32_with_errors_tests.cpp +381 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf8_tests.cpp +259 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf8_with_errors_tests.cpp +266 -0
- package/deps/simdutf/tests/convert_utf16le_to_latin1_tests.cpp +148 -0
- package/deps/simdutf/tests/convert_utf16le_to_latin1_tests_with_errors.cpp +176 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf32_tests.cpp +213 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf32_with_errors_tests.cpp +318 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf8_tests.cpp +343 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf8_with_errors_tests.cpp +271 -0
- package/deps/simdutf/tests/convert_utf32_to_latin1_tests.cpp +111 -0
- package/deps/simdutf/tests/convert_utf32_to_latin1_with_errors_tests.cpp +96 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16be_tests.cpp +148 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16be_with_errors_tests.cpp +192 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16le_tests.cpp +166 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16le_with_errors_tests.cpp +215 -0
- package/deps/simdutf/tests/convert_utf32_to_utf8_tests.cpp +181 -0
- package/deps/simdutf/tests/convert_utf32_to_utf8_with_errors_tests.cpp +261 -0
- package/deps/simdutf/tests/convert_utf8_to_latin1_tests.cpp +516 -0
- package/deps/simdutf/tests/convert_utf8_to_latin1_with_errors_tests.cpp +579 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16be_tests.cpp +412 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16be_with_errors_tests.cpp +480 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16le_tests.cpp +671 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16le_with_errors_tests.cpp +455 -0
- package/deps/simdutf/tests/convert_utf8_to_utf32_tests.cpp +1204 -0
- package/deps/simdutf/tests/convert_utf8_to_utf32_with_errors_tests.cpp +337 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_latin1_tests.cpp +37 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_utf32_tests.cpp +97 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_utf8_tests.cpp +126 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_latin1_tests.cpp +71 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_utf32_tests.cpp +122 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_utf8_tests.cpp +244 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_latin1_tests.cpp +49 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf16be_tests.cpp +92 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf16le_tests.cpp +114 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf8_tests.cpp +109 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_latin1_tests.cpp +84 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf16be_tests.cpp +124 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf16le_tests.cpp +221 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf32_tests.cpp +155 -0
- package/deps/simdutf/tests/count_utf16be.cpp +64 -0
- package/deps/simdutf/tests/count_utf16le.cpp +61 -0
- package/deps/simdutf/tests/count_utf8.cpp +87 -0
- package/deps/simdutf/tests/detect_encodings_tests.cpp +312 -0
- package/deps/simdutf/tests/embed/valid_utf8.txt +1 -0
- package/deps/simdutf/tests/embed_tests.cpp +22 -0
- package/deps/simdutf/tests/find_tests.cpp +77 -0
- package/deps/simdutf/tests/fixed_string_tests.cpp +153 -0
- package/deps/simdutf/tests/helpers/CMakeLists.txt +25 -0
- package/deps/simdutf/tests/helpers/compiletime_conversions.h +222 -0
- package/deps/simdutf/tests/helpers/fixed_string.h +267 -0
- package/deps/simdutf/tests/helpers/random_int.cpp +30 -0
- package/deps/simdutf/tests/helpers/random_int.h +39 -0
- package/deps/simdutf/tests/helpers/random_utf16.cpp +123 -0
- package/deps/simdutf/tests/helpers/random_utf16.h +52 -0
- package/deps/simdutf/tests/helpers/random_utf32.cpp +41 -0
- package/deps/simdutf/tests/helpers/random_utf32.h +40 -0
- package/deps/simdutf/tests/helpers/random_utf8.cpp +93 -0
- package/deps/simdutf/tests/helpers/random_utf8.h +36 -0
- package/deps/simdutf/tests/helpers/test.cpp +231 -0
- package/deps/simdutf/tests/helpers/test.h +193 -0
- package/deps/simdutf/tests/helpers/transcode_test_base.cpp +1257 -0
- package/deps/simdutf/tests/helpers/transcode_test_base.h +683 -0
- package/deps/simdutf/tests/helpers/utf16.h +27 -0
- package/deps/simdutf/tests/installation_tests/find/CMakeLists.txt +43 -0
- package/deps/simdutf/tests/installation_tests/from_fetch/CMakeLists.txt +47 -0
- package/deps/simdutf/tests/internal_tests.cpp +27 -0
- package/deps/simdutf/tests/null_safety_tests.cpp +94 -0
- package/deps/simdutf/tests/random_fuzzer.cpp +779 -0
- package/deps/simdutf/tests/readme_tests.cpp +274 -0
- package/deps/simdutf/tests/reference/CMakeLists.txt +23 -0
- package/deps/simdutf/tests/reference/decode_utf16.h +81 -0
- package/deps/simdutf/tests/reference/decode_utf32.h +47 -0
- package/deps/simdutf/tests/reference/encode_latin1.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_latin1.h +32 -0
- package/deps/simdutf/tests/reference/encode_utf16.cpp +49 -0
- package/deps/simdutf/tests/reference/encode_utf16.h +20 -0
- package/deps/simdutf/tests/reference/encode_utf32.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_utf32.h +36 -0
- package/deps/simdutf/tests/reference/encode_utf8.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_utf8.h +40 -0
- package/deps/simdutf/tests/reference/validate_utf16.cpp +60 -0
- package/deps/simdutf/tests/reference/validate_utf16.h +14 -0
- package/deps/simdutf/tests/reference/validate_utf16_to_latin1.cpp +35 -0
- package/deps/simdutf/tests/reference/validate_utf16_to_latin1.h +13 -0
- package/deps/simdutf/tests/reference/validate_utf32.cpp +27 -0
- package/deps/simdutf/tests/reference/validate_utf32.h +12 -0
- package/deps/simdutf/tests/reference/validate_utf32_to_latin1.cpp +27 -0
- package/deps/simdutf/tests/reference/validate_utf32_to_latin1.h +12 -0
- package/deps/simdutf/tests/reference/validate_utf8.cpp +82 -0
- package/deps/simdutf/tests/reference/validate_utf8.h +11 -0
- package/deps/simdutf/tests/reference/validate_utf8_to_latin1.cpp +43 -0
- package/deps/simdutf/tests/reference/validate_utf8_to_latin1.h +12 -0
- package/deps/simdutf/tests/select_implementation.cpp +43 -0
- package/deps/simdutf/tests/simdutf_c_tests.cpp +244 -0
- package/deps/simdutf/tests/span_tests.cpp +401 -0
- package/deps/simdutf/tests/special_tests.cpp +559 -0
- package/deps/simdutf/tests/straight_c_test.c +187 -0
- package/deps/simdutf/tests/text_encoding_tests.cpp +77 -0
- package/deps/simdutf/tests/to_well_formed_utf16_tests.cpp +377 -0
- package/deps/simdutf/tests/utf8_length_from_utf16_tests.cpp +202 -0
- package/deps/simdutf/tests/validate_ascii_basic_tests.cpp +165 -0
- package/deps/simdutf/tests/validate_ascii_with_errors_tests.cpp +77 -0
- package/deps/simdutf/tests/validate_utf16be_basic_tests.cpp +175 -0
- package/deps/simdutf/tests/validate_utf16be_with_errors_tests.cpp +188 -0
- package/deps/simdutf/tests/validate_utf16le_basic_tests.cpp +268 -0
- package/deps/simdutf/tests/validate_utf16le_with_errors_tests.cpp +274 -0
- package/deps/simdutf/tests/validate_utf32_basic_tests.cpp +92 -0
- package/deps/simdutf/tests/validate_utf32_with_errors_tests.cpp +114 -0
- package/deps/simdutf/tests/validate_utf8_basic_tests.cpp +178 -0
- package/deps/simdutf/tests/validate_utf8_brute_force_tests.cpp +88 -0
- package/deps/simdutf/tests/validate_utf8_puzzler_tests.cpp +33 -0
- package/deps/simdutf/tests/validate_utf8_with_errors_tests.cpp +228 -0
- package/deps/simdutf/tools/CMakeLists.txt +85 -0
- package/deps/simdutf/tools/fastbase64.cpp +250 -0
- package/deps/simdutf/tools/sutf.cpp +556 -0
- package/deps/simdutf/tools/sutf.h +40 -0
- package/package.json +2 -2
|
@@ -0,0 +1,36 @@
|
|
|
1
|
+
// file included directly
|
|
2
|
+
template <endianness big_endian>
|
|
3
|
+
size_t icelake_convert_latin1_to_utf16(const char *latin1_input, size_t len,
|
|
4
|
+
char16_t *utf16_output) {
|
|
5
|
+
size_t rounded_len = len & ~0x1F; // Round down to nearest multiple of 32
|
|
6
|
+
|
|
7
|
+
__m512i byteflip = _mm512_setr_epi64(0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
8
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
9
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
10
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809);
|
|
11
|
+
for (size_t i = 0; i < rounded_len; i += 32) {
|
|
12
|
+
// Load 32 Latin1 characters into a 256-bit register
|
|
13
|
+
__m256i in = _mm256_loadu_si256((__m256i *)&latin1_input[i]);
|
|
14
|
+
// Zero extend each set of 8 Latin1 characters to 32 16-bit integers
|
|
15
|
+
__m512i out = _mm512_cvtepu8_epi16(in);
|
|
16
|
+
if (big_endian) {
|
|
17
|
+
out = _mm512_shuffle_epi8(out, byteflip);
|
|
18
|
+
}
|
|
19
|
+
// Store the results back to memory
|
|
20
|
+
_mm512_storeu_si512((__m512i *)&utf16_output[i], out);
|
|
21
|
+
}
|
|
22
|
+
if (rounded_len != len) {
|
|
23
|
+
uint32_t mask = uint32_t(1 << (len - rounded_len)) - 1;
|
|
24
|
+
__m256i in = _mm256_maskz_loadu_epi8(mask, latin1_input + rounded_len);
|
|
25
|
+
|
|
26
|
+
// Zero extend each set of 8 Latin1 characters to 32 16-bit integers
|
|
27
|
+
__m512i out = _mm512_cvtepu8_epi16(in);
|
|
28
|
+
if (big_endian) {
|
|
29
|
+
out = _mm512_shuffle_epi8(out, byteflip);
|
|
30
|
+
}
|
|
31
|
+
// Store the results back to memory
|
|
32
|
+
_mm512_mask_storeu_epi16(utf16_output + rounded_len, mask, out);
|
|
33
|
+
}
|
|
34
|
+
|
|
35
|
+
return len;
|
|
36
|
+
}
|
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
// Widens `len` Latin1 bytes from `buf` to 32-bit code points written to
// `utf32_output`, one code point per input byte.
void avx512_convert_latin1_to_utf32(const char *buf, size_t len,
                                    char32_t *utf32_output) {
  // Whole 16-byte chunks first; 0..15 bytes are left for the masked tail.
  const size_t tail_len = len % 16;
  const char *const body_end = buf + (len - tail_len);

  for (; buf != body_end; buf += 16, utf32_output += 16) {
    // 16 Latin1 bytes -> 16 zero-extended 32-bit integers (vpmovzxbd).
    const __m128i bytes = _mm_loadu_si128((const __m128i *)buf);
    const __m512i code_points = _mm512_cvtepu8_epi32(bytes);
    _mm512_storeu_si512((__m512i *)utf32_output, code_points);
  }

  // Tail: executed unconditionally. With no bytes left the mask is zero, so
  // the masked load and store select no elements.
  const __mmask16 tail_mask = __mmask16((1 << tail_len) - 1);
  const __m128i tail_bytes = _mm_maskz_loadu_epi8(tail_mask, buf);
  const __m512i tail_code_points = _mm512_cvtepu8_epi32(tail_bytes);
  _mm512_mask_storeu_epi32((__m512i *)utf32_output, tail_mask,
                           tail_code_points);
}
|
|
@@ -0,0 +1,107 @@
|
|
|
1
|
+
// file included directly
|
|
2
|
+
|
|
3
|
+
static inline size_t latin1_to_utf8_avx512_vec(__m512i input, size_t input_len,
|
|
4
|
+
char *utf8_output,
|
|
5
|
+
int mask_output) {
|
|
6
|
+
__mmask64 nonascii = _mm512_movepi8_mask(input);
|
|
7
|
+
size_t output_size = input_len + (size_t)count_ones(nonascii);
|
|
8
|
+
|
|
9
|
+
// Mask to denote whether the byte is a leading byte that is not ascii
|
|
10
|
+
__mmask64 sixth = _mm512_cmpge_epu8_mask(
|
|
11
|
+
input, _mm512_set1_epi8(-64)); // binary representation of -64: 1100 0000
|
|
12
|
+
|
|
13
|
+
const uint64_t alternate_bits = UINT64_C(0x5555555555555555);
|
|
14
|
+
uint64_t ascii = ~nonascii;
|
|
15
|
+
// the bits in ascii are inverted and zeros are interspersed in between them
|
|
16
|
+
uint64_t maskA = ~_pdep_u64(ascii, alternate_bits);
|
|
17
|
+
uint64_t maskB = ~_pdep_u64(ascii >> 32, alternate_bits);
|
|
18
|
+
|
|
19
|
+
// interleave bytes from top and bottom halves (abcd...ABCD -> aAbBcCdD)
|
|
20
|
+
__m512i input_interleaved = _mm512_permutexvar_epi8(
|
|
21
|
+
_mm512_set_epi32(0x3f1f3e1e, 0x3d1d3c1c, 0x3b1b3a1a, 0x39193818,
|
|
22
|
+
0x37173616, 0x35153414, 0x33133212, 0x31113010,
|
|
23
|
+
0x2f0f2e0e, 0x2d0d2c0c, 0x2b0b2a0a, 0x29092808,
|
|
24
|
+
0x27072606, 0x25052404, 0x23032202, 0x21012000),
|
|
25
|
+
input);
|
|
26
|
+
|
|
27
|
+
// double size of each byte, and insert the leading byte 1100 0010
|
|
28
|
+
|
|
29
|
+
/*
|
|
30
|
+
upscale the bytes to 16-bit value, adding the 0b11000000 leading byte in the
|
|
31
|
+
process. We adjust for the bytes that have their two most significant bits.
|
|
32
|
+
This takes care of the first 32 bytes, assuming we interleaved the bytes. */
|
|
33
|
+
__m512i outputA =
|
|
34
|
+
_mm512_shldi_epi16(input_interleaved, _mm512_set1_epi8(-62), 8);
|
|
35
|
+
outputA = _mm512_mask_add_epi16(
|
|
36
|
+
outputA, (__mmask32)sixth, outputA,
|
|
37
|
+
_mm512_set1_epi16(1 - 0x4000)); // 1- 0x4000 = 1100 0000 0000 0001????
|
|
38
|
+
|
|
39
|
+
// in the second 32-bit half, set first or second option based on whether
|
|
40
|
+
// original input is leading byte (second case) or not (first case)
|
|
41
|
+
__m512i leadingB =
|
|
42
|
+
_mm512_mask_blend_epi16((__mmask32)(sixth >> 32),
|
|
43
|
+
_mm512_set1_epi16(0x00c2), // 0000 0000 1101 0010
|
|
44
|
+
_mm512_set1_epi16(0x40c3)); // 0100 0000 1100 0011
|
|
45
|
+
__m512i outputB = _mm512_ternarylogic_epi32(
|
|
46
|
+
input_interleaved, leadingB, _mm512_set1_epi16((short)0xff00),
|
|
47
|
+
(240 & 170) ^ 204); // (input_interleaved & 0xff00) ^ leadingB
|
|
48
|
+
|
|
49
|
+
// prune redundant bytes
|
|
50
|
+
outputA = _mm512_maskz_compress_epi8(maskA, outputA);
|
|
51
|
+
outputB = _mm512_maskz_compress_epi8(maskB, outputB);
|
|
52
|
+
|
|
53
|
+
size_t output_sizeA = (size_t)count_ones((uint32_t)nonascii) + 32;
|
|
54
|
+
|
|
55
|
+
if (mask_output) {
|
|
56
|
+
if (input_len > 32) { // is the second half of the input vector used?
|
|
57
|
+
__mmask64 write_mask = _bzhi_u64(~0ULL, (unsigned int)output_sizeA);
|
|
58
|
+
_mm512_mask_storeu_epi8(utf8_output, write_mask, outputA);
|
|
59
|
+
utf8_output += output_sizeA;
|
|
60
|
+
write_mask = _bzhi_u64(~0ULL, (unsigned int)(output_size - output_sizeA));
|
|
61
|
+
_mm512_mask_storeu_epi8(utf8_output, write_mask, outputB);
|
|
62
|
+
} else {
|
|
63
|
+
__mmask64 write_mask = _bzhi_u64(~0ULL, (unsigned int)output_size);
|
|
64
|
+
_mm512_mask_storeu_epi8(utf8_output, write_mask, outputA);
|
|
65
|
+
}
|
|
66
|
+
} else {
|
|
67
|
+
_mm512_storeu_si512(utf8_output, outputA);
|
|
68
|
+
utf8_output += output_sizeA;
|
|
69
|
+
_mm512_storeu_si512(utf8_output, outputB);
|
|
70
|
+
}
|
|
71
|
+
return output_size;
|
|
72
|
+
}
|
|
73
|
+
|
|
74
|
+
static inline size_t latin1_to_utf8_avx512_branch(__m512i input,
|
|
75
|
+
char *utf8_output) {
|
|
76
|
+
__mmask64 nonascii = _mm512_movepi8_mask(input);
|
|
77
|
+
if (nonascii) {
|
|
78
|
+
return latin1_to_utf8_avx512_vec(input, 64, utf8_output, 0);
|
|
79
|
+
} else {
|
|
80
|
+
_mm512_storeu_si512(utf8_output, input);
|
|
81
|
+
return 64;
|
|
82
|
+
}
|
|
83
|
+
}
|
|
84
|
+
|
|
85
|
+
size_t latin1_to_utf8_avx512_start(const char *buf, size_t len,
|
|
86
|
+
char *utf8_output) {
|
|
87
|
+
char *start = utf8_output;
|
|
88
|
+
size_t pos = 0;
|
|
89
|
+
// if there's at least 128 bytes remaining, we don't need to mask the output
|
|
90
|
+
for (; pos + 128 <= len; pos += 64) {
|
|
91
|
+
__m512i input = _mm512_loadu_si512((__m512i *)(buf + pos));
|
|
92
|
+
utf8_output += latin1_to_utf8_avx512_branch(input, utf8_output);
|
|
93
|
+
}
|
|
94
|
+
// in the last 128 bytes, the first 64 may require masking the output
|
|
95
|
+
if (pos + 64 <= len) {
|
|
96
|
+
__m512i input = _mm512_loadu_si512((__m512i *)(buf + pos));
|
|
97
|
+
utf8_output += latin1_to_utf8_avx512_vec(input, 64, utf8_output, 1);
|
|
98
|
+
pos += 64;
|
|
99
|
+
}
|
|
100
|
+
// with the last 64 bytes, the input also needs to be masked
|
|
101
|
+
if (pos < len) {
|
|
102
|
+
__mmask64 load_mask = _bzhi_u64(~0ULL, (unsigned int)(len - pos));
|
|
103
|
+
__m512i input = _mm512_maskz_loadu_epi8(load_mask, (__m512i *)(buf + pos));
|
|
104
|
+
utf8_output += latin1_to_utf8_avx512_vec(input, len - pos, utf8_output, 1);
|
|
105
|
+
}
|
|
106
|
+
return (size_t)(utf8_output - start);
|
|
107
|
+
}
|
|
@@ -0,0 +1,103 @@
|
|
|
1
|
+
// file included directly
|
|
2
|
+
template <endianness big_endian>
|
|
3
|
+
size_t icelake_convert_utf16_to_latin1(const char16_t *buf, size_t len,
|
|
4
|
+
char *latin1_output) {
|
|
5
|
+
const char16_t *end = buf + len;
|
|
6
|
+
__m512i v_0xFF = _mm512_set1_epi16(0xff);
|
|
7
|
+
__m512i byteflip = _mm512_setr_epi64(0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
8
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
9
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
10
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809);
|
|
11
|
+
__m512i shufmask = _mm512_set_epi8(
|
|
12
|
+
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
|
|
13
|
+
0, 0, 0, 0, 0, 0, 0, 62, 60, 58, 56, 54, 52, 50, 48, 46, 44, 42, 40, 38,
|
|
14
|
+
36, 34, 32, 30, 28, 26, 24, 22, 20, 18, 16, 14, 12, 10, 8, 6, 4, 2, 0);
|
|
15
|
+
while (end - buf >= 32) {
|
|
16
|
+
__m512i in = _mm512_loadu_si512((__m512i *)buf);
|
|
17
|
+
if (big_endian) {
|
|
18
|
+
in = _mm512_shuffle_epi8(in, byteflip);
|
|
19
|
+
}
|
|
20
|
+
if (_mm512_cmpgt_epu16_mask(in, v_0xFF)) {
|
|
21
|
+
return 0;
|
|
22
|
+
}
|
|
23
|
+
_mm256_storeu_si256(
|
|
24
|
+
(__m256i *)latin1_output,
|
|
25
|
+
_mm512_castsi512_si256(_mm512_permutexvar_epi8(shufmask, in)));
|
|
26
|
+
latin1_output += 32;
|
|
27
|
+
buf += 32;
|
|
28
|
+
}
|
|
29
|
+
if (buf < end) {
|
|
30
|
+
uint32_t mask(uint32_t(1 << (end - buf)) - 1);
|
|
31
|
+
__m512i in = _mm512_maskz_loadu_epi16(mask, buf);
|
|
32
|
+
if (big_endian) {
|
|
33
|
+
in = _mm512_shuffle_epi8(in, byteflip);
|
|
34
|
+
}
|
|
35
|
+
if (_mm512_cmpgt_epu16_mask(in, v_0xFF)) {
|
|
36
|
+
return 0;
|
|
37
|
+
}
|
|
38
|
+
_mm256_mask_storeu_epi8(
|
|
39
|
+
latin1_output, mask,
|
|
40
|
+
_mm512_castsi512_si256(_mm512_permutexvar_epi8(shufmask, in)));
|
|
41
|
+
}
|
|
42
|
+
return len;
|
|
43
|
+
}
|
|
44
|
+
|
|
45
|
+
template <endianness big_endian>
|
|
46
|
+
std::pair<result, char *>
|
|
47
|
+
icelake_convert_utf16_to_latin1_with_errors(const char16_t *buf, size_t len,
|
|
48
|
+
char *latin1_output) {
|
|
49
|
+
const char16_t *end = buf + len;
|
|
50
|
+
const char16_t *start = buf;
|
|
51
|
+
__m512i byteflip = _mm512_setr_epi64(0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
52
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
53
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
54
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809);
|
|
55
|
+
__m512i v_0xFF = _mm512_set1_epi16(0xff);
|
|
56
|
+
__m512i shufmask = _mm512_set_epi8(
|
|
57
|
+
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
|
|
58
|
+
0, 0, 0, 0, 0, 0, 0, 62, 60, 58, 56, 54, 52, 50, 48, 46, 44, 42, 40, 38,
|
|
59
|
+
36, 34, 32, 30, 28, 26, 24, 22, 20, 18, 16, 14, 12, 10, 8, 6, 4, 2, 0);
|
|
60
|
+
while (end - buf >= 32) {
|
|
61
|
+
__m512i in = _mm512_loadu_si512((__m512i *)buf);
|
|
62
|
+
if (big_endian) {
|
|
63
|
+
in = _mm512_shuffle_epi8(in, byteflip);
|
|
64
|
+
}
|
|
65
|
+
if (_mm512_cmpgt_epu16_mask(in, v_0xFF)) {
|
|
66
|
+
uint16_t word;
|
|
67
|
+
while ((word = scalar::utf16::swap_if_needed<big_endian>(
|
|
68
|
+
uint16_t(*buf))) <= 0xff) {
|
|
69
|
+
*latin1_output++ = uint8_t(word);
|
|
70
|
+
buf++;
|
|
71
|
+
}
|
|
72
|
+
return std::make_pair(result(error_code::TOO_LARGE, buf - start),
|
|
73
|
+
latin1_output);
|
|
74
|
+
}
|
|
75
|
+
_mm256_storeu_si256(
|
|
76
|
+
(__m256i *)latin1_output,
|
|
77
|
+
_mm512_castsi512_si256(_mm512_permutexvar_epi8(shufmask, in)));
|
|
78
|
+
latin1_output += 32;
|
|
79
|
+
buf += 32;
|
|
80
|
+
}
|
|
81
|
+
if (buf < end) {
|
|
82
|
+
uint32_t mask(uint32_t(1 << (end - buf)) - 1);
|
|
83
|
+
__m512i in = _mm512_maskz_loadu_epi16(mask, buf);
|
|
84
|
+
if (big_endian) {
|
|
85
|
+
in = _mm512_shuffle_epi8(in, byteflip);
|
|
86
|
+
}
|
|
87
|
+
if (_mm512_cmpgt_epu16_mask(in, v_0xFF)) {
|
|
88
|
+
|
|
89
|
+
uint16_t word;
|
|
90
|
+
while ((word = scalar::utf16::swap_if_needed<big_endian>(
|
|
91
|
+
uint16_t(*buf))) <= 0xff) {
|
|
92
|
+
*latin1_output++ = uint8_t(word);
|
|
93
|
+
buf++;
|
|
94
|
+
}
|
|
95
|
+
return std::make_pair(result(error_code::TOO_LARGE, buf - start),
|
|
96
|
+
latin1_output);
|
|
97
|
+
}
|
|
98
|
+
_mm256_mask_storeu_epi8(
|
|
99
|
+
latin1_output, mask,
|
|
100
|
+
_mm512_castsi512_si256(_mm512_permutexvar_epi8(shufmask, in)));
|
|
101
|
+
}
|
|
102
|
+
return std::make_pair(result(error_code::SUCCESS, len), latin1_output);
|
|
103
|
+
}
|
|
@@ -0,0 +1,136 @@
|
|
|
1
|
+
// file included directly
|
|
2
|
+
|
|
3
|
+
/*
|
|
4
|
+
Returns a pair: the first unprocessed byte from buf and utf32_output
|
|
5
|
+
A scalar routine should carry on the conversion of the tail.
|
|
6
|
+
*/
|
|
7
|
+
template <endianness big_endian>
|
|
8
|
+
std::tuple<const char16_t *, char32_t *, bool>
|
|
9
|
+
convert_utf16_to_utf32(const char16_t *buf, size_t len,
|
|
10
|
+
char32_t *utf32_output) {
|
|
11
|
+
const char16_t *end = buf + len;
|
|
12
|
+
const __m512i v_fc00 = _mm512_set1_epi16((uint16_t)0xfc00);
|
|
13
|
+
const __m512i v_d800 = _mm512_set1_epi16((uint16_t)0xd800);
|
|
14
|
+
const __m512i v_dc00 = _mm512_set1_epi16((uint16_t)0xdc00);
|
|
15
|
+
__mmask32 carry{0};
|
|
16
|
+
const __m512i byteflip = _mm512_setr_epi64(
|
|
17
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809, 0x0607040502030001,
|
|
18
|
+
0x0e0f0c0d0a0b0809, 0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
19
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809);
|
|
20
|
+
while (std::distance(buf, end) >= 32) {
|
|
21
|
+
// Always safe because buf + 32 <= end so that end - buf >= 32 bytes:
|
|
22
|
+
__m512i in = _mm512_loadu_si512((__m512i *)buf);
|
|
23
|
+
if (big_endian) {
|
|
24
|
+
in = _mm512_shuffle_epi8(in, byteflip);
|
|
25
|
+
}
|
|
26
|
+
|
|
27
|
+
// H - bitmask for high surrogates
|
|
28
|
+
const __mmask32 H =
|
|
29
|
+
_mm512_cmpeq_epi16_mask(_mm512_and_si512(in, v_fc00), v_d800);
|
|
30
|
+
// L - bitmask for low surrogates
|
|
31
|
+
const __mmask32 L =
|
|
32
|
+
_mm512_cmpeq_epi16_mask(_mm512_and_si512(in, v_fc00), v_dc00);
|
|
33
|
+
|
|
34
|
+
if ((H | L)) {
|
|
35
|
+
// surrogate pair(s) in a register
|
|
36
|
+
const __mmask32 V =
|
|
37
|
+
(L ^
|
|
38
|
+
(carry | (H << 1))); // A high surrogate must be followed by low one
|
|
39
|
+
// and a low one must be preceded by a high one.
|
|
40
|
+
// If valid, V should be equal to 0
|
|
41
|
+
|
|
42
|
+
if (V == 0) {
|
|
43
|
+
// valid case
|
|
44
|
+
/*
|
|
45
|
+
Input surrogate pair:
|
|
46
|
+
|1101.11aa.aaaa.aaaa|1101.10bb.bbbb.bbbb|
|
|
47
|
+
low surrogate high surrogate
|
|
48
|
+
*/
|
|
49
|
+
/* 1. Expand all code units to 32-bit code units
|
|
50
|
+
in
|
|
51
|
+
|0000.0000.0000.0000.1101.11aa.aaaa.aaaa|0000.0000.0000.0000.1101.10bb.bbbb.bbbb|
|
|
52
|
+
*/
|
|
53
|
+
const __m512i first = _mm512_cvtepu16_epi32(_mm512_castsi512_si256(in));
|
|
54
|
+
const __m512i second =
|
|
55
|
+
_mm512_cvtepu16_epi32(_mm512_extracti32x8_epi32(in, 1));
|
|
56
|
+
|
|
57
|
+
/* 2. Shift by one 16-bit word to align low surrogates with high
|
|
58
|
+
surrogates in
|
|
59
|
+
|0000.0000.0000.0000.1101.11aa.aaaa.aaaa|0000.0000.0000.0000.1101.10bb.bbbb.bbbb|
|
|
60
|
+
shifted
|
|
61
|
+
|????.????.????.????.????.????.????.????|0000.0000.0000.0000.1101.11aa.aaaa.aaaa|
|
|
62
|
+
*/
|
|
63
|
+
const __m512i shifted_first = _mm512_alignr_epi32(second, first, 1);
|
|
64
|
+
const __m512i shifted_second =
|
|
65
|
+
_mm512_alignr_epi32(_mm512_setzero_si512(), second, 1);
|
|
66
|
+
|
|
67
|
+
/* 3. Align all high surrogates in first and second by shifting to the
|
|
68
|
+
left by 10 bits
|
|
69
|
+
|0000.0000.0000.0000.1101.11aa.aaaa.aaaa|0000.0011.0110.bbbb.bbbb.bb00.0000.0000|
|
|
70
|
+
*/
|
|
71
|
+
const __m512i aligned_first =
|
|
72
|
+
_mm512_mask_slli_epi32(first, (__mmask16)H, first, 10);
|
|
73
|
+
const __m512i aligned_second =
|
|
74
|
+
_mm512_mask_slli_epi32(second, (__mmask16)(H >> 16), second, 10);
|
|
75
|
+
|
|
76
|
+
/* 4. Remove surrogate prefixes and add offset 0x10000 by adding in,
|
|
77
|
+
shifted and constant in
|
|
78
|
+
|0000.0000.0000.0000.1101.11aa.aaaa.aaaa|0000.0011.0110.bbbb.bbbb.bb00.0000.0000|
|
|
79
|
+
shifted
|
|
80
|
+
|????.????.????.????.????.????.????.????|0000.0000.0000.0000.1101.11aa.aaaa.aaaa|
|
|
81
|
+
constant|1111.1100.1010.0000.0010.0100.0000.0000|1111.1100.1010.0000.0010.0100.0000.0000|
|
|
82
|
+
*/
|
|
83
|
+
const __m512i constant = _mm512_set1_epi32((uint32_t)0xfca02400);
|
|
84
|
+
const __m512i added_first = _mm512_mask_add_epi32(
|
|
85
|
+
aligned_first, (__mmask16)H, aligned_first, shifted_first);
|
|
86
|
+
const __m512i utf32_first = _mm512_mask_add_epi32(
|
|
87
|
+
added_first, (__mmask16)H, added_first, constant);
|
|
88
|
+
|
|
89
|
+
const __m512i added_second =
|
|
90
|
+
_mm512_mask_add_epi32(aligned_second, (__mmask16)(H >> 16),
|
|
91
|
+
aligned_second, shifted_second);
|
|
92
|
+
const __m512i utf32_second = _mm512_mask_add_epi32(
|
|
93
|
+
added_second, (__mmask16)(H >> 16), added_second, constant);
|
|
94
|
+
|
|
95
|
+
// 5. Store all valid UTF-32 code units (low surrogate positions and
|
|
96
|
+
// 32nd word are invalid)
|
|
97
|
+
const __mmask32 valid = ~L & 0x7fffffff;
|
|
98
|
+
// We deliberately do a _mm512_maskz_compress_epi32 followed by
|
|
99
|
+
// storeu_epi32 to ease performance portability to Zen 4.
|
|
100
|
+
const __m512i compressed_first =
|
|
101
|
+
_mm512_maskz_compress_epi32((__mmask16)(valid), utf32_first);
|
|
102
|
+
const size_t howmany1 = count_ones((uint16_t)(valid));
|
|
103
|
+
_mm512_storeu_si512((__m512i *)utf32_output, compressed_first);
|
|
104
|
+
utf32_output += howmany1;
|
|
105
|
+
const __m512i compressed_second =
|
|
106
|
+
_mm512_maskz_compress_epi32((__mmask16)(valid >> 16), utf32_second);
|
|
107
|
+
const size_t howmany2 = count_ones((uint16_t)(valid >> 16));
|
|
108
|
+
// The following could be unsafe in some cases?
|
|
109
|
+
//_mm512_storeu_epi32((__m512i *) utf32_output, compressed_second);
|
|
110
|
+
_mm512_mask_storeu_epi32((__m512i *)utf32_output,
|
|
111
|
+
__mmask16((1 << howmany2) - 1),
|
|
112
|
+
compressed_second);
|
|
113
|
+
utf32_output += howmany2;
|
|
114
|
+
// Only process 31 code units, but keep track if the 31st word is a high
|
|
115
|
+
// surrogate as a carry
|
|
116
|
+
buf += 31;
|
|
117
|
+
carry = (H >> 30) & 0x1;
|
|
118
|
+
} else {
|
|
119
|
+
// invalid case
|
|
120
|
+
return std::make_tuple(buf + carry, utf32_output, false);
|
|
121
|
+
}
|
|
122
|
+
} else {
|
|
123
|
+
// no surrogates
|
|
124
|
+
// extend all thirty-two 16-bit code units to thirty-two 32-bit code units
|
|
125
|
+
_mm512_storeu_si512((__m512i *)(utf32_output),
|
|
126
|
+
_mm512_cvtepu16_epi32(_mm512_castsi512_si256(in)));
|
|
127
|
+
_mm512_storeu_si512(
|
|
128
|
+
(__m512i *)(utf32_output) + 1,
|
|
129
|
+
_mm512_cvtepu16_epi32(_mm512_extracti32x8_epi32(in, 1)));
|
|
130
|
+
utf32_output += 32;
|
|
131
|
+
buf += 32;
|
|
132
|
+
carry = 0;
|
|
133
|
+
}
|
|
134
|
+
} // while
|
|
135
|
+
return std::make_tuple(buf + carry, utf32_output, true);
|
|
136
|
+
}
|
|
@@ -0,0 +1,206 @@
|
|
|
1
|
+
// file included directly
|
|
2
|
+
|
|
3
|
+
/**
|
|
4
|
+
* This function converts the input (inbuf, inlen), assumed to be valid
|
|
5
|
+
* UTF16 (little endian) into UTF-8 (to outbuf). The number of code units
|
|
6
|
+
* written is written to 'outlen' and the function reports the number of input
|
|
7
|
+
* word consumed.
|
|
8
|
+
*/
|
|
9
|
+
template <endianness big_endian>
|
|
10
|
+
size_t utf16_to_utf8_avx512i(const char16_t *inbuf, size_t inlen,
|
|
11
|
+
unsigned char *outbuf, size_t *outlen) {
|
|
12
|
+
__m512i in;
|
|
13
|
+
__mmask32 inmask = _cvtu32_mask32(0x7fffffff);
|
|
14
|
+
__m512i byteflip = _mm512_setr_epi64(0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
15
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
16
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809,
|
|
17
|
+
0x0607040502030001, 0x0e0f0c0d0a0b0809);
|
|
18
|
+
const char16_t *const inbuf_orig = inbuf;
|
|
19
|
+
const unsigned char *const outbuf_orig = outbuf;
|
|
20
|
+
int adjust = 0;
|
|
21
|
+
int carry = 0;
|
|
22
|
+
|
|
23
|
+
while (inlen >= 32) {
|
|
24
|
+
in = _mm512_loadu_si512(inbuf);
|
|
25
|
+
if (big_endian) {
|
|
26
|
+
in = _mm512_shuffle_epi8(in, byteflip);
|
|
27
|
+
}
|
|
28
|
+
inlen -= 31;
|
|
29
|
+
lastiteration:
|
|
30
|
+
inbuf += 31;
|
|
31
|
+
|
|
32
|
+
failiteration:
|
|
33
|
+
const __mmask32 is234byte = _mm512_mask_cmp_epu16_mask(
|
|
34
|
+
inmask, in, _mm512_set1_epi16(0x0080), _MM_CMPINT_NLT);
|
|
35
|
+
|
|
36
|
+
if (_ktestz_mask32_u8(inmask, is234byte)) {
|
|
37
|
+
// fast path for ASCII only
|
|
38
|
+
_mm512_mask_cvtepi16_storeu_epi8(outbuf, inmask, in);
|
|
39
|
+
outbuf += 31;
|
|
40
|
+
carry = 0;
|
|
41
|
+
|
|
42
|
+
if (inlen < 32) {
|
|
43
|
+
goto tail;
|
|
44
|
+
} else {
|
|
45
|
+
continue;
|
|
46
|
+
}
|
|
47
|
+
}
|
|
48
|
+
|
|
49
|
+
const __mmask32 is12byte =
|
|
50
|
+
_mm512_cmp_epu16_mask(in, _mm512_set1_epi16(0x0800), _MM_CMPINT_LT);
|
|
51
|
+
|
|
52
|
+
if (_ktestc_mask32_u8(is12byte, inmask)) {
|
|
53
|
+
// fast path for 1 and 2 byte only
|
|
54
|
+
|
|
55
|
+
const __m512i twobytes = _mm512_ternarylogic_epi32(
|
|
56
|
+
_mm512_slli_epi16(in, 8), _mm512_srli_epi16(in, 6),
|
|
57
|
+
_mm512_set1_epi16(0x3f3f), 0xa8); // (A|B)&C
|
|
58
|
+
in = _mm512_mask_add_epi16(in, is234byte, twobytes,
|
|
59
|
+
_mm512_set1_epi16(int16_t(0x80c0)));
|
|
60
|
+
const __m512i cmpmask =
|
|
61
|
+
_mm512_mask_blend_epi16(inmask, _mm512_set1_epi16(int16_t(0xffff)),
|
|
62
|
+
_mm512_set1_epi16(0x0800));
|
|
63
|
+
const __mmask64 smoosh =
|
|
64
|
+
_mm512_cmp_epu8_mask(in, cmpmask, _MM_CMPINT_NLT);
|
|
65
|
+
const __m512i out = _mm512_maskz_compress_epi8(smoosh, in);
|
|
66
|
+
_mm512_mask_storeu_epi8(outbuf,
|
|
67
|
+
_cvtu64_mask64(_pext_u64(_cvtmask64_u64(smoosh),
|
|
68
|
+
_cvtmask64_u64(smoosh))),
|
|
69
|
+
out);
|
|
70
|
+
outbuf += 31 + _mm_popcnt_u32(_cvtmask32_u32(is234byte));
|
|
71
|
+
carry = 0;
|
|
72
|
+
|
|
73
|
+
if (inlen < 32) {
|
|
74
|
+
goto tail;
|
|
75
|
+
} else {
|
|
76
|
+
continue;
|
|
77
|
+
}
|
|
78
|
+
}
|
|
79
|
+
__m512i lo = _mm512_cvtepu16_epi32(_mm512_castsi512_si256(in));
|
|
80
|
+
__m512i hi = _mm512_cvtepu16_epi32(_mm512_extracti32x8_epi32(in, 1));
|
|
81
|
+
|
|
82
|
+
__m512i taglo = _mm512_set1_epi32(0x8080e000);
|
|
83
|
+
__m512i taghi = taglo;
|
|
84
|
+
|
|
85
|
+
const __m512i fc00masked =
|
|
86
|
+
_mm512_and_epi32(in, _mm512_set1_epi16(int16_t(0xfc00)));
|
|
87
|
+
const __mmask32 hisurr = _mm512_mask_cmp_epu16_mask(
|
|
88
|
+
inmask, fc00masked, _mm512_set1_epi16(int16_t(0xd800)), _MM_CMPINT_EQ);
|
|
89
|
+
const __mmask32 losurr = _mm512_cmp_epu16_mask(
|
|
90
|
+
fc00masked, _mm512_set1_epi16(int16_t(0xdc00)), _MM_CMPINT_EQ);
|
|
91
|
+
|
|
92
|
+
int carryout = 0;
|
|
93
|
+
if (!_kortestz_mask32_u8(hisurr, losurr)) {
|
|
94
|
+
// handle surrogates
|
|
95
|
+
|
|
96
|
+
__m512i los = _mm512_alignr_epi32(hi, lo, 1);
|
|
97
|
+
__m512i his = _mm512_alignr_epi32(lo, hi, 1);
|
|
98
|
+
|
|
99
|
+
const __mmask32 hisurrhi = _kshiftri_mask32(hisurr, 16);
|
|
100
|
+
taglo = _mm512_mask_mov_epi32(taglo, __mmask16(hisurr),
|
|
101
|
+
_mm512_set1_epi32(0x808080f0));
|
|
102
|
+
taghi = _mm512_mask_mov_epi32(taghi, __mmask16(hisurrhi),
|
|
103
|
+
_mm512_set1_epi32(0x808080f0));
|
|
104
|
+
|
|
105
|
+
lo = _mm512_mask_slli_epi32(lo, __mmask16(hisurr), lo, 10);
|
|
106
|
+
hi = _mm512_mask_slli_epi32(hi, __mmask16(hisurrhi), hi, 10);
|
|
107
|
+
los = _mm512_add_epi32(los, _mm512_set1_epi32(0xfca02400));
|
|
108
|
+
his = _mm512_add_epi32(his, _mm512_set1_epi32(0xfca02400));
|
|
109
|
+
lo = _mm512_mask_add_epi32(lo, __mmask16(hisurr), lo, los);
|
|
110
|
+
hi = _mm512_mask_add_epi32(hi, __mmask16(hisurrhi), hi, his);
|
|
111
|
+
|
|
112
|
+
carryout = _cvtu32_mask32(_kshiftri_mask32(hisurr, 30));
|
|
113
|
+
|
|
114
|
+
const uint32_t h = _cvtmask32_u32(hisurr);
|
|
115
|
+
const uint32_t l = _cvtmask32_u32(losurr);
|
|
116
|
+
// check for mismatched surrogates
|
|
117
|
+
if ((h + h + carry) ^ l) {
|
|
118
|
+
const uint32_t lonohi = l & ~(h + h + carry);
|
|
119
|
+
const uint32_t hinolo = h & ~(l >> 1);
|
|
120
|
+
inlen = _tzcnt_u32(hinolo | lonohi);
|
|
121
|
+
inmask = __mmask32(0x7fffffff & ((1U << inlen) - 1));
|
|
122
|
+
in = _mm512_maskz_mov_epi16(inmask, in);
|
|
123
|
+
adjust = (int)inlen - 31;
|
|
124
|
+
inlen = 0;
|
|
125
|
+
goto failiteration;
|
|
126
|
+
}
|
|
127
|
+
}
|
|
128
|
+
|
|
129
|
+
hi = _mm512_maskz_mov_epi32(_cvtu32_mask16(0x7fff), hi);
|
|
130
|
+
carry = carryout;
|
|
131
|
+
|
|
132
|
+
__m512i mslo =
|
|
133
|
+
_mm512_multishift_epi64_epi8(_mm512_set1_epi64(0x20262c3200060c12), lo);
|
|
134
|
+
|
|
135
|
+
__m512i mshi =
|
|
136
|
+
_mm512_multishift_epi64_epi8(_mm512_set1_epi64(0x20262c3200060c12), hi);
|
|
137
|
+
|
|
138
|
+
const __mmask32 outmask = __mmask32(_kandn_mask64(losurr, inmask));
|
|
139
|
+
const __mmask64 outmhi = _kshiftri_mask64(outmask, 16);
|
|
140
|
+
|
|
141
|
+
const __mmask32 is1byte = __mmask32(_knot_mask64(is234byte));
|
|
142
|
+
const __mmask64 is1bhi = _kshiftri_mask64(is1byte, 16);
|
|
143
|
+
const __mmask64 is12bhi = _kshiftri_mask64(is12byte, 16);
|
|
144
|
+
|
|
145
|
+
taglo = _mm512_mask_mov_epi32(taglo, __mmask16(is12byte),
|
|
146
|
+
_mm512_set1_epi32(0x80c00000));
|
|
147
|
+
taghi = _mm512_mask_mov_epi32(taghi, __mmask16(is12bhi),
|
|
148
|
+
_mm512_set1_epi32(0x80c00000));
|
|
149
|
+
__m512i magiclo = _mm512_mask_blend_epi32(__mmask16(outmask),
|
|
150
|
+
_mm512_set1_epi32(0xffffffff),
|
|
151
|
+
_mm512_set1_epi32(0x00010101));
|
|
152
|
+
__m512i magichi = _mm512_mask_blend_epi32(__mmask16(outmhi),
|
|
153
|
+
_mm512_set1_epi32(0xffffffff),
|
|
154
|
+
_mm512_set1_epi32(0x00010101));
|
|
155
|
+
|
|
156
|
+
magiclo = _mm512_mask_blend_epi32(__mmask16(outmask),
|
|
157
|
+
_mm512_set1_epi32(0xffffffff),
|
|
158
|
+
_mm512_set1_epi32(0x00010101));
|
|
159
|
+
magichi = _mm512_mask_blend_epi32(__mmask16(outmhi),
|
|
160
|
+
_mm512_set1_epi32(0xffffffff),
|
|
161
|
+
_mm512_set1_epi32(0x00010101));
|
|
162
|
+
|
|
163
|
+
mslo = _mm512_ternarylogic_epi32(mslo, _mm512_set1_epi32(0x3f3f3f3f), taglo,
|
|
164
|
+
0xea); // A&B|C
|
|
165
|
+
mshi = _mm512_ternarylogic_epi32(mshi, _mm512_set1_epi32(0x3f3f3f3f), taghi,
|
|
166
|
+
0xea);
|
|
167
|
+
mslo = _mm512_mask_slli_epi32(mslo, __mmask16(is1byte), lo, 24);
|
|
168
|
+
|
|
169
|
+
mshi = _mm512_mask_slli_epi32(mshi, __mmask16(is1bhi), hi, 24);
|
|
170
|
+
|
|
171
|
+
const __mmask64 wantlo =
|
|
172
|
+
_mm512_cmp_epu8_mask(mslo, magiclo, _MM_CMPINT_NLT);
|
|
173
|
+
const __mmask64 wanthi =
|
|
174
|
+
_mm512_cmp_epu8_mask(mshi, magichi, _MM_CMPINT_NLT);
|
|
175
|
+
const __m512i outlo = _mm512_maskz_compress_epi8(wantlo, mslo);
|
|
176
|
+
const __m512i outhi = _mm512_maskz_compress_epi8(wanthi, mshi);
|
|
177
|
+
const uint64_t wantlo_uint64 = _cvtmask64_u64(wantlo);
|
|
178
|
+
const uint64_t wanthi_uint64 = _cvtmask64_u64(wanthi);
|
|
179
|
+
|
|
180
|
+
uint64_t advlo = _mm_popcnt_u64(wantlo_uint64);
|
|
181
|
+
uint64_t advhi = _mm_popcnt_u64(wanthi_uint64);
|
|
182
|
+
|
|
183
|
+
_mm512_mask_storeu_epi8(
|
|
184
|
+
outbuf, _cvtu64_mask64(_pext_u64(wantlo_uint64, wantlo_uint64)), outlo);
|
|
185
|
+
_mm512_mask_storeu_epi8(
|
|
186
|
+
outbuf + advlo, _cvtu64_mask64(_pext_u64(wanthi_uint64, wanthi_uint64)),
|
|
187
|
+
outhi);
|
|
188
|
+
outbuf += advlo + advhi;
|
|
189
|
+
}
|
|
190
|
+
outbuf += -adjust;
|
|
191
|
+
|
|
192
|
+
tail:
|
|
193
|
+
if (inlen != 0) {
|
|
194
|
+
// We must have inlen < 31.
|
|
195
|
+
inmask = _cvtu32_mask32((1U << inlen) - 1);
|
|
196
|
+
in = _mm512_maskz_loadu_epi16(inmask, inbuf);
|
|
197
|
+
if (big_endian) {
|
|
198
|
+
in = _mm512_shuffle_epi8(in, byteflip);
|
|
199
|
+
}
|
|
200
|
+
adjust = (int)inlen - 31;
|
|
201
|
+
inlen = 0;
|
|
202
|
+
goto lastiteration;
|
|
203
|
+
}
|
|
204
|
+
*outlen = (outbuf - outbuf_orig) + adjust;
|
|
205
|
+
return ((inbuf - inbuf_orig) + adjust);
|
|
206
|
+
}
|
|
@@ -0,0 +1,74 @@
|
|
|
1
|
+
// file included directly
|
|
2
|
+
// Converts `len` UTF-32 code points from `buf` to Latin-1 bytes written to
// `latin1_output`, 16 code points per vector step plus one masked step for
// the remainder.
//
// Returns `len` on success, or 0 as soon as a block contains a value above
// 0xff (nothing from that block is written).
size_t icelake_convert_utf32_to_latin1(const char32_t *buf, size_t len,
                                       char *latin1_output) {
  const char32_t *const end = buf + len;
  const __m512i latin1_max = _mm512_set1_epi32(0xff);
  // Byte permutation that gathers the lowest byte of each 32-bit lane into
  // the first 16 bytes of the register.
  const __m512i pick_low_bytes = _mm512_set_epi8(
      0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
      0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 60,
      56, 52, 48, 44, 40, 36, 32, 28, 24, 20, 16, 12, 8, 4, 0);

  // Full blocks of 16 code points.
  for (; end - buf >= 16; buf += 16, latin1_output += 16) {
    const __m512i block = _mm512_loadu_si512((__m512i *)buf);
    if (_mm512_cmpgt_epu32_mask(block, latin1_max) != 0) {
      return 0;
    }
    const __m128i packed =
        _mm512_castsi512_si128(_mm512_permutexvar_epi8(pick_low_bytes, block));
    _mm_storeu_si128((__m128i *)latin1_output, packed);
  }

  // Remainder of 1 to 15 code points: masked load and masked store.
  const auto tail = end - buf;
  if (tail > 0) {
    const uint16_t tail_mask = uint16_t((1 << tail) - 1);
    const __m512i block = _mm512_maskz_loadu_epi32(tail_mask, buf);
    if (_mm512_cmpgt_epu32_mask(block, latin1_max) != 0) {
      return 0;
    }
    const __m128i packed =
        _mm512_castsi512_si128(_mm512_permutexvar_epi8(pick_low_bytes, block));
    _mm_mask_storeu_epi8(latin1_output, tail_mask, packed);
  }
  return len;
}
|
|
33
|
+
|
|
34
|
+
std::pair<result, char *>
|
|
35
|
+
icelake_convert_utf32_to_latin1_with_errors(const char32_t *buf, size_t len,
|
|
36
|
+
char *latin1_output) {
|
|
37
|
+
const char32_t *end = buf + len;
|
|
38
|
+
const char32_t *start = buf;
|
|
39
|
+
__m512i v_0xFF = _mm512_set1_epi32(0xff);
|
|
40
|
+
__m512i shufmask = _mm512_set_epi8(
|
|
41
|
+
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
|
|
42
|
+
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 60,
|
|
43
|
+
56, 52, 48, 44, 40, 36, 32, 28, 24, 20, 16, 12, 8, 4, 0);
|
|
44
|
+
while (end - buf >= 16) {
|
|
45
|
+
__m512i in = _mm512_loadu_si512((__m512i *)buf);
|
|
46
|
+
if (_mm512_cmpgt_epu32_mask(in, v_0xFF)) {
|
|
47
|
+
while (uint32_t(*buf) <= 0xff) {
|
|
48
|
+
*latin1_output++ = uint8_t(*buf++);
|
|
49
|
+
}
|
|
50
|
+
return std::make_pair(result(error_code::TOO_LARGE, buf - start),
|
|
51
|
+
latin1_output);
|
|
52
|
+
}
|
|
53
|
+
_mm_storeu_si128(
|
|
54
|
+
(__m128i *)latin1_output,
|
|
55
|
+
_mm512_castsi512_si128(_mm512_permutexvar_epi8(shufmask, in)));
|
|
56
|
+
latin1_output += 16;
|
|
57
|
+
buf += 16;
|
|
58
|
+
}
|
|
59
|
+
if (buf < end) {
|
|
60
|
+
uint16_t mask = uint16_t((1 << (end - buf)) - 1);
|
|
61
|
+
__m512i in = _mm512_maskz_loadu_epi32(mask, buf);
|
|
62
|
+
if (_mm512_cmpgt_epu32_mask(in, v_0xFF)) {
|
|
63
|
+
while (uint32_t(*buf) <= 0xff) {
|
|
64
|
+
*latin1_output++ = uint8_t(*buf++);
|
|
65
|
+
}
|
|
66
|
+
return std::make_pair(result(error_code::TOO_LARGE, buf - start),
|
|
67
|
+
latin1_output);
|
|
68
|
+
}
|
|
69
|
+
_mm_mask_storeu_epi8(
|
|
70
|
+
latin1_output, mask,
|
|
71
|
+
_mm512_castsi512_si128(_mm512_permutexvar_epi8(shufmask, in)));
|
|
72
|
+
}
|
|
73
|
+
return std::make_pair(result(error_code::SUCCESS, len), latin1_output);
|
|
74
|
+
}
|