react-native-quick-crypto 1.0.19 → 1.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/QuickCrypto.podspec +12 -38
- package/README.md +2 -0
- package/android/CMakeLists.txt +3 -0
- package/cpp/utils/HybridUtils.cpp +39 -77
- package/deps/simdutf/.clang-format +4 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/bug_report.md +62 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/config.yml +1 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/feature_request.md +35 -0
- package/deps/simdutf/.github/ISSUE_TEMPLATE/standard-issue-template.md +29 -0
- package/deps/simdutf/.github/pull_request_template.md +51 -0
- package/deps/simdutf/.github/workflows/aarch64.yml +39 -0
- package/deps/simdutf/.github/workflows/alpine.yml +27 -0
- package/deps/simdutf/.github/workflows/amalgamation_demos.yml +34 -0
- package/deps/simdutf/.github/workflows/armv7.yml +32 -0
- package/deps/simdutf/.github/workflows/atomic_fuzz.yml +25 -0
- package/deps/simdutf/.github/workflows/cifuzz.yml +37 -0
- package/deps/simdutf/.github/workflows/clangformat.yml +36 -0
- package/deps/simdutf/.github/workflows/debian-latestcxxstandards.yml +40 -0
- package/deps/simdutf/.github/workflows/debian.yml +33 -0
- package/deps/simdutf/.github/workflows/documentation.yml +36 -0
- package/deps/simdutf/.github/workflows/emscripten.yml +19 -0
- package/deps/simdutf/.github/workflows/loongarch64-gcc-14.2.yml +39 -0
- package/deps/simdutf/.github/workflows/macos-latest.yml +29 -0
- package/deps/simdutf/.github/workflows/msys2-clang.yml +48 -0
- package/deps/simdutf/.github/workflows/msys2.yml +50 -0
- package/deps/simdutf/.github/workflows/ppc64le.yml +29 -0
- package/deps/simdutf/.github/workflows/rvv-1024-clang-18.yml +35 -0
- package/deps/simdutf/.github/workflows/rvv-128-clang-17.yml +35 -0
- package/deps/simdutf/.github/workflows/rvv-256-gcc-14.yml +31 -0
- package/deps/simdutf/.github/workflows/s390x.yml +29 -0
- package/deps/simdutf/.github/workflows/selective-amalgamation.yml +29 -0
- package/deps/simdutf/.github/workflows/typos.yml +19 -0
- package/deps/simdutf/.github/workflows/ubuntu22-cxx20.yml +30 -0
- package/deps/simdutf/.github/workflows/ubuntu22.yml +32 -0
- package/deps/simdutf/.github/workflows/ubuntu22_gcc12.yml +27 -0
- package/deps/simdutf/.github/workflows/ubuntu22sani.yml +29 -0
- package/deps/simdutf/.github/workflows/ubuntu24-cxxstandards.yml +34 -0
- package/deps/simdutf/.github/workflows/ubuntu24-unsignedchar.yml +34 -0
- package/deps/simdutf/.github/workflows/ubuntu24.yml +32 -0
- package/deps/simdutf/.github/workflows/ubuntu24sani.yml +36 -0
- package/deps/simdutf/.github/workflows/ubuntu24sani_clang.yml +29 -0
- package/deps/simdutf/.github/workflows/vs17-arm-ci.yml +21 -0
- package/deps/simdutf/.github/workflows/vs17-ci-cxx20.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-ci.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-clang-ci.yml +41 -0
- package/deps/simdutf/.github/workflows/vs17-cxxstandards.yml +36 -0
- package/deps/simdutf/AI_USAGE_POLICY.md +56 -0
- package/deps/simdutf/AUTHORS +6 -0
- package/deps/simdutf/CMakeLists.txt +231 -0
- package/deps/simdutf/CONTRIBUTING.md +214 -0
- package/deps/simdutf/CONTRIBUTORS +1 -0
- package/deps/simdutf/Doxyfile +2584 -0
- package/deps/simdutf/LICENSE-APACHE +201 -0
- package/deps/simdutf/LICENSE-MIT +18 -0
- package/deps/simdutf/Makefile.crosscompile +54 -0
- package/deps/simdutf/README-RVV.md +16 -0
- package/deps/simdutf/README.md +2782 -0
- package/deps/simdutf/SECURITY.md +8 -0
- package/deps/simdutf/benchmarks/CMakeLists.txt +101 -0
- package/deps/simdutf/benchmarks/alignment.cpp +150 -0
- package/deps/simdutf/benchmarks/base64/CMakeLists.txt +30 -0
- package/deps/simdutf/benchmarks/base64/benchmark_base64.cpp +875 -0
- package/deps/simdutf/benchmarks/base64/libbase64_spaces.h +49 -0
- package/deps/simdutf/benchmarks/base64/node_base64.h +227 -0
- package/deps/simdutf/benchmarks/base64/openssl3_base64.h +334 -0
- package/deps/simdutf/benchmarks/benchmark.cpp +65 -0
- package/deps/simdutf/benchmarks/benchmark_to_well_formed_utf16.cpp +347 -0
- package/deps/simdutf/benchmarks/competition/.clang-format-ignore +5 -0
- package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.cpp +1276 -0
- package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.h +595 -0
- package/deps/simdutf/benchmarks/competition/README.md +7 -0
- package/deps/simdutf/benchmarks/competition/hoehrmann/hoehrmann.h +91 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16.h +444 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16_tables.h +13183 -0
- package/deps/simdutf/benchmarks/competition/inoue2008/script.py +73 -0
- package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.cpp +738 -0
- package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.h +293 -0
- package/deps/simdutf/benchmarks/competition/u8u16/COPYRIGHT +8 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Makefile +44 -0
- package/deps/simdutf/benchmarks/competition/u8u16/OSL3.0.txt +169 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/BOM_Profiler.h +148 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/i386_timer.h +45 -0
- package/deps/simdutf/benchmarks/competition/u8u16/Profiling/ppc_timer.c +34 -0
- package/deps/simdutf/benchmarks/competition/u8u16/README +56 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/config_defs.h +43 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/g4_config.h +27 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/mmx_config.h +16 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/p4_config.h +18 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/p4_ideal_config.h +16 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/spu_config.h +28 -0
- package/deps/simdutf/benchmarks/competition/u8u16/config/ssse3_config.h +20 -0
- package/deps/simdutf/benchmarks/competition/u8u16/iconv_u8u16.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/altivec_simd.h +440 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_basic_ops.py +121 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_half_operand_versions.py +158 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_test.py +270 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd.h +141 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_basic.h +216 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_built_in.h +119 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_modified.h +2430 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/outline.txt +39 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/spu_simd.h +421 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/sse_simd.h +836 -0
- package/deps/simdutf/benchmarks/competition/u8u16/lib/stdint.h +222 -0
- package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_BE.c +4 -0
- package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_LE.c +5 -0
- package/deps/simdutf/benchmarks/competition/u8u16/proto/u8u16.py +390 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/Makefile +18 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/bytelex.h +448 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/charsets/ASCII_EBCDIC.h +284 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.c +1975 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.pdf +0 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.w +2263 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/multiliteral.h +239 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/u8u16.c +232 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/x8x16.c +194 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.c +193 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.h +167 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.c +288 -0
- package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.h +117 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_g4.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_mmx.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4.c +3 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4_ideal.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_spu.c +2 -0
- package/deps/simdutf/benchmarks/competition/u8u16/u8u16_ssse3.c +3 -0
- package/deps/simdutf/benchmarks/competition/u8u16/x8x16_p4.c +2 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/LICENSE +23 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/data/test_minimal.txt +44 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/readme.md +106 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_corr_tests.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_example.sh +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_file_conv.sh +14 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_lib.sh +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_sample.sh +8 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_corr_tests.cmd +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_example.cmd +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_file_conv.cmd +14 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_lib.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_sample.cmd +8 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_corr_tests.cmd +11 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_example.cmd +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_file_conv.cmd +13 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_lib.cmd +10 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_sample.cmd +9 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/html_table.py +25 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/measure.py +94 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/resize.py +20 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_all.cmd +2 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_interm.cmd +1 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/CustomMemcpy.h +75 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/PerfDefs.h +47 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.cpp +17 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.h +76 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/AllProcessors.cpp +35 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.cpp +117 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.h +210 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferDecoder.h +158 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferEncoder.h +104 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorPlugins.h +334 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorSelector.h +186 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.cpp +140 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.h +42 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderProcess.h +100 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/Dfa.h +57 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.cpp +85 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.h +27 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderProcess.h +126 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/core/ProcessTrivial.h +108 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.cpp +139 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.h +74 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.cpp +65 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.h +91 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/CorrectnessTests.cpp +772 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/Example.cpp +12 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/FileConverter.cpp +486 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/iconv_sample.c +162 -0
- package/deps/simdutf/benchmarks/competition/utf8lut/src/utf8lut.h +15 -0
- package/deps/simdutf/benchmarks/competition/utf8sse4/fromutf8-sse.cpp +292 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/LICENSE +23 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/README.md +1503 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/checked.h +335 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/core.h +338 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp11.h +103 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp17.h +103 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/unchecked.h +274 -0
- package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8.h +34 -0
- package/deps/simdutf/benchmarks/dataset/README.md +155 -0
- package/deps/simdutf/benchmarks/dataset/emoji.txt +204 -0
- package/deps/simdutf/benchmarks/dataset/scripts/utf8type.py +40 -0
- package/deps/simdutf/benchmarks/dataset/wikipedia_mars/Makefile +80 -0
- package/deps/simdutf/benchmarks/dataset/wikipedia_mars/convert_to_utf6.py +20 -0
- package/deps/simdutf/benchmarks/find/CMakeLists.txt +6 -0
- package/deps/simdutf/benchmarks/find/findbenchmark.cpp +63 -0
- package/deps/simdutf/benchmarks/find/findbenchmarker.h +46 -0
- package/deps/simdutf/benchmarks/shortbench.cpp +555 -0
- package/deps/simdutf/benchmarks/src/CMakeLists.txt +52 -0
- package/deps/simdutf/benchmarks/src/apple_arm_events.h +1104 -0
- package/deps/simdutf/benchmarks/src/benchmark.cpp +3899 -0
- package/deps/simdutf/benchmarks/src/benchmark.h +317 -0
- package/deps/simdutf/benchmarks/src/benchmark_base.cpp +144 -0
- package/deps/simdutf/benchmarks/src/benchmark_base.h +98 -0
- package/deps/simdutf/benchmarks/src/cmdline.cpp +176 -0
- package/deps/simdutf/benchmarks/src/cmdline.h +35 -0
- package/deps/simdutf/benchmarks/src/event_counter.h +162 -0
- package/deps/simdutf/benchmarks/src/linux-perf-events.h +104 -0
- package/deps/simdutf/benchmarks/stream.cpp +209 -0
- package/deps/simdutf/benchmarks/threaded.cpp +123 -0
- package/deps/simdutf/cmake/CPM.cmake +1363 -0
- package/deps/simdutf/cmake/JoinPaths.cmake +23 -0
- package/deps/simdutf/cmake/add_cpp_test.cmake +68 -0
- package/deps/simdutf/cmake/simdutf-config.cmake.in +2 -0
- package/deps/simdutf/cmake/simdutf-flags.cmake +26 -0
- package/deps/simdutf/cmake/toolchains-ci/riscv64-linux-gnu.cmake +4 -0
- package/deps/simdutf/cmake/toolchains-dev/README.md +32 -0
- package/deps/simdutf/cmake/toolchains-dev/aarch64.cmake +14 -0
- package/deps/simdutf/cmake/toolchains-dev/loongarch64.cmake +22 -0
- package/deps/simdutf/cmake/toolchains-dev/powerpc64.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/powerpc64le.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/riscv64.cmake +16 -0
- package/deps/simdutf/cmake/toolchains-dev/rvv-spike.cmake +38 -0
- package/deps/simdutf/doc/avx512.png +0 -0
- package/deps/simdutf/doc/logo.png +0 -0
- package/deps/simdutf/doc/logo.svg +165 -0
- package/deps/simdutf/doc/node2023.png +0 -0
- package/deps/simdutf/doc/shortinput.md +78 -0
- package/deps/simdutf/doc/utf16utf8.png +0 -0
- package/deps/simdutf/doc/utf8utf16.png +0 -0
- package/deps/simdutf/doc/widelogo.png +0 -0
- package/deps/simdutf/doxygen.py +50 -0
- package/deps/simdutf/fuzz/.clang-format +9 -0
- package/deps/simdutf/fuzz/CMakeLists.txt +45 -0
- package/deps/simdutf/fuzz/README.md +168 -0
- package/deps/simdutf/fuzz/atomic_base64.cpp +448 -0
- package/deps/simdutf/fuzz/base64.cpp +278 -0
- package/deps/simdutf/fuzz/build.sh +83 -0
- package/deps/simdutf/fuzz/conversion.cpp +669 -0
- package/deps/simdutf/fuzz/helpers/.clang-format-ignore +1 -0
- package/deps/simdutf/fuzz/helpers/common.h +135 -0
- package/deps/simdutf/fuzz/helpers/nameof.hpp +1258 -0
- package/deps/simdutf/fuzz/main.cpp +72 -0
- package/deps/simdutf/fuzz/minimize_and_cleanse.sh +87 -0
- package/deps/simdutf/fuzz/misc.cpp +216 -0
- package/deps/simdutf/fuzz/random_fuzz.sh +154 -0
- package/deps/simdutf/fuzz/roundtrip.cpp +588 -0
- package/deps/simdutf/fuzz/safe_conversion.cpp +104 -0
- package/deps/simdutf/include/simdutf/avx512.h +79 -0
- package/deps/simdutf/include/simdutf/base64_implementation.h +158 -0
- package/deps/simdutf/include/simdutf/base64_tables.h +887 -0
- package/deps/simdutf/include/simdutf/common_defs.h +186 -0
- package/deps/simdutf/include/simdutf/compiler_check.h +50 -0
- package/deps/simdutf/include/simdutf/constexpr_ptr.h +138 -0
- package/deps/simdutf/include/simdutf/encoding_types.h +189 -0
- package/deps/simdutf/include/simdutf/error.h +126 -0
- package/deps/simdutf/include/simdutf/implementation.h +7081 -0
- package/deps/simdutf/include/simdutf/internal/isadetection.h +325 -0
- package/deps/simdutf/include/simdutf/portability.h +285 -0
- package/deps/simdutf/include/simdutf/scalar/ascii.h +86 -0
- package/deps/simdutf/include/simdutf/scalar/atomic_util.h +105 -0
- package/deps/simdutf/include/simdutf/scalar/base64.h +911 -0
- package/deps/simdutf/include/simdutf/scalar/latin1.h +26 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf16/latin1_to_utf16.h +52 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf32/latin1_to_utf32.h +27 -0
- package/deps/simdutf/include/simdutf/scalar/latin1_to_utf8/latin1_to_utf8.h +191 -0
- package/deps/simdutf/include/simdutf/scalar/swap_bytes.h +35 -0
- package/deps/simdutf/include/simdutf/scalar/utf16.h +226 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/utf16_to_latin1.h +108 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/valid_utf16_to_latin1.h +40 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/utf16_to_utf32.h +86 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/valid_utf16_to_utf32.h +44 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/utf16_to_utf8.h +295 -0
- package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/valid_utf16_to_utf8.h +91 -0
- package/deps/simdutf/include/simdutf/scalar/utf32.h +82 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/utf32_to_latin1.h +68 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/valid_utf32_to_latin1.h +67 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/utf32_to_utf16.h +84 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/valid_utf32_to_utf16.h +44 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/utf32_to_utf8.h +142 -0
- package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/valid_utf32_to_utf8.h +72 -0
- package/deps/simdutf/include/simdutf/scalar/utf8.h +326 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/utf8_to_latin1.h +225 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/valid_utf8_to_latin1.h +87 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/utf8_to_utf16.h +342 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/valid_utf8_to_utf16.h +106 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/utf8_to_utf32.h +299 -0
- package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/valid_utf8_to_utf32.h +83 -0
- package/deps/simdutf/include/simdutf/simdutf_version.h +26 -0
- package/deps/simdutf/include/simdutf.h +26 -0
- package/deps/simdutf/include/simdutf_c.h +342 -0
- package/deps/simdutf/riscv/Dockerfile +16 -0
- package/deps/simdutf/riscv/README.md +24 -0
- package/deps/simdutf/riscv/remove-docker-station +8 -0
- package/deps/simdutf/riscv/run-docker-station +31 -0
- package/deps/simdutf/scripts/.flake8 +2 -0
- package/deps/simdutf/scripts/Makefile +2 -0
- package/deps/simdutf/scripts/README_ADD_FUNCTION.md +49 -0
- package/deps/simdutf/scripts/add_function.py +330 -0
- package/deps/simdutf/scripts/amalgamation_tests.py +156 -0
- package/deps/simdutf/scripts/base64/Makefile +2 -0
- package/deps/simdutf/scripts/base64/README.md +2 -0
- package/deps/simdutf/scripts/base64/avx512.py +76 -0
- package/deps/simdutf/scripts/base64/neon_decode.py +143 -0
- package/deps/simdutf/scripts/base64/neon_generate_lut.py +101 -0
- package/deps/simdutf/scripts/base64/sse.py +252 -0
- package/deps/simdutf/scripts/base64/sseregular.py +160 -0
- package/deps/simdutf/scripts/base64/sseurl.py +283 -0
- package/deps/simdutf/scripts/base64/table.py +59 -0
- package/deps/simdutf/scripts/base64bench_print.py +145 -0
- package/deps/simdutf/scripts/benchmark-all.py +119 -0
- package/deps/simdutf/scripts/benchmark_print.py +324 -0
- package/deps/simdutf/scripts/check_feature_macros.py +156 -0
- package/deps/simdutf/scripts/check_typos.sh +13 -0
- package/deps/simdutf/scripts/clang_format.sh +35 -0
- package/deps/simdutf/scripts/clang_format_docker.sh +38 -0
- package/deps/simdutf/scripts/common.py +24 -0
- package/deps/simdutf/scripts/compilation_benchmark.py +55 -0
- package/deps/simdutf/scripts/compile_many_variations.sh +64 -0
- package/deps/simdutf/scripts/create_latex_table.py +62 -0
- package/deps/simdutf/scripts/docker/Dockerfile +14 -0
- package/deps/simdutf/scripts/docker/Makefile +9 -0
- package/deps/simdutf/scripts/docker/README.md +30 -0
- package/deps/simdutf/scripts/docker/llvm.gpg +0 -0
- package/deps/simdutf/scripts/ppc64_convert_utf16_to_utf8.py +155 -0
- package/deps/simdutf/scripts/prepare_doxygen.sh +21 -0
- package/deps/simdutf/scripts/release.py +197 -0
- package/deps/simdutf/scripts/shortinputplots.py +97 -0
- package/deps/simdutf/scripts/sse_convert_utf16_to_utf8.py +422 -0
- package/deps/simdutf/scripts/sse_convert_utf32_to_utf16.py +105 -0
- package/deps/simdutf/scripts/sse_utf8_utf16_decode.py +186 -0
- package/deps/simdutf/scripts/sse_validate_utf16le_proof.py +137 -0
- package/deps/simdutf/scripts/sse_validate_utf16le_testcases.py +129 -0
- package/deps/simdutf/scripts/table.py +207 -0
- package/deps/simdutf/scripts/tests/new.txt +33 -0
- package/deps/simdutf/scripts/tests/old.txt +33 -0
- package/deps/simdutf/scripts/tests/results.txt +272 -0
- package/deps/simdutf/simdutf.pc.in +11 -0
- package/deps/simdutf/singleheader/.flake8 +2 -0
- package/deps/simdutf/singleheader/CMakeLists.txt +64 -0
- package/deps/simdutf/singleheader/README-dev.md +81 -0
- package/deps/simdutf/singleheader/README.md +19 -0
- package/deps/simdutf/singleheader/amalgamate.py +513 -0
- package/deps/simdutf/singleheader/amalgamation_demo.c +59 -0
- package/deps/simdutf/singleheader/amalgamation_demo.cpp +54 -0
- package/deps/simdutf/singleheader/test-features.py +262 -0
- package/deps/simdutf/src/CMakeLists.txt +78 -0
- package/deps/simdutf/src/arm64/arm_base64.cpp +791 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf16.cpp +24 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf32.cpp +24 -0
- package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf8.cpp +70 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_latin1.cpp +61 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf32.cpp +185 -0
- package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf8.cpp +780 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_latin1.cpp +60 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf16.cpp +208 -0
- package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf8.cpp +505 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_latin1.cpp +69 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf16.cpp +313 -0
- package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf32.cpp +179 -0
- package/deps/simdutf/src/arm64/arm_find.cpp +199 -0
- package/deps/simdutf/src/arm64/arm_utf16fix.cpp +185 -0
- package/deps/simdutf/src/arm64/arm_validate_utf16.cpp +165 -0
- package/deps/simdutf/src/arm64/arm_validate_utf32le.cpp +65 -0
- package/deps/simdutf/src/arm64/implementation.cpp +1442 -0
- package/deps/simdutf/src/encoding_types.cpp +67 -0
- package/deps/simdutf/src/error.cpp +3 -0
- package/deps/simdutf/src/fallback/implementation.cpp +589 -0
- package/deps/simdutf/src/generic/ascii_validation.h +50 -0
- package/deps/simdutf/src/generic/base64.h +233 -0
- package/deps/simdutf/src/generic/base64lengths.h +63 -0
- package/deps/simdutf/src/generic/buf_block_reader.h +109 -0
- package/deps/simdutf/src/generic/find.h +75 -0
- package/deps/simdutf/src/generic/utf16/change_endianness.h +24 -0
- package/deps/simdutf/src/generic/utf16/count_code_points_bytemask.h +58 -0
- package/deps/simdutf/src/generic/utf16/to_well_formed.h +93 -0
- package/deps/simdutf/src/generic/utf16/utf32_length_from_utf16.h +15 -0
- package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16.h +35 -0
- package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16_bytemask.h +199 -0
- package/deps/simdutf/src/generic/utf16.h +73 -0
- package/deps/simdutf/src/generic/utf32.h +136 -0
- package/deps/simdutf/src/generic/utf8/utf16_length_from_utf8_bytemask.h +53 -0
- package/deps/simdutf/src/generic/utf8.h +92 -0
- package/deps/simdutf/src/generic/utf8_to_latin1/utf8_to_latin1.h +316 -0
- package/deps/simdutf/src/generic/utf8_to_latin1/valid_utf8_to_latin1.h +78 -0
- package/deps/simdutf/src/generic/utf8_to_utf16/utf8_to_utf16.h +332 -0
- package/deps/simdutf/src/generic/utf8_to_utf16/valid_utf8_to_utf16.h +74 -0
- package/deps/simdutf/src/generic/utf8_to_utf32/utf8_to_utf32.h +318 -0
- package/deps/simdutf/src/generic/utf8_to_utf32/valid_utf8_to_utf32.h +42 -0
- package/deps/simdutf/src/generic/utf8_validation/utf8_lookup4_algorithm.h +223 -0
- package/deps/simdutf/src/generic/utf8_validation/utf8_validator.h +84 -0
- package/deps/simdutf/src/generic/validate_utf16.h +164 -0
- package/deps/simdutf/src/generic/validate_utf32.h +99 -0
- package/deps/simdutf/src/haswell/avx2_base64.cpp +837 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf16.cpp +28 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf32.cpp +20 -0
- package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf8.cpp +83 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_latin1.cpp +83 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf32.cpp +210 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf8.cpp +602 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_latin1.cpp +116 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf16.cpp +164 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf8.cpp +569 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_latin1.cpp +60 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf16.cpp +195 -0
- package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf32.cpp +135 -0
- package/deps/simdutf/src/haswell/avx2_utf16fix.cpp +173 -0
- package/deps/simdutf/src/haswell/avx2_validate_utf16.cpp +17 -0
- package/deps/simdutf/src/haswell/implementation.cpp +1447 -0
- package/deps/simdutf/src/icelake/icelake_ascii_validation.inl.cpp +19 -0
- package/deps/simdutf/src/icelake/icelake_base64.inl.cpp +630 -0
- package/deps/simdutf/src/icelake/icelake_common.inl.cpp +37 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf16.inl.cpp +36 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf32.inl.cpp +23 -0
- package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf8.inl.cpp +107 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_latin1.inl.cpp +103 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf32.inl.cpp +136 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf8.inl.cpp +206 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_latin1.inl.cpp +74 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf16.inl.cpp +338 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf8.inl.cpp +574 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf8_to_latin1.inl.cpp +104 -0
- package/deps/simdutf/src/icelake/icelake_convert_utf8_to_utf16.inl.cpp +75 -0
- package/deps/simdutf/src/icelake/icelake_convert_valid_utf8_to_latin1.inl.cpp +69 -0
- package/deps/simdutf/src/icelake/icelake_find.inl.cpp +146 -0
- package/deps/simdutf/src/icelake/icelake_from_utf8.inl.cpp +266 -0
- package/deps/simdutf/src/icelake/icelake_from_valid_utf8.inl.cpp +136 -0
- package/deps/simdutf/src/icelake/icelake_macros.inl.cpp +143 -0
- package/deps/simdutf/src/icelake/icelake_utf16fix.cpp +138 -0
- package/deps/simdutf/src/icelake/icelake_utf32_validation.inl.cpp +63 -0
- package/deps/simdutf/src/icelake/icelake_utf8_common.inl.cpp +753 -0
- package/deps/simdutf/src/icelake/icelake_utf8_length_from_utf16.inl.cpp +269 -0
- package/deps/simdutf/src/icelake/icelake_utf8_validation.inl.cpp +116 -0
- package/deps/simdutf/src/icelake/implementation.cpp +1903 -0
- package/deps/simdutf/src/implementation.cpp +2526 -0
- package/deps/simdutf/src/lasx/implementation.cpp +1531 -0
- package/deps/simdutf/src/lasx/lasx_base64.cpp +695 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf16.cpp +76 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf32.cpp +55 -0
- package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf8.cpp +65 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_latin1.cpp +64 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf32.cpp +183 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf8.cpp +550 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_latin1.cpp +73 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf16.cpp +218 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf8.cpp +589 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_latin1.cpp +72 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf16.cpp +296 -0
- package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf32.cpp +190 -0
- package/deps/simdutf/src/lasx/lasx_find.cpp +64 -0
- package/deps/simdutf/src/lasx/lasx_validate_utf16.cpp +13 -0
- package/deps/simdutf/src/lasx/lasx_validate_utf32le.cpp +84 -0
- package/deps/simdutf/src/lsx/implementation.cpp +1417 -0
- package/deps/simdutf/src/lsx/lsx_base64.cpp +675 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf16.cpp +39 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf32.cpp +27 -0
- package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf8.cpp +56 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_latin1.cpp +64 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf32.cpp +133 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf8.cpp +518 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_latin1.cpp +66 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf16.cpp +155 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf8.cpp +459 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_latin1.cpp +75 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf16.cpp +291 -0
- package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf32.cpp +179 -0
- package/deps/simdutf/src/lsx/lsx_find.cpp +60 -0
- package/deps/simdutf/src/lsx/lsx_validate_utf16.cpp +13 -0
- package/deps/simdutf/src/lsx/lsx_validate_utf32le.cpp +68 -0
- package/deps/simdutf/src/ppc64/implementation.cpp +992 -0
- package/deps/simdutf/src/ppc64/ppc64_base64.cpp +480 -0
- package/deps/simdutf/src/ppc64/ppc64_base64_internal_tests.cpp +401 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf16.cpp +12 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf32.cpp +12 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf8.cpp +149 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_latin1.cpp +67 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf32.cpp +87 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf8.cpp +296 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_latin1.cpp +57 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf16.cpp +117 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf8.cpp +166 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_latin1.cpp +69 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf16.cpp +211 -0
- package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf32.cpp +153 -0
- package/deps/simdutf/src/ppc64/ppc64_utf16_to_utf8_tables.h +1011 -0
- package/deps/simdutf/src/ppc64/ppc64_utf8_length_from_latin1.cpp +37 -0
- package/deps/simdutf/src/ppc64/ppc64_validate_utf16.cpp +19 -0
- package/deps/simdutf/src/ppc64/templates.cpp +91 -0
- package/deps/simdutf/src/rvv/implementation.cpp +138 -0
- package/deps/simdutf/src/rvv/rvv_find.cpp +27 -0
- package/deps/simdutf/src/rvv/rvv_helpers.inl.cpp +23 -0
- package/deps/simdutf/src/rvv/rvv_latin1_to.inl.cpp +71 -0
- package/deps/simdutf/src/rvv/rvv_length_from.inl.cpp +164 -0
- package/deps/simdutf/src/rvv/rvv_utf16_to.inl.cpp +399 -0
- package/deps/simdutf/src/rvv/rvv_utf16fix.cpp +110 -0
- package/deps/simdutf/src/rvv/rvv_utf32_to.inl.cpp +307 -0
- package/deps/simdutf/src/rvv/rvv_utf8_to.inl.cpp +435 -0
- package/deps/simdutf/src/rvv/rvv_validate.inl.cpp +275 -0
- package/deps/simdutf/src/simdutf/arm64/begin.h +2 -0
- package/deps/simdutf/src/simdutf/arm64/bitmanipulation.h +34 -0
- package/deps/simdutf/src/simdutf/arm64/end.h +2 -0
- package/deps/simdutf/src/simdutf/arm64/implementation.h +307 -0
- package/deps/simdutf/src/simdutf/arm64/intrinsics.h +10 -0
- package/deps/simdutf/src/simdutf/arm64/simd.h +547 -0
- package/deps/simdutf/src/simdutf/arm64/simd16-inl.h +403 -0
- package/deps/simdutf/src/simdutf/arm64/simd32-inl.h +129 -0
- package/deps/simdutf/src/simdutf/arm64/simd64-inl.h +28 -0
- package/deps/simdutf/src/simdutf/arm64.h +43 -0
- package/deps/simdutf/src/simdutf/fallback/begin.h +1 -0
- package/deps/simdutf/src/simdutf/fallback/bitmanipulation.h +13 -0
- package/deps/simdutf/src/simdutf/fallback/end.h +1 -0
- package/deps/simdutf/src/simdutf/fallback/implementation.h +331 -0
- package/deps/simdutf/src/simdutf/fallback.h +42 -0
- package/deps/simdutf/src/simdutf/haswell/begin.h +15 -0
- package/deps/simdutf/src/simdutf/haswell/bitmanipulation.h +35 -0
- package/deps/simdutf/src/simdutf/haswell/end.h +13 -0
- package/deps/simdutf/src/simdutf/haswell/implementation.h +338 -0
- package/deps/simdutf/src/simdutf/haswell/intrinsics.h +67 -0
- package/deps/simdutf/src/simdutf/haswell/simd.h +363 -0
- package/deps/simdutf/src/simdutf/haswell/simd16-inl.h +261 -0
- package/deps/simdutf/src/simdutf/haswell/simd32-inl.h +111 -0
- package/deps/simdutf/src/simdutf/haswell/simd64-inl.h +34 -0
- package/deps/simdutf/src/simdutf/haswell.h +63 -0
- package/deps/simdutf/src/simdutf/icelake/begin.h +14 -0
- package/deps/simdutf/src/simdutf/icelake/bitmanipulation.h +44 -0
- package/deps/simdutf/src/simdutf/icelake/end.h +12 -0
- package/deps/simdutf/src/simdutf/icelake/implementation.h +346 -0
- package/deps/simdutf/src/simdutf/icelake/intrinsics.h +138 -0
- package/deps/simdutf/src/simdutf/icelake/simd.h +17 -0
- package/deps/simdutf/src/simdutf/icelake/simd16-inl.h +90 -0
- package/deps/simdutf/src/simdutf/icelake/simd32-inl.h +47 -0
- package/deps/simdutf/src/simdutf/icelake.h +81 -0
- package/deps/simdutf/src/simdutf/lasx/begin.h +8 -0
- package/deps/simdutf/src/simdutf/lasx/bitmanipulation.h +25 -0
- package/deps/simdutf/src/simdutf/lasx/end.h +8 -0
- package/deps/simdutf/src/simdutf/lasx/implementation.h +310 -0
- package/deps/simdutf/src/simdutf/lasx/intrinsics.h +319 -0
- package/deps/simdutf/src/simdutf/lasx/simd.h +551 -0
- package/deps/simdutf/src/simdutf/lasx/simd16-inl.h +234 -0
- package/deps/simdutf/src/simdutf/lasx/simd32-inl.h +74 -0
- package/deps/simdutf/src/simdutf/lasx/simd64-inl.h +52 -0
- package/deps/simdutf/src/simdutf/lasx.h +49 -0
- package/deps/simdutf/src/simdutf/lsx/begin.h +2 -0
- package/deps/simdutf/src/simdutf/lsx/bitmanipulation.h +25 -0
- package/deps/simdutf/src/simdutf/lsx/end.h +2 -0
- package/deps/simdutf/src/simdutf/lsx/implementation.h +309 -0
- package/deps/simdutf/src/simdutf/lsx/intrinsics.h +196 -0
- package/deps/simdutf/src/simdutf/lsx/simd.h +421 -0
- package/deps/simdutf/src/simdutf/lsx/simd16-inl.h +242 -0
- package/deps/simdutf/src/simdutf/lsx/simd32-inl.h +69 -0
- package/deps/simdutf/src/simdutf/lsx/simd64-inl.h +50 -0
- package/deps/simdutf/src/simdutf/lsx.h +52 -0
- package/deps/simdutf/src/simdutf/ppc64/begin.h +1 -0
- package/deps/simdutf/src/simdutf/ppc64/bitmanipulation.h +29 -0
- package/deps/simdutf/src/simdutf/ppc64/end.h +1 -0
- package/deps/simdutf/src/simdutf/ppc64/implementation.h +348 -0
- package/deps/simdutf/src/simdutf/ppc64/intrinsics.h +19 -0
- package/deps/simdutf/src/simdutf/ppc64/simd.h +177 -0
- package/deps/simdutf/src/simdutf/ppc64/simd16-inl.h +327 -0
- package/deps/simdutf/src/simdutf/ppc64/simd32-inl.h +247 -0
- package/deps/simdutf/src/simdutf/ppc64/simd8-inl.h +618 -0
- package/deps/simdutf/src/simdutf/ppc64.h +40 -0
- package/deps/simdutf/src/simdutf/rvv/begin.h +7 -0
- package/deps/simdutf/src/simdutf/rvv/end.h +7 -0
- package/deps/simdutf/src/simdutf/rvv/implementation.h +321 -0
- package/deps/simdutf/src/simdutf/rvv/intrinsics.h +131 -0
- package/deps/simdutf/src/simdutf/rvv.h +41 -0
- package/deps/simdutf/src/simdutf/westmere/begin.h +8 -0
- package/deps/simdutf/src/simdutf/westmere/bitmanipulation.h +37 -0
- package/deps/simdutf/src/simdutf/westmere/end.h +8 -0
- package/deps/simdutf/src/simdutf/westmere/implementation.h +338 -0
- package/deps/simdutf/src/simdutf/westmere/intrinsics.h +38 -0
- package/deps/simdutf/src/simdutf/westmere/simd.h +379 -0
- package/deps/simdutf/src/simdutf/westmere/simd16-inl.h +242 -0
- package/deps/simdutf/src/simdutf/westmere/simd32-inl.h +151 -0
- package/deps/simdutf/src/simdutf/westmere/simd64-inl.h +33 -0
- package/deps/simdutf/src/simdutf/westmere.h +59 -0
- package/deps/simdutf/src/simdutf.cpp +152 -0
- package/deps/simdutf/src/simdutf_c.cpp +525 -0
- package/deps/simdutf/src/tables/utf16_to_utf8_tables.h +768 -0
- package/deps/simdutf/src/tables/utf32_to_utf16_tables.h +53 -0
- package/deps/simdutf/src/tables/utf8_to_utf16_tables.h +826 -0
- package/deps/simdutf/src/westmere/implementation.cpp +1479 -0
- package/deps/simdutf/src/westmere/internal/loader.cpp +7 -0
- package/deps/simdutf/src/westmere/internal/write_v_u16_11bits_to_utf8.cpp +66 -0
- package/deps/simdutf/src/westmere/sse_base64.cpp +672 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf16.cpp +21 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf32.cpp +31 -0
- package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf8.cpp +71 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_latin1.cpp +70 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf32.cpp +206 -0
- package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf8.cpp +504 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_latin1.cpp +82 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf16.cpp +209 -0
- package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf8.cpp +589 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_latin1.cpp +58 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf16.cpp +197 -0
- package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf32.cpp +141 -0
- package/deps/simdutf/src/westmere/sse_utf16fix.cpp +82 -0
- package/deps/simdutf/src/westmere/sse_validate_utf16.cpp +17 -0
- package/deps/simdutf/tests/CMakeLists.txt +483 -0
- package/deps/simdutf/tests/atomic_base64_tests.cpp +2845 -0
- package/deps/simdutf/tests/base64_tests.cpp +3617 -0
- package/deps/simdutf/tests/basic_fuzzer.cpp +805 -0
- package/deps/simdutf/tests/bele_tests.cpp +182 -0
- package/deps/simdutf/tests/constexpr_base64_tests.cpp +387 -0
- package/deps/simdutf/tests/convert_latin1_to_utf16be_tests.cpp +52 -0
- package/deps/simdutf/tests/convert_latin1_to_utf16le_tests.cpp +80 -0
- package/deps/simdutf/tests/convert_latin1_to_utf32_tests.cpp +66 -0
- package/deps/simdutf/tests/convert_latin1_to_utf8_tests.cpp +120 -0
- package/deps/simdutf/tests/convert_utf16_to_utf8_safe_tests.cpp +203 -0
- package/deps/simdutf/tests/convert_utf16_to_utf8_with_replacement_tests.cpp +276 -0
- package/deps/simdutf/tests/convert_utf16be_to_latin1_tests.cpp +109 -0
- package/deps/simdutf/tests/convert_utf16be_to_latin1_tests_with_errors.cpp +136 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf32_tests.cpp +193 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf32_with_errors_tests.cpp +381 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf8_tests.cpp +259 -0
- package/deps/simdutf/tests/convert_utf16be_to_utf8_with_errors_tests.cpp +266 -0
- package/deps/simdutf/tests/convert_utf16le_to_latin1_tests.cpp +148 -0
- package/deps/simdutf/tests/convert_utf16le_to_latin1_tests_with_errors.cpp +176 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf32_tests.cpp +213 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf32_with_errors_tests.cpp +318 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf8_tests.cpp +343 -0
- package/deps/simdutf/tests/convert_utf16le_to_utf8_with_errors_tests.cpp +271 -0
- package/deps/simdutf/tests/convert_utf32_to_latin1_tests.cpp +111 -0
- package/deps/simdutf/tests/convert_utf32_to_latin1_with_errors_tests.cpp +96 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16be_tests.cpp +148 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16be_with_errors_tests.cpp +192 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16le_tests.cpp +166 -0
- package/deps/simdutf/tests/convert_utf32_to_utf16le_with_errors_tests.cpp +215 -0
- package/deps/simdutf/tests/convert_utf32_to_utf8_tests.cpp +181 -0
- package/deps/simdutf/tests/convert_utf32_to_utf8_with_errors_tests.cpp +261 -0
- package/deps/simdutf/tests/convert_utf8_to_latin1_tests.cpp +516 -0
- package/deps/simdutf/tests/convert_utf8_to_latin1_with_errors_tests.cpp +579 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16be_tests.cpp +412 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16be_with_errors_tests.cpp +480 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16le_tests.cpp +671 -0
- package/deps/simdutf/tests/convert_utf8_to_utf16le_with_errors_tests.cpp +455 -0
- package/deps/simdutf/tests/convert_utf8_to_utf32_tests.cpp +1204 -0
- package/deps/simdutf/tests/convert_utf8_to_utf32_with_errors_tests.cpp +337 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_latin1_tests.cpp +37 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_utf32_tests.cpp +97 -0
- package/deps/simdutf/tests/convert_valid_utf16be_to_utf8_tests.cpp +126 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_latin1_tests.cpp +71 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_utf32_tests.cpp +122 -0
- package/deps/simdutf/tests/convert_valid_utf16le_to_utf8_tests.cpp +244 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_latin1_tests.cpp +49 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf16be_tests.cpp +92 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf16le_tests.cpp +114 -0
- package/deps/simdutf/tests/convert_valid_utf32_to_utf8_tests.cpp +109 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_latin1_tests.cpp +84 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf16be_tests.cpp +124 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf16le_tests.cpp +221 -0
- package/deps/simdutf/tests/convert_valid_utf8_to_utf32_tests.cpp +155 -0
- package/deps/simdutf/tests/count_utf16be.cpp +64 -0
- package/deps/simdutf/tests/count_utf16le.cpp +61 -0
- package/deps/simdutf/tests/count_utf8.cpp +87 -0
- package/deps/simdutf/tests/detect_encodings_tests.cpp +312 -0
- package/deps/simdutf/tests/embed/valid_utf8.txt +1 -0
- package/deps/simdutf/tests/embed_tests.cpp +22 -0
- package/deps/simdutf/tests/find_tests.cpp +77 -0
- package/deps/simdutf/tests/fixed_string_tests.cpp +153 -0
- package/deps/simdutf/tests/helpers/CMakeLists.txt +25 -0
- package/deps/simdutf/tests/helpers/compiletime_conversions.h +222 -0
- package/deps/simdutf/tests/helpers/fixed_string.h +267 -0
- package/deps/simdutf/tests/helpers/random_int.cpp +30 -0
- package/deps/simdutf/tests/helpers/random_int.h +39 -0
- package/deps/simdutf/tests/helpers/random_utf16.cpp +123 -0
- package/deps/simdutf/tests/helpers/random_utf16.h +52 -0
- package/deps/simdutf/tests/helpers/random_utf32.cpp +41 -0
- package/deps/simdutf/tests/helpers/random_utf32.h +40 -0
- package/deps/simdutf/tests/helpers/random_utf8.cpp +93 -0
- package/deps/simdutf/tests/helpers/random_utf8.h +36 -0
- package/deps/simdutf/tests/helpers/test.cpp +231 -0
- package/deps/simdutf/tests/helpers/test.h +193 -0
- package/deps/simdutf/tests/helpers/transcode_test_base.cpp +1257 -0
- package/deps/simdutf/tests/helpers/transcode_test_base.h +683 -0
- package/deps/simdutf/tests/helpers/utf16.h +27 -0
- package/deps/simdutf/tests/installation_tests/find/CMakeLists.txt +43 -0
- package/deps/simdutf/tests/installation_tests/from_fetch/CMakeLists.txt +47 -0
- package/deps/simdutf/tests/internal_tests.cpp +27 -0
- package/deps/simdutf/tests/null_safety_tests.cpp +94 -0
- package/deps/simdutf/tests/random_fuzzer.cpp +779 -0
- package/deps/simdutf/tests/readme_tests.cpp +274 -0
- package/deps/simdutf/tests/reference/CMakeLists.txt +23 -0
- package/deps/simdutf/tests/reference/decode_utf16.h +81 -0
- package/deps/simdutf/tests/reference/decode_utf32.h +47 -0
- package/deps/simdutf/tests/reference/encode_latin1.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_latin1.h +32 -0
- package/deps/simdutf/tests/reference/encode_utf16.cpp +49 -0
- package/deps/simdutf/tests/reference/encode_utf16.h +20 -0
- package/deps/simdutf/tests/reference/encode_utf32.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_utf32.h +36 -0
- package/deps/simdutf/tests/reference/encode_utf8.cpp +1 -0
- package/deps/simdutf/tests/reference/encode_utf8.h +40 -0
- package/deps/simdutf/tests/reference/validate_utf16.cpp +60 -0
- package/deps/simdutf/tests/reference/validate_utf16.h +14 -0
- package/deps/simdutf/tests/reference/validate_utf16_to_latin1.cpp +35 -0
- package/deps/simdutf/tests/reference/validate_utf16_to_latin1.h +13 -0
- package/deps/simdutf/tests/reference/validate_utf32.cpp +27 -0
- package/deps/simdutf/tests/reference/validate_utf32.h +12 -0
- package/deps/simdutf/tests/reference/validate_utf32_to_latin1.cpp +27 -0
- package/deps/simdutf/tests/reference/validate_utf32_to_latin1.h +12 -0
- package/deps/simdutf/tests/reference/validate_utf8.cpp +82 -0
- package/deps/simdutf/tests/reference/validate_utf8.h +11 -0
- package/deps/simdutf/tests/reference/validate_utf8_to_latin1.cpp +43 -0
- package/deps/simdutf/tests/reference/validate_utf8_to_latin1.h +12 -0
- package/deps/simdutf/tests/select_implementation.cpp +43 -0
- package/deps/simdutf/tests/simdutf_c_tests.cpp +244 -0
- package/deps/simdutf/tests/span_tests.cpp +401 -0
- package/deps/simdutf/tests/special_tests.cpp +559 -0
- package/deps/simdutf/tests/straight_c_test.c +187 -0
- package/deps/simdutf/tests/text_encoding_tests.cpp +77 -0
- package/deps/simdutf/tests/to_well_formed_utf16_tests.cpp +377 -0
- package/deps/simdutf/tests/utf8_length_from_utf16_tests.cpp +202 -0
- package/deps/simdutf/tests/validate_ascii_basic_tests.cpp +165 -0
- package/deps/simdutf/tests/validate_ascii_with_errors_tests.cpp +77 -0
- package/deps/simdutf/tests/validate_utf16be_basic_tests.cpp +175 -0
- package/deps/simdutf/tests/validate_utf16be_with_errors_tests.cpp +188 -0
- package/deps/simdutf/tests/validate_utf16le_basic_tests.cpp +268 -0
- package/deps/simdutf/tests/validate_utf16le_with_errors_tests.cpp +274 -0
- package/deps/simdutf/tests/validate_utf32_basic_tests.cpp +92 -0
- package/deps/simdutf/tests/validate_utf32_with_errors_tests.cpp +114 -0
- package/deps/simdutf/tests/validate_utf8_basic_tests.cpp +178 -0
- package/deps/simdutf/tests/validate_utf8_brute_force_tests.cpp +88 -0
- package/deps/simdutf/tests/validate_utf8_puzzler_tests.cpp +33 -0
- package/deps/simdutf/tests/validate_utf8_with_errors_tests.cpp +228 -0
- package/deps/simdutf/tools/CMakeLists.txt +85 -0
- package/deps/simdutf/tools/fastbase64.cpp +250 -0
- package/deps/simdutf/tools/sutf.cpp +556 -0
- package/deps/simdutf/tools/sutf.h +40 -0
- package/package.json +2 -2
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
#pragma once
|
|
2
|
+
|
|
3
|
+
#include <stdint.h>
|
|
4
|
+
#include <emmintrin.h>
|
|
5
|
+
#include "../base/PerfDefs.h"
|
|
6
|
+
|
|
7
|
+
//Integer view of a 16-byte LUT slot: DecoderCoreInfo places this struct in a union with the __m128i shufC,
//so the first two words alias the low 8 bytes of shufC and the two step counters alias its high 8 bytes.
struct shufstep {
|
|
8
|
+
uint32_t _shufC_part0; //aliases bytes 0..3 of shufC
|
|
9
|
+
uint32_t _shufC_part1; //aliases bytes 4..7 of shufC
|
|
10
|
+
uint32_t srcStep; //number of bytes processed in input buffer
|
|
11
|
+
uint32_t dstStep; //number of symbols produced in output buffer (doubled); DecoderCore advances the output by dstStep * (OutputType/2) bytes
|
|
12
|
+
};
|
|
13
|
+
|
|
14
|
+
//Per-mask shuffle data that DecoderCore needs in every mode (validating or not).
struct DecoderCoreInfo {
|
|
15
|
+
__m128i shufAB; //shuffling mask to get lower two bytes of symbols
|
|
16
|
+
//shufC and s share the same 16 bytes: DecoderCore only feeds the low 8 bytes of shufC to the shuffle
//(via _mm_unpacklo_epi8(shufC, shufC)), and reads the step counters through s.srcStep / s.dstStep
union {
|
|
17
|
+
__m128i shufC; //shuffling mask to get third bytes of symbols
|
|
18
|
+
shufstep s;
|
|
19
|
+
};
|
|
20
|
+
};
|
|
21
|
+
//Extra per-mask data that DecoderCore reads only when its Validate template parameter is true.
struct DecoderValidationInfo {
|
|
22
|
+
__m128i headerMask; //mask of "111..10" bits required in each byte; DecoderCore compares (input & headerMask) against (headerMask + headerMask)
|
|
23
|
+
__m128i minValues; //minimal value allowed for not being overlong (sign-shifted, 16-bit); compared against (decoded ^ 0x8000) with a signed 16-bit less-than
|
|
24
|
+
};
|
|
25
|
+
|
|
26
|
+
//a single entry of each LUT is defined
|
|
27
|
+
//primary template is intentionally empty; only the two explicit specializations below carry data
template<bool Validate> struct DecoderLutEntry {};
|
|
28
|
+
//non-validating entry: shuffle masks and step counters only
template<> struct DecoderLutEntry<false> : DecoderCoreInfo {};
|
|
29
|
+
//validating entry: core data followed by the header/overlong check data
template<> struct DecoderLutEntry<true> : DecoderCoreInfo, DecoderValidationInfo {};
|
|
30
|
+
|
|
31
|
+
//a whole LUT table type
|
|
32
|
+
//Lookup table for DecoderCore, indexed by the 16-bit byte-class mask computed from each input block.
template<bool Validate> struct DecoderLutTable {
|
|
33
|
+
//note: odd-indexed entries are removed (they are impossible with correct input)
|
|
34
|
+
//32768 entries = one per even 16-bit mask; DecoderCore reaches entry mask/2 by scaling mask with half the entry size
CACHEALIGN DecoderLutEntry<Validate> data[32768];
|
|
35
|
+
|
|
36
|
+
//returns the table instance (definition is not in this header; presumably built on first use - confirm in the .cpp)
static const DecoderLutTable<Validate> *CreateInstance();
|
|
37
|
+
//convenience accessor: pointer to the first entry of the instance returned by CreateInstance()
inline static const DecoderLutEntry<Validate> *GetArray() { return CreateInstance()->data; }
|
|
38
|
+
private:
|
|
39
|
+
//table construction helpers; their definitions are outside this header
void ComputeAll();
|
|
40
|
+
void ComputeRec(int *sizes, int num, int total);
|
|
41
|
+
void ComputeEntry(const int *sizes, int num);
|
|
42
|
+
};
|
|
@@ -0,0 +1,100 @@
|
|
|
1
|
+
#pragma once
|
|
2
|
+
|
|
3
|
+
#include <stdint.h>
|
|
4
|
+
#include <tmmintrin.h>
|
|
5
|
+
#include "../base/PerfDefs.h"
|
|
6
|
+
#include "../core/DecoderLut.h"
|
|
7
|
+
|
|
8
|
+
/** template params:
|
|
9
|
+
* MaxBytes = 1, 2, 3
|
|
10
|
+
* CheckExceed = false, true
|
|
11
|
+
* Validate = false, true
|
|
12
|
+
* OutputType = 2, 4 //UTF16/32
|
|
13
|
+
*/
|
|
14
|
+
|
|
15
|
+
template<int MaxBytes, bool CheckExceed, bool Validate, int OutputType>
|
|
16
|
+
struct DecoderCore {
|
|
17
|
+
FORCEINLINE bool operator()(const char *&ptrSource, char *&ptrDest, const DecoderLutEntry<Validate> *RESTRICT lutTable) {
|
|
18
|
+
static_assert(!Validate || CheckExceed, "Validate core mode requires CheckExceed enabled");
|
|
19
|
+
const char *RESTRICT pSource = ptrSource;
|
|
20
|
+
char *RESTRICT pDest = ptrDest;
|
|
21
|
+
|
|
22
|
+
if (MaxBytes == 1) {
|
|
23
|
+
__m128i reg = _mm_loadu_si128((__m128i*)pSource);
|
|
24
|
+
__m128i zero = _mm_setzero_si128();
|
|
25
|
+
if (CheckExceed && _mm_movemask_epi8(reg))
|
|
26
|
+
return false;
|
|
27
|
+
__m128i half0 = _mm_unpacklo_epi8(reg, zero);
|
|
28
|
+
__m128i half1 = _mm_unpackhi_epi8(reg, zero);
|
|
29
|
+
if (OutputType == 2) {
|
|
30
|
+
_mm_storeu_si128((__m128i*)pDest + 0, half0);
|
|
31
|
+
_mm_storeu_si128((__m128i*)pDest + 1, half1);
|
|
32
|
+
}
|
|
33
|
+
else {
|
|
34
|
+
_mm_storeu_si128((__m128i*)pDest + 0, _mm_unpacklo_epi16(half0, zero));
|
|
35
|
+
_mm_storeu_si128((__m128i*)pDest + 1, _mm_unpackhi_epi16(half0, zero));
|
|
36
|
+
_mm_storeu_si128((__m128i*)pDest + 2, _mm_unpacklo_epi16(half1, zero));
|
|
37
|
+
_mm_storeu_si128((__m128i*)pDest + 3, _mm_unpackhi_epi16(half1, zero));
|
|
38
|
+
}
|
|
39
|
+
ptrSource += 16;
|
|
40
|
+
ptrDest += 16 * OutputType;
|
|
41
|
+
return true;
|
|
42
|
+
}
|
|
43
|
+
else { //MaxBytes = 2 or 3
|
|
44
|
+
__m128i reg = _mm_loadu_si128((__m128i*)pSource);
|
|
45
|
+
if (CheckExceed && !Validate) {
|
|
46
|
+
__m128i pl = _mm_xor_si128(reg, _mm_set1_epi8(char(0x80U))); //_mm_sub_epi8
|
|
47
|
+
__m128i cmpRes = _mm_cmpgt_epi8(pl, _mm_set1_epi8(MaxBytes == 3 ? 0x6F : 0x5F));
|
|
48
|
+
if (!_mm_cmp_allzero(cmpRes))
|
|
49
|
+
return false;
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
uint32_t mask = _mm_movemask_epi8(_mm_cmplt_epi8(reg, _mm_set1_epi8(char(0xC0U))));
|
|
53
|
+
if (Validate && (mask & 1))
|
|
54
|
+
return false;
|
|
55
|
+
//note: optimized half-index access
|
|
56
|
+
const DecoderLutEntry<Validate> *RESTRICT lookup = TPNT(lutTable, DecoderLutEntry<Validate>, mask * (sizeof(lutTable[0]) / 2));
|
|
57
|
+
|
|
58
|
+
__m128i Rab = _mm_shuffle_epi8(reg, lookup->shufAB);
|
|
59
|
+
Rab = _mm_and_si128(Rab, _mm_set1_epi16(0x3F7F));
|
|
60
|
+
Rab = _mm_maddubs_epi16(Rab, _mm_set1_epi16(0x4001));
|
|
61
|
+
__m128i sum = Rab;
|
|
62
|
+
|
|
63
|
+
if (MaxBytes == 3) {
|
|
64
|
+
__m128i shufC = _mm_unpacklo_epi8(lookup->shufC, lookup->shufC);
|
|
65
|
+
__m128i Rc = _mm_shuffle_epi8(reg, shufC);
|
|
66
|
+
Rc = _mm_slli_epi16(Rc, 12);
|
|
67
|
+
sum = _mm_add_epi16(sum, Rc);
|
|
68
|
+
}
|
|
69
|
+
|
|
70
|
+
if (Validate) {
|
|
71
|
+
const DecoderLutEntry<true> *RESTRICT lookupX = (const DecoderLutEntry<true> *)lookup;
|
|
72
|
+
__m128i byteMask = lookupX->headerMask;
|
|
73
|
+
__m128i header = _mm_and_si128(reg, byteMask);
|
|
74
|
+
__m128i hdrRef = _mm_add_epi8(byteMask, byteMask);
|
|
75
|
+
__m128i hdrCorrect = _mm_cmpeq_epi8(header, hdrRef);
|
|
76
|
+
__m128i overlongSymbol = _mm_cmplt_epi16(_mm_xor_si128(sum, _mm_set1_epi16((short int)0x8000U)), lookupX->minValues);
|
|
77
|
+
__m128i surrogate = _mm_cmpgt_epi16(_mm_sub_epi16(sum, _mm_set1_epi16(0x6000)), _mm_set1_epi16(0x77FF));
|
|
78
|
+
if (MaxBytes == 2) {
|
|
79
|
+
__m128i shufC = _mm_unpacklo_epi8(lookupX->shufC, lookupX->shufC);
|
|
80
|
+
hdrCorrect = _mm_and_si128(hdrCorrect, shufC); //forbid 3-byte symbols
|
|
81
|
+
}
|
|
82
|
+
__m128i allCorr = _mm_andnot_si128(_mm_or_si128(overlongSymbol, surrogate), hdrCorrect);
|
|
83
|
+
if (!_mm_cmp_allone(allCorr))
|
|
84
|
+
return false;
|
|
85
|
+
}
|
|
86
|
+
|
|
87
|
+
if (OutputType == 2)
|
|
88
|
+
_mm_storeu_si128((__m128i*)pDest, sum);
|
|
89
|
+
else {
|
|
90
|
+
__m128i zero = _mm_setzero_si128();
|
|
91
|
+
_mm_storeu_si128((__m128i*)pDest + 0, _mm_unpacklo_epi16(sum, zero));
|
|
92
|
+
_mm_storeu_si128((__m128i*)pDest + 1, _mm_unpackhi_epi16(sum, zero));
|
|
93
|
+
}
|
|
94
|
+
ptrSource += lookup->s.srcStep;
|
|
95
|
+
ptrDest += lookup->s.dstStep * (OutputType/2);
|
|
96
|
+
|
|
97
|
+
return true;
|
|
98
|
+
}
|
|
99
|
+
}
|
|
100
|
+
};
|
|
@@ -0,0 +1,57 @@
|
|
|
1
|
+
// Automaton-based utf8 decoder:
|
|
2
|
+
// http://bjoern.hoehrmann.de/utf-8/decoder/dfa/
|
|
3
|
+
//
|
|
4
|
+
// Copyright (c) 2008-2009 Bjoern Hoehrmann <bjoern@hoehrmann.de>
|
|
5
|
+
//
|
|
6
|
+
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
7
|
+
// of this software and associated documentation files (the "Software"),
|
|
8
|
+
// to deal in the Software without restriction, including without limitation
|
|
9
|
+
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
10
|
+
// and/or sell copies of the Software, and to permit persons to whom the Software
|
|
11
|
+
// is furnished to do so, subject to the following conditions:
|
|
12
|
+
//
|
|
13
|
+
// The above copyright notice and this permission notice shall be included
|
|
14
|
+
// in all copies or substantial portions of the Software.
|
|
15
|
+
//
|
|
16
|
+
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
|
17
|
+
// EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
|
|
18
|
+
// OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
|
|
19
|
+
// IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
|
|
20
|
+
// DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
21
|
+
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
|
22
|
+
|
|
23
|
+
#define UTF8_ACCEPT 0
#define UTF8_REJECT 12

static const uint8_t utf8d[] = {
  // The first part of the table maps bytes to character classes
  // to reduce the size of the transition table and create bitmasks.
   0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
   0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
   0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
   0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
   1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,  9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,
   7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,  7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,
   8,8,2,2,2,2,2,2,2,2,2,2,2,2,2,2,  2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,
  10,3,3,3,3,3,3,3,3,3,3,3,3,4,3,3, 11,6,6,6,5,8,8,8,8,8,8,8,8,8,8,8,

  // The second part is a transition table that maps a combination
  // of a state of the automaton and a character class to a state.
   0,12,24,36,60,96,84,12,12,12,48,72, 12,12,12,12,12,12,12,12,12,12,12,12,
  12, 0,12,12,12,12,12, 0,12, 0,12,12, 12,24,12,12,12,12,12,24,12,24,12,12,
  12,12,12,12,12,12,12,24,12,12,12,12, 12,24,12,12,12,12,12,12,12,24,12,12,
  12,12,12,12,12,12,12,36,12,36,12,12, 12,36,12,12,12,12,12,36,12,36,12,12,
  12,36,12,12,12,12,12,12,12,12,12,12,
};

// Feeds one byte to the UTF-8 automaton.
//   state: in/out automaton state; start from UTF8_ACCEPT.
//   codep: in/out code point accumulator; holds a complete code point
//          whenever the returned state is UTF8_ACCEPT.
//   byte:  next input byte; must be in 0..255 because it indexes utf8d directly.
// Returns the new state: UTF8_ACCEPT after a complete sequence, UTF8_REJECT
// on malformed input, any other value while a sequence is still in progress.
//
// Declared static so that it has internal linkage like the utf8d table it
// reads: a plain `inline` definition emits no external definition in C and
// must not refer to an internal-linkage object from several C++ translation units.
static inline uint32_t
decode(uint32_t* state, uint32_t* codep, uint32_t byte) {
  uint32_t type = utf8d[byte];

  // Continuation byte: append its 6 payload bits. Lead byte: the class
  // number doubles as the shift that strips the header bits.
  *codep = (*state != UTF8_ACCEPT) ?
    (byte & 0x3fu) | (*codep << 6) :
    (0xff >> type) & (byte);

  *state = utf8d[256 + *state + type];
  return *state;
}
|
|
@@ -0,0 +1,85 @@
|
|
|
1
|
+
#include "../core/EncoderLut.h"
|
|
2
|
+
#include <assert.h>
|
|
3
|
+
#include <string.h>
|
|
4
|
+
|
|
5
|
+
template<bool ThreeBytes> void EncoderLutTable<ThreeBytes>::ComputeAll() {
    //visit every possible 8-bit length mask once, in increasing order
    int lensMask = 0;
    while (lensMask < 256) {
        ComputeEntry(lensMask);
        ++lensMask;
    }
}
|
|
10
|
+
|
|
11
|
+
//maps (symbol index, part number) to the source byte position to shuffle from
typedef int (*PartPosGetter)(int, int);

//Appends the shuffle indices and header masks of one output symbol of `len` bytes at offset `pos`
//of the shuf/header arrays, then advances `pos` by `len`. Parts are emitted from len-1 down to 0.
static void HandleChar(int idx, int len, int &pos, char *shuf, char *header, PartPosGetter getPart) {
    //header mask of the first byte, indexed by symbol length
    static const int leadHeaderBits[] = {0xFF, 0x80, 0xE0, 0xF0};
    char *shufOut = shuf + pos;
    char *headerOut = header + pos;
    int part = len - 1;
    for (int k = 0; k < len; k++, part--) {
        shufOut[k] = (char)getPart(idx, part);
        headerOut[k] = (char)0xC0U;     //default: two header bits, overwritten below for the first byte
    }
    headerOut[0] = char(leadHeaderBits[len]);
    pos += len;
}
|
|
21
|
+
|
|
22
|
+
//Part position for the table built by EncoderLutTable<false>:
//part 0 maps to byte 2*idx + 1 and part 1 maps to byte 2*idx.
int TwoBytesPartPosGetter(int idx, int part) {
    const int offsetInWord = 1 - part;
    return 2 * idx + offsetInWord;
}
|
|
25
|
+
template<> void EncoderLutTable<false>::ComputeEntry(int lensMask) {
    //shuffle indices start as 0xFF, header masks start as zero
    char shuf[16], header[16];
    memset(shuf, -1, sizeof(shuf));
    memset(header, 0, sizeof(header));

    //bit i of lensMask chooses the length of input symbol i: 2 bytes when set, 1 byte otherwise
    int pos = 0;
    for (int sym = 0; sym < 8; ++sym) {
        const int len = ((lensMask >> sym) & 1) + 1;
        HandleChar(sym, len, pos, shuf, header, TwoBytesPartPosGetter);
    }

    //store the finished masks; pos is the total number of bytes emitted for the 8 symbols
    EncoderLutEntry &entry = data[lensMask];
    entry.shuf = _mm_loadu_si128((__m128i*)shuf);
    entry.headerMask = _mm_loadu_si128((__m128i*)header);
    entry.dstStep = pos;
}
|
|
42
|
+
|
|
43
|
+
//Part position for the table built by EncoderLutTable<true>:
//part 0 -> byte 2*idx, part 1 -> byte 8 + 2*idx, part 2 -> byte 2*idx + 1, anything else -> -1.
int ThreeBytesPartPosGetter(int idx, int part) {
    switch (part) {
    case 0:
        return 2 * idx + 0;
    case 1:
        return 8 + 2 * idx;
    case 2:
        return 2 * idx + 1;
    default:
        return -1;
    }
}
|
|
52
|
+
template<> void EncoderLutTable<true>::ComputeEntry(int lensMask) {
    //shuffle indices start as 0xFF, header masks start as zero
    char shuf[16], header[16];
    memset(shuf, -1, sizeof(shuf));
    memset(header, 0, sizeof(header));

    //lensMask holds four 2-bit fields, one per input symbol: field value + 1 is the symbol length
    int pos = 0;
    int index = 0;
    for (int sym = 0; sym < 4; ++sym) {
        const int shift = 2 * sym;
        const int len = ((lensMask >> shift) & 3) + 1;
        if (len == 4)
            return;     //impossible entry: nothing is stored for this mask
        HandleChar(sym, len, pos, shuf, header, ThreeBytesPartPosGetter);
        //table slot uses (len ^ 1) per symbol; the 2-bit fields never overlap, so OR equals XOR here
        index |= (len ^ 1) << shift;
    }

    //store the finished masks; pos is the total number of bytes emitted for the 4 symbols
    EncoderLutEntry &entry = data[index];
    entry.shuf = _mm_loadu_si128((__m128i*)shuf);
    entry.headerMask = _mm_loadu_si128((__m128i*)header);
    entry.dstStep = pos;
}
|
|
73
|
+
|
|
74
|
+
//Returns the process-wide table for this ThreeBytes variant, building it on the first call.
//Returns 0 if the aligned allocation fails (the next call retries); the table is never freed.
//NOTE(review): there is no synchronization here - concurrent first calls may each build a table; confirm callers initialize from one thread.
template<bool ThreeBytes> const EncoderLutTable<ThreeBytes> *EncoderLutTable<ThreeBytes>::CreateInstance() {
    static EncoderLutTable<ThreeBytes> *singletonTable = 0;
    if (!singletonTable) {
        EncoderLutTable<ThreeBytes> *table = (EncoderLutTable<ThreeBytes> *)_mm_malloc(sizeof(EncoderLutTable<ThreeBytes>), CACHE_LINE);
        if (!table)
            return 0;   //report the failure instead of writing through a null pointer in ComputeAll
        //_mm_malloc does not clear memory, and ComputeEntry skips impossible masks,
        //so zero everything first to keep the untouched entries deterministic
        memset((void *)table, 0, sizeof(EncoderLutTable<ThreeBytes>));
        table->ComputeAll();
        singletonTable = table; //publish only once the table is fully built
    }
    return singletonTable;
}
|
|
82
|
+
|
|
83
|
+
|
|
84
|
+
template struct EncoderLutTable<false>;
|
|
85
|
+
template struct EncoderLutTable<true>;
|
|
@@ -0,0 +1,27 @@
|
|
|
1
|
+
#pragma once
|
|
2
|
+
|
|
3
|
+
#include <stdint.h>
|
|
4
|
+
#include <emmintrin.h>
|
|
5
|
+
#include "../base/PerfDefs.h"
|
|
6
|
+
|
|
7
|
+
//a single entry of each LUT is defined
|
|
8
|
+
struct m128pair { __m128i __a, __b; }; //two 16-byte registers, used by EncoderLutEntry as padding; NOTE(review): names containing "__" are reserved for the implementation in C++ - rename if nothing else refers to them
|
|
9
|
+
//One encoder LUT entry: two 16-byte masks plus a 32-byte union, 64 bytes of data in total.
struct EncoderLutEntry {
|
|
10
|
+
__m128i shuf; //shuffling mask to move bytes into position
|
|
11
|
+
__m128i headerMask; //mask of bits which represents header (for each byte)
|
|
12
|
+
//dstStep is the only value stored here; the m128pair member exists solely to fix the size of the union
union {
|
|
13
|
+
uint32_t dstStep; //number of bytes processed in output buffer (ComputeEntry stores the summed byte lengths of all symbols)
|
|
14
|
+
m128pair s; //padding up to 64 bytes
|
|
15
|
+
};
|
|
16
|
+
};
|
|
17
|
+
|
|
18
|
+
//a whole LUT table type
|
|
19
|
+
//Encoder lookup table. ThreeBytes = false: built for 8 symbols of 1..2 bytes (one mask bit per symbol);
//ThreeBytes = true: built for 4 symbols of 1..3 bytes (two mask bits per symbol).
template<bool ThreeBytes> struct EncoderLutTable {
|
|
20
|
+
//256 slots; with ThreeBytes = true the slots of impossible masks are never written by ComputeEntry
CACHEALIGN EncoderLutEntry data[256];
|
|
21
|
+
|
|
22
|
+
//returns the shared table, allocating and filling it on the first call
static const EncoderLutTable<ThreeBytes> *CreateInstance();
|
|
23
|
+
//convenience accessor: pointer to the first entry of the instance returned by CreateInstance()
inline static const EncoderLutEntry *GetArray() { return CreateInstance()->data; }
|
|
24
|
+
private:
|
|
25
|
+
//calls ComputeEntry for every lensMask in 0..255
void ComputeAll();
|
|
26
|
+
//fills the entry that corresponds to one length mask (specialized per ThreeBytes value)
void ComputeEntry(int lensMask);
|
|
27
|
+
};
|
|
@@ -0,0 +1,126 @@
|
|
|
1
|
+
#pragma once
|
|
2
|
+
|
|
3
|
+
#include "../base/PerfDefs.h"
|
|
4
|
+
#include <tmmintrin.h>
|
|
5
|
+
|
|
6
|
+
/** template params:
|
|
7
|
+
* MaxBytes = 1, 2, 3
|
|
8
|
+
* CheckExceed = false, true
|
|
9
|
+
* InputType = 2, 4 //UTF16/32
|
|
10
|
+
*/
|
|
11
|
+
|
|
12
|
+
template<int MaxBytes, bool CheckExceed, int InputType>
|
|
13
|
+
struct EncoderCore {
|
|
14
|
+
FORCEINLINE bool operator()(const char *&ptrSource, char *&ptrDest, const EncoderLutEntry *RESTRICT lutTable) {
|
|
15
|
+
const char *RESTRICT pSource = ptrSource;
|
|
16
|
+
char *RESTRICT pDest = ptrDest;
|
|
17
|
+
|
|
18
|
+
//read block of 8 symbols
|
|
19
|
+
__m128i reg;
|
|
20
|
+
if (InputType == 2)
|
|
21
|
+
reg = _mm_loadu_si128((const __m128i *)pSource);
|
|
22
|
+
else {
|
|
23
|
+
//read in two halves
|
|
24
|
+
__m128i reg0 = _mm_loadu_si128((const __m128i *)pSource + 0);
|
|
25
|
+
__m128i reg1 = _mm_loadu_si128((const __m128i *)pSource + 1);
|
|
26
|
+
__m128i shuf = _mm_setr_epi8(0, 1, 4, 5, 8, 9, 12, 13, 2, 3, 6, 7, 10, 11, 14, 15);
|
|
27
|
+
//shuffle all lower 16-bit words to lower halves of registers
|
|
28
|
+
reg0 = _mm_shuffle_epi8(reg0, shuf);
|
|
29
|
+
reg1 = _mm_shuffle_epi8(reg1, shuf);
|
|
30
|
+
//get all 8 lower 16-bit words
|
|
31
|
+
reg = _mm_unpacklo_epi64(reg0, reg1);
|
|
32
|
+
//if required, check that higher 16-bit words are zero
|
|
33
|
+
if (CheckExceed && !_mm_cmp_allone(_mm_cmpeq_epi16(_mm_unpackhi_epi64(reg0, reg1), _mm_setzero_si128())))
|
|
34
|
+
return false;
|
|
35
|
+
}
|
|
36
|
+
|
|
37
|
+
if (MaxBytes == 1) {
|
|
38
|
+
if (CheckExceed && !_mm_cmp_allone(_mm_cmpeq_epi16(_mm_andnot_si128(_mm_set1_epi16(0x007FU), reg), _mm_setzero_si128())))
|
|
39
|
+
return false;
|
|
40
|
+
__m128i res = _mm_packus_epi16(reg, _mm_setzero_si128());
|
|
41
|
+
_mm_storeu_si128((__m128i *)pDest, res);
|
|
42
|
+
pDest += 8;
|
|
43
|
+
}
|
|
44
|
+
else if (MaxBytes == 2) {
|
|
45
|
+
//levels of bytes
|
|
46
|
+
__m128i levelA = reg; //abcdefgh|ABCDEFGH
|
|
47
|
+
__m128i levelB = _mm_srli_epi16(reg, 6); //ghABCDEF|GH......
|
|
48
|
+
//put all bytes of each half into a register
|
|
49
|
+
__m128i levBA = _mm_xor_si128(levelB, _mm_slli_epi16(levelA, 8)); //ghABC,,,|abcdefgh
|
|
50
|
+
|
|
51
|
+
//check which symbols are long
|
|
52
|
+
__m128i lenGe2 = _mm_cmpgt_epi16(levelB, _mm_set1_epi16(0x0001U));
|
|
53
|
+
//check if there are three+ bytes symbols
|
|
54
|
+
if (CheckExceed && !_mm_cmp_allzero(_mm_cmpgt_epi16(levelB, _mm_set1_epi16(0x001FU))))
|
|
55
|
+
return false;
|
|
56
|
+
//compose lens mask for lookup (with a 6-byte shift)
|
|
57
|
+
__m128i lensAll = _mm_shuffle_epi8(lenGe2, _mm_setr_epi8(-1, -1, -1, -1, -1, -1, 0, 2, 4, 6, 8, 10, 12, 14, -1, -1));
|
|
58
|
+
//get byte offset into lookup table (i.e. index multiplied by 64 = entry size)
|
|
59
|
+
uint32_t offset = _mm_movemask_epi8(lensAll);
|
|
60
|
+
static_assert(sizeof(EncoderLutEntry) == 64, "Wrong size of EncoderLutEntry");
|
|
61
|
+
|
|
62
|
+
//load info from LUT (using byte offset)
|
|
63
|
+
const EncoderLutEntry *RESTRICT lookup = TPNT(lutTable, EncoderLutEntry, offset);
|
|
64
|
+
//shuffle bytes to compact layout
|
|
65
|
+
__m128i res = _mm_shuffle_epi8(levBA, lookup->shuf);
|
|
66
|
+
//add headers to all bytes
|
|
67
|
+
__m128i header = lookup->headerMask;
|
|
68
|
+
res = _mm_andnot_si128(header, res);
|
|
69
|
+
res = _mm_xor_si128(res, _mm_add_epi8(header, header)); //add_epi8
|
|
70
|
+
|
|
71
|
+
//write results
|
|
72
|
+
_mm_storeu_si128((__m128i *)pDest, res);
|
|
73
|
+
pDest += lookup->dstStep;
|
|
74
|
+
}
|
|
75
|
+
else if (MaxBytes == 3) {
|
|
76
|
+
//levels of bytes
|
|
77
|
+
__m128i levAC = _mm_maddubs_epi16(_mm_and_si128(reg, _mm_set1_epi16((short int)0xF0FFU)), _mm_set1_epi16(0x1001U));
|
|
78
|
+
__m128i levelB = _mm_srli_epi16(reg, 6);
|
|
79
|
+
//put all bytes of each half into a separate register
|
|
80
|
+
__m128i levels0 = _mm_unpacklo_epi64(levAC, levelB);
|
|
81
|
+
__m128i levels1 = _mm_unpackhi_epi64(levAC, levelB);
|
|
82
|
+
|
|
83
|
+
if (CheckExceed) {
|
|
84
|
+
//check if there are any surrogates
|
|
85
|
+
__m128i diff = _mm_sub_epi16(reg, _mm_set1_epi16(0x5800U));
|
|
86
|
+
if (!_mm_cmp_allzero(_mm_cmplt_epi16(diff, _mm_set1_epi16((short int)0x8800U))))
|
|
87
|
+
return false;
|
|
88
|
+
}
|
|
89
|
+
|
|
90
|
+
//check for symbols with len at least 2 and 3
|
|
91
|
+
__m128i lenGe2 = _mm_cmpgt_epi16(levelB, _mm_set1_epi16(0x0001U));
|
|
92
|
+
__m128i lenGe3 = _mm_cmpgt_epi16(levelB, _mm_set1_epi16(0x001FU));
|
|
93
|
+
//get a single mask from the two comparison results
|
|
94
|
+
__m128i lensMix = _mm_xor_si128(_mm_srli_epi16(lenGe3, 8), lenGe2);
|
|
95
|
+
uint32_t allMask = _mm_movemask_epi8(lensMix);
|
|
96
|
+
//each half of the mask corresponds to a LUT index
|
|
97
|
+
uint32_t offset0 = (allMask & 255U) * sizeof(EncoderLutEntry);
|
|
98
|
+
uint32_t offset1 = (allMask >> 8U) * sizeof(EncoderLutEntry);
|
|
99
|
+
|
|
100
|
+
//load info from LUT
|
|
101
|
+
const EncoderLutEntry *RESTRICT lookup0 = TPNT(lutTable, EncoderLutEntry, offset0);
|
|
102
|
+
const EncoderLutEntry *RESTRICT lookup1 = TPNT(lutTable, EncoderLutEntry, offset1);
|
|
103
|
+
//shuffle bytes of each half to compact layout
|
|
104
|
+
__m128i res0 = _mm_shuffle_epi8(levels0, lookup0->shuf);
|
|
105
|
+
__m128i res1 = _mm_shuffle_epi8(levels1, lookup1->shuf);
|
|
106
|
+
//add headers to all bytes
|
|
107
|
+
__m128i header0 = lookup0->headerMask;
|
|
108
|
+
__m128i header1 = lookup1->headerMask;
|
|
109
|
+
res0 = _mm_andnot_si128(header0, res0);
|
|
110
|
+
res1 = _mm_andnot_si128(header1, res1);
|
|
111
|
+
res0 = _mm_xor_si128(res0, _mm_add_epi8(header0, header0));
|
|
112
|
+
res1 = _mm_xor_si128(res1, _mm_add_epi8(header1, header1));
|
|
113
|
+
|
|
114
|
+
//write results
|
|
115
|
+
_mm_storeu_si128((__m128i *)pDest, res0);
|
|
116
|
+
pDest += lookup0->dstStep;
|
|
117
|
+
_mm_storeu_si128((__m128i *)pDest, res1);
|
|
118
|
+
pDest += lookup1->dstStep;
|
|
119
|
+
}
|
|
120
|
+
|
|
121
|
+
//save new addresses
|
|
122
|
+
ptrSource += 8 * InputType;
|
|
123
|
+
ptrDest = pDest;
|
|
124
|
+
return true;
|
|
125
|
+
}
|
|
126
|
+
};
|
|
@@ -0,0 +1,108 @@
|
|
|
1
|
+
#pragma once
|
|
2
|
+
|
|
3
|
+
#include <stdint.h>
|
|
4
|
+
#include "../base/PerfDefs.h"
|
|
5
|
+
|
|
6
|
+
namespace DfaUtf8 {
|
|
7
|
+
#include "Dfa.h"
|
|
8
|
+
}
|
|
9
|
+
|
|
10
|
+
template<int OutputType>
|
|
11
|
+
FORCEINLINE bool DecodeTrivial(const char *&pSource, const char *pEnd, char *&pDest) {
|
|
12
|
+
static_assert(OutputType == 2 || OutputType == 4, "Only 2-byte and 4-byte output supported");
|
|
13
|
+
using namespace DfaUtf8;
|
|
14
|
+
assert(pSource <= pEnd);
|
|
15
|
+
|
|
16
|
+
const uint8_t *RESTRICT s = (const uint8_t *)pSource;
|
|
17
|
+
uint16_t *RESTRICT d = (uint16_t *)pDest;
|
|
18
|
+
uint32_t codepoint;
|
|
19
|
+
uint32_t state = 0;
|
|
20
|
+
|
|
21
|
+
const uint8_t *ans_s = s;
|
|
22
|
+
uint16_t *ans_d = d;
|
|
23
|
+
|
|
24
|
+
while (s < (const uint8_t *)pEnd) {
|
|
25
|
+
if (decode(&state, &codepoint, *s++))
|
|
26
|
+
continue;
|
|
27
|
+
if (OutputType == 2) {
|
|
28
|
+
if (codepoint > 0xFFFFU) {
|
|
29
|
+
*d++ = (uint16_t)(0xD7C0U + (codepoint >> 10));
|
|
30
|
+
*d++ = (uint16_t)(0xDC00U + (codepoint & 0x3FFU));
|
|
31
|
+
} else {
|
|
32
|
+
*d++ = (uint16_t)codepoint;
|
|
33
|
+
}
|
|
34
|
+
}
|
|
35
|
+
else {
|
|
36
|
+
*(uint32_t *)d = codepoint;
|
|
37
|
+
d += 2;
|
|
38
|
+
}
|
|
39
|
+
if (state == UTF8_ACCEPT) {
|
|
40
|
+
ans_s = s;
|
|
41
|
+
ans_d = d;
|
|
42
|
+
}
|
|
43
|
+
}
|
|
44
|
+
|
|
45
|
+
pSource = (const char *)ans_s;
|
|
46
|
+
pDest = (char *)ans_d;
|
|
47
|
+
return state != UTF8_REJECT;
|
|
48
|
+
}
|
|
49
|
+
|
|
50
|
+
template<int InputType>
|
|
51
|
+
FORCEINLINE bool EncodeTrivial(const char *&pSource, const char *pEnd, char *&pDest) {
|
|
52
|
+
static_assert(InputType == 2 || InputType == 4, "Only 2-byte and 4-byte input supported");
|
|
53
|
+
assert(pSource <= pEnd);
|
|
54
|
+
|
|
55
|
+
const uint16_t *RESTRICT s = (const uint16_t *)pSource;
|
|
56
|
+
uint8_t *RESTRICT d = (uint8_t *)pDest;
|
|
57
|
+
const uint16_t *end = s + (pEnd - pSource) / InputType * (InputType / 2);
|
|
58
|
+
|
|
59
|
+
while (s < end) {
|
|
60
|
+
uint32_t codepoint;
|
|
61
|
+
|
|
62
|
+
if (InputType == 2) {
|
|
63
|
+
codepoint = *s++;
|
|
64
|
+
|
|
65
|
+
if (codepoint - 0xD800U < 0x0800U) {
|
|
66
|
+
if (s < end) {
|
|
67
|
+
uint32_t tail = *s++;
|
|
68
|
+
if ((codepoint & 0xFC00U) != 0xD800U || (tail & 0xFC00U) != 0xDC00U)
|
|
69
|
+
return false;
|
|
70
|
+
codepoint = 0x10000U + ((codepoint & 0x03FFU) << 10) + (tail & 0x03FFU);
|
|
71
|
+
}
|
|
72
|
+
else {
|
|
73
|
+
s--;
|
|
74
|
+
break;
|
|
75
|
+
}
|
|
76
|
+
}
|
|
77
|
+
}
|
|
78
|
+
else {
|
|
79
|
+
codepoint = *(const uint32_t*)s;
|
|
80
|
+
s += 2;
|
|
81
|
+
if (codepoint > 0x10FFFFU || codepoint - 0xD800U < 0x0800U)
|
|
82
|
+
return false;
|
|
83
|
+
}
|
|
84
|
+
|
|
85
|
+
if (codepoint <= 0x7FU)
|
|
86
|
+
*d++ = uint8_t(codepoint);
|
|
87
|
+
else if (codepoint <= 0x7FFU) {
|
|
88
|
+
*d++ = uint8_t(0xC0U + (codepoint >> 6));
|
|
89
|
+
*d++ = uint8_t(0x80U + (codepoint & 0x3FU));
|
|
90
|
+
}
|
|
91
|
+
else if (codepoint <= 0xFFFFU) {
|
|
92
|
+
*d++ = uint8_t(0xE0U + (codepoint >> 12));
|
|
93
|
+
*d++ = uint8_t(0x80U + ((codepoint >> 6) & 0x3FU));
|
|
94
|
+
*d++ = uint8_t(0x80U + (codepoint & 0x3FU));
|
|
95
|
+
}
|
|
96
|
+
else {
|
|
97
|
+
*d++ = uint8_t(0xF0U + (codepoint >> 18));
|
|
98
|
+
*d++ = uint8_t(0x80U + ((codepoint >> 12) & 0x3FU));
|
|
99
|
+
*d++ = uint8_t(0x80U + ((codepoint >> 6) & 0x3FU));
|
|
100
|
+
*d++ = uint8_t(0x80U + (codepoint & 0x3FU));
|
|
101
|
+
}
|
|
102
|
+
|
|
103
|
+
pSource = (const char *)s;
|
|
104
|
+
pDest = (char *)d;
|
|
105
|
+
}
|
|
106
|
+
|
|
107
|
+
return true;
|
|
108
|
+
}
|
|
@@ -0,0 +1,139 @@
|
|
|
1
|
+
#include "iconv/iconv.h"
|
|
2
|
+
#include "buffer/BaseBufferProcessor.h"
|
|
3
|
+
#include "buffer/ProcessorPlugins.h"
|
|
4
|
+
#include "buffer/BufferDecoder.h"
|
|
5
|
+
#include "buffer/BufferEncoder.h"
|
|
6
|
+
#include <assert.h>
|
|
7
|
+
|
|
8
|
+
//Converts the data at *inbuf (*inbytesleft bytes) into *outbuf (*outbytesleft bytes free) with
//the processor behind cd, then updates all four in/out values by the amounts consumed/produced.
//Returns:
//  1           all input was converted (note: not the number of characters converted)
//  0           inbuf or *inbuf is null (nothing to do), or outbuf / *outbuf is null, in which
//              case *outbytesleft receives an output size sufficient for *inbytesleft input bytes
//  (size_t)-1  failure, with errno set to:
//              EBADF   cd is 0 or -1, or inbytesleft / outbytesleft is null
//              E2BIG   not enough output space is guaranteed for the next chunk
//              EINVAL  processing succeeded but some input was left unconverted
//              EILSEQ  the processor reported a failure
size_t iconv(iconv_t cd, const char **inbuf, size_t *inbytesleft, char **outbuf, size_t *outbytesleft) {
	if (cd == (iconv_t)0 || cd == (iconv_t)-1) {
		errno = EBADF;
		return (size_t)-1;
	}
	BaseBufferProcessor *processor = (BaseBufferProcessor*)cd;

	if (!inbuf || !*inbuf) {
		//no state carried between calls
		return 0;
	}
	else if (!inbytesleft || !outbytesleft) {
		//error: input / output size not specified
		errno = EBADF;
		return (size_t)-1;
	}
	else if (!outbuf || !*outbuf) {
		//extension: return estimated size of output buffer
		//which is surely enough to hold all the converted data
		*outbytesleft = processor->GetOutputBufferMinSize(*inbytesleft);
		return 0;
	}

	processor->Clear();
	ContiguousInput input(*processor, *inbuf, *inbytesleft);
	ContiguousOutput output(*processor, *outbuf, *outbytesleft);

	bool overflow = false;
	//must start out true: when the input is already finished the loop body never runs,
	//and the result below is decided from this value
	bool ok = true;
	while (!input.Finished()) {
		//check if we surely have space for next block converted
		int inputChunk = input.GetNextChunkSize();
		int maxOutputNeeded = int(output.GetMaxOutputSize(*processor, inputChunk));
		long long freeOutputSpace = output.GetBufferSize() - output.GetFilledOutputSize();
		if (maxOutputNeeded > freeOutputSpace) {
			//note: a lot of input data may be left unconverted (up to chunk size)
			overflow = true;
			break;
		}
		//convert a block
		ok = processor->Process();
		if (!ok)
			break;
	}

	//report progress back through the in/out parameters
	long long remains = input.GetRemainingDataSize();
	long long converted = output.GetFilledOutputSize();
	*inbuf += *inbytesleft - remains;
	*inbytesleft = remains;
	*outbuf += converted;
	*outbytesleft -= converted;

	if (overflow) {
		errno = E2BIG;
		return (size_t)-1;
	}
	else if (ok) {
		if (remains == 0) {
			//major difference: return 1 instead of number of characters converted
			return 1;
		}
		else {
			errno = EINVAL;
			return (size_t)-1;
		}
	}
	else {
		errno = EILSEQ;
		return (size_t)-1;
	}
}
|
|
79
|
+
|
|
80
|
+
//Destroys the processor behind a conversion handle.
//Returns 0 on success; for a handle equal to 0 or -1 sets errno to EBADF and returns -1.
int iconv_close(iconv_t cd) {
	const bool badHandle = (cd == (iconv_t)0) || (cd == (iconv_t)-1);
	if (badHandle) {
		errno = EBADF;
		return -1;
	}

	BaseBufferProcessor *owned = (BaseBufferProcessor*)cd;
	delete owned;
	return 0;
}
|
|
90
|
+
|
|
91
|
+
|
|
92
|
+
|
|
93
|
+
#include "buffer/BufferDecoder.h"
|
|
94
|
+
#include "buffer/BufferEncoder.h"
|
|
95
|
+
|
|
96
|
+
//Encodings known to ParseFormat; Unsupported (zero) is its answer for any other name.
enum Format {
	Unsupported = 0,
	Utf8 = 1,
	Utf16 = 2,
	Utf32 = 3
};
|
|
102
|
+
//Maps an encoding name to a Format value.
//Only the exact, case-sensitive names "UTF-8", "UTF-16LE" and "UTF-32LE" are recognised;
//any other string, and a null pointer, yields Unsupported.
Format ParseFormat(const char *str) {
	//strcmp must not be given a null pointer
	if (!str)
		return Unsupported;
	if (strcmp(str, "UTF-8") == 0)
		return Utf8;
	if (strcmp(str, "UTF-16LE") == 0)
		return Utf16;
	if (strcmp(str, "UTF-32LE") == 0)
		return Utf32;
	return Unsupported;
}
|
|
111
|
+
|
|
112
|
+
//Creates a converter from encoding fromcode to encoding tocode.
//Supported pairs: UTF-8 on exactly one side and UTF-16LE or UTF-32LE on the other.
//Returns the new handle (to be released with iconv_close), or (iconv_t)-1 with errno = EINVAL
//when a name is null or unrecognised, or the pair is not supported.
iconv_t iconv_open(const char *tocode, const char *fromcode) {
	//reject missing names before they are compared as strings
	if (!tocode || !fromcode) {
		errno = EINVAL;
		return (iconv_t)-1;
	}

	Format dstFormat = ParseFormat(tocode);
	Format srcFormat = ParseFormat(fromcode);
	//both names must be known, they must differ, and one of them must be UTF-8
	if (srcFormat == Unsupported || dstFormat == Unsupported || (dstFormat != Utf8 && srcFormat != Utf8) || dstFormat == srcFormat) {
		errno = EINVAL;
		return (iconv_t)-1;
	}

#ifdef ICONV_SMALL
	static const int Multiplier = 1;	//compact version for small buffers
#else
	static const int Multiplier = 4;	//fastest for large buffers
#endif

	if (dstFormat == Utf8 && srcFormat == Utf16)
		return new BufferEncoder<3, 2, emValidate, Multiplier>();
	if (dstFormat == Utf8 && srcFormat == Utf32)
		return new BufferEncoder<3, 4, emValidate, Multiplier>();
	if (dstFormat == Utf16 && srcFormat == Utf8)
		return new BufferDecoder<3, 2, dmValidate, Multiplier>();
	if (dstFormat == Utf32 && srcFormat == Utf8)
		return new BufferDecoder<3, 4, dmValidate, Multiplier>();

	//not reachable after the validation above; if it ever is, fail the same way as
	//every other error path instead of handing out a zero handle
	assert(0);
	errno = EINVAL;
	return (iconv_t)-1;
}
|