react-native-quick-crypto 1.0.18 → 1.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (751)
  1. package/QuickCrypto.podspec +12 -38
  2. package/README.md +2 -0
  3. package/android/CMakeLists.txt +3 -0
  4. package/cpp/utils/HybridUtils.cpp +39 -77
  5. package/deps/simdutf/.clang-format +4 -0
  6. package/deps/simdutf/.github/ISSUE_TEMPLATE/bug_report.md +62 -0
  7. package/deps/simdutf/.github/ISSUE_TEMPLATE/config.yml +1 -0
  8. package/deps/simdutf/.github/ISSUE_TEMPLATE/feature_request.md +35 -0
  9. package/deps/simdutf/.github/ISSUE_TEMPLATE/standard-issue-template.md +29 -0
  10. package/deps/simdutf/.github/pull_request_template.md +51 -0
  11. package/deps/simdutf/.github/workflows/aarch64.yml +39 -0
  12. package/deps/simdutf/.github/workflows/alpine.yml +27 -0
  13. package/deps/simdutf/.github/workflows/amalgamation_demos.yml +34 -0
  14. package/deps/simdutf/.github/workflows/armv7.yml +32 -0
  15. package/deps/simdutf/.github/workflows/atomic_fuzz.yml +25 -0
  16. package/deps/simdutf/.github/workflows/cifuzz.yml +37 -0
  17. package/deps/simdutf/.github/workflows/clangformat.yml +36 -0
  18. package/deps/simdutf/.github/workflows/debian-latestcxxstandards.yml +40 -0
  19. package/deps/simdutf/.github/workflows/debian.yml +33 -0
  20. package/deps/simdutf/.github/workflows/documentation.yml +36 -0
  21. package/deps/simdutf/.github/workflows/emscripten.yml +19 -0
  22. package/deps/simdutf/.github/workflows/loongarch64-gcc-14.2.yml +39 -0
  23. package/deps/simdutf/.github/workflows/macos-latest.yml +29 -0
  24. package/deps/simdutf/.github/workflows/msys2-clang.yml +48 -0
  25. package/deps/simdutf/.github/workflows/msys2.yml +50 -0
  26. package/deps/simdutf/.github/workflows/ppc64le.yml +29 -0
  27. package/deps/simdutf/.github/workflows/rvv-1024-clang-18.yml +35 -0
  28. package/deps/simdutf/.github/workflows/rvv-128-clang-17.yml +35 -0
  29. package/deps/simdutf/.github/workflows/rvv-256-gcc-14.yml +31 -0
  30. package/deps/simdutf/.github/workflows/s390x.yml +29 -0
  31. package/deps/simdutf/.github/workflows/selective-amalgamation.yml +29 -0
  32. package/deps/simdutf/.github/workflows/typos.yml +19 -0
  33. package/deps/simdutf/.github/workflows/ubuntu22-cxx20.yml +30 -0
  34. package/deps/simdutf/.github/workflows/ubuntu22.yml +32 -0
  35. package/deps/simdutf/.github/workflows/ubuntu22_gcc12.yml +27 -0
  36. package/deps/simdutf/.github/workflows/ubuntu22sani.yml +29 -0
  37. package/deps/simdutf/.github/workflows/ubuntu24-cxxstandards.yml +34 -0
  38. package/deps/simdutf/.github/workflows/ubuntu24-unsignedchar.yml +34 -0
  39. package/deps/simdutf/.github/workflows/ubuntu24.yml +32 -0
  40. package/deps/simdutf/.github/workflows/ubuntu24sani.yml +36 -0
  41. package/deps/simdutf/.github/workflows/ubuntu24sani_clang.yml +29 -0
  42. package/deps/simdutf/.github/workflows/vs17-arm-ci.yml +21 -0
  43. package/deps/simdutf/.github/workflows/vs17-ci-cxx20.yml +41 -0
  44. package/deps/simdutf/.github/workflows/vs17-ci.yml +41 -0
  45. package/deps/simdutf/.github/workflows/vs17-clang-ci.yml +41 -0
  46. package/deps/simdutf/.github/workflows/vs17-cxxstandards.yml +36 -0
  47. package/deps/simdutf/AI_USAGE_POLICY.md +56 -0
  48. package/deps/simdutf/AUTHORS +6 -0
  49. package/deps/simdutf/CMakeLists.txt +231 -0
  50. package/deps/simdutf/CONTRIBUTING.md +214 -0
  51. package/deps/simdutf/CONTRIBUTORS +1 -0
  52. package/deps/simdutf/Doxyfile +2584 -0
  53. package/deps/simdutf/LICENSE-APACHE +201 -0
  54. package/deps/simdutf/LICENSE-MIT +18 -0
  55. package/deps/simdutf/Makefile.crosscompile +54 -0
  56. package/deps/simdutf/README-RVV.md +16 -0
  57. package/deps/simdutf/README.md +2782 -0
  58. package/deps/simdutf/SECURITY.md +8 -0
  59. package/deps/simdutf/benchmarks/CMakeLists.txt +101 -0
  60. package/deps/simdutf/benchmarks/alignment.cpp +150 -0
  61. package/deps/simdutf/benchmarks/base64/CMakeLists.txt +30 -0
  62. package/deps/simdutf/benchmarks/base64/benchmark_base64.cpp +875 -0
  63. package/deps/simdutf/benchmarks/base64/libbase64_spaces.h +49 -0
  64. package/deps/simdutf/benchmarks/base64/node_base64.h +227 -0
  65. package/deps/simdutf/benchmarks/base64/openssl3_base64.h +334 -0
  66. package/deps/simdutf/benchmarks/benchmark.cpp +65 -0
  67. package/deps/simdutf/benchmarks/benchmark_to_well_formed_utf16.cpp +347 -0
  68. package/deps/simdutf/benchmarks/competition/.clang-format-ignore +5 -0
  69. package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.cpp +1276 -0
  70. package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.h +595 -0
  71. package/deps/simdutf/benchmarks/competition/README.md +7 -0
  72. package/deps/simdutf/benchmarks/competition/hoehrmann/hoehrmann.h +91 -0
  73. package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16.h +444 -0
  74. package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16_tables.h +13183 -0
  75. package/deps/simdutf/benchmarks/competition/inoue2008/script.py +73 -0
  76. package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.cpp +738 -0
  77. package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.h +293 -0
  78. package/deps/simdutf/benchmarks/competition/u8u16/COPYRIGHT +8 -0
  79. package/deps/simdutf/benchmarks/competition/u8u16/Makefile +44 -0
  80. package/deps/simdutf/benchmarks/competition/u8u16/OSL3.0.txt +169 -0
  81. package/deps/simdutf/benchmarks/competition/u8u16/Profiling/BOM_Profiler.h +148 -0
  82. package/deps/simdutf/benchmarks/competition/u8u16/Profiling/i386_timer.h +45 -0
  83. package/deps/simdutf/benchmarks/competition/u8u16/Profiling/ppc_timer.c +34 -0
  84. package/deps/simdutf/benchmarks/competition/u8u16/README +56 -0
  85. package/deps/simdutf/benchmarks/competition/u8u16/config/config_defs.h +43 -0
  86. package/deps/simdutf/benchmarks/competition/u8u16/config/g4_config.h +27 -0
  87. package/deps/simdutf/benchmarks/competition/u8u16/config/mmx_config.h +16 -0
  88. package/deps/simdutf/benchmarks/competition/u8u16/config/p4_config.h +18 -0
  89. package/deps/simdutf/benchmarks/competition/u8u16/config/p4_ideal_config.h +16 -0
  90. package/deps/simdutf/benchmarks/competition/u8u16/config/spu_config.h +28 -0
  91. package/deps/simdutf/benchmarks/competition/u8u16/config/ssse3_config.h +20 -0
  92. package/deps/simdutf/benchmarks/competition/u8u16/iconv_u8u16.c +2 -0
  93. package/deps/simdutf/benchmarks/competition/u8u16/lib/altivec_simd.h +440 -0
  94. package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_basic_ops.py +121 -0
  95. package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_half_operand_versions.py +158 -0
  96. package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_test.py +270 -0
  97. package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd.h +141 -0
  98. package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_basic.h +216 -0
  99. package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_built_in.h +119 -0
  100. package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_modified.h +2430 -0
  101. package/deps/simdutf/benchmarks/competition/u8u16/lib/outline.txt +39 -0
  102. package/deps/simdutf/benchmarks/competition/u8u16/lib/spu_simd.h +421 -0
  103. package/deps/simdutf/benchmarks/competition/u8u16/lib/sse_simd.h +836 -0
  104. package/deps/simdutf/benchmarks/competition/u8u16/lib/stdint.h +222 -0
  105. package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_BE.c +4 -0
  106. package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_LE.c +5 -0
  107. package/deps/simdutf/benchmarks/competition/u8u16/proto/u8u16.py +390 -0
  108. package/deps/simdutf/benchmarks/competition/u8u16/src/Makefile +18 -0
  109. package/deps/simdutf/benchmarks/competition/u8u16/src/bytelex.h +448 -0
  110. package/deps/simdutf/benchmarks/competition/u8u16/src/charsets/ASCII_EBCDIC.h +284 -0
  111. package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.c +1975 -0
  112. package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.pdf +0 -0
  113. package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.w +2263 -0
  114. package/deps/simdutf/benchmarks/competition/u8u16/src/multiliteral.h +239 -0
  115. package/deps/simdutf/benchmarks/competition/u8u16/src/u8u16.c +232 -0
  116. package/deps/simdutf/benchmarks/competition/u8u16/src/x8x16.c +194 -0
  117. package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.c +193 -0
  118. package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.h +167 -0
  119. package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.c +288 -0
  120. package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.h +117 -0
  121. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_g4.c +2 -0
  122. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_mmx.c +2 -0
  123. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4.c +3 -0
  124. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4_ideal.c +2 -0
  125. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_spu.c +2 -0
  126. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_ssse3.c +3 -0
  127. package/deps/simdutf/benchmarks/competition/u8u16/x8x16_p4.c +2 -0
  128. package/deps/simdutf/benchmarks/competition/utf8lut/LICENSE +23 -0
  129. package/deps/simdutf/benchmarks/competition/utf8lut/data/test_minimal.txt +44 -0
  130. package/deps/simdutf/benchmarks/competition/utf8lut/readme.md +106 -0
  131. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.cmd +11 -0
  132. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.sh +13 -0
  133. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_corr_tests.sh +13 -0
  134. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_example.sh +13 -0
  135. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_file_conv.sh +14 -0
  136. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_lib.sh +11 -0
  137. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_sample.sh +8 -0
  138. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_corr_tests.cmd +12 -0
  139. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_example.cmd +13 -0
  140. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_file_conv.cmd +14 -0
  141. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_lib.cmd +11 -0
  142. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_sample.cmd +8 -0
  143. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_corr_tests.cmd +11 -0
  144. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_example.cmd +12 -0
  145. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_file_conv.cmd +13 -0
  146. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_lib.cmd +10 -0
  147. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_sample.cmd +9 -0
  148. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/html_table.py +25 -0
  149. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/measure.py +94 -0
  150. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/resize.py +20 -0
  151. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_all.cmd +2 -0
  152. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_interm.cmd +1 -0
  153. package/deps/simdutf/benchmarks/competition/utf8lut/src/base/CustomMemcpy.h +75 -0
  154. package/deps/simdutf/benchmarks/competition/utf8lut/src/base/PerfDefs.h +47 -0
  155. package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.cpp +17 -0
  156. package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.h +76 -0
  157. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/AllProcessors.cpp +35 -0
  158. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.cpp +117 -0
  159. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.h +210 -0
  160. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferDecoder.h +158 -0
  161. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferEncoder.h +104 -0
  162. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorPlugins.h +334 -0
  163. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorSelector.h +186 -0
  164. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.cpp +140 -0
  165. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.h +42 -0
  166. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderProcess.h +100 -0
  167. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/Dfa.h +57 -0
  168. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.cpp +85 -0
  169. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.h +27 -0
  170. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderProcess.h +126 -0
  171. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/ProcessTrivial.h +108 -0
  172. package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.cpp +139 -0
  173. package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.h +74 -0
  174. package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.cpp +65 -0
  175. package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.h +91 -0
  176. package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/CorrectnessTests.cpp +772 -0
  177. package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/Example.cpp +12 -0
  178. package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/FileConverter.cpp +486 -0
  179. package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/iconv_sample.c +162 -0
  180. package/deps/simdutf/benchmarks/competition/utf8lut/src/utf8lut.h +15 -0
  181. package/deps/simdutf/benchmarks/competition/utf8sse4/fromutf8-sse.cpp +292 -0
  182. package/deps/simdutf/benchmarks/competition/utfcpp/LICENSE +23 -0
  183. package/deps/simdutf/benchmarks/competition/utfcpp/README.md +1503 -0
  184. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/checked.h +335 -0
  185. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/core.h +338 -0
  186. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp11.h +103 -0
  187. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp17.h +103 -0
  188. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/unchecked.h +274 -0
  189. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8.h +34 -0
  190. package/deps/simdutf/benchmarks/dataset/README.md +155 -0
  191. package/deps/simdutf/benchmarks/dataset/emoji.txt +204 -0
  192. package/deps/simdutf/benchmarks/dataset/scripts/utf8type.py +40 -0
  193. package/deps/simdutf/benchmarks/dataset/wikipedia_mars/Makefile +80 -0
  194. package/deps/simdutf/benchmarks/dataset/wikipedia_mars/convert_to_utf6.py +20 -0
  195. package/deps/simdutf/benchmarks/find/CMakeLists.txt +6 -0
  196. package/deps/simdutf/benchmarks/find/findbenchmark.cpp +63 -0
  197. package/deps/simdutf/benchmarks/find/findbenchmarker.h +46 -0
  198. package/deps/simdutf/benchmarks/shortbench.cpp +555 -0
  199. package/deps/simdutf/benchmarks/src/CMakeLists.txt +52 -0
  200. package/deps/simdutf/benchmarks/src/apple_arm_events.h +1104 -0
  201. package/deps/simdutf/benchmarks/src/benchmark.cpp +3899 -0
  202. package/deps/simdutf/benchmarks/src/benchmark.h +317 -0
  203. package/deps/simdutf/benchmarks/src/benchmark_base.cpp +144 -0
  204. package/deps/simdutf/benchmarks/src/benchmark_base.h +98 -0
  205. package/deps/simdutf/benchmarks/src/cmdline.cpp +176 -0
  206. package/deps/simdutf/benchmarks/src/cmdline.h +35 -0
  207. package/deps/simdutf/benchmarks/src/event_counter.h +162 -0
  208. package/deps/simdutf/benchmarks/src/linux-perf-events.h +104 -0
  209. package/deps/simdutf/benchmarks/stream.cpp +209 -0
  210. package/deps/simdutf/benchmarks/threaded.cpp +123 -0
  211. package/deps/simdutf/cmake/CPM.cmake +1363 -0
  212. package/deps/simdutf/cmake/JoinPaths.cmake +23 -0
  213. package/deps/simdutf/cmake/add_cpp_test.cmake +68 -0
  214. package/deps/simdutf/cmake/simdutf-config.cmake.in +2 -0
  215. package/deps/simdutf/cmake/simdutf-flags.cmake +26 -0
  216. package/deps/simdutf/cmake/toolchains-ci/riscv64-linux-gnu.cmake +4 -0
  217. package/deps/simdutf/cmake/toolchains-dev/README.md +32 -0
  218. package/deps/simdutf/cmake/toolchains-dev/aarch64.cmake +14 -0
  219. package/deps/simdutf/cmake/toolchains-dev/loongarch64.cmake +22 -0
  220. package/deps/simdutf/cmake/toolchains-dev/powerpc64.cmake +16 -0
  221. package/deps/simdutf/cmake/toolchains-dev/powerpc64le.cmake +16 -0
  222. package/deps/simdutf/cmake/toolchains-dev/riscv64.cmake +16 -0
  223. package/deps/simdutf/cmake/toolchains-dev/rvv-spike.cmake +38 -0
  224. package/deps/simdutf/doc/avx512.png +0 -0
  225. package/deps/simdutf/doc/logo.png +0 -0
  226. package/deps/simdutf/doc/logo.svg +165 -0
  227. package/deps/simdutf/doc/node2023.png +0 -0
  228. package/deps/simdutf/doc/shortinput.md +78 -0
  229. package/deps/simdutf/doc/utf16utf8.png +0 -0
  230. package/deps/simdutf/doc/utf8utf16.png +0 -0
  231. package/deps/simdutf/doc/widelogo.png +0 -0
  232. package/deps/simdutf/doxygen.py +50 -0
  233. package/deps/simdutf/fuzz/.clang-format +9 -0
  234. package/deps/simdutf/fuzz/CMakeLists.txt +45 -0
  235. package/deps/simdutf/fuzz/README.md +168 -0
  236. package/deps/simdutf/fuzz/atomic_base64.cpp +448 -0
  237. package/deps/simdutf/fuzz/base64.cpp +278 -0
  238. package/deps/simdutf/fuzz/build.sh +83 -0
  239. package/deps/simdutf/fuzz/conversion.cpp +669 -0
  240. package/deps/simdutf/fuzz/helpers/.clang-format-ignore +1 -0
  241. package/deps/simdutf/fuzz/helpers/common.h +135 -0
  242. package/deps/simdutf/fuzz/helpers/nameof.hpp +1258 -0
  243. package/deps/simdutf/fuzz/main.cpp +72 -0
  244. package/deps/simdutf/fuzz/minimize_and_cleanse.sh +87 -0
  245. package/deps/simdutf/fuzz/misc.cpp +216 -0
  246. package/deps/simdutf/fuzz/random_fuzz.sh +154 -0
  247. package/deps/simdutf/fuzz/roundtrip.cpp +588 -0
  248. package/deps/simdutf/fuzz/safe_conversion.cpp +104 -0
  249. package/deps/simdutf/include/simdutf/avx512.h +79 -0
  250. package/deps/simdutf/include/simdutf/base64_implementation.h +158 -0
  251. package/deps/simdutf/include/simdutf/base64_tables.h +887 -0
  252. package/deps/simdutf/include/simdutf/common_defs.h +186 -0
  253. package/deps/simdutf/include/simdutf/compiler_check.h +50 -0
  254. package/deps/simdutf/include/simdutf/constexpr_ptr.h +138 -0
  255. package/deps/simdutf/include/simdutf/encoding_types.h +189 -0
  256. package/deps/simdutf/include/simdutf/error.h +126 -0
  257. package/deps/simdutf/include/simdutf/implementation.h +7081 -0
  258. package/deps/simdutf/include/simdutf/internal/isadetection.h +325 -0
  259. package/deps/simdutf/include/simdutf/portability.h +285 -0
  260. package/deps/simdutf/include/simdutf/scalar/ascii.h +86 -0
  261. package/deps/simdutf/include/simdutf/scalar/atomic_util.h +105 -0
  262. package/deps/simdutf/include/simdutf/scalar/base64.h +911 -0
  263. package/deps/simdutf/include/simdutf/scalar/latin1.h +26 -0
  264. package/deps/simdutf/include/simdutf/scalar/latin1_to_utf16/latin1_to_utf16.h +52 -0
  265. package/deps/simdutf/include/simdutf/scalar/latin1_to_utf32/latin1_to_utf32.h +27 -0
  266. package/deps/simdutf/include/simdutf/scalar/latin1_to_utf8/latin1_to_utf8.h +191 -0
  267. package/deps/simdutf/include/simdutf/scalar/swap_bytes.h +35 -0
  268. package/deps/simdutf/include/simdutf/scalar/utf16.h +226 -0
  269. package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/utf16_to_latin1.h +108 -0
  270. package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/valid_utf16_to_latin1.h +40 -0
  271. package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/utf16_to_utf32.h +86 -0
  272. package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/valid_utf16_to_utf32.h +44 -0
  273. package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/utf16_to_utf8.h +295 -0
  274. package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/valid_utf16_to_utf8.h +91 -0
  275. package/deps/simdutf/include/simdutf/scalar/utf32.h +82 -0
  276. package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/utf32_to_latin1.h +68 -0
  277. package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/valid_utf32_to_latin1.h +67 -0
  278. package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/utf32_to_utf16.h +84 -0
  279. package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/valid_utf32_to_utf16.h +44 -0
  280. package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/utf32_to_utf8.h +142 -0
  281. package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/valid_utf32_to_utf8.h +72 -0
  282. package/deps/simdutf/include/simdutf/scalar/utf8.h +326 -0
  283. package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/utf8_to_latin1.h +225 -0
  284. package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/valid_utf8_to_latin1.h +87 -0
  285. package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/utf8_to_utf16.h +342 -0
  286. package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/valid_utf8_to_utf16.h +106 -0
  287. package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/utf8_to_utf32.h +299 -0
  288. package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/valid_utf8_to_utf32.h +83 -0
  289. package/deps/simdutf/include/simdutf/simdutf_version.h +26 -0
  290. package/deps/simdutf/include/simdutf.h +26 -0
  291. package/deps/simdutf/include/simdutf_c.h +342 -0
  292. package/deps/simdutf/riscv/Dockerfile +16 -0
  293. package/deps/simdutf/riscv/README.md +24 -0
  294. package/deps/simdutf/riscv/remove-docker-station +8 -0
  295. package/deps/simdutf/riscv/run-docker-station +31 -0
  296. package/deps/simdutf/scripts/.flake8 +2 -0
  297. package/deps/simdutf/scripts/Makefile +2 -0
  298. package/deps/simdutf/scripts/README_ADD_FUNCTION.md +49 -0
  299. package/deps/simdutf/scripts/add_function.py +330 -0
  300. package/deps/simdutf/scripts/amalgamation_tests.py +156 -0
  301. package/deps/simdutf/scripts/base64/Makefile +2 -0
  302. package/deps/simdutf/scripts/base64/README.md +2 -0
  303. package/deps/simdutf/scripts/base64/avx512.py +76 -0
  304. package/deps/simdutf/scripts/base64/neon_decode.py +143 -0
  305. package/deps/simdutf/scripts/base64/neon_generate_lut.py +101 -0
  306. package/deps/simdutf/scripts/base64/sse.py +252 -0
  307. package/deps/simdutf/scripts/base64/sseregular.py +160 -0
  308. package/deps/simdutf/scripts/base64/sseurl.py +283 -0
  309. package/deps/simdutf/scripts/base64/table.py +59 -0
  310. package/deps/simdutf/scripts/base64bench_print.py +145 -0
  311. package/deps/simdutf/scripts/benchmark-all.py +119 -0
  312. package/deps/simdutf/scripts/benchmark_print.py +324 -0
  313. package/deps/simdutf/scripts/check_feature_macros.py +156 -0
  314. package/deps/simdutf/scripts/check_typos.sh +13 -0
  315. package/deps/simdutf/scripts/clang_format.sh +35 -0
  316. package/deps/simdutf/scripts/clang_format_docker.sh +38 -0
  317. package/deps/simdutf/scripts/common.py +24 -0
  318. package/deps/simdutf/scripts/compilation_benchmark.py +55 -0
  319. package/deps/simdutf/scripts/compile_many_variations.sh +64 -0
  320. package/deps/simdutf/scripts/create_latex_table.py +62 -0
  321. package/deps/simdutf/scripts/docker/Dockerfile +14 -0
  322. package/deps/simdutf/scripts/docker/Makefile +9 -0
  323. package/deps/simdutf/scripts/docker/README.md +30 -0
  324. package/deps/simdutf/scripts/docker/llvm.gpg +0 -0
  325. package/deps/simdutf/scripts/ppc64_convert_utf16_to_utf8.py +155 -0
  326. package/deps/simdutf/scripts/prepare_doxygen.sh +21 -0
  327. package/deps/simdutf/scripts/release.py +197 -0
  328. package/deps/simdutf/scripts/shortinputplots.py +97 -0
  329. package/deps/simdutf/scripts/sse_convert_utf16_to_utf8.py +422 -0
  330. package/deps/simdutf/scripts/sse_convert_utf32_to_utf16.py +105 -0
  331. package/deps/simdutf/scripts/sse_utf8_utf16_decode.py +186 -0
  332. package/deps/simdutf/scripts/sse_validate_utf16le_proof.py +137 -0
  333. package/deps/simdutf/scripts/sse_validate_utf16le_testcases.py +129 -0
  334. package/deps/simdutf/scripts/table.py +207 -0
  335. package/deps/simdutf/scripts/tests/new.txt +33 -0
  336. package/deps/simdutf/scripts/tests/old.txt +33 -0
  337. package/deps/simdutf/scripts/tests/results.txt +272 -0
  338. package/deps/simdutf/simdutf.pc.in +11 -0
  339. package/deps/simdutf/singleheader/.flake8 +2 -0
  340. package/deps/simdutf/singleheader/CMakeLists.txt +64 -0
  341. package/deps/simdutf/singleheader/README-dev.md +81 -0
  342. package/deps/simdutf/singleheader/README.md +19 -0
  343. package/deps/simdutf/singleheader/amalgamate.py +513 -0
  344. package/deps/simdutf/singleheader/amalgamation_demo.c +59 -0
  345. package/deps/simdutf/singleheader/amalgamation_demo.cpp +54 -0
  346. package/deps/simdutf/singleheader/test-features.py +262 -0
  347. package/deps/simdutf/src/CMakeLists.txt +78 -0
  348. package/deps/simdutf/src/arm64/arm_base64.cpp +791 -0
  349. package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf16.cpp +24 -0
  350. package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf32.cpp +24 -0
  351. package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf8.cpp +70 -0
  352. package/deps/simdutf/src/arm64/arm_convert_utf16_to_latin1.cpp +61 -0
  353. package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf32.cpp +185 -0
  354. package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf8.cpp +780 -0
  355. package/deps/simdutf/src/arm64/arm_convert_utf32_to_latin1.cpp +60 -0
  356. package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf16.cpp +208 -0
  357. package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf8.cpp +505 -0
  358. package/deps/simdutf/src/arm64/arm_convert_utf8_to_latin1.cpp +69 -0
  359. package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf16.cpp +313 -0
  360. package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf32.cpp +179 -0
  361. package/deps/simdutf/src/arm64/arm_find.cpp +199 -0
  362. package/deps/simdutf/src/arm64/arm_utf16fix.cpp +185 -0
  363. package/deps/simdutf/src/arm64/arm_validate_utf16.cpp +165 -0
  364. package/deps/simdutf/src/arm64/arm_validate_utf32le.cpp +65 -0
  365. package/deps/simdutf/src/arm64/implementation.cpp +1442 -0
  366. package/deps/simdutf/src/encoding_types.cpp +67 -0
  367. package/deps/simdutf/src/error.cpp +3 -0
  368. package/deps/simdutf/src/fallback/implementation.cpp +589 -0
  369. package/deps/simdutf/src/generic/ascii_validation.h +50 -0
  370. package/deps/simdutf/src/generic/base64.h +233 -0
  371. package/deps/simdutf/src/generic/base64lengths.h +63 -0
  372. package/deps/simdutf/src/generic/buf_block_reader.h +109 -0
  373. package/deps/simdutf/src/generic/find.h +75 -0
  374. package/deps/simdutf/src/generic/utf16/change_endianness.h +24 -0
  375. package/deps/simdutf/src/generic/utf16/count_code_points_bytemask.h +58 -0
  376. package/deps/simdutf/src/generic/utf16/to_well_formed.h +93 -0
  377. package/deps/simdutf/src/generic/utf16/utf32_length_from_utf16.h +15 -0
  378. package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16.h +35 -0
  379. package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16_bytemask.h +199 -0
  380. package/deps/simdutf/src/generic/utf16.h +73 -0
  381. package/deps/simdutf/src/generic/utf32.h +136 -0
  382. package/deps/simdutf/src/generic/utf8/utf16_length_from_utf8_bytemask.h +53 -0
  383. package/deps/simdutf/src/generic/utf8.h +92 -0
  384. package/deps/simdutf/src/generic/utf8_to_latin1/utf8_to_latin1.h +316 -0
  385. package/deps/simdutf/src/generic/utf8_to_latin1/valid_utf8_to_latin1.h +78 -0
  386. package/deps/simdutf/src/generic/utf8_to_utf16/utf8_to_utf16.h +332 -0
  387. package/deps/simdutf/src/generic/utf8_to_utf16/valid_utf8_to_utf16.h +74 -0
  388. package/deps/simdutf/src/generic/utf8_to_utf32/utf8_to_utf32.h +318 -0
  389. package/deps/simdutf/src/generic/utf8_to_utf32/valid_utf8_to_utf32.h +42 -0
  390. package/deps/simdutf/src/generic/utf8_validation/utf8_lookup4_algorithm.h +223 -0
  391. package/deps/simdutf/src/generic/utf8_validation/utf8_validator.h +84 -0
  392. package/deps/simdutf/src/generic/validate_utf16.h +164 -0
  393. package/deps/simdutf/src/generic/validate_utf32.h +99 -0
  394. package/deps/simdutf/src/haswell/avx2_base64.cpp +837 -0
  395. package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf16.cpp +28 -0
  396. package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf32.cpp +20 -0
  397. package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf8.cpp +83 -0
  398. package/deps/simdutf/src/haswell/avx2_convert_utf16_to_latin1.cpp +83 -0
  399. package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf32.cpp +210 -0
  400. package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf8.cpp +602 -0
  401. package/deps/simdutf/src/haswell/avx2_convert_utf32_to_latin1.cpp +116 -0
  402. package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf16.cpp +164 -0
  403. package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf8.cpp +569 -0
  404. package/deps/simdutf/src/haswell/avx2_convert_utf8_to_latin1.cpp +60 -0
  405. package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf16.cpp +195 -0
  406. package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf32.cpp +135 -0
  407. package/deps/simdutf/src/haswell/avx2_utf16fix.cpp +173 -0
  408. package/deps/simdutf/src/haswell/avx2_validate_utf16.cpp +17 -0
  409. package/deps/simdutf/src/haswell/implementation.cpp +1447 -0
  410. package/deps/simdutf/src/icelake/icelake_ascii_validation.inl.cpp +19 -0
  411. package/deps/simdutf/src/icelake/icelake_base64.inl.cpp +630 -0
  412. package/deps/simdutf/src/icelake/icelake_common.inl.cpp +37 -0
  413. package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf16.inl.cpp +36 -0
  414. package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf32.inl.cpp +23 -0
  415. package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf8.inl.cpp +107 -0
  416. package/deps/simdutf/src/icelake/icelake_convert_utf16_to_latin1.inl.cpp +103 -0
  417. package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf32.inl.cpp +136 -0
  418. package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf8.inl.cpp +206 -0
  419. package/deps/simdutf/src/icelake/icelake_convert_utf32_to_latin1.inl.cpp +74 -0
  420. package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf16.inl.cpp +338 -0
  421. package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf8.inl.cpp +574 -0
  422. package/deps/simdutf/src/icelake/icelake_convert_utf8_to_latin1.inl.cpp +104 -0
  423. package/deps/simdutf/src/icelake/icelake_convert_utf8_to_utf16.inl.cpp +75 -0
  424. package/deps/simdutf/src/icelake/icelake_convert_valid_utf8_to_latin1.inl.cpp +69 -0
  425. package/deps/simdutf/src/icelake/icelake_find.inl.cpp +146 -0
  426. package/deps/simdutf/src/icelake/icelake_from_utf8.inl.cpp +266 -0
  427. package/deps/simdutf/src/icelake/icelake_from_valid_utf8.inl.cpp +136 -0
  428. package/deps/simdutf/src/icelake/icelake_macros.inl.cpp +143 -0
  429. package/deps/simdutf/src/icelake/icelake_utf16fix.cpp +138 -0
  430. package/deps/simdutf/src/icelake/icelake_utf32_validation.inl.cpp +63 -0
  431. package/deps/simdutf/src/icelake/icelake_utf8_common.inl.cpp +753 -0
  432. package/deps/simdutf/src/icelake/icelake_utf8_length_from_utf16.inl.cpp +269 -0
  433. package/deps/simdutf/src/icelake/icelake_utf8_validation.inl.cpp +116 -0
  434. package/deps/simdutf/src/icelake/implementation.cpp +1903 -0
  435. package/deps/simdutf/src/implementation.cpp +2526 -0
  436. package/deps/simdutf/src/lasx/implementation.cpp +1531 -0
  437. package/deps/simdutf/src/lasx/lasx_base64.cpp +695 -0
  438. package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf16.cpp +76 -0
  439. package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf32.cpp +55 -0
  440. package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf8.cpp +65 -0
  441. package/deps/simdutf/src/lasx/lasx_convert_utf16_to_latin1.cpp +64 -0
  442. package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf32.cpp +183 -0
  443. package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf8.cpp +550 -0
  444. package/deps/simdutf/src/lasx/lasx_convert_utf32_to_latin1.cpp +73 -0
  445. package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf16.cpp +218 -0
  446. package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf8.cpp +589 -0
  447. package/deps/simdutf/src/lasx/lasx_convert_utf8_to_latin1.cpp +72 -0
  448. package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf16.cpp +296 -0
  449. package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf32.cpp +190 -0
  450. package/deps/simdutf/src/lasx/lasx_find.cpp +64 -0
  451. package/deps/simdutf/src/lasx/lasx_validate_utf16.cpp +13 -0
  452. package/deps/simdutf/src/lasx/lasx_validate_utf32le.cpp +84 -0
  453. package/deps/simdutf/src/lsx/implementation.cpp +1417 -0
  454. package/deps/simdutf/src/lsx/lsx_base64.cpp +675 -0
  455. package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf16.cpp +39 -0
  456. package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf32.cpp +27 -0
  457. package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf8.cpp +56 -0
  458. package/deps/simdutf/src/lsx/lsx_convert_utf16_to_latin1.cpp +64 -0
  459. package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf32.cpp +133 -0
  460. package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf8.cpp +518 -0
  461. package/deps/simdutf/src/lsx/lsx_convert_utf32_to_latin1.cpp +66 -0
  462. package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf16.cpp +155 -0
  463. package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf8.cpp +459 -0
  464. package/deps/simdutf/src/lsx/lsx_convert_utf8_to_latin1.cpp +75 -0
  465. package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf16.cpp +291 -0
  466. package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf32.cpp +179 -0
  467. package/deps/simdutf/src/lsx/lsx_find.cpp +60 -0
  468. package/deps/simdutf/src/lsx/lsx_validate_utf16.cpp +13 -0
  469. package/deps/simdutf/src/lsx/lsx_validate_utf32le.cpp +68 -0
  470. package/deps/simdutf/src/ppc64/implementation.cpp +992 -0
  471. package/deps/simdutf/src/ppc64/ppc64_base64.cpp +480 -0
  472. package/deps/simdutf/src/ppc64/ppc64_base64_internal_tests.cpp +401 -0
  473. package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf16.cpp +12 -0
  474. package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf32.cpp +12 -0
  475. package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf8.cpp +149 -0
  476. package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_latin1.cpp +67 -0
  477. package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf32.cpp +87 -0
  478. package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf8.cpp +296 -0
  479. package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_latin1.cpp +57 -0
  480. package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf16.cpp +117 -0
  481. package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf8.cpp +166 -0
  482. package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_latin1.cpp +69 -0
  483. package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf16.cpp +211 -0
  484. package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf32.cpp +153 -0
  485. package/deps/simdutf/src/ppc64/ppc64_utf16_to_utf8_tables.h +1011 -0
  486. package/deps/simdutf/src/ppc64/ppc64_utf8_length_from_latin1.cpp +37 -0
  487. package/deps/simdutf/src/ppc64/ppc64_validate_utf16.cpp +19 -0
  488. package/deps/simdutf/src/ppc64/templates.cpp +91 -0
  489. package/deps/simdutf/src/rvv/implementation.cpp +138 -0
  490. package/deps/simdutf/src/rvv/rvv_find.cpp +27 -0
  491. package/deps/simdutf/src/rvv/rvv_helpers.inl.cpp +23 -0
  492. package/deps/simdutf/src/rvv/rvv_latin1_to.inl.cpp +71 -0
  493. package/deps/simdutf/src/rvv/rvv_length_from.inl.cpp +164 -0
  494. package/deps/simdutf/src/rvv/rvv_utf16_to.inl.cpp +399 -0
  495. package/deps/simdutf/src/rvv/rvv_utf16fix.cpp +110 -0
  496. package/deps/simdutf/src/rvv/rvv_utf32_to.inl.cpp +307 -0
  497. package/deps/simdutf/src/rvv/rvv_utf8_to.inl.cpp +435 -0
  498. package/deps/simdutf/src/rvv/rvv_validate.inl.cpp +275 -0
  499. package/deps/simdutf/src/simdutf/arm64/begin.h +2 -0
  500. package/deps/simdutf/src/simdutf/arm64/bitmanipulation.h +34 -0
  501. package/deps/simdutf/src/simdutf/arm64/end.h +2 -0
  502. package/deps/simdutf/src/simdutf/arm64/implementation.h +307 -0
  503. package/deps/simdutf/src/simdutf/arm64/intrinsics.h +10 -0
  504. package/deps/simdutf/src/simdutf/arm64/simd.h +547 -0
  505. package/deps/simdutf/src/simdutf/arm64/simd16-inl.h +403 -0
  506. package/deps/simdutf/src/simdutf/arm64/simd32-inl.h +129 -0
  507. package/deps/simdutf/src/simdutf/arm64/simd64-inl.h +28 -0
  508. package/deps/simdutf/src/simdutf/arm64.h +43 -0
  509. package/deps/simdutf/src/simdutf/fallback/begin.h +1 -0
  510. package/deps/simdutf/src/simdutf/fallback/bitmanipulation.h +13 -0
  511. package/deps/simdutf/src/simdutf/fallback/end.h +1 -0
  512. package/deps/simdutf/src/simdutf/fallback/implementation.h +331 -0
  513. package/deps/simdutf/src/simdutf/fallback.h +42 -0
  514. package/deps/simdutf/src/simdutf/haswell/begin.h +15 -0
  515. package/deps/simdutf/src/simdutf/haswell/bitmanipulation.h +35 -0
  516. package/deps/simdutf/src/simdutf/haswell/end.h +13 -0
  517. package/deps/simdutf/src/simdutf/haswell/implementation.h +338 -0
  518. package/deps/simdutf/src/simdutf/haswell/intrinsics.h +67 -0
  519. package/deps/simdutf/src/simdutf/haswell/simd.h +363 -0
  520. package/deps/simdutf/src/simdutf/haswell/simd16-inl.h +261 -0
  521. package/deps/simdutf/src/simdutf/haswell/simd32-inl.h +111 -0
  522. package/deps/simdutf/src/simdutf/haswell/simd64-inl.h +34 -0
  523. package/deps/simdutf/src/simdutf/haswell.h +63 -0
  524. package/deps/simdutf/src/simdutf/icelake/begin.h +14 -0
  525. package/deps/simdutf/src/simdutf/icelake/bitmanipulation.h +44 -0
  526. package/deps/simdutf/src/simdutf/icelake/end.h +12 -0
  527. package/deps/simdutf/src/simdutf/icelake/implementation.h +346 -0
  528. package/deps/simdutf/src/simdutf/icelake/intrinsics.h +138 -0
  529. package/deps/simdutf/src/simdutf/icelake/simd.h +17 -0
  530. package/deps/simdutf/src/simdutf/icelake/simd16-inl.h +90 -0
  531. package/deps/simdutf/src/simdutf/icelake/simd32-inl.h +47 -0
  532. package/deps/simdutf/src/simdutf/icelake.h +81 -0
  533. package/deps/simdutf/src/simdutf/lasx/begin.h +8 -0
  534. package/deps/simdutf/src/simdutf/lasx/bitmanipulation.h +25 -0
  535. package/deps/simdutf/src/simdutf/lasx/end.h +8 -0
  536. package/deps/simdutf/src/simdutf/lasx/implementation.h +310 -0
  537. package/deps/simdutf/src/simdutf/lasx/intrinsics.h +319 -0
  538. package/deps/simdutf/src/simdutf/lasx/simd.h +551 -0
  539. package/deps/simdutf/src/simdutf/lasx/simd16-inl.h +234 -0
  540. package/deps/simdutf/src/simdutf/lasx/simd32-inl.h +74 -0
  541. package/deps/simdutf/src/simdutf/lasx/simd64-inl.h +52 -0
  542. package/deps/simdutf/src/simdutf/lasx.h +49 -0
  543. package/deps/simdutf/src/simdutf/lsx/begin.h +2 -0
  544. package/deps/simdutf/src/simdutf/lsx/bitmanipulation.h +25 -0
  545. package/deps/simdutf/src/simdutf/lsx/end.h +2 -0
  546. package/deps/simdutf/src/simdutf/lsx/implementation.h +309 -0
  547. package/deps/simdutf/src/simdutf/lsx/intrinsics.h +196 -0
  548. package/deps/simdutf/src/simdutf/lsx/simd.h +421 -0
  549. package/deps/simdutf/src/simdutf/lsx/simd16-inl.h +242 -0
  550. package/deps/simdutf/src/simdutf/lsx/simd32-inl.h +69 -0
  551. package/deps/simdutf/src/simdutf/lsx/simd64-inl.h +50 -0
  552. package/deps/simdutf/src/simdutf/lsx.h +52 -0
  553. package/deps/simdutf/src/simdutf/ppc64/begin.h +1 -0
  554. package/deps/simdutf/src/simdutf/ppc64/bitmanipulation.h +29 -0
  555. package/deps/simdutf/src/simdutf/ppc64/end.h +1 -0
  556. package/deps/simdutf/src/simdutf/ppc64/implementation.h +348 -0
  557. package/deps/simdutf/src/simdutf/ppc64/intrinsics.h +19 -0
  558. package/deps/simdutf/src/simdutf/ppc64/simd.h +177 -0
  559. package/deps/simdutf/src/simdutf/ppc64/simd16-inl.h +327 -0
  560. package/deps/simdutf/src/simdutf/ppc64/simd32-inl.h +247 -0
  561. package/deps/simdutf/src/simdutf/ppc64/simd8-inl.h +618 -0
  562. package/deps/simdutf/src/simdutf/ppc64.h +40 -0
  563. package/deps/simdutf/src/simdutf/rvv/begin.h +7 -0
  564. package/deps/simdutf/src/simdutf/rvv/end.h +7 -0
  565. package/deps/simdutf/src/simdutf/rvv/implementation.h +321 -0
  566. package/deps/simdutf/src/simdutf/rvv/intrinsics.h +131 -0
  567. package/deps/simdutf/src/simdutf/rvv.h +41 -0
  568. package/deps/simdutf/src/simdutf/westmere/begin.h +8 -0
  569. package/deps/simdutf/src/simdutf/westmere/bitmanipulation.h +37 -0
  570. package/deps/simdutf/src/simdutf/westmere/end.h +8 -0
  571. package/deps/simdutf/src/simdutf/westmere/implementation.h +338 -0
  572. package/deps/simdutf/src/simdutf/westmere/intrinsics.h +38 -0
  573. package/deps/simdutf/src/simdutf/westmere/simd.h +379 -0
  574. package/deps/simdutf/src/simdutf/westmere/simd16-inl.h +242 -0
  575. package/deps/simdutf/src/simdutf/westmere/simd32-inl.h +151 -0
  576. package/deps/simdutf/src/simdutf/westmere/simd64-inl.h +33 -0
  577. package/deps/simdutf/src/simdutf/westmere.h +59 -0
  578. package/deps/simdutf/src/simdutf.cpp +152 -0
  579. package/deps/simdutf/src/simdutf_c.cpp +525 -0
  580. package/deps/simdutf/src/tables/utf16_to_utf8_tables.h +768 -0
  581. package/deps/simdutf/src/tables/utf32_to_utf16_tables.h +53 -0
  582. package/deps/simdutf/src/tables/utf8_to_utf16_tables.h +826 -0
  583. package/deps/simdutf/src/westmere/implementation.cpp +1479 -0
  584. package/deps/simdutf/src/westmere/internal/loader.cpp +7 -0
  585. package/deps/simdutf/src/westmere/internal/write_v_u16_11bits_to_utf8.cpp +66 -0
  586. package/deps/simdutf/src/westmere/sse_base64.cpp +672 -0
  587. package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf16.cpp +21 -0
  588. package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf32.cpp +31 -0
  589. package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf8.cpp +71 -0
  590. package/deps/simdutf/src/westmere/sse_convert_utf16_to_latin1.cpp +70 -0
  591. package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf32.cpp +206 -0
  592. package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf8.cpp +504 -0
  593. package/deps/simdutf/src/westmere/sse_convert_utf32_to_latin1.cpp +82 -0
  594. package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf16.cpp +209 -0
  595. package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf8.cpp +589 -0
  596. package/deps/simdutf/src/westmere/sse_convert_utf8_to_latin1.cpp +58 -0
  597. package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf16.cpp +197 -0
  598. package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf32.cpp +141 -0
  599. package/deps/simdutf/src/westmere/sse_utf16fix.cpp +82 -0
  600. package/deps/simdutf/src/westmere/sse_validate_utf16.cpp +17 -0
  601. package/deps/simdutf/tests/CMakeLists.txt +483 -0
  602. package/deps/simdutf/tests/atomic_base64_tests.cpp +2845 -0
  603. package/deps/simdutf/tests/base64_tests.cpp +3617 -0
  604. package/deps/simdutf/tests/basic_fuzzer.cpp +805 -0
  605. package/deps/simdutf/tests/bele_tests.cpp +182 -0
  606. package/deps/simdutf/tests/constexpr_base64_tests.cpp +387 -0
  607. package/deps/simdutf/tests/convert_latin1_to_utf16be_tests.cpp +52 -0
  608. package/deps/simdutf/tests/convert_latin1_to_utf16le_tests.cpp +80 -0
  609. package/deps/simdutf/tests/convert_latin1_to_utf32_tests.cpp +66 -0
  610. package/deps/simdutf/tests/convert_latin1_to_utf8_tests.cpp +120 -0
  611. package/deps/simdutf/tests/convert_utf16_to_utf8_safe_tests.cpp +203 -0
  612. package/deps/simdutf/tests/convert_utf16_to_utf8_with_replacement_tests.cpp +276 -0
  613. package/deps/simdutf/tests/convert_utf16be_to_latin1_tests.cpp +109 -0
  614. package/deps/simdutf/tests/convert_utf16be_to_latin1_tests_with_errors.cpp +136 -0
  615. package/deps/simdutf/tests/convert_utf16be_to_utf32_tests.cpp +193 -0
  616. package/deps/simdutf/tests/convert_utf16be_to_utf32_with_errors_tests.cpp +381 -0
  617. package/deps/simdutf/tests/convert_utf16be_to_utf8_tests.cpp +259 -0
  618. package/deps/simdutf/tests/convert_utf16be_to_utf8_with_errors_tests.cpp +266 -0
  619. package/deps/simdutf/tests/convert_utf16le_to_latin1_tests.cpp +148 -0
  620. package/deps/simdutf/tests/convert_utf16le_to_latin1_tests_with_errors.cpp +176 -0
  621. package/deps/simdutf/tests/convert_utf16le_to_utf32_tests.cpp +213 -0
  622. package/deps/simdutf/tests/convert_utf16le_to_utf32_with_errors_tests.cpp +318 -0
  623. package/deps/simdutf/tests/convert_utf16le_to_utf8_tests.cpp +343 -0
  624. package/deps/simdutf/tests/convert_utf16le_to_utf8_with_errors_tests.cpp +271 -0
  625. package/deps/simdutf/tests/convert_utf32_to_latin1_tests.cpp +111 -0
  626. package/deps/simdutf/tests/convert_utf32_to_latin1_with_errors_tests.cpp +96 -0
  627. package/deps/simdutf/tests/convert_utf32_to_utf16be_tests.cpp +148 -0
  628. package/deps/simdutf/tests/convert_utf32_to_utf16be_with_errors_tests.cpp +192 -0
  629. package/deps/simdutf/tests/convert_utf32_to_utf16le_tests.cpp +166 -0
  630. package/deps/simdutf/tests/convert_utf32_to_utf16le_with_errors_tests.cpp +215 -0
  631. package/deps/simdutf/tests/convert_utf32_to_utf8_tests.cpp +181 -0
  632. package/deps/simdutf/tests/convert_utf32_to_utf8_with_errors_tests.cpp +261 -0
  633. package/deps/simdutf/tests/convert_utf8_to_latin1_tests.cpp +516 -0
  634. package/deps/simdutf/tests/convert_utf8_to_latin1_with_errors_tests.cpp +579 -0
  635. package/deps/simdutf/tests/convert_utf8_to_utf16be_tests.cpp +412 -0
  636. package/deps/simdutf/tests/convert_utf8_to_utf16be_with_errors_tests.cpp +480 -0
  637. package/deps/simdutf/tests/convert_utf8_to_utf16le_tests.cpp +671 -0
  638. package/deps/simdutf/tests/convert_utf8_to_utf16le_with_errors_tests.cpp +455 -0
  639. package/deps/simdutf/tests/convert_utf8_to_utf32_tests.cpp +1204 -0
  640. package/deps/simdutf/tests/convert_utf8_to_utf32_with_errors_tests.cpp +337 -0
  641. package/deps/simdutf/tests/convert_valid_utf16be_to_latin1_tests.cpp +37 -0
  642. package/deps/simdutf/tests/convert_valid_utf16be_to_utf32_tests.cpp +97 -0
  643. package/deps/simdutf/tests/convert_valid_utf16be_to_utf8_tests.cpp +126 -0
  644. package/deps/simdutf/tests/convert_valid_utf16le_to_latin1_tests.cpp +71 -0
  645. package/deps/simdutf/tests/convert_valid_utf16le_to_utf32_tests.cpp +122 -0
  646. package/deps/simdutf/tests/convert_valid_utf16le_to_utf8_tests.cpp +244 -0
  647. package/deps/simdutf/tests/convert_valid_utf32_to_latin1_tests.cpp +49 -0
  648. package/deps/simdutf/tests/convert_valid_utf32_to_utf16be_tests.cpp +92 -0
  649. package/deps/simdutf/tests/convert_valid_utf32_to_utf16le_tests.cpp +114 -0
  650. package/deps/simdutf/tests/convert_valid_utf32_to_utf8_tests.cpp +109 -0
  651. package/deps/simdutf/tests/convert_valid_utf8_to_latin1_tests.cpp +84 -0
  652. package/deps/simdutf/tests/convert_valid_utf8_to_utf16be_tests.cpp +124 -0
  653. package/deps/simdutf/tests/convert_valid_utf8_to_utf16le_tests.cpp +221 -0
  654. package/deps/simdutf/tests/convert_valid_utf8_to_utf32_tests.cpp +155 -0
  655. package/deps/simdutf/tests/count_utf16be.cpp +64 -0
  656. package/deps/simdutf/tests/count_utf16le.cpp +61 -0
  657. package/deps/simdutf/tests/count_utf8.cpp +87 -0
  658. package/deps/simdutf/tests/detect_encodings_tests.cpp +312 -0
  659. package/deps/simdutf/tests/embed/valid_utf8.txt +1 -0
  660. package/deps/simdutf/tests/embed_tests.cpp +22 -0
  661. package/deps/simdutf/tests/find_tests.cpp +77 -0
  662. package/deps/simdutf/tests/fixed_string_tests.cpp +153 -0
  663. package/deps/simdutf/tests/helpers/CMakeLists.txt +25 -0
  664. package/deps/simdutf/tests/helpers/compiletime_conversions.h +222 -0
  665. package/deps/simdutf/tests/helpers/fixed_string.h +267 -0
  666. package/deps/simdutf/tests/helpers/random_int.cpp +30 -0
  667. package/deps/simdutf/tests/helpers/random_int.h +39 -0
  668. package/deps/simdutf/tests/helpers/random_utf16.cpp +123 -0
  669. package/deps/simdutf/tests/helpers/random_utf16.h +52 -0
  670. package/deps/simdutf/tests/helpers/random_utf32.cpp +41 -0
  671. package/deps/simdutf/tests/helpers/random_utf32.h +40 -0
  672. package/deps/simdutf/tests/helpers/random_utf8.cpp +93 -0
  673. package/deps/simdutf/tests/helpers/random_utf8.h +36 -0
  674. package/deps/simdutf/tests/helpers/test.cpp +231 -0
  675. package/deps/simdutf/tests/helpers/test.h +193 -0
  676. package/deps/simdutf/tests/helpers/transcode_test_base.cpp +1257 -0
  677. package/deps/simdutf/tests/helpers/transcode_test_base.h +683 -0
  678. package/deps/simdutf/tests/helpers/utf16.h +27 -0
  679. package/deps/simdutf/tests/installation_tests/find/CMakeLists.txt +43 -0
  680. package/deps/simdutf/tests/installation_tests/from_fetch/CMakeLists.txt +47 -0
  681. package/deps/simdutf/tests/internal_tests.cpp +27 -0
  682. package/deps/simdutf/tests/null_safety_tests.cpp +94 -0
  683. package/deps/simdutf/tests/random_fuzzer.cpp +779 -0
  684. package/deps/simdutf/tests/readme_tests.cpp +274 -0
  685. package/deps/simdutf/tests/reference/CMakeLists.txt +23 -0
  686. package/deps/simdutf/tests/reference/decode_utf16.h +81 -0
  687. package/deps/simdutf/tests/reference/decode_utf32.h +47 -0
  688. package/deps/simdutf/tests/reference/encode_latin1.cpp +1 -0
  689. package/deps/simdutf/tests/reference/encode_latin1.h +32 -0
  690. package/deps/simdutf/tests/reference/encode_utf16.cpp +49 -0
  691. package/deps/simdutf/tests/reference/encode_utf16.h +20 -0
  692. package/deps/simdutf/tests/reference/encode_utf32.cpp +1 -0
  693. package/deps/simdutf/tests/reference/encode_utf32.h +36 -0
  694. package/deps/simdutf/tests/reference/encode_utf8.cpp +1 -0
  695. package/deps/simdutf/tests/reference/encode_utf8.h +40 -0
  696. package/deps/simdutf/tests/reference/validate_utf16.cpp +60 -0
  697. package/deps/simdutf/tests/reference/validate_utf16.h +14 -0
  698. package/deps/simdutf/tests/reference/validate_utf16_to_latin1.cpp +35 -0
  699. package/deps/simdutf/tests/reference/validate_utf16_to_latin1.h +13 -0
  700. package/deps/simdutf/tests/reference/validate_utf32.cpp +27 -0
  701. package/deps/simdutf/tests/reference/validate_utf32.h +12 -0
  702. package/deps/simdutf/tests/reference/validate_utf32_to_latin1.cpp +27 -0
  703. package/deps/simdutf/tests/reference/validate_utf32_to_latin1.h +12 -0
  704. package/deps/simdutf/tests/reference/validate_utf8.cpp +82 -0
  705. package/deps/simdutf/tests/reference/validate_utf8.h +11 -0
  706. package/deps/simdutf/tests/reference/validate_utf8_to_latin1.cpp +43 -0
  707. package/deps/simdutf/tests/reference/validate_utf8_to_latin1.h +12 -0
  708. package/deps/simdutf/tests/select_implementation.cpp +43 -0
  709. package/deps/simdutf/tests/simdutf_c_tests.cpp +244 -0
  710. package/deps/simdutf/tests/span_tests.cpp +401 -0
  711. package/deps/simdutf/tests/special_tests.cpp +559 -0
  712. package/deps/simdutf/tests/straight_c_test.c +187 -0
  713. package/deps/simdutf/tests/text_encoding_tests.cpp +77 -0
  714. package/deps/simdutf/tests/to_well_formed_utf16_tests.cpp +377 -0
  715. package/deps/simdutf/tests/utf8_length_from_utf16_tests.cpp +202 -0
  716. package/deps/simdutf/tests/validate_ascii_basic_tests.cpp +165 -0
  717. package/deps/simdutf/tests/validate_ascii_with_errors_tests.cpp +77 -0
  718. package/deps/simdutf/tests/validate_utf16be_basic_tests.cpp +175 -0
  719. package/deps/simdutf/tests/validate_utf16be_with_errors_tests.cpp +188 -0
  720. package/deps/simdutf/tests/validate_utf16le_basic_tests.cpp +268 -0
  721. package/deps/simdutf/tests/validate_utf16le_with_errors_tests.cpp +274 -0
  722. package/deps/simdutf/tests/validate_utf32_basic_tests.cpp +92 -0
  723. package/deps/simdutf/tests/validate_utf32_with_errors_tests.cpp +114 -0
  724. package/deps/simdutf/tests/validate_utf8_basic_tests.cpp +178 -0
  725. package/deps/simdutf/tests/validate_utf8_brute_force_tests.cpp +88 -0
  726. package/deps/simdutf/tests/validate_utf8_puzzler_tests.cpp +33 -0
  727. package/deps/simdutf/tests/validate_utf8_with_errors_tests.cpp +228 -0
  728. package/deps/simdutf/tools/CMakeLists.txt +85 -0
  729. package/deps/simdutf/tools/fastbase64.cpp +250 -0
  730. package/deps/simdutf/tools/sutf.cpp +556 -0
  731. package/deps/simdutf/tools/sutf.h +40 -0
  732. package/lib/commonjs/blake3.js +2 -1
  733. package/lib/commonjs/blake3.js.map +1 -1
  734. package/lib/commonjs/diffie-hellman.js +5 -4
  735. package/lib/commonjs/diffie-hellman.js.map +1 -1
  736. package/lib/commonjs/ecdh.js +5 -4
  737. package/lib/commonjs/ecdh.js.map +1 -1
  738. package/lib/module/blake3.js +2 -1
  739. package/lib/module/blake3.js.map +1 -1
  740. package/lib/module/diffie-hellman.js +5 -4
  741. package/lib/module/diffie-hellman.js.map +1 -1
  742. package/lib/module/ecdh.js +5 -4
  743. package/lib/module/ecdh.js.map +1 -1
  744. package/lib/tsconfig.tsbuildinfo +1 -1
  745. package/lib/typescript/blake3.d.ts.map +1 -1
  746. package/lib/typescript/diffie-hellman.d.ts.map +1 -1
  747. package/lib/typescript/ecdh.d.ts.map +1 -1
  748. package/package.json +2 -2
  749. package/src/blake3.ts +2 -1
  750. package/src/diffie-hellman.ts +5 -7
  751. package/src/ecdh.ts +5 -8
@@ -0,0 +1,166 @@
1
+ struct utf32_to_utf8_t { // result triple returned by ppc64_convert_utf32_to_utf8
2
+ error_code err; // status; this file returns SUCCESS, SURROGATE or TOO_LARGE
3
+ const char32_t *input; // input position handed back to the caller (buf, or buf + k on a scalar error)
4
+ char *output; // UTF-8 output position handed back to the caller
5
+ };
6
+
7
+ template <ErrorReporting er> // `er` selects how surrogate errors are handled (precise / at_the_end / none)
8
+ utf32_to_utf8_t ppc64_convert_utf32_to_utf8(const char32_t *buf, size_t len,
9
+ char *utf8_output) { // converts SIMD-sized chunks only; returns where it stopped, so input may remain
10
+ const char32_t *end = buf + len;
11
+
12
+ const auto v_f800 = vector_u16::splat(0xf800);
13
+ const auto v_d800 = vector_u16::splat(0xd800);
14
+
15
+ const auto v_ffff0000 = vector_u32::splat(0xffff0000);
16
+ const auto v_00000000 = vector_u32::zero();
17
+ auto forbidden_bytemask = simd16<bool>();
18
+ const size_t safety_margin =
19
+ 12; // to avoid overruns, see issue
20
+ // https://github.com/simdutf/simdutf/issues/92
21
+
22
+ while (end - buf >=
23
+ std::ptrdiff_t(
24
+ 16 + safety_margin)) { // buf is a char32_t pointer, each char32_t
25
+ // has 4 bytes or 32 bits, thus buf + 16 *
26
+ // char32_t = 512 bits = 64 bytes
27
+ // We load two 16-byte registers for a total of 32 bytes.
28
+ // Together these two values hold 8 UTF-32 code units.
29
+ auto in0 = vector_u32::load(buf);
30
+ auto in1 = vector_u32::load(buf + vector_u32::ELEMENTS);
31
+
32
+ // Pack 32-bit UTF-32 code units to 16-bit UTF-16 code units with unsigned
33
+ // saturation
34
+ auto in = vector_u32::pack(in0, in1);
35
+
36
+ // Try to apply UTF-16 => UTF-8 from ./ppc64_convert_utf16_to_utf8.cpp
37
+
38
+ // Check for ASCII fast path
39
+
40
+ // ASCII fast path!!!!
41
+ // We eagerly load another 32 bytes, hoping that they will be ASCII too.
42
+ // The intuition is that we try to collect 16 ASCII characters which
43
+ // requires a total of 64 bytes of input. If we fail, we just pass in2
44
+ // and in3 as our new inputs.
45
+ if (in.is_ascii()) { // if the first two blocks are ASCII
46
+ const auto in2 = vector_u32::load(buf + 2 * vector_u32::ELEMENTS);
47
+ const auto in3 = vector_u32::load(buf + 3 * vector_u32::ELEMENTS);
48
+
49
+ const auto next = vector_u32::pack(in2, in3);
50
+ if (next.is_ascii()) {
51
+ // 1. pack the bytes
52
+ const auto utf8_packed = vector_u16::pack(in, next);
53
+ // 2. store (16 bytes)
54
+ utf8_packed.store(utf8_output);
55
+ // 3. adjust pointers
56
+ buf += 16;
57
+ utf8_output += 16;
58
+ continue; // we are done for this round!
59
+ }
60
+
61
+ // `next` is not ASCII, write `in` and carry on with next
62
+
63
+ // 1. pack the bytes
64
+ const auto utf8_packed = vector_u16::pack(in, in);
65
+ utf8_packed.store(utf8_output); // 2. store; only the first 8 bytes are kept (output advances by 8)
66
+ // 3. adjust pointers
67
+ buf += 8;
68
+ utf8_output += 8;
69
+
70
+ // Proceed with next input
71
+ in = next;
72
+ in0 = in2;
73
+ in1 = in3;
74
+ }
75
+
76
+ // no bits set above 7th bit
77
+ const auto one_byte_bytemask = in < uint16_t(1 << 7);
78
+ const uint16_t one_byte_bitmask = one_byte_bytemask.to_bitmask();
79
+
80
+ // no bits set above 11th bit
81
+ const auto one_or_two_bytes_bytemask = in < uint16_t(1 << 11);
82
+ const uint16_t one_or_two_bytes_bitmask =
83
+ one_or_two_bytes_bytemask.to_bitmask();
84
+
85
+ if (one_or_two_bytes_bitmask == 0xffff) {
86
+ write_v_u16_11bits_to_utf8(
87
+ in, utf8_output, as_vector_u8(one_byte_bytemask), one_byte_bitmask);
88
+ buf += 8;
89
+ continue;
90
+ }
91
+
92
+ // Check for overflow in packing
93
+ const auto saturation_bytemask = ((in0 | in1) & v_ffff0000) == v_00000000;
94
+ const uint16_t saturation_bitmask = saturation_bytemask.to_bitmask();
95
+ if (saturation_bitmask == 0xffff) { // no input word has bits set above bit 15
96
+ switch (er) {
97
+ case ErrorReporting::precise: {
98
+ const auto forbidden = (in & v_f800) == v_d800; // lanes in the surrogate range 0xD800..0xDFFF
99
+ if (forbidden.any()) {
100
+ // We return no error code, instead we force the scalar procedure
101
+ // to rescan the portion of input where we've just found an error.
102
+ return utf32_to_utf8_t{error_code::SUCCESS, buf, utf8_output};
103
+ }
104
+ } break;
105
+ case ErrorReporting::at_the_end:
106
+ forbidden_bytemask |= (in & v_f800) == v_d800;
107
+ break;
108
+ case ErrorReporting::none:
109
+ break;
110
+ }
111
+
112
+ ppc64_convert_utf16_to_1_2_3_bytes_of_utf8(
113
+ in, one_byte_bitmask, one_or_two_bytes_bytemask,
114
+ one_or_two_bytes_bitmask, utf8_output);
115
+ buf += 8;
116
+ } else {
117
+ // case: at least one 32-bit word produces a surrogate pair in UTF-16 <=>
118
+ // will produce four UTF-8 bytes. Let us do a scalar fallback. It may seem
119
+ // wasteful to use scalar code, but being efficient with SIMD in the
120
+ // presence of surrogate pairs may require non-trivial tables.
121
+ size_t forward = 15;
122
+ size_t k = 0;
123
+ if (size_t(end - buf) < forward + 1) {
124
+ forward = size_t(end - buf - 1);
125
+ }
126
+ for (; k < forward; k++) {
127
+ uint32_t word = buf[k];
128
+ if ((word & 0xFFFFFF80) == 0) {
129
+ *utf8_output++ = char(word);
130
+ } else if ((word & 0xFFFFF800) == 0) {
131
+ *utf8_output++ = char((word >> 6) | 0b11000000);
132
+ *utf8_output++ = char((word & 0b111111) | 0b10000000);
133
+ } else if ((word & 0xFFFF0000) == 0) {
134
+ if (er != ErrorReporting::none and
135
+ (word >= 0xD800 && word <= 0xDFFF)) {
136
+ return utf32_to_utf8_t{error_code::SURROGATE, buf + k, utf8_output};
137
+ }
138
+ *utf8_output++ = char((word >> 12) | 0b11100000);
139
+ *utf8_output++ = char(((word >> 6) & 0b111111) | 0b10000000);
140
+ *utf8_output++ = char((word & 0b111111) | 0b10000000);
141
+ } else {
142
+ if (er != ErrorReporting::none and (word > 0x10FFFF)) {
143
+ return utf32_to_utf8_t{error_code::TOO_LARGE, buf + k, utf8_output};
144
+ }
145
+ *utf8_output++ = char((word >> 18) | 0b11110000);
146
+ *utf8_output++ = char(((word >> 12) & 0b111111) | 0b10000000);
147
+ *utf8_output++ = char(((word >> 6) & 0b111111) | 0b10000000);
148
+ *utf8_output++ = char((word & 0b111111) | 0b10000000);
149
+ }
150
+ }
151
+ buf += k;
152
+ }
153
+ } // while
154
+
155
+ if (er == ErrorReporting::at_the_end) {
156
+ if (forbidden_bytemask.any()) {
157
+ return utf32_to_utf8_t{error_code::SURROGATE, buf, utf8_output};
158
+ }
159
+ }
160
+
161
+ return utf32_to_utf8_t{
162
+ error_code::SUCCESS,
163
+ buf,
164
+ utf8_output,
165
+ };
166
+ }
@@ -0,0 +1,69 @@
1
+ // depends on "tables/utf8_to_utf16_tables.h"
2
+
3
+ // Convert up to 12 bytes from UTF-8 to Latin-1 using a mask indicating the
4
+ // end of the code points. Only the least significant 12 bits of the mask
5
+ // are used for the table lookup. latin1_output is advanced by 12 or by 6.
6
+ // It returns how many bytes were consumed (up to 12).
7
+ size_t convert_masked_utf8_to_latin1(const char *input,
8
+ uint64_t utf8_end_of_code_point_mask,
9
+ char *&latin1_output) {
10
+ // we use an approach where we try to process up to 12 input bytes.
11
+ // Why 12 input bytes and not 16? Because we are concerned with the size of
12
+ // the lookup tables. Also 12 is nicely divisible by two and three.
13
+ //
14
+ //
15
+ // Optimization note: our main path below is load-latency dependent. Thus it
16
+ // is maybe beneficial to have fast paths that depend on branch prediction but
17
+ // have less latency. This results in more instructions but, potentially, also
18
+ // higher speeds.
19
+ //
20
+ const auto in = vector_u8::load(input);
21
+ const uint16_t input_utf8_end_of_code_point_mask =
22
+ utf8_end_of_code_point_mask &
23
+ 0xfff; // we are only processing 12 bytes in case it is not all ASCII
24
+ if (utf8_end_of_code_point_mask == 0xfff) { // NOTE(review): tests the full 64-bit mask, not input_utf8_end_of_code_point_mask - confirm intended
25
+ // We process the data in chunks of 12 bytes.
26
+ in.store(latin1_output);
27
+ latin1_output += 12; // We wrote 12 characters.
28
+ return 12; // We consumed 12 bytes.
29
+ }
30
+ /// We do not have a fast path available, so we fall back to the table lookup.
31
+ const uint8_t idx =
32
+ tables::utf8_to_utf16::utf8bigindex[input_utf8_end_of_code_point_mask][0];
33
+ const uint8_t consumed =
34
+ tables::utf8_to_utf16::utf8bigindex[input_utf8_end_of_code_point_mask][1];
35
+ // this indicates an invalid input:
36
+ if (idx >= 64) {
37
+ return consumed;
38
+ }
39
+ // Here we should have (idx < 64), if not, there is a bug in the validation or
40
+ // elsewhere. This is a relatively easy scenario: we process SIX (6) input
41
+ // code units. The max length in bytes of six code units spanning between
42
+ // 1 and 2 bytes each is 12 bytes. On
43
+ // processors where pdep/pext is fast, we might be able to use a small lookup
44
+ // table.
45
+
46
+ const auto reshuffle = vector_u8::load(&tables::utf8_to_utf16::shufutf8[idx]);
47
+ const auto perm8 = reshuffle.lookup_32(in, vector_u8::zero());
48
+ #if SIMDUTF_IS_BIG_ENDIAN
49
+ const auto perm16 = as_vector_u16(perm8).swap_bytes();
50
+ #else
51
+ const auto perm16 = as_vector_u16(perm8);
52
+ #endif // SIMDUTF_IS_BIG_ENDIAN
53
+ const auto ascii = perm16 & uint16_t(0x7f);
54
+ const auto highbyte = perm16 & uint16_t(0x1f00);
55
+ const auto composed = ascii | highbyte.shr<2>();
56
+
57
+ const auto latin1_packed = vector_u16::pack(composed, composed);
58
+ #if defined(__clang__)
59
+ __attribute__((aligned(16))) char buf[16];
60
+ latin1_packed.store(buf);
61
+ memcpy(latin1_output, buf, 6);
62
+ #else
63
+ // writing 8 bytes even though we only care about the first 6 bytes.
64
+ const auto tmp = vec_u64_t(latin1_packed.value);
65
+ memcpy(latin1_output, &tmp[0], 8);
66
+ #endif
67
+ latin1_output += 6; // We wrote 6 bytes.
68
+ return consumed;
69
+ }
@@ -0,0 +1,211 @@
1
+ // depends on "tables/utf8_to_utf16_tables.h"
2
+
3
+ // Convert a short run of UTF-8 bytes at `input` to UTF-16 using a mask indicating the
4
+ // end of the code points. The table-driven paths use only the least significant 12 bits
5
+ // of the mask; the all-two-byte fast path tests the low 16 bits.
6
+ // It returns how many input bytes were consumed (12 or 16 on the fast paths, otherwise the value read from the lookup table); utf16_output is advanced past the code units written.
7
+ template <endianness big_endian>
8
+ size_t convert_masked_utf8_to_utf16(const char *input,
9
+ uint64_t utf8_end_of_code_point_mask,
10
+ char16_t *&utf16_output) {
11
+ // We use an approach where we try to process up to 12 input bytes.
12
+ // Why 12 input bytes and not 16? Because we are concerned with the size of
13
+ // the lookup tables. Also 12 is nicely divisible by two and three.
14
+ //
15
+ //
16
+ // Optimization note: our main path below is load-latency dependent. Thus it
17
+ // is maybe beneficial to have fast paths that depend on branch prediction but
18
+ // have less latency. This results in more instructions but, potentially, also
19
+ // higher speeds.
20
+ //
21
+ // We first try a few fast paths.
22
+ const auto in = vector_u8::load(input); // presumably a full 16-byte vector load (the 0xaaaa path consumes 16 bytes) - confirm against vector_u8
23
+ const uint16_t input_utf8_end_of_code_point_mask =
24
+ utf8_end_of_code_point_mask & 0xfff;
25
+ if (utf8_end_of_code_point_mask == 0xfff) { // NOTE(review): compares the unmasked 64-bit mask, so any set bit above bit 11 skips this ASCII path
26
+ // We process the data in chunks of 12 bytes.
27
+ // Note: using 16 bytes is unsafe, see issue_ossfuzz_71218
28
+ in.store_bytes_as_utf16<big_endian>(utf16_output);
29
+ utf16_output += 12; // We wrote 12 16-bit characters.
30
+ return 12; // We consumed 12 bytes.
31
+ }
32
+ if (((utf8_end_of_code_point_mask & 0xFFFF) == 0xaaaa)) {
33
+ // We want to take 8 2-byte UTF-8 sequences and turn them into 8 2-byte
34
+ // UTF-16 code units. This path looks at 16 mask bits and consumes 16 bytes.
35
+ #if SIMDUTF_IS_BIG_ENDIAN
36
+ const auto in16 = as_vector_u16(in);
37
+ #else
38
+ const auto in16 = as_vector_u16(in).swap_bytes();
39
+ #endif // SIMDUTF_IS_BIG_ENDIAN
40
+ const auto lo = in16 & uint16_t(0x007f);
41
+ const auto hi = in16.shr<2>();
42
+
43
+ auto composed = select(uint16_t(0x1f00 >> 2), hi, lo);
44
+ if simdutf_constexpr (!match_system(big_endian)) {
45
+ composed = composed.swap_bytes();
46
+ }
47
+
48
+ composed.store(utf16_output);
49
+ utf16_output += 8; // We wrote 16 bytes, 8 code points.
50
+ return 16;
51
+ }
52
+ if (input_utf8_end_of_code_point_mask == 0x924) {
53
+ // We want to take 4 3-byte UTF-8 sequences and turn them into 4 2-byte
54
+ // UTF-16 code units. There is probably a more efficient sequence, but the
55
+ // following might do.
56
+
57
+ // AltiVec: this might be done better; for now it is a translation of the SSE code.
58
+
59
+ const auto sh =
60
+ vector_u8(2, 1, 0, 16, 5, 4, 3, 16, 8, 7, 6, 16, 11, 10, 9, 16);
61
+ #if SIMDUTF_IS_BIG_ENDIAN
62
+ const auto perm =
63
+ as_vector_u32(sh.lookup_32(in, vector_u8::zero())).swap_bytes();
64
+ #else
65
+ const auto perm = as_vector_u32(sh.lookup_32(in, vector_u8::zero()));
66
+ #endif // SIMDUTF_IS_BIG_ENDIAN
67
+ const auto b0 = perm & uint32_t(0x0000007f);
68
+ const auto b1 = select(uint32_t(0x00003f00 >> 2), perm.shr<2>(), b0);
69
+ const auto b2 = select(uint32_t(0x000f0000 >> 4), perm.shr<4>(), b1);
70
+ const auto composed = b2;
71
+ auto packed = vector_u32::pack(composed, composed);
72
+
73
+ if simdutf_constexpr (!match_system(big_endian)) {
74
+ packed = packed.swap_bytes();
75
+ }
76
+
77
+ packed.store(utf16_output);
78
+ utf16_output += 4;
79
+ return 12;
80
+ }
81
+ /// No fast path applies, so we fall back to the lookup table: utf8bigindex, keyed by the 12-bit mask, yields a shuffle index (idx) and the number of input bytes to consume.
82
+
83
+ const uint8_t idx =
84
+ tables::utf8_to_utf16::utf8bigindex[input_utf8_end_of_code_point_mask][0];
85
+ const uint8_t consumed =
86
+ tables::utf8_to_utf16::utf8bigindex[input_utf8_end_of_code_point_mask][1];
87
+
88
+ if (idx < 64) {
89
+ // SIX (6) input code points.
90
+ // This is a relatively easy scenario:
91
+ // we process SIX (6) input code points. The max length in bytes of six
92
+ // code points spanning between 1 and 2 bytes each is 12 bytes. On
93
+ // processors where pdep/pext is fast, we might be able to use a small
94
+ // lookup table.
95
+ const auto sh = vector_u8::load(&tables::utf8_to_utf16::shufutf8[idx]);
96
+ #if SIMDUTF_IS_BIG_ENDIAN
97
+ const auto perm =
98
+ as_vector_u16(sh.lookup_32(in, vector_u8::zero())).swap_bytes();
99
+ #else
100
+ const auto perm = as_vector_u16(sh.lookup_32(in, vector_u8::zero()));
101
+ #endif // SIMDUTF_IS_BIG_ENDIAN
102
+ const auto b0 = perm & uint16_t(0x007f);
103
+ const auto b1 = perm & uint16_t(0x1f00);
104
+
105
+ auto composed = b0 | b1.shr<2>();
106
+
107
+ if simdutf_constexpr (!match_system(big_endian)) {
108
+ composed = composed.swap_bytes();
109
+ }
110
+
111
+ composed.store(utf16_output);
112
+ utf16_output += 6; // We wrote 12 bytes, 6 code points.
113
+ } else if (idx < 145) {
114
+ // FOUR (4) input code points (the masks below handle up to three bytes each).
115
+ const auto sh = vector_u8::load(&tables::utf8_to_utf16::shufutf8[idx]);
116
+ #if SIMDUTF_IS_BIG_ENDIAN
117
+ const auto perm =
118
+ as_vector_u32(sh.lookup_32(in, vector_u8::zero())).swap_bytes();
119
+ #else
120
+ const auto perm = as_vector_u32(sh.lookup_32(in, vector_u8::zero()));
121
+ #endif // SIMDUTF_IS_BIG_ENDIAN
122
+ const auto b0 = perm & uint32_t(0x0000007f);
123
+ const auto b1 = perm & uint32_t(0x00003f00);
124
+ const auto b2 = perm & uint32_t(0x000f0000);
125
+
126
+ const auto composed = b0 | b1.shr<2>() | b2.shr<4>();
127
+
128
+ auto packed = vector_u32::pack(composed, composed);
129
+
130
+ if simdutf_constexpr (!match_system(big_endian)) {
131
+ packed = packed.swap_bytes();
132
+ }
133
+
134
+ packed.store(utf16_output);
135
+ utf16_output += 4;
136
+ } else if (idx < 209) {
137
+ // THREE (3) input code points (the scalar loop below emits three), each up to four bytes long.
138
+ //////////////
139
+ // There might be garbage inputs where a leading byte masquerades as a
140
+ // four-byte leading byte (by being followed by 3 continuation bytes), but is
141
+ // not greater than 0xf0. This could trigger a buffer overflow if we only
142
+ // counted leading bytes of the form 0xf0 as generating surrogate pairs,
143
+ // without further UTF-8 validation. Thus we must be careful to ensure that
144
+ // only leading bytes at least as large as 0xf0 generate surrogate pairs. We
145
+ // do so at the cost of an extra mask.
146
+ /////////////
147
+ const auto sh = vector_u8::load(&tables::utf8_to_utf16::shufutf8[idx]);
148
+ #if SIMDUTF_IS_BIG_ENDIAN
149
+ const auto perm =
150
+ as_vector_u32(sh.lookup_32(in, vector_u8::zero())).swap_bytes();
151
+ #else
152
+ const auto perm = as_vector_u32(sh.lookup_32(in, vector_u8::zero()));
153
+ #endif // SIMDUTF_IS_BIG_ENDIAN
154
+ const auto ascii = perm & uint32_t(0x00000007f);
155
+ const auto middlebyte = perm & uint32_t(0x00003f00);
156
+ const auto middlebyte_shifted = middlebyte.shr<2>();
157
+
158
+ auto middlehighbyte = perm & uint32_t(0x003f0000);
159
+ // Correct for a spurious high bit: bit 22 of perm, shifted right by one, is XORed into bit 21.
160
+
161
+ const auto correct = (perm & uint32_t(0x00400000)).shr<1>();
162
+ middlehighbyte = correct ^ middlehighbyte;
163
+ const auto middlehighbyte_shifted = middlehighbyte.shr<4>();
164
+ // We deliberately carry the leading four bits in highbyte if they are
165
+ // present, we remove them later when computing hightenbits.
166
+ const auto highbyte = perm & uint32_t(0xff000000);
167
+ const auto highbyte_shifted = highbyte.shr<6>();
168
+ // When we need to generate a surrogate pair (leading byte >= 0xF0), then
169
+ // the corresponding 32-bit value in 'composed' carries the shifted leading
170
+ // byte, (0xf0000000>>6) == 0x3c00000, in its upper bits. The loop below tests
171
+ // composed > 0x3c00000 to identify the location of the surrogate pairs.
172
+ const auto composed =
173
+ ascii | middlebyte_shifted | highbyte_shifted | middlehighbyte_shifted;
174
+
175
+ const auto composedminus = composed - uint32_t(0x10000);
176
+ const auto lowtenbits = composedminus & uint32_t(0x3ff);
177
+ // Notice the 0x3ff mask: it also drops the leading-byte bits carried in highbyte.
178
+ const auto hightenbits = composedminus.shr<10>() & uint32_t(0x3ff);
179
+ const auto lowtenbitsadd = lowtenbits + uint32_t(0xDC00);
180
+ const auto hightenbitsadd = hightenbits + uint32_t(0xD800);
181
+ const auto lowtenbitsaddshifted = lowtenbitsadd.shl<16>();
182
+ auto surrogates = hightenbitsadd | lowtenbitsaddshifted;
183
+
184
+ uint32_t basic_buffer[4];
185
+ composed.store(basic_buffer);
186
+ uint32_t surrogate_buffer[4];
187
+ surrogates.swap_bytes().store(surrogate_buffer); // stored byte-swapped; the loop below undoes the swap when the target order matches the system
188
+
189
+ for (size_t i = 0; i < 3; i++) {
190
+ if (basic_buffer[i] > 0x3c00000) {
191
+ const auto ch0 = uint16_t(surrogate_buffer[i] & 0xffff);
192
+ const auto ch1 = uint16_t(surrogate_buffer[i] >> 16);
193
+ if (match_system(big_endian)) { // NOTE(review): plain `if` here, whereas the rest of this function uses `if simdutf_constexpr`
194
+ utf16_output[1] = scalar::u16_swap_bytes(ch0);
195
+ utf16_output[0] = scalar::u16_swap_bytes(ch1);
196
+ } else {
197
+ utf16_output[1] = ch0;
198
+ utf16_output[0] = ch1;
199
+ }
200
+ utf16_output += 2;
201
+ } else {
202
+ const auto chr = uint16_t(basic_buffer[i]);
203
+ utf16_output[0] = scalar::utf16::swap_if_needed<big_endian>(chr);
204
+ utf16_output++;
205
+ }
206
+ }
207
+ } else {
208
+ // Here we know that there is an error but we do not handle errors: nothing is written, and the table's `consumed` value is still returned.
209
+ }
210
+ return consumed;
211
+ }
@@ -0,0 +1,153 @@
1
+ // depends on "tables/utf8_to_utf16_tables.h"
2
+
3
+ // Convert a short run of UTF-8 bytes at `input` to UTF-32 using a mask indicating the
4
+ // end of the code points. The table-driven paths use only the least significant 12 bits
5
+ // of the mask; the all-two-byte fast path tests the low 16 bits.
6
+ // It returns how many input bytes were consumed (12 or 16 on the fast paths, otherwise the value read from the lookup table); utf32_output is advanced past the code points written.
7
+ size_t convert_masked_utf8_to_utf32(const char *input,
8
+ uint64_t utf8_end_of_code_point_mask,
9
+ char32_t *&utf32_output) {
10
+ // We use an approach where we try to process up to 12 input bytes.
11
+ // Why 12 input bytes and not 16? Because we are concerned with the size of
12
+ // the lookup tables. Also 12 is nicely divisible by two and three.
13
+ //
14
+ //
15
+ // Optimization note: our main path below is load-latency dependent. Thus it
16
+ // is maybe beneficial to have fast paths that depend on branch prediction but
17
+ // have less latency. This results in more instructions but, potentially, also
18
+ // higher speeds.
19
+ //
20
+ // We first try a few fast paths.
21
+ const auto in = vector_u8::load(input); // presumably a full 16-byte vector load (the 0xaaaa path consumes 16 bytes) - confirm against vector_u8
22
+ const uint16_t input_utf8_end_of_code_point_mask =
23
+ utf8_end_of_code_point_mask & 0xfff;
24
+ if (utf8_end_of_code_point_mask == 0xfff) { // NOTE(review): compares the unmasked 64-bit mask, so any set bit above bit 11 skips this ASCII path
25
+ // We process the data in chunks of 12 bytes.
26
+ in.store_bytes_as_utf32(utf32_output);
27
+ utf32_output += 12; // We wrote 12 32-bit characters.
28
+ return 12; // We consumed 12 bytes.
29
+ }
30
+ if (((utf8_end_of_code_point_mask & 0xffff) == 0xaaaa)) {
31
+ // We want to take 8 2-byte UTF-8 sequences and turn them into 8 4-byte
32
+ // UTF-32 code units. This path looks at 16 mask bits and consumes 16 bytes.
33
+ #if SIMDUTF_IS_BIG_ENDIAN
34
+ const auto perm = as_vector_u16(in);
35
+ #else
36
+ const auto perm = as_vector_u16(in).swap_bytes();
37
+ #endif // SIMDUTF_IS_BIG_ENDIAN
38
+ // in = [110aaaaa|10bbbbbb]
39
+ // t0 = [00000000|00bbbbbb]
40
+ const auto t0 = perm & uint16_t(0x007f);
41
+
42
+ // t1 = [00110aaa|aa10bbbb] (in >> 2); select presumably takes the aaaaa bits (mask 0x1f00 >> 2) from t1 and the rest from t0 - confirm against select()
43
+ const auto t1 = perm.shr<2>();
44
+ const auto composed = select(uint16_t(0x1f00 >> 2), t1, t0);
45
+
46
+ const auto composed8 = as_vector_u8(composed);
47
+ composed8.store_words_as_utf32(utf32_output);
48
+
49
+ utf32_output += 8; // We wrote 32 bytes, 8 code points.
50
+ return 16;
51
+ }
52
+ if (input_utf8_end_of_code_point_mask == 0x924) {
53
+ // We want to take 4 3-byte UTF-8 sequences and turn them into 4 4-byte
54
+ // UTF-32 code units.
55
+ #if SIMDUTF_IS_BIG_ENDIAN
56
+ const auto sh =
57
+ vector_u8(-1, 0, 1, 2, -1, 3, 4, 5, -1, 6, 7, 8, -1, 9, 10, 11);
58
+ #else
59
+ const auto sh =
60
+ vector_u8(2, 1, 0, -1, 5, 4, 3, -1, 8, 7, 6, -1, 11, 10, 9, -1);
61
+ #endif // SIMDUTF_IS_BIG_ENDIAN
62
+ const auto perm = as_vector_u32(sh.lookup_32(in, vector_u8::zero()));
63
+
64
+ // in = [1110aaaa|10bbbbbb|10cccccc]
65
+
66
+ // t0 = [00000000|00000000|00cccccc]
67
+ const auto t0 = perm & uint32_t(0x0000007f);
68
+
69
+ // t2 = [00000000|0000bbbb|bbcccccc]
70
+ const auto t1 = perm.shr<2>();
71
+ const auto t2 = select(uint32_t(0x00003f00 >> 2), t1, t0);
72
+
73
+ // t4 = [00000000|aaaabbbb|bbcccccc]
74
+ const auto t3 = perm.shr<4>();
75
+ const auto t4 = select(uint32_t(0x0f0000 >> 4), t3, t2);
76
+
77
+ t4.store(utf32_output);
78
+ utf32_output += 4;
79
+ return 12;
80
+ }
81
+ /// No fast path applies, so we fall back to the lookup table: utf8bigindex, keyed by the 12-bit mask, yields a shuffle index (idx) and the number of input bytes to consume.
82
+
83
+ const uint8_t idx =
84
+ tables::utf8_to_utf16::utf8bigindex[input_utf8_end_of_code_point_mask][0];
85
+ const uint8_t consumed =
86
+ tables::utf8_to_utf16::utf8bigindex[input_utf8_end_of_code_point_mask][1];
87
+ if (idx < 64) {
88
+ // SIX (6) input code points.
89
+ // This is a relatively easy scenario:
90
+ // we process SIX (6) input code points. The max length in bytes of six
91
+ // code points spanning between 1 and 2 bytes each is 12 bytes. On
92
+ // processors where pdep/pext is fast, we might be able to use a small
93
+ // lookup table.
94
+ const auto sh = vector_u8::load(&tables::utf8_to_utf16::shufutf8[idx]);
95
+ #if SIMDUTF_IS_BIG_ENDIAN
96
+ const auto perm =
97
+ as_vector_u16(sh.lookup_32(in, vector_u8::zero())).swap_bytes();
98
+ #else
99
+ const auto perm = as_vector_u16(sh.lookup_32(in, vector_u8::zero()));
100
+ #endif // SIMDUTF_IS_BIG_ENDIAN
101
+ const auto ascii = perm & uint16_t(0x7f);
102
+ const auto highbyte = perm & uint16_t(0x1f00);
103
+ const auto composed = ascii | highbyte.shr<2>();
104
+
105
+ as_vector_u8(composed).store_words_as_utf32(utf32_output);
106
+ utf32_output += 6; // We advance past 6 code points (6 x 4 = 24 bytes of UTF-32).
107
+ } else if (idx < 145) {
108
+ // FOUR (4) input code points (the masks below handle up to three bytes each).
109
+ const auto sh = vector_u8::load(&tables::utf8_to_utf16::shufutf8[idx]);
110
+ #if SIMDUTF_IS_BIG_ENDIAN
111
+ const auto perm =
112
+ as_vector_u32(sh.lookup_32(in, vector_u8::zero())).swap_bytes();
113
+ #else
114
+ const auto perm = as_vector_u32(sh.lookup_32(in, vector_u8::zero()));
115
+ #endif // SIMDUTF_IS_BIG_ENDIAN
116
+ const auto ascii = perm & uint32_t(0x7f);
117
+ const auto middlebyte = perm & uint32_t(0x3f00);
118
+ const auto middlebyte_shifted = middlebyte.shr<2>();
119
+ const auto highbyte = perm & uint32_t(0x0f0000);
120
+ const auto highbyte_shifted = highbyte.shr<4>();
121
+ const auto composed = ascii | middlebyte_shifted | highbyte_shifted;
122
+
123
+ composed.store(utf32_output);
124
+ utf32_output += 4;
125
+ } else if (idx < 209) {
126
+ // THREE (3) input code points (utf32_output advances by 3 below), each up to four bytes long.
127
+ const auto sh = vector_u8::load(&tables::utf8_to_utf16::shufutf8[idx]);
128
+ #if SIMDUTF_IS_BIG_ENDIAN
129
+ const auto perm =
130
+ as_vector_u32(sh.lookup_32(in, vector_u8::zero())).swap_bytes();
131
+ #else
132
+ const auto perm = as_vector_u32(sh.lookup_32(in, vector_u8::zero()));
133
+ #endif // SIMDUTF_IS_BIG_ENDIAN
134
+ const auto ascii = perm & uint32_t(0x0000007f);
135
+ const auto middlebyte = perm & uint32_t(0x3f00);
136
+ const auto middlebyte_shifted = middlebyte.shr<2>();
137
+ auto middlehighbyte = perm & uint32_t(0x003f0000);
138
+ // Correct for a spurious high bit: bit 22 of perm, shifted right by one, is XORed into bit 21.
139
+ const auto correct0 = perm & uint32_t(0x00400000);
140
+ const auto correct = correct0.shr<1>();
141
+ middlehighbyte = correct ^ middlehighbyte;
142
+ const auto middlehighbyte_shifted = middlehighbyte.shr<4>();
143
+ const auto highbyte = perm & uint32_t(0x07000000);
144
+ const auto highbyte_shifted = highbyte.shr<6>();
145
+ const auto composed =
146
+ ascii | middlebyte_shifted | highbyte_shifted | middlehighbyte_shifted;
147
+ composed.store(utf32_output);
148
+ utf32_output += 3;
149
+ } else {
150
+ // Here we know that there is an error but we do not handle errors: nothing is written, and the table's `consumed` value is still returned.
151
+ }
152
+ return consumed;
153
+ }