react-native-quick-crypto 1.0.18 → 1.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (751):
  1. package/QuickCrypto.podspec +12 -38
  2. package/README.md +2 -0
  3. package/android/CMakeLists.txt +3 -0
  4. package/cpp/utils/HybridUtils.cpp +39 -77
  5. package/deps/simdutf/.clang-format +4 -0
  6. package/deps/simdutf/.github/ISSUE_TEMPLATE/bug_report.md +62 -0
  7. package/deps/simdutf/.github/ISSUE_TEMPLATE/config.yml +1 -0
  8. package/deps/simdutf/.github/ISSUE_TEMPLATE/feature_request.md +35 -0
  9. package/deps/simdutf/.github/ISSUE_TEMPLATE/standard-issue-template.md +29 -0
  10. package/deps/simdutf/.github/pull_request_template.md +51 -0
  11. package/deps/simdutf/.github/workflows/aarch64.yml +39 -0
  12. package/deps/simdutf/.github/workflows/alpine.yml +27 -0
  13. package/deps/simdutf/.github/workflows/amalgamation_demos.yml +34 -0
  14. package/deps/simdutf/.github/workflows/armv7.yml +32 -0
  15. package/deps/simdutf/.github/workflows/atomic_fuzz.yml +25 -0
  16. package/deps/simdutf/.github/workflows/cifuzz.yml +37 -0
  17. package/deps/simdutf/.github/workflows/clangformat.yml +36 -0
  18. package/deps/simdutf/.github/workflows/debian-latestcxxstandards.yml +40 -0
  19. package/deps/simdutf/.github/workflows/debian.yml +33 -0
  20. package/deps/simdutf/.github/workflows/documentation.yml +36 -0
  21. package/deps/simdutf/.github/workflows/emscripten.yml +19 -0
  22. package/deps/simdutf/.github/workflows/loongarch64-gcc-14.2.yml +39 -0
  23. package/deps/simdutf/.github/workflows/macos-latest.yml +29 -0
  24. package/deps/simdutf/.github/workflows/msys2-clang.yml +48 -0
  25. package/deps/simdutf/.github/workflows/msys2.yml +50 -0
  26. package/deps/simdutf/.github/workflows/ppc64le.yml +29 -0
  27. package/deps/simdutf/.github/workflows/rvv-1024-clang-18.yml +35 -0
  28. package/deps/simdutf/.github/workflows/rvv-128-clang-17.yml +35 -0
  29. package/deps/simdutf/.github/workflows/rvv-256-gcc-14.yml +31 -0
  30. package/deps/simdutf/.github/workflows/s390x.yml +29 -0
  31. package/deps/simdutf/.github/workflows/selective-amalgamation.yml +29 -0
  32. package/deps/simdutf/.github/workflows/typos.yml +19 -0
  33. package/deps/simdutf/.github/workflows/ubuntu22-cxx20.yml +30 -0
  34. package/deps/simdutf/.github/workflows/ubuntu22.yml +32 -0
  35. package/deps/simdutf/.github/workflows/ubuntu22_gcc12.yml +27 -0
  36. package/deps/simdutf/.github/workflows/ubuntu22sani.yml +29 -0
  37. package/deps/simdutf/.github/workflows/ubuntu24-cxxstandards.yml +34 -0
  38. package/deps/simdutf/.github/workflows/ubuntu24-unsignedchar.yml +34 -0
  39. package/deps/simdutf/.github/workflows/ubuntu24.yml +32 -0
  40. package/deps/simdutf/.github/workflows/ubuntu24sani.yml +36 -0
  41. package/deps/simdutf/.github/workflows/ubuntu24sani_clang.yml +29 -0
  42. package/deps/simdutf/.github/workflows/vs17-arm-ci.yml +21 -0
  43. package/deps/simdutf/.github/workflows/vs17-ci-cxx20.yml +41 -0
  44. package/deps/simdutf/.github/workflows/vs17-ci.yml +41 -0
  45. package/deps/simdutf/.github/workflows/vs17-clang-ci.yml +41 -0
  46. package/deps/simdutf/.github/workflows/vs17-cxxstandards.yml +36 -0
  47. package/deps/simdutf/AI_USAGE_POLICY.md +56 -0
  48. package/deps/simdutf/AUTHORS +6 -0
  49. package/deps/simdutf/CMakeLists.txt +231 -0
  50. package/deps/simdutf/CONTRIBUTING.md +214 -0
  51. package/deps/simdutf/CONTRIBUTORS +1 -0
  52. package/deps/simdutf/Doxyfile +2584 -0
  53. package/deps/simdutf/LICENSE-APACHE +201 -0
  54. package/deps/simdutf/LICENSE-MIT +18 -0
  55. package/deps/simdutf/Makefile.crosscompile +54 -0
  56. package/deps/simdutf/README-RVV.md +16 -0
  57. package/deps/simdutf/README.md +2782 -0
  58. package/deps/simdutf/SECURITY.md +8 -0
  59. package/deps/simdutf/benchmarks/CMakeLists.txt +101 -0
  60. package/deps/simdutf/benchmarks/alignment.cpp +150 -0
  61. package/deps/simdutf/benchmarks/base64/CMakeLists.txt +30 -0
  62. package/deps/simdutf/benchmarks/base64/benchmark_base64.cpp +875 -0
  63. package/deps/simdutf/benchmarks/base64/libbase64_spaces.h +49 -0
  64. package/deps/simdutf/benchmarks/base64/node_base64.h +227 -0
  65. package/deps/simdutf/benchmarks/base64/openssl3_base64.h +334 -0
  66. package/deps/simdutf/benchmarks/benchmark.cpp +65 -0
  67. package/deps/simdutf/benchmarks/benchmark_to_well_formed_utf16.cpp +347 -0
  68. package/deps/simdutf/benchmarks/competition/.clang-format-ignore +5 -0
  69. package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.cpp +1276 -0
  70. package/deps/simdutf/benchmarks/competition/CppCon2018/utf_utils.h +595 -0
  71. package/deps/simdutf/benchmarks/competition/README.md +7 -0
  72. package/deps/simdutf/benchmarks/competition/hoehrmann/hoehrmann.h +91 -0
  73. package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16.h +444 -0
  74. package/deps/simdutf/benchmarks/competition/inoue2008/inoue_utf8_to_utf16_tables.h +13183 -0
  75. package/deps/simdutf/benchmarks/competition/inoue2008/script.py +73 -0
  76. package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.cpp +738 -0
  77. package/deps/simdutf/benchmarks/competition/llvm/ConvertUTF.h +293 -0
  78. package/deps/simdutf/benchmarks/competition/u8u16/COPYRIGHT +8 -0
  79. package/deps/simdutf/benchmarks/competition/u8u16/Makefile +44 -0
  80. package/deps/simdutf/benchmarks/competition/u8u16/OSL3.0.txt +169 -0
  81. package/deps/simdutf/benchmarks/competition/u8u16/Profiling/BOM_Profiler.h +148 -0
  82. package/deps/simdutf/benchmarks/competition/u8u16/Profiling/i386_timer.h +45 -0
  83. package/deps/simdutf/benchmarks/competition/u8u16/Profiling/ppc_timer.c +34 -0
  84. package/deps/simdutf/benchmarks/competition/u8u16/README +56 -0
  85. package/deps/simdutf/benchmarks/competition/u8u16/config/config_defs.h +43 -0
  86. package/deps/simdutf/benchmarks/competition/u8u16/config/g4_config.h +27 -0
  87. package/deps/simdutf/benchmarks/competition/u8u16/config/mmx_config.h +16 -0
  88. package/deps/simdutf/benchmarks/competition/u8u16/config/p4_config.h +18 -0
  89. package/deps/simdutf/benchmarks/competition/u8u16/config/p4_ideal_config.h +16 -0
  90. package/deps/simdutf/benchmarks/competition/u8u16/config/spu_config.h +28 -0
  91. package/deps/simdutf/benchmarks/competition/u8u16/config/ssse3_config.h +20 -0
  92. package/deps/simdutf/benchmarks/competition/u8u16/iconv_u8u16.c +2 -0
  93. package/deps/simdutf/benchmarks/competition/u8u16/lib/altivec_simd.h +440 -0
  94. package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_basic_ops.py +121 -0
  95. package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_half_operand_versions.py +158 -0
  96. package/deps/simdutf/benchmarks/competition/u8u16/lib/libgen/make_test.py +270 -0
  97. package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd.h +141 -0
  98. package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_basic.h +216 -0
  99. package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_built_in.h +119 -0
  100. package/deps/simdutf/benchmarks/competition/u8u16/lib/mmx_simd_modified.h +2430 -0
  101. package/deps/simdutf/benchmarks/competition/u8u16/lib/outline.txt +39 -0
  102. package/deps/simdutf/benchmarks/competition/u8u16/lib/spu_simd.h +421 -0
  103. package/deps/simdutf/benchmarks/competition/u8u16/lib/sse_simd.h +836 -0
  104. package/deps/simdutf/benchmarks/competition/u8u16/lib/stdint.h +222 -0
  105. package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_BE.c +4 -0
  106. package/deps/simdutf/benchmarks/competition/u8u16/libu8u16_LE.c +5 -0
  107. package/deps/simdutf/benchmarks/competition/u8u16/proto/u8u16.py +390 -0
  108. package/deps/simdutf/benchmarks/competition/u8u16/src/Makefile +18 -0
  109. package/deps/simdutf/benchmarks/competition/u8u16/src/bytelex.h +448 -0
  110. package/deps/simdutf/benchmarks/competition/u8u16/src/charsets/ASCII_EBCDIC.h +284 -0
  111. package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.c +1975 -0
  112. package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.pdf +0 -0
  113. package/deps/simdutf/benchmarks/competition/u8u16/src/libu8u16.w +2263 -0
  114. package/deps/simdutf/benchmarks/competition/u8u16/src/multiliteral.h +239 -0
  115. package/deps/simdutf/benchmarks/competition/u8u16/src/u8u16.c +232 -0
  116. package/deps/simdutf/benchmarks/competition/u8u16/src/x8x16.c +194 -0
  117. package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.c +193 -0
  118. package/deps/simdutf/benchmarks/competition/u8u16/src/xml_error.h +167 -0
  119. package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.c +288 -0
  120. package/deps/simdutf/benchmarks/competition/u8u16/src/xmldecl.h +117 -0
  121. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_g4.c +2 -0
  122. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_mmx.c +2 -0
  123. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4.c +3 -0
  124. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_p4_ideal.c +2 -0
  125. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_spu.c +2 -0
  126. package/deps/simdutf/benchmarks/competition/u8u16/u8u16_ssse3.c +3 -0
  127. package/deps/simdutf/benchmarks/competition/u8u16/x8x16_p4.c +2 -0
  128. package/deps/simdutf/benchmarks/competition/utf8lut/LICENSE +23 -0
  129. package/deps/simdutf/benchmarks/competition/utf8lut/data/test_minimal.txt +44 -0
  130. package/deps/simdutf/benchmarks/competition/utf8lut/readme.md +106 -0
  131. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.cmd +11 -0
  132. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_clang_corr_tests.sh +13 -0
  133. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_corr_tests.sh +13 -0
  134. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_example.sh +13 -0
  135. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_file_conv.sh +14 -0
  136. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_lib.sh +11 -0
  137. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_gcc_iconv_sample.sh +8 -0
  138. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_corr_tests.cmd +12 -0
  139. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_example.cmd +13 -0
  140. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_file_conv.cmd +14 -0
  141. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_lib.cmd +11 -0
  142. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_mingw_iconv_sample.cmd +8 -0
  143. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_corr_tests.cmd +11 -0
  144. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_example.cmd +12 -0
  145. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_file_conv.cmd +13 -0
  146. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_lib.cmd +10 -0
  147. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/build_msvc_iconv_sample.cmd +9 -0
  148. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/html_table.py +25 -0
  149. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/measure.py +94 -0
  150. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/resize.py +20 -0
  151. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_all.cmd +2 -0
  152. package/deps/simdutf/benchmarks/competition/utf8lut/scripts/wipe_interm.cmd +1 -0
  153. package/deps/simdutf/benchmarks/competition/utf8lut/src/base/CustomMemcpy.h +75 -0
  154. package/deps/simdutf/benchmarks/competition/utf8lut/src/base/PerfDefs.h +47 -0
  155. package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.cpp +17 -0
  156. package/deps/simdutf/benchmarks/competition/utf8lut/src/base/Timing.h +76 -0
  157. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/AllProcessors.cpp +35 -0
  158. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.cpp +117 -0
  159. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BaseBufferProcessor.h +210 -0
  160. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferDecoder.h +158 -0
  161. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/BufferEncoder.h +104 -0
  162. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorPlugins.h +334 -0
  163. package/deps/simdutf/benchmarks/competition/utf8lut/src/buffer/ProcessorSelector.h +186 -0
  164. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.cpp +140 -0
  165. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderLut.h +42 -0
  166. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/DecoderProcess.h +100 -0
  167. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/Dfa.h +57 -0
  168. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.cpp +85 -0
  169. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderLut.h +27 -0
  170. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/EncoderProcess.h +126 -0
  171. package/deps/simdutf/benchmarks/competition/utf8lut/src/core/ProcessTrivial.h +108 -0
  172. package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.cpp +139 -0
  173. package/deps/simdutf/benchmarks/competition/utf8lut/src/iconv/iconv.h +74 -0
  174. package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.cpp +65 -0
  175. package/deps/simdutf/benchmarks/competition/utf8lut/src/message/MessageConverter.h +91 -0
  176. package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/CorrectnessTests.cpp +772 -0
  177. package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/Example.cpp +12 -0
  178. package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/FileConverter.cpp +486 -0
  179. package/deps/simdutf/benchmarks/competition/utf8lut/src/tests/iconv_sample.c +162 -0
  180. package/deps/simdutf/benchmarks/competition/utf8lut/src/utf8lut.h +15 -0
  181. package/deps/simdutf/benchmarks/competition/utf8sse4/fromutf8-sse.cpp +292 -0
  182. package/deps/simdutf/benchmarks/competition/utfcpp/LICENSE +23 -0
  183. package/deps/simdutf/benchmarks/competition/utfcpp/README.md +1503 -0
  184. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/checked.h +335 -0
  185. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/core.h +338 -0
  186. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp11.h +103 -0
  187. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/cpp17.h +103 -0
  188. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8/unchecked.h +274 -0
  189. package/deps/simdutf/benchmarks/competition/utfcpp/source/utf8.h +34 -0
  190. package/deps/simdutf/benchmarks/dataset/README.md +155 -0
  191. package/deps/simdutf/benchmarks/dataset/emoji.txt +204 -0
  192. package/deps/simdutf/benchmarks/dataset/scripts/utf8type.py +40 -0
  193. package/deps/simdutf/benchmarks/dataset/wikipedia_mars/Makefile +80 -0
  194. package/deps/simdutf/benchmarks/dataset/wikipedia_mars/convert_to_utf6.py +20 -0
  195. package/deps/simdutf/benchmarks/find/CMakeLists.txt +6 -0
  196. package/deps/simdutf/benchmarks/find/findbenchmark.cpp +63 -0
  197. package/deps/simdutf/benchmarks/find/findbenchmarker.h +46 -0
  198. package/deps/simdutf/benchmarks/shortbench.cpp +555 -0
  199. package/deps/simdutf/benchmarks/src/CMakeLists.txt +52 -0
  200. package/deps/simdutf/benchmarks/src/apple_arm_events.h +1104 -0
  201. package/deps/simdutf/benchmarks/src/benchmark.cpp +3899 -0
  202. package/deps/simdutf/benchmarks/src/benchmark.h +317 -0
  203. package/deps/simdutf/benchmarks/src/benchmark_base.cpp +144 -0
  204. package/deps/simdutf/benchmarks/src/benchmark_base.h +98 -0
  205. package/deps/simdutf/benchmarks/src/cmdline.cpp +176 -0
  206. package/deps/simdutf/benchmarks/src/cmdline.h +35 -0
  207. package/deps/simdutf/benchmarks/src/event_counter.h +162 -0
  208. package/deps/simdutf/benchmarks/src/linux-perf-events.h +104 -0
  209. package/deps/simdutf/benchmarks/stream.cpp +209 -0
  210. package/deps/simdutf/benchmarks/threaded.cpp +123 -0
  211. package/deps/simdutf/cmake/CPM.cmake +1363 -0
  212. package/deps/simdutf/cmake/JoinPaths.cmake +23 -0
  213. package/deps/simdutf/cmake/add_cpp_test.cmake +68 -0
  214. package/deps/simdutf/cmake/simdutf-config.cmake.in +2 -0
  215. package/deps/simdutf/cmake/simdutf-flags.cmake +26 -0
  216. package/deps/simdutf/cmake/toolchains-ci/riscv64-linux-gnu.cmake +4 -0
  217. package/deps/simdutf/cmake/toolchains-dev/README.md +32 -0
  218. package/deps/simdutf/cmake/toolchains-dev/aarch64.cmake +14 -0
  219. package/deps/simdutf/cmake/toolchains-dev/loongarch64.cmake +22 -0
  220. package/deps/simdutf/cmake/toolchains-dev/powerpc64.cmake +16 -0
  221. package/deps/simdutf/cmake/toolchains-dev/powerpc64le.cmake +16 -0
  222. package/deps/simdutf/cmake/toolchains-dev/riscv64.cmake +16 -0
  223. package/deps/simdutf/cmake/toolchains-dev/rvv-spike.cmake +38 -0
  224. package/deps/simdutf/doc/avx512.png +0 -0
  225. package/deps/simdutf/doc/logo.png +0 -0
  226. package/deps/simdutf/doc/logo.svg +165 -0
  227. package/deps/simdutf/doc/node2023.png +0 -0
  228. package/deps/simdutf/doc/shortinput.md +78 -0
  229. package/deps/simdutf/doc/utf16utf8.png +0 -0
  230. package/deps/simdutf/doc/utf8utf16.png +0 -0
  231. package/deps/simdutf/doc/widelogo.png +0 -0
  232. package/deps/simdutf/doxygen.py +50 -0
  233. package/deps/simdutf/fuzz/.clang-format +9 -0
  234. package/deps/simdutf/fuzz/CMakeLists.txt +45 -0
  235. package/deps/simdutf/fuzz/README.md +168 -0
  236. package/deps/simdutf/fuzz/atomic_base64.cpp +448 -0
  237. package/deps/simdutf/fuzz/base64.cpp +278 -0
  238. package/deps/simdutf/fuzz/build.sh +83 -0
  239. package/deps/simdutf/fuzz/conversion.cpp +669 -0
  240. package/deps/simdutf/fuzz/helpers/.clang-format-ignore +1 -0
  241. package/deps/simdutf/fuzz/helpers/common.h +135 -0
  242. package/deps/simdutf/fuzz/helpers/nameof.hpp +1258 -0
  243. package/deps/simdutf/fuzz/main.cpp +72 -0
  244. package/deps/simdutf/fuzz/minimize_and_cleanse.sh +87 -0
  245. package/deps/simdutf/fuzz/misc.cpp +216 -0
  246. package/deps/simdutf/fuzz/random_fuzz.sh +154 -0
  247. package/deps/simdutf/fuzz/roundtrip.cpp +588 -0
  248. package/deps/simdutf/fuzz/safe_conversion.cpp +104 -0
  249. package/deps/simdutf/include/simdutf/avx512.h +79 -0
  250. package/deps/simdutf/include/simdutf/base64_implementation.h +158 -0
  251. package/deps/simdutf/include/simdutf/base64_tables.h +887 -0
  252. package/deps/simdutf/include/simdutf/common_defs.h +186 -0
  253. package/deps/simdutf/include/simdutf/compiler_check.h +50 -0
  254. package/deps/simdutf/include/simdutf/constexpr_ptr.h +138 -0
  255. package/deps/simdutf/include/simdutf/encoding_types.h +189 -0
  256. package/deps/simdutf/include/simdutf/error.h +126 -0
  257. package/deps/simdutf/include/simdutf/implementation.h +7081 -0
  258. package/deps/simdutf/include/simdutf/internal/isadetection.h +325 -0
  259. package/deps/simdutf/include/simdutf/portability.h +285 -0
  260. package/deps/simdutf/include/simdutf/scalar/ascii.h +86 -0
  261. package/deps/simdutf/include/simdutf/scalar/atomic_util.h +105 -0
  262. package/deps/simdutf/include/simdutf/scalar/base64.h +911 -0
  263. package/deps/simdutf/include/simdutf/scalar/latin1.h +26 -0
  264. package/deps/simdutf/include/simdutf/scalar/latin1_to_utf16/latin1_to_utf16.h +52 -0
  265. package/deps/simdutf/include/simdutf/scalar/latin1_to_utf32/latin1_to_utf32.h +27 -0
  266. package/deps/simdutf/include/simdutf/scalar/latin1_to_utf8/latin1_to_utf8.h +191 -0
  267. package/deps/simdutf/include/simdutf/scalar/swap_bytes.h +35 -0
  268. package/deps/simdutf/include/simdutf/scalar/utf16.h +226 -0
  269. package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/utf16_to_latin1.h +108 -0
  270. package/deps/simdutf/include/simdutf/scalar/utf16_to_latin1/valid_utf16_to_latin1.h +40 -0
  271. package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/utf16_to_utf32.h +86 -0
  272. package/deps/simdutf/include/simdutf/scalar/utf16_to_utf32/valid_utf16_to_utf32.h +44 -0
  273. package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/utf16_to_utf8.h +295 -0
  274. package/deps/simdutf/include/simdutf/scalar/utf16_to_utf8/valid_utf16_to_utf8.h +91 -0
  275. package/deps/simdutf/include/simdutf/scalar/utf32.h +82 -0
  276. package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/utf32_to_latin1.h +68 -0
  277. package/deps/simdutf/include/simdutf/scalar/utf32_to_latin1/valid_utf32_to_latin1.h +67 -0
  278. package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/utf32_to_utf16.h +84 -0
  279. package/deps/simdutf/include/simdutf/scalar/utf32_to_utf16/valid_utf32_to_utf16.h +44 -0
  280. package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/utf32_to_utf8.h +142 -0
  281. package/deps/simdutf/include/simdutf/scalar/utf32_to_utf8/valid_utf32_to_utf8.h +72 -0
  282. package/deps/simdutf/include/simdutf/scalar/utf8.h +326 -0
  283. package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/utf8_to_latin1.h +225 -0
  284. package/deps/simdutf/include/simdutf/scalar/utf8_to_latin1/valid_utf8_to_latin1.h +87 -0
  285. package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/utf8_to_utf16.h +342 -0
  286. package/deps/simdutf/include/simdutf/scalar/utf8_to_utf16/valid_utf8_to_utf16.h +106 -0
  287. package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/utf8_to_utf32.h +299 -0
  288. package/deps/simdutf/include/simdutf/scalar/utf8_to_utf32/valid_utf8_to_utf32.h +83 -0
  289. package/deps/simdutf/include/simdutf/simdutf_version.h +26 -0
  290. package/deps/simdutf/include/simdutf.h +26 -0
  291. package/deps/simdutf/include/simdutf_c.h +342 -0
  292. package/deps/simdutf/riscv/Dockerfile +16 -0
  293. package/deps/simdutf/riscv/README.md +24 -0
  294. package/deps/simdutf/riscv/remove-docker-station +8 -0
  295. package/deps/simdutf/riscv/run-docker-station +31 -0
  296. package/deps/simdutf/scripts/.flake8 +2 -0
  297. package/deps/simdutf/scripts/Makefile +2 -0
  298. package/deps/simdutf/scripts/README_ADD_FUNCTION.md +49 -0
  299. package/deps/simdutf/scripts/add_function.py +330 -0
  300. package/deps/simdutf/scripts/amalgamation_tests.py +156 -0
  301. package/deps/simdutf/scripts/base64/Makefile +2 -0
  302. package/deps/simdutf/scripts/base64/README.md +2 -0
  303. package/deps/simdutf/scripts/base64/avx512.py +76 -0
  304. package/deps/simdutf/scripts/base64/neon_decode.py +143 -0
  305. package/deps/simdutf/scripts/base64/neon_generate_lut.py +101 -0
  306. package/deps/simdutf/scripts/base64/sse.py +252 -0
  307. package/deps/simdutf/scripts/base64/sseregular.py +160 -0
  308. package/deps/simdutf/scripts/base64/sseurl.py +283 -0
  309. package/deps/simdutf/scripts/base64/table.py +59 -0
  310. package/deps/simdutf/scripts/base64bench_print.py +145 -0
  311. package/deps/simdutf/scripts/benchmark-all.py +119 -0
  312. package/deps/simdutf/scripts/benchmark_print.py +324 -0
  313. package/deps/simdutf/scripts/check_feature_macros.py +156 -0
  314. package/deps/simdutf/scripts/check_typos.sh +13 -0
  315. package/deps/simdutf/scripts/clang_format.sh +35 -0
  316. package/deps/simdutf/scripts/clang_format_docker.sh +38 -0
  317. package/deps/simdutf/scripts/common.py +24 -0
  318. package/deps/simdutf/scripts/compilation_benchmark.py +55 -0
  319. package/deps/simdutf/scripts/compile_many_variations.sh +64 -0
  320. package/deps/simdutf/scripts/create_latex_table.py +62 -0
  321. package/deps/simdutf/scripts/docker/Dockerfile +14 -0
  322. package/deps/simdutf/scripts/docker/Makefile +9 -0
  323. package/deps/simdutf/scripts/docker/README.md +30 -0
  324. package/deps/simdutf/scripts/docker/llvm.gpg +0 -0
  325. package/deps/simdutf/scripts/ppc64_convert_utf16_to_utf8.py +155 -0
  326. package/deps/simdutf/scripts/prepare_doxygen.sh +21 -0
  327. package/deps/simdutf/scripts/release.py +197 -0
  328. package/deps/simdutf/scripts/shortinputplots.py +97 -0
  329. package/deps/simdutf/scripts/sse_convert_utf16_to_utf8.py +422 -0
  330. package/deps/simdutf/scripts/sse_convert_utf32_to_utf16.py +105 -0
  331. package/deps/simdutf/scripts/sse_utf8_utf16_decode.py +186 -0
  332. package/deps/simdutf/scripts/sse_validate_utf16le_proof.py +137 -0
  333. package/deps/simdutf/scripts/sse_validate_utf16le_testcases.py +129 -0
  334. package/deps/simdutf/scripts/table.py +207 -0
  335. package/deps/simdutf/scripts/tests/new.txt +33 -0
  336. package/deps/simdutf/scripts/tests/old.txt +33 -0
  337. package/deps/simdutf/scripts/tests/results.txt +272 -0
  338. package/deps/simdutf/simdutf.pc.in +11 -0
  339. package/deps/simdutf/singleheader/.flake8 +2 -0
  340. package/deps/simdutf/singleheader/CMakeLists.txt +64 -0
  341. package/deps/simdutf/singleheader/README-dev.md +81 -0
  342. package/deps/simdutf/singleheader/README.md +19 -0
  343. package/deps/simdutf/singleheader/amalgamate.py +513 -0
  344. package/deps/simdutf/singleheader/amalgamation_demo.c +59 -0
  345. package/deps/simdutf/singleheader/amalgamation_demo.cpp +54 -0
  346. package/deps/simdutf/singleheader/test-features.py +262 -0
  347. package/deps/simdutf/src/CMakeLists.txt +78 -0
  348. package/deps/simdutf/src/arm64/arm_base64.cpp +791 -0
  349. package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf16.cpp +24 -0
  350. package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf32.cpp +24 -0
  351. package/deps/simdutf/src/arm64/arm_convert_latin1_to_utf8.cpp +70 -0
  352. package/deps/simdutf/src/arm64/arm_convert_utf16_to_latin1.cpp +61 -0
  353. package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf32.cpp +185 -0
  354. package/deps/simdutf/src/arm64/arm_convert_utf16_to_utf8.cpp +780 -0
  355. package/deps/simdutf/src/arm64/arm_convert_utf32_to_latin1.cpp +60 -0
  356. package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf16.cpp +208 -0
  357. package/deps/simdutf/src/arm64/arm_convert_utf32_to_utf8.cpp +505 -0
  358. package/deps/simdutf/src/arm64/arm_convert_utf8_to_latin1.cpp +69 -0
  359. package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf16.cpp +313 -0
  360. package/deps/simdutf/src/arm64/arm_convert_utf8_to_utf32.cpp +179 -0
  361. package/deps/simdutf/src/arm64/arm_find.cpp +199 -0
  362. package/deps/simdutf/src/arm64/arm_utf16fix.cpp +185 -0
  363. package/deps/simdutf/src/arm64/arm_validate_utf16.cpp +165 -0
  364. package/deps/simdutf/src/arm64/arm_validate_utf32le.cpp +65 -0
  365. package/deps/simdutf/src/arm64/implementation.cpp +1442 -0
  366. package/deps/simdutf/src/encoding_types.cpp +67 -0
  367. package/deps/simdutf/src/error.cpp +3 -0
  368. package/deps/simdutf/src/fallback/implementation.cpp +589 -0
  369. package/deps/simdutf/src/generic/ascii_validation.h +50 -0
  370. package/deps/simdutf/src/generic/base64.h +233 -0
  371. package/deps/simdutf/src/generic/base64lengths.h +63 -0
  372. package/deps/simdutf/src/generic/buf_block_reader.h +109 -0
  373. package/deps/simdutf/src/generic/find.h +75 -0
  374. package/deps/simdutf/src/generic/utf16/change_endianness.h +24 -0
  375. package/deps/simdutf/src/generic/utf16/count_code_points_bytemask.h +58 -0
  376. package/deps/simdutf/src/generic/utf16/to_well_formed.h +93 -0
  377. package/deps/simdutf/src/generic/utf16/utf32_length_from_utf16.h +15 -0
  378. package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16.h +35 -0
  379. package/deps/simdutf/src/generic/utf16/utf8_length_from_utf16_bytemask.h +199 -0
  380. package/deps/simdutf/src/generic/utf16.h +73 -0
  381. package/deps/simdutf/src/generic/utf32.h +136 -0
  382. package/deps/simdutf/src/generic/utf8/utf16_length_from_utf8_bytemask.h +53 -0
  383. package/deps/simdutf/src/generic/utf8.h +92 -0
  384. package/deps/simdutf/src/generic/utf8_to_latin1/utf8_to_latin1.h +316 -0
  385. package/deps/simdutf/src/generic/utf8_to_latin1/valid_utf8_to_latin1.h +78 -0
  386. package/deps/simdutf/src/generic/utf8_to_utf16/utf8_to_utf16.h +332 -0
  387. package/deps/simdutf/src/generic/utf8_to_utf16/valid_utf8_to_utf16.h +74 -0
  388. package/deps/simdutf/src/generic/utf8_to_utf32/utf8_to_utf32.h +318 -0
  389. package/deps/simdutf/src/generic/utf8_to_utf32/valid_utf8_to_utf32.h +42 -0
  390. package/deps/simdutf/src/generic/utf8_validation/utf8_lookup4_algorithm.h +223 -0
  391. package/deps/simdutf/src/generic/utf8_validation/utf8_validator.h +84 -0
  392. package/deps/simdutf/src/generic/validate_utf16.h +164 -0
  393. package/deps/simdutf/src/generic/validate_utf32.h +99 -0
  394. package/deps/simdutf/src/haswell/avx2_base64.cpp +837 -0
  395. package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf16.cpp +28 -0
  396. package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf32.cpp +20 -0
  397. package/deps/simdutf/src/haswell/avx2_convert_latin1_to_utf8.cpp +83 -0
  398. package/deps/simdutf/src/haswell/avx2_convert_utf16_to_latin1.cpp +83 -0
  399. package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf32.cpp +210 -0
  400. package/deps/simdutf/src/haswell/avx2_convert_utf16_to_utf8.cpp +602 -0
  401. package/deps/simdutf/src/haswell/avx2_convert_utf32_to_latin1.cpp +116 -0
  402. package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf16.cpp +164 -0
  403. package/deps/simdutf/src/haswell/avx2_convert_utf32_to_utf8.cpp +569 -0
  404. package/deps/simdutf/src/haswell/avx2_convert_utf8_to_latin1.cpp +60 -0
  405. package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf16.cpp +195 -0
  406. package/deps/simdutf/src/haswell/avx2_convert_utf8_to_utf32.cpp +135 -0
  407. package/deps/simdutf/src/haswell/avx2_utf16fix.cpp +173 -0
  408. package/deps/simdutf/src/haswell/avx2_validate_utf16.cpp +17 -0
  409. package/deps/simdutf/src/haswell/implementation.cpp +1447 -0
  410. package/deps/simdutf/src/icelake/icelake_ascii_validation.inl.cpp +19 -0
  411. package/deps/simdutf/src/icelake/icelake_base64.inl.cpp +630 -0
  412. package/deps/simdutf/src/icelake/icelake_common.inl.cpp +37 -0
  413. package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf16.inl.cpp +36 -0
  414. package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf32.inl.cpp +23 -0
  415. package/deps/simdutf/src/icelake/icelake_convert_latin1_to_utf8.inl.cpp +107 -0
  416. package/deps/simdutf/src/icelake/icelake_convert_utf16_to_latin1.inl.cpp +103 -0
  417. package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf32.inl.cpp +136 -0
  418. package/deps/simdutf/src/icelake/icelake_convert_utf16_to_utf8.inl.cpp +206 -0
  419. package/deps/simdutf/src/icelake/icelake_convert_utf32_to_latin1.inl.cpp +74 -0
  420. package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf16.inl.cpp +338 -0
  421. package/deps/simdutf/src/icelake/icelake_convert_utf32_to_utf8.inl.cpp +574 -0
  422. package/deps/simdutf/src/icelake/icelake_convert_utf8_to_latin1.inl.cpp +104 -0
  423. package/deps/simdutf/src/icelake/icelake_convert_utf8_to_utf16.inl.cpp +75 -0
  424. package/deps/simdutf/src/icelake/icelake_convert_valid_utf8_to_latin1.inl.cpp +69 -0
  425. package/deps/simdutf/src/icelake/icelake_find.inl.cpp +146 -0
  426. package/deps/simdutf/src/icelake/icelake_from_utf8.inl.cpp +266 -0
  427. package/deps/simdutf/src/icelake/icelake_from_valid_utf8.inl.cpp +136 -0
  428. package/deps/simdutf/src/icelake/icelake_macros.inl.cpp +143 -0
  429. package/deps/simdutf/src/icelake/icelake_utf16fix.cpp +138 -0
  430. package/deps/simdutf/src/icelake/icelake_utf32_validation.inl.cpp +63 -0
  431. package/deps/simdutf/src/icelake/icelake_utf8_common.inl.cpp +753 -0
  432. package/deps/simdutf/src/icelake/icelake_utf8_length_from_utf16.inl.cpp +269 -0
  433. package/deps/simdutf/src/icelake/icelake_utf8_validation.inl.cpp +116 -0
  434. package/deps/simdutf/src/icelake/implementation.cpp +1903 -0
  435. package/deps/simdutf/src/implementation.cpp +2526 -0
  436. package/deps/simdutf/src/lasx/implementation.cpp +1531 -0
  437. package/deps/simdutf/src/lasx/lasx_base64.cpp +695 -0
  438. package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf16.cpp +76 -0
  439. package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf32.cpp +55 -0
  440. package/deps/simdutf/src/lasx/lasx_convert_latin1_to_utf8.cpp +65 -0
  441. package/deps/simdutf/src/lasx/lasx_convert_utf16_to_latin1.cpp +64 -0
  442. package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf32.cpp +183 -0
  443. package/deps/simdutf/src/lasx/lasx_convert_utf16_to_utf8.cpp +550 -0
  444. package/deps/simdutf/src/lasx/lasx_convert_utf32_to_latin1.cpp +73 -0
  445. package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf16.cpp +218 -0
  446. package/deps/simdutf/src/lasx/lasx_convert_utf32_to_utf8.cpp +589 -0
  447. package/deps/simdutf/src/lasx/lasx_convert_utf8_to_latin1.cpp +72 -0
  448. package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf16.cpp +296 -0
  449. package/deps/simdutf/src/lasx/lasx_convert_utf8_to_utf32.cpp +190 -0
  450. package/deps/simdutf/src/lasx/lasx_find.cpp +64 -0
  451. package/deps/simdutf/src/lasx/lasx_validate_utf16.cpp +13 -0
  452. package/deps/simdutf/src/lasx/lasx_validate_utf32le.cpp +84 -0
  453. package/deps/simdutf/src/lsx/implementation.cpp +1417 -0
  454. package/deps/simdutf/src/lsx/lsx_base64.cpp +675 -0
  455. package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf16.cpp +39 -0
  456. package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf32.cpp +27 -0
  457. package/deps/simdutf/src/lsx/lsx_convert_latin1_to_utf8.cpp +56 -0
  458. package/deps/simdutf/src/lsx/lsx_convert_utf16_to_latin1.cpp +64 -0
  459. package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf32.cpp +133 -0
  460. package/deps/simdutf/src/lsx/lsx_convert_utf16_to_utf8.cpp +518 -0
  461. package/deps/simdutf/src/lsx/lsx_convert_utf32_to_latin1.cpp +66 -0
  462. package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf16.cpp +155 -0
  463. package/deps/simdutf/src/lsx/lsx_convert_utf32_to_utf8.cpp +459 -0
  464. package/deps/simdutf/src/lsx/lsx_convert_utf8_to_latin1.cpp +75 -0
  465. package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf16.cpp +291 -0
  466. package/deps/simdutf/src/lsx/lsx_convert_utf8_to_utf32.cpp +179 -0
  467. package/deps/simdutf/src/lsx/lsx_find.cpp +60 -0
  468. package/deps/simdutf/src/lsx/lsx_validate_utf16.cpp +13 -0
  469. package/deps/simdutf/src/lsx/lsx_validate_utf32le.cpp +68 -0
  470. package/deps/simdutf/src/ppc64/implementation.cpp +992 -0
  471. package/deps/simdutf/src/ppc64/ppc64_base64.cpp +480 -0
  472. package/deps/simdutf/src/ppc64/ppc64_base64_internal_tests.cpp +401 -0
  473. package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf16.cpp +12 -0
  474. package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf32.cpp +12 -0
  475. package/deps/simdutf/src/ppc64/ppc64_convert_latin1_to_utf8.cpp +149 -0
  476. package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_latin1.cpp +67 -0
  477. package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf32.cpp +87 -0
  478. package/deps/simdutf/src/ppc64/ppc64_convert_utf16_to_utf8.cpp +296 -0
  479. package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_latin1.cpp +57 -0
  480. package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf16.cpp +117 -0
  481. package/deps/simdutf/src/ppc64/ppc64_convert_utf32_to_utf8.cpp +166 -0
  482. package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_latin1.cpp +69 -0
  483. package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf16.cpp +211 -0
  484. package/deps/simdutf/src/ppc64/ppc64_convert_utf8_to_utf32.cpp +153 -0
  485. package/deps/simdutf/src/ppc64/ppc64_utf16_to_utf8_tables.h +1011 -0
  486. package/deps/simdutf/src/ppc64/ppc64_utf8_length_from_latin1.cpp +37 -0
  487. package/deps/simdutf/src/ppc64/ppc64_validate_utf16.cpp +19 -0
  488. package/deps/simdutf/src/ppc64/templates.cpp +91 -0
  489. package/deps/simdutf/src/rvv/implementation.cpp +138 -0
  490. package/deps/simdutf/src/rvv/rvv_find.cpp +27 -0
  491. package/deps/simdutf/src/rvv/rvv_helpers.inl.cpp +23 -0
  492. package/deps/simdutf/src/rvv/rvv_latin1_to.inl.cpp +71 -0
  493. package/deps/simdutf/src/rvv/rvv_length_from.inl.cpp +164 -0
  494. package/deps/simdutf/src/rvv/rvv_utf16_to.inl.cpp +399 -0
  495. package/deps/simdutf/src/rvv/rvv_utf16fix.cpp +110 -0
  496. package/deps/simdutf/src/rvv/rvv_utf32_to.inl.cpp +307 -0
  497. package/deps/simdutf/src/rvv/rvv_utf8_to.inl.cpp +435 -0
  498. package/deps/simdutf/src/rvv/rvv_validate.inl.cpp +275 -0
  499. package/deps/simdutf/src/simdutf/arm64/begin.h +2 -0
  500. package/deps/simdutf/src/simdutf/arm64/bitmanipulation.h +34 -0
  501. package/deps/simdutf/src/simdutf/arm64/end.h +2 -0
  502. package/deps/simdutf/src/simdutf/arm64/implementation.h +307 -0
  503. package/deps/simdutf/src/simdutf/arm64/intrinsics.h +10 -0
  504. package/deps/simdutf/src/simdutf/arm64/simd.h +547 -0
  505. package/deps/simdutf/src/simdutf/arm64/simd16-inl.h +403 -0
  506. package/deps/simdutf/src/simdutf/arm64/simd32-inl.h +129 -0
  507. package/deps/simdutf/src/simdutf/arm64/simd64-inl.h +28 -0
  508. package/deps/simdutf/src/simdutf/arm64.h +43 -0
  509. package/deps/simdutf/src/simdutf/fallback/begin.h +1 -0
  510. package/deps/simdutf/src/simdutf/fallback/bitmanipulation.h +13 -0
  511. package/deps/simdutf/src/simdutf/fallback/end.h +1 -0
  512. package/deps/simdutf/src/simdutf/fallback/implementation.h +331 -0
  513. package/deps/simdutf/src/simdutf/fallback.h +42 -0
  514. package/deps/simdutf/src/simdutf/haswell/begin.h +15 -0
  515. package/deps/simdutf/src/simdutf/haswell/bitmanipulation.h +35 -0
  516. package/deps/simdutf/src/simdutf/haswell/end.h +13 -0
  517. package/deps/simdutf/src/simdutf/haswell/implementation.h +338 -0
  518. package/deps/simdutf/src/simdutf/haswell/intrinsics.h +67 -0
  519. package/deps/simdutf/src/simdutf/haswell/simd.h +363 -0
  520. package/deps/simdutf/src/simdutf/haswell/simd16-inl.h +261 -0
  521. package/deps/simdutf/src/simdutf/haswell/simd32-inl.h +111 -0
  522. package/deps/simdutf/src/simdutf/haswell/simd64-inl.h +34 -0
  523. package/deps/simdutf/src/simdutf/haswell.h +63 -0
  524. package/deps/simdutf/src/simdutf/icelake/begin.h +14 -0
  525. package/deps/simdutf/src/simdutf/icelake/bitmanipulation.h +44 -0
  526. package/deps/simdutf/src/simdutf/icelake/end.h +12 -0
  527. package/deps/simdutf/src/simdutf/icelake/implementation.h +346 -0
  528. package/deps/simdutf/src/simdutf/icelake/intrinsics.h +138 -0
  529. package/deps/simdutf/src/simdutf/icelake/simd.h +17 -0
  530. package/deps/simdutf/src/simdutf/icelake/simd16-inl.h +90 -0
  531. package/deps/simdutf/src/simdutf/icelake/simd32-inl.h +47 -0
  532. package/deps/simdutf/src/simdutf/icelake.h +81 -0
  533. package/deps/simdutf/src/simdutf/lasx/begin.h +8 -0
  534. package/deps/simdutf/src/simdutf/lasx/bitmanipulation.h +25 -0
  535. package/deps/simdutf/src/simdutf/lasx/end.h +8 -0
  536. package/deps/simdutf/src/simdutf/lasx/implementation.h +310 -0
  537. package/deps/simdutf/src/simdutf/lasx/intrinsics.h +319 -0
  538. package/deps/simdutf/src/simdutf/lasx/simd.h +551 -0
  539. package/deps/simdutf/src/simdutf/lasx/simd16-inl.h +234 -0
  540. package/deps/simdutf/src/simdutf/lasx/simd32-inl.h +74 -0
  541. package/deps/simdutf/src/simdutf/lasx/simd64-inl.h +52 -0
  542. package/deps/simdutf/src/simdutf/lasx.h +49 -0
  543. package/deps/simdutf/src/simdutf/lsx/begin.h +2 -0
  544. package/deps/simdutf/src/simdutf/lsx/bitmanipulation.h +25 -0
  545. package/deps/simdutf/src/simdutf/lsx/end.h +2 -0
  546. package/deps/simdutf/src/simdutf/lsx/implementation.h +309 -0
  547. package/deps/simdutf/src/simdutf/lsx/intrinsics.h +196 -0
  548. package/deps/simdutf/src/simdutf/lsx/simd.h +421 -0
  549. package/deps/simdutf/src/simdutf/lsx/simd16-inl.h +242 -0
  550. package/deps/simdutf/src/simdutf/lsx/simd32-inl.h +69 -0
  551. package/deps/simdutf/src/simdutf/lsx/simd64-inl.h +50 -0
  552. package/deps/simdutf/src/simdutf/lsx.h +52 -0
  553. package/deps/simdutf/src/simdutf/ppc64/begin.h +1 -0
  554. package/deps/simdutf/src/simdutf/ppc64/bitmanipulation.h +29 -0
  555. package/deps/simdutf/src/simdutf/ppc64/end.h +1 -0
  556. package/deps/simdutf/src/simdutf/ppc64/implementation.h +348 -0
  557. package/deps/simdutf/src/simdutf/ppc64/intrinsics.h +19 -0
  558. package/deps/simdutf/src/simdutf/ppc64/simd.h +177 -0
  559. package/deps/simdutf/src/simdutf/ppc64/simd16-inl.h +327 -0
  560. package/deps/simdutf/src/simdutf/ppc64/simd32-inl.h +247 -0
  561. package/deps/simdutf/src/simdutf/ppc64/simd8-inl.h +618 -0
  562. package/deps/simdutf/src/simdutf/ppc64.h +40 -0
  563. package/deps/simdutf/src/simdutf/rvv/begin.h +7 -0
  564. package/deps/simdutf/src/simdutf/rvv/end.h +7 -0
  565. package/deps/simdutf/src/simdutf/rvv/implementation.h +321 -0
  566. package/deps/simdutf/src/simdutf/rvv/intrinsics.h +131 -0
  567. package/deps/simdutf/src/simdutf/rvv.h +41 -0
  568. package/deps/simdutf/src/simdutf/westmere/begin.h +8 -0
  569. package/deps/simdutf/src/simdutf/westmere/bitmanipulation.h +37 -0
  570. package/deps/simdutf/src/simdutf/westmere/end.h +8 -0
  571. package/deps/simdutf/src/simdutf/westmere/implementation.h +338 -0
  572. package/deps/simdutf/src/simdutf/westmere/intrinsics.h +38 -0
  573. package/deps/simdutf/src/simdutf/westmere/simd.h +379 -0
  574. package/deps/simdutf/src/simdutf/westmere/simd16-inl.h +242 -0
  575. package/deps/simdutf/src/simdutf/westmere/simd32-inl.h +151 -0
  576. package/deps/simdutf/src/simdutf/westmere/simd64-inl.h +33 -0
  577. package/deps/simdutf/src/simdutf/westmere.h +59 -0
  578. package/deps/simdutf/src/simdutf.cpp +152 -0
  579. package/deps/simdutf/src/simdutf_c.cpp +525 -0
  580. package/deps/simdutf/src/tables/utf16_to_utf8_tables.h +768 -0
  581. package/deps/simdutf/src/tables/utf32_to_utf16_tables.h +53 -0
  582. package/deps/simdutf/src/tables/utf8_to_utf16_tables.h +826 -0
  583. package/deps/simdutf/src/westmere/implementation.cpp +1479 -0
  584. package/deps/simdutf/src/westmere/internal/loader.cpp +7 -0
  585. package/deps/simdutf/src/westmere/internal/write_v_u16_11bits_to_utf8.cpp +66 -0
  586. package/deps/simdutf/src/westmere/sse_base64.cpp +672 -0
  587. package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf16.cpp +21 -0
  588. package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf32.cpp +31 -0
  589. package/deps/simdutf/src/westmere/sse_convert_latin1_to_utf8.cpp +71 -0
  590. package/deps/simdutf/src/westmere/sse_convert_utf16_to_latin1.cpp +70 -0
  591. package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf32.cpp +206 -0
  592. package/deps/simdutf/src/westmere/sse_convert_utf16_to_utf8.cpp +504 -0
  593. package/deps/simdutf/src/westmere/sse_convert_utf32_to_latin1.cpp +82 -0
  594. package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf16.cpp +209 -0
  595. package/deps/simdutf/src/westmere/sse_convert_utf32_to_utf8.cpp +589 -0
  596. package/deps/simdutf/src/westmere/sse_convert_utf8_to_latin1.cpp +58 -0
  597. package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf16.cpp +197 -0
  598. package/deps/simdutf/src/westmere/sse_convert_utf8_to_utf32.cpp +141 -0
  599. package/deps/simdutf/src/westmere/sse_utf16fix.cpp +82 -0
  600. package/deps/simdutf/src/westmere/sse_validate_utf16.cpp +17 -0
  601. package/deps/simdutf/tests/CMakeLists.txt +483 -0
  602. package/deps/simdutf/tests/atomic_base64_tests.cpp +2845 -0
  603. package/deps/simdutf/tests/base64_tests.cpp +3617 -0
  604. package/deps/simdutf/tests/basic_fuzzer.cpp +805 -0
  605. package/deps/simdutf/tests/bele_tests.cpp +182 -0
  606. package/deps/simdutf/tests/constexpr_base64_tests.cpp +387 -0
  607. package/deps/simdutf/tests/convert_latin1_to_utf16be_tests.cpp +52 -0
  608. package/deps/simdutf/tests/convert_latin1_to_utf16le_tests.cpp +80 -0
  609. package/deps/simdutf/tests/convert_latin1_to_utf32_tests.cpp +66 -0
  610. package/deps/simdutf/tests/convert_latin1_to_utf8_tests.cpp +120 -0
  611. package/deps/simdutf/tests/convert_utf16_to_utf8_safe_tests.cpp +203 -0
  612. package/deps/simdutf/tests/convert_utf16_to_utf8_with_replacement_tests.cpp +276 -0
  613. package/deps/simdutf/tests/convert_utf16be_to_latin1_tests.cpp +109 -0
  614. package/deps/simdutf/tests/convert_utf16be_to_latin1_tests_with_errors.cpp +136 -0
  615. package/deps/simdutf/tests/convert_utf16be_to_utf32_tests.cpp +193 -0
  616. package/deps/simdutf/tests/convert_utf16be_to_utf32_with_errors_tests.cpp +381 -0
  617. package/deps/simdutf/tests/convert_utf16be_to_utf8_tests.cpp +259 -0
  618. package/deps/simdutf/tests/convert_utf16be_to_utf8_with_errors_tests.cpp +266 -0
  619. package/deps/simdutf/tests/convert_utf16le_to_latin1_tests.cpp +148 -0
  620. package/deps/simdutf/tests/convert_utf16le_to_latin1_tests_with_errors.cpp +176 -0
  621. package/deps/simdutf/tests/convert_utf16le_to_utf32_tests.cpp +213 -0
  622. package/deps/simdutf/tests/convert_utf16le_to_utf32_with_errors_tests.cpp +318 -0
  623. package/deps/simdutf/tests/convert_utf16le_to_utf8_tests.cpp +343 -0
  624. package/deps/simdutf/tests/convert_utf16le_to_utf8_with_errors_tests.cpp +271 -0
  625. package/deps/simdutf/tests/convert_utf32_to_latin1_tests.cpp +111 -0
  626. package/deps/simdutf/tests/convert_utf32_to_latin1_with_errors_tests.cpp +96 -0
  627. package/deps/simdutf/tests/convert_utf32_to_utf16be_tests.cpp +148 -0
  628. package/deps/simdutf/tests/convert_utf32_to_utf16be_with_errors_tests.cpp +192 -0
  629. package/deps/simdutf/tests/convert_utf32_to_utf16le_tests.cpp +166 -0
  630. package/deps/simdutf/tests/convert_utf32_to_utf16le_with_errors_tests.cpp +215 -0
  631. package/deps/simdutf/tests/convert_utf32_to_utf8_tests.cpp +181 -0
  632. package/deps/simdutf/tests/convert_utf32_to_utf8_with_errors_tests.cpp +261 -0
  633. package/deps/simdutf/tests/convert_utf8_to_latin1_tests.cpp +516 -0
  634. package/deps/simdutf/tests/convert_utf8_to_latin1_with_errors_tests.cpp +579 -0
  635. package/deps/simdutf/tests/convert_utf8_to_utf16be_tests.cpp +412 -0
  636. package/deps/simdutf/tests/convert_utf8_to_utf16be_with_errors_tests.cpp +480 -0
  637. package/deps/simdutf/tests/convert_utf8_to_utf16le_tests.cpp +671 -0
  638. package/deps/simdutf/tests/convert_utf8_to_utf16le_with_errors_tests.cpp +455 -0
  639. package/deps/simdutf/tests/convert_utf8_to_utf32_tests.cpp +1204 -0
  640. package/deps/simdutf/tests/convert_utf8_to_utf32_with_errors_tests.cpp +337 -0
  641. package/deps/simdutf/tests/convert_valid_utf16be_to_latin1_tests.cpp +37 -0
  642. package/deps/simdutf/tests/convert_valid_utf16be_to_utf32_tests.cpp +97 -0
  643. package/deps/simdutf/tests/convert_valid_utf16be_to_utf8_tests.cpp +126 -0
  644. package/deps/simdutf/tests/convert_valid_utf16le_to_latin1_tests.cpp +71 -0
  645. package/deps/simdutf/tests/convert_valid_utf16le_to_utf32_tests.cpp +122 -0
  646. package/deps/simdutf/tests/convert_valid_utf16le_to_utf8_tests.cpp +244 -0
  647. package/deps/simdutf/tests/convert_valid_utf32_to_latin1_tests.cpp +49 -0
  648. package/deps/simdutf/tests/convert_valid_utf32_to_utf16be_tests.cpp +92 -0
  649. package/deps/simdutf/tests/convert_valid_utf32_to_utf16le_tests.cpp +114 -0
  650. package/deps/simdutf/tests/convert_valid_utf32_to_utf8_tests.cpp +109 -0
  651. package/deps/simdutf/tests/convert_valid_utf8_to_latin1_tests.cpp +84 -0
  652. package/deps/simdutf/tests/convert_valid_utf8_to_utf16be_tests.cpp +124 -0
  653. package/deps/simdutf/tests/convert_valid_utf8_to_utf16le_tests.cpp +221 -0
  654. package/deps/simdutf/tests/convert_valid_utf8_to_utf32_tests.cpp +155 -0
  655. package/deps/simdutf/tests/count_utf16be.cpp +64 -0
  656. package/deps/simdutf/tests/count_utf16le.cpp +61 -0
  657. package/deps/simdutf/tests/count_utf8.cpp +87 -0
  658. package/deps/simdutf/tests/detect_encodings_tests.cpp +312 -0
  659. package/deps/simdutf/tests/embed/valid_utf8.txt +1 -0
  660. package/deps/simdutf/tests/embed_tests.cpp +22 -0
  661. package/deps/simdutf/tests/find_tests.cpp +77 -0
  662. package/deps/simdutf/tests/fixed_string_tests.cpp +153 -0
  663. package/deps/simdutf/tests/helpers/CMakeLists.txt +25 -0
  664. package/deps/simdutf/tests/helpers/compiletime_conversions.h +222 -0
  665. package/deps/simdutf/tests/helpers/fixed_string.h +267 -0
  666. package/deps/simdutf/tests/helpers/random_int.cpp +30 -0
  667. package/deps/simdutf/tests/helpers/random_int.h +39 -0
  668. package/deps/simdutf/tests/helpers/random_utf16.cpp +123 -0
  669. package/deps/simdutf/tests/helpers/random_utf16.h +52 -0
  670. package/deps/simdutf/tests/helpers/random_utf32.cpp +41 -0
  671. package/deps/simdutf/tests/helpers/random_utf32.h +40 -0
  672. package/deps/simdutf/tests/helpers/random_utf8.cpp +93 -0
  673. package/deps/simdutf/tests/helpers/random_utf8.h +36 -0
  674. package/deps/simdutf/tests/helpers/test.cpp +231 -0
  675. package/deps/simdutf/tests/helpers/test.h +193 -0
  676. package/deps/simdutf/tests/helpers/transcode_test_base.cpp +1257 -0
  677. package/deps/simdutf/tests/helpers/transcode_test_base.h +683 -0
  678. package/deps/simdutf/tests/helpers/utf16.h +27 -0
  679. package/deps/simdutf/tests/installation_tests/find/CMakeLists.txt +43 -0
  680. package/deps/simdutf/tests/installation_tests/from_fetch/CMakeLists.txt +47 -0
  681. package/deps/simdutf/tests/internal_tests.cpp +27 -0
  682. package/deps/simdutf/tests/null_safety_tests.cpp +94 -0
  683. package/deps/simdutf/tests/random_fuzzer.cpp +779 -0
  684. package/deps/simdutf/tests/readme_tests.cpp +274 -0
  685. package/deps/simdutf/tests/reference/CMakeLists.txt +23 -0
  686. package/deps/simdutf/tests/reference/decode_utf16.h +81 -0
  687. package/deps/simdutf/tests/reference/decode_utf32.h +47 -0
  688. package/deps/simdutf/tests/reference/encode_latin1.cpp +1 -0
  689. package/deps/simdutf/tests/reference/encode_latin1.h +32 -0
  690. package/deps/simdutf/tests/reference/encode_utf16.cpp +49 -0
  691. package/deps/simdutf/tests/reference/encode_utf16.h +20 -0
  692. package/deps/simdutf/tests/reference/encode_utf32.cpp +1 -0
  693. package/deps/simdutf/tests/reference/encode_utf32.h +36 -0
  694. package/deps/simdutf/tests/reference/encode_utf8.cpp +1 -0
  695. package/deps/simdutf/tests/reference/encode_utf8.h +40 -0
  696. package/deps/simdutf/tests/reference/validate_utf16.cpp +60 -0
  697. package/deps/simdutf/tests/reference/validate_utf16.h +14 -0
  698. package/deps/simdutf/tests/reference/validate_utf16_to_latin1.cpp +35 -0
  699. package/deps/simdutf/tests/reference/validate_utf16_to_latin1.h +13 -0
  700. package/deps/simdutf/tests/reference/validate_utf32.cpp +27 -0
  701. package/deps/simdutf/tests/reference/validate_utf32.h +12 -0
  702. package/deps/simdutf/tests/reference/validate_utf32_to_latin1.cpp +27 -0
  703. package/deps/simdutf/tests/reference/validate_utf32_to_latin1.h +12 -0
  704. package/deps/simdutf/tests/reference/validate_utf8.cpp +82 -0
  705. package/deps/simdutf/tests/reference/validate_utf8.h +11 -0
  706. package/deps/simdutf/tests/reference/validate_utf8_to_latin1.cpp +43 -0
  707. package/deps/simdutf/tests/reference/validate_utf8_to_latin1.h +12 -0
  708. package/deps/simdutf/tests/select_implementation.cpp +43 -0
  709. package/deps/simdutf/tests/simdutf_c_tests.cpp +244 -0
  710. package/deps/simdutf/tests/span_tests.cpp +401 -0
  711. package/deps/simdutf/tests/special_tests.cpp +559 -0
  712. package/deps/simdutf/tests/straight_c_test.c +187 -0
  713. package/deps/simdutf/tests/text_encoding_tests.cpp +77 -0
  714. package/deps/simdutf/tests/to_well_formed_utf16_tests.cpp +377 -0
  715. package/deps/simdutf/tests/utf8_length_from_utf16_tests.cpp +202 -0
  716. package/deps/simdutf/tests/validate_ascii_basic_tests.cpp +165 -0
  717. package/deps/simdutf/tests/validate_ascii_with_errors_tests.cpp +77 -0
  718. package/deps/simdutf/tests/validate_utf16be_basic_tests.cpp +175 -0
  719. package/deps/simdutf/tests/validate_utf16be_with_errors_tests.cpp +188 -0
  720. package/deps/simdutf/tests/validate_utf16le_basic_tests.cpp +268 -0
  721. package/deps/simdutf/tests/validate_utf16le_with_errors_tests.cpp +274 -0
  722. package/deps/simdutf/tests/validate_utf32_basic_tests.cpp +92 -0
  723. package/deps/simdutf/tests/validate_utf32_with_errors_tests.cpp +114 -0
  724. package/deps/simdutf/tests/validate_utf8_basic_tests.cpp +178 -0
  725. package/deps/simdutf/tests/validate_utf8_brute_force_tests.cpp +88 -0
  726. package/deps/simdutf/tests/validate_utf8_puzzler_tests.cpp +33 -0
  727. package/deps/simdutf/tests/validate_utf8_with_errors_tests.cpp +228 -0
  728. package/deps/simdutf/tools/CMakeLists.txt +85 -0
  729. package/deps/simdutf/tools/fastbase64.cpp +250 -0
  730. package/deps/simdutf/tools/sutf.cpp +556 -0
  731. package/deps/simdutf/tools/sutf.h +40 -0
  732. package/lib/commonjs/blake3.js +2 -1
  733. package/lib/commonjs/blake3.js.map +1 -1
  734. package/lib/commonjs/diffie-hellman.js +5 -4
  735. package/lib/commonjs/diffie-hellman.js.map +1 -1
  736. package/lib/commonjs/ecdh.js +5 -4
  737. package/lib/commonjs/ecdh.js.map +1 -1
  738. package/lib/module/blake3.js +2 -1
  739. package/lib/module/blake3.js.map +1 -1
  740. package/lib/module/diffie-hellman.js +5 -4
  741. package/lib/module/diffie-hellman.js.map +1 -1
  742. package/lib/module/ecdh.js +5 -4
  743. package/lib/module/ecdh.js.map +1 -1
  744. package/lib/tsconfig.tsbuildinfo +1 -1
  745. package/lib/typescript/blake3.d.ts.map +1 -1
  746. package/lib/typescript/diffie-hellman.d.ts.map +1 -1
  747. package/lib/typescript/ecdh.d.ts.map +1 -1
  748. package/package.json +2 -2
  749. package/src/blake3.ts +2 -1
  750. package/src/diffie-hellman.ts +5 -7
  751. package/src/ecdh.ts +5 -8
@@ -0,0 +1,36 @@
1
+ // file included directly
2
+ template <endianness big_endian>
3
+ size_t icelake_convert_latin1_to_utf16(const char *latin1_input, size_t len,
4
+ char16_t *utf16_output) {
5
+ size_t rounded_len = len & ~0x1F; // Round down to nearest multiple of 32
6
+
7
+ __m512i byteflip = _mm512_setr_epi64(0x0607040502030001, 0x0e0f0c0d0a0b0809,
8
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809,
9
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809,
10
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809);
11
+ for (size_t i = 0; i < rounded_len; i += 32) {
12
+ // Load 32 Latin1 characters into a 256-bit register
13
+ __m256i in = _mm256_loadu_si256((__m256i *)&latin1_input[i]);
14
+ // Zero extend each set of 8 Latin1 characters to 32 16-bit integers
15
+ __m512i out = _mm512_cvtepu8_epi16(in);
16
+ if (big_endian) {
17
+ out = _mm512_shuffle_epi8(out, byteflip);
18
+ }
19
+ // Store the results back to memory
20
+ _mm512_storeu_si512((__m512i *)&utf16_output[i], out);
21
+ }
22
+ if (rounded_len != len) {
23
+ uint32_t mask = uint32_t(1 << (len - rounded_len)) - 1;
24
+ __m256i in = _mm256_maskz_loadu_epi8(mask, latin1_input + rounded_len);
25
+
26
+ // Zero extend each set of 8 Latin1 characters to 32 16-bit integers
27
+ __m512i out = _mm512_cvtepu8_epi16(in);
28
+ if (big_endian) {
29
+ out = _mm512_shuffle_epi8(out, byteflip);
30
+ }
31
+ // Store the results back to memory
32
+ _mm512_mask_storeu_epi16(utf16_output + rounded_len, mask, out);
33
+ }
34
+
35
+ return len;
36
+ }
@@ -0,0 +1,23 @@
1
+ void avx512_convert_latin1_to_utf32(const char *buf, size_t len,
2
+ char32_t *utf32_output) {
3
+ while (len >= 16) {
4
+ // Load 16 Latin1 characters into a 128-bit register
5
+ __m128i in = _mm_loadu_si128((__m128i *)buf);
6
+
7
+ // Zero extend each set of 8 Latin1 characters to 16 32-bit integers using
8
+ // vpmovzxbd
9
+ __m512i out = _mm512_cvtepu8_epi32(in);
10
+
11
+ // Store the results back to memory
12
+ _mm512_storeu_si512((__m512i *)utf32_output, out);
13
+
14
+ len -= 16;
15
+ buf += 16;
16
+ utf32_output += 16;
17
+ }
18
+
19
+ __mmask16 mask = __mmask16((1 << len) - 1);
20
+ __m128i in = _mm_maskz_loadu_epi8(mask, buf);
21
+ __m512i out = _mm512_cvtepu8_epi32(in);
22
+ _mm512_mask_storeu_epi32((__m512i *)utf32_output, mask, out);
23
+ }
@@ -0,0 +1,107 @@
1
+ // file included directly
2
+
3
+ static inline size_t latin1_to_utf8_avx512_vec(__m512i input, size_t input_len,
4
+ char *utf8_output,
5
+ int mask_output) {
6
+ __mmask64 nonascii = _mm512_movepi8_mask(input);
7
+ size_t output_size = input_len + (size_t)count_ones(nonascii);
8
+
9
+ // Mask to denote whether the byte is a leading byte that is not ascii
10
+ __mmask64 sixth = _mm512_cmpge_epu8_mask(
11
+ input, _mm512_set1_epi8(-64)); // binary representation of -64: 1100 0000
12
+
13
+ const uint64_t alternate_bits = UINT64_C(0x5555555555555555);
14
+ uint64_t ascii = ~nonascii;
15
+ // the bits in ascii are inverted and zeros are interspersed in between them
16
+ uint64_t maskA = ~_pdep_u64(ascii, alternate_bits);
17
+ uint64_t maskB = ~_pdep_u64(ascii >> 32, alternate_bits);
18
+
19
+ // interleave bytes from top and bottom halves (abcd...ABCD -> aAbBcCdD)
20
+ __m512i input_interleaved = _mm512_permutexvar_epi8(
21
+ _mm512_set_epi32(0x3f1f3e1e, 0x3d1d3c1c, 0x3b1b3a1a, 0x39193818,
22
+ 0x37173616, 0x35153414, 0x33133212, 0x31113010,
23
+ 0x2f0f2e0e, 0x2d0d2c0c, 0x2b0b2a0a, 0x29092808,
24
+ 0x27072606, 0x25052404, 0x23032202, 0x21012000),
25
+ input);
26
+
27
+ // double size of each byte, and insert the leading byte 1100 0010
28
+
29
+ /*
30
+ upscale the bytes to 16-bit value, adding the 0b11000000 leading byte in the
31
+ process. We adjust for the bytes that have their two most significant bits.
32
+ This takes care of the first 32 bytes, assuming we interleaved the bytes. */
33
+ __m512i outputA =
34
+ _mm512_shldi_epi16(input_interleaved, _mm512_set1_epi8(-62), 8);
35
+ outputA = _mm512_mask_add_epi16(
36
+ outputA, (__mmask32)sixth, outputA,
37
+ _mm512_set1_epi16(1 - 0x4000)); // 1- 0x4000 = 1100 0000 0000 0001????
38
+
39
+ // in the second 32-bit half, set first or second option based on whether
40
+ // original input is leading byte (second case) or not (first case)
41
+ __m512i leadingB =
42
+ _mm512_mask_blend_epi16((__mmask32)(sixth >> 32),
43
+ _mm512_set1_epi16(0x00c2), // 0000 0000 1101 0010
44
+ _mm512_set1_epi16(0x40c3)); // 0100 0000 1100 0011
45
+ __m512i outputB = _mm512_ternarylogic_epi32(
46
+ input_interleaved, leadingB, _mm512_set1_epi16((short)0xff00),
47
+ (240 & 170) ^ 204); // (input_interleaved & 0xff00) ^ leadingB
48
+
49
+ // prune redundant bytes
50
+ outputA = _mm512_maskz_compress_epi8(maskA, outputA);
51
+ outputB = _mm512_maskz_compress_epi8(maskB, outputB);
52
+
53
+ size_t output_sizeA = (size_t)count_ones((uint32_t)nonascii) + 32;
54
+
55
+ if (mask_output) {
56
+ if (input_len > 32) { // is the second half of the input vector used?
57
+ __mmask64 write_mask = _bzhi_u64(~0ULL, (unsigned int)output_sizeA);
58
+ _mm512_mask_storeu_epi8(utf8_output, write_mask, outputA);
59
+ utf8_output += output_sizeA;
60
+ write_mask = _bzhi_u64(~0ULL, (unsigned int)(output_size - output_sizeA));
61
+ _mm512_mask_storeu_epi8(utf8_output, write_mask, outputB);
62
+ } else {
63
+ __mmask64 write_mask = _bzhi_u64(~0ULL, (unsigned int)output_size);
64
+ _mm512_mask_storeu_epi8(utf8_output, write_mask, outputA);
65
+ }
66
+ } else {
67
+ _mm512_storeu_si512(utf8_output, outputA);
68
+ utf8_output += output_sizeA;
69
+ _mm512_storeu_si512(utf8_output, outputB);
70
+ }
71
+ return output_size;
72
+ }
73
+
74
+ static inline size_t latin1_to_utf8_avx512_branch(__m512i input,
75
+ char *utf8_output) {
76
+ __mmask64 nonascii = _mm512_movepi8_mask(input);
77
+ if (nonascii) {
78
+ return latin1_to_utf8_avx512_vec(input, 64, utf8_output, 0);
79
+ } else {
80
+ _mm512_storeu_si512(utf8_output, input);
81
+ return 64;
82
+ }
83
+ }
84
+
85
+ size_t latin1_to_utf8_avx512_start(const char *buf, size_t len,
86
+ char *utf8_output) {
87
+ char *start = utf8_output;
88
+ size_t pos = 0;
89
+ // if there's at least 128 bytes remaining, we don't need to mask the output
90
+ for (; pos + 128 <= len; pos += 64) {
91
+ __m512i input = _mm512_loadu_si512((__m512i *)(buf + pos));
92
+ utf8_output += latin1_to_utf8_avx512_branch(input, utf8_output);
93
+ }
94
+ // in the last 128 bytes, the first 64 may require masking the output
95
+ if (pos + 64 <= len) {
96
+ __m512i input = _mm512_loadu_si512((__m512i *)(buf + pos));
97
+ utf8_output += latin1_to_utf8_avx512_vec(input, 64, utf8_output, 1);
98
+ pos += 64;
99
+ }
100
+ // with the last 64 bytes, the input also needs to be masked
101
+ if (pos < len) {
102
+ __mmask64 load_mask = _bzhi_u64(~0ULL, (unsigned int)(len - pos));
103
+ __m512i input = _mm512_maskz_loadu_epi8(load_mask, (__m512i *)(buf + pos));
104
+ utf8_output += latin1_to_utf8_avx512_vec(input, len - pos, utf8_output, 1);
105
+ }
106
+ return (size_t)(utf8_output - start);
107
+ }
@@ -0,0 +1,103 @@
1
+ // file included directly
2
+ template <endianness big_endian>
3
+ size_t icelake_convert_utf16_to_latin1(const char16_t *buf, size_t len,
4
+ char *latin1_output) {
5
+ const char16_t *end = buf + len;
6
+ __m512i v_0xFF = _mm512_set1_epi16(0xff);
7
+ __m512i byteflip = _mm512_setr_epi64(0x0607040502030001, 0x0e0f0c0d0a0b0809,
8
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809,
9
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809,
10
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809);
11
+ __m512i shufmask = _mm512_set_epi8(
12
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
13
+ 0, 0, 0, 0, 0, 0, 0, 62, 60, 58, 56, 54, 52, 50, 48, 46, 44, 42, 40, 38,
14
+ 36, 34, 32, 30, 28, 26, 24, 22, 20, 18, 16, 14, 12, 10, 8, 6, 4, 2, 0);
15
+ while (end - buf >= 32) {
16
+ __m512i in = _mm512_loadu_si512((__m512i *)buf);
17
+ if (big_endian) {
18
+ in = _mm512_shuffle_epi8(in, byteflip);
19
+ }
20
+ if (_mm512_cmpgt_epu16_mask(in, v_0xFF)) {
21
+ return 0;
22
+ }
23
+ _mm256_storeu_si256(
24
+ (__m256i *)latin1_output,
25
+ _mm512_castsi512_si256(_mm512_permutexvar_epi8(shufmask, in)));
26
+ latin1_output += 32;
27
+ buf += 32;
28
+ }
29
+ if (buf < end) {
30
+ uint32_t mask(uint32_t(1 << (end - buf)) - 1);
31
+ __m512i in = _mm512_maskz_loadu_epi16(mask, buf);
32
+ if (big_endian) {
33
+ in = _mm512_shuffle_epi8(in, byteflip);
34
+ }
35
+ if (_mm512_cmpgt_epu16_mask(in, v_0xFF)) {
36
+ return 0;
37
+ }
38
+ _mm256_mask_storeu_epi8(
39
+ latin1_output, mask,
40
+ _mm512_castsi512_si256(_mm512_permutexvar_epi8(shufmask, in)));
41
+ }
42
+ return len;
43
+ }
44
+
45
+ template <endianness big_endian>
46
+ std::pair<result, char *>
47
+ icelake_convert_utf16_to_latin1_with_errors(const char16_t *buf, size_t len,
48
+ char *latin1_output) {
49
+ const char16_t *end = buf + len;
50
+ const char16_t *start = buf;
51
+ __m512i byteflip = _mm512_setr_epi64(0x0607040502030001, 0x0e0f0c0d0a0b0809,
52
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809,
53
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809,
54
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809);
55
+ __m512i v_0xFF = _mm512_set1_epi16(0xff);
56
+ __m512i shufmask = _mm512_set_epi8(
57
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
58
+ 0, 0, 0, 0, 0, 0, 0, 62, 60, 58, 56, 54, 52, 50, 48, 46, 44, 42, 40, 38,
59
+ 36, 34, 32, 30, 28, 26, 24, 22, 20, 18, 16, 14, 12, 10, 8, 6, 4, 2, 0);
60
+ while (end - buf >= 32) {
61
+ __m512i in = _mm512_loadu_si512((__m512i *)buf);
62
+ if (big_endian) {
63
+ in = _mm512_shuffle_epi8(in, byteflip);
64
+ }
65
+ if (_mm512_cmpgt_epu16_mask(in, v_0xFF)) {
66
+ uint16_t word;
67
+ while ((word = scalar::utf16::swap_if_needed<big_endian>(
68
+ uint16_t(*buf))) <= 0xff) {
69
+ *latin1_output++ = uint8_t(word);
70
+ buf++;
71
+ }
72
+ return std::make_pair(result(error_code::TOO_LARGE, buf - start),
73
+ latin1_output);
74
+ }
75
+ _mm256_storeu_si256(
76
+ (__m256i *)latin1_output,
77
+ _mm512_castsi512_si256(_mm512_permutexvar_epi8(shufmask, in)));
78
+ latin1_output += 32;
79
+ buf += 32;
80
+ }
81
+ if (buf < end) {
82
+ uint32_t mask(uint32_t(1 << (end - buf)) - 1);
83
+ __m512i in = _mm512_maskz_loadu_epi16(mask, buf);
84
+ if (big_endian) {
85
+ in = _mm512_shuffle_epi8(in, byteflip);
86
+ }
87
+ if (_mm512_cmpgt_epu16_mask(in, v_0xFF)) {
88
+
89
+ uint16_t word;
90
+ while ((word = scalar::utf16::swap_if_needed<big_endian>(
91
+ uint16_t(*buf))) <= 0xff) {
92
+ *latin1_output++ = uint8_t(word);
93
+ buf++;
94
+ }
95
+ return std::make_pair(result(error_code::TOO_LARGE, buf - start),
96
+ latin1_output);
97
+ }
98
+ _mm256_mask_storeu_epi8(
99
+ latin1_output, mask,
100
+ _mm512_castsi512_si256(_mm512_permutexvar_epi8(shufmask, in)));
101
+ }
102
+ return std::make_pair(result(error_code::SUCCESS, len), latin1_output);
103
+ }
@@ -0,0 +1,136 @@
1
+ // file included directly
2
+
3
+ /*
4
+ Returns a tuple: the first unprocessed code unit from buf, utf32_output, and a
5
+ success flag (false on a mismatched surrogate). A scalar routine should carry on the conversion of the tail.
6
+ */
7
+ template <endianness big_endian>
8
+ std::tuple<const char16_t *, char32_t *, bool>
9
+ convert_utf16_to_utf32(const char16_t *buf, size_t len,
10
+ char32_t *utf32_output) {
11
+ const char16_t *end = buf + len;
12
+ const __m512i v_fc00 = _mm512_set1_epi16((uint16_t)0xfc00); // keeps the top 6 bits of each 16-bit word
13
+ const __m512i v_d800 = _mm512_set1_epi16((uint16_t)0xd800);
14
+ const __m512i v_dc00 = _mm512_set1_epi16((uint16_t)0xdc00);
15
+ __mmask32 carry{0}; // 1 when word 30 of the previous block was a high surrogate
16
+ const __m512i byteflip = _mm512_setr_epi64( // shuffle control that swaps the two bytes of each 16-bit word
17
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809, 0x0607040502030001,
18
+ 0x0e0f0c0d0a0b0809, 0x0607040502030001, 0x0e0f0c0d0a0b0809,
19
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809);
20
+ while (std::distance(buf, end) >= 32) {
21
+ // Always safe because end - buf >= 32 code units (64 bytes):
22
+ __m512i in = _mm512_loadu_si512((__m512i *)buf);
23
+ if (big_endian) {
24
+ in = _mm512_shuffle_epi8(in, byteflip);
25
+ }
26
+
27
+ // H - bitmask for high surrogates
28
+ const __mmask32 H =
29
+ _mm512_cmpeq_epi16_mask(_mm512_and_si512(in, v_fc00), v_d800);
30
+ // L - bitmask for low surrogates
31
+ const __mmask32 L =
32
+ _mm512_cmpeq_epi16_mask(_mm512_and_si512(in, v_fc00), v_dc00);
33
+
34
+ if ((H | L)) {
35
+ // surrogate pair(s) in a register
36
+ const __mmask32 V =
37
+ (L ^
38
+ (carry | (H << 1))); // A high surrogate must be followed by low one
39
+ // and a low one must be preceded by a high one.
40
+ // If valid, V should be equal to 0
41
+
42
+ if (V == 0) {
43
+ // valid case
44
+ /*
45
+ Input surrogate pair:
46
+ |1101.11aa.aaaa.aaaa|1101.10bb.bbbb.bbbb|
47
+ low surrogate high surrogate
48
+ */
49
+ /* 1. Expand all code units to 32-bit code units
50
+ in
51
+ |0000.0000.0000.0000.1101.11aa.aaaa.aaaa|0000.0000.0000.0000.1101.10bb.bbbb.bbbb|
52
+ */
53
+ const __m512i first = _mm512_cvtepu16_epi32(_mm512_castsi512_si256(in));
54
+ const __m512i second =
55
+ _mm512_cvtepu16_epi32(_mm512_extracti32x8_epi32(in, 1));
56
+
57
+ /* 2. Shift by one 16-bit word to align low surrogates with high
58
+ surrogates in
59
+ |0000.0000.0000.0000.1101.11aa.aaaa.aaaa|0000.0000.0000.0000.1101.10bb.bbbb.bbbb|
60
+ shifted
61
+ |????.????.????.????.????.????.????.????|0000.0000.0000.0000.1101.11aa.aaaa.aaaa|
62
+ */
63
+ const __m512i shifted_first = _mm512_alignr_epi32(second, first, 1);
64
+ const __m512i shifted_second =
65
+ _mm512_alignr_epi32(_mm512_setzero_si512(), second, 1);
66
+
67
+ /* 3. Align all high surrogates in first and second by shifting to the
68
+ left by 10 bits
69
+ |0000.0000.0000.0000.1101.11aa.aaaa.aaaa|0000.0011.0110.bbbb.bbbb.bb00.0000.0000|
70
+ */
71
+ const __m512i aligned_first =
72
+ _mm512_mask_slli_epi32(first, (__mmask16)H, first, 10);
73
+ const __m512i aligned_second =
74
+ _mm512_mask_slli_epi32(second, (__mmask16)(H >> 16), second, 10);
75
+
76
+ /* 4. Remove surrogate prefixes and add offset 0x10000 by adding in,
77
+ shifted and constant in
78
+ |0000.0000.0000.0000.1101.11aa.aaaa.aaaa|0000.0011.0110.bbbb.bbbb.bb00.0000.0000|
79
+ shifted
80
+ |????.????.????.????.????.????.????.????|0000.0000.0000.0000.1101.11aa.aaaa.aaaa|
81
+ constant|1111.1100.1010.0000.0010.0100.0000.0000|1111.1100.1010.0000.0010.0100.0000.0000|
82
+ */
83
+ const __m512i constant = _mm512_set1_epi32((uint32_t)0xfca02400);
84
+ const __m512i added_first = _mm512_mask_add_epi32(
85
+ aligned_first, (__mmask16)H, aligned_first, shifted_first);
86
+ const __m512i utf32_first = _mm512_mask_add_epi32(
87
+ added_first, (__mmask16)H, added_first, constant);
88
+
89
+ const __m512i added_second =
90
+ _mm512_mask_add_epi32(aligned_second, (__mmask16)(H >> 16),
91
+ aligned_second, shifted_second);
92
+ const __m512i utf32_second = _mm512_mask_add_epi32(
93
+ added_second, (__mmask16)(H >> 16), added_second, constant);
94
+
95
+ // 5. Store all valid UTF-32 code units (low surrogate positions and
96
+ // 32nd word are invalid)
97
+ const __mmask32 valid = ~L & 0x7fffffff;
98
+ // We deliberately do a _mm512_maskz_compress_epi32 followed by
99
+ // storeu_epi32 to ease performance portability to Zen 4.
100
+ const __m512i compressed_first =
101
+ _mm512_maskz_compress_epi32((__mmask16)(valid), utf32_first);
102
+ const size_t howmany1 = count_ones((uint16_t)(valid));
103
+ _mm512_storeu_si512((__m512i *)utf32_output, compressed_first); // full 64-byte store; only howmany1 lanes are kept
104
+ utf32_output += howmany1;
105
+ const __m512i compressed_second =
106
+ _mm512_maskz_compress_epi32((__mmask16)(valid >> 16), utf32_second);
107
+ const size_t howmany2 = count_ones((uint16_t)(valid >> 16));
108
+ // The following could be unsafe in some cases?
109
+ //_mm512_storeu_epi32((__m512i *) utf32_output, compressed_second);
110
+ _mm512_mask_storeu_epi32((__m512i *)utf32_output,
111
+ __mmask16((1 << howmany2) - 1),
112
+ compressed_second);
113
+ utf32_output += howmany2;
114
+ // Only process 31 code units, but keep track if the 31st word is a high
115
+ // surrogate as a carry
116
+ buf += 31;
117
+ carry = (H >> 30) & 0x1;
118
+ } else {
119
+ // invalid case
120
+ return std::make_tuple(buf + carry, utf32_output, false); // carry == 1: buf[0] is a low surrogate already paired in the previous block
121
+ }
122
+ } else {
123
+ // no surrogates
124
+ // extend all thirty-two 16-bit code units to thirty-two 32-bit code units
125
+ _mm512_storeu_si512((__m512i *)(utf32_output),
126
+ _mm512_cvtepu16_epi32(_mm512_castsi512_si256(in)));
127
+ _mm512_storeu_si512(
128
+ (__m512i *)(utf32_output) + 1,
129
+ _mm512_cvtepu16_epi32(_mm512_extracti32x8_epi32(in, 1)));
130
+ utf32_output += 32;
131
+ buf += 32;
132
+ carry = 0;
133
+ }
134
+ } // while
135
+ return std::make_tuple(buf + carry, utf32_output, true); // fewer than 32 code units remain; skip a low surrogate already consumed
136
+ }
@@ -0,0 +1,206 @@
1
+ // file included directly
2
+
3
+ /**
4
+ * This function converts the UTF-16 input (inbuf, inlen), whose byte order is
5
+ * selected by big_endian, into UTF-8 (to outbuf). The number of code units
6
+ * written is written to 'outlen' and the function reports the number of input
7
+ * words consumed; conversion stops early at the first mismatched surrogate.
8
+ */
9
+ template <endianness big_endian>
10
+ size_t utf16_to_utf8_avx512i(const char16_t *inbuf, size_t inlen,
11
+ unsigned char *outbuf, size_t *outlen) {
12
+ __m512i in;
13
+ __mmask32 inmask = _cvtu32_mask32(0x7fffffff); // lanes 0..30 active: a full block consumes 31 words
14
+ __m512i byteflip = _mm512_setr_epi64(0x0607040502030001, 0x0e0f0c0d0a0b0809,
15
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809,
16
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809,
17
+ 0x0607040502030001, 0x0e0f0c0d0a0b0809);
18
+ const char16_t *const inbuf_orig = inbuf;
19
+ const unsigned char *const outbuf_orig = outbuf;
20
+ int adjust = 0; // (words actually valid in the last block) - 31; corrects the fixed 31-word advances
21
+ int carry = 0; // 1 when word 30 of the previous block was a high surrogate
22
+
23
+ while (inlen >= 32) {
24
+ in = _mm512_loadu_si512(inbuf);
25
+ if (big_endian) {
26
+ in = _mm512_shuffle_epi8(in, byteflip);
27
+ }
28
+ inlen -= 31;
29
+ lastiteration: // entered from `tail` with a masked final block already loaded
30
+ inbuf += 31;
31
+
32
+ failiteration: // re-entered after a surrogate mismatch, with `in` and inmask truncated
33
+ const __mmask32 is234byte = _mm512_mask_cmp_epu16_mask( // active lanes holding a value >= 0x80
34
+ inmask, in, _mm512_set1_epi16(0x0080), _MM_CMPINT_NLT);
35
+
36
+ if (_ktestz_mask32_u8(inmask, is234byte)) {
37
+ // fast path for ASCII only
38
+ _mm512_mask_cvtepi16_storeu_epi8(outbuf, inmask, in);
39
+ outbuf += 31; // fixed advance; `adjust` compensates when the block was shorter
40
+ carry = 0;
41
+
42
+ if (inlen < 32) {
43
+ goto tail;
44
+ } else {
45
+ continue;
46
+ }
47
+ }
48
+
49
+ const __mmask32 is12byte = // lanes holding a value < 0x0800
50
+ _mm512_cmp_epu16_mask(in, _mm512_set1_epi16(0x0800), _MM_CMPINT_LT);
51
+
52
+ if (_ktestc_mask32_u8(is12byte, inmask)) {
53
+ // fast path for 1 and 2 byte only
54
+
55
+ const __m512i twobytes = _mm512_ternarylogic_epi32(
56
+ _mm512_slli_epi16(in, 8), _mm512_srli_epi16(in, 6),
57
+ _mm512_set1_epi16(0x3f3f), 0xa8); // (A|B)&C
58
+ in = _mm512_mask_add_epi16(in, is234byte, twobytes,
59
+ _mm512_set1_epi16(int16_t(0x80c0)));
60
+ const __m512i cmpmask =
61
+ _mm512_mask_blend_epi16(inmask, _mm512_set1_epi16(int16_t(0xffff)),
62
+ _mm512_set1_epi16(0x0800));
63
+ const __mmask64 smoosh =
64
+ _mm512_cmp_epu8_mask(in, cmpmask, _MM_CMPINT_NLT);
65
+ const __m512i out = _mm512_maskz_compress_epi8(smoosh, in);
66
+ _mm512_mask_storeu_epi8(outbuf,
67
+ _cvtu64_mask64(_pext_u64(_cvtmask64_u64(smoosh),
68
+ _cvtmask64_u64(smoosh))),
69
+ out);
70
+ outbuf += 31 + _mm_popcnt_u32(_cvtmask32_u32(is234byte)); // one byte per word plus one extra per two-byte word
71
+ carry = 0;
72
+
73
+ if (inlen < 32) {
74
+ goto tail;
75
+ } else {
76
+ continue;
77
+ }
78
+ }
79
+ __m512i lo = _mm512_cvtepu16_epi32(_mm512_castsi512_si256(in));
80
+ __m512i hi = _mm512_cvtepu16_epi32(_mm512_extracti32x8_epi32(in, 1));
81
+
82
+ __m512i taglo = _mm512_set1_epi32(0x8080e000);
83
+ __m512i taghi = taglo;
84
+
85
+ const __m512i fc00masked =
86
+ _mm512_and_epi32(in, _mm512_set1_epi16(int16_t(0xfc00)));
87
+ const __mmask32 hisurr = _mm512_mask_cmp_epu16_mask( // high surrogates among the active lanes only
88
+ inmask, fc00masked, _mm512_set1_epi16(int16_t(0xd800)), _MM_CMPINT_EQ);
89
+ const __mmask32 losurr = _mm512_cmp_epu16_mask( // low surrogates in any lane, including lane 31
90
+ fc00masked, _mm512_set1_epi16(int16_t(0xdc00)), _MM_CMPINT_EQ);
91
+
92
+ int carryout = 0;
93
+ if (!_kortestz_mask32_u8(hisurr, losurr)) {
94
+ // handle surrogates
95
+
96
+ __m512i los = _mm512_alignr_epi32(hi, lo, 1);
97
+ __m512i his = _mm512_alignr_epi32(lo, hi, 1);
98
+
99
+ const __mmask32 hisurrhi = _kshiftri_mask32(hisurr, 16);
100
+ taglo = _mm512_mask_mov_epi32(taglo, __mmask16(hisurr),
101
+ _mm512_set1_epi32(0x808080f0));
102
+ taghi = _mm512_mask_mov_epi32(taghi, __mmask16(hisurrhi),
103
+ _mm512_set1_epi32(0x808080f0));
104
+
105
+ lo = _mm512_mask_slli_epi32(lo, __mmask16(hisurr), lo, 10);
106
+ hi = _mm512_mask_slli_epi32(hi, __mmask16(hisurrhi), hi, 10);
107
+ los = _mm512_add_epi32(los, _mm512_set1_epi32(0xfca02400));
108
+ his = _mm512_add_epi32(his, _mm512_set1_epi32(0xfca02400));
109
+ lo = _mm512_mask_add_epi32(lo, __mmask16(hisurr), lo, los);
110
+ hi = _mm512_mask_add_epi32(hi, __mmask16(hisurrhi), hi, his);
111
+
112
+ carryout = _cvtu32_mask32(_kshiftri_mask32(hisurr, 30));
113
+
114
+ const uint32_t h = _cvtmask32_u32(hisurr);
115
+ const uint32_t l = _cvtmask32_u32(losurr);
116
+ // check for mismatched surrogates
117
+ if ((h + h + carry) ^ l) {
118
+ const uint32_t lonohi = l & ~(h + h + carry); // low surrogates with no high surrogate before them
119
+ const uint32_t hinolo = h & ~(l >> 1); // high surrogates with no low surrogate after them
120
+ inlen = _tzcnt_u32(hinolo | lonohi); // index of the first offending word
121
+ inmask = __mmask32(0x7fffffff & ((1U << inlen) - 1));
122
+ in = _mm512_maskz_mov_epi16(inmask, in);
123
+ adjust = (int)inlen - 31;
124
+ inlen = 0;
125
+ goto failiteration;
126
+ }
127
+ }
128
+
129
+ hi = _mm512_maskz_mov_epi32(_cvtu32_mask16(0x7fff), hi);
130
+ carry = carryout;
131
+
132
+ __m512i mslo =
133
+ _mm512_multishift_epi64_epi8(_mm512_set1_epi64(0x20262c3200060c12), lo);
134
+
135
+ __m512i mshi =
136
+ _mm512_multishift_epi64_epi8(_mm512_set1_epi64(0x20262c3200060c12), hi);
137
+
138
+ const __mmask32 outmask = __mmask32(_kandn_mask64(losurr, inmask)); // active lanes that are not low surrogates
139
+ const __mmask64 outmhi = _kshiftri_mask64(outmask, 16);
140
+
141
+ const __mmask32 is1byte = __mmask32(_knot_mask64(is234byte));
142
+ const __mmask64 is1bhi = _kshiftri_mask64(is1byte, 16);
143
+ const __mmask64 is12bhi = _kshiftri_mask64(is12byte, 16);
144
+
145
+ taglo = _mm512_mask_mov_epi32(taglo, __mmask16(is12byte),
146
+ _mm512_set1_epi32(0x80c00000));
147
+ taghi = _mm512_mask_mov_epi32(taghi, __mmask16(is12bhi),
148
+ _mm512_set1_epi32(0x80c00000));
149
+ __m512i magiclo = _mm512_mask_blend_epi32(__mmask16(outmask),
150
+ _mm512_set1_epi32(0xffffffff),
151
+ _mm512_set1_epi32(0x00010101));
152
+ __m512i magichi = _mm512_mask_blend_epi32(__mmask16(outmhi),
153
+ _mm512_set1_epi32(0xffffffff),
154
+ _mm512_set1_epi32(0x00010101));
155
+
156
+ magiclo = _mm512_mask_blend_epi32(__mmask16(outmask), // NOTE(review): repeats the initialisation of magiclo just above; looks redundant
157
+ _mm512_set1_epi32(0xffffffff),
158
+ _mm512_set1_epi32(0x00010101));
159
+ magichi = _mm512_mask_blend_epi32(__mmask16(outmhi), // NOTE(review): repeats the initialisation of magichi just above; looks redundant
160
+ _mm512_set1_epi32(0xffffffff),
161
+ _mm512_set1_epi32(0x00010101));
162
+
163
+ mslo = _mm512_ternarylogic_epi32(mslo, _mm512_set1_epi32(0x3f3f3f3f), taglo,
164
+ 0xea); // A&B|C
165
+ mshi = _mm512_ternarylogic_epi32(mshi, _mm512_set1_epi32(0x3f3f3f3f), taghi,
166
+ 0xea);
167
+ mslo = _mm512_mask_slli_epi32(mslo, __mmask16(is1byte), lo, 24);
168
+
169
+ mshi = _mm512_mask_slli_epi32(mshi, __mmask16(is1bhi), hi, 24);
170
+
171
+ const __mmask64 wantlo =
172
+ _mm512_cmp_epu8_mask(mslo, magiclo, _MM_CMPINT_NLT);
173
+ const __mmask64 wanthi =
174
+ _mm512_cmp_epu8_mask(mshi, magichi, _MM_CMPINT_NLT);
175
+ const __m512i outlo = _mm512_maskz_compress_epi8(wantlo, mslo);
176
+ const __m512i outhi = _mm512_maskz_compress_epi8(wanthi, mshi);
177
+ const uint64_t wantlo_uint64 = _cvtmask64_u64(wantlo);
178
+ const uint64_t wanthi_uint64 = _cvtmask64_u64(wanthi);
179
+
180
+ uint64_t advlo = _mm_popcnt_u64(wantlo_uint64);
181
+ uint64_t advhi = _mm_popcnt_u64(wanthi_uint64);
182
+
183
+ _mm512_mask_storeu_epi8(
184
+ outbuf, _cvtu64_mask64(_pext_u64(wantlo_uint64, wantlo_uint64)), outlo);
185
+ _mm512_mask_storeu_epi8(
186
+ outbuf + advlo, _cvtu64_mask64(_pext_u64(wanthi_uint64, wanthi_uint64)),
187
+ outhi);
188
+ outbuf += advlo + advhi; // exact byte count, unlike the fixed advances in the fast paths
189
+ }
190
+ outbuf += -adjust; // cancels the `+ adjust` applied to *outlen below; the fast paths jump to `tail` and skip this line
191
+
192
+ tail:
193
+ if (inlen != 0) {
194
+ // We must have inlen < 32 here.
195
+ inmask = _cvtu32_mask32((1U << inlen) - 1);
196
+ in = _mm512_maskz_loadu_epi16(inmask, inbuf);
197
+ if (big_endian) {
198
+ in = _mm512_shuffle_epi8(in, byteflip);
199
+ }
200
+ adjust = (int)inlen - 31;
201
+ inlen = 0;
202
+ goto lastiteration;
203
+ }
204
+ *outlen = (outbuf - outbuf_orig) + adjust;
205
+ return ((inbuf - inbuf_orig) + adjust); // inbuf always advanced by 31 per block; adjust removes the unused part
206
+ }
@@ -0,0 +1,74 @@
1
+ // file included directly
2
+ size_t icelake_convert_utf32_to_latin1(const char32_t *buf, size_t len, // narrows len UTF-32 code units from buf to Latin-1 bytes
3
+ char *latin1_output) { // returns len, or 0 as soon as a block contains a value above 0xFF
4
+ const char32_t *end = buf + len;
5
+ __m512i v_0xFF = _mm512_set1_epi32(0xff);
6
+ __m512i shufmask = _mm512_set_epi8( // byte-permute indices: output bytes 0..15 take source bytes 0, 4, ..., 60
7
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
8
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 60,
9
+ 56, 52, 48, 44, 40, 36, 32, 28, 24, 20, 16, 12, 8, 4, 0);
10
+ while (end - buf >= 16) { // full 512-bit blocks of 16 code units
11
+ __m512i in = _mm512_loadu_si512((__m512i *)buf);
12
+ if (_mm512_cmpgt_epu32_mask(in, v_0xFF)) { // some lane does not fit in one byte
13
+ return 0; // bytes from earlier blocks have already been written
14
+ }
15
+ _mm_storeu_si128(
16
+ (__m128i *)latin1_output,
17
+ _mm512_castsi512_si128(_mm512_permutexvar_epi8(shufmask, in)));
18
+ latin1_output += 16;
19
+ buf += 16;
20
+ }
21
+ if (buf < end) { // tail of fewer than 16 code units
22
+ uint16_t mask = uint16_t((1 << (end - buf)) - 1); // one bit per remaining code unit
23
+ __m512i in = _mm512_maskz_loadu_epi32(mask, buf); // lanes past the end are zeroed, not read
24
+ if (_mm512_cmpgt_epu32_mask(in, v_0xFF)) {
25
+ return 0;
26
+ }
27
+ _mm_mask_storeu_epi8( // writes only the bytes selected by mask
28
+ latin1_output, mask,
29
+ _mm512_castsi512_si128(_mm512_permutexvar_epi8(shufmask, in)));
30
+ }
31
+ return len;
32
+ }
33
+
34
+ std::pair<result, char *> // result plus the output pointer as left by this routine
35
+ icelake_convert_utf32_to_latin1_with_errors(const char32_t *buf, size_t len, // narrows UTF-32 to Latin-1, reporting where it fails
36
+ char *latin1_output) {
37
+ const char32_t *end = buf + len;
38
+ const char32_t *start = buf; // kept to compute the error position
39
+ __m512i v_0xFF = _mm512_set1_epi32(0xff);
40
+ __m512i shufmask = _mm512_set_epi8( // byte-permute indices: output bytes 0..15 take source bytes 0, 4, ..., 60
41
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
42
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 60,
43
+ 56, 52, 48, 44, 40, 36, 32, 28, 24, 20, 16, 12, 8, 4, 0);
44
+ while (end - buf >= 16) { // full 512-bit blocks of 16 code units
45
+ __m512i in = _mm512_loadu_si512((__m512i *)buf);
46
+ if (_mm512_cmpgt_epu32_mask(in, v_0xFF)) { // some lane does not fit in one byte
47
+ while (uint32_t(*buf) <= 0xff) { // copy the leading good units; ends at the offending unit found above
48
+ *latin1_output++ = uint8_t(*buf++);
49
+ }
50
+ return std::make_pair(result(error_code::TOO_LARGE, buf - start), // second field: index of the first unit above 0xFF
51
+ latin1_output);
52
+ }
53
+ _mm_storeu_si128(
54
+ (__m128i *)latin1_output,
55
+ _mm512_castsi512_si128(_mm512_permutexvar_epi8(shufmask, in)));
56
+ latin1_output += 16;
57
+ buf += 16;
58
+ }
59
+ if (buf < end) { // tail of fewer than 16 code units
60
+ uint16_t mask = uint16_t((1 << (end - buf)) - 1); // one bit per remaining code unit
61
+ __m512i in = _mm512_maskz_loadu_epi32(mask, buf); // lanes past the end are zeroed, not read
62
+ if (_mm512_cmpgt_epu32_mask(in, v_0xFF)) {
63
+ while (uint32_t(*buf) <= 0xff) { // the offending unit lies within the tail, so this stays in bounds
64
+ *latin1_output++ = uint8_t(*buf++);
65
+ }
66
+ return std::make_pair(result(error_code::TOO_LARGE, buf - start),
67
+ latin1_output);
68
+ }
69
+ _mm_mask_storeu_epi8( // writes only the bytes selected by mask
70
+ latin1_output, mask,
71
+ _mm512_castsi512_si128(_mm512_permutexvar_epi8(shufmask, in)));
72
+ }
73
+ return std::make_pair(result(error_code::SUCCESS, len), latin1_output); // NOTE(review): latin1_output is not advanced past the masked tail store
74
+ }