react-native-quick-crypto 1.0.0-beta.20 → 1.0.0-beta.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (899)
  1. package/QuickCrypto.podspec +70 -7
  2. package/android/CMakeLists.txt +31 -1
  3. package/cpp/blake3/HybridBlake3.cpp +118 -0
  4. package/cpp/blake3/HybridBlake3.hpp +35 -0
  5. package/cpp/cipher/HybridCipherFactory.hpp +5 -0
  6. package/cpp/ec/HybridEcKeyPair.cpp +428 -0
  7. package/cpp/ec/HybridEcKeyPair.hpp +48 -0
  8. package/cpp/ed25519/HybridEdKeyPair.cpp +78 -4
  9. package/cpp/ed25519/HybridEdKeyPair.hpp +9 -2
  10. package/cpp/hash/HybridHash.cpp +37 -3
  11. package/cpp/hash/HybridHash.hpp +5 -3
  12. package/cpp/keys/HybridKeyObjectHandle.cpp +243 -0
  13. package/cpp/keys/HybridKeyObjectHandle.hpp +42 -0
  14. package/cpp/keys/KeyObjectData.cpp +226 -0
  15. package/cpp/keys/KeyObjectData.hpp +71 -0
  16. package/cpp/keys/node.h +5 -0
  17. package/cpp/rsa/HybridRsaKeyPair.cpp +154 -0
  18. package/cpp/rsa/HybridRsaKeyPair.hpp +43 -0
  19. package/cpp/utils/Macros.hpp +68 -0
  20. package/cpp/utils/Utils.hpp +27 -0
  21. package/deps/blake3/.cargo/config.toml +2 -0
  22. package/deps/blake3/.git-blame-ignore-revs +2 -0
  23. package/deps/blake3/.github/workflows/build_b3sum.py +38 -0
  24. package/deps/blake3/.github/workflows/ci.yml +491 -0
  25. package/deps/blake3/.github/workflows/tag.yml +43 -0
  26. package/deps/blake3/.github/workflows/upload_github_release_asset.py +73 -0
  27. package/deps/blake3/CONTRIBUTING.md +31 -0
  28. package/deps/blake3/Cargo.toml +135 -0
  29. package/deps/blake3/LICENSE_A2 +202 -0
  30. package/deps/blake3/LICENSE_A2LLVM +219 -0
  31. package/deps/blake3/LICENSE_CC0 +121 -0
  32. package/deps/blake3/README.md +229 -0
  33. package/deps/blake3/b3sum/Cargo.lock +513 -0
  34. package/deps/blake3/b3sum/Cargo.toml +26 -0
  35. package/deps/blake3/b3sum/README.md +72 -0
  36. package/deps/blake3/b3sum/src/main.rs +564 -0
  37. package/deps/blake3/b3sum/src/unit_tests.rs +235 -0
  38. package/deps/blake3/b3sum/tests/cli_tests.rs +680 -0
  39. package/deps/blake3/b3sum/what_does_check_do.md +176 -0
  40. package/deps/blake3/benches/bench.rs +623 -0
  41. package/deps/blake3/build.rs +389 -0
  42. package/deps/blake3/c/CMakeLists.txt +383 -0
  43. package/deps/blake3/c/CMakePresets.json +73 -0
  44. package/deps/blake3/c/Makefile.testing +82 -0
  45. package/deps/blake3/c/README.md +403 -0
  46. package/deps/blake3/c/blake3-config.cmake.in +14 -0
  47. package/deps/blake3/c/blake3.c +650 -0
  48. package/deps/blake3/c/blake3.h +86 -0
  49. package/deps/blake3/c/blake3_avx2.c +326 -0
  50. package/deps/blake3/c/blake3_avx2_x86-64_unix.S +1815 -0
  51. package/deps/blake3/c/blake3_avx2_x86-64_windows_gnu.S +1817 -0
  52. package/deps/blake3/c/blake3_avx2_x86-64_windows_msvc.asm +1828 -0
  53. package/deps/blake3/c/blake3_avx512.c +1388 -0
  54. package/deps/blake3/c/blake3_avx512_x86-64_unix.S +4824 -0
  55. package/deps/blake3/c/blake3_avx512_x86-64_windows_gnu.S +2615 -0
  56. package/deps/blake3/c/blake3_avx512_x86-64_windows_msvc.asm +2634 -0
  57. package/deps/blake3/c/blake3_c_rust_bindings/Cargo.toml +32 -0
  58. package/deps/blake3/c/blake3_c_rust_bindings/README.md +4 -0
  59. package/deps/blake3/c/blake3_c_rust_bindings/benches/bench.rs +477 -0
  60. package/deps/blake3/c/blake3_c_rust_bindings/build.rs +253 -0
  61. package/deps/blake3/c/blake3_c_rust_bindings/cross_test.sh +31 -0
  62. package/deps/blake3/c/blake3_c_rust_bindings/src/lib.rs +333 -0
  63. package/deps/blake3/c/blake3_c_rust_bindings/src/test.rs +696 -0
  64. package/deps/blake3/c/blake3_dispatch.c +332 -0
  65. package/deps/blake3/c/blake3_impl.h +333 -0
  66. package/deps/blake3/c/blake3_neon.c +366 -0
  67. package/deps/blake3/c/blake3_portable.c +160 -0
  68. package/deps/blake3/c/blake3_sse2.c +566 -0
  69. package/deps/blake3/c/blake3_sse2_x86-64_unix.S +2291 -0
  70. package/deps/blake3/c/blake3_sse2_x86-64_windows_gnu.S +2332 -0
  71. package/deps/blake3/c/blake3_sse2_x86-64_windows_msvc.asm +2350 -0
  72. package/deps/blake3/c/blake3_sse41.c +560 -0
  73. package/deps/blake3/c/blake3_sse41_x86-64_unix.S +2028 -0
  74. package/deps/blake3/c/blake3_sse41_x86-64_windows_gnu.S +2069 -0
  75. package/deps/blake3/c/blake3_sse41_x86-64_windows_msvc.asm +2089 -0
  76. package/deps/blake3/c/blake3_tbb.cpp +37 -0
  77. package/deps/blake3/c/dependencies/CMakeLists.txt +3 -0
  78. package/deps/blake3/c/dependencies/tbb/CMakeLists.txt +28 -0
  79. package/deps/blake3/c/example.c +36 -0
  80. package/deps/blake3/c/example_tbb.c +57 -0
  81. package/deps/blake3/c/libblake3.pc.in +12 -0
  82. package/deps/blake3/c/main.c +166 -0
  83. package/deps/blake3/c/test.py +97 -0
  84. package/deps/blake3/media/B3.svg +70 -0
  85. package/deps/blake3/media/BLAKE3.svg +85 -0
  86. package/deps/blake3/media/speed.svg +1474 -0
  87. package/deps/blake3/reference_impl/Cargo.toml +8 -0
  88. package/deps/blake3/reference_impl/README.md +14 -0
  89. package/deps/blake3/reference_impl/reference_impl.rs +374 -0
  90. package/deps/blake3/src/ffi_avx2.rs +65 -0
  91. package/deps/blake3/src/ffi_avx512.rs +169 -0
  92. package/deps/blake3/src/ffi_neon.rs +82 -0
  93. package/deps/blake3/src/ffi_sse2.rs +126 -0
  94. package/deps/blake3/src/ffi_sse41.rs +126 -0
  95. package/deps/blake3/src/guts.rs +60 -0
  96. package/deps/blake3/src/hazmat.rs +704 -0
  97. package/deps/blake3/src/io.rs +64 -0
  98. package/deps/blake3/src/join.rs +92 -0
  99. package/deps/blake3/src/lib.rs +1835 -0
  100. package/deps/blake3/src/platform.rs +587 -0
  101. package/deps/blake3/src/portable.rs +198 -0
  102. package/deps/blake3/src/rust_avx2.rs +474 -0
  103. package/deps/blake3/src/rust_sse2.rs +775 -0
  104. package/deps/blake3/src/rust_sse41.rs +766 -0
  105. package/deps/blake3/src/test.rs +1049 -0
  106. package/deps/blake3/src/traits.rs +227 -0
  107. package/deps/blake3/src/wasm32_simd.rs +794 -0
  108. package/deps/blake3/test_vectors/Cargo.toml +19 -0
  109. package/deps/blake3/test_vectors/cross_test.sh +25 -0
  110. package/deps/blake3/test_vectors/src/bin/generate.rs +4 -0
  111. package/deps/blake3/test_vectors/src/lib.rs +350 -0
  112. package/deps/blake3/test_vectors/test_vectors.json +217 -0
  113. package/deps/blake3/tools/compiler_version/Cargo.toml +7 -0
  114. package/deps/blake3/tools/compiler_version/build.rs +6 -0
  115. package/deps/blake3/tools/compiler_version/src/main.rs +27 -0
  116. package/deps/blake3/tools/instruction_set_support/Cargo.toml +6 -0
  117. package/deps/blake3/tools/instruction_set_support/src/main.rs +10 -0
  118. package/deps/blake3/tools/release.md +16 -0
  119. package/deps/ncrypto/ncrypto.cc +4679 -0
  120. package/deps/ncrypto/ncrypto.h +1625 -0
  121. package/lib/commonjs/blake3.js +98 -0
  122. package/lib/commonjs/blake3.js.map +1 -0
  123. package/lib/commonjs/ec.js +344 -0
  124. package/lib/commonjs/ec.js.map +1 -0
  125. package/lib/commonjs/ed.js +143 -0
  126. package/lib/commonjs/ed.js.map +1 -1
  127. package/lib/commonjs/expo-plugin/withXCode.js +3 -3
  128. package/lib/commonjs/hash.js +48 -1
  129. package/lib/commonjs/hash.js.map +1 -1
  130. package/lib/commonjs/index.js +54 -4
  131. package/lib/commonjs/index.js.map +1 -1
  132. package/lib/commonjs/keys/classes.js +111 -52
  133. package/lib/commonjs/keys/classes.js.map +1 -1
  134. package/lib/commonjs/keys/generateKeyPair.js +98 -144
  135. package/lib/commonjs/keys/generateKeyPair.js.map +1 -1
  136. package/lib/commonjs/keys/index.js +27 -0
  137. package/lib/commonjs/keys/index.js.map +1 -1
  138. package/lib/commonjs/keys/utils.js +18 -13
  139. package/lib/commonjs/keys/utils.js.map +1 -1
  140. package/lib/commonjs/rsa.js +129 -0
  141. package/lib/commonjs/rsa.js.map +1 -0
  142. package/lib/commonjs/specs/blake3.nitro.js +6 -0
  143. package/lib/commonjs/specs/blake3.nitro.js.map +1 -0
  144. package/lib/commonjs/specs/ecKeyPair.nitro.js +6 -0
  145. package/lib/commonjs/specs/ecKeyPair.nitro.js.map +1 -0
  146. package/lib/commonjs/specs/rsaKeyPair.nitro.js +6 -0
  147. package/lib/commonjs/specs/rsaKeyPair.nitro.js.map +1 -0
  148. package/lib/commonjs/subtle.js +365 -0
  149. package/lib/commonjs/subtle.js.map +1 -0
  150. package/lib/commonjs/utils/conversion.js +25 -2
  151. package/lib/commonjs/utils/conversion.js.map +1 -1
  152. package/lib/commonjs/utils/hashnames.js +2 -1
  153. package/lib/commonjs/utils/hashnames.js.map +1 -1
  154. package/lib/commonjs/utils/index.js +11 -0
  155. package/lib/commonjs/utils/index.js.map +1 -1
  156. package/lib/commonjs/utils/noble.js +82 -0
  157. package/lib/commonjs/utils/noble.js.map +1 -0
  158. package/lib/commonjs/utils/types.js +28 -16
  159. package/lib/commonjs/utils/types.js.map +1 -1
  160. package/lib/commonjs/utils/validation.js +74 -1
  161. package/lib/commonjs/utils/validation.js.map +1 -1
  162. package/lib/module/blake3.js +90 -0
  163. package/lib/module/blake3.js.map +1 -0
  164. package/lib/module/ec.js +336 -0
  165. package/lib/module/ec.js.map +1 -0
  166. package/lib/module/ed.js +141 -0
  167. package/lib/module/ed.js.map +1 -1
  168. package/lib/module/expo-plugin/withXCode.js +3 -3
  169. package/lib/module/hash.js +47 -2
  170. package/lib/module/hash.js.map +1 -1
  171. package/lib/module/index.js +9 -1
  172. package/lib/module/index.js.map +1 -1
  173. package/lib/module/keys/classes.js +108 -49
  174. package/lib/module/keys/classes.js.map +1 -1
  175. package/lib/module/keys/generateKeyPair.js +91 -143
  176. package/lib/module/keys/generateKeyPair.js.map +1 -1
  177. package/lib/module/keys/index.js +9 -6
  178. package/lib/module/keys/index.js.map +1 -1
  179. package/lib/module/keys/utils.js +16 -12
  180. package/lib/module/keys/utils.js.map +1 -1
  181. package/lib/module/rsa.js +123 -0
  182. package/lib/module/rsa.js.map +1 -0
  183. package/lib/module/specs/blake3.nitro.js +4 -0
  184. package/lib/module/specs/blake3.nitro.js.map +1 -0
  185. package/lib/module/specs/ecKeyPair.nitro.js +4 -0
  186. package/lib/module/specs/ecKeyPair.nitro.js.map +1 -0
  187. package/lib/module/specs/rsaKeyPair.nitro.js +4 -0
  188. package/lib/module/specs/rsaKeyPair.nitro.js.map +1 -0
  189. package/lib/module/subtle.js +360 -0
  190. package/lib/module/subtle.js.map +1 -0
  191. package/lib/module/utils/conversion.js +7 -2
  192. package/lib/module/utils/conversion.js.map +1 -1
  193. package/lib/module/utils/hashnames.js +2 -1
  194. package/lib/module/utils/hashnames.js.map +1 -1
  195. package/lib/module/utils/index.js +1 -0
  196. package/lib/module/utils/index.js.map +1 -1
  197. package/lib/module/utils/noble.js +76 -0
  198. package/lib/module/utils/noble.js.map +1 -0
  199. package/lib/module/utils/types.js +26 -17
  200. package/lib/module/utils/types.js.map +1 -1
  201. package/lib/module/utils/validation.js +69 -1
  202. package/lib/module/utils/validation.js.map +1 -1
  203. package/lib/tsconfig.tsbuildinfo +1 -1
  204. package/lib/typescript/blake3.d.ts +33 -0
  205. package/lib/typescript/blake3.d.ts.map +1 -0
  206. package/lib/typescript/ec.d.ts +13 -0
  207. package/lib/typescript/ec.d.ts.map +1 -0
  208. package/lib/typescript/ed.d.ts +27 -1
  209. package/lib/typescript/ed.d.ts.map +1 -1
  210. package/lib/typescript/hash.d.ts +14 -1
  211. package/lib/typescript/hash.d.ts.map +1 -1
  212. package/lib/typescript/index.d.ts +45 -1
  213. package/lib/typescript/index.d.ts.map +1 -1
  214. package/lib/typescript/keys/classes.d.ts +49 -8
  215. package/lib/typescript/keys/classes.d.ts.map +1 -1
  216. package/lib/typescript/keys/generateKeyPair.d.ts +5 -0
  217. package/lib/typescript/keys/generateKeyPair.d.ts.map +1 -1
  218. package/lib/typescript/keys/index.d.ts +5 -2
  219. package/lib/typescript/keys/index.d.ts.map +1 -1
  220. package/lib/typescript/keys/utils.d.ts +3 -1
  221. package/lib/typescript/keys/utils.d.ts.map +1 -1
  222. package/lib/typescript/rsa.d.ts +10 -0
  223. package/lib/typescript/rsa.d.ts.map +1 -0
  224. package/lib/typescript/specs/blake3.nitro.d.ts +15 -0
  225. package/lib/typescript/specs/blake3.nitro.d.ts.map +1 -0
  226. package/lib/typescript/specs/ecKeyPair.nitro.d.ts +20 -0
  227. package/lib/typescript/specs/ecKeyPair.nitro.d.ts.map +1 -0
  228. package/lib/typescript/specs/edKeyPair.nitro.d.ts +1 -0
  229. package/lib/typescript/specs/edKeyPair.nitro.d.ts.map +1 -1
  230. package/lib/typescript/specs/hash.nitro.d.ts +1 -0
  231. package/lib/typescript/specs/hash.nitro.d.ts.map +1 -1
  232. package/lib/typescript/specs/keyObjectHandle.nitro.d.ts +0 -1
  233. package/lib/typescript/specs/keyObjectHandle.nitro.d.ts.map +1 -1
  234. package/lib/typescript/specs/rsaKeyPair.nitro.d.ts +20 -0
  235. package/lib/typescript/specs/rsaKeyPair.nitro.d.ts.map +1 -0
  236. package/lib/typescript/subtle.d.ts +17 -0
  237. package/lib/typescript/subtle.d.ts.map +1 -0
  238. package/lib/typescript/utils/cipher.d.ts +1 -1
  239. package/lib/typescript/utils/conversion.d.ts +1 -0
  240. package/lib/typescript/utils/conversion.d.ts.map +1 -1
  241. package/lib/typescript/utils/hashnames.d.ts +3 -1
  242. package/lib/typescript/utils/hashnames.d.ts.map +1 -1
  243. package/lib/typescript/utils/index.d.ts +1 -0
  244. package/lib/typescript/utils/index.d.ts.map +1 -1
  245. package/lib/typescript/utils/noble.d.ts +19 -0
  246. package/lib/typescript/utils/noble.d.ts.map +1 -0
  247. package/lib/typescript/utils/types.d.ts +101 -17
  248. package/lib/typescript/utils/types.d.ts.map +1 -1
  249. package/lib/typescript/utils/validation.d.ts +5 -0
  250. package/lib/typescript/utils/validation.d.ts.map +1 -1
  251. package/nitrogen/generated/.gitattributes +1 -1
  252. package/nitrogen/generated/android/QuickCrypto+autolinking.cmake +3 -0
  253. package/nitrogen/generated/android/QuickCryptoOnLoad.cpp +40 -0
  254. package/nitrogen/generated/ios/QuickCrypto-Swift-Cxx-Umbrella.hpp +2 -1
  255. package/nitrogen/generated/ios/QuickCryptoAutolinking.mm +40 -0
  256. package/nitrogen/generated/shared/c++/CFRGKeyPairType.hpp +11 -13
  257. package/nitrogen/generated/shared/c++/CipherArgs.hpp +4 -6
  258. package/nitrogen/generated/shared/c++/HybridBlake3Spec.cpp +28 -0
  259. package/nitrogen/generated/shared/c++/HybridBlake3Spec.hpp +76 -0
  260. package/nitrogen/generated/shared/c++/HybridCipherFactorySpec.hpp +1 -1
  261. package/nitrogen/generated/shared/c++/HybridCipherSpec.hpp +1 -1
  262. package/nitrogen/generated/shared/c++/HybridEcKeyPairSpec.cpp +29 -0
  263. package/nitrogen/generated/shared/c++/HybridEcKeyPairSpec.hpp +77 -0
  264. package/nitrogen/generated/shared/c++/HybridEdKeyPairSpec.cpp +1 -0
  265. package/nitrogen/generated/shared/c++/HybridEdKeyPairSpec.hpp +3 -2
  266. package/nitrogen/generated/shared/c++/HybridHashSpec.cpp +1 -0
  267. package/nitrogen/generated/shared/c++/HybridHashSpec.hpp +2 -1
  268. package/nitrogen/generated/shared/c++/HybridKeyObjectHandleSpec.cpp +0 -1
  269. package/nitrogen/generated/shared/c++/HybridKeyObjectHandleSpec.hpp +1 -2
  270. package/nitrogen/generated/shared/c++/HybridPbkdf2Spec.hpp +1 -1
  271. package/nitrogen/generated/shared/c++/HybridRandomSpec.hpp +1 -1
  272. package/nitrogen/generated/shared/c++/HybridRsaKeyPairSpec.cpp +29 -0
  273. package/nitrogen/generated/shared/c++/HybridRsaKeyPairSpec.hpp +77 -0
  274. package/nitrogen/generated/shared/c++/JWK.hpp +15 -17
  275. package/nitrogen/generated/shared/c++/JWKkty.hpp +11 -13
  276. package/nitrogen/generated/shared/c++/JWKuse.hpp +7 -9
  277. package/nitrogen/generated/shared/c++/KFormatType.hpp +12 -14
  278. package/nitrogen/generated/shared/c++/KeyDetail.hpp +4 -6
  279. package/nitrogen/generated/shared/c++/KeyEncoding.hpp +13 -15
  280. package/nitrogen/generated/shared/c++/KeyObject.hpp +67 -0
  281. package/nitrogen/generated/shared/c++/KeyType.hpp +9 -11
  282. package/nitrogen/generated/shared/c++/KeyUsage.hpp +37 -23
  283. package/nitrogen/generated/shared/c++/NamedCurve.hpp +9 -11
  284. package/package.json +14 -11
  285. package/src/blake3.ts +123 -0
  286. package/src/ec.ts +432 -0
  287. package/src/ed.ts +179 -2
  288. package/src/expo-plugin/withXCode.ts +3 -3
  289. package/src/hash.ts +68 -2
  290. package/src/index.ts +8 -0
  291. package/src/keys/classes.ts +161 -55
  292. package/src/keys/generateKeyPair.ts +133 -134
  293. package/src/keys/index.ts +13 -3
  294. package/src/keys/utils.ts +24 -18
  295. package/src/rsa.ts +176 -0
  296. package/src/specs/blake3.nitro.ts +12 -0
  297. package/src/specs/ecKeyPair.nitro.ts +38 -0
  298. package/src/specs/edKeyPair.nitro.ts +2 -0
  299. package/src/specs/hash.nitro.ts +1 -0
  300. package/src/specs/keyObjectHandle.nitro.ts +0 -1
  301. package/src/specs/rsaKeyPair.nitro.ts +33 -0
  302. package/src/subtle.ts +614 -0
  303. package/src/utils/conversion.ts +7 -1
  304. package/src/utils/hashnames.ts +4 -2
  305. package/src/utils/index.ts +1 -0
  306. package/src/utils/noble.ts +85 -0
  307. package/src/utils/types.ts +142 -20
  308. package/src/utils/validation.ts +96 -1
  309. package/ios/libsodium-stable/.github/workflows/autocloser.yml +0 -12
  310. package/ios/libsodium-stable/.github/workflows/ci.yml +0 -180
  311. package/ios/libsodium-stable/.github/workflows/cifuzz.yml +0 -32
  312. package/ios/libsodium-stable/.github/workflows/codeql-analysis.yml +0 -48
  313. package/ios/libsodium-stable/.github/workflows/dotnet-core.yml +0 -388
  314. package/ios/libsodium-stable/AUTHORS +0 -144
  315. package/ios/libsodium-stable/CITATION.cff +0 -18
  316. package/ios/libsodium-stable/ChangeLog +0 -677
  317. package/ios/libsodium-stable/LICENSE +0 -18
  318. package/ios/libsodium-stable/Makefile.am +0 -23
  319. package/ios/libsodium-stable/README.markdown +0 -76
  320. package/ios/libsodium-stable/THANKS +0 -92
  321. package/ios/libsodium-stable/appveyor.yml +0 -24
  322. package/ios/libsodium-stable/autogen.sh +0 -117
  323. package/ios/libsodium-stable/azure-pipelines.yml +0 -122
  324. package/ios/libsodium-stable/build.zig +0 -281
  325. package/ios/libsodium-stable/builds/Makefile.am +0 -81
  326. package/ios/libsodium-stable/builds/msvc/build/buildall.bat +0 -18
  327. package/ios/libsodium-stable/builds/msvc/build/buildbase.bat +0 -132
  328. package/ios/libsodium-stable/builds/msvc/properties/ARM64.props +0 -23
  329. package/ios/libsodium-stable/builds/msvc/properties/Common.props +0 -21
  330. package/ios/libsodium-stable/builds/msvc/properties/DLL.props +0 -16
  331. package/ios/libsodium-stable/builds/msvc/properties/Debug.props +0 -29
  332. package/ios/libsodium-stable/builds/msvc/properties/DebugDEXE.props +0 -21
  333. package/ios/libsodium-stable/builds/msvc/properties/DebugDLL.props +0 -20
  334. package/ios/libsodium-stable/builds/msvc/properties/DebugLEXE.props +0 -20
  335. package/ios/libsodium-stable/builds/msvc/properties/DebugLIB.props +0 -21
  336. package/ios/libsodium-stable/builds/msvc/properties/DebugLTCG.props +0 -20
  337. package/ios/libsodium-stable/builds/msvc/properties/DebugSEXE.props +0 -21
  338. package/ios/libsodium-stable/builds/msvc/properties/EXE.props +0 -17
  339. package/ios/libsodium-stable/builds/msvc/properties/LIB.props +0 -16
  340. package/ios/libsodium-stable/builds/msvc/properties/LTCG.props +0 -13
  341. package/ios/libsodium-stable/builds/msvc/properties/Link.props +0 -21
  342. package/ios/libsodium-stable/builds/msvc/properties/Messages.props +0 -15
  343. package/ios/libsodium-stable/builds/msvc/properties/Output.props +0 -30
  344. package/ios/libsodium-stable/builds/msvc/properties/Release.props +0 -41
  345. package/ios/libsodium-stable/builds/msvc/properties/ReleaseDEXE.props +0 -20
  346. package/ios/libsodium-stable/builds/msvc/properties/ReleaseDLL.props +0 -19
  347. package/ios/libsodium-stable/builds/msvc/properties/ReleaseLEXE.props +0 -20
  348. package/ios/libsodium-stable/builds/msvc/properties/ReleaseLIB.props +0 -19
  349. package/ios/libsodium-stable/builds/msvc/properties/ReleaseLTCG.props +0 -19
  350. package/ios/libsodium-stable/builds/msvc/properties/ReleaseSEXE.props +0 -20
  351. package/ios/libsodium-stable/builds/msvc/properties/Win32.props +0 -23
  352. package/ios/libsodium-stable/builds/msvc/properties/x64.props +0 -26
  353. package/ios/libsodium-stable/builds/msvc/resource.h +0 -14
  354. package/ios/libsodium-stable/builds/msvc/resource.rc +0 -65
  355. package/ios/libsodium-stable/builds/msvc/version.h +0 -33
  356. package/ios/libsodium-stable/builds/msvc/vs2010/libsodium/libsodium.props +0 -48
  357. package/ios/libsodium-stable/builds/msvc/vs2010/libsodium/libsodium.vcxproj +0 -346
  358. package/ios/libsodium-stable/builds/msvc/vs2010/libsodium/libsodium.vcxproj.filters +0 -1088
  359. package/ios/libsodium-stable/builds/msvc/vs2010/libsodium/libsodium.xml +0 -15
  360. package/ios/libsodium-stable/builds/msvc/vs2010/libsodium.import.props +0 -52
  361. package/ios/libsodium-stable/builds/msvc/vs2010/libsodium.import.xml +0 -17
  362. package/ios/libsodium-stable/builds/msvc/vs2010/libsodium.sln +0 -50
  363. package/ios/libsodium-stable/builds/msvc/vs2012/libsodium/libsodium.props +0 -48
  364. package/ios/libsodium-stable/builds/msvc/vs2012/libsodium/libsodium.vcxproj +0 -346
  365. package/ios/libsodium-stable/builds/msvc/vs2012/libsodium/libsodium.vcxproj.filters +0 -1088
  366. package/ios/libsodium-stable/builds/msvc/vs2012/libsodium/libsodium.xml +0 -15
  367. package/ios/libsodium-stable/builds/msvc/vs2012/libsodium.import.props +0 -52
  368. package/ios/libsodium-stable/builds/msvc/vs2012/libsodium.import.xml +0 -17
  369. package/ios/libsodium-stable/builds/msvc/vs2012/libsodium.sln +0 -50
  370. package/ios/libsodium-stable/builds/msvc/vs2013/libsodium/libsodium.props +0 -48
  371. package/ios/libsodium-stable/builds/msvc/vs2013/libsodium/libsodium.vcxproj +0 -346
  372. package/ios/libsodium-stable/builds/msvc/vs2013/libsodium/libsodium.vcxproj.filters +0 -1088
  373. package/ios/libsodium-stable/builds/msvc/vs2013/libsodium/libsodium.xml +0 -15
  374. package/ios/libsodium-stable/builds/msvc/vs2013/libsodium.import.props +0 -52
  375. package/ios/libsodium-stable/builds/msvc/vs2013/libsodium.import.xml +0 -17
  376. package/ios/libsodium-stable/builds/msvc/vs2013/libsodium.sln +0 -52
  377. package/ios/libsodium-stable/builds/msvc/vs2015/libsodium/libsodium.props +0 -48
  378. package/ios/libsodium-stable/builds/msvc/vs2015/libsodium/libsodium.vcxproj +0 -346
  379. package/ios/libsodium-stable/builds/msvc/vs2015/libsodium/libsodium.vcxproj.filters +0 -1088
  380. package/ios/libsodium-stable/builds/msvc/vs2015/libsodium/libsodium.xml +0 -15
  381. package/ios/libsodium-stable/builds/msvc/vs2015/libsodium.import.props +0 -52
  382. package/ios/libsodium-stable/builds/msvc/vs2015/libsodium.import.xml +0 -17
  383. package/ios/libsodium-stable/builds/msvc/vs2015/libsodium.sln +0 -52
  384. package/ios/libsodium-stable/builds/msvc/vs2017/libsodium/libsodium.props +0 -48
  385. package/ios/libsodium-stable/builds/msvc/vs2017/libsodium/libsodium.vcxproj +0 -346
  386. package/ios/libsodium-stable/builds/msvc/vs2017/libsodium/libsodium.vcxproj.filters +0 -1088
  387. package/ios/libsodium-stable/builds/msvc/vs2017/libsodium/libsodium.xml +0 -15
  388. package/ios/libsodium-stable/builds/msvc/vs2017/libsodium.import.props +0 -52
  389. package/ios/libsodium-stable/builds/msvc/vs2017/libsodium.import.xml +0 -17
  390. package/ios/libsodium-stable/builds/msvc/vs2017/libsodium.sln +0 -52
  391. package/ios/libsodium-stable/builds/msvc/vs2019/libsodium/libsodium.props +0 -48
  392. package/ios/libsodium-stable/builds/msvc/vs2019/libsodium/libsodium.vcxproj +0 -370
  393. package/ios/libsodium-stable/builds/msvc/vs2019/libsodium/libsodium.vcxproj.filters +0 -1088
  394. package/ios/libsodium-stable/builds/msvc/vs2019/libsodium/libsodium.xml +0 -15
  395. package/ios/libsodium-stable/builds/msvc/vs2019/libsodium.import.props +0 -52
  396. package/ios/libsodium-stable/builds/msvc/vs2019/libsodium.import.xml +0 -17
  397. package/ios/libsodium-stable/builds/msvc/vs2019/libsodium.sln +0 -52
  398. package/ios/libsodium-stable/builds/msvc/vs2022/libsodium/libsodium.props +0 -48
  399. package/ios/libsodium-stable/builds/msvc/vs2022/libsodium/libsodium.vcxproj +0 -370
  400. package/ios/libsodium-stable/builds/msvc/vs2022/libsodium/libsodium.vcxproj.filters +0 -1088
  401. package/ios/libsodium-stable/builds/msvc/vs2022/libsodium/libsodium.xml +0 -15
  402. package/ios/libsodium-stable/builds/msvc/vs2022/libsodium.import.props +0 -52
  403. package/ios/libsodium-stable/builds/msvc/vs2022/libsodium.import.xml +0 -17
  404. package/ios/libsodium-stable/builds/msvc/vs2022/libsodium.sln +0 -70
  405. package/ios/libsodium-stable/ci/appveyor/libsodium.sln +0 -40
  406. package/ios/libsodium-stable/ci/appveyor/libsodium.vcxproj +0 -594
  407. package/ios/libsodium-stable/ci/appveyor/libsodium.vcxproj.filters +0 -813
  408. package/ios/libsodium-stable/ci/appveyor/msvc-scripts/process.bat +0 -5
  409. package/ios/libsodium-stable/ci/appveyor/msvc-scripts/rep.vbs +0 -12
  410. package/ios/libsodium-stable/ci/appveyor/msvc-scripts/sodium.props +0 -29
  411. package/ios/libsodium-stable/configure.ac +0 -1004
  412. package/ios/libsodium-stable/contrib/Findsodium.cmake +0 -297
  413. package/ios/libsodium-stable/contrib/Makefile.am +0 -3
  414. package/ios/libsodium-stable/dist-build/Makefile.am +0 -14
  415. package/ios/libsodium-stable/dist-build/android-aar.sh +0 -194
  416. package/ios/libsodium-stable/dist-build/android-armv7-a.sh +0 -5
  417. package/ios/libsodium-stable/dist-build/android-armv8-a.sh +0 -5
  418. package/ios/libsodium-stable/dist-build/android-build.sh +0 -95
  419. package/ios/libsodium-stable/dist-build/android-x86.sh +0 -5
  420. package/ios/libsodium-stable/dist-build/android-x86_64.sh +0 -5
  421. package/ios/libsodium-stable/dist-build/apple-xcframework.sh +0 -628
  422. package/ios/libsodium-stable/dist-build/emscripten-symbols.def +0 -651
  423. package/ios/libsodium-stable/dist-build/emscripten.sh +0 -206
  424. package/ios/libsodium-stable/dist-build/generate-emscripten-symbols.sh +0 -59
  425. package/ios/libsodium-stable/dist-build/macos.sh +0 -26
  426. package/ios/libsodium-stable/dist-build/msys2-win32.sh +0 -18
  427. package/ios/libsodium-stable/dist-build/msys2-win64.sh +0 -18
  428. package/ios/libsodium-stable/dist-build/wasm32-wasi.sh +0 -45
  429. package/ios/libsodium-stable/lgtm.yml +0 -6
  430. package/ios/libsodium-stable/libsodium-uninstalled.pc.in +0 -7
  431. package/ios/libsodium-stable/libsodium.pc.in +0 -12
  432. package/ios/libsodium-stable/logo.png +0 -0
  433. package/ios/libsodium-stable/m4/ax_add_fortify_source.m4 +0 -119
  434. package/ios/libsodium-stable/m4/ax_check_catchable_abrt.m4 +0 -57
  435. package/ios/libsodium-stable/m4/ax_check_catchable_segv.m4 +0 -47
  436. package/ios/libsodium-stable/m4/ax_check_compile_flag.m4 +0 -55
  437. package/ios/libsodium-stable/m4/ax_check_define.m4 +0 -73
  438. package/ios/libsodium-stable/m4/ax_check_gnu_make.m4 +0 -95
  439. package/ios/libsodium-stable/m4/ax_check_link_flag.m4 +0 -75
  440. package/ios/libsodium-stable/m4/ax_pthread.m4 +0 -522
  441. package/ios/libsodium-stable/m4/ax_tls.m4 +0 -71
  442. package/ios/libsodium-stable/m4/ax_valgrind_check.m4 +0 -239
  443. package/ios/libsodium-stable/m4/ld-output-def.m4 +0 -29
  444. package/ios/libsodium-stable/packaging/dotnet-core/libsodium.pkgproj +0 -49
  445. package/ios/libsodium-stable/packaging/dotnet-core/test.cs +0 -43
  446. package/ios/libsodium-stable/packaging/nuget/package.bat +0 -13
  447. package/ios/libsodium-stable/packaging/nuget/package.config +0 -4
  448. package/ios/libsodium-stable/packaging/nuget/package.gsl +0 -260
  449. package/ios/libsodium-stable/regen-msvc/libsodium.vcxproj +0 -326
  450. package/ios/libsodium-stable/regen-msvc/libsodium.vcxproj.filters +0 -23
  451. package/ios/libsodium-stable/regen-msvc/libsodium.vcxproj.filters.tpl +0 -35
  452. package/ios/libsodium-stable/regen-msvc/libsodium.vcxproj.tpl +0 -37
  453. package/ios/libsodium-stable/regen-msvc/regen-msvc.py +0 -240
  454. package/ios/libsodium-stable/regen-msvc/tl_libsodium.vcxproj.filters.tpl +0 -23
  455. package/ios/libsodium-stable/regen-msvc/tl_libsodium.vcxproj.tpl +0 -332
  456. package/ios/libsodium-stable/src/Makefile.am +0 -3
  457. package/ios/libsodium-stable/src/libsodium/Makefile.am +0 -314
  458. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis128l/aead_aegis128l.c +0 -159
  459. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis128l/aegis128l_aesni.c +0 -70
  460. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis128l/aegis128l_aesni.h +0 -8
  461. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis128l/aegis128l_armcrypto.c +0 -72
  462. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis128l/aegis128l_armcrypto.h +0 -8
  463. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis128l/aegis128l_common.h +0 -248
  464. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis128l/aegis128l_soft.c +0 -59
  465. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis128l/aegis128l_soft.h +0 -8
  466. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis128l/implementations.h +0 -17
  467. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis256/aead_aegis256.c +0 -158
  468. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis256/aegis256_aesni.c +0 -65
  469. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis256/aegis256_aesni.h +0 -8
  470. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis256/aegis256_armcrypto.c +0 -70
  471. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis256/aegis256_armcrypto.h +0 -8
  472. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis256/aegis256_common.h +0 -231
  473. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis256/aegis256_soft.c +0 -54
  474. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis256/aegis256_soft.h +0 -8
  475. package/ios/libsodium-stable/src/libsodium/crypto_aead/aegis256/implementations.h +0 -17
  476. package/ios/libsodium-stable/src/libsodium/crypto_aead/aes256gcm/aead_aes256gcm.c +0 -157
  477. package/ios/libsodium-stable/src/libsodium/crypto_aead/aes256gcm/aesni/aead_aes256gcm_aesni.c +0 -1015
  478. package/ios/libsodium-stable/src/libsodium/crypto_aead/aes256gcm/armcrypto/aead_aes256gcm_armcrypto.c +0 -1033
  479. package/ios/libsodium-stable/src/libsodium/crypto_aead/chacha20poly1305/aead_chacha20poly1305.c +0 -400
  480. package/ios/libsodium-stable/src/libsodium/crypto_aead/xchacha20poly1305/aead_xchacha20poly1305.c +0 -262
  481. package/ios/libsodium-stable/src/libsodium/crypto_auth/crypto_auth.c +0 -41
  482. package/ios/libsodium-stable/src/libsodium/crypto_auth/hmacsha256/auth_hmacsha256.c +0 -118
  483. package/ios/libsodium-stable/src/libsodium/crypto_auth/hmacsha512/auth_hmacsha512.c +0 -118
  484. package/ios/libsodium-stable/src/libsodium/crypto_auth/hmacsha512256/auth_hmacsha512256.c +0 -93
  485. package/ios/libsodium-stable/src/libsodium/crypto_box/crypto_box.c +0 -114
  486. package/ios/libsodium-stable/src/libsodium/crypto_box/crypto_box_easy.c +0 -115
  487. package/ios/libsodium-stable/src/libsodium/crypto_box/crypto_box_seal.c +0 -68
  488. package/ios/libsodium-stable/src/libsodium/crypto_box/curve25519xchacha20poly1305/box_curve25519xchacha20poly1305.c +0 -204
  489. package/ios/libsodium-stable/src/libsodium/crypto_box/curve25519xchacha20poly1305/box_seal_curve25519xchacha20poly1305.c +0 -79
  490. package/ios/libsodium-stable/src/libsodium/crypto_box/curve25519xsalsa20poly1305/box_curve25519xsalsa20poly1305.c +0 -156
  491. package/ios/libsodium-stable/src/libsodium/crypto_core/ed25519/core_ed25519.c +0 -225
  492. package/ios/libsodium-stable/src/libsodium/crypto_core/ed25519/core_ristretto255.c +0 -156
  493. package/ios/libsodium-stable/src/libsodium/crypto_core/ed25519/ref10/ed25519_ref10.c +0 -2873
  494. package/ios/libsodium-stable/src/libsodium/crypto_core/ed25519/ref10/fe_25_5/base.h +0 -1344
  495. package/ios/libsodium-stable/src/libsodium/crypto_core/ed25519/ref10/fe_25_5/base2.h +0 -40
  496. package/ios/libsodium-stable/src/libsodium/crypto_core/ed25519/ref10/fe_25_5/constants.h +0 -40
  497. package/ios/libsodium-stable/src/libsodium/crypto_core/ed25519/ref10/fe_25_5/fe.h +0 -220
  498. package/ios/libsodium-stable/src/libsodium/crypto_core/ed25519/ref10/fe_51/base.h +0 -1344
  499. package/ios/libsodium-stable/src/libsodium/crypto_core/ed25519/ref10/fe_51/base2.h +0 -40
  500. package/ios/libsodium-stable/src/libsodium/crypto_core/ed25519/ref10/fe_51/constants.h +0 -41
  501. package/ios/libsodium-stable/src/libsodium/crypto_core/ed25519/ref10/fe_51/fe.h +0 -116
  502. package/ios/libsodium-stable/src/libsodium/crypto_core/hchacha20/core_hchacha20.c +0 -93
  503. package/ios/libsodium-stable/src/libsodium/crypto_core/hsalsa20/core_hsalsa20.c +0 -21
  504. package/ios/libsodium-stable/src/libsodium/crypto_core/hsalsa20/ref2/core_hsalsa20_ref2.c +0 -95
  505. package/ios/libsodium-stable/src/libsodium/crypto_core/salsa/ref/core_salsa_ref.c +0 -195
  506. package/ios/libsodium-stable/src/libsodium/crypto_core/softaes/softaes.c +0 -340
  507. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/generichash_blake2.c +0 -55
  508. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2.h +0 -106
  509. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2b-compress-avx2.c +0 -52
  510. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2b-compress-avx2.h +0 -142
  511. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2b-compress-ref.c +0 -93
  512. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2b-compress-sse41.c +0 -91
  513. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2b-compress-sse41.h +0 -106
  514. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2b-compress-ssse3.c +0 -95
  515. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2b-compress-ssse3.h +0 -106
  516. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2b-load-avx2.h +0 -340
  517. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2b-load-sse2.h +0 -164
  518. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2b-load-sse41.h +0 -307
  519. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/blake2b-ref.c +0 -438
  520. package/ios/libsodium-stable/src/libsodium/crypto_generichash/blake2b/ref/generichash_blake2b.c +0 -116
  521. package/ios/libsodium-stable/src/libsodium/crypto_generichash/crypto_generichash.c +0 -91
  522. package/ios/libsodium-stable/src/libsodium/crypto_hash/crypto_hash.c +0 -20
  523. package/ios/libsodium-stable/src/libsodium/crypto_hash/sha256/cp/hash_sha256_cp.c +0 -256
  524. package/ios/libsodium-stable/src/libsodium/crypto_hash/sha256/hash_sha256.c +0 -13
  525. package/ios/libsodium-stable/src/libsodium/crypto_hash/sha512/cp/hash_sha512_cp.c +0 -284
  526. package/ios/libsodium-stable/src/libsodium/crypto_hash/sha512/hash_sha512.c +0 -13
  527. package/ios/libsodium-stable/src/libsodium/crypto_kdf/blake2b/kdf_blake2b.c +0 -52
  528. package/ios/libsodium-stable/src/libsodium/crypto_kdf/crypto_kdf.c +0 -49
  529. package/ios/libsodium-stable/src/libsodium/crypto_kdf/hkdf/kdf_hkdf_sha256.c +0 -123
  530. package/ios/libsodium-stable/src/libsodium/crypto_kdf/hkdf/kdf_hkdf_sha512.c +0 -123
  531. package/ios/libsodium-stable/src/libsodium/crypto_kx/crypto_kx.c +0 -143
  532. package/ios/libsodium-stable/src/libsodium/crypto_onetimeauth/crypto_onetimeauth.c +0 -71
  533. package/ios/libsodium-stable/src/libsodium/crypto_onetimeauth/poly1305/donna/poly1305_donna.c +0 -124
  534. package/ios/libsodium-stable/src/libsodium/crypto_onetimeauth/poly1305/donna/poly1305_donna.h +0 -12
  535. package/ios/libsodium-stable/src/libsodium/crypto_onetimeauth/poly1305/donna/poly1305_donna32.h +0 -235
  536. package/ios/libsodium-stable/src/libsodium/crypto_onetimeauth/poly1305/donna/poly1305_donna64.h +0 -221
  537. package/ios/libsodium-stable/src/libsodium/crypto_onetimeauth/poly1305/onetimeauth_poly1305.c +0 -90
  538. package/ios/libsodium-stable/src/libsodium/crypto_onetimeauth/poly1305/onetimeauth_poly1305.h +0 -21
  539. package/ios/libsodium-stable/src/libsodium/crypto_onetimeauth/poly1305/sse2/poly1305_sse2.c +0 -957
  540. package/ios/libsodium-stable/src/libsodium/crypto_onetimeauth/poly1305/sse2/poly1305_sse2.h +0 -12
  541. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/argon2-core.c +0 -556
  542. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/argon2-core.h +0 -271
  543. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/argon2-encoding.c +0 -306
  544. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/argon2-encoding.h +0 -34
  545. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/argon2-fill-block-avx2.c +0 -243
  546. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/argon2-fill-block-avx512f.c +0 -251
  547. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/argon2-fill-block-ref.c +0 -234
  548. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/argon2-fill-block-ssse3.c +0 -244
  549. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/argon2.c +0 -283
  550. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/argon2.h +0 -305
  551. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/blake2b-long.c +0 -79
  552. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/blake2b-long.h +0 -8
  553. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/blamka-round-avx2.h +0 -150
  554. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/blamka-round-avx512f.h +0 -145
  555. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/blamka-round-ref.h +0 -40
  556. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/blamka-round-ssse3.h +0 -124
  557. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/pwhash_argon2i.c +0 -294
  558. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/argon2/pwhash_argon2id.c +0 -238
  559. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/crypto_pwhash.c +0 -212
  560. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/scryptsalsa208sha256/crypto_scrypt-common.c +0 -268
  561. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/scryptsalsa208sha256/crypto_scrypt.h +0 -92
  562. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/scryptsalsa208sha256/nosse/pwhash_scryptsalsa208sha256_nosse.c +0 -318
  563. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/scryptsalsa208sha256/pbkdf2-sha256.c +0 -96
  564. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/scryptsalsa208sha256/pbkdf2-sha256.h +0 -45
  565. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/scryptsalsa208sha256/pwhash_scryptsalsa208sha256.c +0 -301
  566. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/scryptsalsa208sha256/scrypt_platform.c +0 -112
  567. package/ios/libsodium-stable/src/libsodium/crypto_pwhash/scryptsalsa208sha256/sse/pwhash_scryptsalsa208sha256_sse.c +0 -406
  568. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/crypto_scalarmult.c +0 -33
  569. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/ref10/x25519_ref10.c +0 -182
  570. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/ref10/x25519_ref10.h +0 -10
  571. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/consts.S +0 -25
  572. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/consts_namespace.h +0 -20
  573. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/curve25519_sandy2x.c +0 -71
  574. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/curve25519_sandy2x.h +0 -9
  575. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/fe.h +0 -26
  576. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/fe51.h +0 -35
  577. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/fe51_invert.c +0 -58
  578. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/fe51_mul.S +0 -200
  579. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/fe51_namespace.h +0 -16
  580. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/fe51_nsquare.S +0 -174
  581. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/fe51_pack.S +0 -228
  582. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/fe_frombytes_sandy2x.c +0 -78
  583. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/ladder.S +0 -1442
  584. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/ladder.h +0 -18
  585. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/ladder_namespace.h +0 -8
  586. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/sandy2x/sandy2x.S +0 -16
  587. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/scalarmult_curve25519.c +0 -60
  588. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/curve25519/scalarmult_curve25519.h +0 -11
  589. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/ed25519/ref10/scalarmult_ed25519_ref10.c +0 -121
  590. package/ios/libsodium-stable/src/libsodium/crypto_scalarmult/ristretto255/ref10/scalarmult_ristretto255_ref10.c +0 -63
  591. package/ios/libsodium-stable/src/libsodium/crypto_secretbox/crypto_secretbox.c +0 -67
  592. package/ios/libsodium-stable/src/libsodium/crypto_secretbox/crypto_secretbox_easy.c +0 -145
  593. package/ios/libsodium-stable/src/libsodium/crypto_secretbox/xchacha20poly1305/secretbox_xchacha20poly1305.c +0 -177
  594. package/ios/libsodium-stable/src/libsodium/crypto_secretbox/xsalsa20poly1305/secretbox_xsalsa20poly1305.c +0 -89
  595. package/ios/libsodium-stable/src/libsodium/crypto_secretstream/xchacha20poly1305/secretstream_xchacha20poly1305.c +0 -313
  596. package/ios/libsodium-stable/src/libsodium/crypto_shorthash/crypto_shorthash.c +0 -34
  597. package/ios/libsodium-stable/src/libsodium/crypto_shorthash/siphash24/ref/shorthash_siphash24_ref.c +0 -71
  598. package/ios/libsodium-stable/src/libsodium/crypto_shorthash/siphash24/ref/shorthash_siphash_ref.h +0 -24
  599. package/ios/libsodium-stable/src/libsodium/crypto_shorthash/siphash24/ref/shorthash_siphashx24_ref.c +0 -77
  600. package/ios/libsodium-stable/src/libsodium/crypto_shorthash/siphash24/shorthash_siphash24.c +0 -11
  601. package/ios/libsodium-stable/src/libsodium/crypto_shorthash/siphash24/shorthash_siphashx24.c +0 -11
  602. package/ios/libsodium-stable/src/libsodium/crypto_sign/crypto_sign.c +0 -115
  603. package/ios/libsodium-stable/src/libsodium/crypto_sign/ed25519/ref10/keypair.c +0 -84
  604. package/ios/libsodium-stable/src/libsodium/crypto_sign/ed25519/ref10/obsolete.c +0 -118
  605. package/ios/libsodium-stable/src/libsodium/crypto_sign/ed25519/ref10/open.c +0 -98
  606. package/ios/libsodium-stable/src/libsodium/crypto_sign/ed25519/ref10/sign.c +0 -128
  607. package/ios/libsodium-stable/src/libsodium/crypto_sign/ed25519/ref10/sign_ed25519_ref10.h +0 -18
  608. package/ios/libsodium-stable/src/libsodium/crypto_sign/ed25519/sign_ed25519.c +0 -97
  609. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/dolbeau/chacha20_dolbeau-avx2.c +0 -180
  610. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/dolbeau/chacha20_dolbeau-avx2.h +0 -8
  611. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/dolbeau/chacha20_dolbeau-ssse3.c +0 -176
  612. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/dolbeau/chacha20_dolbeau-ssse3.h +0 -8
  613. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/dolbeau/u0.h +0 -86
  614. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/dolbeau/u1.h +0 -98
  615. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/dolbeau/u4.h +0 -177
  616. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/dolbeau/u8.h +0 -326
  617. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/ref/chacha20_ref.c +0 -312
  618. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/ref/chacha20_ref.h +0 -8
  619. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/stream_chacha20.c +0 -184
  620. package/ios/libsodium-stable/src/libsodium/crypto_stream/chacha20/stream_chacha20.h +0 -22
  621. package/ios/libsodium-stable/src/libsodium/crypto_stream/crypto_stream.c +0 -49
  622. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/ref/salsa20_ref.c +0 -120
  623. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/ref/salsa20_ref.h +0 -8
  624. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/stream_salsa20.c +0 -100
  625. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/stream_salsa20.h +0 -16
  626. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/xmm6/salsa20_xmm6-asm.S +0 -965
  627. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/xmm6/salsa20_xmm6.c +0 -31
  628. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/xmm6/salsa20_xmm6.h +0 -8
  629. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/xmm6int/salsa20_xmm6int-avx2.c +0 -134
  630. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/xmm6int/salsa20_xmm6int-avx2.h +0 -8
  631. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/xmm6int/salsa20_xmm6int-sse2.c +0 -128
  632. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/xmm6int/salsa20_xmm6int-sse2.h +0 -8
  633. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/xmm6int/u0.h +0 -195
  634. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/xmm6int/u1.h +0 -207
  635. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/xmm6int/u4.h +0 -547
  636. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa20/xmm6int/u8.h +0 -477
  637. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa2012/ref/stream_salsa2012_ref.c +0 -106
  638. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa2012/stream_salsa2012.c +0 -26
  639. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa208/ref/stream_salsa208_ref.c +0 -106
  640. package/ios/libsodium-stable/src/libsodium/crypto_stream/salsa208/stream_salsa208.c +0 -26
  641. package/ios/libsodium-stable/src/libsodium/crypto_stream/xchacha20/stream_xchacha20.c +0 -69
  642. package/ios/libsodium-stable/src/libsodium/crypto_stream/xsalsa20/stream_xsalsa20.c +0 -66
  643. package/ios/libsodium-stable/src/libsodium/crypto_verify/verify.c +0 -103
  644. package/ios/libsodium-stable/src/libsodium/include/Makefile.am +0 -76
  645. package/ios/libsodium-stable/src/libsodium/include/sodium/core.h +0 -28
  646. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_aead_aegis128l.h +0 -92
  647. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_aead_aegis256.h +0 -92
  648. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_aead_aes256gcm.h +0 -179
  649. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_aead_chacha20poly1305.h +0 -180
  650. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_aead_xchacha20poly1305.h +0 -100
  651. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_auth.h +0 -46
  652. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_auth_hmacsha256.h +0 -70
  653. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_auth_hmacsha512.h +0 -68
  654. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_auth_hmacsha512256.h +0 -65
  655. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_box.h +0 -177
  656. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_box_curve25519xchacha20poly1305.h +0 -164
  657. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_box_curve25519xsalsa20poly1305.h +0 -112
  658. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_core_ed25519.h +0 -100
  659. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_core_hchacha20.h +0 -36
  660. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_core_hsalsa20.h +0 -36
  661. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_core_ristretto255.h +0 -100
  662. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_core_salsa20.h +0 -36
  663. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_core_salsa2012.h +0 -36
  664. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_core_salsa208.h +0 -40
  665. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_generichash.h +0 -84
  666. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_generichash_blake2b.h +0 -122
  667. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_hash.h +0 -40
  668. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_hash_sha256.h +0 -60
  669. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_hash_sha512.h +0 -60
  670. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_kdf.h +0 -53
  671. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_kdf_blake2b.h +0 -44
  672. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_kdf_hkdf_sha256.h +0 -74
  673. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_kdf_hkdf_sha512.h +0 -75
  674. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_kx.h +0 -66
  675. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_onetimeauth.h +0 -65
  676. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_onetimeauth_poly1305.h +0 -72
  677. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_pwhash.h +0 -147
  678. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_pwhash_argon2i.h +0 -122
  679. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_pwhash_argon2id.h +0 -122
  680. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_pwhash_scryptsalsa208sha256.h +0 -120
  681. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_scalarmult.h +0 -46
  682. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_scalarmult_curve25519.h +0 -42
  683. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_scalarmult_ed25519.h +0 -51
  684. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_scalarmult_ristretto255.h +0 -43
  685. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_secretbox.h +0 -93
  686. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_secretbox_xchacha20poly1305.h +0 -70
  687. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_secretbox_xsalsa20poly1305.h +0 -69
  688. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_secretstream_xchacha20poly1305.h +0 -108
  689. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_shorthash.h +0 -41
  690. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_shorthash_siphash24.h +0 -50
  691. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_sign.h +0 -107
  692. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_sign_ed25519.h +0 -124
  693. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_sign_edwards25519sha512batch.h +0 -55
  694. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_stream.h +0 -59
  695. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_stream_chacha20.h +0 -106
  696. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_stream_salsa20.h +0 -61
  697. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_stream_salsa2012.h +0 -53
  698. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_stream_salsa208.h +0 -56
  699. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_stream_xchacha20.h +0 -61
  700. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_stream_xsalsa20.h +0 -61
  701. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_verify_16.h +0 -23
  702. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_verify_32.h +0 -23
  703. package/ios/libsodium-stable/src/libsodium/include/sodium/crypto_verify_64.h +0 -23
  704. package/ios/libsodium-stable/src/libsodium/include/sodium/export.h +0 -57
  705. package/ios/libsodium-stable/src/libsodium/include/sodium/private/asm_cet.h +0 -11
  706. package/ios/libsodium-stable/src/libsodium/include/sodium/private/chacha20_ietf_ext.h +0 -16
  707. package/ios/libsodium-stable/src/libsodium/include/sodium/private/common.h +0 -296
  708. package/ios/libsodium-stable/src/libsodium/include/sodium/private/ed25519_ref10.h +0 -142
  709. package/ios/libsodium-stable/src/libsodium/include/sodium/private/ed25519_ref10_fe_25_5.h +0 -1030
  710. package/ios/libsodium-stable/src/libsodium/include/sodium/private/ed25519_ref10_fe_51.h +0 -508
  711. package/ios/libsodium-stable/src/libsodium/include/sodium/private/implementations.h +0 -13
  712. package/ios/libsodium-stable/src/libsodium/include/sodium/private/mutex.h +0 -7
  713. package/ios/libsodium-stable/src/libsodium/include/sodium/private/softaes.h +0 -56
  714. package/ios/libsodium-stable/src/libsodium/include/sodium/private/sse2_64_32.h +0 -50
  715. package/ios/libsodium-stable/src/libsodium/include/sodium/randombytes.h +0 -72
  716. package/ios/libsodium-stable/src/libsodium/include/sodium/randombytes_internal_random.h +0 -22
  717. package/ios/libsodium-stable/src/libsodium/include/sodium/randombytes_sysrandom.h +0 -19
  718. package/ios/libsodium-stable/src/libsodium/include/sodium/runtime.h +0 -55
  719. package/ios/libsodium-stable/src/libsodium/include/sodium/utils.h +0 -179
  720. package/ios/libsodium-stable/src/libsodium/include/sodium/version.h.in +0 -33
  721. package/ios/libsodium-stable/src/libsodium/include/sodium.h +0 -75
  722. package/ios/libsodium-stable/src/libsodium/randombytes/internal/randombytes_internal_random.c +0 -648
  723. package/ios/libsodium-stable/src/libsodium/randombytes/randombytes.c +0 -200
  724. package/ios/libsodium-stable/src/libsodium/randombytes/sysrandom/randombytes_sysrandom.c +0 -396
  725. package/ios/libsodium-stable/src/libsodium/sodium/codecs.c +0 -335
  726. package/ios/libsodium-stable/src/libsodium/sodium/core.c +0 -216
  727. package/ios/libsodium-stable/src/libsodium/sodium/runtime.c +0 -391
  728. package/ios/libsodium-stable/src/libsodium/sodium/utils.c +0 -809
  729. package/ios/libsodium-stable/src/libsodium/sodium/version.c +0 -30
  730. package/ios/libsodium-stable/test/Makefile.am +0 -5
  731. package/ios/libsodium-stable/test/constcheck.sh +0 -22
  732. package/ios/libsodium-stable/test/default/Makefile.am +0 -525
  733. package/ios/libsodium-stable/test/default/aead_aegis128l.c +0 -642
  734. package/ios/libsodium-stable/test/default/aead_aegis128l.exp +0 -1
  735. package/ios/libsodium-stable/test/default/aead_aegis256.c +0 -723
  736. package/ios/libsodium-stable/test/default/aead_aegis256.exp +0 -1
  737. package/ios/libsodium-stable/test/default/aead_aes256gcm.c +0 -3328
  738. package/ios/libsodium-stable/test/default/aead_aes256gcm.exp +0 -1
  739. package/ios/libsodium-stable/test/default/aead_aes256gcm2.c +0 -276
  740. package/ios/libsodium-stable/test/default/aead_aes256gcm2.exp +0 -1
  741. package/ios/libsodium-stable/test/default/aead_chacha20poly1305.c +0 -372
  742. package/ios/libsodium-stable/test/default/aead_chacha20poly1305.exp +0 -63
  743. package/ios/libsodium-stable/test/default/aead_chacha20poly13052.c +0 -1046
  744. package/ios/libsodium-stable/test/default/aead_chacha20poly13052.exp +0 -1
  745. package/ios/libsodium-stable/test/default/aead_xchacha20poly1305.c +0 -203
  746. package/ios/libsodium-stable/test/default/aead_xchacha20poly1305.exp +0 -51
  747. package/ios/libsodium-stable/test/default/auth.c +0 -141
  748. package/ios/libsodium-stable/test/default/auth.exp +0 -30
  749. package/ios/libsodium-stable/test/default/auth2.c +0 -34
  750. package/ios/libsodium-stable/test/default/auth2.exp +0 -4
  751. package/ios/libsodium-stable/test/default/auth3.c +0 -36
  752. package/ios/libsodium-stable/test/default/auth3.exp +0 -1
  753. package/ios/libsodium-stable/test/default/auth5.c +0 -41
  754. package/ios/libsodium-stable/test/default/auth5.exp +0 -0
  755. package/ios/libsodium-stable/test/default/auth6.c +0 -23
  756. package/ios/libsodium-stable/test/default/auth6.exp +0 -8
  757. package/ios/libsodium-stable/test/default/auth7.c +0 -41
  758. package/ios/libsodium-stable/test/default/auth7.exp +0 -0
  759. package/ios/libsodium-stable/test/default/box.c +0 -112
  760. package/ios/libsodium-stable/test/default/box.exp +0 -38
  761. package/ios/libsodium-stable/test/default/box2.c +0 -80
  762. package/ios/libsodium-stable/test/default/box2.exp +0 -34
  763. package/ios/libsodium-stable/test/default/box7.c +0 -50
  764. package/ios/libsodium-stable/test/default/box7.exp +0 -0
  765. package/ios/libsodium-stable/test/default/box8.c +0 -58
  766. package/ios/libsodium-stable/test/default/box8.exp +0 -0
  767. package/ios/libsodium-stable/test/default/box_easy.c +0 -72
  768. package/ios/libsodium-stable/test/default/box_easy.exp +0 -3
  769. package/ios/libsodium-stable/test/default/box_easy2.c +0 -149
  770. package/ios/libsodium-stable/test/default/box_easy2.exp +0 -7
  771. package/ios/libsodium-stable/test/default/box_seal.c +0 -165
  772. package/ios/libsodium-stable/test/default/box_seal.exp +0 -8
  773. package/ios/libsodium-stable/test/default/box_seed.c +0 -30
  774. package/ios/libsodium-stable/test/default/box_seed.exp +0 -8
  775. package/ios/libsodium-stable/test/default/chacha20.c +0 -186
  776. package/ios/libsodium-stable/test/default/chacha20.exp +0 -64
  777. package/ios/libsodium-stable/test/default/cmptest.h +0 -238
  778. package/ios/libsodium-stable/test/default/codecs.c +0 -251
  779. package/ios/libsodium-stable/test/default/codecs.exp +0 -30
  780. package/ios/libsodium-stable/test/default/core1.c +0 -41
  781. package/ios/libsodium-stable/test/default/core1.exp +0 -4
  782. package/ios/libsodium-stable/test/default/core2.c +0 -38
  783. package/ios/libsodium-stable/test/default/core2.exp +0 -4
  784. package/ios/libsodium-stable/test/default/core3.c +0 -115
  785. package/ios/libsodium-stable/test/default/core3.exp +0 -3
  786. package/ios/libsodium-stable/test/default/core4.c +0 -36
  787. package/ios/libsodium-stable/test/default/core4.exp +0 -8
  788. package/ios/libsodium-stable/test/default/core5.c +0 -33
  789. package/ios/libsodium-stable/test/default/core5.exp +0 -4
  790. package/ios/libsodium-stable/test/default/core6.c +0 -52
  791. package/ios/libsodium-stable/test/default/core6.exp +0 -4
  792. package/ios/libsodium-stable/test/default/core_ed25519.c +0 -545
  793. package/ios/libsodium-stable/test/default/core_ed25519.exp +0 -55
  794. package/ios/libsodium-stable/test/default/core_ristretto255.c +0 -271
  795. package/ios/libsodium-stable/test/default/core_ristretto255.exp +0 -8
  796. package/ios/libsodium-stable/test/default/ed25519_convert.c +0 -70
  797. package/ios/libsodium-stable/test/default/ed25519_convert.exp +0 -3
  798. package/ios/libsodium-stable/test/default/generichash.c +0 -1406
  799. package/ios/libsodium-stable/test/default/generichash.exp +0 -65
  800. package/ios/libsodium-stable/test/default/generichash2.c +0 -62
  801. package/ios/libsodium-stable/test/default/generichash2.exp +0 -64
  802. package/ios/libsodium-stable/test/default/generichash3.c +0 -176
  803. package/ios/libsodium-stable/test/default/generichash3.exp +0 -75
  804. package/ios/libsodium-stable/test/default/hash.c +0 -47
  805. package/ios/libsodium-stable/test/default/hash.exp +0 -4
  806. package/ios/libsodium-stable/test/default/hash3.c +0 -20
  807. package/ios/libsodium-stable/test/default/hash3.exp +0 -1
  808. package/ios/libsodium-stable/test/default/index.html.tpl +0 -98
  809. package/ios/libsodium-stable/test/default/kdf.c +0 -71
  810. package/ios/libsodium-stable/test/default/kdf.exp +0 -77
  811. package/ios/libsodium-stable/test/default/kdf_hkdf.c +0 -102
  812. package/ios/libsodium-stable/test/default/kdf_hkdf.exp +0 -205
  813. package/ios/libsodium-stable/test/default/keygen.c +0 -67
  814. package/ios/libsodium-stable/test/default/keygen.exp +0 -1
  815. package/ios/libsodium-stable/test/default/kx.c +0 -149
  816. package/ios/libsodium-stable/test/default/kx.exp +0 -7
  817. package/ios/libsodium-stable/test/default/metamorphic.c +0 -187
  818. package/ios/libsodium-stable/test/default/metamorphic.exp +0 -1
  819. package/ios/libsodium-stable/test/default/misuse.c +0 -187
  820. package/ios/libsodium-stable/test/default/misuse.exp +0 -0
  821. package/ios/libsodium-stable/test/default/onetimeauth.c +0 -63
  822. package/ios/libsodium-stable/test/default/onetimeauth.exp +0 -4
  823. package/ios/libsodium-stable/test/default/onetimeauth2.c +0 -33
  824. package/ios/libsodium-stable/test/default/onetimeauth2.exp +0 -1
  825. package/ios/libsodium-stable/test/default/onetimeauth7.c +0 -36
  826. package/ios/libsodium-stable/test/default/onetimeauth7.exp +0 -0
  827. package/ios/libsodium-stable/test/default/pre.js.inc +0 -22
  828. package/ios/libsodium-stable/test/default/pwhash_argon2i.c +0 -467
  829. package/ios/libsodium-stable/test/default/pwhash_argon2i.exp +0 -11
  830. package/ios/libsodium-stable/test/default/pwhash_argon2id.c +0 -517
  831. package/ios/libsodium-stable/test/default/pwhash_argon2id.exp +0 -14
  832. package/ios/libsodium-stable/test/default/pwhash_scrypt.c +0 -393
  833. package/ios/libsodium-stable/test/default/pwhash_scrypt.exp +0 -37
  834. package/ios/libsodium-stable/test/default/pwhash_scrypt_ll.c +0 -59
  835. package/ios/libsodium-stable/test/default/pwhash_scrypt_ll.exp +0 -15
  836. package/ios/libsodium-stable/test/default/randombytes.c +0 -164
  837. package/ios/libsodium-stable/test/default/randombytes.exp +0 -2
  838. package/ios/libsodium-stable/test/default/run.sh +0 -9
  839. package/ios/libsodium-stable/test/default/scalarmult.c +0 -77
  840. package/ios/libsodium-stable/test/default/scalarmult.exp +0 -5
  841. package/ios/libsodium-stable/test/default/scalarmult2.c +0 -22
  842. package/ios/libsodium-stable/test/default/scalarmult2.exp +0 -1
  843. package/ios/libsodium-stable/test/default/scalarmult5.c +0 -30
  844. package/ios/libsodium-stable/test/default/scalarmult5.exp +0 -1
  845. package/ios/libsodium-stable/test/default/scalarmult6.c +0 -54
  846. package/ios/libsodium-stable/test/default/scalarmult6.exp +0 -4
  847. package/ios/libsodium-stable/test/default/scalarmult7.c +0 -34
  848. package/ios/libsodium-stable/test/default/scalarmult7.exp +0 -1
  849. package/ios/libsodium-stable/test/default/scalarmult8.c +0 -580
  850. package/ios/libsodium-stable/test/default/scalarmult8.exp +0 -65
  851. package/ios/libsodium-stable/test/default/scalarmult_ed25519.c +0 -134
  852. package/ios/libsodium-stable/test/default/scalarmult_ed25519.exp +0 -1
  853. package/ios/libsodium-stable/test/default/scalarmult_ristretto255.c +0 -51
  854. package/ios/libsodium-stable/test/default/scalarmult_ristretto255.exp +0 -18
  855. package/ios/libsodium-stable/test/default/secretbox.c +0 -84
  856. package/ios/libsodium-stable/test/default/secretbox.exp +0 -38
  857. package/ios/libsodium-stable/test/default/secretbox2.c +0 -55
  858. package/ios/libsodium-stable/test/default/secretbox2.exp +0 -17
  859. package/ios/libsodium-stable/test/default/secretbox7.c +0 -36
  860. package/ios/libsodium-stable/test/default/secretbox7.exp +0 -0
  861. package/ios/libsodium-stable/test/default/secretbox8.c +0 -41
  862. package/ios/libsodium-stable/test/default/secretbox8.exp +0 -0
  863. package/ios/libsodium-stable/test/default/secretbox_easy.c +0 -124
  864. package/ios/libsodium-stable/test/default/secretbox_easy.exp +0 -9
  865. package/ios/libsodium-stable/test/default/secretbox_easy2.c +0 -72
  866. package/ios/libsodium-stable/test/default/secretbox_easy2.exp +0 -5
  867. package/ios/libsodium-stable/test/default/secretstream_xchacha20poly1305.c +0 -329
  868. package/ios/libsodium-stable/test/default/secretstream_xchacha20poly1305.exp +0 -1
  869. package/ios/libsodium-stable/test/default/shorthash.c +0 -35
  870. package/ios/libsodium-stable/test/default/shorthash.exp +0 -64
  871. package/ios/libsodium-stable/test/default/sign.c +0 -1324
  872. package/ios/libsodium-stable/test/default/sign.exp +0 -5
  873. package/ios/libsodium-stable/test/default/siphashx24.c +0 -33
  874. package/ios/libsodium-stable/test/default/siphashx24.exp +0 -64
  875. package/ios/libsodium-stable/test/default/sodium_core.c +0 -43
  876. package/ios/libsodium-stable/test/default/sodium_core.exp +0 -1
  877. package/ios/libsodium-stable/test/default/sodium_utils.c +0 -224
  878. package/ios/libsodium-stable/test/default/sodium_utils.exp +0 -25
  879. package/ios/libsodium-stable/test/default/sodium_utils2.c +0 -120
  880. package/ios/libsodium-stable/test/default/sodium_utils2.exp +0 -3
  881. package/ios/libsodium-stable/test/default/sodium_utils3.c +0 -90
  882. package/ios/libsodium-stable/test/default/sodium_utils3.exp +0 -2
  883. package/ios/libsodium-stable/test/default/sodium_version.c +0 -18
  884. package/ios/libsodium-stable/test/default/sodium_version.exp +0 -3
  885. package/ios/libsodium-stable/test/default/stream.c +0 -84
  886. package/ios/libsodium-stable/test/default/stream.exp +0 -83
  887. package/ios/libsodium-stable/test/default/stream2.c +0 -59
  888. package/ios/libsodium-stable/test/default/stream2.exp +0 -2
  889. package/ios/libsodium-stable/test/default/stream3.c +0 -32
  890. package/ios/libsodium-stable/test/default/stream3.exp +0 -4
  891. package/ios/libsodium-stable/test/default/stream4.c +0 -51
  892. package/ios/libsodium-stable/test/default/stream4.exp +0 -17
  893. package/ios/libsodium-stable/test/default/verify1.c +0 -76
  894. package/ios/libsodium-stable/test/default/verify1.exp +0 -2
  895. package/ios/libsodium-stable/test/default/wasi-test-wrapper.sh +0 -98
  896. package/ios/libsodium-stable/test/default/wintest.bat +0 -61
  897. package/ios/libsodium-stable/test/default/xchacha20.c +0 -428
  898. package/ios/libsodium-stable/test/default/xchacha20.exp +0 -5
  899. package/ios/libsodium-stable/test/quirks/quirks.h +0 -34
@@ -0,0 +1,1388 @@
1
+ #include "blake3_impl.h"
2
+
3
+ #include <immintrin.h>
4
+
5
/*
 * Two-source shuffle of 32-bit lanes for integer vectors. Both operands are
 * reinterpreted as float vectors so that _mm_shuffle_ps can be used, and the
 * result is reinterpreted back as an integer vector. `imm` is the shuffle
 * control and must be a compile-time constant (e.g. an _MM_SHUFFLE value).
 */
#define _mm_shuffle_ps2(lo, hi, imm)                                           \
  (_mm_castps_si128(                                                           \
      _mm_shuffle_ps(_mm_castsi128_ps(lo), _mm_castsi128_ps(hi), (imm))))
8
+
9
+ INLINE __m128i loadu_128(const uint8_t src[16]) {
10
+ return _mm_loadu_si128((void*)src);
11
+ }
12
+
13
+ INLINE __m256i loadu_256(const uint8_t src[32]) {
14
+ return _mm256_loadu_si256((void*)src);
15
+ }
16
+
17
+ INLINE __m512i loadu_512(const uint8_t src[64]) {
18
+ return _mm512_loadu_si512((void*)src);
19
+ }
20
+
21
+ INLINE void storeu_128(__m128i src, uint8_t dest[16]) {
22
+ _mm_storeu_si128((void*)dest, src);
23
+ }
24
+
25
+ INLINE void storeu_256(__m256i src, uint8_t dest[16]) {
26
+ _mm256_storeu_si256((void*)dest, src);
27
+ }
28
+
29
+ INLINE void storeu_512(__m512i src, uint8_t dest[16]) {
30
+ _mm512_storeu_si512((void*)dest, src);
31
+ }
32
+
33
+ INLINE __m128i add_128(__m128i a, __m128i b) { return _mm_add_epi32(a, b); }
34
+
35
+ INLINE __m256i add_256(__m256i a, __m256i b) { return _mm256_add_epi32(a, b); }
36
+
37
+ INLINE __m512i add_512(__m512i a, __m512i b) { return _mm512_add_epi32(a, b); }
38
+
39
+ INLINE __m128i xor_128(__m128i a, __m128i b) { return _mm_xor_si128(a, b); }
40
+
41
+ INLINE __m256i xor_256(__m256i a, __m256i b) { return _mm256_xor_si256(a, b); }
42
+
43
+ INLINE __m512i xor_512(__m512i a, __m512i b) { return _mm512_xor_si512(a, b); }
44
+
45
+ INLINE __m128i set1_128(uint32_t x) { return _mm_set1_epi32((int32_t)x); }
46
+
47
+ INLINE __m256i set1_256(uint32_t x) { return _mm256_set1_epi32((int32_t)x); }
48
+
49
+ INLINE __m512i set1_512(uint32_t x) { return _mm512_set1_epi32((int32_t)x); }
50
+
51
+ INLINE __m128i set4(uint32_t a, uint32_t b, uint32_t c, uint32_t d) {
52
+ return _mm_setr_epi32((int32_t)a, (int32_t)b, (int32_t)c, (int32_t)d);
53
+ }
54
+
55
+ INLINE __m128i rot16_128(__m128i x) { return _mm_ror_epi32(x, 16); }
56
+
57
+ INLINE __m256i rot16_256(__m256i x) { return _mm256_ror_epi32(x, 16); }
58
+
59
+ INLINE __m512i rot16_512(__m512i x) { return _mm512_ror_epi32(x, 16); }
60
+
61
+ INLINE __m128i rot12_128(__m128i x) { return _mm_ror_epi32(x, 12); }
62
+
63
+ INLINE __m256i rot12_256(__m256i x) { return _mm256_ror_epi32(x, 12); }
64
+
65
+ INLINE __m512i rot12_512(__m512i x) { return _mm512_ror_epi32(x, 12); }
66
+
67
+ INLINE __m128i rot8_128(__m128i x) { return _mm_ror_epi32(x, 8); }
68
+
69
+ INLINE __m256i rot8_256(__m256i x) { return _mm256_ror_epi32(x, 8); }
70
+
71
+ INLINE __m512i rot8_512(__m512i x) { return _mm512_ror_epi32(x, 8); }
72
+
73
+ INLINE __m128i rot7_128(__m128i x) { return _mm_ror_epi32(x, 7); }
74
+
75
+ INLINE __m256i rot7_256(__m256i x) { return _mm256_ror_epi32(x, 7); }
76
+
77
+ INLINE __m512i rot7_512(__m512i x) { return _mm512_ror_epi32(x, 7); }
78
+
79
+ /*
80
+ * ----------------------------------------------------------------------------
81
+ * compress_avx512
82
+ * ----------------------------------------------------------------------------
83
+ */
84
+
85
+ INLINE void g1(__m128i *row0, __m128i *row1, __m128i *row2, __m128i *row3,
86
+ __m128i m) {
87
+ *row0 = add_128(add_128(*row0, m), *row1);
88
+ *row3 = xor_128(*row3, *row0);
89
+ *row3 = rot16_128(*row3);
90
+ *row2 = add_128(*row2, *row3);
91
+ *row1 = xor_128(*row1, *row2);
92
+ *row1 = rot12_128(*row1);
93
+ }
94
+
95
+ INLINE void g2(__m128i *row0, __m128i *row1, __m128i *row2, __m128i *row3,
96
+ __m128i m) {
97
+ *row0 = add_128(add_128(*row0, m), *row1);
98
+ *row3 = xor_128(*row3, *row0);
99
+ *row3 = rot8_128(*row3);
100
+ *row2 = add_128(*row2, *row3);
101
+ *row1 = xor_128(*row1, *row2);
102
+ *row1 = rot7_128(*row1);
103
+ }
104
+
105
+ // Note the optimization here of leaving row1 as the unrotated row, rather than
106
+ // row0. All the message loads below are adjusted to compensate for this. See
107
+ // discussion at https://github.com/sneves/blake2-avx2/pull/4
108
+ INLINE void diagonalize(__m128i *row0, __m128i *row2, __m128i *row3) {
109
+ *row0 = _mm_shuffle_epi32(*row0, _MM_SHUFFLE(2, 1, 0, 3));
110
+ *row3 = _mm_shuffle_epi32(*row3, _MM_SHUFFLE(1, 0, 3, 2));
111
+ *row2 = _mm_shuffle_epi32(*row2, _MM_SHUFFLE(0, 3, 2, 1));
112
+ }
113
+
114
+ INLINE void undiagonalize(__m128i *row0, __m128i *row2, __m128i *row3) {
115
+ *row0 = _mm_shuffle_epi32(*row0, _MM_SHUFFLE(0, 3, 2, 1));
116
+ *row3 = _mm_shuffle_epi32(*row3, _MM_SHUFFLE(1, 0, 3, 2));
117
+ *row2 = _mm_shuffle_epi32(*row2, _MM_SHUFFLE(2, 1, 0, 3));
118
+ }
119
+
120
+ INLINE void compress_pre(__m128i rows[4], const uint32_t cv[8],
121
+ const uint8_t block[BLAKE3_BLOCK_LEN],
122
+ uint8_t block_len, uint64_t counter, uint8_t flags) {
123
+ rows[0] = loadu_128((uint8_t *)&cv[0]);
124
+ rows[1] = loadu_128((uint8_t *)&cv[4]);
125
+ rows[2] = set4(IV[0], IV[1], IV[2], IV[3]);
126
+ rows[3] = set4(counter_low(counter), counter_high(counter),
127
+ (uint32_t)block_len, (uint32_t)flags);
128
+
129
+ __m128i m0 = loadu_128(&block[sizeof(__m128i) * 0]);
130
+ __m128i m1 = loadu_128(&block[sizeof(__m128i) * 1]);
131
+ __m128i m2 = loadu_128(&block[sizeof(__m128i) * 2]);
132
+ __m128i m3 = loadu_128(&block[sizeof(__m128i) * 3]);
133
+
134
+ __m128i t0, t1, t2, t3, tt;
135
+
136
+ // Round 1. The first round permutes the message words from the original
137
+ // input order, into the groups that get mixed in parallel.
138
+ t0 = _mm_shuffle_ps2(m0, m1, _MM_SHUFFLE(2, 0, 2, 0)); // 6 4 2 0
139
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t0);
140
+ t1 = _mm_shuffle_ps2(m0, m1, _MM_SHUFFLE(3, 1, 3, 1)); // 7 5 3 1
141
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t1);
142
+ diagonalize(&rows[0], &rows[2], &rows[3]);
143
+ t2 = _mm_shuffle_ps2(m2, m3, _MM_SHUFFLE(2, 0, 2, 0)); // 14 12 10 8
144
+ t2 = _mm_shuffle_epi32(t2, _MM_SHUFFLE(2, 1, 0, 3)); // 12 10 8 14
145
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t2);
146
+ t3 = _mm_shuffle_ps2(m2, m3, _MM_SHUFFLE(3, 1, 3, 1)); // 15 13 11 9
147
+ t3 = _mm_shuffle_epi32(t3, _MM_SHUFFLE(2, 1, 0, 3)); // 13 11 9 15
148
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t3);
149
+ undiagonalize(&rows[0], &rows[2], &rows[3]);
150
+ m0 = t0;
151
+ m1 = t1;
152
+ m2 = t2;
153
+ m3 = t3;
154
+
155
+ // Round 2. This round and all following rounds apply a fixed permutation
156
+ // to the message words from the round before.
157
+ t0 = _mm_shuffle_ps2(m0, m1, _MM_SHUFFLE(3, 1, 1, 2));
158
+ t0 = _mm_shuffle_epi32(t0, _MM_SHUFFLE(0, 3, 2, 1));
159
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t0);
160
+ t1 = _mm_shuffle_ps2(m2, m3, _MM_SHUFFLE(3, 3, 2, 2));
161
+ tt = _mm_shuffle_epi32(m0, _MM_SHUFFLE(0, 0, 3, 3));
162
+ t1 = _mm_blend_epi16(tt, t1, 0xCC);
163
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t1);
164
+ diagonalize(&rows[0], &rows[2], &rows[3]);
165
+ t2 = _mm_unpacklo_epi64(m3, m1);
166
+ tt = _mm_blend_epi16(t2, m2, 0xC0);
167
+ t2 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(1, 3, 2, 0));
168
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t2);
169
+ t3 = _mm_unpackhi_epi32(m1, m3);
170
+ tt = _mm_unpacklo_epi32(m2, t3);
171
+ t3 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(0, 1, 3, 2));
172
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t3);
173
+ undiagonalize(&rows[0], &rows[2], &rows[3]);
174
+ m0 = t0;
175
+ m1 = t1;
176
+ m2 = t2;
177
+ m3 = t3;
178
+
179
+ // Round 3
180
+ t0 = _mm_shuffle_ps2(m0, m1, _MM_SHUFFLE(3, 1, 1, 2));
181
+ t0 = _mm_shuffle_epi32(t0, _MM_SHUFFLE(0, 3, 2, 1));
182
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t0);
183
+ t1 = _mm_shuffle_ps2(m2, m3, _MM_SHUFFLE(3, 3, 2, 2));
184
+ tt = _mm_shuffle_epi32(m0, _MM_SHUFFLE(0, 0, 3, 3));
185
+ t1 = _mm_blend_epi16(tt, t1, 0xCC);
186
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t1);
187
+ diagonalize(&rows[0], &rows[2], &rows[3]);
188
+ t2 = _mm_unpacklo_epi64(m3, m1);
189
+ tt = _mm_blend_epi16(t2, m2, 0xC0);
190
+ t2 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(1, 3, 2, 0));
191
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t2);
192
+ t3 = _mm_unpackhi_epi32(m1, m3);
193
+ tt = _mm_unpacklo_epi32(m2, t3);
194
+ t3 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(0, 1, 3, 2));
195
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t3);
196
+ undiagonalize(&rows[0], &rows[2], &rows[3]);
197
+ m0 = t0;
198
+ m1 = t1;
199
+ m2 = t2;
200
+ m3 = t3;
201
+
202
+ // Round 4
203
+ t0 = _mm_shuffle_ps2(m0, m1, _MM_SHUFFLE(3, 1, 1, 2));
204
+ t0 = _mm_shuffle_epi32(t0, _MM_SHUFFLE(0, 3, 2, 1));
205
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t0);
206
+ t1 = _mm_shuffle_ps2(m2, m3, _MM_SHUFFLE(3, 3, 2, 2));
207
+ tt = _mm_shuffle_epi32(m0, _MM_SHUFFLE(0, 0, 3, 3));
208
+ t1 = _mm_blend_epi16(tt, t1, 0xCC);
209
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t1);
210
+ diagonalize(&rows[0], &rows[2], &rows[3]);
211
+ t2 = _mm_unpacklo_epi64(m3, m1);
212
+ tt = _mm_blend_epi16(t2, m2, 0xC0);
213
+ t2 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(1, 3, 2, 0));
214
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t2);
215
+ t3 = _mm_unpackhi_epi32(m1, m3);
216
+ tt = _mm_unpacklo_epi32(m2, t3);
217
+ t3 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(0, 1, 3, 2));
218
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t3);
219
+ undiagonalize(&rows[0], &rows[2], &rows[3]);
220
+ m0 = t0;
221
+ m1 = t1;
222
+ m2 = t2;
223
+ m3 = t3;
224
+
225
+ // Round 5
226
+ t0 = _mm_shuffle_ps2(m0, m1, _MM_SHUFFLE(3, 1, 1, 2));
227
+ t0 = _mm_shuffle_epi32(t0, _MM_SHUFFLE(0, 3, 2, 1));
228
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t0);
229
+ t1 = _mm_shuffle_ps2(m2, m3, _MM_SHUFFLE(3, 3, 2, 2));
230
+ tt = _mm_shuffle_epi32(m0, _MM_SHUFFLE(0, 0, 3, 3));
231
+ t1 = _mm_blend_epi16(tt, t1, 0xCC);
232
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t1);
233
+ diagonalize(&rows[0], &rows[2], &rows[3]);
234
+ t2 = _mm_unpacklo_epi64(m3, m1);
235
+ tt = _mm_blend_epi16(t2, m2, 0xC0);
236
+ t2 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(1, 3, 2, 0));
237
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t2);
238
+ t3 = _mm_unpackhi_epi32(m1, m3);
239
+ tt = _mm_unpacklo_epi32(m2, t3);
240
+ t3 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(0, 1, 3, 2));
241
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t3);
242
+ undiagonalize(&rows[0], &rows[2], &rows[3]);
243
+ m0 = t0;
244
+ m1 = t1;
245
+ m2 = t2;
246
+ m3 = t3;
247
+
248
+ // Round 6
249
+ t0 = _mm_shuffle_ps2(m0, m1, _MM_SHUFFLE(3, 1, 1, 2));
250
+ t0 = _mm_shuffle_epi32(t0, _MM_SHUFFLE(0, 3, 2, 1));
251
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t0);
252
+ t1 = _mm_shuffle_ps2(m2, m3, _MM_SHUFFLE(3, 3, 2, 2));
253
+ tt = _mm_shuffle_epi32(m0, _MM_SHUFFLE(0, 0, 3, 3));
254
+ t1 = _mm_blend_epi16(tt, t1, 0xCC);
255
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t1);
256
+ diagonalize(&rows[0], &rows[2], &rows[3]);
257
+ t2 = _mm_unpacklo_epi64(m3, m1);
258
+ tt = _mm_blend_epi16(t2, m2, 0xC0);
259
+ t2 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(1, 3, 2, 0));
260
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t2);
261
+ t3 = _mm_unpackhi_epi32(m1, m3);
262
+ tt = _mm_unpacklo_epi32(m2, t3);
263
+ t3 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(0, 1, 3, 2));
264
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t3);
265
+ undiagonalize(&rows[0], &rows[2], &rows[3]);
266
+ m0 = t0;
267
+ m1 = t1;
268
+ m2 = t2;
269
+ m3 = t3;
270
+
271
+ // Round 7
272
+ t0 = _mm_shuffle_ps2(m0, m1, _MM_SHUFFLE(3, 1, 1, 2));
273
+ t0 = _mm_shuffle_epi32(t0, _MM_SHUFFLE(0, 3, 2, 1));
274
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t0);
275
+ t1 = _mm_shuffle_ps2(m2, m3, _MM_SHUFFLE(3, 3, 2, 2));
276
+ tt = _mm_shuffle_epi32(m0, _MM_SHUFFLE(0, 0, 3, 3));
277
+ t1 = _mm_blend_epi16(tt, t1, 0xCC);
278
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t1);
279
+ diagonalize(&rows[0], &rows[2], &rows[3]);
280
+ t2 = _mm_unpacklo_epi64(m3, m1);
281
+ tt = _mm_blend_epi16(t2, m2, 0xC0);
282
+ t2 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(1, 3, 2, 0));
283
+ g1(&rows[0], &rows[1], &rows[2], &rows[3], t2);
284
+ t3 = _mm_unpackhi_epi32(m1, m3);
285
+ tt = _mm_unpacklo_epi32(m2, t3);
286
+ t3 = _mm_shuffle_epi32(tt, _MM_SHUFFLE(0, 1, 3, 2));
287
+ g2(&rows[0], &rows[1], &rows[2], &rows[3], t3);
288
+ undiagonalize(&rows[0], &rows[2], &rows[3]);
289
+ }
290
+
291
+ void blake3_compress_xof_avx512(const uint32_t cv[8],
292
+ const uint8_t block[BLAKE3_BLOCK_LEN],
293
+ uint8_t block_len, uint64_t counter,
294
+ uint8_t flags, uint8_t out[64]) {
295
+ __m128i rows[4];
296
+ compress_pre(rows, cv, block, block_len, counter, flags);
297
+ storeu_128(xor_128(rows[0], rows[2]), &out[0]);
298
+ storeu_128(xor_128(rows[1], rows[3]), &out[16]);
299
+ storeu_128(xor_128(rows[2], loadu_128((uint8_t *)&cv[0])), &out[32]);
300
+ storeu_128(xor_128(rows[3], loadu_128((uint8_t *)&cv[4])), &out[48]);
301
+ }
302
+
303
+ void blake3_compress_in_place_avx512(uint32_t cv[8],
304
+ const uint8_t block[BLAKE3_BLOCK_LEN],
305
+ uint8_t block_len, uint64_t counter,
306
+ uint8_t flags) {
307
+ __m128i rows[4];
308
+ compress_pre(rows, cv, block, block_len, counter, flags);
309
+ storeu_128(xor_128(rows[0], rows[2]), (uint8_t *)&cv[0]);
310
+ storeu_128(xor_128(rows[1], rows[3]), (uint8_t *)&cv[4]);
311
+ }
312
+
313
+ /*
314
+ * ----------------------------------------------------------------------------
315
+ * hash4_avx512
316
+ * ----------------------------------------------------------------------------
317
+ */
318
+
319
+ INLINE void round_fn4(__m128i v[16], __m128i m[16], size_t r) {
320
+ v[0] = add_128(v[0], m[(size_t)MSG_SCHEDULE[r][0]]);
321
+ v[1] = add_128(v[1], m[(size_t)MSG_SCHEDULE[r][2]]);
322
+ v[2] = add_128(v[2], m[(size_t)MSG_SCHEDULE[r][4]]);
323
+ v[3] = add_128(v[3], m[(size_t)MSG_SCHEDULE[r][6]]);
324
+ v[0] = add_128(v[0], v[4]);
325
+ v[1] = add_128(v[1], v[5]);
326
+ v[2] = add_128(v[2], v[6]);
327
+ v[3] = add_128(v[3], v[7]);
328
+ v[12] = xor_128(v[12], v[0]);
329
+ v[13] = xor_128(v[13], v[1]);
330
+ v[14] = xor_128(v[14], v[2]);
331
+ v[15] = xor_128(v[15], v[3]);
332
+ v[12] = rot16_128(v[12]);
333
+ v[13] = rot16_128(v[13]);
334
+ v[14] = rot16_128(v[14]);
335
+ v[15] = rot16_128(v[15]);
336
+ v[8] = add_128(v[8], v[12]);
337
+ v[9] = add_128(v[9], v[13]);
338
+ v[10] = add_128(v[10], v[14]);
339
+ v[11] = add_128(v[11], v[15]);
340
+ v[4] = xor_128(v[4], v[8]);
341
+ v[5] = xor_128(v[5], v[9]);
342
+ v[6] = xor_128(v[6], v[10]);
343
+ v[7] = xor_128(v[7], v[11]);
344
+ v[4] = rot12_128(v[4]);
345
+ v[5] = rot12_128(v[5]);
346
+ v[6] = rot12_128(v[6]);
347
+ v[7] = rot12_128(v[7]);
348
+ v[0] = add_128(v[0], m[(size_t)MSG_SCHEDULE[r][1]]);
349
+ v[1] = add_128(v[1], m[(size_t)MSG_SCHEDULE[r][3]]);
350
+ v[2] = add_128(v[2], m[(size_t)MSG_SCHEDULE[r][5]]);
351
+ v[3] = add_128(v[3], m[(size_t)MSG_SCHEDULE[r][7]]);
352
+ v[0] = add_128(v[0], v[4]);
353
+ v[1] = add_128(v[1], v[5]);
354
+ v[2] = add_128(v[2], v[6]);
355
+ v[3] = add_128(v[3], v[7]);
356
+ v[12] = xor_128(v[12], v[0]);
357
+ v[13] = xor_128(v[13], v[1]);
358
+ v[14] = xor_128(v[14], v[2]);
359
+ v[15] = xor_128(v[15], v[3]);
360
+ v[12] = rot8_128(v[12]);
361
+ v[13] = rot8_128(v[13]);
362
+ v[14] = rot8_128(v[14]);
363
+ v[15] = rot8_128(v[15]);
364
+ v[8] = add_128(v[8], v[12]);
365
+ v[9] = add_128(v[9], v[13]);
366
+ v[10] = add_128(v[10], v[14]);
367
+ v[11] = add_128(v[11], v[15]);
368
+ v[4] = xor_128(v[4], v[8]);
369
+ v[5] = xor_128(v[5], v[9]);
370
+ v[6] = xor_128(v[6], v[10]);
371
+ v[7] = xor_128(v[7], v[11]);
372
+ v[4] = rot7_128(v[4]);
373
+ v[5] = rot7_128(v[5]);
374
+ v[6] = rot7_128(v[6]);
375
+ v[7] = rot7_128(v[7]);
376
+
377
+ v[0] = add_128(v[0], m[(size_t)MSG_SCHEDULE[r][8]]);
378
+ v[1] = add_128(v[1], m[(size_t)MSG_SCHEDULE[r][10]]);
379
+ v[2] = add_128(v[2], m[(size_t)MSG_SCHEDULE[r][12]]);
380
+ v[3] = add_128(v[3], m[(size_t)MSG_SCHEDULE[r][14]]);
381
+ v[0] = add_128(v[0], v[5]);
382
+ v[1] = add_128(v[1], v[6]);
383
+ v[2] = add_128(v[2], v[7]);
384
+ v[3] = add_128(v[3], v[4]);
385
+ v[15] = xor_128(v[15], v[0]);
386
+ v[12] = xor_128(v[12], v[1]);
387
+ v[13] = xor_128(v[13], v[2]);
388
+ v[14] = xor_128(v[14], v[3]);
389
+ v[15] = rot16_128(v[15]);
390
+ v[12] = rot16_128(v[12]);
391
+ v[13] = rot16_128(v[13]);
392
+ v[14] = rot16_128(v[14]);
393
+ v[10] = add_128(v[10], v[15]);
394
+ v[11] = add_128(v[11], v[12]);
395
+ v[8] = add_128(v[8], v[13]);
396
+ v[9] = add_128(v[9], v[14]);
397
+ v[5] = xor_128(v[5], v[10]);
398
+ v[6] = xor_128(v[6], v[11]);
399
+ v[7] = xor_128(v[7], v[8]);
400
+ v[4] = xor_128(v[4], v[9]);
401
+ v[5] = rot12_128(v[5]);
402
+ v[6] = rot12_128(v[6]);
403
+ v[7] = rot12_128(v[7]);
404
+ v[4] = rot12_128(v[4]);
405
+ v[0] = add_128(v[0], m[(size_t)MSG_SCHEDULE[r][9]]);
406
+ v[1] = add_128(v[1], m[(size_t)MSG_SCHEDULE[r][11]]);
407
+ v[2] = add_128(v[2], m[(size_t)MSG_SCHEDULE[r][13]]);
408
+ v[3] = add_128(v[3], m[(size_t)MSG_SCHEDULE[r][15]]);
409
+ v[0] = add_128(v[0], v[5]);
410
+ v[1] = add_128(v[1], v[6]);
411
+ v[2] = add_128(v[2], v[7]);
412
+ v[3] = add_128(v[3], v[4]);
413
+ v[15] = xor_128(v[15], v[0]);
414
+ v[12] = xor_128(v[12], v[1]);
415
+ v[13] = xor_128(v[13], v[2]);
416
+ v[14] = xor_128(v[14], v[3]);
417
+ v[15] = rot8_128(v[15]);
418
+ v[12] = rot8_128(v[12]);
419
+ v[13] = rot8_128(v[13]);
420
+ v[14] = rot8_128(v[14]);
421
+ v[10] = add_128(v[10], v[15]);
422
+ v[11] = add_128(v[11], v[12]);
423
+ v[8] = add_128(v[8], v[13]);
424
+ v[9] = add_128(v[9], v[14]);
425
+ v[5] = xor_128(v[5], v[10]);
426
+ v[6] = xor_128(v[6], v[11]);
427
+ v[7] = xor_128(v[7], v[8]);
428
+ v[4] = xor_128(v[4], v[9]);
429
+ v[5] = rot7_128(v[5]);
430
+ v[6] = rot7_128(v[6]);
431
+ v[7] = rot7_128(v[7]);
432
+ v[4] = rot7_128(v[4]);
433
+ }
434
+
435
+ INLINE void transpose_vecs_128(__m128i vecs[4]) {
436
+ // Interleave 32-bit lanes. The low unpack is lanes 00/11 and the high is
437
+ // 22/33. Note that this doesn't split the vector into two lanes, as the
438
+ // AVX2 counterparts do.
439
+ __m128i ab_01 = _mm_unpacklo_epi32(vecs[0], vecs[1]);
440
+ __m128i ab_23 = _mm_unpackhi_epi32(vecs[0], vecs[1]);
441
+ __m128i cd_01 = _mm_unpacklo_epi32(vecs[2], vecs[3]);
442
+ __m128i cd_23 = _mm_unpackhi_epi32(vecs[2], vecs[3]);
443
+
444
+ // Interleave 64-bit lanes.
445
+ __m128i abcd_0 = _mm_unpacklo_epi64(ab_01, cd_01);
446
+ __m128i abcd_1 = _mm_unpackhi_epi64(ab_01, cd_01);
447
+ __m128i abcd_2 = _mm_unpacklo_epi64(ab_23, cd_23);
448
+ __m128i abcd_3 = _mm_unpackhi_epi64(ab_23, cd_23);
449
+
450
+ vecs[0] = abcd_0;
451
+ vecs[1] = abcd_1;
452
+ vecs[2] = abcd_2;
453
+ vecs[3] = abcd_3;
454
+ }
455
+
456
+ INLINE void transpose_msg_vecs4(const uint8_t *const *inputs,
457
+ size_t block_offset, __m128i out[16]) {
458
+ out[0] = loadu_128(&inputs[0][block_offset + 0 * sizeof(__m128i)]);
459
+ out[1] = loadu_128(&inputs[1][block_offset + 0 * sizeof(__m128i)]);
460
+ out[2] = loadu_128(&inputs[2][block_offset + 0 * sizeof(__m128i)]);
461
+ out[3] = loadu_128(&inputs[3][block_offset + 0 * sizeof(__m128i)]);
462
+ out[4] = loadu_128(&inputs[0][block_offset + 1 * sizeof(__m128i)]);
463
+ out[5] = loadu_128(&inputs[1][block_offset + 1 * sizeof(__m128i)]);
464
+ out[6] = loadu_128(&inputs[2][block_offset + 1 * sizeof(__m128i)]);
465
+ out[7] = loadu_128(&inputs[3][block_offset + 1 * sizeof(__m128i)]);
466
+ out[8] = loadu_128(&inputs[0][block_offset + 2 * sizeof(__m128i)]);
467
+ out[9] = loadu_128(&inputs[1][block_offset + 2 * sizeof(__m128i)]);
468
+ out[10] = loadu_128(&inputs[2][block_offset + 2 * sizeof(__m128i)]);
469
+ out[11] = loadu_128(&inputs[3][block_offset + 2 * sizeof(__m128i)]);
470
+ out[12] = loadu_128(&inputs[0][block_offset + 3 * sizeof(__m128i)]);
471
+ out[13] = loadu_128(&inputs[1][block_offset + 3 * sizeof(__m128i)]);
472
+ out[14] = loadu_128(&inputs[2][block_offset + 3 * sizeof(__m128i)]);
473
+ out[15] = loadu_128(&inputs[3][block_offset + 3 * sizeof(__m128i)]);
474
+ for (size_t i = 0; i < 4; ++i) {
475
+ _mm_prefetch((const void *)&inputs[i][block_offset + 256], _MM_HINT_T0);
476
+ }
477
+ transpose_vecs_128(&out[0]);
478
+ transpose_vecs_128(&out[4]);
479
+ transpose_vecs_128(&out[8]);
480
+ transpose_vecs_128(&out[12]);
481
+ }
482
+
483
+ INLINE void load_counters4(uint64_t counter, bool increment_counter,
484
+ __m128i *out_lo, __m128i *out_hi) {
485
+ uint64_t mask = (increment_counter ? ~0 : 0);
486
+ __m256i mask_vec = _mm256_set1_epi64x(mask);
487
+ __m256i deltas = _mm256_setr_epi64x(0, 1, 2, 3);
488
+ deltas = _mm256_and_si256(mask_vec, deltas);
489
+ __m256i counters =
490
+ _mm256_add_epi64(_mm256_set1_epi64x((int64_t)counter), deltas);
491
+ *out_lo = _mm256_cvtepi64_epi32(counters);
492
+ *out_hi = _mm256_cvtepi64_epi32(_mm256_srli_epi64(counters, 32));
493
+ }
494
+
495
+ static
496
+ void blake3_hash4_avx512(const uint8_t *const *inputs, size_t blocks,
497
+ const uint32_t key[8], uint64_t counter,
498
+ bool increment_counter, uint8_t flags,
499
+ uint8_t flags_start, uint8_t flags_end, uint8_t *out) {
500
+ __m128i h_vecs[8] = {
501
+ set1_128(key[0]), set1_128(key[1]), set1_128(key[2]), set1_128(key[3]),
502
+ set1_128(key[4]), set1_128(key[5]), set1_128(key[6]), set1_128(key[7]),
503
+ };
504
+ __m128i counter_low_vec, counter_high_vec;
505
+ load_counters4(counter, increment_counter, &counter_low_vec,
506
+ &counter_high_vec);
507
+ uint8_t block_flags = flags | flags_start;
508
+
509
+ for (size_t block = 0; block < blocks; block++) {
510
+ if (block + 1 == blocks) {
511
+ block_flags |= flags_end;
512
+ }
513
+ __m128i block_len_vec = set1_128(BLAKE3_BLOCK_LEN);
514
+ __m128i block_flags_vec = set1_128(block_flags);
515
+ __m128i msg_vecs[16];
516
+ transpose_msg_vecs4(inputs, block * BLAKE3_BLOCK_LEN, msg_vecs);
517
+
518
+ __m128i v[16] = {
519
+ h_vecs[0], h_vecs[1], h_vecs[2], h_vecs[3],
520
+ h_vecs[4], h_vecs[5], h_vecs[6], h_vecs[7],
521
+ set1_128(IV[0]), set1_128(IV[1]), set1_128(IV[2]), set1_128(IV[3]),
522
+ counter_low_vec, counter_high_vec, block_len_vec, block_flags_vec,
523
+ };
524
+ round_fn4(v, msg_vecs, 0);
525
+ round_fn4(v, msg_vecs, 1);
526
+ round_fn4(v, msg_vecs, 2);
527
+ round_fn4(v, msg_vecs, 3);
528
+ round_fn4(v, msg_vecs, 4);
529
+ round_fn4(v, msg_vecs, 5);
530
+ round_fn4(v, msg_vecs, 6);
531
+ h_vecs[0] = xor_128(v[0], v[8]);
532
+ h_vecs[1] = xor_128(v[1], v[9]);
533
+ h_vecs[2] = xor_128(v[2], v[10]);
534
+ h_vecs[3] = xor_128(v[3], v[11]);
535
+ h_vecs[4] = xor_128(v[4], v[12]);
536
+ h_vecs[5] = xor_128(v[5], v[13]);
537
+ h_vecs[6] = xor_128(v[6], v[14]);
538
+ h_vecs[7] = xor_128(v[7], v[15]);
539
+
540
+ block_flags = flags;
541
+ }
542
+
543
+ transpose_vecs_128(&h_vecs[0]);
544
+ transpose_vecs_128(&h_vecs[4]);
545
+ // The first four vecs now contain the first half of each output, and the
546
+ // second four vecs contain the second half of each output.
547
+ storeu_128(h_vecs[0], &out[0 * sizeof(__m128i)]);
548
+ storeu_128(h_vecs[4], &out[1 * sizeof(__m128i)]);
549
+ storeu_128(h_vecs[1], &out[2 * sizeof(__m128i)]);
550
+ storeu_128(h_vecs[5], &out[3 * sizeof(__m128i)]);
551
+ storeu_128(h_vecs[2], &out[4 * sizeof(__m128i)]);
552
+ storeu_128(h_vecs[6], &out[5 * sizeof(__m128i)]);
553
+ storeu_128(h_vecs[3], &out[6 * sizeof(__m128i)]);
554
+ storeu_128(h_vecs[7], &out[7 * sizeof(__m128i)]);
555
+ }
556
+
557
+ static
558
+ void blake3_xof4_avx512(const uint32_t cv[8],
559
+ const uint8_t block[BLAKE3_BLOCK_LEN],
560
+ uint8_t block_len, uint64_t counter, uint8_t flags,
561
+ uint8_t out[4 * 64]) {
562
+ __m128i h_vecs[8] = {
563
+ set1_128(cv[0]), set1_128(cv[1]), set1_128(cv[2]), set1_128(cv[3]),
564
+ set1_128(cv[4]), set1_128(cv[5]), set1_128(cv[6]), set1_128(cv[7]),
565
+ };
566
+ uint32_t block_words[16];
567
+ load_block_words(block, block_words);
568
+ __m128i msg_vecs[16];
569
+ for (size_t i = 0; i < 16; i++) {
570
+ msg_vecs[i] = set1_128(block_words[i]);
571
+ }
572
+ __m128i counter_low_vec, counter_high_vec;
573
+ load_counters4(counter, true, &counter_low_vec, &counter_high_vec);
574
+ __m128i block_len_vec = set1_128(block_len);
575
+ __m128i block_flags_vec = set1_128(flags);
576
+ __m128i v[16] = {
577
+ h_vecs[0], h_vecs[1], h_vecs[2], h_vecs[3],
578
+ h_vecs[4], h_vecs[5], h_vecs[6], h_vecs[7],
579
+ set1_128(IV[0]), set1_128(IV[1]), set1_128(IV[2]), set1_128(IV[3]),
580
+ counter_low_vec, counter_high_vec, block_len_vec, block_flags_vec,
581
+ };
582
+ round_fn4(v, msg_vecs, 0);
583
+ round_fn4(v, msg_vecs, 1);
584
+ round_fn4(v, msg_vecs, 2);
585
+ round_fn4(v, msg_vecs, 3);
586
+ round_fn4(v, msg_vecs, 4);
587
+ round_fn4(v, msg_vecs, 5);
588
+ round_fn4(v, msg_vecs, 6);
589
+ for (size_t i = 0; i < 8; i++) {
590
+ v[i] = xor_128(v[i], v[i+8]);
591
+ v[i+8] = xor_128(v[i+8], h_vecs[i]);
592
+ }
593
+ transpose_vecs_128(&v[0]);
594
+ transpose_vecs_128(&v[4]);
595
+ transpose_vecs_128(&v[8]);
596
+ transpose_vecs_128(&v[12]);
597
+ for (size_t i = 0; i < 4; i++) {
598
+ storeu_128(v[i+ 0], &out[(4*i+0) * sizeof(__m128i)]);
599
+ storeu_128(v[i+ 4], &out[(4*i+1) * sizeof(__m128i)]);
600
+ storeu_128(v[i+ 8], &out[(4*i+2) * sizeof(__m128i)]);
601
+ storeu_128(v[i+12], &out[(4*i+3) * sizeof(__m128i)]);
602
+ }
603
+ }
604
+
605
+ /*
606
+ * ----------------------------------------------------------------------------
607
+ * hash8_avx512
608
+ * ----------------------------------------------------------------------------
609
+ */
610
+
611
+ INLINE void round_fn8(__m256i v[16], __m256i m[16], size_t r) {
612
+ v[0] = add_256(v[0], m[(size_t)MSG_SCHEDULE[r][0]]);
613
+ v[1] = add_256(v[1], m[(size_t)MSG_SCHEDULE[r][2]]);
614
+ v[2] = add_256(v[2], m[(size_t)MSG_SCHEDULE[r][4]]);
615
+ v[3] = add_256(v[3], m[(size_t)MSG_SCHEDULE[r][6]]);
616
+ v[0] = add_256(v[0], v[4]);
617
+ v[1] = add_256(v[1], v[5]);
618
+ v[2] = add_256(v[2], v[6]);
619
+ v[3] = add_256(v[3], v[7]);
620
+ v[12] = xor_256(v[12], v[0]);
621
+ v[13] = xor_256(v[13], v[1]);
622
+ v[14] = xor_256(v[14], v[2]);
623
+ v[15] = xor_256(v[15], v[3]);
624
+ v[12] = rot16_256(v[12]);
625
+ v[13] = rot16_256(v[13]);
626
+ v[14] = rot16_256(v[14]);
627
+ v[15] = rot16_256(v[15]);
628
+ v[8] = add_256(v[8], v[12]);
629
+ v[9] = add_256(v[9], v[13]);
630
+ v[10] = add_256(v[10], v[14]);
631
+ v[11] = add_256(v[11], v[15]);
632
+ v[4] = xor_256(v[4], v[8]);
633
+ v[5] = xor_256(v[5], v[9]);
634
+ v[6] = xor_256(v[6], v[10]);
635
+ v[7] = xor_256(v[7], v[11]);
636
+ v[4] = rot12_256(v[4]);
637
+ v[5] = rot12_256(v[5]);
638
+ v[6] = rot12_256(v[6]);
639
+ v[7] = rot12_256(v[7]);
640
+ v[0] = add_256(v[0], m[(size_t)MSG_SCHEDULE[r][1]]);
641
+ v[1] = add_256(v[1], m[(size_t)MSG_SCHEDULE[r][3]]);
642
+ v[2] = add_256(v[2], m[(size_t)MSG_SCHEDULE[r][5]]);
643
+ v[3] = add_256(v[3], m[(size_t)MSG_SCHEDULE[r][7]]);
644
+ v[0] = add_256(v[0], v[4]);
645
+ v[1] = add_256(v[1], v[5]);
646
+ v[2] = add_256(v[2], v[6]);
647
+ v[3] = add_256(v[3], v[7]);
648
+ v[12] = xor_256(v[12], v[0]);
649
+ v[13] = xor_256(v[13], v[1]);
650
+ v[14] = xor_256(v[14], v[2]);
651
+ v[15] = xor_256(v[15], v[3]);
652
+ v[12] = rot8_256(v[12]);
653
+ v[13] = rot8_256(v[13]);
654
+ v[14] = rot8_256(v[14]);
655
+ v[15] = rot8_256(v[15]);
656
+ v[8] = add_256(v[8], v[12]);
657
+ v[9] = add_256(v[9], v[13]);
658
+ v[10] = add_256(v[10], v[14]);
659
+ v[11] = add_256(v[11], v[15]);
660
+ v[4] = xor_256(v[4], v[8]);
661
+ v[5] = xor_256(v[5], v[9]);
662
+ v[6] = xor_256(v[6], v[10]);
663
+ v[7] = xor_256(v[7], v[11]);
664
+ v[4] = rot7_256(v[4]);
665
+ v[5] = rot7_256(v[5]);
666
+ v[6] = rot7_256(v[6]);
667
+ v[7] = rot7_256(v[7]);
668
+
669
+ v[0] = add_256(v[0], m[(size_t)MSG_SCHEDULE[r][8]]);
670
+ v[1] = add_256(v[1], m[(size_t)MSG_SCHEDULE[r][10]]);
671
+ v[2] = add_256(v[2], m[(size_t)MSG_SCHEDULE[r][12]]);
672
+ v[3] = add_256(v[3], m[(size_t)MSG_SCHEDULE[r][14]]);
673
+ v[0] = add_256(v[0], v[5]);
674
+ v[1] = add_256(v[1], v[6]);
675
+ v[2] = add_256(v[2], v[7]);
676
+ v[3] = add_256(v[3], v[4]);
677
+ v[15] = xor_256(v[15], v[0]);
678
+ v[12] = xor_256(v[12], v[1]);
679
+ v[13] = xor_256(v[13], v[2]);
680
+ v[14] = xor_256(v[14], v[3]);
681
+ v[15] = rot16_256(v[15]);
682
+ v[12] = rot16_256(v[12]);
683
+ v[13] = rot16_256(v[13]);
684
+ v[14] = rot16_256(v[14]);
685
+ v[10] = add_256(v[10], v[15]);
686
+ v[11] = add_256(v[11], v[12]);
687
+ v[8] = add_256(v[8], v[13]);
688
+ v[9] = add_256(v[9], v[14]);
689
+ v[5] = xor_256(v[5], v[10]);
690
+ v[6] = xor_256(v[6], v[11]);
691
+ v[7] = xor_256(v[7], v[8]);
692
+ v[4] = xor_256(v[4], v[9]);
693
+ v[5] = rot12_256(v[5]);
694
+ v[6] = rot12_256(v[6]);
695
+ v[7] = rot12_256(v[7]);
696
+ v[4] = rot12_256(v[4]);
697
+ v[0] = add_256(v[0], m[(size_t)MSG_SCHEDULE[r][9]]);
698
+ v[1] = add_256(v[1], m[(size_t)MSG_SCHEDULE[r][11]]);
699
+ v[2] = add_256(v[2], m[(size_t)MSG_SCHEDULE[r][13]]);
700
+ v[3] = add_256(v[3], m[(size_t)MSG_SCHEDULE[r][15]]);
701
+ v[0] = add_256(v[0], v[5]);
702
+ v[1] = add_256(v[1], v[6]);
703
+ v[2] = add_256(v[2], v[7]);
704
+ v[3] = add_256(v[3], v[4]);
705
+ v[15] = xor_256(v[15], v[0]);
706
+ v[12] = xor_256(v[12], v[1]);
707
+ v[13] = xor_256(v[13], v[2]);
708
+ v[14] = xor_256(v[14], v[3]);
709
+ v[15] = rot8_256(v[15]);
710
+ v[12] = rot8_256(v[12]);
711
+ v[13] = rot8_256(v[13]);
712
+ v[14] = rot8_256(v[14]);
713
+ v[10] = add_256(v[10], v[15]);
714
+ v[11] = add_256(v[11], v[12]);
715
+ v[8] = add_256(v[8], v[13]);
716
+ v[9] = add_256(v[9], v[14]);
717
+ v[5] = xor_256(v[5], v[10]);
718
+ v[6] = xor_256(v[6], v[11]);
719
+ v[7] = xor_256(v[7], v[8]);
720
+ v[4] = xor_256(v[4], v[9]);
721
+ v[5] = rot7_256(v[5]);
722
+ v[6] = rot7_256(v[6]);
723
+ v[7] = rot7_256(v[7]);
724
+ v[4] = rot7_256(v[4]);
725
+ }
726
+
727
+ INLINE void transpose_vecs_256(__m256i vecs[8]) {
728
+ // Interleave 32-bit lanes. The low unpack is lanes 00/11/44/55, and the high
729
+ // is 22/33/66/77.
730
+ __m256i ab_0145 = _mm256_unpacklo_epi32(vecs[0], vecs[1]);
731
+ __m256i ab_2367 = _mm256_unpackhi_epi32(vecs[0], vecs[1]);
732
+ __m256i cd_0145 = _mm256_unpacklo_epi32(vecs[2], vecs[3]);
733
+ __m256i cd_2367 = _mm256_unpackhi_epi32(vecs[2], vecs[3]);
734
+ __m256i ef_0145 = _mm256_unpacklo_epi32(vecs[4], vecs[5]);
735
+ __m256i ef_2367 = _mm256_unpackhi_epi32(vecs[4], vecs[5]);
736
+ __m256i gh_0145 = _mm256_unpacklo_epi32(vecs[6], vecs[7]);
737
+ __m256i gh_2367 = _mm256_unpackhi_epi32(vecs[6], vecs[7]);
738
+
739
+ // Interleave 64-bit lanes. The low unpack is lanes 00/22 and the high is
740
+ // 11/33.
741
+ __m256i abcd_04 = _mm256_unpacklo_epi64(ab_0145, cd_0145);
742
+ __m256i abcd_15 = _mm256_unpackhi_epi64(ab_0145, cd_0145);
743
+ __m256i abcd_26 = _mm256_unpacklo_epi64(ab_2367, cd_2367);
744
+ __m256i abcd_37 = _mm256_unpackhi_epi64(ab_2367, cd_2367);
745
+ __m256i efgh_04 = _mm256_unpacklo_epi64(ef_0145, gh_0145);
746
+ __m256i efgh_15 = _mm256_unpackhi_epi64(ef_0145, gh_0145);
747
+ __m256i efgh_26 = _mm256_unpacklo_epi64(ef_2367, gh_2367);
748
+ __m256i efgh_37 = _mm256_unpackhi_epi64(ef_2367, gh_2367);
749
+
750
+ // Interleave 128-bit lanes.
751
+ vecs[0] = _mm256_permute2x128_si256(abcd_04, efgh_04, 0x20);
752
+ vecs[1] = _mm256_permute2x128_si256(abcd_15, efgh_15, 0x20);
753
+ vecs[2] = _mm256_permute2x128_si256(abcd_26, efgh_26, 0x20);
754
+ vecs[3] = _mm256_permute2x128_si256(abcd_37, efgh_37, 0x20);
755
+ vecs[4] = _mm256_permute2x128_si256(abcd_04, efgh_04, 0x31);
756
+ vecs[5] = _mm256_permute2x128_si256(abcd_15, efgh_15, 0x31);
757
+ vecs[6] = _mm256_permute2x128_si256(abcd_26, efgh_26, 0x31);
758
+ vecs[7] = _mm256_permute2x128_si256(abcd_37, efgh_37, 0x31);
759
+ }
760
+
761
+ INLINE void transpose_msg_vecs8(const uint8_t *const *inputs,
762
+ size_t block_offset, __m256i out[16]) {
763
+ out[0] = loadu_256(&inputs[0][block_offset + 0 * sizeof(__m256i)]);
764
+ out[1] = loadu_256(&inputs[1][block_offset + 0 * sizeof(__m256i)]);
765
+ out[2] = loadu_256(&inputs[2][block_offset + 0 * sizeof(__m256i)]);
766
+ out[3] = loadu_256(&inputs[3][block_offset + 0 * sizeof(__m256i)]);
767
+ out[4] = loadu_256(&inputs[4][block_offset + 0 * sizeof(__m256i)]);
768
+ out[5] = loadu_256(&inputs[5][block_offset + 0 * sizeof(__m256i)]);
769
+ out[6] = loadu_256(&inputs[6][block_offset + 0 * sizeof(__m256i)]);
770
+ out[7] = loadu_256(&inputs[7][block_offset + 0 * sizeof(__m256i)]);
771
+ out[8] = loadu_256(&inputs[0][block_offset + 1 * sizeof(__m256i)]);
772
+ out[9] = loadu_256(&inputs[1][block_offset + 1 * sizeof(__m256i)]);
773
+ out[10] = loadu_256(&inputs[2][block_offset + 1 * sizeof(__m256i)]);
774
+ out[11] = loadu_256(&inputs[3][block_offset + 1 * sizeof(__m256i)]);
775
+ out[12] = loadu_256(&inputs[4][block_offset + 1 * sizeof(__m256i)]);
776
+ out[13] = loadu_256(&inputs[5][block_offset + 1 * sizeof(__m256i)]);
777
+ out[14] = loadu_256(&inputs[6][block_offset + 1 * sizeof(__m256i)]);
778
+ out[15] = loadu_256(&inputs[7][block_offset + 1 * sizeof(__m256i)]);
779
+ for (size_t i = 0; i < 8; ++i) {
780
+ _mm_prefetch((const void *)&inputs[i][block_offset + 256], _MM_HINT_T0);
781
+ }
782
+ transpose_vecs_256(&out[0]);
783
+ transpose_vecs_256(&out[8]);
784
+ }
785
+
786
+ INLINE void load_counters8(uint64_t counter, bool increment_counter,
787
+ __m256i *out_lo, __m256i *out_hi) {
788
+ uint64_t mask = (increment_counter ? ~0 : 0);
789
+ __m512i mask_vec = _mm512_set1_epi64(mask);
790
+ __m512i deltas = _mm512_setr_epi64(0, 1, 2, 3, 4, 5, 6, 7);
791
+ deltas = _mm512_and_si512(mask_vec, deltas);
792
+ __m512i counters =
793
+ _mm512_add_epi64(_mm512_set1_epi64((int64_t)counter), deltas);
794
+ *out_lo = _mm512_cvtepi64_epi32(counters);
795
+ *out_hi = _mm512_cvtepi64_epi32(_mm512_srli_epi64(counters, 32));
796
+ }
797
+
798
+ static
799
+ void blake3_hash8_avx512(const uint8_t *const *inputs, size_t blocks,
800
+ const uint32_t key[8], uint64_t counter,
801
+ bool increment_counter, uint8_t flags,
802
+ uint8_t flags_start, uint8_t flags_end, uint8_t *out) {
803
+ __m256i h_vecs[8] = {
804
+ set1_256(key[0]), set1_256(key[1]), set1_256(key[2]), set1_256(key[3]),
805
+ set1_256(key[4]), set1_256(key[5]), set1_256(key[6]), set1_256(key[7]),
806
+ };
807
+ __m256i counter_low_vec, counter_high_vec;
808
+ load_counters8(counter, increment_counter, &counter_low_vec,
809
+ &counter_high_vec);
810
+ uint8_t block_flags = flags | flags_start;
811
+
812
+ for (size_t block = 0; block < blocks; block++) {
813
+ if (block + 1 == blocks) {
814
+ block_flags |= flags_end;
815
+ }
816
+ __m256i block_len_vec = set1_256(BLAKE3_BLOCK_LEN);
817
+ __m256i block_flags_vec = set1_256(block_flags);
818
+ __m256i msg_vecs[16];
819
+ transpose_msg_vecs8(inputs, block * BLAKE3_BLOCK_LEN, msg_vecs);
820
+
821
+ __m256i v[16] = {
822
+ h_vecs[0], h_vecs[1], h_vecs[2], h_vecs[3],
823
+ h_vecs[4], h_vecs[5], h_vecs[6], h_vecs[7],
824
+ set1_256(IV[0]), set1_256(IV[1]), set1_256(IV[2]), set1_256(IV[3]),
825
+ counter_low_vec, counter_high_vec, block_len_vec, block_flags_vec,
826
+ };
827
+ round_fn8(v, msg_vecs, 0);
828
+ round_fn8(v, msg_vecs, 1);
829
+ round_fn8(v, msg_vecs, 2);
830
+ round_fn8(v, msg_vecs, 3);
831
+ round_fn8(v, msg_vecs, 4);
832
+ round_fn8(v, msg_vecs, 5);
833
+ round_fn8(v, msg_vecs, 6);
834
+ h_vecs[0] = xor_256(v[0], v[8]);
835
+ h_vecs[1] = xor_256(v[1], v[9]);
836
+ h_vecs[2] = xor_256(v[2], v[10]);
837
+ h_vecs[3] = xor_256(v[3], v[11]);
838
+ h_vecs[4] = xor_256(v[4], v[12]);
839
+ h_vecs[5] = xor_256(v[5], v[13]);
840
+ h_vecs[6] = xor_256(v[6], v[14]);
841
+ h_vecs[7] = xor_256(v[7], v[15]);
842
+
843
+ block_flags = flags;
844
+ }
845
+
846
+ transpose_vecs_256(h_vecs);
847
+ storeu_256(h_vecs[0], &out[0 * sizeof(__m256i)]);
848
+ storeu_256(h_vecs[1], &out[1 * sizeof(__m256i)]);
849
+ storeu_256(h_vecs[2], &out[2 * sizeof(__m256i)]);
850
+ storeu_256(h_vecs[3], &out[3 * sizeof(__m256i)]);
851
+ storeu_256(h_vecs[4], &out[4 * sizeof(__m256i)]);
852
+ storeu_256(h_vecs[5], &out[5 * sizeof(__m256i)]);
853
+ storeu_256(h_vecs[6], &out[6 * sizeof(__m256i)]);
854
+ storeu_256(h_vecs[7], &out[7 * sizeof(__m256i)]);
855
+ }
856
+
857
+ static
858
+ void blake3_xof8_avx512(const uint32_t cv[8],
859
+ const uint8_t block[BLAKE3_BLOCK_LEN],
860
+ uint8_t block_len, uint64_t counter, uint8_t flags,
861
+ uint8_t out[8 * 64]) {
862
+ __m256i h_vecs[8] = {
863
+ set1_256(cv[0]), set1_256(cv[1]), set1_256(cv[2]), set1_256(cv[3]),
864
+ set1_256(cv[4]), set1_256(cv[5]), set1_256(cv[6]), set1_256(cv[7]),
865
+ };
866
+ uint32_t block_words[16];
867
+ load_block_words(block, block_words);
868
+ __m256i msg_vecs[16];
869
+ for (size_t i = 0; i < 16; i++) {
870
+ msg_vecs[i] = set1_256(block_words[i]);
871
+ }
872
+ __m256i counter_low_vec, counter_high_vec;
873
+ load_counters8(counter, true, &counter_low_vec, &counter_high_vec);
874
+ __m256i block_len_vec = set1_256(block_len);
875
+ __m256i block_flags_vec = set1_256(flags);
876
+ __m256i v[16] = {
877
+ h_vecs[0], h_vecs[1], h_vecs[2], h_vecs[3],
878
+ h_vecs[4], h_vecs[5], h_vecs[6], h_vecs[7],
879
+ set1_256(IV[0]), set1_256(IV[1]), set1_256(IV[2]), set1_256(IV[3]),
880
+ counter_low_vec, counter_high_vec, block_len_vec, block_flags_vec,
881
+ };
882
+ round_fn8(v, msg_vecs, 0);
883
+ round_fn8(v, msg_vecs, 1);
884
+ round_fn8(v, msg_vecs, 2);
885
+ round_fn8(v, msg_vecs, 3);
886
+ round_fn8(v, msg_vecs, 4);
887
+ round_fn8(v, msg_vecs, 5);
888
+ round_fn8(v, msg_vecs, 6);
889
+ for (size_t i = 0; i < 8; i++) {
890
+ v[i] = xor_256(v[i], v[i+8]);
891
+ v[i+8] = xor_256(v[i+8], h_vecs[i]);
892
+ }
893
+ transpose_vecs_256(&v[0]);
894
+ transpose_vecs_256(&v[8]);
895
+ for (size_t i = 0; i < 8; i++) {
896
+ storeu_256(v[i+0], &out[(2*i+0) * sizeof(__m256i)]);
897
+ storeu_256(v[i+8], &out[(2*i+1) * sizeof(__m256i)]);
898
+ }
899
+ }
900
+
901
+ /*
902
+ * ----------------------------------------------------------------------------
903
+ * hash16_avx512
904
+ * ----------------------------------------------------------------------------
905
+ */
906
+
907
+ INLINE void round_fn16(__m512i v[16], __m512i m[16], size_t r) {
908
+ v[0] = add_512(v[0], m[(size_t)MSG_SCHEDULE[r][0]]);
909
+ v[1] = add_512(v[1], m[(size_t)MSG_SCHEDULE[r][2]]);
910
+ v[2] = add_512(v[2], m[(size_t)MSG_SCHEDULE[r][4]]);
911
+ v[3] = add_512(v[3], m[(size_t)MSG_SCHEDULE[r][6]]);
912
+ v[0] = add_512(v[0], v[4]);
913
+ v[1] = add_512(v[1], v[5]);
914
+ v[2] = add_512(v[2], v[6]);
915
+ v[3] = add_512(v[3], v[7]);
916
+ v[12] = xor_512(v[12], v[0]);
917
+ v[13] = xor_512(v[13], v[1]);
918
+ v[14] = xor_512(v[14], v[2]);
919
+ v[15] = xor_512(v[15], v[3]);
920
+ v[12] = rot16_512(v[12]);
921
+ v[13] = rot16_512(v[13]);
922
+ v[14] = rot16_512(v[14]);
923
+ v[15] = rot16_512(v[15]);
924
+ v[8] = add_512(v[8], v[12]);
925
+ v[9] = add_512(v[9], v[13]);
926
+ v[10] = add_512(v[10], v[14]);
927
+ v[11] = add_512(v[11], v[15]);
928
+ v[4] = xor_512(v[4], v[8]);
929
+ v[5] = xor_512(v[5], v[9]);
930
+ v[6] = xor_512(v[6], v[10]);
931
+ v[7] = xor_512(v[7], v[11]);
932
+ v[4] = rot12_512(v[4]);
933
+ v[5] = rot12_512(v[5]);
934
+ v[6] = rot12_512(v[6]);
935
+ v[7] = rot12_512(v[7]);
936
+ v[0] = add_512(v[0], m[(size_t)MSG_SCHEDULE[r][1]]);
937
+ v[1] = add_512(v[1], m[(size_t)MSG_SCHEDULE[r][3]]);
938
+ v[2] = add_512(v[2], m[(size_t)MSG_SCHEDULE[r][5]]);
939
+ v[3] = add_512(v[3], m[(size_t)MSG_SCHEDULE[r][7]]);
940
+ v[0] = add_512(v[0], v[4]);
941
+ v[1] = add_512(v[1], v[5]);
942
+ v[2] = add_512(v[2], v[6]);
943
+ v[3] = add_512(v[3], v[7]);
944
+ v[12] = xor_512(v[12], v[0]);
945
+ v[13] = xor_512(v[13], v[1]);
946
+ v[14] = xor_512(v[14], v[2]);
947
+ v[15] = xor_512(v[15], v[3]);
948
+ v[12] = rot8_512(v[12]);
949
+ v[13] = rot8_512(v[13]);
950
+ v[14] = rot8_512(v[14]);
951
+ v[15] = rot8_512(v[15]);
952
+ v[8] = add_512(v[8], v[12]);
953
+ v[9] = add_512(v[9], v[13]);
954
+ v[10] = add_512(v[10], v[14]);
955
+ v[11] = add_512(v[11], v[15]);
956
+ v[4] = xor_512(v[4], v[8]);
957
+ v[5] = xor_512(v[5], v[9]);
958
+ v[6] = xor_512(v[6], v[10]);
959
+ v[7] = xor_512(v[7], v[11]);
960
+ v[4] = rot7_512(v[4]);
961
+ v[5] = rot7_512(v[5]);
962
+ v[6] = rot7_512(v[6]);
963
+ v[7] = rot7_512(v[7]);
964
+
965
+ v[0] = add_512(v[0], m[(size_t)MSG_SCHEDULE[r][8]]);
966
+ v[1] = add_512(v[1], m[(size_t)MSG_SCHEDULE[r][10]]);
967
+ v[2] = add_512(v[2], m[(size_t)MSG_SCHEDULE[r][12]]);
968
+ v[3] = add_512(v[3], m[(size_t)MSG_SCHEDULE[r][14]]);
969
+ v[0] = add_512(v[0], v[5]);
970
+ v[1] = add_512(v[1], v[6]);
971
+ v[2] = add_512(v[2], v[7]);
972
+ v[3] = add_512(v[3], v[4]);
973
+ v[15] = xor_512(v[15], v[0]);
974
+ v[12] = xor_512(v[12], v[1]);
975
+ v[13] = xor_512(v[13], v[2]);
976
+ v[14] = xor_512(v[14], v[3]);
977
+ v[15] = rot16_512(v[15]);
978
+ v[12] = rot16_512(v[12]);
979
+ v[13] = rot16_512(v[13]);
980
+ v[14] = rot16_512(v[14]);
981
+ v[10] = add_512(v[10], v[15]);
982
+ v[11] = add_512(v[11], v[12]);
983
+ v[8] = add_512(v[8], v[13]);
984
+ v[9] = add_512(v[9], v[14]);
985
+ v[5] = xor_512(v[5], v[10]);
986
+ v[6] = xor_512(v[6], v[11]);
987
+ v[7] = xor_512(v[7], v[8]);
988
+ v[4] = xor_512(v[4], v[9]);
989
+ v[5] = rot12_512(v[5]);
990
+ v[6] = rot12_512(v[6]);
991
+ v[7] = rot12_512(v[7]);
992
+ v[4] = rot12_512(v[4]);
993
+ v[0] = add_512(v[0], m[(size_t)MSG_SCHEDULE[r][9]]);
994
+ v[1] = add_512(v[1], m[(size_t)MSG_SCHEDULE[r][11]]);
995
+ v[2] = add_512(v[2], m[(size_t)MSG_SCHEDULE[r][13]]);
996
+ v[3] = add_512(v[3], m[(size_t)MSG_SCHEDULE[r][15]]);
997
+ v[0] = add_512(v[0], v[5]);
998
+ v[1] = add_512(v[1], v[6]);
999
+ v[2] = add_512(v[2], v[7]);
1000
+ v[3] = add_512(v[3], v[4]);
1001
+ v[15] = xor_512(v[15], v[0]);
1002
+ v[12] = xor_512(v[12], v[1]);
1003
+ v[13] = xor_512(v[13], v[2]);
1004
+ v[14] = xor_512(v[14], v[3]);
1005
+ v[15] = rot8_512(v[15]);
1006
+ v[12] = rot8_512(v[12]);
1007
+ v[13] = rot8_512(v[13]);
1008
+ v[14] = rot8_512(v[14]);
1009
+ v[10] = add_512(v[10], v[15]);
1010
+ v[11] = add_512(v[11], v[12]);
1011
+ v[8] = add_512(v[8], v[13]);
1012
+ v[9] = add_512(v[9], v[14]);
1013
+ v[5] = xor_512(v[5], v[10]);
1014
+ v[6] = xor_512(v[6], v[11]);
1015
+ v[7] = xor_512(v[7], v[8]);
1016
+ v[4] = xor_512(v[4], v[9]);
1017
+ v[5] = rot7_512(v[5]);
1018
+ v[6] = rot7_512(v[6]);
1019
+ v[7] = rot7_512(v[7]);
1020
+ v[4] = rot7_512(v[4]);
1021
+ }
1022
+
1023
+ // 0b10001000, or lanes a0/a2/b0/b2 in little-endian order
1024
+ #define LO_IMM8 0x88
1025
+
1026
+ INLINE __m512i unpack_lo_128(__m512i a, __m512i b) {
1027
+ return _mm512_shuffle_i32x4(a, b, LO_IMM8);
1028
+ }
1029
+
1030
+ // 0b11011101, or lanes a1/a3/b1/b3 in little-endian order
1031
+ #define HI_IMM8 0xdd
1032
+
1033
+ INLINE __m512i unpack_hi_128(__m512i a, __m512i b) {
1034
+ return _mm512_shuffle_i32x4(a, b, HI_IMM8);
1035
+ }
1036
+
1037
+ INLINE void transpose_vecs_512(__m512i vecs[16]) {
1038
+ // Interleave 32-bit lanes. The _0 unpack is lanes
1039
+ // 0/0/1/1/4/4/5/5/8/8/9/9/12/12/13/13, and the _2 unpack is lanes
1040
+ // 2/2/3/3/6/6/7/7/10/10/11/11/14/14/15/15.
1041
+ __m512i ab_0 = _mm512_unpacklo_epi32(vecs[0], vecs[1]);
1042
+ __m512i ab_2 = _mm512_unpackhi_epi32(vecs[0], vecs[1]);
1043
+ __m512i cd_0 = _mm512_unpacklo_epi32(vecs[2], vecs[3]);
1044
+ __m512i cd_2 = _mm512_unpackhi_epi32(vecs[2], vecs[3]);
1045
+ __m512i ef_0 = _mm512_unpacklo_epi32(vecs[4], vecs[5]);
1046
+ __m512i ef_2 = _mm512_unpackhi_epi32(vecs[4], vecs[5]);
1047
+ __m512i gh_0 = _mm512_unpacklo_epi32(vecs[6], vecs[7]);
1048
+ __m512i gh_2 = _mm512_unpackhi_epi32(vecs[6], vecs[7]);
1049
+ __m512i ij_0 = _mm512_unpacklo_epi32(vecs[8], vecs[9]);
1050
+ __m512i ij_2 = _mm512_unpackhi_epi32(vecs[8], vecs[9]);
1051
+ __m512i kl_0 = _mm512_unpacklo_epi32(vecs[10], vecs[11]);
1052
+ __m512i kl_2 = _mm512_unpackhi_epi32(vecs[10], vecs[11]);
1053
+ __m512i mn_0 = _mm512_unpacklo_epi32(vecs[12], vecs[13]);
1054
+ __m512i mn_2 = _mm512_unpackhi_epi32(vecs[12], vecs[13]);
1055
+ __m512i op_0 = _mm512_unpacklo_epi32(vecs[14], vecs[15]);
1056
+ __m512i op_2 = _mm512_unpackhi_epi32(vecs[14], vecs[15]);
1057
+
1058
+ // Interleave 64-bit lanes. The _0 unpack is lanes
1059
+ // 0/0/0/0/4/4/4/4/8/8/8/8/12/12/12/12, the _1 unpack is lanes
1060
+ // 1/1/1/1/5/5/5/5/9/9/9/9/13/13/13/13, the _2 unpack is lanes
1061
+ // 2/2/2/2/6/6/6/6/10/10/10/10/14/14/14/14, and the _3 unpack is lanes
1062
+ // 3/3/3/3/7/7/7/7/11/11/11/11/15/15/15/15.
1063
+ __m512i abcd_0 = _mm512_unpacklo_epi64(ab_0, cd_0);
1064
+ __m512i abcd_1 = _mm512_unpackhi_epi64(ab_0, cd_0);
1065
+ __m512i abcd_2 = _mm512_unpacklo_epi64(ab_2, cd_2);
1066
+ __m512i abcd_3 = _mm512_unpackhi_epi64(ab_2, cd_2);
1067
+ __m512i efgh_0 = _mm512_unpacklo_epi64(ef_0, gh_0);
1068
+ __m512i efgh_1 = _mm512_unpackhi_epi64(ef_0, gh_0);
1069
+ __m512i efgh_2 = _mm512_unpacklo_epi64(ef_2, gh_2);
1070
+ __m512i efgh_3 = _mm512_unpackhi_epi64(ef_2, gh_2);
1071
+ __m512i ijkl_0 = _mm512_unpacklo_epi64(ij_0, kl_0);
1072
+ __m512i ijkl_1 = _mm512_unpackhi_epi64(ij_0, kl_0);
1073
+ __m512i ijkl_2 = _mm512_unpacklo_epi64(ij_2, kl_2);
1074
+ __m512i ijkl_3 = _mm512_unpackhi_epi64(ij_2, kl_2);
1075
+ __m512i mnop_0 = _mm512_unpacklo_epi64(mn_0, op_0);
1076
+ __m512i mnop_1 = _mm512_unpackhi_epi64(mn_0, op_0);
1077
+ __m512i mnop_2 = _mm512_unpacklo_epi64(mn_2, op_2);
1078
+ __m512i mnop_3 = _mm512_unpackhi_epi64(mn_2, op_2);
1079
+
1080
+ // Interleave 128-bit lanes. The _0 unpack is
1081
+ // 0/0/0/0/8/8/8/8/0/0/0/0/8/8/8/8, the _1 unpack is
1082
+ // 1/1/1/1/9/9/9/9/1/1/1/1/9/9/9/9, and so on.
1083
+ __m512i abcdefgh_0 = unpack_lo_128(abcd_0, efgh_0);
1084
+ __m512i abcdefgh_1 = unpack_lo_128(abcd_1, efgh_1);
1085
+ __m512i abcdefgh_2 = unpack_lo_128(abcd_2, efgh_2);
1086
+ __m512i abcdefgh_3 = unpack_lo_128(abcd_3, efgh_3);
1087
+ __m512i abcdefgh_4 = unpack_hi_128(abcd_0, efgh_0);
1088
+ __m512i abcdefgh_5 = unpack_hi_128(abcd_1, efgh_1);
1089
+ __m512i abcdefgh_6 = unpack_hi_128(abcd_2, efgh_2);
1090
+ __m512i abcdefgh_7 = unpack_hi_128(abcd_3, efgh_3);
1091
+ __m512i ijklmnop_0 = unpack_lo_128(ijkl_0, mnop_0);
1092
+ __m512i ijklmnop_1 = unpack_lo_128(ijkl_1, mnop_1);
1093
+ __m512i ijklmnop_2 = unpack_lo_128(ijkl_2, mnop_2);
1094
+ __m512i ijklmnop_3 = unpack_lo_128(ijkl_3, mnop_3);
1095
+ __m512i ijklmnop_4 = unpack_hi_128(ijkl_0, mnop_0);
1096
+ __m512i ijklmnop_5 = unpack_hi_128(ijkl_1, mnop_1);
1097
+ __m512i ijklmnop_6 = unpack_hi_128(ijkl_2, mnop_2);
1098
+ __m512i ijklmnop_7 = unpack_hi_128(ijkl_3, mnop_3);
1099
+
1100
+ // Interleave 128-bit lanes again for the final outputs.
1101
+ vecs[0] = unpack_lo_128(abcdefgh_0, ijklmnop_0);
1102
+ vecs[1] = unpack_lo_128(abcdefgh_1, ijklmnop_1);
1103
+ vecs[2] = unpack_lo_128(abcdefgh_2, ijklmnop_2);
1104
+ vecs[3] = unpack_lo_128(abcdefgh_3, ijklmnop_3);
1105
+ vecs[4] = unpack_lo_128(abcdefgh_4, ijklmnop_4);
1106
+ vecs[5] = unpack_lo_128(abcdefgh_5, ijklmnop_5);
1107
+ vecs[6] = unpack_lo_128(abcdefgh_6, ijklmnop_6);
1108
+ vecs[7] = unpack_lo_128(abcdefgh_7, ijklmnop_7);
1109
+ vecs[8] = unpack_hi_128(abcdefgh_0, ijklmnop_0);
1110
+ vecs[9] = unpack_hi_128(abcdefgh_1, ijklmnop_1);
1111
+ vecs[10] = unpack_hi_128(abcdefgh_2, ijklmnop_2);
1112
+ vecs[11] = unpack_hi_128(abcdefgh_3, ijklmnop_3);
1113
+ vecs[12] = unpack_hi_128(abcdefgh_4, ijklmnop_4);
1114
+ vecs[13] = unpack_hi_128(abcdefgh_5, ijklmnop_5);
1115
+ vecs[14] = unpack_hi_128(abcdefgh_6, ijklmnop_6);
1116
+ vecs[15] = unpack_hi_128(abcdefgh_7, ijklmnop_7);
1117
+ }
1118
+
1119
+ INLINE void transpose_msg_vecs16(const uint8_t *const *inputs,
1120
+ size_t block_offset, __m512i out[16]) {
1121
+ out[0] = loadu_512(&inputs[0][block_offset]);
1122
+ out[1] = loadu_512(&inputs[1][block_offset]);
1123
+ out[2] = loadu_512(&inputs[2][block_offset]);
1124
+ out[3] = loadu_512(&inputs[3][block_offset]);
1125
+ out[4] = loadu_512(&inputs[4][block_offset]);
1126
+ out[5] = loadu_512(&inputs[5][block_offset]);
1127
+ out[6] = loadu_512(&inputs[6][block_offset]);
1128
+ out[7] = loadu_512(&inputs[7][block_offset]);
1129
+ out[8] = loadu_512(&inputs[8][block_offset]);
1130
+ out[9] = loadu_512(&inputs[9][block_offset]);
1131
+ out[10] = loadu_512(&inputs[10][block_offset]);
1132
+ out[11] = loadu_512(&inputs[11][block_offset]);
1133
+ out[12] = loadu_512(&inputs[12][block_offset]);
1134
+ out[13] = loadu_512(&inputs[13][block_offset]);
1135
+ out[14] = loadu_512(&inputs[14][block_offset]);
1136
+ out[15] = loadu_512(&inputs[15][block_offset]);
1137
+ for (size_t i = 0; i < 16; ++i) {
1138
+ _mm_prefetch((const void *)&inputs[i][block_offset + 256], _MM_HINT_T0);
1139
+ }
1140
+ transpose_vecs_512(out);
1141
+ }
1142
+
1143
+ INLINE void load_counters16(uint64_t counter, bool increment_counter,
1144
+ __m512i *out_lo, __m512i *out_hi) {
1145
+ const __m512i mask = _mm512_set1_epi32(-(int32_t)increment_counter);
1146
+ const __m512i deltas = _mm512_set_epi32(15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
1147
+ const __m512i masked_deltas = _mm512_and_si512(deltas, mask);
1148
+ const __m512i low_words = _mm512_add_epi32(
1149
+ _mm512_set1_epi32((int32_t)counter),
1150
+ masked_deltas);
1151
+ // The carry bit is 1 if the high bit of the word was 1 before addition and is
1152
+ // 0 after.
1153
+ // NOTE: It would be a bit more natural to use _mm512_cmp_epu32_mask to
1154
+ // compute the carry bits here, and originally we did, but that intrinsic is
1155
+ // broken under GCC 5.4. See https://github.com/BLAKE3-team/BLAKE3/issues/271.
1156
+ const __m512i carries = _mm512_srli_epi32(
1157
+ _mm512_andnot_si512(
1158
+ low_words, // 0 after (gets inverted by andnot)
1159
+ _mm512_set1_epi32((int32_t)counter)), // and 1 before
1160
+ 31);
1161
+ const __m512i high_words = _mm512_add_epi32(
1162
+ _mm512_set1_epi32((int32_t)(counter >> 32)),
1163
+ carries);
1164
+ *out_lo = low_words;
1165
+ *out_hi = high_words;
1166
+ }
1167
+
1168
+ static
1169
+ void blake3_hash16_avx512(const uint8_t *const *inputs, size_t blocks,
1170
+ const uint32_t key[8], uint64_t counter,
1171
+ bool increment_counter, uint8_t flags,
1172
+ uint8_t flags_start, uint8_t flags_end,
1173
+ uint8_t *out) {
1174
+ __m512i h_vecs[8] = {
1175
+ set1_512(key[0]), set1_512(key[1]), set1_512(key[2]), set1_512(key[3]),
1176
+ set1_512(key[4]), set1_512(key[5]), set1_512(key[6]), set1_512(key[7]),
1177
+ };
1178
+ __m512i counter_low_vec, counter_high_vec;
1179
+ load_counters16(counter, increment_counter, &counter_low_vec,
1180
+ &counter_high_vec);
1181
+ uint8_t block_flags = flags | flags_start;
1182
+
1183
+ for (size_t block = 0; block < blocks; block++) {
1184
+ if (block + 1 == blocks) {
1185
+ block_flags |= flags_end;
1186
+ }
1187
+ __m512i block_len_vec = set1_512(BLAKE3_BLOCK_LEN);
1188
+ __m512i block_flags_vec = set1_512(block_flags);
1189
+ __m512i msg_vecs[16];
1190
+ transpose_msg_vecs16(inputs, block * BLAKE3_BLOCK_LEN, msg_vecs);
1191
+
1192
+ __m512i v[16] = {
1193
+ h_vecs[0], h_vecs[1], h_vecs[2], h_vecs[3],
1194
+ h_vecs[4], h_vecs[5], h_vecs[6], h_vecs[7],
1195
+ set1_512(IV[0]), set1_512(IV[1]), set1_512(IV[2]), set1_512(IV[3]),
1196
+ counter_low_vec, counter_high_vec, block_len_vec, block_flags_vec,
1197
+ };
1198
+ round_fn16(v, msg_vecs, 0);
1199
+ round_fn16(v, msg_vecs, 1);
1200
+ round_fn16(v, msg_vecs, 2);
1201
+ round_fn16(v, msg_vecs, 3);
1202
+ round_fn16(v, msg_vecs, 4);
1203
+ round_fn16(v, msg_vecs, 5);
1204
+ round_fn16(v, msg_vecs, 6);
1205
+ h_vecs[0] = xor_512(v[0], v[8]);
1206
+ h_vecs[1] = xor_512(v[1], v[9]);
1207
+ h_vecs[2] = xor_512(v[2], v[10]);
1208
+ h_vecs[3] = xor_512(v[3], v[11]);
1209
+ h_vecs[4] = xor_512(v[4], v[12]);
1210
+ h_vecs[5] = xor_512(v[5], v[13]);
1211
+ h_vecs[6] = xor_512(v[6], v[14]);
1212
+ h_vecs[7] = xor_512(v[7], v[15]);
1213
+
1214
+ block_flags = flags;
1215
+ }
1216
+
1217
+ // transpose_vecs_512 operates on a 16x16 matrix of words, but we only have 8
1218
+ // state vectors. Pad the matrix with zeros. After transposition, store the
1219
+ // lower half of each vector.
1220
+ __m512i padded[16] = {
1221
+ h_vecs[0], h_vecs[1], h_vecs[2], h_vecs[3],
1222
+ h_vecs[4], h_vecs[5], h_vecs[6], h_vecs[7],
1223
+ set1_512(0), set1_512(0), set1_512(0), set1_512(0),
1224
+ set1_512(0), set1_512(0), set1_512(0), set1_512(0),
1225
+ };
1226
+ transpose_vecs_512(padded);
1227
+ _mm256_mask_storeu_epi32(&out[0 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[0]));
1228
+ _mm256_mask_storeu_epi32(&out[1 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[1]));
1229
+ _mm256_mask_storeu_epi32(&out[2 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[2]));
1230
+ _mm256_mask_storeu_epi32(&out[3 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[3]));
1231
+ _mm256_mask_storeu_epi32(&out[4 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[4]));
1232
+ _mm256_mask_storeu_epi32(&out[5 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[5]));
1233
+ _mm256_mask_storeu_epi32(&out[6 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[6]));
1234
+ _mm256_mask_storeu_epi32(&out[7 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[7]));
1235
+ _mm256_mask_storeu_epi32(&out[8 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[8]));
1236
+ _mm256_mask_storeu_epi32(&out[9 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[9]));
1237
+ _mm256_mask_storeu_epi32(&out[10 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[10]));
1238
+ _mm256_mask_storeu_epi32(&out[11 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[11]));
1239
+ _mm256_mask_storeu_epi32(&out[12 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[12]));
1240
+ _mm256_mask_storeu_epi32(&out[13 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[13]));
1241
+ _mm256_mask_storeu_epi32(&out[14 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[14]));
1242
+ _mm256_mask_storeu_epi32(&out[15 * sizeof(__m256i)], (__mmask8)-1, _mm512_castsi512_si256(padded[15]));
1243
+ }
1244
+
1245
+ static
1246
+ void blake3_xof16_avx512(const uint32_t cv[8],
1247
+ const uint8_t block[BLAKE3_BLOCK_LEN],
1248
+ uint8_t block_len, uint64_t counter, uint8_t flags,
1249
+ uint8_t out[16 * 64]) {
1250
+ __m512i h_vecs[8] = {
1251
+ set1_512(cv[0]), set1_512(cv[1]), set1_512(cv[2]), set1_512(cv[3]),
1252
+ set1_512(cv[4]), set1_512(cv[5]), set1_512(cv[6]), set1_512(cv[7]),
1253
+ };
1254
+ uint32_t block_words[16];
1255
+ load_block_words(block, block_words);
1256
+ __m512i msg_vecs[16];
1257
+ for (size_t i = 0; i < 16; i++) {
1258
+ msg_vecs[i] = set1_512(block_words[i]);
1259
+ }
1260
+ __m512i counter_low_vec, counter_high_vec;
1261
+ load_counters16(counter, true, &counter_low_vec, &counter_high_vec);
1262
+ __m512i block_len_vec = set1_512(block_len);
1263
+ __m512i block_flags_vec = set1_512(flags);
1264
+ __m512i v[16] = {
1265
+ h_vecs[0], h_vecs[1], h_vecs[2], h_vecs[3],
1266
+ h_vecs[4], h_vecs[5], h_vecs[6], h_vecs[7],
1267
+ set1_512(IV[0]), set1_512(IV[1]), set1_512(IV[2]), set1_512(IV[3]),
1268
+ counter_low_vec, counter_high_vec, block_len_vec, block_flags_vec,
1269
+ };
1270
+ round_fn16(v, msg_vecs, 0);
1271
+ round_fn16(v, msg_vecs, 1);
1272
+ round_fn16(v, msg_vecs, 2);
1273
+ round_fn16(v, msg_vecs, 3);
1274
+ round_fn16(v, msg_vecs, 4);
1275
+ round_fn16(v, msg_vecs, 5);
1276
+ round_fn16(v, msg_vecs, 6);
1277
+ for (size_t i = 0; i < 8; i++) {
1278
+ v[i] = xor_512(v[i], v[i+8]);
1279
+ v[i+8] = xor_512(v[i+8], h_vecs[i]);
1280
+ }
1281
+ transpose_vecs_512(&v[0]);
1282
+ for (size_t i = 0; i < 16; i++) {
1283
+ storeu_512(v[i], &out[i * sizeof(__m512i)]);
1284
+ }
1285
+ }
1286
+
1287
+ /*
1288
+ * ----------------------------------------------------------------------------
1289
+ * hash_many_avx512
1290
+ * ----------------------------------------------------------------------------
1291
+ */
1292
+
1293
+ INLINE void hash_one_avx512(const uint8_t *input, size_t blocks,
1294
+ const uint32_t key[8], uint64_t counter,
1295
+ uint8_t flags, uint8_t flags_start,
1296
+ uint8_t flags_end, uint8_t out[BLAKE3_OUT_LEN]) {
1297
+ uint32_t cv[8];
1298
+ memcpy(cv, key, BLAKE3_KEY_LEN);
1299
+ uint8_t block_flags = flags | flags_start;
1300
+ while (blocks > 0) {
1301
+ if (blocks == 1) {
1302
+ block_flags |= flags_end;
1303
+ }
1304
+ blake3_compress_in_place_avx512(cv, input, BLAKE3_BLOCK_LEN, counter,
1305
+ block_flags);
1306
+ input = &input[BLAKE3_BLOCK_LEN];
1307
+ blocks -= 1;
1308
+ block_flags = flags;
1309
+ }
1310
+ memcpy(out, cv, BLAKE3_OUT_LEN);
1311
+ }
1312
+
1313
+ void blake3_hash_many_avx512(const uint8_t *const *inputs, size_t num_inputs,
1314
+ size_t blocks, const uint32_t key[8],
1315
+ uint64_t counter, bool increment_counter,
1316
+ uint8_t flags, uint8_t flags_start,
1317
+ uint8_t flags_end, uint8_t *out) {
1318
+ while (num_inputs >= 16) {
1319
+ blake3_hash16_avx512(inputs, blocks, key, counter, increment_counter, flags,
1320
+ flags_start, flags_end, out);
1321
+ if (increment_counter) {
1322
+ counter += 16;
1323
+ }
1324
+ inputs += 16;
1325
+ num_inputs -= 16;
1326
+ out = &out[16 * BLAKE3_OUT_LEN];
1327
+ }
1328
+ while (num_inputs >= 8) {
1329
+ blake3_hash8_avx512(inputs, blocks, key, counter, increment_counter, flags,
1330
+ flags_start, flags_end, out);
1331
+ if (increment_counter) {
1332
+ counter += 8;
1333
+ }
1334
+ inputs += 8;
1335
+ num_inputs -= 8;
1336
+ out = &out[8 * BLAKE3_OUT_LEN];
1337
+ }
1338
+ while (num_inputs >= 4) {
1339
+ blake3_hash4_avx512(inputs, blocks, key, counter, increment_counter, flags,
1340
+ flags_start, flags_end, out);
1341
+ if (increment_counter) {
1342
+ counter += 4;
1343
+ }
1344
+ inputs += 4;
1345
+ num_inputs -= 4;
1346
+ out = &out[4 * BLAKE3_OUT_LEN];
1347
+ }
1348
+ while (num_inputs > 0) {
1349
+ hash_one_avx512(inputs[0], blocks, key, counter, flags, flags_start,
1350
+ flags_end, out);
1351
+ if (increment_counter) {
1352
+ counter += 1;
1353
+ }
1354
+ inputs += 1;
1355
+ num_inputs -= 1;
1356
+ out = &out[BLAKE3_OUT_LEN];
1357
+ }
1358
+ }
1359
+
1360
+ void blake3_xof_many_avx512(const uint32_t cv[8],
1361
+ const uint8_t block[BLAKE3_BLOCK_LEN],
1362
+ uint8_t block_len, uint64_t counter, uint8_t flags,
1363
+ uint8_t* out, size_t outblocks) {
1364
+ while (outblocks >= 16) {
1365
+ blake3_xof16_avx512(cv, block, block_len, counter, flags, out);
1366
+ counter += 16;
1367
+ outblocks -= 16;
1368
+ out += 16 * BLAKE3_BLOCK_LEN;
1369
+ }
1370
+ while (outblocks >= 8) {
1371
+ blake3_xof8_avx512(cv, block, block_len, counter, flags, out);
1372
+ counter += 8;
1373
+ outblocks -= 8;
1374
+ out += 8 * BLAKE3_BLOCK_LEN;
1375
+ }
1376
+ while (outblocks >= 4) {
1377
+ blake3_xof4_avx512(cv, block, block_len, counter, flags, out);
1378
+ counter += 4;
1379
+ outblocks -= 4;
1380
+ out += 4 * BLAKE3_BLOCK_LEN;
1381
+ }
1382
+ while (outblocks > 0) {
1383
+ blake3_compress_xof_avx512(cv, block, block_len, counter, flags, out);
1384
+ counter += 1;
1385
+ outblocks -= 1;
1386
+ out += BLAKE3_BLOCK_LEN;
1387
+ }
1388
+ }