pq_crypto 0.6.1 → 0.6.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (141) hide show
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +5 -0
  3. data/SECURITY.md +7 -0
  4. data/ext/pqcrypto/pqcrypto_version.h +1 -1
  5. data/ext/pqcrypto/vendor/.vendored +4 -4
  6. data/ext/pqcrypto/vendor/mldsa-native/README.md +23 -10
  7. data/ext/pqcrypto/vendor/mldsa-native/mldsa/README.md +23 -0
  8. data/ext/pqcrypto/vendor/mldsa-native/mldsa/mldsa_native.c +114 -58
  9. data/ext/pqcrypto/vendor/mldsa-native/mldsa/mldsa_native.h +498 -461
  10. data/ext/pqcrypto/vendor/mldsa-native/mldsa/mldsa_native_asm.S +145 -85
  11. data/ext/pqcrypto/vendor/mldsa-native/mldsa/mldsa_native_config.h +456 -422
  12. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/cbmc.h +47 -25
  13. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/common.h +26 -14
  14. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/ct.h +56 -81
  15. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/debug.h +17 -24
  16. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/fips202.c +33 -40
  17. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/fips202.h +67 -87
  18. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/fips202x4.c +19 -14
  19. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/fips202x4.h +13 -5
  20. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/keccakf1600.c +84 -10
  21. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/keccakf1600.h +10 -5
  22. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/auto.h +6 -0
  23. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/fips202_native_aarch64.h +22 -15
  24. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x1_scalar_aarch64_asm.S +376 -0
  25. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x1_v84a_aarch64_asm.S +204 -0
  26. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x2_v84a_aarch64_asm.S +259 -0
  27. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x4_v8a_scalar_hybrid_aarch64_asm.S +1077 -0
  28. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x4_v8a_v84a_scalar_hybrid_aarch64_asm.S +987 -0
  29. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccakf1600_round_constants.c +16 -10
  30. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/x1_scalar.h +2 -1
  31. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/x1_v84a.h +1 -1
  32. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/x2_v84a.h +4 -2
  33. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/x4_v8a_scalar.h +2 -2
  34. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/x4_v8a_v84a_scalar.h +1 -1
  35. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/api.h +60 -0
  36. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/mve.h +48 -0
  37. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/fips202_native_armv81m.h +18 -1
  38. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/keccak_f1600_x4_mve.S +658 -582
  39. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/keccak_f1600_x4_mve.c +5 -100
  40. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/keccakf1600_round_constants.c +26 -25
  41. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/state_extract_bytes_x4_mve.S +334 -0
  42. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/state_xor_bytes_x4_mve.S +355 -0
  43. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/auto.h +8 -3
  44. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/{xkcp.h → keccak_f1600_x4_avx2.h} +11 -8
  45. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/src/fips202_native_x86_64.h +44 -0
  46. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/src/keccak_f1600_x4_avx2_asm.S +454 -0
  47. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/src/keccakf1600_constants.c +52 -0
  48. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/meta.h +37 -28
  49. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/aarch64_zetas.c +213 -196
  50. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/arith_native_aarch64.h +248 -64
  51. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/intt_aarch64_asm.S +753 -0
  52. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l4_aarch64_asm.S +129 -0
  53. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l5_aarch64_asm.S +145 -0
  54. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l7_aarch64_asm.S +177 -0
  55. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/ntt_aarch64_asm.S +653 -0
  56. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/pointwise_montgomery_aarch64_asm.S +84 -0
  57. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_caddq_aarch64_asm.S +53 -0
  58. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_chknorm_aarch64_asm.S +55 -0
  59. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_decompose_32_aarch64_asm.S +86 -0
  60. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_decompose_88_aarch64_asm.S +86 -0
  61. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_use_hint_32_aarch64_asm.S +103 -0
  62. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_use_hint_88_aarch64_asm.S +111 -0
  63. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/polyz_unpack_17_aarch64_asm.S +75 -0
  64. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/polyz_unpack_19_aarch64_asm.S +72 -0
  65. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/polyz_unpack_table.c +23 -11
  66. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_aarch64_asm.S +189 -0
  67. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_eta2_aarch64_asm.S +137 -0
  68. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_eta4_aarch64_asm.S +130 -0
  69. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_eta_table.c +520 -516
  70. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_table.c +34 -33
  71. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/api.h +202 -242
  72. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/meta.h +25 -17
  73. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/arith_native_x86_64.h +112 -28
  74. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/consts.c +1 -1
  75. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/consts.h +1 -1
  76. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/intt_avx2_asm.S +2311 -0
  77. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/ntt_avx2_asm.S +2383 -0
  78. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/nttunpack_avx2_asm.S +238 -0
  79. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l4_avx2_asm.S +139 -0
  80. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l5_avx2_asm.S +155 -0
  81. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l7_avx2_asm.S +187 -0
  82. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_avx2_asm.S +130 -0
  83. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_caddq_avx2_asm.S +190 -0
  84. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_decompose_32_avx2.c +6 -4
  85. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_decompose_88_avx2.c +6 -4
  86. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_use_hint_32_avx2.c +9 -8
  87. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_use_hint_88_avx2.c +10 -9
  88. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/polyz_unpack_17_avx2.c +8 -5
  89. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/polyz_unpack_19_avx2.c +8 -5
  90. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/rej_uniform_eta2_avx2.c +6 -4
  91. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/rej_uniform_eta4_avx2.c +6 -4
  92. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/rej_uniform_table.c +130 -129
  93. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/packing.c +109 -180
  94. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/packing.h +169 -150
  95. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/poly.c +56 -40
  96. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/poly.h +149 -164
  97. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/poly_kl.c +52 -57
  98. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/poly_kl.h +132 -167
  99. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/polyvec.c +57 -424
  100. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/polyvec.h +167 -474
  101. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/polyvec_lazy.c +308 -0
  102. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/polyvec_lazy.h +653 -0
  103. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/reduce.h +22 -29
  104. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/rounding.h +37 -43
  105. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/sign.c +511 -367
  106. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/sign.h +456 -417
  107. data/lib/pq_crypto/version.rb +1 -1
  108. data/script/vendor_libs.rb +3 -3
  109. metadata +41 -35
  110. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x1_scalar_asm.S +0 -376
  111. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x1_v84a_asm.S +0 -204
  112. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x2_v84a_asm.S +0 -259
  113. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x4_v8a_scalar_hybrid_asm.S +0 -1077
  114. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x4_v8a_v84a_scalar_hybrid_asm.S +0 -987
  115. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/src/KeccakP_1600_times4_SIMD256.c +0 -488
  116. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/src/KeccakP_1600_times4_SIMD256.h +0 -16
  117. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/intt.S +0 -753
  118. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l4.S +0 -129
  119. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l5.S +0 -145
  120. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l7.S +0 -177
  121. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/ntt.S +0 -653
  122. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/pointwise_montgomery.S +0 -79
  123. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_caddq_asm.S +0 -53
  124. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_chknorm_asm.S +0 -55
  125. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_decompose_32_asm.S +0 -85
  126. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_decompose_88_asm.S +0 -85
  127. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_use_hint_32_asm.S +0 -102
  128. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_use_hint_88_asm.S +0 -110
  129. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/polyz_unpack_17_asm.S +0 -72
  130. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/polyz_unpack_19_asm.S +0 -69
  131. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_asm.S +0 -189
  132. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_eta2_asm.S +0 -135
  133. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_eta4_asm.S +0 -128
  134. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/intt.S +0 -2311
  135. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/ntt.S +0 -2383
  136. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/nttunpack.S +0 -239
  137. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise.S +0 -131
  138. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l4.S +0 -139
  139. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l5.S +0 -155
  140. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l7.S +0 -187
  141. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_caddq_avx2.c +0 -61
@@ -1,204 +0,0 @@
1
- /*
2
- * Copyright (c) The mlkem-native project authors
3
- * Copyright (c) The mldsa-native project authors
4
- * Copyright (c) 2021-2022 Arm Limited
5
- * Copyright (c) 2022 Matthias Kannwischer
6
- * SPDX-License-Identifier: Apache-2.0 OR ISC OR MIT
7
- */
8
-
9
- /* References
10
- * ==========
11
- *
12
- * - [HYBRID]
13
- * Hybrid scalar/vector implementations of Keccak and SPHINCS+ on AArch64
14
- * Becker, Kannwischer
15
- * https://eprint.iacr.org/2022/1243
16
- */
17
-
18
- /*yaml
19
- Name: keccak_f1600_x1_v84a_asm
20
- Description: AArch64 ARMv8.4-A implementation of Keccak-f[1600] permutation for single state
21
- Signature: void mld_keccak_f1600_x1_v84a_asm(uint64_t state[25], const uint64_t rc[24])
22
- ABI:
23
- x0:
24
- type: buffer
25
- size_bytes: 200
26
- permissions: read/write
27
- c_parameter: uint64_t state[25]
28
- description: Keccak state (25 x uint64_t)
29
- x1:
30
- type: buffer
31
- size_bytes: 192
32
- permissions: read-only
33
- c_parameter: const uint64_t rc[24]
34
- description: Round constants (24 x uint64_t)
35
- Stack:
36
- bytes: 64
37
- description: register preservation
38
- */
39
-
40
- //
41
- // Author: Hanno Becker <hanno.becker@arm.com>
42
- // Author: Matthias Kannwischer <matthias@kannwischer.eu>
43
- //
44
- // This implementation is essentially from the paper @[HYBRID].
45
- // The only difference is interleaving/deinterleaving of Keccak state
46
- // during load and store, so that the caller need not do this.
47
- //
48
-
49
- #include "../../../../common.h"
50
- #if defined(MLD_FIPS202_AARCH64_NEED_X1_V84A) && \
51
- !defined(MLD_CONFIG_MULTILEVEL_NO_SHARED)
52
-
53
- #if defined(__ARM_FEATURE_SHA3)
54
-
55
- /*
56
- * WARNING: This file is auto-derived from the mldsa-native source file
57
- * dev/fips202/aarch64/src/keccak_f1600_x1_v84a_asm.S using scripts/simpasm. Do not modify it directly.
58
- */
59
-
60
- #if defined(__ELF__)
61
- .section .note.GNU-stack,"",@progbits
62
- #endif
63
-
64
- .text
65
- .balign 4
66
- .global MLD_ASM_NAMESPACE(keccak_f1600_x1_v84a_asm)
67
- MLD_ASM_FN_SYMBOL(keccak_f1600_x1_v84a_asm)
68
-
69
- .cfi_startproc
70
- sub sp, sp, #0x40
71
- .cfi_adjust_cfa_offset 0x40
72
- stp d8, d9, [sp]
73
- .cfi_rel_offset d8, 0x0
74
- .cfi_rel_offset d9, 0x8
75
- stp d10, d11, [sp, #0x10]
76
- .cfi_rel_offset d10, 0x10
77
- .cfi_rel_offset d11, 0x18
78
- stp d12, d13, [sp, #0x20]
79
- .cfi_rel_offset d12, 0x20
80
- .cfi_rel_offset d13, 0x28
81
- stp d14, d15, [sp, #0x30]
82
- .cfi_rel_offset d14, 0x30
83
- .cfi_rel_offset d15, 0x38
84
- ldp d0, d1, [x0]
85
- ldp d2, d3, [x0, #0x10]
86
- ldp d4, d5, [x0, #0x20]
87
- ldp d6, d7, [x0, #0x30]
88
- ldp d8, d9, [x0, #0x40]
89
- ldp d10, d11, [x0, #0x50]
90
- ldp d12, d13, [x0, #0x60]
91
- ldp d14, d15, [x0, #0x70]
92
- ldp d16, d17, [x0, #0x80]
93
- ldp d18, d19, [x0, #0x90]
94
- ldp d20, d21, [x0, #0xa0]
95
- ldp d22, d23, [x0, #0xb0]
96
- ldr d24, [x0, #0xc0]
97
- mov x2, #0x18 // =24
98
-
99
- Lkeccak_f1600_x1_v84a_loop:
100
- eor3 v30.16b, v0.16b, v5.16b, v10.16b
101
- eor3 v29.16b, v1.16b, v6.16b, v11.16b
102
- eor3 v28.16b, v2.16b, v7.16b, v12.16b
103
- eor3 v27.16b, v3.16b, v8.16b, v13.16b
104
- eor3 v26.16b, v4.16b, v9.16b, v14.16b
105
- eor3 v30.16b, v30.16b, v15.16b, v20.16b
106
- eor3 v29.16b, v29.16b, v16.16b, v21.16b
107
- eor3 v28.16b, v28.16b, v17.16b, v22.16b
108
- eor3 v27.16b, v27.16b, v18.16b, v23.16b
109
- eor3 v26.16b, v26.16b, v19.16b, v24.16b
110
- rax1 v25.2d, v30.2d, v28.2d
111
- rax1 v28.2d, v28.2d, v26.2d
112
- rax1 v26.2d, v26.2d, v29.2d
113
- rax1 v29.2d, v29.2d, v27.2d
114
- rax1 v27.2d, v27.2d, v30.2d
115
- eor v30.16b, v0.16b, v26.16b
116
- xar v0.2d, v2.2d, v29.2d, #0x2
117
- xar v2.2d, v12.2d, v29.2d, #0x15
118
- xar v12.2d, v13.2d, v28.2d, #0x27
119
- xar v13.2d, v19.2d, v27.2d, #0x38
120
- xar v19.2d, v23.2d, v28.2d, #0x8
121
- xar v23.2d, v15.2d, v26.2d, #0x17
122
- xar v15.2d, v1.2d, v25.2d, #0x3f
123
- xar v1.2d, v8.2d, v28.2d, #0x9
124
- xar v8.2d, v16.2d, v25.2d, #0x13
125
- xar v16.2d, v7.2d, v29.2d, #0x3a
126
- xar v7.2d, v10.2d, v26.2d, #0x3d
127
- xar v10.2d, v3.2d, v28.2d, #0x24
128
- xar v3.2d, v18.2d, v28.2d, #0x2b
129
- xar v18.2d, v17.2d, v29.2d, #0x31
130
- xar v17.2d, v11.2d, v25.2d, #0x36
131
- xar v11.2d, v9.2d, v27.2d, #0x2c
132
- xar v9.2d, v22.2d, v29.2d, #0x3
133
- xar v22.2d, v14.2d, v27.2d, #0x19
134
- xar v14.2d, v20.2d, v26.2d, #0x2e
135
- xar v20.2d, v4.2d, v27.2d, #0x25
136
- xar v4.2d, v24.2d, v27.2d, #0x32
137
- xar v24.2d, v21.2d, v25.2d, #0x3e
138
- xar v21.2d, v5.2d, v26.2d, #0x1c
139
- xar v27.2d, v6.2d, v25.2d, #0x14
140
- ld1r { v31.2d }, [x1], #8
141
- bcax v5.16b, v10.16b, v7.16b, v11.16b
142
- bcax v6.16b, v11.16b, v8.16b, v7.16b
143
- bcax v7.16b, v7.16b, v9.16b, v8.16b
144
- bcax v8.16b, v8.16b, v10.16b, v9.16b
145
- bcax v9.16b, v9.16b, v11.16b, v10.16b
146
- bcax v10.16b, v15.16b, v12.16b, v16.16b
147
- bcax v11.16b, v16.16b, v13.16b, v12.16b
148
- bcax v12.16b, v12.16b, v14.16b, v13.16b
149
- bcax v13.16b, v13.16b, v15.16b, v14.16b
150
- bcax v14.16b, v14.16b, v16.16b, v15.16b
151
- bcax v15.16b, v20.16b, v17.16b, v21.16b
152
- bcax v16.16b, v21.16b, v18.16b, v17.16b
153
- bcax v17.16b, v17.16b, v19.16b, v18.16b
154
- bcax v18.16b, v18.16b, v20.16b, v19.16b
155
- bcax v19.16b, v19.16b, v21.16b, v20.16b
156
- bcax v20.16b, v0.16b, v22.16b, v1.16b
157
- bcax v21.16b, v1.16b, v23.16b, v22.16b
158
- bcax v22.16b, v22.16b, v24.16b, v23.16b
159
- bcax v23.16b, v23.16b, v0.16b, v24.16b
160
- bcax v24.16b, v24.16b, v1.16b, v0.16b
161
- bcax v0.16b, v30.16b, v2.16b, v27.16b
162
- bcax v1.16b, v27.16b, v3.16b, v2.16b
163
- bcax v2.16b, v2.16b, v4.16b, v3.16b
164
- bcax v3.16b, v3.16b, v30.16b, v4.16b
165
- bcax v4.16b, v4.16b, v27.16b, v30.16b
166
- eor v0.16b, v0.16b, v31.16b
167
- sub x2, x2, #0x1
168
- cbnz x2, Lkeccak_f1600_x1_v84a_loop
169
- stp d0, d1, [x0]
170
- stp d2, d3, [x0, #0x10]
171
- stp d4, d5, [x0, #0x20]
172
- stp d6, d7, [x0, #0x30]
173
- stp d8, d9, [x0, #0x40]
174
- stp d10, d11, [x0, #0x50]
175
- stp d12, d13, [x0, #0x60]
176
- stp d14, d15, [x0, #0x70]
177
- stp d16, d17, [x0, #0x80]
178
- stp d18, d19, [x0, #0x90]
179
- stp d20, d21, [x0, #0xa0]
180
- stp d22, d23, [x0, #0xb0]
181
- str d24, [x0, #0xc0]
182
- ldp d8, d9, [sp]
183
- .cfi_restore d8
184
- .cfi_restore d9
185
- ldp d10, d11, [sp, #0x10]
186
- .cfi_restore d10
187
- .cfi_restore d11
188
- ldp d12, d13, [sp, #0x20]
189
- .cfi_restore d12
190
- .cfi_restore d13
191
- ldp d14, d15, [sp, #0x30]
192
- .cfi_restore d14
193
- .cfi_restore d15
194
- add sp, sp, #0x40
195
- .cfi_adjust_cfa_offset -0x40
196
- ret
197
- .cfi_endproc
198
-
199
- MLD_ASM_FN_SIZE(keccak_f1600_x1_v84a_asm)
200
-
201
- #endif /* __ARM_FEATURE_SHA3 */
202
-
203
- #endif /* MLD_FIPS202_AARCH64_NEED_X1_V84A && !MLD_CONFIG_MULTILEVEL_NO_SHARED \
204
- */
@@ -1,259 +0,0 @@
1
- /*
2
- * Copyright (c) The mlkem-native project authors
3
- * Copyright (c) The mldsa-native project authors
4
- * Copyright (c) 2021-2022 Arm Limited
5
- * Copyright (c) 2022 Matthias Kannwischer
6
- * SPDX-License-Identifier: Apache-2.0 OR ISC OR MIT
7
- */
8
-
9
- /* References
10
- * ==========
11
- *
12
- * - [HYBRID]
13
- * Hybrid scalar/vector implementations of Keccak and SPHINCS+ on AArch64
14
- * Becker, Kannwischer
15
- * https://eprint.iacr.org/2022/1243
16
- */
17
-
18
- /*yaml
19
- Name: keccak_f1600_x2_v84a_asm
20
- Description: AArch64 ARMv8.4-A implementation of Keccak-f[1600] permutation for two sequential states
21
- Signature: void mld_keccak_f1600_x2_v84a_asm(uint64_t state[50], const uint64_t rc[24])
22
- ABI:
23
- x0:
24
- type: buffer
25
- size_bytes: 400
26
- permissions: read/write
27
- c_parameter: uint64_t state[50]
28
- description: Two sequential Keccak states (state0[25], state1[25])
29
- x1:
30
- type: buffer
31
- size_bytes: 192
32
- permissions: read-only
33
- c_parameter: const uint64_t rc[24]
34
- description: Round constants (24 x uint64_t)
35
- Stack:
36
- bytes: 64
37
- description: register preservation
38
- */
39
-
40
- //
41
- // Author: Hanno Becker <hanno.becker@arm.com>
42
- // Author: Matthias Kannwischer <matthias@kannwischer.eu>
43
- //
44
- // This implementation is essentially from the paper @[HYBRID].
45
- // The only difference is interleaving/deinterleaving of Keccak state
46
- // during load and store, so that the caller need not do this.
47
- //
48
-
49
- #include "../../../../common.h"
50
- #if defined(MLD_FIPS202_AARCH64_NEED_X2_V84A) && \
51
- !defined(MLD_CONFIG_MULTILEVEL_NO_SHARED)
52
-
53
- #if defined(__ARM_FEATURE_SHA3)
54
-
55
- /*
56
- * WARNING: This file is auto-derived from the mldsa-native source file
57
- * dev/fips202/aarch64/src/keccak_f1600_x2_v84a_asm.S using scripts/simpasm. Do not modify it directly.
58
- */
59
-
60
- #if defined(__ELF__)
61
- .section .note.GNU-stack,"",@progbits
62
- #endif
63
-
64
- .text
65
- .balign 4
66
- .global MLD_ASM_NAMESPACE(keccak_f1600_x2_v84a_asm)
67
- MLD_ASM_FN_SYMBOL(keccak_f1600_x2_v84a_asm)
68
-
69
- .cfi_startproc
70
- sub sp, sp, #0x40
71
- .cfi_adjust_cfa_offset 0x40
72
- stp d8, d9, [sp]
73
- .cfi_rel_offset d8, 0x0
74
- .cfi_rel_offset d9, 0x8
75
- stp d10, d11, [sp, #0x10]
76
- .cfi_rel_offset d10, 0x10
77
- .cfi_rel_offset d11, 0x18
78
- stp d12, d13, [sp, #0x20]
79
- .cfi_rel_offset d12, 0x20
80
- .cfi_rel_offset d13, 0x28
81
- stp d14, d15, [sp, #0x30]
82
- .cfi_rel_offset d14, 0x30
83
- .cfi_rel_offset d15, 0x38
84
- add x2, x0, #0xc8
85
- ldp q25, q26, [x0], #0x20
86
- ld1 { v27.2d, v28.2d }, [x2], #32
87
- trn1 v0.2d, v25.2d, v27.2d
88
- trn2 v1.2d, v25.2d, v27.2d
89
- trn1 v2.2d, v26.2d, v28.2d
90
- trn2 v3.2d, v26.2d, v28.2d
91
- ldp q25, q26, [x0], #0x20
92
- ld1 { v27.2d, v28.2d }, [x2], #32
93
- trn1 v4.2d, v25.2d, v27.2d
94
- trn2 v5.2d, v25.2d, v27.2d
95
- trn1 v6.2d, v26.2d, v28.2d
96
- trn2 v7.2d, v26.2d, v28.2d
97
- ldp q25, q26, [x0], #0x20
98
- ld1 { v27.2d, v28.2d }, [x2], #32
99
- trn1 v8.2d, v25.2d, v27.2d
100
- trn2 v9.2d, v25.2d, v27.2d
101
- trn1 v10.2d, v26.2d, v28.2d
102
- trn2 v11.2d, v26.2d, v28.2d
103
- ldp q25, q26, [x0], #0x20
104
- ld1 { v27.2d, v28.2d }, [x2], #32
105
- trn1 v12.2d, v25.2d, v27.2d
106
- trn2 v13.2d, v25.2d, v27.2d
107
- trn1 v14.2d, v26.2d, v28.2d
108
- trn2 v15.2d, v26.2d, v28.2d
109
- ldp q25, q26, [x0], #0x20
110
- ld1 { v27.2d, v28.2d }, [x2], #32
111
- trn1 v16.2d, v25.2d, v27.2d
112
- trn2 v17.2d, v25.2d, v27.2d
113
- trn1 v18.2d, v26.2d, v28.2d
114
- trn2 v19.2d, v26.2d, v28.2d
115
- ldp q25, q26, [x0], #0x20
116
- ld1 { v27.2d, v28.2d }, [x2], #32
117
- trn1 v20.2d, v25.2d, v27.2d
118
- trn2 v21.2d, v25.2d, v27.2d
119
- trn1 v22.2d, v26.2d, v28.2d
120
- trn2 v23.2d, v26.2d, v28.2d
121
- ldr d25, [x0]
122
- ldr d27, [x2]
123
- trn1 v24.2d, v25.2d, v27.2d
124
- mov x2, #0x18 // =24
125
-
126
- Lkeccak_f1600_x2_v84a_loop:
127
- eor3 v30.16b, v0.16b, v5.16b, v10.16b
128
- eor3 v29.16b, v1.16b, v6.16b, v11.16b
129
- eor3 v28.16b, v2.16b, v7.16b, v12.16b
130
- eor3 v27.16b, v3.16b, v8.16b, v13.16b
131
- eor3 v26.16b, v4.16b, v9.16b, v14.16b
132
- eor3 v30.16b, v30.16b, v15.16b, v20.16b
133
- eor3 v29.16b, v29.16b, v16.16b, v21.16b
134
- eor3 v28.16b, v28.16b, v17.16b, v22.16b
135
- eor3 v27.16b, v27.16b, v18.16b, v23.16b
136
- eor3 v26.16b, v26.16b, v19.16b, v24.16b
137
- rax1 v25.2d, v30.2d, v28.2d
138
- rax1 v28.2d, v28.2d, v26.2d
139
- rax1 v26.2d, v26.2d, v29.2d
140
- rax1 v29.2d, v29.2d, v27.2d
141
- rax1 v27.2d, v27.2d, v30.2d
142
- eor v30.16b, v0.16b, v26.16b
143
- xar v0.2d, v2.2d, v29.2d, #0x2
144
- xar v2.2d, v12.2d, v29.2d, #0x15
145
- xar v12.2d, v13.2d, v28.2d, #0x27
146
- xar v13.2d, v19.2d, v27.2d, #0x38
147
- xar v19.2d, v23.2d, v28.2d, #0x8
148
- xar v23.2d, v15.2d, v26.2d, #0x17
149
- xar v15.2d, v1.2d, v25.2d, #0x3f
150
- xar v1.2d, v8.2d, v28.2d, #0x9
151
- xar v8.2d, v16.2d, v25.2d, #0x13
152
- xar v16.2d, v7.2d, v29.2d, #0x3a
153
- xar v7.2d, v10.2d, v26.2d, #0x3d
154
- xar v10.2d, v3.2d, v28.2d, #0x24
155
- xar v3.2d, v18.2d, v28.2d, #0x2b
156
- xar v18.2d, v17.2d, v29.2d, #0x31
157
- xar v17.2d, v11.2d, v25.2d, #0x36
158
- xar v11.2d, v9.2d, v27.2d, #0x2c
159
- xar v9.2d, v22.2d, v29.2d, #0x3
160
- xar v22.2d, v14.2d, v27.2d, #0x19
161
- xar v14.2d, v20.2d, v26.2d, #0x2e
162
- xar v20.2d, v4.2d, v27.2d, #0x25
163
- xar v4.2d, v24.2d, v27.2d, #0x32
164
- xar v24.2d, v21.2d, v25.2d, #0x3e
165
- xar v21.2d, v5.2d, v26.2d, #0x1c
166
- xar v27.2d, v6.2d, v25.2d, #0x14
167
- ld1r { v31.2d }, [x1], #8
168
- bcax v5.16b, v10.16b, v7.16b, v11.16b
169
- bcax v6.16b, v11.16b, v8.16b, v7.16b
170
- bcax v7.16b, v7.16b, v9.16b, v8.16b
171
- bcax v8.16b, v8.16b, v10.16b, v9.16b
172
- bcax v9.16b, v9.16b, v11.16b, v10.16b
173
- bcax v10.16b, v15.16b, v12.16b, v16.16b
174
- bcax v11.16b, v16.16b, v13.16b, v12.16b
175
- bcax v12.16b, v12.16b, v14.16b, v13.16b
176
- bcax v13.16b, v13.16b, v15.16b, v14.16b
177
- bcax v14.16b, v14.16b, v16.16b, v15.16b
178
- bcax v15.16b, v20.16b, v17.16b, v21.16b
179
- bcax v16.16b, v21.16b, v18.16b, v17.16b
180
- bcax v17.16b, v17.16b, v19.16b, v18.16b
181
- bcax v18.16b, v18.16b, v20.16b, v19.16b
182
- bcax v19.16b, v19.16b, v21.16b, v20.16b
183
- bcax v20.16b, v0.16b, v22.16b, v1.16b
184
- bcax v21.16b, v1.16b, v23.16b, v22.16b
185
- bcax v22.16b, v22.16b, v24.16b, v23.16b
186
- bcax v23.16b, v23.16b, v0.16b, v24.16b
187
- bcax v24.16b, v24.16b, v1.16b, v0.16b
188
- bcax v0.16b, v30.16b, v2.16b, v27.16b
189
- bcax v1.16b, v27.16b, v3.16b, v2.16b
190
- bcax v2.16b, v2.16b, v4.16b, v3.16b
191
- bcax v3.16b, v3.16b, v30.16b, v4.16b
192
- bcax v4.16b, v4.16b, v27.16b, v30.16b
193
- eor v0.16b, v0.16b, v31.16b
194
- sub x2, x2, #0x1
195
- cbnz x2, Lkeccak_f1600_x2_v84a_loop
196
- sub x0, x0, #0xc0
197
- add x2, x0, #0xc8
198
- trn1 v25.2d, v0.2d, v1.2d
199
- trn1 v26.2d, v2.2d, v3.2d
200
- stp q25, q26, [x0], #0x20
201
- trn2 v27.2d, v0.2d, v1.2d
202
- trn2 v28.2d, v2.2d, v3.2d
203
- st1 { v27.2d, v28.2d }, [x2], #32
204
- trn1 v25.2d, v4.2d, v5.2d
205
- trn1 v26.2d, v6.2d, v7.2d
206
- stp q25, q26, [x0], #0x20
207
- trn2 v27.2d, v4.2d, v5.2d
208
- trn2 v28.2d, v6.2d, v7.2d
209
- st1 { v27.2d, v28.2d }, [x2], #32
210
- trn1 v25.2d, v8.2d, v9.2d
211
- trn1 v26.2d, v10.2d, v11.2d
212
- stp q25, q26, [x0], #0x20
213
- trn2 v27.2d, v8.2d, v9.2d
214
- trn2 v28.2d, v10.2d, v11.2d
215
- st1 { v27.2d, v28.2d }, [x2], #32
216
- trn1 v25.2d, v12.2d, v13.2d
217
- trn1 v26.2d, v14.2d, v15.2d
218
- stp q25, q26, [x0], #0x20
219
- trn2 v27.2d, v12.2d, v13.2d
220
- trn2 v28.2d, v14.2d, v15.2d
221
- st1 { v27.2d, v28.2d }, [x2], #32
222
- trn1 v25.2d, v16.2d, v17.2d
223
- trn1 v26.2d, v18.2d, v19.2d
224
- stp q25, q26, [x0], #0x20
225
- trn2 v27.2d, v16.2d, v17.2d
226
- trn2 v28.2d, v18.2d, v19.2d
227
- st1 { v27.2d, v28.2d }, [x2], #32
228
- trn1 v25.2d, v20.2d, v21.2d
229
- trn1 v26.2d, v22.2d, v23.2d
230
- stp q25, q26, [x0], #0x20
231
- trn2 v27.2d, v20.2d, v21.2d
232
- trn2 v28.2d, v22.2d, v23.2d
233
- st1 { v27.2d, v28.2d }, [x2], #32
234
- str d24, [x0]
235
- trn2 v25.2d, v24.2d, v24.2d
236
- str d25, [x2]
237
- ldp d8, d9, [sp]
238
- .cfi_restore d8
239
- .cfi_restore d9
240
- ldp d10, d11, [sp, #0x10]
241
- .cfi_restore d10
242
- .cfi_restore d11
243
- ldp d12, d13, [sp, #0x20]
244
- .cfi_restore d12
245
- .cfi_restore d13
246
- ldp d14, d15, [sp, #0x30]
247
- .cfi_restore d14
248
- .cfi_restore d15
249
- add sp, sp, #0x40
250
- .cfi_adjust_cfa_offset -0x40
251
- ret
252
- .cfi_endproc
253
-
254
- MLD_ASM_FN_SIZE(keccak_f1600_x2_v84a_asm)
255
-
256
- #endif /* __ARM_FEATURE_SHA3 */
257
-
258
- #endif /* MLD_FIPS202_AARCH64_NEED_X2_V84A && !MLD_CONFIG_MULTILEVEL_NO_SHARED \
259
- */