pq_crypto 0.6.1 → 0.6.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (141) hide show
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +5 -0
  3. data/SECURITY.md +7 -0
  4. data/ext/pqcrypto/pqcrypto_version.h +1 -1
  5. data/ext/pqcrypto/vendor/.vendored +4 -4
  6. data/ext/pqcrypto/vendor/mldsa-native/README.md +23 -10
  7. data/ext/pqcrypto/vendor/mldsa-native/mldsa/README.md +23 -0
  8. data/ext/pqcrypto/vendor/mldsa-native/mldsa/mldsa_native.c +114 -58
  9. data/ext/pqcrypto/vendor/mldsa-native/mldsa/mldsa_native.h +498 -461
  10. data/ext/pqcrypto/vendor/mldsa-native/mldsa/mldsa_native_asm.S +145 -85
  11. data/ext/pqcrypto/vendor/mldsa-native/mldsa/mldsa_native_config.h +456 -422
  12. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/cbmc.h +47 -25
  13. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/common.h +26 -14
  14. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/ct.h +56 -81
  15. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/debug.h +17 -24
  16. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/fips202.c +33 -40
  17. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/fips202.h +67 -87
  18. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/fips202x4.c +19 -14
  19. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/fips202x4.h +13 -5
  20. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/keccakf1600.c +84 -10
  21. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/keccakf1600.h +10 -5
  22. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/auto.h +6 -0
  23. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/fips202_native_aarch64.h +22 -15
  24. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x1_scalar_aarch64_asm.S +376 -0
  25. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x1_v84a_aarch64_asm.S +204 -0
  26. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x2_v84a_aarch64_asm.S +259 -0
  27. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x4_v8a_scalar_hybrid_aarch64_asm.S +1077 -0
  28. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x4_v8a_v84a_scalar_hybrid_aarch64_asm.S +987 -0
  29. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccakf1600_round_constants.c +16 -10
  30. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/x1_scalar.h +2 -1
  31. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/x1_v84a.h +1 -1
  32. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/x2_v84a.h +4 -2
  33. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/x4_v8a_scalar.h +2 -2
  34. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/x4_v8a_v84a_scalar.h +1 -1
  35. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/api.h +60 -0
  36. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/mve.h +48 -0
  37. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/fips202_native_armv81m.h +18 -1
  38. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/keccak_f1600_x4_mve.S +658 -582
  39. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/keccak_f1600_x4_mve.c +5 -100
  40. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/keccakf1600_round_constants.c +26 -25
  41. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/state_extract_bytes_x4_mve.S +334 -0
  42. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/armv81m/src/state_xor_bytes_x4_mve.S +355 -0
  43. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/auto.h +8 -3
  44. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/{xkcp.h → keccak_f1600_x4_avx2.h} +11 -8
  45. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/src/fips202_native_x86_64.h +44 -0
  46. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/src/keccak_f1600_x4_avx2_asm.S +454 -0
  47. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/src/keccakf1600_constants.c +52 -0
  48. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/meta.h +37 -28
  49. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/aarch64_zetas.c +213 -196
  50. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/arith_native_aarch64.h +248 -64
  51. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/intt_aarch64_asm.S +753 -0
  52. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l4_aarch64_asm.S +129 -0
  53. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l5_aarch64_asm.S +145 -0
  54. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l7_aarch64_asm.S +177 -0
  55. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/ntt_aarch64_asm.S +653 -0
  56. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/pointwise_montgomery_aarch64_asm.S +84 -0
  57. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_caddq_aarch64_asm.S +53 -0
  58. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_chknorm_aarch64_asm.S +55 -0
  59. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_decompose_32_aarch64_asm.S +86 -0
  60. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_decompose_88_aarch64_asm.S +86 -0
  61. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_use_hint_32_aarch64_asm.S +103 -0
  62. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_use_hint_88_aarch64_asm.S +111 -0
  63. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/polyz_unpack_17_aarch64_asm.S +75 -0
  64. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/polyz_unpack_19_aarch64_asm.S +72 -0
  65. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/polyz_unpack_table.c +23 -11
  66. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_aarch64_asm.S +189 -0
  67. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_eta2_aarch64_asm.S +137 -0
  68. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_eta4_aarch64_asm.S +130 -0
  69. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_eta_table.c +520 -516
  70. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_table.c +34 -33
  71. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/api.h +202 -242
  72. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/meta.h +25 -17
  73. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/arith_native_x86_64.h +112 -28
  74. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/consts.c +1 -1
  75. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/consts.h +1 -1
  76. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/intt_avx2_asm.S +2311 -0
  77. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/ntt_avx2_asm.S +2383 -0
  78. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/nttunpack_avx2_asm.S +238 -0
  79. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l4_avx2_asm.S +139 -0
  80. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l5_avx2_asm.S +155 -0
  81. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l7_avx2_asm.S +187 -0
  82. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_avx2_asm.S +130 -0
  83. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_caddq_avx2_asm.S +190 -0
  84. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_decompose_32_avx2.c +6 -4
  85. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_decompose_88_avx2.c +6 -4
  86. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_use_hint_32_avx2.c +9 -8
  87. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_use_hint_88_avx2.c +10 -9
  88. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/polyz_unpack_17_avx2.c +8 -5
  89. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/polyz_unpack_19_avx2.c +8 -5
  90. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/rej_uniform_eta2_avx2.c +6 -4
  91. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/rej_uniform_eta4_avx2.c +6 -4
  92. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/rej_uniform_table.c +130 -129
  93. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/packing.c +109 -180
  94. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/packing.h +169 -150
  95. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/poly.c +56 -40
  96. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/poly.h +149 -164
  97. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/poly_kl.c +52 -57
  98. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/poly_kl.h +132 -167
  99. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/polyvec.c +57 -424
  100. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/polyvec.h +167 -474
  101. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/polyvec_lazy.c +308 -0
  102. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/polyvec_lazy.h +653 -0
  103. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/reduce.h +22 -29
  104. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/rounding.h +37 -43
  105. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/sign.c +511 -367
  106. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/sign.h +456 -417
  107. data/lib/pq_crypto/version.rb +1 -1
  108. data/script/vendor_libs.rb +3 -3
  109. metadata +41 -35
  110. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x1_scalar_asm.S +0 -376
  111. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x1_v84a_asm.S +0 -204
  112. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x2_v84a_asm.S +0 -259
  113. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x4_v8a_scalar_hybrid_asm.S +0 -1077
  114. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/aarch64/src/keccak_f1600_x4_v8a_v84a_scalar_hybrid_asm.S +0 -987
  115. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/src/KeccakP_1600_times4_SIMD256.c +0 -488
  116. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/fips202/native/x86_64/src/KeccakP_1600_times4_SIMD256.h +0 -16
  117. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/intt.S +0 -753
  118. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l4.S +0 -129
  119. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l5.S +0 -145
  120. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/mld_polyvecl_pointwise_acc_montgomery_l7.S +0 -177
  121. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/ntt.S +0 -653
  122. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/pointwise_montgomery.S +0 -79
  123. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_caddq_asm.S +0 -53
  124. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_chknorm_asm.S +0 -55
  125. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_decompose_32_asm.S +0 -85
  126. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_decompose_88_asm.S +0 -85
  127. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_use_hint_32_asm.S +0 -102
  128. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/poly_use_hint_88_asm.S +0 -110
  129. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/polyz_unpack_17_asm.S +0 -72
  130. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/polyz_unpack_19_asm.S +0 -69
  131. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_asm.S +0 -189
  132. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_eta2_asm.S +0 -135
  133. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/aarch64/src/rej_uniform_eta4_asm.S +0 -128
  134. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/intt.S +0 -2311
  135. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/ntt.S +0 -2383
  136. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/nttunpack.S +0 -239
  137. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise.S +0 -131
  138. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l4.S +0 -139
  139. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l5.S +0 -155
  140. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/pointwise_acc_l7.S +0 -187
  141. data/ext/pqcrypto/vendor/mldsa-native/mldsa/src/native/x86_64/src/poly_caddq_avx2.c +0 -61
@@ -0,0 +1,376 @@
1
+ /*
2
+ * Copyright (c) The mlkem-native project authors
3
+ * Copyright (c) The mldsa-native project authors
4
+ * Copyright (c) 2021-2022 Arm Limited
5
+ * Copyright (c) 2022 Matthias Kannwischer
6
+ * SPDX-License-Identifier: Apache-2.0 OR ISC OR MIT
7
+ */
8
+
9
+ // Author: Hanno Becker <hanno.becker@arm.com>
10
+ // Author: Matthias Kannwischer <matthias@kannwischer.eu>
11
+
12
+ /*yaml
13
+ Name: keccak_f1600_x1_scalar_asm
14
+ Description: AArch64 scalar implementation of Keccak-f[1600] permutation for single state
15
+ Signature: void mld_keccak_f1600_x1_scalar_aarch64_asm(uint64_t state[25], const uint64_t rc[24])
16
+ ABI:
17
+ x0:
18
+ type: buffer
19
+ size_bytes: 200
20
+ permissions: read/write
21
+ c_parameter: uint64_t state[25]
22
+ description: Keccak state (25 x uint64_t)
23
+ x1:
24
+ type: buffer
25
+ size_bytes: 192
26
+ permissions: read-only
27
+ c_parameter: const uint64_t rc[24]
28
+ description: Round constants (24 x uint64_t)
29
+ Stack:
30
+ bytes: 128
31
+ description: register preservation and temporary storage
32
+ */
33
+
34
+ #include "../../../../common.h"
35
+ #if defined(MLD_FIPS202_AARCH64_NEED_X1_SCALAR) && \
36
+ !defined(MLD_CONFIG_MULTILEVEL_NO_SHARED)
37
+
38
+ /*
39
+ * WARNING: This file is auto-derived from the mldsa-native source file
40
+ * dev/fips202/aarch64/src/keccak_f1600_x1_scalar_aarch64_asm.S using scripts/simpasm. Do not modify it directly.
41
+ */
42
+
43
+ .text
44
+ .balign 4
45
+ .global MLD_ASM_NAMESPACE(keccak_f1600_x1_scalar_aarch64_asm) // exported entry point; per the YAML header x0 = state (25 x uint64_t, read/write), x1 = rc (24 x uint64_t, read-only)
46
+ MLD_ASM_FN_SYMBOL(keccak_f1600_x1_scalar_aarch64_asm)
47
+
48
+ .cfi_startproc
49
+ sub sp, sp, #0x80 // 128-byte frame: 0x00 state pointer, 0x08 rc pointer, 0x10 round counter, 0x18 one-lane spill slot, 0x20-0x7f saved x19-x30
50
+ .cfi_adjust_cfa_offset 0x80
51
+ stp x19, x20, [sp, #0x20] // x19-x28 are callee-saved and all of them are used as lane registers below
52
+ .cfi_rel_offset x19, 0x20
53
+ .cfi_rel_offset x20, 0x28
54
+ stp x21, x22, [sp, #0x30]
55
+ .cfi_rel_offset x21, 0x30
56
+ .cfi_rel_offset x22, 0x38
57
+ stp x23, x24, [sp, #0x40]
58
+ .cfi_rel_offset x23, 0x40
59
+ .cfi_rel_offset x24, 0x48
60
+ stp x25, x26, [sp, #0x50]
61
+ .cfi_rel_offset x25, 0x50
62
+ .cfi_rel_offset x26, 0x58
63
+ stp x27, x28, [sp, #0x60]
64
+ .cfi_rel_offset x27, 0x60
65
+ .cfi_rel_offset x28, 0x68
66
+ stp x29, x30, [sp, #0x70] // frame pointer and link register are saved because x29/x30 are used as plain scratch registers below
67
+ .cfi_rel_offset x29, 0x70
68
+ .cfi_rel_offset x30, 0x78
69
+
70
+ Lkeccak_f1600_x1_scalar_initial: // loads the 25 state lanes into registers and runs the straight-line block that consumes rc[0]; presumably the first Keccak round peeled out of the loop
71
+ mov x26, x1 // copy of the rc pointer; x26 is overwritten (eor x26, x27, x6 below) before it is read, the copy used later is the stack slot
72
+ str x1, [sp, #0x8] // keep the rc pointer on the stack, x1 is about to hold state[0]
73
+ ldp x1, x6, [x0] // x1 = state[0], x6 = state[1]
74
+ ldp x11, x16, [x0, #0x10] // x11 = state[2], x16 = state[3]
75
+ ldp x21, x2, [x0, #0x20] // x21 = state[4], x2 = state[5]
76
+ ldp x7, x12, [x0, #0x30] // x7 = state[6], x12 = state[7]
77
+ ldp x17, x22, [x0, #0x40] // x17 = state[8], x22 = state[9]
78
+ ldp x3, x8, [x0, #0x50] // x3 = state[10], x8 = state[11]
79
+ ldp x13, x28, [x0, #0x60] // x13 = state[12], x28 = state[13]
80
+ ldp x23, x4, [x0, #0x70] // x23 = state[14], x4 = state[15]
81
+ ldp x9, x14, [x0, #0x80] // x9 = state[16], x14 = state[17]
82
+ ldp x19, x24, [x0, #0x90] // x19 = state[18], x24 = state[19]
83
+ ldp x5, x10, [x0, #0xa0] // x5 = state[20], x10 = state[21]
84
+ ldp x15, x20, [x0, #0xb0] // x15 = state[22], x20 = state[23]
85
+ ldr x25, [x0, #0xc0] // x25 = state[24]
86
+ str x0, [sp] // keep the state pointer on the stack, x0 becomes scratch from here on
87
+ eor x30, x24, x25
88
+ eor x27, x9, x10
89
+ eor x0, x30, x21
90
+ eor x26, x27, x6
91
+ eor x27, x26, x7
92
+ eor x29, x0, x22
93
+ eor x26, x29, x23 // x26 = state[4] ^ state[9] ^ state[14] ^ state[19] ^ state[24]
94
+ eor x29, x4, x5
95
+ eor x30, x29, x1
96
+ eor x0, x27, x8 // x0 = state[1] ^ state[6] ^ state[11] ^ state[16] ^ state[21]
97
+ eor x29, x30, x2
98
+ eor x30, x19, x20
99
+ eor x30, x30, x16
100
+ eor x27, x26, x0, ror #63 // ror #63 on a 64-bit register is a rotate-left by 1
101
+ eor x4, x4, x27
102
+ eor x30, x30, x17
103
+ eor x30, x30, x28 // x30 = state[3] ^ state[8] ^ state[13] ^ state[18] ^ state[23]
104
+ eor x29, x29, x3 // x29 = state[0] ^ state[5] ^ state[10] ^ state[15] ^ state[20]
105
+ eor x0, x0, x30, ror #63
106
+ eor x30, x30, x29, ror #63
107
+ eor x22, x22, x30
108
+ eor x23, x23, x30
109
+ str x23, [sp, #0x18] // spill this lane; x23 is reused as an accumulator on the next line, the value is reloaded into x27 further down
110
+ eor x23, x14, x15
111
+ eor x14, x14, x0
112
+ eor x23, x23, x11
113
+ eor x15, x15, x0
114
+ eor x1, x1, x27
115
+ eor x23, x23, x12
116
+ eor x23, x23, x13 // x23 = state[2] ^ state[7] ^ state[12] ^ state[17] ^ state[22]
117
+ eor x11, x11, x0
118
+ eor x29, x29, x23, ror #63
119
+ eor x23, x23, x26, ror #63
120
+ eor x26, x13, x0
121
+ eor x13, x28, x23
122
+ eor x28, x24, x30
123
+ eor x24, x16, x23
124
+ eor x16, x21, x30
125
+ eor x21, x25, x30
126
+ eor x30, x19, x23
127
+ eor x19, x20, x23
128
+ eor x20, x17, x23
129
+ eor x17, x12, x0
130
+ eor x0, x2, x27
131
+ eor x2, x6, x29
132
+ eor x6, x8, x29
133
+ bic x8, x28, x13, ror #47 // bic = first operand AND NOT (rotated second operand); the rotate amounts on operands here look like deferred lane rotations - TODO confirm against the generator
134
+ eor x12, x3, x27
135
+ bic x3, x13, x17, ror #19
136
+ eor x5, x5, x27
137
+ ldr x27, [sp, #0x18] // reload the lane spilled above
138
+ bic x25, x17, x2, ror #5
139
+ eor x9, x9, x29
140
+ eor x23, x25, x5, ror #52
141
+ eor x3, x3, x2, ror #24
142
+ eor x8, x8, x17, ror #2
143
+ eor x17, x10, x29
144
+ bic x25, x12, x22, ror #47
145
+ eor x29, x7, x29
146
+ bic x10, x4, x27, ror #2
147
+ bic x7, x5, x28, ror #10
148
+ eor x10, x10, x20, ror #50
149
+ eor x13, x7, x13, ror #57
150
+ bic x7, x2, x5, ror #47
151
+ eor x2, x25, x24, ror #39
152
+ bic x25, x20, x11, ror #57
153
+ bic x5, x17, x4, ror #25
154
+ eor x25, x25, x17, ror #53
155
+ bic x17, x11, x17, ror #60
156
+ eor x28, x7, x28, ror #57
157
+ bic x7, x9, x12, ror #42
158
+ eor x7, x7, x22, ror #25
159
+ bic x22, x22, x24, ror #56
160
+ bic x24, x24, x15, ror #31
161
+ eor x22, x22, x15, ror #23
162
+ bic x20, x27, x20, ror #48
163
+ bic x15, x15, x9, ror #16
164
+ eor x12, x15, x12, ror #58
165
+ eor x15, x5, x27, ror #27
166
+ eor x5, x20, x11, ror #41
167
+ ldr x11, [sp, #0x8] // x11 = rc pointer (its previous lane value was last read on the line above)
168
+ eor x20, x17, x4, ror #21
169
+ eor x17, x24, x9, ror #47
170
+ mov x24, #0x1 // =1; initial value of the round counter (this block itself uses rc[0])
171
+ bic x9, x0, x16, ror #9
172
+ str x24, [sp, #0x10] // round counter lives in the stack slot at sp+0x10
173
+ bic x24, x29, x1, ror #44
174
+ bic x27, x1, x21, ror #50
175
+ bic x4, x26, x29, ror #63
176
+ eor x1, x1, x4, ror #21
177
+ ldr x11, [x11] // x11 = rc[0]
178
+ bic x4, x21, x30, ror #57
179
+ eor x21, x24, x21, ror #30
180
+ eor x24, x9, x19, ror #44
181
+ bic x9, x14, x6, ror #5
182
+ eor x9, x9, x0, ror #43
183
+ bic x0, x6, x0, ror #38
184
+ eor x1, x1, x11 // XOR rc[0] into the lane held in x1 (stored back as state[0])
185
+ eor x11, x4, x26, ror #35
186
+ eor x4, x0, x16, ror #47
187
+ bic x0, x16, x19, ror #35
188
+ eor x16, x27, x30, ror #43
189
+ bic x27, x30, x26, ror #42
190
+ bic x26, x19, x14, ror #41
191
+ eor x19, x0, x14, ror #12
192
+ eor x14, x26, x6, ror #46
193
+ eor x6, x27, x29, ror #41
194
+
195
+ Lkeccak_f1600_x1_scalar_loop: // one pass per remaining round: the counter at sp+0x10 runs 1..23 and selects rc[counter]
195
+ eor x0, x15, x11, ror #52
196
+ eor x0, x0, x13, ror #48
197
+ eor x26, x8, x9, ror #57
198
+ eor x27, x0, x14, ror #10
199
+ eor x29, x16, x28, ror #63
200
+ eor x26, x26, x6, ror #51
201
+ eor x30, x23, x22, ror #50
202
+ eor x0, x26, x10, ror #31
203
+ eor x29, x29, x19, ror #37
204
+ eor x27, x27, x12, ror #5
205
+ eor x30, x30, x24, ror #34
206
+ eor x0, x0, x7, ror #27
207
+ eor x26, x30, x21, ror #26
208
+ eor x26, x26, x25, ror #15
209
+ ror x30, x27, #0x3e
210
+ eor x30, x30, x26, ror #57
211
+ ror x26, x26, #0x3a
212
+ eor x16, x30, x16
213
+ eor x28, x30, x28, ror #63
214
+ str x28, [sp, #0x18] // spill this lane; x28 is reused as an accumulator below, the value is reloaded into x9 later in the pass
215
+ eor x29, x29, x17, ror #36
216
+ eor x28, x1, x2, ror #61
217
+ eor x19, x30, x19, ror #37
218
+ eor x29, x29, x20, ror #2
219
+ eor x28, x28, x4, ror #54
220
+ eor x26, x26, x0, ror #55
221
+ eor x28, x28, x3, ror #39
222
+ eor x28, x28, x5, ror #25
223
+ ror x0, x0, #0x38
224
+ eor x0, x0, x29, ror #63
225
+ eor x27, x28, x27, ror #61
226
+ eor x13, x0, x13, ror #46
227
+ eor x28, x29, x28, ror #63
228
+ eor x29, x30, x20, ror #2
229
+ eor x20, x26, x3, ror #39
230
+ eor x11, x0, x11, ror #50
231
+ eor x25, x28, x25, ror #9
232
+ eor x3, x28, x21, ror #20
233
+ eor x21, x26, x1
234
+ eor x9, x27, x9, ror #49
235
+ eor x24, x28, x24, ror #28
236
+ eor x1, x30, x17, ror #36
237
+ eor x14, x0, x14, ror #8
238
+ eor x22, x28, x22, ror #44
239
+ eor x8, x27, x8, ror #56
240
+ eor x17, x27, x7, ror #19
241
+ eor x15, x0, x15, ror #62
242
+ bic x7, x20, x22, ror #47
243
+ eor x4, x26, x4, ror #54
244
+ eor x0, x0, x12, ror #3
245
+ eor x28, x28, x23, ror #58
246
+ eor x23, x26, x2, ror #61
247
+ eor x26, x26, x5, ror #25
248
+ eor x2, x7, x16, ror #39
249
+ bic x7, x9, x20, ror #42
250
+ bic x30, x15, x9, ror #16
251
+ eor x7, x7, x22, ror #25
252
+ eor x12, x30, x20, ror #58
253
+ bic x20, x22, x16, ror #56
254
+ eor x30, x27, x6, ror #43
255
+ eor x22, x20, x15, ror #23
256
+ bic x6, x19, x13, ror #42
257
+ eor x6, x6, x17, ror #41
258
+ bic x5, x13, x17, ror #63
259
+ eor x5, x21, x5, ror #21
260
+ bic x17, x17, x21, ror #44
261
+ eor x27, x27, x10, ror #23
262
+ bic x21, x21, x25, ror #50
263
+ bic x20, x27, x4, ror #25
264
+ bic x10, x16, x15, ror #31
265
+ eor x16, x21, x19, ror #43
266
+ eor x21, x17, x25, ror #30
267
+ bic x19, x25, x19, ror #57
268
+ ldr x25, [sp, #0x10] // x25 = round counter
269
+ eor x17, x10, x9, ror #47
270
+ ldr x9, [sp, #0x8] // x9 = rc pointer
271
+ eor x15, x20, x28, ror #27
272
+ bic x20, x4, x28, ror #2
273
+ eor x10, x20, x1, ror #50
274
+ bic x20, x11, x27, ror #60
275
+ eor x20, x20, x4, ror #21
276
+ bic x4, x28, x1, ror #48
277
+ bic x1, x1, x11, ror #57
278
+ ldr x28, [x9, x25, lsl #3] // x28 = rc[counter] (8-byte elements)
279
+ ldr x9, [sp, #0x18] // reload the lane spilled near the top of this pass
280
+ add x25, x25, #0x1
281
+ str x25, [sp, #0x10] // write back the incremented counter
282
+ cmp x25, #0x17 // flags are consumed by the b.le at the bottom; only non-flag-setting eor/bic follow until then
283
+ eor x25, x1, x27, ror #53
284
+ bic x27, x30, x26, ror #47
285
+ eor x1, x5, x28 // XOR this round's constant into the lane held in x1
286
+ eor x5, x4, x11, ror #41
287
+ eor x11, x19, x13, ror #35
288
+ bic x13, x26, x24, ror #10
289
+ eor x28, x27, x24, ror #57
290
+ bic x27, x24, x9, ror #47
291
+ bic x19, x23, x3, ror #9
292
+ bic x4, x29, x14, ror #41
293
+ eor x24, x19, x29, ror #44
294
+ bic x29, x3, x29, ror #35
295
+ eor x13, x13, x9, ror #57
296
+ eor x19, x29, x14, ror #12
297
+ bic x29, x9, x0, ror #19
298
+ bic x14, x14, x8, ror #5
299
+ eor x9, x14, x23, ror #43
300
+ eor x14, x4, x8, ror #46
301
+ bic x23, x8, x23, ror #38
302
+ eor x8, x27, x0, ror #2
303
+ eor x4, x23, x3, ror #47
304
+ bic x3, x0, x30, ror #5
305
+ eor x23, x3, x26, ror #52
306
+ eor x3, x29, x30, ror #24
307
+ b.le Lkeccak_f1600_x1_scalar_loop // repeat while the incremented counter is <= 23, so the last pass uses rc[23]
308
+ ror x6, x6, #0x2b // fixed per-register rotates applied once before the store (x1 and x16 are stored unrotated); presumably these resolve rotations deferred inside the loop - TODO confirm
309
+ ror x11, x11, #0x32
310
+ ror x21, x21, #0x14
311
+ ror x2, x2, #0x3d
312
+ ror x7, x7, #0x13
313
+ ror x12, x12, #0x3
314
+ ror x17, x17, #0x24
315
+ ror x22, x22, #0x2c
316
+ ror x3, x3, #0x27
317
+ ror x8, x8, #0x38
318
+ ror x13, x13, #0x2e
319
+ ror x28, x28, #0x3f
320
+ ror x23, x23, #0x3a
321
+ ror x4, x4, #0x36
322
+ ror x9, x9, #0x31
323
+ ror x14, x14, #0x8
324
+ ror x19, x19, #0x25
325
+ ror x24, x24, #0x1c
326
+ ror x5, x5, #0x19
327
+ ror x10, x10, #0x17
328
+ ror x15, x15, #0x3e
329
+ ror x20, x20, #0x2
330
+ ror x25, x25, #0x9
331
+ ldr x0, [sp] // recover the state pointer saved before x0 became scratch
332
+ stp x1, x6, [x0] // write the 25 lanes back using the same register-to-index mapping as the initial load
333
+ stp x11, x16, [x0, #0x10]
334
+ stp x21, x2, [x0, #0x20]
335
+ stp x7, x12, [x0, #0x30]
336
+ stp x17, x22, [x0, #0x40]
337
+ stp x3, x8, [x0, #0x50]
338
+ stp x13, x28, [x0, #0x60]
339
+ stp x23, x4, [x0, #0x70]
340
+ stp x9, x14, [x0, #0x80]
341
+ stp x19, x24, [x0, #0x90]
342
+ stp x5, x10, [x0, #0xa0]
343
+ stp x15, x20, [x0, #0xb0]
344
+ str x25, [x0, #0xc0]
345
+ ldp x19, x20, [sp, #0x20] // restore the registers saved in the prologue
346
+ .cfi_restore x19
347
+ .cfi_restore x20
348
+ ldp x21, x22, [sp, #0x30]
349
+ .cfi_restore x21
350
+ .cfi_restore x22
351
+ ldp x23, x24, [sp, #0x40]
352
+ .cfi_restore x23
353
+ .cfi_restore x24
354
+ ldp x25, x26, [sp, #0x50]
355
+ .cfi_restore x25
356
+ .cfi_restore x26
357
+ ldp x27, x28, [sp, #0x60]
358
+ .cfi_restore x27
359
+ .cfi_restore x28
360
+ ldp x29, x30, [sp, #0x70] // x30 must hold the caller's return address again before ret
361
+ .cfi_restore x29
362
+ .cfi_restore x30
363
+ add sp, sp, #0x80 // release the 128-byte frame
364
+ .cfi_adjust_cfa_offset -0x80
365
+ ret
366
+ .cfi_endproc
367
+
368
+ MLD_ASM_FN_SIZE(keccak_f1600_x1_scalar_aarch64_asm)
370
+
371
+ #endif /* MLD_FIPS202_AARCH64_NEED_X1_SCALAR && \
372
+ !MLD_CONFIG_MULTILEVEL_NO_SHARED */
373
+
374
+ #if defined(__ELF__)
375
+ .section .note.GNU-stack,"",%progbits
376
+ #endif
@@ -0,0 +1,204 @@
1
+ /*
2
+ * Copyright (c) The mlkem-native project authors
3
+ * Copyright (c) The mldsa-native project authors
4
+ * Copyright (c) 2021-2022 Arm Limited
5
+ * Copyright (c) 2022 Matthias Kannwischer
6
+ * SPDX-License-Identifier: Apache-2.0 OR ISC OR MIT
7
+ */
8
+
9
+ /* References
10
+ * ==========
11
+ *
12
+ * - [HYBRID]
13
+ * Hybrid scalar/vector implementations of Keccak and SPHINCS+ on AArch64
14
+ * Becker, Kannwischer
15
+ * https://eprint.iacr.org/2022/1243
16
+ */
17
+
18
+ /*yaml
19
+ Name: keccak_f1600_x1_v84a_asm
20
+ Description: AArch64 ARMv8.4-A implementation of Keccak-f[1600] permutation for single state
21
+ Signature: void mld_keccak_f1600_x1_v84a_aarch64_asm(uint64_t state[25], const uint64_t rc[24])
22
+ ABI:
23
+ x0:
24
+ type: buffer
25
+ size_bytes: 200
26
+ permissions: read/write
27
+ c_parameter: uint64_t state[25]
28
+ description: Keccak state (25 x uint64_t)
29
+ x1:
30
+ type: buffer
31
+ size_bytes: 192
32
+ permissions: read-only
33
+ c_parameter: const uint64_t rc[24]
34
+ description: Round constants (24 x uint64_t)
35
+ Stack:
36
+ bytes: 64
37
+ description: register preservation
38
+ */
39
+
40
+ //
41
+ // Author: Hanno Becker <hanno.becker@arm.com>
42
+ // Author: Matthias Kannwischer <matthias@kannwischer.eu>
43
+ //
44
+ // This implementation is essentially from the paper @[HYBRID].
45
+ // The only difference is interleaving/deinterleaving of Keccak state
46
+ // during load and store, so that the caller need not do this.
47
+ //
48
+
49
+ #include "../../../../common.h"
50
+ #if defined(MLD_FIPS202_AARCH64_NEED_X1_V84A) && \
51
+ !defined(MLD_CONFIG_MULTILEVEL_NO_SHARED)
52
+
53
+ #if defined(__ARM_FEATURE_SHA3)
54
+
55
+ /*
56
+ * WARNING: This file is auto-derived from the mldsa-native source file
57
+ * dev/fips202/aarch64/src/keccak_f1600_x1_v84a_aarch64_asm.S using scripts/simpasm. Do not modify it directly.
58
+ */
59
+
60
+ .text
61
+ .balign 4
62
+ .global MLD_ASM_NAMESPACE(keccak_f1600_x1_v84a_aarch64_asm) // exported entry point; per the YAML header x0 = state (25 x uint64_t, read/write), x1 = rc (24 x uint64_t, read-only)
63
+ MLD_ASM_FN_SYMBOL(keccak_f1600_x1_v84a_aarch64_asm)
64
+
65
+ .cfi_startproc
66
+ sub sp, sp, #0x40 // 64-byte frame, used only for the d8-d15 save area
67
+ .cfi_adjust_cfa_offset 0x40
68
+ stp d8, d9, [sp] // the low 64 bits of v8-v15 are callee-saved; v8-v15 hold state lanes below
69
+ .cfi_rel_offset d8, 0x0
70
+ .cfi_rel_offset d9, 0x8
71
+ stp d10, d11, [sp, #0x10]
72
+ .cfi_rel_offset d10, 0x10
73
+ .cfi_rel_offset d11, 0x18
74
+ stp d12, d13, [sp, #0x20]
75
+ .cfi_rel_offset d12, 0x20
76
+ .cfi_rel_offset d13, 0x28
77
+ stp d14, d15, [sp, #0x30]
78
+ .cfi_rel_offset d14, 0x30
79
+ .cfi_rel_offset d15, 0x38
80
+ ldp d0, d1, [x0] // load state[i] into d<i> for i = 0..24 (consecutive 8-byte lanes starting at x0)
81
+ ldp d2, d3, [x0, #0x10]
82
+ ldp d4, d5, [x0, #0x20]
83
+ ldp d6, d7, [x0, #0x30]
84
+ ldp d8, d9, [x0, #0x40]
85
+ ldp d10, d11, [x0, #0x50]
86
+ ldp d12, d13, [x0, #0x60]
87
+ ldp d14, d15, [x0, #0x70]
88
+ ldp d16, d17, [x0, #0x80]
89
+ ldp d18, d19, [x0, #0x90]
90
+ ldp d20, d21, [x0, #0xa0]
91
+ ldp d22, d23, [x0, #0xb0]
92
+ ldr d24, [x0, #0xc0]
93
+ mov x2, #0x18 // =24; x2 counts the remaining loop passes
94
+
95
+ Lkeccak_f1600_x1_v84a_loop: // one pass per round, 24 passes; only the low 64-bit lane of each vector is loaded from or stored to the state
95
+ eor3 v30.16b, v0.16b, v5.16b, v10.16b // EOR3 is a three-way XOR: v30 = v0 ^ v5 ^ v10
96
+ eor3 v29.16b, v1.16b, v6.16b, v11.16b
97
+ eor3 v28.16b, v2.16b, v7.16b, v12.16b
98
+ eor3 v27.16b, v3.16b, v8.16b, v13.16b
99
+ eor3 v26.16b, v4.16b, v9.16b, v14.16b
100
+ eor3 v30.16b, v30.16b, v15.16b, v20.16b // v30 ^= v15 ^ v20, so v30 = v0 ^ v5 ^ v10 ^ v15 ^ v20
101
+ eor3 v29.16b, v29.16b, v16.16b, v21.16b // v29 = v1 ^ v6 ^ v11 ^ v16 ^ v21
102
+ eor3 v28.16b, v28.16b, v17.16b, v22.16b // v28 = v2 ^ v7 ^ v12 ^ v17 ^ v22
103
+ eor3 v27.16b, v27.16b, v18.16b, v23.16b // v27 = v3 ^ v8 ^ v13 ^ v18 ^ v23
104
+ eor3 v26.16b, v26.16b, v19.16b, v24.16b // v26 = v4 ^ v9 ^ v14 ^ v19 ^ v24
105
+ rax1 v25.2d, v30.2d, v28.2d // RAX1: destination = first source ^ rotate-left-by-1(second source), per 64-bit lane
106
+ rax1 v28.2d, v28.2d, v26.2d
107
+ rax1 v26.2d, v26.2d, v29.2d
108
+ rax1 v29.2d, v29.2d, v27.2d
109
+ rax1 v27.2d, v27.2d, v30.2d
110
+ eor v30.16b, v0.16b, v26.16b // v0 is overwritten on the next line, so its updated value is parked in v30
111
+ xar v0.2d, v2.2d, v29.2d, #0x2 // XAR: destination = rotate-right(first source ^ second source, imm); each line also moves the lane to a different register
112
+ xar v2.2d, v12.2d, v29.2d, #0x15
113
+ xar v12.2d, v13.2d, v28.2d, #0x27
114
+ xar v13.2d, v19.2d, v27.2d, #0x38
115
+ xar v19.2d, v23.2d, v28.2d, #0x8
116
+ xar v23.2d, v15.2d, v26.2d, #0x17
117
+ xar v15.2d, v1.2d, v25.2d, #0x3f
118
+ xar v1.2d, v8.2d, v28.2d, #0x9
119
+ xar v8.2d, v16.2d, v25.2d, #0x13
120
+ xar v16.2d, v7.2d, v29.2d, #0x3a
121
+ xar v7.2d, v10.2d, v26.2d, #0x3d
122
+ xar v10.2d, v3.2d, v28.2d, #0x24
123
+ xar v3.2d, v18.2d, v28.2d, #0x2b
124
+ xar v18.2d, v17.2d, v29.2d, #0x31
125
+ xar v17.2d, v11.2d, v25.2d, #0x36
126
+ xar v11.2d, v9.2d, v27.2d, #0x2c
127
+ xar v9.2d, v22.2d, v29.2d, #0x3
128
+ xar v22.2d, v14.2d, v27.2d, #0x19
129
+ xar v14.2d, v20.2d, v26.2d, #0x2e
130
+ xar v20.2d, v4.2d, v27.2d, #0x25
131
+ xar v4.2d, v24.2d, v27.2d, #0x32
132
+ xar v24.2d, v21.2d, v25.2d, #0x3e
133
+ xar v21.2d, v5.2d, v26.2d, #0x1c
134
+ xar v27.2d, v6.2d, v25.2d, #0x14 // v27 is free here (its last read as a source is three lines up), so it receives a lane
135
+ ld1r { v31.2d }, [x1], #8 // load this round's 64-bit constant into both lanes of v31 and advance the rc pointer by 8
136
+ bcax v5.16b, v10.16b, v7.16b, v11.16b // BCAX: destination = first source ^ (second source AND NOT third source)
137
+ bcax v6.16b, v11.16b, v8.16b, v7.16b
138
+ bcax v7.16b, v7.16b, v9.16b, v8.16b
139
+ bcax v8.16b, v8.16b, v10.16b, v9.16b
140
+ bcax v9.16b, v9.16b, v11.16b, v10.16b
141
+ bcax v10.16b, v15.16b, v12.16b, v16.16b
142
+ bcax v11.16b, v16.16b, v13.16b, v12.16b
143
+ bcax v12.16b, v12.16b, v14.16b, v13.16b
144
+ bcax v13.16b, v13.16b, v15.16b, v14.16b
145
+ bcax v14.16b, v14.16b, v16.16b, v15.16b
146
+ bcax v15.16b, v20.16b, v17.16b, v21.16b
147
+ bcax v16.16b, v21.16b, v18.16b, v17.16b
148
+ bcax v17.16b, v17.16b, v19.16b, v18.16b
149
+ bcax v18.16b, v18.16b, v20.16b, v19.16b
150
+ bcax v19.16b, v19.16b, v21.16b, v20.16b
151
+ bcax v20.16b, v0.16b, v22.16b, v1.16b
152
+ bcax v21.16b, v1.16b, v23.16b, v22.16b
153
+ bcax v22.16b, v22.16b, v24.16b, v23.16b
154
+ bcax v23.16b, v23.16b, v0.16b, v24.16b
155
+ bcax v24.16b, v24.16b, v1.16b, v0.16b
156
+ bcax v0.16b, v30.16b, v2.16b, v27.16b
157
+ bcax v1.16b, v27.16b, v3.16b, v2.16b
158
+ bcax v2.16b, v2.16b, v4.16b, v3.16b
159
+ bcax v3.16b, v3.16b, v30.16b, v4.16b
160
+ bcax v4.16b, v4.16b, v27.16b, v30.16b
161
+ eor v0.16b, v0.16b, v31.16b // XOR the round constant into v0 (stored back as state[0])
162
+ sub x2, x2, #0x1
163
+ cbnz x2, Lkeccak_f1600_x1_v84a_loop // repeat until all 24 passes are done
164
+ stp d0, d1, [x0] // write d<i> back to state[i] for i = 0..24; x0 still holds the state pointer
165
+ stp d2, d3, [x0, #0x10]
166
+ stp d4, d5, [x0, #0x20]
167
+ stp d6, d7, [x0, #0x30]
168
+ stp d8, d9, [x0, #0x40]
169
+ stp d10, d11, [x0, #0x50]
170
+ stp d12, d13, [x0, #0x60]
171
+ stp d14, d15, [x0, #0x70]
172
+ stp d16, d17, [x0, #0x80]
173
+ stp d18, d19, [x0, #0x90]
174
+ stp d20, d21, [x0, #0xa0]
175
+ stp d22, d23, [x0, #0xb0]
176
+ str d24, [x0, #0xc0]
177
+ ldp d8, d9, [sp] // restore the callee-saved low halves saved in the prologue
178
+ .cfi_restore d8
179
+ .cfi_restore d9
180
+ ldp d10, d11, [sp, #0x10]
181
+ .cfi_restore d10
182
+ .cfi_restore d11
183
+ ldp d12, d13, [sp, #0x20]
184
+ .cfi_restore d12
185
+ .cfi_restore d13
186
+ ldp d14, d15, [sp, #0x30]
187
+ .cfi_restore d14
188
+ .cfi_restore d15
189
+ add sp, sp, #0x40 // release the 64-byte frame
190
+ .cfi_adjust_cfa_offset -0x40
191
+ ret
192
+ .cfi_endproc
193
+
194
+ MLD_ASM_FN_SIZE(keccak_f1600_x1_v84a_aarch64_asm)
196
+
197
+ #endif /* __ARM_FEATURE_SHA3 */
198
+
199
+ #endif /* MLD_FIPS202_AARCH64_NEED_X1_V84A && !MLD_CONFIG_MULTILEVEL_NO_SHARED \
200
+ */
201
+
202
+ #if defined(__ELF__)
203
+ .section .note.GNU-stack,"",%progbits
204
+ #endif