sleeping_kangaroo12 0.0.3 → 0.0.4

Sign up to get free protection for your applications and to get access to all the features.
Files changed (291) hide show
  1. checksums.yaml +4 -4
  2. data/README.md +34 -67
  3. data/ext/Rakefile +12 -37
  4. data/ext/binding/sleeping_kangaroo12.c +1 -16
  5. data/ext/{xkcp → k12}/Makefile +0 -0
  6. data/ext/k12/Makefile.build +118 -0
  7. data/ext/k12/README.markdown +86 -0
  8. data/ext/k12/lib/ARMv8Asha3/KeccakP-1600-ARMv8Asha3.S +623 -0
  9. data/ext/k12/lib/ARMv8Asha3/KeccakP-1600-SnP.h +65 -0
  10. data/ext/k12/lib/ARMv8Asha3/KeccakP-1600-opt64.c +227 -0
  11. data/ext/{xkcp/lib/low/KeccakP-1600/compact → k12/lib/Inplace32BI}/KeccakP-1600-SnP.h +4 -9
  12. data/ext/{xkcp/lib/low/KeccakP-1600/plain-32bits-inplace → k12/lib/Inplace32BI}/KeccakP-1600-inplace32BI.c +65 -160
  13. data/ext/k12/lib/KangarooTwelve.c +332 -0
  14. data/ext/{xkcp/lib/high/KangarooTwelve → k12/lib}/KangarooTwelve.h +53 -16
  15. data/ext/{xkcp/lib/low/KeccakP-1600/AVX2 → k12/lib/Optimized64}/KeccakP-1600-AVX2.s +122 -558
  16. data/ext/k12/lib/Optimized64/KeccakP-1600-AVX512-plainC.c +241 -0
  17. data/ext/k12/lib/Optimized64/KeccakP-1600-AVX512.s +551 -0
  18. data/ext/k12/lib/Optimized64/KeccakP-1600-SnP.h +74 -0
  19. data/ext/{xkcp/lib/low/KeccakP-1600/common/KeccakP-1600-64.macros → k12/lib/Optimized64/KeccakP-1600-opt64.c} +447 -169
  20. data/ext/k12/lib/Optimized64/KeccakP-1600-runtimeDispatch.c +406 -0
  21. data/ext/k12/lib/Optimized64/KeccakP-1600-timesN-AVX2.c +419 -0
  22. data/ext/k12/lib/Optimized64/KeccakP-1600-timesN-AVX512.c +458 -0
  23. data/ext/k12/lib/Optimized64/KeccakP-1600-timesN-SSSE3.c +438 -0
  24. data/ext/{xkcp/lib/low/KeccakP-1600/plain-64bits → k12/lib/Plain64}/KeccakP-1600-SnP.h +14 -20
  25. data/ext/{xkcp/lib/low/KeccakP-1600/ref-64bits/KeccakP-1600-reference.h → k12/lib/Plain64/KeccakP-1600-plain64.c} +9 -8
  26. data/ext/{xkcp/lib/common → k12/lib}/align.h +3 -2
  27. data/ext/{xkcp/lib/common → k12/lib}/brg_endian.h +0 -0
  28. data/ext/{xkcp → k12}/support/Build/ExpandProducts.xsl +0 -0
  29. data/ext/{xkcp → k12}/support/Build/ToGlobalMakefile.xsl +0 -0
  30. data/ext/{xkcp → k12}/support/Build/ToOneTarget.xsl +0 -0
  31. data/ext/{xkcp → k12}/support/Build/ToTargetConfigFile.xsl +0 -0
  32. data/ext/{xkcp → k12}/support/Build/ToTargetMakefile.xsl +10 -16
  33. data/ext/{xkcp → k12}/support/Build/ToVCXProj.xsl +0 -0
  34. data/lib/sleeping_kangaroo12/version.rb +1 -1
  35. metadata +33 -276
  36. data/ext/config/xkcp.build +0 -17
  37. data/ext/xkcp/LICENSE +0 -1
  38. data/ext/xkcp/Makefile.build +0 -200
  39. data/ext/xkcp/README.markdown +0 -296
  40. data/ext/xkcp/lib/HighLevel.build +0 -143
  41. data/ext/xkcp/lib/LowLevel.build +0 -757
  42. data/ext/xkcp/lib/high/KangarooTwelve/KangarooTwelve.c +0 -301
  43. data/ext/xkcp/lib/high/Keccak/FIPS202/KeccakHash.c +0 -81
  44. data/ext/xkcp/lib/high/Keccak/FIPS202/KeccakHash.h +0 -125
  45. data/ext/xkcp/lib/high/Keccak/FIPS202/SimpleFIPS202.c +0 -48
  46. data/ext/xkcp/lib/high/Keccak/FIPS202/SimpleFIPS202.h +0 -79
  47. data/ext/xkcp/lib/high/Keccak/KeccakDuplex.c +0 -81
  48. data/ext/xkcp/lib/high/Keccak/KeccakDuplex.h +0 -73
  49. data/ext/xkcp/lib/high/Keccak/KeccakDuplex.inc +0 -195
  50. data/ext/xkcp/lib/high/Keccak/KeccakSponge.c +0 -111
  51. data/ext/xkcp/lib/high/Keccak/KeccakSponge.h +0 -76
  52. data/ext/xkcp/lib/high/Keccak/KeccakSponge.inc +0 -314
  53. data/ext/xkcp/lib/high/Keccak/PRG/KeccakPRG.c +0 -61
  54. data/ext/xkcp/lib/high/Keccak/PRG/KeccakPRG.h +0 -67
  55. data/ext/xkcp/lib/high/Keccak/PRG/KeccakPRG.inc +0 -128
  56. data/ext/xkcp/lib/high/Keccak/SP800-185/SP800-185.c +0 -93
  57. data/ext/xkcp/lib/high/Keccak/SP800-185/SP800-185.h +0 -599
  58. data/ext/xkcp/lib/high/Keccak/SP800-185/SP800-185.inc +0 -573
  59. data/ext/xkcp/lib/high/Ketje/Ketjev2.c +0 -87
  60. data/ext/xkcp/lib/high/Ketje/Ketjev2.h +0 -88
  61. data/ext/xkcp/lib/high/Ketje/Ketjev2.inc +0 -274
  62. data/ext/xkcp/lib/high/Keyak/Keyakv2.c +0 -132
  63. data/ext/xkcp/lib/high/Keyak/Keyakv2.h +0 -217
  64. data/ext/xkcp/lib/high/Keyak/Keyakv2.inc +0 -81
  65. data/ext/xkcp/lib/high/Keyak/Motorist.inc +0 -953
  66. data/ext/xkcp/lib/high/Kravatte/Kravatte.c +0 -533
  67. data/ext/xkcp/lib/high/Kravatte/Kravatte.h +0 -115
  68. data/ext/xkcp/lib/high/Kravatte/KravatteModes.c +0 -557
  69. data/ext/xkcp/lib/high/Kravatte/KravatteModes.h +0 -247
  70. data/ext/xkcp/lib/high/Xoodyak/Cyclist.h +0 -66
  71. data/ext/xkcp/lib/high/Xoodyak/Cyclist.inc +0 -336
  72. data/ext/xkcp/lib/high/Xoodyak/Xoodyak-parameters.h +0 -26
  73. data/ext/xkcp/lib/high/Xoodyak/Xoodyak.c +0 -55
  74. data/ext/xkcp/lib/high/Xoodyak/Xoodyak.h +0 -35
  75. data/ext/xkcp/lib/high/Xoofff/Xoofff.c +0 -634
  76. data/ext/xkcp/lib/high/Xoofff/Xoofff.h +0 -147
  77. data/ext/xkcp/lib/high/Xoofff/XoofffModes.c +0 -483
  78. data/ext/xkcp/lib/high/Xoofff/XoofffModes.h +0 -241
  79. data/ext/xkcp/lib/high/common/Phases.h +0 -25
  80. data/ext/xkcp/lib/low/KeccakP-1600/ARM/KeccakP-1600-SnP.h +0 -41
  81. data/ext/xkcp/lib/low/KeccakP-1600/ARM/KeccakP-1600-inplace-32bi-armv6m-le-armcc.s +0 -1666
  82. data/ext/xkcp/lib/low/KeccakP-1600/ARM/KeccakP-1600-inplace-32bi-armv6m-le-gcc.s +0 -1655
  83. data/ext/xkcp/lib/low/KeccakP-1600/ARM/KeccakP-1600-inplace-32bi-armv7a-le-armcc.s +0 -1268
  84. data/ext/xkcp/lib/low/KeccakP-1600/ARM/KeccakP-1600-inplace-32bi-armv7a-le-gcc.s +0 -1264
  85. data/ext/xkcp/lib/low/KeccakP-1600/ARM/KeccakP-1600-inplace-32bi-armv7m-le-armcc.s +0 -1178
  86. data/ext/xkcp/lib/low/KeccakP-1600/ARM/KeccakP-1600-inplace-32bi-armv7m-le-gcc.s +0 -1175
  87. data/ext/xkcp/lib/low/KeccakP-1600/ARM/KeccakP-1600-u1-32bi-armv6m-le-armcc.s +0 -1338
  88. data/ext/xkcp/lib/low/KeccakP-1600/ARM/KeccakP-1600-u1-32bi-armv6m-le-gcc.s +0 -1336
  89. data/ext/xkcp/lib/low/KeccakP-1600/ARM/KeccakP-1600-u2-32bi-armv6m-le-armcc.s +0 -1343
  90. data/ext/xkcp/lib/low/KeccakP-1600/ARM/KeccakP-1600-u2-32bi-armv6m-le-gcc.s +0 -1339
  91. data/ext/xkcp/lib/low/KeccakP-1600/ARMv7A-NEON/KeccakP-1600-SnP.h +0 -42
  92. data/ext/xkcp/lib/low/KeccakP-1600/ARMv7A-NEON/KeccakP-1600-armv7a-le-neon-armcc.s +0 -823
  93. data/ext/xkcp/lib/low/KeccakP-1600/ARMv7A-NEON/KeccakP-1600-armv7a-le-neon-gcc.s +0 -831
  94. data/ext/xkcp/lib/low/KeccakP-1600/ARMv8A/KeccakP-1600-SnP.h +0 -31
  95. data/ext/xkcp/lib/low/KeccakP-1600/ARMv8A/KeccakP-1600-armv8a-neon.s +0 -540
  96. data/ext/xkcp/lib/low/KeccakP-1600/AVR8/KeccakP-1600-SnP.h +0 -42
  97. data/ext/xkcp/lib/low/KeccakP-1600/AVR8/KeccakP-1600-avr8-compact.s +0 -733
  98. data/ext/xkcp/lib/low/KeccakP-1600/AVR8/KeccakP-1600-avr8-fast.s +0 -1121
  99. data/ext/xkcp/lib/low/KeccakP-1600/AVX2/KeccakP-1600-SnP.h +0 -52
  100. data/ext/xkcp/lib/low/KeccakP-1600/AVX512/C/KeccakP-1600-AVX512.c +0 -623
  101. data/ext/xkcp/lib/low/KeccakP-1600/AVX512/C/KeccakP-1600-SnP.h +0 -47
  102. data/ext/xkcp/lib/low/KeccakP-1600/AVX512/C/u12/KeccakP-1600-AVX512-config.h +0 -6
  103. data/ext/xkcp/lib/low/KeccakP-1600/AVX512/C/u6/KeccakP-1600-AVX512-config.h +0 -6
  104. data/ext/xkcp/lib/low/KeccakP-1600/AVX512/C/ua/KeccakP-1600-AVX512-config.h +0 -6
  105. data/ext/xkcp/lib/low/KeccakP-1600/AVX512/KeccakP-1600-AVX512.s +0 -1031
  106. data/ext/xkcp/lib/low/KeccakP-1600/AVX512/KeccakP-1600-SnP.h +0 -53
  107. data/ext/xkcp/lib/low/KeccakP-1600/XOP/KeccakP-1600-SnP.h +0 -44
  108. data/ext/xkcp/lib/low/KeccakP-1600/XOP/KeccakP-1600-XOP.c +0 -476
  109. data/ext/xkcp/lib/low/KeccakP-1600/XOP/u6/KeccakP-1600-XOP-config.h +0 -6
  110. data/ext/xkcp/lib/low/KeccakP-1600/XOP/ua/KeccakP-1600-XOP-config.h +0 -6
  111. data/ext/xkcp/lib/low/KeccakP-1600/common/KeccakP-1600-unrolling.macros +0 -305
  112. data/ext/xkcp/lib/low/KeccakP-1600/compact/KeccakP-1600-compact64.c +0 -420
  113. data/ext/xkcp/lib/low/KeccakP-1600/plain-32bits-inplace/KeccakP-1600-SnP.h +0 -43
  114. data/ext/xkcp/lib/low/KeccakP-1600/plain-64bits/KeccakP-1600-opt64.c +0 -565
  115. data/ext/xkcp/lib/low/KeccakP-1600/plain-64bits/lcu6/KeccakP-1600-opt64-config.h +0 -7
  116. data/ext/xkcp/lib/low/KeccakP-1600/plain-64bits/lcua/KeccakP-1600-opt64-config.h +0 -7
  117. data/ext/xkcp/lib/low/KeccakP-1600/plain-64bits/lcua-shld/KeccakP-1600-opt64-config.h +0 -8
  118. data/ext/xkcp/lib/low/KeccakP-1600/plain-64bits/u6/KeccakP-1600-opt64-config.h +0 -6
  119. data/ext/xkcp/lib/low/KeccakP-1600/plain-64bits/ua/KeccakP-1600-opt64-config.h +0 -6
  120. data/ext/xkcp/lib/low/KeccakP-1600/ref-32bits/KeccakP-1600-SnP.h +0 -44
  121. data/ext/xkcp/lib/low/KeccakP-1600/ref-32bits/KeccakP-1600-reference.h +0 -23
  122. data/ext/xkcp/lib/low/KeccakP-1600/ref-32bits/KeccakP-1600-reference32BI.c +0 -625
  123. data/ext/xkcp/lib/low/KeccakP-1600/ref-64bits/KeccakP-1600-SnP.h +0 -44
  124. data/ext/xkcp/lib/low/KeccakP-1600/ref-64bits/KeccakP-1600-reference.c +0 -440
  125. data/ext/xkcp/lib/low/KeccakP-1600/x86-64/KeccakP-1600-SnP.h +0 -42
  126. data/ext/xkcp/lib/low/KeccakP-1600/x86-64/KeccakP-1600-x86-64-gas.s +0 -1196
  127. data/ext/xkcp/lib/low/KeccakP-1600/x86-64/KeccakP-1600-x86-64-gas_Apple.s +0 -1124
  128. data/ext/xkcp/lib/low/KeccakP-1600/x86-64/KeccakP-1600-x86-64-shld-gas.s +0 -1196
  129. data/ext/xkcp/lib/low/KeccakP-1600-times2/ARMv7A-NEON/KeccakP-1600-inplace-pl2-armv7a-neon-le-armcc.s +0 -1392
  130. data/ext/xkcp/lib/low/KeccakP-1600-times2/ARMv7A-NEON/KeccakP-1600-inplace-pl2-armv7a-neon-le-gcc.s +0 -1394
  131. data/ext/xkcp/lib/low/KeccakP-1600-times2/ARMv7A-NEON/KeccakP-1600-times2-SnP.h +0 -42
  132. data/ext/xkcp/lib/low/KeccakP-1600-times2/AVX512/AVX512u12/SIMD512-2-config.h +0 -7
  133. data/ext/xkcp/lib/low/KeccakP-1600-times2/AVX512/AVX512u4/SIMD512-2-config.h +0 -7
  134. data/ext/xkcp/lib/low/KeccakP-1600-times2/AVX512/AVX512ufull/SIMD512-2-config.h +0 -7
  135. data/ext/xkcp/lib/low/KeccakP-1600-times2/AVX512/KeccakP-1600-times2-SIMD512.c +0 -850
  136. data/ext/xkcp/lib/low/KeccakP-1600-times2/AVX512/KeccakP-1600-times2-SnP.h +0 -51
  137. data/ext/xkcp/lib/low/KeccakP-1600-times2/SIMD128/KeccakP-1600-times2-SIMD128.c +0 -957
  138. data/ext/xkcp/lib/low/KeccakP-1600-times2/SIMD128/KeccakP-1600-times2-SnP.h +0 -49
  139. data/ext/xkcp/lib/low/KeccakP-1600-times2/SIMD128/SSSE3-u2/SIMD128-config.h +0 -8
  140. data/ext/xkcp/lib/low/KeccakP-1600-times2/SIMD128/SSSE3-ua/SIMD128-config.h +0 -8
  141. data/ext/xkcp/lib/low/KeccakP-1600-times2/SIMD128/XOP-u2/SIMD128-config.h +0 -9
  142. data/ext/xkcp/lib/low/KeccakP-1600-times2/SIMD128/XOP-ua/SIMD128-config.h +0 -9
  143. data/ext/xkcp/lib/low/KeccakP-1600-times2/fallback-on1/KeccakP-1600-times2-SnP.h +0 -45
  144. data/ext/xkcp/lib/low/KeccakP-1600-times2/fallback-on1/KeccakP-1600-times2-on1.c +0 -37
  145. data/ext/xkcp/lib/low/KeccakP-1600-times4/AVX2/KeccakP-1600-times4-SIMD256.c +0 -1321
  146. data/ext/xkcp/lib/low/KeccakP-1600-times4/AVX2/KeccakP-1600-times4-SnP.h +0 -55
  147. data/ext/xkcp/lib/low/KeccakP-1600-times4/AVX2/u12/SIMD256-config.h +0 -7
  148. data/ext/xkcp/lib/low/KeccakP-1600-times4/AVX2/u6/SIMD256-config.h +0 -7
  149. data/ext/xkcp/lib/low/KeccakP-1600-times4/AVX2/ua/SIMD256-config.h +0 -7
  150. data/ext/xkcp/lib/low/KeccakP-1600-times4/AVX512/AVX512u12/SIMD512-4-config.h +0 -7
  151. data/ext/xkcp/lib/low/KeccakP-1600-times4/AVX512/AVX512u4/SIMD512-4-config.h +0 -7
  152. data/ext/xkcp/lib/low/KeccakP-1600-times4/AVX512/AVX512ufull/SIMD512-4-config.h +0 -7
  153. data/ext/xkcp/lib/low/KeccakP-1600-times4/AVX512/KeccakP-1600-times4-SIMD512.c +0 -881
  154. data/ext/xkcp/lib/low/KeccakP-1600-times4/AVX512/KeccakP-1600-times4-SnP.h +0 -51
  155. data/ext/xkcp/lib/low/KeccakP-1600-times4/fallback-on1/KeccakP-1600-times4-SnP.h +0 -45
  156. data/ext/xkcp/lib/low/KeccakP-1600-times4/fallback-on1/KeccakP-1600-times4-on1.c +0 -37
  157. data/ext/xkcp/lib/low/KeccakP-1600-times4/fallback-on2/KeccakP-1600-times4-SnP.h +0 -45
  158. data/ext/xkcp/lib/low/KeccakP-1600-times4/fallback-on2/KeccakP-1600-times4-on2.c +0 -38
  159. data/ext/xkcp/lib/low/KeccakP-1600-times8/AVX512/KeccakP-1600-times8-SIMD512.c +0 -1615
  160. data/ext/xkcp/lib/low/KeccakP-1600-times8/AVX512/KeccakP-1600-times8-SnP.h +0 -57
  161. data/ext/xkcp/lib/low/KeccakP-1600-times8/AVX512/u12/SIMD512-config.h +0 -7
  162. data/ext/xkcp/lib/low/KeccakP-1600-times8/AVX512/u4/SIMD512-config.h +0 -7
  163. data/ext/xkcp/lib/low/KeccakP-1600-times8/AVX512/ua/SIMD512-config.h +0 -7
  164. data/ext/xkcp/lib/low/KeccakP-1600-times8/fallback-on1/KeccakP-1600-times8-SnP.h +0 -45
  165. data/ext/xkcp/lib/low/KeccakP-1600-times8/fallback-on1/KeccakP-1600-times8-on1.c +0 -37
  166. data/ext/xkcp/lib/low/KeccakP-1600-times8/fallback-on2/KeccakP-1600-times8-SnP.h +0 -45
  167. data/ext/xkcp/lib/low/KeccakP-1600-times8/fallback-on2/KeccakP-1600-times8-on2.c +0 -38
  168. data/ext/xkcp/lib/low/KeccakP-1600-times8/fallback-on4/KeccakP-1600-times8-SnP.h +0 -45
  169. data/ext/xkcp/lib/low/KeccakP-1600-times8/fallback-on4/KeccakP-1600-times8-on4.c +0 -38
  170. data/ext/xkcp/lib/low/KeccakP-200/ARM/KeccakP-200-SnP.h +0 -41
  171. data/ext/xkcp/lib/low/KeccakP-200/ARM/KeccakP-200-armv6m-le-armcc.s +0 -442
  172. data/ext/xkcp/lib/low/KeccakP-200/ARM/KeccakP-200-armv6m-le-gcc.s +0 -446
  173. data/ext/xkcp/lib/low/KeccakP-200/ARM/KeccakP-200-armv7m-le-armcc.s +0 -419
  174. data/ext/xkcp/lib/low/KeccakP-200/ARM/KeccakP-200-armv7m-le-gcc.s +0 -427
  175. data/ext/xkcp/lib/low/KeccakP-200/AVR8/KeccakP-200-SnP.h +0 -41
  176. data/ext/xkcp/lib/low/KeccakP-200/AVR8/KeccakP-200-avr8-fast.s +0 -647
  177. data/ext/xkcp/lib/low/KeccakP-200/compact/KeccakP-200-SnP.h +0 -39
  178. data/ext/xkcp/lib/low/KeccakP-200/compact/KeccakP-200-compact.c +0 -190
  179. data/ext/xkcp/lib/low/KeccakP-200/ref/KeccakP-200-SnP.h +0 -43
  180. data/ext/xkcp/lib/low/KeccakP-200/ref/KeccakP-200-reference.c +0 -412
  181. data/ext/xkcp/lib/low/KeccakP-200/ref/KeccakP-200-reference.h +0 -23
  182. data/ext/xkcp/lib/low/KeccakP-400/ARM/KeccakP-400-SnP.h +0 -41
  183. data/ext/xkcp/lib/low/KeccakP-400/ARM/KeccakP-400-armv6m-le-armcc.s +0 -454
  184. data/ext/xkcp/lib/low/KeccakP-400/ARM/KeccakP-400-armv6m-le-gcc.s +0 -458
  185. data/ext/xkcp/lib/low/KeccakP-400/ARM/KeccakP-400-armv7m-le-armcc.s +0 -455
  186. data/ext/xkcp/lib/low/KeccakP-400/ARM/KeccakP-400-armv7m-le-gcc.s +0 -458
  187. data/ext/xkcp/lib/low/KeccakP-400/AVR8/KeccakP-400-SnP.h +0 -41
  188. data/ext/xkcp/lib/low/KeccakP-400/AVR8/KeccakP-400-avr8-fast.s +0 -728
  189. data/ext/xkcp/lib/low/KeccakP-400/ref/KeccakP-400-SnP.h +0 -43
  190. data/ext/xkcp/lib/low/KeccakP-400/ref/KeccakP-400-reference.c +0 -414
  191. data/ext/xkcp/lib/low/KeccakP-400/ref/KeccakP-400-reference.h +0 -23
  192. data/ext/xkcp/lib/low/KeccakP-800/ARM/KeccakP-800-SnP.h +0 -42
  193. data/ext/xkcp/lib/low/KeccakP-800/ARM/KeccakP-800-u1-armv6m-le-armcc.s +0 -527
  194. data/ext/xkcp/lib/low/KeccakP-800/ARM/KeccakP-800-u1-armv6m-le-gcc.s +0 -533
  195. data/ext/xkcp/lib/low/KeccakP-800/ARM/KeccakP-800-u2-armv6m-le-armcc.s +0 -528
  196. data/ext/xkcp/lib/low/KeccakP-800/ARM/KeccakP-800-u2-armv6m-le-gcc.s +0 -534
  197. data/ext/xkcp/lib/low/KeccakP-800/ARM/KeccakP-800-u2-armv7a-le-armcc.s +0 -521
  198. data/ext/xkcp/lib/low/KeccakP-800/ARM/KeccakP-800-u2-armv7a-le-gcc.s +0 -527
  199. data/ext/xkcp/lib/low/KeccakP-800/ARM/KeccakP-800-u2-armv7m-le-armcc.s +0 -517
  200. data/ext/xkcp/lib/low/KeccakP-800/ARM/KeccakP-800-u2-armv7m-le-gcc.s +0 -523
  201. data/ext/xkcp/lib/low/KeccakP-800/ARM/KeccakP-800-uf-armv7m-le-armcc.s +0 -550
  202. data/ext/xkcp/lib/low/KeccakP-800/ARM/KeccakP-800-uf-armv7m-le-gcc.s +0 -556
  203. data/ext/xkcp/lib/low/KeccakP-800/ARMv8A/KeccakP-800-SnP.h +0 -32
  204. data/ext/xkcp/lib/low/KeccakP-800/ARMv8A/KeccakP-800-armv8a-neon.s +0 -432
  205. data/ext/xkcp/lib/low/KeccakP-800/AVR8/KeccakP-800-SnP.h +0 -42
  206. data/ext/xkcp/lib/low/KeccakP-800/AVR8/KeccakP-800-avr8-fast.s +0 -929
  207. data/ext/xkcp/lib/low/KeccakP-800/compact/KeccakP-800-SnP.h +0 -40
  208. data/ext/xkcp/lib/low/KeccakP-800/compact/KeccakP-800-compact.c +0 -244
  209. data/ext/xkcp/lib/low/KeccakP-800/plain/KeccakP-800-SnP.h +0 -46
  210. data/ext/xkcp/lib/low/KeccakP-800/plain/KeccakP-800-opt32-bis.macros +0 -184
  211. data/ext/xkcp/lib/low/KeccakP-800/plain/KeccakP-800-opt32.c +0 -454
  212. data/ext/xkcp/lib/low/KeccakP-800/plain/KeccakP-800-opt32.macros +0 -459
  213. data/ext/xkcp/lib/low/KeccakP-800/plain/KeccakP-800-unrolling-bis.macros +0 -83
  214. data/ext/xkcp/lib/low/KeccakP-800/plain/KeccakP-800-unrolling.macros +0 -88
  215. data/ext/xkcp/lib/low/KeccakP-800/plain/lcu2/KeccakP-800-opt32-config.h +0 -7
  216. data/ext/xkcp/lib/low/KeccakP-800/plain/lcua/KeccakP-800-opt32-config.h +0 -7
  217. data/ext/xkcp/lib/low/KeccakP-800/plain/u2/KeccakP-800-opt32-config.h +0 -7
  218. data/ext/xkcp/lib/low/KeccakP-800/plain/ua/KeccakP-800-opt32-config.h +0 -7
  219. data/ext/xkcp/lib/low/KeccakP-800/ref/KeccakP-800-SnP.h +0 -44
  220. data/ext/xkcp/lib/low/KeccakP-800/ref/KeccakP-800-reference.c +0 -437
  221. data/ext/xkcp/lib/low/KeccakP-800/ref/KeccakP-800-reference.h +0 -23
  222. data/ext/xkcp/lib/low/Ketje/OptimizedAsmARM/Ket.h +0 -57
  223. data/ext/xkcp/lib/low/Ketje/OptimizedAsmARM/KetjeJr-armv7m-le-armcc.s +0 -475
  224. data/ext/xkcp/lib/low/Ketje/OptimizedAsmARM/KetjeJr-armv7m-le-gcc.s +0 -480
  225. data/ext/xkcp/lib/low/Ketje/OptimizedAsmARM/KetjeSr-armv7m-le-armcc.s +0 -590
  226. data/ext/xkcp/lib/low/Ketje/OptimizedAsmARM/KetjeSr-armv7m-le-gcc.s +0 -590
  227. data/ext/xkcp/lib/low/Ketje/OptimizedLE/Ket.c +0 -126
  228. data/ext/xkcp/lib/low/Ketje/OptimizedLE/Ket.h +0 -68
  229. data/ext/xkcp/lib/low/Ketje/OptimizedLE/Ket.inc +0 -174
  230. data/ext/xkcp/lib/low/Ketje/SnP-compliant/Ket.c +0 -80
  231. data/ext/xkcp/lib/low/Ketje/SnP-compliant/Ket.h +0 -68
  232. data/ext/xkcp/lib/low/Ketje/SnP-compliant/Ket.inc +0 -142
  233. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodoo-SnP.h +0 -55
  234. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodoo-u1-armv6m-le-armcc.s +0 -1086
  235. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodoo-u1-armv6m-le-gcc.s +0 -1092
  236. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodoo-uf-armv6-le-armcc.s +0 -721
  237. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodoo-uf-armv6-le-gcc.s +0 -726
  238. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodoo-uf-armv7m-le-armcc.s +0 -723
  239. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodoo-uf-armv7m-le-gcc.s +0 -729
  240. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodyak-u1-armv6m-le-armcc.s +0 -1164
  241. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodyak-u1-armv6m-le-gcc.s +0 -1165
  242. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodyak-uf-armv6-le-armcc.s +0 -562
  243. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodyak-uf-armv6-le-gcc.s +0 -563
  244. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodyak-uf-armv7m-le-armcc.s +0 -563
  245. data/ext/xkcp/lib/low/Xoodoo/ARM/Xoodyak-uf-armv7m-le-gcc.s +0 -565
  246. data/ext/xkcp/lib/low/Xoodoo/ARMv7A-NEON/Xoodoo-SnP.h +0 -55
  247. data/ext/xkcp/lib/low/Xoodoo/ARMv7A-NEON/Xoodoo-uf-armv7a-neon-le-armcc.s +0 -476
  248. data/ext/xkcp/lib/low/Xoodoo/ARMv7A-NEON/Xoodoo-uf-armv7a-neon-le-gcc.s +0 -485
  249. data/ext/xkcp/lib/low/Xoodoo/ARMv7A-NEON/Xoodyak-uf-armv7a-neon-le-armcc.s +0 -362
  250. data/ext/xkcp/lib/low/Xoodoo/ARMv7A-NEON/Xoodyak-uf-armv7a-neon-le-gcc.s +0 -367
  251. data/ext/xkcp/lib/low/Xoodoo/AVR8/Xoodoo-SnP.h +0 -43
  252. data/ext/xkcp/lib/low/Xoodoo/AVR8/Xoodoo-avr8-u1.s +0 -1341
  253. data/ext/xkcp/lib/low/Xoodoo/AVX512/Xoodoo-SIMD512.c +0 -581
  254. data/ext/xkcp/lib/low/Xoodoo/AVX512/Xoodoo-SnP.h +0 -58
  255. data/ext/xkcp/lib/low/Xoodoo/AVX512/Xoodyak-full-block-SIMD512.c +0 -332
  256. data/ext/xkcp/lib/low/Xoodoo/SSE2/Xoodoo-SIMD128.c +0 -329
  257. data/ext/xkcp/lib/low/Xoodoo/SSE2/Xoodoo-SnP.h +0 -53
  258. data/ext/xkcp/lib/low/Xoodoo/SSE2/Xoodyak-full-block-SIMD128.c +0 -355
  259. data/ext/xkcp/lib/low/Xoodoo/Xoodoo.h +0 -79
  260. data/ext/xkcp/lib/low/Xoodoo/plain/Xoodoo-SnP.h +0 -56
  261. data/ext/xkcp/lib/low/Xoodoo/plain/Xoodoo-optimized.c +0 -399
  262. data/ext/xkcp/lib/low/Xoodoo/plain/Xoodyak-full-blocks.c +0 -127
  263. data/ext/xkcp/lib/low/Xoodoo/ref/Xoodoo-SnP.h +0 -43
  264. data/ext/xkcp/lib/low/Xoodoo/ref/Xoodoo-reference.c +0 -253
  265. data/ext/xkcp/lib/low/Xoodoo-times16/AVX512/Xoodoo-times16-SIMD512.c +0 -1044
  266. data/ext/xkcp/lib/low/Xoodoo-times16/AVX512/Xoodoo-times16-SnP.h +0 -49
  267. data/ext/xkcp/lib/low/Xoodoo-times16/fallback-on1/Xoodoo-times16-SnP.h +0 -45
  268. data/ext/xkcp/lib/low/Xoodoo-times16/fallback-on1/Xoodoo-times16-on1.c +0 -37
  269. data/ext/xkcp/lib/low/Xoodoo-times4/ARMv7A-NEON/Xoodoo-times4-ARMv7A.s +0 -1587
  270. data/ext/xkcp/lib/low/Xoodoo-times4/ARMv7A-NEON/Xoodoo-times4-SnP.h +0 -48
  271. data/ext/xkcp/lib/low/Xoodoo-times4/AVX512/Xoodoo-times4-SIMD512.c +0 -1202
  272. data/ext/xkcp/lib/low/Xoodoo-times4/AVX512/Xoodoo-times4-SnP.h +0 -48
  273. data/ext/xkcp/lib/low/Xoodoo-times4/SSSE3/Xoodoo-times4-SIMD128.c +0 -484
  274. data/ext/xkcp/lib/low/Xoodoo-times4/SSSE3/Xoodoo-times4-SnP.h +0 -44
  275. data/ext/xkcp/lib/low/Xoodoo-times4/fallback-on1/Xoodoo-times4-SnP.h +0 -45
  276. data/ext/xkcp/lib/low/Xoodoo-times4/fallback-on1/Xoodoo-times4-on1.c +0 -37
  277. data/ext/xkcp/lib/low/Xoodoo-times8/AVX2/Xoodoo-times8-SIMD256.c +0 -939
  278. data/ext/xkcp/lib/low/Xoodoo-times8/AVX2/Xoodoo-times8-SnP.h +0 -49
  279. data/ext/xkcp/lib/low/Xoodoo-times8/AVX512/Xoodoo-times8-SIMD512.c +0 -1216
  280. data/ext/xkcp/lib/low/Xoodoo-times8/AVX512/Xoodoo-times8-SnP.h +0 -48
  281. data/ext/xkcp/lib/low/Xoodoo-times8/fallback-on1/Xoodoo-times8-SnP.h +0 -45
  282. data/ext/xkcp/lib/low/Xoodoo-times8/fallback-on1/Xoodoo-times8-on1.c +0 -37
  283. data/ext/xkcp/lib/low/common/PlSnP-Fallback.inc +0 -290
  284. data/ext/xkcp/lib/low/common/SnP-Relaned.h +0 -141
  285. data/ext/xkcp/support/Kernel-PMU/Kernel-pmu.md +0 -133
  286. data/ext/xkcp/support/Kernel-PMU/Makefile +0 -8
  287. data/ext/xkcp/support/Kernel-PMU/enable_arm_pmu.c +0 -129
  288. data/ext/xkcp/support/Kernel-PMU/load-module +0 -1
  289. data/ext/xkcp/util/KeccakSum/KeccakSum.c +0 -394
  290. data/ext/xkcp/util/KeccakSum/base64.c +0 -86
  291. data/ext/xkcp/util/KeccakSum/base64.h +0 -12
@@ -1,728 +0,0 @@
1
- ;
2
- ; The eXtended Keccak Code Package (XKCP)
3
- ; https://github.com/XKCP/XKCP
4
- ;
5
- ; The Keccak-p permutations, designed by Guido Bertoni, Joan Daemen, Michaël Peeters and Gilles Van Assche.
6
- ;
7
- ; Implementation by Ronny Van Keer, hereby denoted as "the implementer".
8
- ;
9
- ; For more information, feedback or questions, please refer to the Keccak Team website:
10
- ; https://keccak.team/
11
- ;
12
- ; To the extent possible under law, the implementer has waived all copyright
13
- ; and related or neighboring rights to the source code in this file.
14
- ; http://creativecommons.org/publicdomain/zero/1.0/
15
- ;
16
- ; ---
17
- ;
18
- ; This file implements Keccak-p[400] in a SnP-compatible way.
19
- ; Please refer to SnP-documentation.h for more details.
20
- ;
21
- ; This implementation comes with KeccakP-400-SnP.h in the same folder.
22
- ; Please refer to LowLevel.build for the exact list of other files it must be combined with.
23
- ;
24
-
25
- ; INFO: Tested on ATmega1280 simulator
26
-
27
- ; Registers used in all routines
28
- #define zero 1 //; register r1, used as the zero operand of adc/st (the permutation clears it with clr)
29
- #define rpState 24 //; r24:r25, the pair in which the state pointer argument arrives
30
- #define rX 26 //; r26:r27, low register of the X pointer pair
31
- #define rY 28 //; r28:r29, low register of the Y pointer pair
32
- #define rZ 30 //; r30:r31, low register of the Z pointer pair
33
- #define sp 0x3D //; I/O address accessed with in/out as the stack pointer low byte (high byte at sp+1)
34
-
35
- ;----------------------------------------------------------------------------
36
- ;
37
- ; void KeccakP400_StaticInitialize( void )
38
- ;
39
- .global KeccakP400_StaticInitialize
40
-
41
- ;----------------------------------------------------------------------------
42
- ;
43
- ; void KeccakP400_Initialize(void *state)
44
- ;
45
- ; argument state is passed in r24:r25
46
- ;
47
- .global KeccakP400_Initialize ; zero-fills the 50-byte state addressed by r24:r25
48
- KeccakP400_Initialize:
49
- movw rZ, r24 ; Z = state pointer
50
- ldi r23, 2*5 ; clear state (5 bytes/2.5 lanes per iteration), 10 iterations = 50 bytes
51
- KeccakP400_Initialize_Loop:
52
- st z+, zero ; store r1 and advance Z; NOTE(review): assumes r1 holds 0 on entry, it is not cleared here - confirm against the calling convention
53
- st z+, zero
54
- st z+, zero
55
- st z+, zero
56
- st z+, zero
57
- dec r23 ; one group of 5 bytes done
58
- brne KeccakP400_Initialize_Loop ; repeat until the counter reaches 0
59
- KeccakP400_StaticInitialize: ; entry point that only returns: it shares the ret below
60
- ret
61
-
62
- ;----------------------------------------------------------------------------
63
- ;
64
- ; void KeccakP400_AddByte(void *state, unsigned char data, unsigned int offset)
65
- ;
66
- ; argument state is passed in r24:r25
67
- ; argument data is passed in r22:r23, only LSB (r22) is used
68
- ; argument offset is passed in r20:r21, only LSB (r20) is used
69
- ;
70
- .global KeccakP400_AddByte ; XORs one data byte into the state byte at the given offset
71
- KeccakP400_AddByte:
72
- movw rZ, r24 ; Z = state pointer
73
- add rZ, r20 ; Z += offset (low byte of offset only)
74
- adc rZ+1, zero ; propagate the carry into the high byte of Z (relies on r1 being 0)
75
- ld r0, Z ; r0 = current state byte
76
- eor r0, r22 ; r0 ^= data
77
- st Z, r0 ; write the result back in place
78
- ret
79
-
80
- ;----------------------------------------------------------------------------
81
- ;
82
- ; void KeccakP400_AddBytes(void *state, const unsigned char *data, unsigned int offset, unsigned int length)
83
- ;
84
- ; argument state is passed in r24:r25
85
- ; argument data is passed in r22:r23
86
- ; argument offset is passed in r20:r21, only LSB (r20) is used
87
- ; argument length is passed in r18:r19, only LSB (r18) is used
88
- ;
89
- .global KeccakP400_AddBytes ; XORs length bytes from data into the state, starting at byte offset
90
- KeccakP400_AddBytes:
91
- tst r18 ; length (low byte) equal to 0 ?
92
- breq KeccakP400_AddBytes_End ; yes: nothing to do
93
- movw rZ, r24 ; Z = state pointer
94
- add rZ, r20 ; Z += offset (low byte of offset only)
95
- adc rZ+1, zero ; propagate the carry into the high byte of Z
96
- movw rX, r22 ; X = data pointer
97
- KeccakP400_AddBytes_Loop:
98
- ld r21, X+ ; r21 = next input byte (r21 is free: only r20 of the offset is used)
99
- ld r0, Z ; r0 = current state byte
100
- eor r0, r21 ; combine them
101
- st Z+, r0 ; store back and advance Z
102
- dec r18 ; 8-bit down counter, so at most 255 bytes per call
103
- brne KeccakP400_AddBytes_Loop
104
- KeccakP400_AddBytes_End:
105
- ret
106
-
107
- ;----------------------------------------------------------------------------
108
- ;
109
- ; void KeccakP400_OverwriteBytes(void *state, const unsigned char *data, unsigned int offset, unsigned int length)
110
- ;
111
- ; argument state is passed in r24:r25
112
- ; argument data is passed in r22:r23
113
- ; argument offset is passed in r20:r21, only LSB (r20) is used
114
- ; argument length is passed in r18:r19, only LSB (r18) is used
115
- ;
116
- .global KeccakP400_OverwriteBytes ; copies length bytes from data over the state, starting at byte offset
117
- KeccakP400_OverwriteBytes:
118
- tst r18 ; length (low byte) equal to 0 ?
119
- breq KeccakP400_OverwriteBytes_End ; yes: nothing to do
120
- movw rZ, r24 ; Z = state pointer
121
- add rZ, r20 ; Z += offset (low byte of offset only)
122
- adc rZ+1, zero ; propagate the carry into the high byte of Z
123
- movw rX, r22 ; X = data pointer
124
- KeccakP400_OverwriteBytes_Loop:
125
- ld r0, X+ ; r0 = next input byte
126
- st Z+, r0 ; replace the state byte and advance Z
127
- dec r18 ; 8-bit down counter, so at most 255 bytes per call
128
- brne KeccakP400_OverwriteBytes_Loop
129
- KeccakP400_OverwriteBytes_End:
130
- ret
131
-
132
- ;----------------------------------------------------------------------------
133
- ;
134
- ; void KeccakP400_OverwriteWithZeroes(void *state, unsigned int byteCount)
135
- ;
136
- ; argument state is passed in r24:r25
137
- ; argument byteCount is passed in r22:r23, only LSB (r22) is used
138
- ;
139
- .global KeccakP400_OverwriteWithZeroes ; zeroes the first byteCount bytes of the state
140
- KeccakP400_OverwriteWithZeroes:
141
- movw rZ, r24 ; rZ = state
142
- mov r23, r22 ; r23 = byteCount (low byte)
143
- lsr r23
144
- lsr r23 ; r23 = byteCount / 4 = number of 4-byte groups
145
- breq KeccakP400_OverwriteWithZeroes_Bytes ; fewer than 4 bytes: only the tail loop is needed
146
- KeccakP400_OverwriteWithZeroes_Loop2Lanes: ; each pass clears 4 bytes (two 2-byte lanes)
147
- st Z+, r1 ; r1 is the register the zero macro names; assumed to hold 0 on entry
148
- st Z+, r1
149
- st Z+, r1
150
- st Z+, r1
151
- dec r23
152
- brne KeccakP400_OverwriteWithZeroes_Loop2Lanes
153
- KeccakP400_OverwriteWithZeroes_Bytes:
154
- andi r22, 3 ; r22 = byteCount modulo 4 = leftover bytes
155
- breq KeccakP400_OverwriteWithZeroes_End ; none left
156
- KeccakP400_OverwriteWithZeroes_LoopBytes: ; clears the remaining 1 to 3 bytes one at a time
157
- st Z+, r1
158
- dec r22
159
- brne KeccakP400_OverwriteWithZeroes_LoopBytes
160
- KeccakP400_OverwriteWithZeroes_End:
161
- ret
162
-
163
- ;----------------------------------------------------------------------------
164
- ;
165
- ; void KeccakP400_ExtractBytes(const void *state, unsigned char *data, unsigned int offset, unsigned int length)
166
- ;
167
- ; argument state is passed in r24:r25
168
- ; argument data is passed in r22:r23
169
- ; argument offset is passed in r20:r21, only LSB (r20) is used
170
- ; argument length is passed in r18:r19, only LSB (r18) is used
171
- ;
172
- .global KeccakP400_ExtractBytes ; copies length state bytes, starting at byte offset, into the data buffer
173
- KeccakP400_ExtractBytes:
174
- tst r18 ; length (low byte) equal to 0 ?
175
- breq KeccakP400_ExtractBytes_End ; yes: nothing to do
176
- movw rZ, r24 ; Z = state pointer
177
- add rZ, r20 ; Z += offset (low byte of offset only)
178
- adc rZ+1, zero ; propagate the carry into the high byte of Z
179
- movw rX, r22 ; X = destination buffer (data)
180
- KeccakP400_ExtractBytes_Loop:
181
- ld r0, Z+ ; r0 = next state byte
182
- st X+, r0 ; write it to the destination
183
- dec r18 ; 8-bit down counter, so at most 255 bytes per call
184
- brne KeccakP400_ExtractBytes_Loop
185
- KeccakP400_ExtractBytes_End:
186
- ret
187
-
188
- ;----------------------------------------------------------------------------
189
- ;
190
- ; void KeccakP400_ExtractAndAddBytes(void *state, const unsigned char *input, unsigned char *output, unsigned int offset, unsigned int length)
191
- ;
192
- ; argument state is passed in r24:r25
193
- ; argument input is passed in r22:r23
194
- ; argument output is passed in r20:r21
195
- ; argument offset is passed in r18:r19, only LSB (r18) is used
196
- ; argument length is passed in r16:r17, only LSB (r16) is used
197
- ;
198
- .global KeccakP400_ExtractAndAddBytes ; output[i] = input[i] XOR state[offset + i] for length bytes
199
- KeccakP400_ExtractAndAddBytes:
200
- tst r16 ; length (low byte) equal to 0 ?
201
- breq KeccakP400_ExtractAndAddBytes_End ; yes: return before anything is pushed
202
- push r16 ; r16 (counter) and r28:r29 (Y) are modified below, so save them
203
- push r28
204
- push r29
205
- movw rZ, r24 ; Z = state pointer
206
- add rZ, r18 ; Z += offset (low byte of offset only)
207
- adc rZ+1, zero ; propagate the carry into the high byte of Z
208
- movw rX, r22 ; X = input pointer
209
- movw rY, r20 ; Y = output pointer; r21 becomes free as scratch after this copy
210
- subi r16, 2 ; at least 2 bytes to process ?
211
- brcs KeccakP400_ExtractAndAddBytes_Byte ; borrow: length was 1, skip the 2-byte loop
212
- KeccakP400_ExtractAndAddBytes_LoopLane: ; handles 2 bytes (one 2-byte lane) per pass
213
- ld r21, Z+ ; state byte
214
- ld r0, X+ ; input byte
215
- eor r0, r21
216
- st Y+, r0 ; output byte
217
- ld r21, Z+ ; second byte of the pair, same sequence
218
- ld r0, X+
219
- eor r0, r21
220
- st Y+, r0
221
- subi r16, 2 ; two more bytes available ?
222
- brcc KeccakP400_ExtractAndAddBytes_LoopLane ; no borrow: run another pass
223
- KeccakP400_ExtractAndAddBytes_Byte:
224
- ldi r19, 2
225
- add r16, r19 ; undo the last subtraction: r16 = remaining bytes (0 or 1)
226
- breq KeccakP400_ExtractAndAddBytes_Done ; no odd byte left
227
- KeccakP400_ExtractAndAddBytes_Loop1: ; handles the trailing single byte
228
- ld r21, Z+
229
- ld r0, X+
230
- eor r0, r21
231
- st Y+, r0
232
- dec r16
233
- brne KeccakP400_ExtractAndAddBytes_Loop1
234
- KeccakP400_ExtractAndAddBytes_Done:
235
- pop r29 ; restore in reverse push order
236
- pop r28
237
- pop r16
238
- KeccakP400_ExtractAndAddBytes_End:
239
- ret
240
-
241
-
242
- #define ROT_BIT(a) ((a) & 7) //; a modulo 8
243
- #define ROT_BYTE(a) (((a)/8 + !!(((a)%8) > 4)) & 1) //; low bit of (a/8, plus one when a modulo 8 exceeds 4)
244
-
245
- KeccakP400_RhoPiConstants: ; 24 rows of 3 bytes. NOTE(review): presumably read by the rho/pi step of the permutation; the third column looks like a lane index times 2 (byte offset of a 2-byte lane) - confirm against the code that reads this table
246
- .BYTE ROT_BIT( 1), ROT_BYTE( 3), 10 * 2
247
- .BYTE ROT_BIT( 3), ROT_BYTE( 6), 7 * 2
248
- .BYTE ROT_BIT( 6), ROT_BYTE(10), 11 * 2
249
- .BYTE ROT_BIT(10), ROT_BYTE(15), 17 * 2
250
- .BYTE ROT_BIT(15), ROT_BYTE(21), 18 * 2
251
- .BYTE ROT_BIT(21), ROT_BYTE(28), 3 * 2
252
- .BYTE ROT_BIT(28), ROT_BYTE(36), 5 * 2
253
- .BYTE ROT_BIT(36), ROT_BYTE(45), 16 * 2
254
- .BYTE ROT_BIT(45), ROT_BYTE(55), 8 * 2
255
- .BYTE ROT_BIT(55), ROT_BYTE( 2), 21 * 2
256
- .BYTE ROT_BIT( 2), ROT_BYTE(14), 24 * 2
257
- .BYTE ROT_BIT(14), ROT_BYTE(27), 4 * 2
258
- .BYTE ROT_BIT(27), ROT_BYTE(41), 15 * 2
259
- .BYTE ROT_BIT(41), ROT_BYTE(56), 23 * 2
260
- .BYTE ROT_BIT(56), ROT_BYTE( 8), 19 * 2
261
- .BYTE ROT_BIT( 8), ROT_BYTE(25), 13 * 2
262
- .BYTE ROT_BIT(25), ROT_BYTE(43), 12 * 2
263
- .BYTE ROT_BIT(43), ROT_BYTE(62), 2 * 2
264
- .BYTE ROT_BIT(62), ROT_BYTE(18), 20 * 2
265
- .BYTE ROT_BIT(18), ROT_BYTE(39), 14 * 2
266
- .BYTE ROT_BIT(39), ROT_BYTE(61), 22 * 2
267
- .BYTE ROT_BIT(61), ROT_BYTE(20), 9 * 2
268
- .BYTE ROT_BIT(20), ROT_BYTE(44), 6 * 2
269
- .BYTE ROT_BIT(44), ROT_BYTE( 1), 1 * 2
270
-
271
- KeccakP400_RoundConstants_20: ; start of the 20-round table: 20 rows of 2 bytes, one 16-bit constant per row
272
- .BYTE 0x01, 0x00 ; low byte first: this row is 0x0001, the next one 0x8082
273
- .BYTE 0x82, 0x80
274
- .BYTE 0x8a, 0x80
275
- .BYTE 0x00, 0x80
276
- .BYTE 0x8b, 0x80
277
- .BYTE 0x01, 0x00
278
- .BYTE 0x81, 0x80
279
- .BYTE 0x09, 0x80
280
- .BYTE 0x8a, 0x00
281
- .BYTE 0x88, 0x00
282
- .BYTE 0x09, 0x80
283
- .BYTE 0x0a, 0x00
284
- .BYTE 0x8b, 0x80
285
- .BYTE 0x8b, 0x00
286
- .BYTE 0x89, 0x80
287
- .BYTE 0x03, 0x80
288
- .BYTE 0x02, 0x80
289
- .BYTE 0x80, 0x00
290
- .BYTE 0x0a, 0x80
291
- .BYTE 0x0a, 0x00
292
- KeccakP400_RoundConstants_N: ; end of the table: the Nrounds entry point starts 2*nr bytes before this label, i.e. at the last nr rows
293
- .BYTE 0xFF, 0 ; terminator
294
-
295
- .text
296
-
297
- #define pRound 22 //; 2 regs (22-23), loaded with the address of the first round constant to use
298
- #define pRound1 23 //; second register of the pRound pair (same register as pRound+1)
299
-
300
- ;----------------------------------------------------------------------------
301
- ;
302
- ; void KeccakP400_Permute_20rounds( void *state )
303
- ;
304
- .global KeccakP400_Permute_20rounds ; runs the permutation starting from the first row of the 20-round constant table
305
- KeccakP400_Permute_20rounds:
306
- ldi pRound, lo8(KeccakP400_RoundConstants_20) ; pRound (r22:r23) = address of the first round constant, low byte
307
- ldi pRound+1, hi8(KeccakP400_RoundConstants_20) ; high byte of the same address
308
- rjmp KeccakP400_Permute ; continue in the shared permutation body; the state pointer stays in r24:r25
309
-
310
- ;----------------------------------------------------------------------------
311
- ;
312
- ; void KeccakP400_Permute_Nrounds( void *state, unsigned int nr )
313
- ;
314
- ; argument state is passed in r24:r25
315
- ; argument nr is passed in r22:r23 (only the low byte r22 is used)
316
- ;
- ; Runs the last nr rounds: pRound is set to KeccakP400_RoundConstants_N - 2*nr
- ; and execution falls through into KeccakP400_Permute.
- ; nr == 0 returns at once with the state untouched. Without this guard the
- ; round loop, which checks for the terminator only after a round, would use
- ; the terminator bytes as a round constant and then read past the table.
- ; nr larger than 20 is not checked and would index before the table.
317
- .global KeccakP400_Permute_Nrounds
318
- KeccakP400_Permute_Nrounds:
- tst r22 ; nr == 0 ?
- brne KeccakP400_Permute_Nrounds_Setup
- ret ; nothing has been pushed yet, plain return
- KeccakP400_Permute_Nrounds_Setup:
319
- mov r0, r22 ; copy nr before pRound (r22:r23) is overwritten
320
- lsl r0 ; r0 = 2*nr, two table bytes per round
321
- ldi pRound, lo8(KeccakP400_RoundConstants_N)
322
- ldi pRound+1, hi8(KeccakP400_RoundConstants_N)
323
- sub pRound, r0
324
- sbc pRound+1, r1 ; borrow only; relies on r1 holding 0 on entry (avr-gcc zero register convention)
325
- KeccakP400_Permute: ; shared body; expects pRound (r22:r23) to point at the first round constant to use
326
- push r2 ; save r2-r17 and r28-r29; the matching pops before ret restore them in reverse order
327
- push r3
328
- push r4
329
- push r5
330
- push r6
331
- push r7
332
- push r8
333
- push r9
334
- push r10
335
- push r11
336
- push r12
337
- push r13
338
- push r14
339
- push r15
340
- push r16
341
- push r17
342
- push r28
343
- push r29
344
- ; NOTE(review): AVR push stores at [SP] and then decrements, so byte [SP] is the next push slot; the code below uses [SP] as the first C byte, which an interrupt could overwrite - confirm
345
- ; Allocate C variables (5*2): reserve 10 bytes on the stack for the five 16-bit column parities
346
- in rZ, sp ; read the 16-bit stack pointer into Z
347
- in rZ+1, sp+1
348
- sbiw rZ, 5*2 ; move it down by 10 bytes
349
- in r0, 0x3F ; save the status register (I/O address 0x3F, SREG) including the interrupt enable bit
350
- cli ; no interrupts while the two halves of the stack pointer are written
351
- out sp+1, rZ+1
352
- out sp, rZ ; Z points to 5 C lanes
353
- out 0x3F, r0 ; restore the saved status register
354
-
355
- ; Variables used in multiple operations (register number aliases for three scratch groups)
355
- #define rTemp 2 //; 8 regs (2-9)
356
- #define rTemp0 2
357
- #define rTemp1 3
358
- #define rTemp2 4
359
- #define rTemp3 5
360
- #define rTemp4 6
361
- #define rTemp5 7
362
- #define rTemp6 8
363
- #define rTemp7 9
364
- #define rTempBis 10 //; 8 regs (10-17)
365
- #define rTempBis0 10
366
- #define rTempBis1 11
367
- #define rTempBis2 12
368
- #define rTempBis3 13
369
- #define rTempBis4 14
370
- #define rTempBis5 15
371
- #define rTempBis6 16
372
- #define rTempBis7 17
373
- #define rTempTer 18 //; 4 regs (18-21)
374
- #define rTempTer0 18
375
- #define rTempTer1 19
376
-
377
- ; Initial Prepare Theta: fill the 10 C bytes, each the XOR of five state bytes spaced 10 bytes apart
378
- #define TCIPx rTempTer
379
-
380
- clr zero ; zero (macro defined outside this chunk) serves as constant 0 for the adc instructions below
381
- movw rY, rpState ; Y = state pointer (rpState is defined outside this chunk)
382
- ldi TCIPx, 5*2 ; 10 byte columns to process
383
- KeccakP_InitialPrepTheta_Loop:
384
- ld r0, Y ; byte at offset +0
385
- adiw rY, 10
386
- ld rTemp, Y ; byte at offset +10
387
- adiw rY, 10
388
- eor r0, rTemp
389
- ld rTemp, Y ; byte at offset +20
390
- adiw rY, 10
391
- eor r0, rTemp
392
- ld rTemp, Y ; byte at offset +30
393
- eor r0, rTemp
394
- ldd rTemp, Y+10 ; byte at offset +40
395
- eor r0, rTemp
396
- st Z+, r0 ; store the parity byte in the stack area (Z was set by the stack allocation)
397
- sbiw rY, 29 ; Y was advanced by 30, so this leaves it one byte past where the iteration started
398
- dec TCIPx
399
- brne KeccakP_InitialPrepTheta_Loop
400
- #undef TCIPx
402
-
403
- KeccakP_RoundLoop: ; top of one round; re-entered from the terminator check until the table ends
403
-
404
- ; Theta: for each of the 5 columns x, D = rol16(C[x+1], 1) ^ C[x-1] is XORed into the 5 lanes of column x
405
- #define TCplus rX
406
- #define TCplus1 rX1
407
- #define TCminus rZ
408
- #define TCminus1 rZ1
409
- #define TCcoordX rTempTer
410
- #define TCcoordY rTempTer1
411
-
412
- in TCminus, sp ; both pointers start at the C area on the stack
413
- in TCminus+1, sp+1
414
- movw TCplus, TCminus
415
- adiw TCminus, 4*2 ; TCminus -> C[4], the x-1 neighbour of column 0
416
- adiw TCplus, 1*2 ; TCplus -> C[1], the x+1 neighbour of column 0
417
- movw rY, rpState
418
- ldi TCcoordX, 0x16 ; bit pattern shifted right once per column; drives pointer wrap-around and loop exit
419
- KeccakTheta_Loop1:
420
- ld rTemp0, X+ ; load the 16-bit C[x+1]
421
- ld rTemp1, X+
422
-
423
- lsl rTemp0 ; rotate the 16-bit value left by one:
424
- rol rTemp1 ; carry out of the low byte goes into the high byte
425
- adc rTemp0, zero ; carry out of the high byte wraps into bit 0
426
-
427
- ld r0, Z+ ; XOR with C[x-1] to obtain D
428
- eor rTemp0, r0
429
- ld r0, Z+
430
- eor rTemp1, r0
431
-
432
- ldi TCcoordY, 5 ; five lanes per column
433
- KeccakTheta_Loop2:
434
- ld r0, Y
435
- eor r0, rTemp0
436
- st Y+, r0
437
- ld r0, Y
438
- eor r0, rTemp1
439
- st Y+, r0
440
- adiw rY, 8 ; skip to the same column in the next row (10 bytes per row)
441
-
442
- dec TCcoordY
443
- brne KeccakTheta_Loop2
444
-
445
- sbiw rY, 50-2 ; back to the first row, next column
446
-
447
- lsr TCcoordX ; shifted-out bit selects the action for the next column
448
- brcc local1 ; bit 0: one of the C pointers ran past C[4] and must wrap
449
- brne KeccakTheta_Loop1 ; bit 1 and pattern not yet empty: next column
450
- rjmp KeccakTheta_End ; bit 1 and pattern empty: all 5 columns done
451
- local1:
452
- cpi TCcoordX, 0x0B ; 0x0B is the value right after the first shift, i.e. after column 0
453
- brne local2
454
- sbiw TCminus, 10 ; after column 0: TCminus wraps from past C[4] back to C[0]
455
- rjmp KeccakTheta_Loop1
456
- local2:
457
- sbiw TCplus, 10 ; otherwise TCplus wraps back to C[0]
458
- rjmp KeccakTheta_Loop1
459
-
460
- KeccakTheta_End:
461
- #undef TCplus
462
- #undef TCminus
463
- #undef TCcoordX
464
- #undef TCcoordY
466
-
467
- ; Rho Pi: carry one lane in rTemp0:rTemp1, rotate it, store it at the table-given index and pick up the lane found there
467
- #define RPpConst rTempTer //; 2 regs
468
- #define RPindex rTempTer+2
469
- #define RPByteRot rTempTer+3
470
- #define RPpBitRot rX
471
-
472
- sbiw rY, 8 ; Theta leaves Y at state+10, so this points at byte offset 2 (lane 1)
473
- ld rTemp0, Y+ ; load the starting lane
474
- ld rTemp1, Y+
475
- ldi RPpConst, lo8(KeccakP400_RhoPiConstants) ; program-memory table of 3-byte entries
476
- ldi RPpConst+1, hi8(KeccakP400_RhoPiConstants)
477
- ldi RPpBitRot, pm_lo8(bit_rot_jmp_table) ; word address of the rotate dispatch table, for ijmp
478
- ldi RPpBitRot+1, pm_hi8(bit_rot_jmp_table)
479
-
480
- KeccakRhoPi_Loop:
481
- ; get rotation codes
482
- movw rZ, RPpConst
483
- lpm r0, Z+ ; get number of bits to rotate
484
- lpm RPByteRot, Z+ ; get number of bytes to rotate
485
- lpm RPindex, Z+ ; get index in state
486
- movw RPpConst, rZ ; remember the position of the next table entry
487
-
488
- ; do bit rotation
489
- movw rZ, RPpBitRot
490
- add rZ, r0 ; select the table slot given by the bit rotation code
491
- adc rZ+1, zero
492
- ijmp ; the selected routine ends by jumping to KeccakRhoPi_RhoBitRotateDone
493
-
494
- KeccakRhoPi_RhoBitRotateDone:
495
- movw rY, rpState
496
- add rY, RPindex ; Y = address of the destination lane
497
- adc rY+1, zero
498
-
499
- tst RPByteRot
500
- brne KeccakRhoPi_LoadSwapped
501
- ld rTempBis0, Y ; byte rotation code 0: pick up the displaced lane as it is
502
- ldd rTempBis1, Y+1
503
- st Y+, rTemp0 ; store the rotated lane in its place
504
- st Y+, rTemp1
505
- movw rTemp0, rTempBis0 ; the displaced lane becomes the carried lane
506
- subi RPindex, 2
507
- brne KeccakRhoPi_Loop ; the chain ends when the index just written was 2
508
- rjmp KeccakRhoPi_Done
509
- KeccakRhoPi_LoadSwapped:
510
- ld rTempBis1, Y ; nonzero byte rotation code: pick up the displaced lane with its two bytes swapped
511
- ldd rTempBis0, Y+1
512
- st Y+, rTemp0
513
- st Y+, rTemp1
514
- movw rTemp0, rTempBis0
515
- subi RPindex, 2
516
- brne KeccakRhoPi_Loop
517
- KeccakRhoPi_Done:
518
- ; NOTE(review): RPTemp is never defined in the visible code, while RPpConst, RPByteRot and RPpBitRot are not undefined here - confirm intent
519
- #undef RPindex
520
- #undef RPTemp
522
-
523
- ; Chi, Iota, prepare Theta: done in two passes, one per byte of the 16-bit lanes, rebuilding the C parities on the way
523
- #define CIPTa0 rTemp
524
- #define CIPTa1 rTemp1
525
- #define CIPTa2 rTemp2
526
- #define CIPTa3 rTemp3
527
- #define CIPTa4 rTemp4
528
- #define CIPTc0 rTempBis
529
- #define CIPTc1 rTempBis1
530
- #define CIPTc2 rTempBis2
531
- #define CIPTc3 rTempBis3
532
- #define CIPTc4 rTempBis4
533
- #define CIPTz rTempBis6
534
- #define CIPTy rTempBis7
535
-
536
- movw rY, rpState
537
- in rX, sp ; X = start of the C area on the stack
538
- in rX+1, sp+1
539
-
540
- movw rZ, pRound ; Z = current position in the round-constant table
541
-
542
- ldi CIPTz, 2 ; two byte positions per lane
543
- KeccakChiIotaPrepareTheta_zLoop:
544
- mov CIPTc0, zero ; clear the five parity accumulators for this byte position
545
- mov CIPTc1, zero
546
- movw CIPTc2, CIPTc0 ; clears c2 and c3 by copying the zeroed c0:c1 pair
547
- mov CIPTc4, zero
548
-
549
- ldi CIPTy, 5 ; five rows
550
- KeccakChiIotaPrepareTheta_yLoop:
551
- ld CIPTa0, Y ; same byte position of the five lanes of this row (lanes are 2 bytes apart)
552
- ldd CIPTa1, Y+2
553
- ldd CIPTa2, Y+4
554
- ldd CIPTa3, Y+6
555
- ldd CIPTa4, Y+8
556
-
557
- ;*p = t = a0 ^ ((~a1) & a2); c0 ^= t;
558
- mov r0, CIPTa1
559
- com r0
560
- and r0, CIPTa2
561
- eor r0, CIPTa0
562
- eor CIPTc0, r0
563
- st Y, r0
564
-
565
- ;*(p+2) = t = a1 ^ ((~a2) & a3); c1 ^= t;
566
- mov r0, CIPTa2
567
- com r0
568
- and r0, CIPTa3
569
- eor r0, CIPTa1
570
- eor CIPTc1, r0
571
- std Y+2, r0
572
-
573
- ;*(p+4) = a2 ^= ((~a3) & a4); c2 ^= a2;
574
- mov r0, CIPTa3
575
- com r0
576
- and r0, CIPTa4
577
- eor r0, CIPTa2
578
- eor CIPTc2, r0
579
- std Y+4, r0
580
-
581
- ;*(p+6) = a3 ^= ((~a4) & a0); c3 ^= a3;
582
- mov r0, CIPTa4
583
- com r0
584
- and r0, CIPTa0
585
- eor r0, CIPTa3
586
- eor CIPTc3, r0
587
- std Y+6, r0
588
-
589
- ;*(p+8) = a4 ^= ((~a0) & a1); c4 ^= a4;
590
- com CIPTa0 ; a0 is no longer needed unmodified, so it is complemented in place
591
- and CIPTa0, CIPTa1
592
- eor CIPTa0, CIPTa4
593
- eor CIPTc4, CIPTa0
594
- std Y+8, CIPTa0
595
-
596
- adiw rY, 10 ; next row
597
- dec CIPTy
598
- brne KeccakChiIotaPrepareTheta_yLoop
599
-
600
- sbiw rY, 50 ; back to the first row
601
- ; Iota: XOR one round-constant byte into this byte position of lane 0
602
- lpm r0, Z+ ; Round Constant
603
- ld CIPTa0, Y
604
- eor CIPTa0, r0
605
- st Y+, CIPTa0 ; Y now points at the next byte position for the second pass
606
-
607
- movw pRound, rZ ; park the table position so Z can address the C area
608
- movw rZ, rX
609
- eor CIPTc0, r0 ; keep the parity of column 0 in step with the Iota change
610
- st Z+, CIPTc0 ; store the five parity bytes 2 bytes apart (offsets are relative to the incremented Z)
611
- std Z+1, CIPTc1
612
- std Z+3, CIPTc2
613
- std Z+5, CIPTc3
614
- std Z+7, CIPTc4
615
- movw rX, rZ ; X advanced by one byte for the second pass
616
- movw rZ, pRound ; Z = table position again
617
-
618
- dec CIPTz
619
- brne KeccakChiIotaPrepareTheta_zLoop
620
-
621
- #undef CIPTa0
622
- #undef CIPTa1
623
- #undef CIPTa2
624
- #undef CIPTa3
625
- #undef CIPTa4
626
- #undef CIPTc0
627
- #undef CIPTc1
628
- #undef CIPTc2
629
- #undef CIPTc3
630
- #undef CIPTc4
631
- #undef CIPTz
632
- #undef CIPTy
634
-
635
-
636
- ;Check for terminator: Z points at the byte following the round constant just used
636
- lpm r0, Z
637
- inc r0 ; 0xFF + 1 wraps to 0 and sets the zero flag
638
- breq KeccakP_Done
639
- rjmp KeccakP_RoundLoop ; another round constant follows, run the next round
640
- KeccakP_Done:
641
-
642
- ; Free C(on stack) and registers
643
- in rX, sp ; free 5 C lanes
644
- in rX+1, sp+1
645
- adiw rX, 5*2 ; undo the 10-byte allocation
646
- in r0, 0x3F ; save the status register (I/O address 0x3F, SREG)
647
- cli ; no interrupts while the two halves of the stack pointer are written
648
- out sp+1, rX+1
649
- out sp, rX
650
- out 0x3F, r0 ; restore the saved status register
651
-
652
- pop r29 ; restore the saved registers in reverse push order
653
- pop r28
654
- pop r17
655
- pop r16
656
- pop r15
657
- pop r14
658
- pop r13
659
- pop r12
660
- pop r11
661
- pop r10
662
- pop r9
663
- pop r8
664
- pop r7
665
- pop r6
666
- pop r5
667
- pop r4
668
- pop r3
669
- pop r2
670
- ret
672
-
673
- bit_rot_jmp_table: ; one rjmp per bit rotation code, entered through ijmp from the Rho Pi loop
674
- rjmp KeccakRhoPi_RhoBitRotateDone ; code 0: no bit rotation
675
- rjmp rotate16_1bit_left
676
- rjmp rotate16_2bit_left
677
- rjmp rotate16_3bit_left
678
- rjmp rotate16_4bit_left
679
- rjmp rotate16_3bit_right
680
- rjmp rotate16_2bit_right
681
- rjmp rotate16_1bit_right
682
- ; Left rotations of the 16-bit value in rTemp:rTemp+1; each entry point falls through the steps below it
683
- rotate16_4bit_left:
684
- lsl rTemp ; shift the low byte, bit 7 goes to carry
685
- rol rTemp+1 ; carry into the high byte, its bit 7 goes to carry
686
- adc rTemp, r1 ; wrap that carry into bit 0; r1 is used as constant 0
687
- rotate16_3bit_left:
688
- lsl rTemp
689
- rol rTemp+1
690
- adc rTemp, r1
691
- rotate16_2bit_left:
692
- lsl rTemp
693
- rol rTemp+1
694
- adc rTemp, r1
695
- rotate16_1bit_left:
696
- lsl rTemp
697
- rol rTemp+1
698
- adc rTemp, r1
699
- rjmp KeccakRhoPi_RhoBitRotateDone
700
- ; Right rotations, same fall-through scheme
701
- rotate16_3bit_right:
702
- bst rTemp, 0 ; keep bit 0 of the low byte in the T flag
703
- ror rTemp+1 ; shift the high byte right, its bit 0 goes to carry
704
- ror rTemp ; carry into bit 7 of the low byte
705
- bld rTemp+1, 7 ; saved bit 0 becomes bit 15, replacing whatever carry ror shifted in
706
- rotate16_2bit_right:
707
- bst rTemp, 0
708
- ror rTemp+1
709
- ror rTemp
710
- bld rTemp+1, 7
711
- rotate16_1bit_right:
712
- bst rTemp, 0
713
- ror rTemp+1
714
- ror rTemp
715
- bld rTemp+1, 7
716
- rjmp KeccakRhoPi_RhoBitRotateDone
717
-
718
- #undef rTemp
719
- #undef rTempBis
720
- #undef rTempTer
721
- #undef pRound
722
-
723
- #undef rpState
724
- #undef zero
725
- #undef rX
726
- #undef rY
727
- #undef rZ
728
- #undef sp