wp_block.c 34 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784
  1. /*
  2. * Copyright 2005-2016 The OpenSSL Project Authors. All Rights Reserved.
  3. *
  4. * Licensed under the OpenSSL license (the "License"). You may not use
  5. * this file except in compliance with the License. You can obtain a copy
  6. * in the file LICENSE in the source distribution or at
  7. * https://www.openssl.org/source/license.html
  8. */
  9. /**
  10. * The Whirlpool hashing function.
  11. *
  12. * See
  13. * P.S.L.M. Barreto, V. Rijmen,
  14. * ``The Whirlpool hashing function,''
  15. * NESSIE submission, 2000 (tweaked version, 2001),
  16. * <https://www.cosic.esat.kuleuven.ac.be/nessie/workshop/submissions/whirlpool.zip>
  17. *
  18. * Based on "@version 3.0 (2003.03.12)" by Paulo S.L.M. Barreto and
  19. * Vincent Rijmen. Lookup "reference implementations" on
  20. * <http://planeta.terra.com.br/informatica/paulobarreto/>
  21. *
  22. * =============================================================================
  23. *
  24. * THIS SOFTWARE IS PROVIDED BY THE AUTHORS ''AS IS'' AND ANY EXPRESS
  25. * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
  26. * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  27. * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE
  28. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  29. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  30. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
  31. * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
  32. * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
  33. * OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
  34. * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  35. *
  36. */
  37. #include "wp_locl.h"
  38. #include <string.h>
  /*
   * Basic integer types used throughout this file: u8 is a single octet and
   * u64 is a 64-bit unsigned word.
   *
   * Windows toolchains other than MinGW use the vendor spelling __int64;
   * targets that define __arch64__ use unsigned long; everything else uses
   * unsigned long long.  MinGW is detected through __MINGW32__ (with the
   * trailing underscores), which is the macro that toolchain predefines.
   */
  typedef unsigned char u8;
  #if (defined(_WIN32) || defined(_WIN64)) && !defined(__MINGW32__)
  typedef unsigned __int64 u64;
  #elif defined(__arch64__)
  typedef unsigned long u64;
  #else
  typedef unsigned long long u64;
  #endif
  /* Number of rounds run over every 64-byte block. */
  #define ROUNDS  10

  /*
   * Start out assuming that unaligned 64-bit loads are not allowed, then lift
   * the restriction on x86 and x86_64 builds unless PEDANTIC was requested.
   *
   * Formally there are a couple of other architectures that permit unaligned
   * loads, specifically those not crossing cache lines (IA-64 and PowerPC),
   * but they are not special-cased here.
   */
  #define STRICT_ALIGNMENT
  #ifndef PEDANTIC
  # if defined(__i386) || defined(__i386__) || \
       defined(__x86_64) || defined(__x86_64__) || \
       defined(_M_IX86) || defined(_M_AMD64) || \
       defined(_M_X64)
  #  undef STRICT_ALIGNMENT
  # endif
  #endif
  /*
   * SMALL_REGISTER_BANK is set on 32-bit x86 only; whirlpool_block() uses it
   * to pick the variant of the round code that finishes one output row at a
   * time.
   *
   * When the assembler module is compiled in (WHIRLPOOL_ASM) the compact C
   * code is forced as well, and GO_FOR_MMX() is provided: if bit 23 of
   * OPENSSL_ia32cap_P[0] is set (presumably the MMX capability flag) it hands
   * the whole request to whirlpool_block_mmx() and returns from the calling
   * function; otherwise it does nothing and the C code runs.
   */
  #undef SMALL_REGISTER_BANK
  #if defined(__i386) || defined(__i386__) || defined(_M_IX86)
  # define SMALL_REGISTER_BANK
  # if defined(WHIRLPOOL_ASM)
  #  ifndef OPENSSL_SMALL_FOOTPRINT
  /* It appears that on older non-MMX CPUs the compact code is actually faster. */
  #   define OPENSSL_SMALL_FOOTPRINT
  #  endif
  #  define GO_FOR_MMX(ctx,inp,num)     do {                            \
          extern unsigned long OPENSSL_ia32cap_P[];                       \
          void whirlpool_block_mmx(void *,const void *,size_t);           \
          if (OPENSSL_ia32cap_P[0] & (1<<23)) {                           \
              whirlpool_block_mmx(ctx->H.c,inp,num);                      \
              return;                                                     \
          }                                                               \
      } while (0)
  # endif
  #endif
  /*
   * Platform-specific 64-bit rotate.  ROTATE(a,n) is only defined here when
   * the compiler offers a cheap way to do it: the _rotl64 intrinsic on 64-bit
   * MSVC, or inline assembler with GCC-compatible compilers on x86_64 and
   * IA-64.  The direction depends on the byte order: little-endian builds
   * rotate left, big-endian builds rotate right.  PEDANTIC builds skip all
   * of this and leave ROTATE undefined.
   */
  #undef ROTATE
  #ifndef PEDANTIC
  # if defined(_MSC_VER)
  #  if defined(_WIN64)            /* applies to both IA-64 and AMD64 */
  #   pragma intrinsic(_rotl64)
  #   define ROTATE(a,n) _rotl64((a),n)
  #  endif
  # elif defined(__GNUC__) && __GNUC__>=2
  #  if defined(__x86_64) || defined(__x86_64__)
  #   if defined(L_ENDIAN)
  #    define ROTATE(a,n)       ({ u64 ret; asm ("rolq %1,%0"   \
                                     : "=r"(ret) : "J"(n),"0"(a) : "cc"); ret; })
  #   elif defined(B_ENDIAN)
         /*
          * Most will argue that x86_64 is always little-endian.  True, but
          * stratus.com has modified gcc to "emulate" big-endian on x86, and
          * nothing guarantees that nobody will do the same for x86_64.  This
          * definition is kept ready for that case.
          */
  #    define ROTATE(a,n)       ({ u64 ret; asm ("rorq %1,%0"   \
                                     : "=r"(ret) : "J"(n),"0"(a) : "cc"); ret; })
  #   endif
  #  elif defined(__ia64) || defined(__ia64__)
  #   if defined(L_ENDIAN)
  #    define ROTATE(a,n)       ({ u64 ret; asm ("shrp %0=%1,%1,%2"     \
                                     : "=r"(ret) : "r"(a),"M"(64-(n))); ret; })
  #   elif defined(B_ENDIAN)
  #    define ROTATE(a,n)       ({ u64 ret; asm ("shrp %0=%1,%1,%2"     \
                                     : "=r"(ret) : "r"(a),"M"(n)); ret; })
  #   endif
  #  endif
  # endif
  #endif
  /*
   * Compact builds (OPENSSL_SMALL_FOOTPRINT) always want the smallest lookup
   * table, which needs a rotate.  If no platform-specific ROTATE exists yet,
   * fall back to a portable shift-and-xor form, provided the byte order is
   * known.  The shift count n must be in the range 1..63; every macro
   * argument is parenthesized so that an expression may be passed as n.
   *
   * Once ROTATE is available, STRICT_ALIGNMENT is forced on so that the
   * table-layout selection picks the rotate-based layout.
   */
  #if defined(OPENSSL_SMALL_FOOTPRINT)
  # if !defined(ROTATE)
  #  if defined(L_ENDIAN)          /* little-endians have to rotate left */
  #   define ROTATE(i,n)   ((i)<<(n) ^ (i)>>(64-(n)))
  #  elif defined(B_ENDIAN)        /* big-endians have to rotate right */
  #   define ROTATE(i,n)   ((i)>>(n) ^ (i)<<(64-(n)))
  #  endif
  # endif
  # if defined(ROTATE) && !defined(STRICT_ALIGNMENT)
  #  define STRICT_ALIGNMENT      /* ensure smallest table size */
  # endif
  #endif
  /*
   * Lookup-table layout.
   *
   * The size of the table depends on STRICT_ALIGNMENT and on whether an
   * endian-specific ROTATE macro is available:
   *
   *   - STRICT_ALIGNMENT not defined (the normal case on x86[_64]): 4KB,
   *     unconditionally;
   *   - STRICT_ALIGNMENT with ROTATE: 2KB;
   *   - STRICT_ALIGNMENT without ROTATE: 16KB.
   *
   * The 2KB table costs a whole bunch of additional rotations, but that is
   * an acceptable trade because a 16KB table certainly trashes the L1 cache.
   * If every CPU could handle unaligned loads, the 4KB table would be the
   * choice everywhere: it neither trashes the cache nor needs rotations.
   */
  /*
   * Every Cn macro expands to two loads: one byte load (the index taken from
   * the state) and one quadword load (the table entry).  One could argue
   * that this many single-byte loads is excessive and that a quadword should
   * be loaded once and "milked" for its eight 8-bit values.  Doing that
   * without extra loads means keeping a handful of 64-bit values in
   * registers and issuing a bunch of shifts and masks, so it is a trade-off:
   * loads versus shift-and-mask in a big register bank.  On most CPUs eight
   * single-byte loads are faster; the others are left to a smart compiler
   * that folds the byte loads when beneficial.  Hand-coded assembler would
   * be another alternative.
   *
   * N is the number of 64-bit words stored per table row, LL() lays out one
   * row from its eight bytes, and Cn(K,i) fetches the contribution of byte n
   * of 64-bit word i of state K.
   */
  #ifdef STRICT_ALIGNMENT
  # if defined(ROTATE)
     /* One word per row; the other seven columns are produced by rotation. */
  #  define N     1
  #  define LL(c0,c1,c2,c3,c4,c5,c6,c7)      c0,c1,c2,c3,c4,c5,c6,c7
  #  define C0(K,i)       (Cx.q[K.c[(i)*8+0]])
  #  define C1(K,i)       ROTATE(Cx.q[K.c[(i)*8+1]],8)
  #  define C2(K,i)       ROTATE(Cx.q[K.c[(i)*8+2]],16)
  #  define C3(K,i)       ROTATE(Cx.q[K.c[(i)*8+3]],24)
  #  define C4(K,i)       ROTATE(Cx.q[K.c[(i)*8+4]],32)
  #  define C5(K,i)       ROTATE(Cx.q[K.c[(i)*8+5]],40)
  #  define C6(K,i)       ROTATE(Cx.q[K.c[(i)*8+6]],48)
  #  define C7(K,i)       ROTATE(Cx.q[K.c[(i)*8+7]],56)
  # else
     /* Eight words per row: all eight byte rotations are stored explicitly. */
  #  define N     8
  #  define LL(c0,c1,c2,c3,c4,c5,c6,c7)      c0,c1,c2,c3,c4,c5,c6,c7, \
                                             c7,c0,c1,c2,c3,c4,c5,c6, \
                                             c6,c7,c0,c1,c2,c3,c4,c5, \
                                             c5,c6,c7,c0,c1,c2,c3,c4, \
                                             c4,c5,c6,c7,c0,c1,c2,c3, \
                                             c3,c4,c5,c6,c7,c0,c1,c2, \
                                             c2,c3,c4,c5,c6,c7,c0,c1, \
                                             c1,c2,c3,c4,c5,c6,c7,c0
  #  define C0(K,i)       (Cx.q[0+8*K.c[(i)*8+0]])
  #  define C1(K,i)       (Cx.q[1+8*K.c[(i)*8+1]])
  #  define C2(K,i)       (Cx.q[2+8*K.c[(i)*8+2]])
  #  define C3(K,i)       (Cx.q[3+8*K.c[(i)*8+3]])
  #  define C4(K,i)       (Cx.q[4+8*K.c[(i)*8+4]])
  #  define C5(K,i)       (Cx.q[5+8*K.c[(i)*8+5]])
  #  define C6(K,i)       (Cx.q[6+8*K.c[(i)*8+6]])
  #  define C7(K,i)       (Cx.q[7+8*K.c[(i)*8+7]])
  # endif
  #else
     /*
      * Two copies of each word per row; a rotated value is obtained with an
      * unaligned 64-bit load that starts 1..7 bytes into the row.
      */
  # define N      2
  # define LL(c0,c1,c2,c3,c4,c5,c6,c7)       c0,c1,c2,c3,c4,c5,c6,c7, \
                                             c0,c1,c2,c3,c4,c5,c6,c7
  # define C0(K,i)        (((u64*)(Cx.c+0))[2*K.c[(i)*8+0]])
  # define C1(K,i)        (((u64*)(Cx.c+7))[2*K.c[(i)*8+1]])
  # define C2(K,i)        (((u64*)(Cx.c+6))[2*K.c[(i)*8+2]])
  # define C3(K,i)        (((u64*)(Cx.c+5))[2*K.c[(i)*8+3]])
  # define C4(K,i)        (((u64*)(Cx.c+4))[2*K.c[(i)*8+4]])
  # define C5(K,i)        (((u64*)(Cx.c+3))[2*K.c[(i)*8+5]])
  # define C6(K,i)        (((u64*)(Cx.c+2))[2*K.c[(i)*8+6]])
  # define C7(K,i)        (((u64*)(Cx.c+1))[2*K.c[(i)*8+7]])
  #endif
  192. static const
  193. union {
  194. u8 c[(256 * N + ROUNDS) * sizeof(u64)];
  195. u64 q[(256 * N + ROUNDS)];
  196. } Cx = {
  197. {
  198. /* Note endian-neutral representation:-) */
  199. LL(0x18, 0x18, 0x60, 0x18, 0xc0, 0x78, 0x30, 0xd8),
  200. LL(0x23, 0x23, 0x8c, 0x23, 0x05, 0xaf, 0x46, 0x26),
  201. LL(0xc6, 0xc6, 0x3f, 0xc6, 0x7e, 0xf9, 0x91, 0xb8),
  202. LL(0xe8, 0xe8, 0x87, 0xe8, 0x13, 0x6f, 0xcd, 0xfb),
  203. LL(0x87, 0x87, 0x26, 0x87, 0x4c, 0xa1, 0x13, 0xcb),
  204. LL(0xb8, 0xb8, 0xda, 0xb8, 0xa9, 0x62, 0x6d, 0x11),
  205. LL(0x01, 0x01, 0x04, 0x01, 0x08, 0x05, 0x02, 0x09),
  206. LL(0x4f, 0x4f, 0x21, 0x4f, 0x42, 0x6e, 0x9e, 0x0d),
  207. LL(0x36, 0x36, 0xd8, 0x36, 0xad, 0xee, 0x6c, 0x9b),
  208. LL(0xa6, 0xa6, 0xa2, 0xa6, 0x59, 0x04, 0x51, 0xff),
  209. LL(0xd2, 0xd2, 0x6f, 0xd2, 0xde, 0xbd, 0xb9, 0x0c),
  210. LL(0xf5, 0xf5, 0xf3, 0xf5, 0xfb, 0x06, 0xf7, 0x0e),
  211. LL(0x79, 0x79, 0xf9, 0x79, 0xef, 0x80, 0xf2, 0x96),
  212. LL(0x6f, 0x6f, 0xa1, 0x6f, 0x5f, 0xce, 0xde, 0x30),
  213. LL(0x91, 0x91, 0x7e, 0x91, 0xfc, 0xef, 0x3f, 0x6d),
  214. LL(0x52, 0x52, 0x55, 0x52, 0xaa, 0x07, 0xa4, 0xf8),
  215. LL(0x60, 0x60, 0x9d, 0x60, 0x27, 0xfd, 0xc0, 0x47),
  216. LL(0xbc, 0xbc, 0xca, 0xbc, 0x89, 0x76, 0x65, 0x35),
  217. LL(0x9b, 0x9b, 0x56, 0x9b, 0xac, 0xcd, 0x2b, 0x37),
  218. LL(0x8e, 0x8e, 0x02, 0x8e, 0x04, 0x8c, 0x01, 0x8a),
  219. LL(0xa3, 0xa3, 0xb6, 0xa3, 0x71, 0x15, 0x5b, 0xd2),
  220. LL(0x0c, 0x0c, 0x30, 0x0c, 0x60, 0x3c, 0x18, 0x6c),
  221. LL(0x7b, 0x7b, 0xf1, 0x7b, 0xff, 0x8a, 0xf6, 0x84),
  222. LL(0x35, 0x35, 0xd4, 0x35, 0xb5, 0xe1, 0x6a, 0x80),
  223. LL(0x1d, 0x1d, 0x74, 0x1d, 0xe8, 0x69, 0x3a, 0xf5),
  224. LL(0xe0, 0xe0, 0xa7, 0xe0, 0x53, 0x47, 0xdd, 0xb3),
  225. LL(0xd7, 0xd7, 0x7b, 0xd7, 0xf6, 0xac, 0xb3, 0x21),
  226. LL(0xc2, 0xc2, 0x2f, 0xc2, 0x5e, 0xed, 0x99, 0x9c),
  227. LL(0x2e, 0x2e, 0xb8, 0x2e, 0x6d, 0x96, 0x5c, 0x43),
  228. LL(0x4b, 0x4b, 0x31, 0x4b, 0x62, 0x7a, 0x96, 0x29),
  229. LL(0xfe, 0xfe, 0xdf, 0xfe, 0xa3, 0x21, 0xe1, 0x5d),
  230. LL(0x57, 0x57, 0x41, 0x57, 0x82, 0x16, 0xae, 0xd5),
  231. LL(0x15, 0x15, 0x54, 0x15, 0xa8, 0x41, 0x2a, 0xbd),
  232. LL(0x77, 0x77, 0xc1, 0x77, 0x9f, 0xb6, 0xee, 0xe8),
  233. LL(0x37, 0x37, 0xdc, 0x37, 0xa5, 0xeb, 0x6e, 0x92),
  234. LL(0xe5, 0xe5, 0xb3, 0xe5, 0x7b, 0x56, 0xd7, 0x9e),
  235. LL(0x9f, 0x9f, 0x46, 0x9f, 0x8c, 0xd9, 0x23, 0x13),
  236. LL(0xf0, 0xf0, 0xe7, 0xf0, 0xd3, 0x17, 0xfd, 0x23),
  237. LL(0x4a, 0x4a, 0x35, 0x4a, 0x6a, 0x7f, 0x94, 0x20),
  238. LL(0xda, 0xda, 0x4f, 0xda, 0x9e, 0x95, 0xa9, 0x44),
  239. LL(0x58, 0x58, 0x7d, 0x58, 0xfa, 0x25, 0xb0, 0xa2),
  240. LL(0xc9, 0xc9, 0x03, 0xc9, 0x06, 0xca, 0x8f, 0xcf),
  241. LL(0x29, 0x29, 0xa4, 0x29, 0x55, 0x8d, 0x52, 0x7c),
  242. LL(0x0a, 0x0a, 0x28, 0x0a, 0x50, 0x22, 0x14, 0x5a),
  243. LL(0xb1, 0xb1, 0xfe, 0xb1, 0xe1, 0x4f, 0x7f, 0x50),
  244. LL(0xa0, 0xa0, 0xba, 0xa0, 0x69, 0x1a, 0x5d, 0xc9),
  245. LL(0x6b, 0x6b, 0xb1, 0x6b, 0x7f, 0xda, 0xd6, 0x14),
  246. LL(0x85, 0x85, 0x2e, 0x85, 0x5c, 0xab, 0x17, 0xd9),
  247. LL(0xbd, 0xbd, 0xce, 0xbd, 0x81, 0x73, 0x67, 0x3c),
  248. LL(0x5d, 0x5d, 0x69, 0x5d, 0xd2, 0x34, 0xba, 0x8f),
  249. LL(0x10, 0x10, 0x40, 0x10, 0x80, 0x50, 0x20, 0x90),
  250. LL(0xf4, 0xf4, 0xf7, 0xf4, 0xf3, 0x03, 0xf5, 0x07),
  251. LL(0xcb, 0xcb, 0x0b, 0xcb, 0x16, 0xc0, 0x8b, 0xdd),
  252. LL(0x3e, 0x3e, 0xf8, 0x3e, 0xed, 0xc6, 0x7c, 0xd3),
  253. LL(0x05, 0x05, 0x14, 0x05, 0x28, 0x11, 0x0a, 0x2d),
  254. LL(0x67, 0x67, 0x81, 0x67, 0x1f, 0xe6, 0xce, 0x78),
  255. LL(0xe4, 0xe4, 0xb7, 0xe4, 0x73, 0x53, 0xd5, 0x97),
  256. LL(0x27, 0x27, 0x9c, 0x27, 0x25, 0xbb, 0x4e, 0x02),
  257. LL(0x41, 0x41, 0x19, 0x41, 0x32, 0x58, 0x82, 0x73),
  258. LL(0x8b, 0x8b, 0x16, 0x8b, 0x2c, 0x9d, 0x0b, 0xa7),
  259. LL(0xa7, 0xa7, 0xa6, 0xa7, 0x51, 0x01, 0x53, 0xf6),
  260. LL(0x7d, 0x7d, 0xe9, 0x7d, 0xcf, 0x94, 0xfa, 0xb2),
  261. LL(0x95, 0x95, 0x6e, 0x95, 0xdc, 0xfb, 0x37, 0x49),
  262. LL(0xd8, 0xd8, 0x47, 0xd8, 0x8e, 0x9f, 0xad, 0x56),
  263. LL(0xfb, 0xfb, 0xcb, 0xfb, 0x8b, 0x30, 0xeb, 0x70),
  264. LL(0xee, 0xee, 0x9f, 0xee, 0x23, 0x71, 0xc1, 0xcd),
  265. LL(0x7c, 0x7c, 0xed, 0x7c, 0xc7, 0x91, 0xf8, 0xbb),
  266. LL(0x66, 0x66, 0x85, 0x66, 0x17, 0xe3, 0xcc, 0x71),
  267. LL(0xdd, 0xdd, 0x53, 0xdd, 0xa6, 0x8e, 0xa7, 0x7b),
  268. LL(0x17, 0x17, 0x5c, 0x17, 0xb8, 0x4b, 0x2e, 0xaf),
  269. LL(0x47, 0x47, 0x01, 0x47, 0x02, 0x46, 0x8e, 0x45),
  270. LL(0x9e, 0x9e, 0x42, 0x9e, 0x84, 0xdc, 0x21, 0x1a),
  271. LL(0xca, 0xca, 0x0f, 0xca, 0x1e, 0xc5, 0x89, 0xd4),
  272. LL(0x2d, 0x2d, 0xb4, 0x2d, 0x75, 0x99, 0x5a, 0x58),
  273. LL(0xbf, 0xbf, 0xc6, 0xbf, 0x91, 0x79, 0x63, 0x2e),
  274. LL(0x07, 0x07, 0x1c, 0x07, 0x38, 0x1b, 0x0e, 0x3f),
  275. LL(0xad, 0xad, 0x8e, 0xad, 0x01, 0x23, 0x47, 0xac),
  276. LL(0x5a, 0x5a, 0x75, 0x5a, 0xea, 0x2f, 0xb4, 0xb0),
  277. LL(0x83, 0x83, 0x36, 0x83, 0x6c, 0xb5, 0x1b, 0xef),
  278. LL(0x33, 0x33, 0xcc, 0x33, 0x85, 0xff, 0x66, 0xb6),
  279. LL(0x63, 0x63, 0x91, 0x63, 0x3f, 0xf2, 0xc6, 0x5c),
  280. LL(0x02, 0x02, 0x08, 0x02, 0x10, 0x0a, 0x04, 0x12),
  281. LL(0xaa, 0xaa, 0x92, 0xaa, 0x39, 0x38, 0x49, 0x93),
  282. LL(0x71, 0x71, 0xd9, 0x71, 0xaf, 0xa8, 0xe2, 0xde),
  283. LL(0xc8, 0xc8, 0x07, 0xc8, 0x0e, 0xcf, 0x8d, 0xc6),
  284. LL(0x19, 0x19, 0x64, 0x19, 0xc8, 0x7d, 0x32, 0xd1),
  285. LL(0x49, 0x49, 0x39, 0x49, 0x72, 0x70, 0x92, 0x3b),
  286. LL(0xd9, 0xd9, 0x43, 0xd9, 0x86, 0x9a, 0xaf, 0x5f),
  287. LL(0xf2, 0xf2, 0xef, 0xf2, 0xc3, 0x1d, 0xf9, 0x31),
  288. LL(0xe3, 0xe3, 0xab, 0xe3, 0x4b, 0x48, 0xdb, 0xa8),
  289. LL(0x5b, 0x5b, 0x71, 0x5b, 0xe2, 0x2a, 0xb6, 0xb9),
  290. LL(0x88, 0x88, 0x1a, 0x88, 0x34, 0x92, 0x0d, 0xbc),
  291. LL(0x9a, 0x9a, 0x52, 0x9a, 0xa4, 0xc8, 0x29, 0x3e),
  292. LL(0x26, 0x26, 0x98, 0x26, 0x2d, 0xbe, 0x4c, 0x0b),
  293. LL(0x32, 0x32, 0xc8, 0x32, 0x8d, 0xfa, 0x64, 0xbf),
  294. LL(0xb0, 0xb0, 0xfa, 0xb0, 0xe9, 0x4a, 0x7d, 0x59),
  295. LL(0xe9, 0xe9, 0x83, 0xe9, 0x1b, 0x6a, 0xcf, 0xf2),
  296. LL(0x0f, 0x0f, 0x3c, 0x0f, 0x78, 0x33, 0x1e, 0x77),
  297. LL(0xd5, 0xd5, 0x73, 0xd5, 0xe6, 0xa6, 0xb7, 0x33),
  298. LL(0x80, 0x80, 0x3a, 0x80, 0x74, 0xba, 0x1d, 0xf4),
  299. LL(0xbe, 0xbe, 0xc2, 0xbe, 0x99, 0x7c, 0x61, 0x27),
  300. LL(0xcd, 0xcd, 0x13, 0xcd, 0x26, 0xde, 0x87, 0xeb),
  301. LL(0x34, 0x34, 0xd0, 0x34, 0xbd, 0xe4, 0x68, 0x89),
  302. LL(0x48, 0x48, 0x3d, 0x48, 0x7a, 0x75, 0x90, 0x32),
  303. LL(0xff, 0xff, 0xdb, 0xff, 0xab, 0x24, 0xe3, 0x54),
  304. LL(0x7a, 0x7a, 0xf5, 0x7a, 0xf7, 0x8f, 0xf4, 0x8d),
  305. LL(0x90, 0x90, 0x7a, 0x90, 0xf4, 0xea, 0x3d, 0x64),
  306. LL(0x5f, 0x5f, 0x61, 0x5f, 0xc2, 0x3e, 0xbe, 0x9d),
  307. LL(0x20, 0x20, 0x80, 0x20, 0x1d, 0xa0, 0x40, 0x3d),
  308. LL(0x68, 0x68, 0xbd, 0x68, 0x67, 0xd5, 0xd0, 0x0f),
  309. LL(0x1a, 0x1a, 0x68, 0x1a, 0xd0, 0x72, 0x34, 0xca),
  310. LL(0xae, 0xae, 0x82, 0xae, 0x19, 0x2c, 0x41, 0xb7),
  311. LL(0xb4, 0xb4, 0xea, 0xb4, 0xc9, 0x5e, 0x75, 0x7d),
  312. LL(0x54, 0x54, 0x4d, 0x54, 0x9a, 0x19, 0xa8, 0xce),
  313. LL(0x93, 0x93, 0x76, 0x93, 0xec, 0xe5, 0x3b, 0x7f),
  314. LL(0x22, 0x22, 0x88, 0x22, 0x0d, 0xaa, 0x44, 0x2f),
  315. LL(0x64, 0x64, 0x8d, 0x64, 0x07, 0xe9, 0xc8, 0x63),
  316. LL(0xf1, 0xf1, 0xe3, 0xf1, 0xdb, 0x12, 0xff, 0x2a),
  317. LL(0x73, 0x73, 0xd1, 0x73, 0xbf, 0xa2, 0xe6, 0xcc),
  318. LL(0x12, 0x12, 0x48, 0x12, 0x90, 0x5a, 0x24, 0x82),
  319. LL(0x40, 0x40, 0x1d, 0x40, 0x3a, 0x5d, 0x80, 0x7a),
  320. LL(0x08, 0x08, 0x20, 0x08, 0x40, 0x28, 0x10, 0x48),
  321. LL(0xc3, 0xc3, 0x2b, 0xc3, 0x56, 0xe8, 0x9b, 0x95),
  322. LL(0xec, 0xec, 0x97, 0xec, 0x33, 0x7b, 0xc5, 0xdf),
  323. LL(0xdb, 0xdb, 0x4b, 0xdb, 0x96, 0x90, 0xab, 0x4d),
  324. LL(0xa1, 0xa1, 0xbe, 0xa1, 0x61, 0x1f, 0x5f, 0xc0),
  325. LL(0x8d, 0x8d, 0x0e, 0x8d, 0x1c, 0x83, 0x07, 0x91),
  326. LL(0x3d, 0x3d, 0xf4, 0x3d, 0xf5, 0xc9, 0x7a, 0xc8),
  327. LL(0x97, 0x97, 0x66, 0x97, 0xcc, 0xf1, 0x33, 0x5b),
  328. LL(0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00),
  329. LL(0xcf, 0xcf, 0x1b, 0xcf, 0x36, 0xd4, 0x83, 0xf9),
  330. LL(0x2b, 0x2b, 0xac, 0x2b, 0x45, 0x87, 0x56, 0x6e),
  331. LL(0x76, 0x76, 0xc5, 0x76, 0x97, 0xb3, 0xec, 0xe1),
  332. LL(0x82, 0x82, 0x32, 0x82, 0x64, 0xb0, 0x19, 0xe6),
  333. LL(0xd6, 0xd6, 0x7f, 0xd6, 0xfe, 0xa9, 0xb1, 0x28),
  334. LL(0x1b, 0x1b, 0x6c, 0x1b, 0xd8, 0x77, 0x36, 0xc3),
  335. LL(0xb5, 0xb5, 0xee, 0xb5, 0xc1, 0x5b, 0x77, 0x74),
  336. LL(0xaf, 0xaf, 0x86, 0xaf, 0x11, 0x29, 0x43, 0xbe),
  337. LL(0x6a, 0x6a, 0xb5, 0x6a, 0x77, 0xdf, 0xd4, 0x1d),
  338. LL(0x50, 0x50, 0x5d, 0x50, 0xba, 0x0d, 0xa0, 0xea),
  339. LL(0x45, 0x45, 0x09, 0x45, 0x12, 0x4c, 0x8a, 0x57),
  340. LL(0xf3, 0xf3, 0xeb, 0xf3, 0xcb, 0x18, 0xfb, 0x38),
  341. LL(0x30, 0x30, 0xc0, 0x30, 0x9d, 0xf0, 0x60, 0xad),
  342. LL(0xef, 0xef, 0x9b, 0xef, 0x2b, 0x74, 0xc3, 0xc4),
  343. LL(0x3f, 0x3f, 0xfc, 0x3f, 0xe5, 0xc3, 0x7e, 0xda),
  344. LL(0x55, 0x55, 0x49, 0x55, 0x92, 0x1c, 0xaa, 0xc7),
  345. LL(0xa2, 0xa2, 0xb2, 0xa2, 0x79, 0x10, 0x59, 0xdb),
  346. LL(0xea, 0xea, 0x8f, 0xea, 0x03, 0x65, 0xc9, 0xe9),
  347. LL(0x65, 0x65, 0x89, 0x65, 0x0f, 0xec, 0xca, 0x6a),
  348. LL(0xba, 0xba, 0xd2, 0xba, 0xb9, 0x68, 0x69, 0x03),
  349. LL(0x2f, 0x2f, 0xbc, 0x2f, 0x65, 0x93, 0x5e, 0x4a),
  350. LL(0xc0, 0xc0, 0x27, 0xc0, 0x4e, 0xe7, 0x9d, 0x8e),
  351. LL(0xde, 0xde, 0x5f, 0xde, 0xbe, 0x81, 0xa1, 0x60),
  352. LL(0x1c, 0x1c, 0x70, 0x1c, 0xe0, 0x6c, 0x38, 0xfc),
  353. LL(0xfd, 0xfd, 0xd3, 0xfd, 0xbb, 0x2e, 0xe7, 0x46),
  354. LL(0x4d, 0x4d, 0x29, 0x4d, 0x52, 0x64, 0x9a, 0x1f),
  355. LL(0x92, 0x92, 0x72, 0x92, 0xe4, 0xe0, 0x39, 0x76),
  356. LL(0x75, 0x75, 0xc9, 0x75, 0x8f, 0xbc, 0xea, 0xfa),
  357. LL(0x06, 0x06, 0x18, 0x06, 0x30, 0x1e, 0x0c, 0x36),
  358. LL(0x8a, 0x8a, 0x12, 0x8a, 0x24, 0x98, 0x09, 0xae),
  359. LL(0xb2, 0xb2, 0xf2, 0xb2, 0xf9, 0x40, 0x79, 0x4b),
  360. LL(0xe6, 0xe6, 0xbf, 0xe6, 0x63, 0x59, 0xd1, 0x85),
  361. LL(0x0e, 0x0e, 0x38, 0x0e, 0x70, 0x36, 0x1c, 0x7e),
  362. LL(0x1f, 0x1f, 0x7c, 0x1f, 0xf8, 0x63, 0x3e, 0xe7),
  363. LL(0x62, 0x62, 0x95, 0x62, 0x37, 0xf7, 0xc4, 0x55),
  364. LL(0xd4, 0xd4, 0x77, 0xd4, 0xee, 0xa3, 0xb5, 0x3a),
  365. LL(0xa8, 0xa8, 0x9a, 0xa8, 0x29, 0x32, 0x4d, 0x81),
  366. LL(0x96, 0x96, 0x62, 0x96, 0xc4, 0xf4, 0x31, 0x52),
  367. LL(0xf9, 0xf9, 0xc3, 0xf9, 0x9b, 0x3a, 0xef, 0x62),
  368. LL(0xc5, 0xc5, 0x33, 0xc5, 0x66, 0xf6, 0x97, 0xa3),
  369. LL(0x25, 0x25, 0x94, 0x25, 0x35, 0xb1, 0x4a, 0x10),
  370. LL(0x59, 0x59, 0x79, 0x59, 0xf2, 0x20, 0xb2, 0xab),
  371. LL(0x84, 0x84, 0x2a, 0x84, 0x54, 0xae, 0x15, 0xd0),
  372. LL(0x72, 0x72, 0xd5, 0x72, 0xb7, 0xa7, 0xe4, 0xc5),
  373. LL(0x39, 0x39, 0xe4, 0x39, 0xd5, 0xdd, 0x72, 0xec),
  374. LL(0x4c, 0x4c, 0x2d, 0x4c, 0x5a, 0x61, 0x98, 0x16),
  375. LL(0x5e, 0x5e, 0x65, 0x5e, 0xca, 0x3b, 0xbc, 0x94),
  376. LL(0x78, 0x78, 0xfd, 0x78, 0xe7, 0x85, 0xf0, 0x9f),
  377. LL(0x38, 0x38, 0xe0, 0x38, 0xdd, 0xd8, 0x70, 0xe5),
  378. LL(0x8c, 0x8c, 0x0a, 0x8c, 0x14, 0x86, 0x05, 0x98),
  379. LL(0xd1, 0xd1, 0x63, 0xd1, 0xc6, 0xb2, 0xbf, 0x17),
  380. LL(0xa5, 0xa5, 0xae, 0xa5, 0x41, 0x0b, 0x57, 0xe4),
  381. LL(0xe2, 0xe2, 0xaf, 0xe2, 0x43, 0x4d, 0xd9, 0xa1),
  382. LL(0x61, 0x61, 0x99, 0x61, 0x2f, 0xf8, 0xc2, 0x4e),
  383. LL(0xb3, 0xb3, 0xf6, 0xb3, 0xf1, 0x45, 0x7b, 0x42),
  384. LL(0x21, 0x21, 0x84, 0x21, 0x15, 0xa5, 0x42, 0x34),
  385. LL(0x9c, 0x9c, 0x4a, 0x9c, 0x94, 0xd6, 0x25, 0x08),
  386. LL(0x1e, 0x1e, 0x78, 0x1e, 0xf0, 0x66, 0x3c, 0xee),
  387. LL(0x43, 0x43, 0x11, 0x43, 0x22, 0x52, 0x86, 0x61),
  388. LL(0xc7, 0xc7, 0x3b, 0xc7, 0x76, 0xfc, 0x93, 0xb1),
  389. LL(0xfc, 0xfc, 0xd7, 0xfc, 0xb3, 0x2b, 0xe5, 0x4f),
  390. LL(0x04, 0x04, 0x10, 0x04, 0x20, 0x14, 0x08, 0x24),
  391. LL(0x51, 0x51, 0x59, 0x51, 0xb2, 0x08, 0xa2, 0xe3),
  392. LL(0x99, 0x99, 0x5e, 0x99, 0xbc, 0xc7, 0x2f, 0x25),
  393. LL(0x6d, 0x6d, 0xa9, 0x6d, 0x4f, 0xc4, 0xda, 0x22),
  394. LL(0x0d, 0x0d, 0x34, 0x0d, 0x68, 0x39, 0x1a, 0x65),
  395. LL(0xfa, 0xfa, 0xcf, 0xfa, 0x83, 0x35, 0xe9, 0x79),
  396. LL(0xdf, 0xdf, 0x5b, 0xdf, 0xb6, 0x84, 0xa3, 0x69),
  397. LL(0x7e, 0x7e, 0xe5, 0x7e, 0xd7, 0x9b, 0xfc, 0xa9),
  398. LL(0x24, 0x24, 0x90, 0x24, 0x3d, 0xb4, 0x48, 0x19),
  399. LL(0x3b, 0x3b, 0xec, 0x3b, 0xc5, 0xd7, 0x76, 0xfe),
  400. LL(0xab, 0xab, 0x96, 0xab, 0x31, 0x3d, 0x4b, 0x9a),
  401. LL(0xce, 0xce, 0x1f, 0xce, 0x3e, 0xd1, 0x81, 0xf0),
  402. LL(0x11, 0x11, 0x44, 0x11, 0x88, 0x55, 0x22, 0x99),
  403. LL(0x8f, 0x8f, 0x06, 0x8f, 0x0c, 0x89, 0x03, 0x83),
  404. LL(0x4e, 0x4e, 0x25, 0x4e, 0x4a, 0x6b, 0x9c, 0x04),
  405. LL(0xb7, 0xb7, 0xe6, 0xb7, 0xd1, 0x51, 0x73, 0x66),
  406. LL(0xeb, 0xeb, 0x8b, 0xeb, 0x0b, 0x60, 0xcb, 0xe0),
  407. LL(0x3c, 0x3c, 0xf0, 0x3c, 0xfd, 0xcc, 0x78, 0xc1),
  408. LL(0x81, 0x81, 0x3e, 0x81, 0x7c, 0xbf, 0x1f, 0xfd),
  409. LL(0x94, 0x94, 0x6a, 0x94, 0xd4, 0xfe, 0x35, 0x40),
  410. LL(0xf7, 0xf7, 0xfb, 0xf7, 0xeb, 0x0c, 0xf3, 0x1c),
  411. LL(0xb9, 0xb9, 0xde, 0xb9, 0xa1, 0x67, 0x6f, 0x18),
  412. LL(0x13, 0x13, 0x4c, 0x13, 0x98, 0x5f, 0x26, 0x8b),
  413. LL(0x2c, 0x2c, 0xb0, 0x2c, 0x7d, 0x9c, 0x58, 0x51),
  414. LL(0xd3, 0xd3, 0x6b, 0xd3, 0xd6, 0xb8, 0xbb, 0x05),
  415. LL(0xe7, 0xe7, 0xbb, 0xe7, 0x6b, 0x5c, 0xd3, 0x8c),
  416. LL(0x6e, 0x6e, 0xa5, 0x6e, 0x57, 0xcb, 0xdc, 0x39),
  417. LL(0xc4, 0xc4, 0x37, 0xc4, 0x6e, 0xf3, 0x95, 0xaa),
  418. LL(0x03, 0x03, 0x0c, 0x03, 0x18, 0x0f, 0x06, 0x1b),
  419. LL(0x56, 0x56, 0x45, 0x56, 0x8a, 0x13, 0xac, 0xdc),
  420. LL(0x44, 0x44, 0x0d, 0x44, 0x1a, 0x49, 0x88, 0x5e),
  421. LL(0x7f, 0x7f, 0xe1, 0x7f, 0xdf, 0x9e, 0xfe, 0xa0),
  422. LL(0xa9, 0xa9, 0x9e, 0xa9, 0x21, 0x37, 0x4f, 0x88),
  423. LL(0x2a, 0x2a, 0xa8, 0x2a, 0x4d, 0x82, 0x54, 0x67),
  424. LL(0xbb, 0xbb, 0xd6, 0xbb, 0xb1, 0x6d, 0x6b, 0x0a),
  425. LL(0xc1, 0xc1, 0x23, 0xc1, 0x46, 0xe2, 0x9f, 0x87),
  426. LL(0x53, 0x53, 0x51, 0x53, 0xa2, 0x02, 0xa6, 0xf1),
  427. LL(0xdc, 0xdc, 0x57, 0xdc, 0xae, 0x8b, 0xa5, 0x72),
  428. LL(0x0b, 0x0b, 0x2c, 0x0b, 0x58, 0x27, 0x16, 0x53),
  429. LL(0x9d, 0x9d, 0x4e, 0x9d, 0x9c, 0xd3, 0x27, 0x01),
  430. LL(0x6c, 0x6c, 0xad, 0x6c, 0x47, 0xc1, 0xd8, 0x2b),
  431. LL(0x31, 0x31, 0xc4, 0x31, 0x95, 0xf5, 0x62, 0xa4),
  432. LL(0x74, 0x74, 0xcd, 0x74, 0x87, 0xb9, 0xe8, 0xf3),
  433. LL(0xf6, 0xf6, 0xff, 0xf6, 0xe3, 0x09, 0xf1, 0x15),
  434. LL(0x46, 0x46, 0x05, 0x46, 0x0a, 0x43, 0x8c, 0x4c),
  435. LL(0xac, 0xac, 0x8a, 0xac, 0x09, 0x26, 0x45, 0xa5),
  436. LL(0x89, 0x89, 0x1e, 0x89, 0x3c, 0x97, 0x0f, 0xb5),
  437. LL(0x14, 0x14, 0x50, 0x14, 0xa0, 0x44, 0x28, 0xb4),
  438. LL(0xe1, 0xe1, 0xa3, 0xe1, 0x5b, 0x42, 0xdf, 0xba),
  439. LL(0x16, 0x16, 0x58, 0x16, 0xb0, 0x4e, 0x2c, 0xa6),
  440. LL(0x3a, 0x3a, 0xe8, 0x3a, 0xcd, 0xd2, 0x74, 0xf7),
  441. LL(0x69, 0x69, 0xb9, 0x69, 0x6f, 0xd0, 0xd2, 0x06),
  442. LL(0x09, 0x09, 0x24, 0x09, 0x48, 0x2d, 0x12, 0x41),
  443. LL(0x70, 0x70, 0xdd, 0x70, 0xa7, 0xad, 0xe0, 0xd7),
  444. LL(0xb6, 0xb6, 0xe2, 0xb6, 0xd9, 0x54, 0x71, 0x6f),
  445. LL(0xd0, 0xd0, 0x67, 0xd0, 0xce, 0xb7, 0xbd, 0x1e),
  446. LL(0xed, 0xed, 0x93, 0xed, 0x3b, 0x7e, 0xc7, 0xd6),
  447. LL(0xcc, 0xcc, 0x17, 0xcc, 0x2e, 0xdb, 0x85, 0xe2),
  448. LL(0x42, 0x42, 0x15, 0x42, 0x2a, 0x57, 0x84, 0x68),
  449. LL(0x98, 0x98, 0x5a, 0x98, 0xb4, 0xc2, 0x2d, 0x2c),
  450. LL(0xa4, 0xa4, 0xaa, 0xa4, 0x49, 0x0e, 0x55, 0xed),
  451. LL(0x28, 0x28, 0xa0, 0x28, 0x5d, 0x88, 0x50, 0x75),
  452. LL(0x5c, 0x5c, 0x6d, 0x5c, 0xda, 0x31, 0xb8, 0x86),
  453. LL(0xf8, 0xf8, 0xc7, 0xf8, 0x93, 0x3f, 0xed, 0x6b),
  454. LL(0x86, 0x86, 0x22, 0x86, 0x44, 0xa4, 0x11, 0xc2),
  455. #define RC (&(Cx.q[256*N]))
  456. 0x18, 0x23, 0xc6, 0xe8, 0x87, 0xb8, 0x01, 0x4f,
  457. /* rc[ROUNDS] */
  458. 0x36, 0xa6, 0xd2, 0xf5, 0x79, 0x6f, 0x91, 0x52, 0x60, 0xbc, 0x9b,
  459. 0x8e, 0xa3, 0x0c, 0x7b, 0x35, 0x1d, 0xe0, 0xd7, 0xc2, 0x2e, 0x4b,
  460. 0xfe, 0x57, 0x15, 0x77, 0x37, 0xe5, 0x9f, 0xf0, 0x4a, 0xda, 0x58,
  461. 0xc9, 0x29, 0x0a, 0xb1, 0xa0, 0x6b, 0x85, 0xbd, 0x5d, 0x10, 0xf4,
  462. 0xcb, 0x3e, 0x05, 0x67, 0xe4, 0x27, 0x41, 0x8b, 0xa7, 0x7d, 0x95,
  463. 0xd8, 0xfb, 0xee, 0x7c, 0x66, 0xdd, 0x17, 0x47, 0x9e, 0xca, 0x2d,
  464. 0xbf, 0x07, 0xad, 0x5a, 0x83, 0x33
  465. }
  466. };
  467. void whirlpool_block(WHIRLPOOL_CTX *ctx, const void *inp, size_t n)
  468. {
  469. int r;
  470. const u8 *p = inp;
  471. union {
  472. u64 q[8];
  473. u8 c[64];
  474. } S, K, *H = (void *)ctx->H.q;
  475. #ifdef GO_FOR_MMX
  476. GO_FOR_MMX(ctx, inp, n);
  477. #endif
  478. do {
  479. #ifdef OPENSSL_SMALL_FOOTPRINT
  480. u64 L[8];
  481. int i;
  482. for (i = 0; i < 64; i++)
  483. S.c[i] = (K.c[i] = H->c[i]) ^ p[i];
  484. for (r = 0; r < ROUNDS; r++) {
  485. for (i = 0; i < 8; i++) {
  486. L[i] = i ? 0 : RC[r];
  487. L[i] ^= C0(K, i) ^ C1(K, (i - 1) & 7) ^
  488. C2(K, (i - 2) & 7) ^ C3(K, (i - 3) & 7) ^
  489. C4(K, (i - 4) & 7) ^ C5(K, (i - 5) & 7) ^
  490. C6(K, (i - 6) & 7) ^ C7(K, (i - 7) & 7);
  491. }
  492. memcpy(K.q, L, 64);
  493. for (i = 0; i < 8; i++) {
  494. L[i] ^= C0(S, i) ^ C1(S, (i - 1) & 7) ^
  495. C2(S, (i - 2) & 7) ^ C3(S, (i - 3) & 7) ^
  496. C4(S, (i - 4) & 7) ^ C5(S, (i - 5) & 7) ^
  497. C6(S, (i - 6) & 7) ^ C7(S, (i - 7) & 7);
  498. }
  499. memcpy(S.q, L, 64);
  500. }
  501. for (i = 0; i < 64; i++)
  502. H->c[i] ^= S.c[i] ^ p[i];
  503. #else
  504. u64 L0, L1, L2, L3, L4, L5, L6, L7;
  505. # ifdef STRICT_ALIGNMENT
  506. if ((size_t)p & 7) {
  507. memcpy(S.c, p, 64);
  508. S.q[0] ^= (K.q[0] = H->q[0]);
  509. S.q[1] ^= (K.q[1] = H->q[1]);
  510. S.q[2] ^= (K.q[2] = H->q[2]);
  511. S.q[3] ^= (K.q[3] = H->q[3]);
  512. S.q[4] ^= (K.q[4] = H->q[4]);
  513. S.q[5] ^= (K.q[5] = H->q[5]);
  514. S.q[6] ^= (K.q[6] = H->q[6]);
  515. S.q[7] ^= (K.q[7] = H->q[7]);
  516. } else
  517. # endif
  518. {
  519. const u64 *pa = (const u64 *)p;
  520. S.q[0] = (K.q[0] = H->q[0]) ^ pa[0];
  521. S.q[1] = (K.q[1] = H->q[1]) ^ pa[1];
  522. S.q[2] = (K.q[2] = H->q[2]) ^ pa[2];
  523. S.q[3] = (K.q[3] = H->q[3]) ^ pa[3];
  524. S.q[4] = (K.q[4] = H->q[4]) ^ pa[4];
  525. S.q[5] = (K.q[5] = H->q[5]) ^ pa[5];
  526. S.q[6] = (K.q[6] = H->q[6]) ^ pa[6];
  527. S.q[7] = (K.q[7] = H->q[7]) ^ pa[7];
  528. }
  529. for (r = 0; r < ROUNDS; r++) {
  530. # ifdef SMALL_REGISTER_BANK
  531. L0 = C0(K, 0) ^ C1(K, 7) ^ C2(K, 6) ^ C3(K, 5) ^
  532. C4(K, 4) ^ C5(K, 3) ^ C6(K, 2) ^ C7(K, 1) ^ RC[r];
  533. L1 = C0(K, 1) ^ C1(K, 0) ^ C2(K, 7) ^ C3(K, 6) ^
  534. C4(K, 5) ^ C5(K, 4) ^ C6(K, 3) ^ C7(K, 2);
  535. L2 = C0(K, 2) ^ C1(K, 1) ^ C2(K, 0) ^ C3(K, 7) ^
  536. C4(K, 6) ^ C5(K, 5) ^ C6(K, 4) ^ C7(K, 3);
  537. L3 = C0(K, 3) ^ C1(K, 2) ^ C2(K, 1) ^ C3(K, 0) ^
  538. C4(K, 7) ^ C5(K, 6) ^ C6(K, 5) ^ C7(K, 4);
  539. L4 = C0(K, 4) ^ C1(K, 3) ^ C2(K, 2) ^ C3(K, 1) ^
  540. C4(K, 0) ^ C5(K, 7) ^ C6(K, 6) ^ C7(K, 5);
  541. L5 = C0(K, 5) ^ C1(K, 4) ^ C2(K, 3) ^ C3(K, 2) ^
  542. C4(K, 1) ^ C5(K, 0) ^ C6(K, 7) ^ C7(K, 6);
  543. L6 = C0(K, 6) ^ C1(K, 5) ^ C2(K, 4) ^ C3(K, 3) ^
  544. C4(K, 2) ^ C5(K, 1) ^ C6(K, 0) ^ C7(K, 7);
  545. L7 = C0(K, 7) ^ C1(K, 6) ^ C2(K, 5) ^ C3(K, 4) ^
  546. C4(K, 3) ^ C5(K, 2) ^ C6(K, 1) ^ C7(K, 0);
  547. K.q[0] = L0;
  548. K.q[1] = L1;
  549. K.q[2] = L2;
  550. K.q[3] = L3;
  551. K.q[4] = L4;
  552. K.q[5] = L5;
  553. K.q[6] = L6;
  554. K.q[7] = L7;
  555. L0 ^= C0(S, 0) ^ C1(S, 7) ^ C2(S, 6) ^ C3(S, 5) ^
  556. C4(S, 4) ^ C5(S, 3) ^ C6(S, 2) ^ C7(S, 1);
  557. L1 ^= C0(S, 1) ^ C1(S, 0) ^ C2(S, 7) ^ C3(S, 6) ^
  558. C4(S, 5) ^ C5(S, 4) ^ C6(S, 3) ^ C7(S, 2);
  559. L2 ^= C0(S, 2) ^ C1(S, 1) ^ C2(S, 0) ^ C3(S, 7) ^
  560. C4(S, 6) ^ C5(S, 5) ^ C6(S, 4) ^ C7(S, 3);
  561. L3 ^= C0(S, 3) ^ C1(S, 2) ^ C2(S, 1) ^ C3(S, 0) ^
  562. C4(S, 7) ^ C5(S, 6) ^ C6(S, 5) ^ C7(S, 4);
  563. L4 ^= C0(S, 4) ^ C1(S, 3) ^ C2(S, 2) ^ C3(S, 1) ^
  564. C4(S, 0) ^ C5(S, 7) ^ C6(S, 6) ^ C7(S, 5);
  565. L5 ^= C0(S, 5) ^ C1(S, 4) ^ C2(S, 3) ^ C3(S, 2) ^
  566. C4(S, 1) ^ C5(S, 0) ^ C6(S, 7) ^ C7(S, 6);
  567. L6 ^= C0(S, 6) ^ C1(S, 5) ^ C2(S, 4) ^ C3(S, 3) ^
  568. C4(S, 2) ^ C5(S, 1) ^ C6(S, 0) ^ C7(S, 7);
  569. L7 ^= C0(S, 7) ^ C1(S, 6) ^ C2(S, 5) ^ C3(S, 4) ^
  570. C4(S, 3) ^ C5(S, 2) ^ C6(S, 1) ^ C7(S, 0);
  571. S.q[0] = L0;
  572. S.q[1] = L1;
  573. S.q[2] = L2;
  574. S.q[3] = L3;
  575. S.q[4] = L4;
  576. S.q[5] = L5;
  577. S.q[6] = L6;
  578. S.q[7] = L7;
  579. # else
  580. L0 = C0(K, 0);
  581. L1 = C1(K, 0);
  582. L2 = C2(K, 0);
  583. L3 = C3(K, 0);
  584. L4 = C4(K, 0);
  585. L5 = C5(K, 0);
  586. L6 = C6(K, 0);
  587. L7 = C7(K, 0);
  588. L0 ^= RC[r];
  589. L1 ^= C0(K, 1);
  590. L2 ^= C1(K, 1);
  591. L3 ^= C2(K, 1);
  592. L4 ^= C3(K, 1);
  593. L5 ^= C4(K, 1);
  594. L6 ^= C5(K, 1);
  595. L7 ^= C6(K, 1);
  596. L0 ^= C7(K, 1);
  597. L2 ^= C0(K, 2);
  598. L3 ^= C1(K, 2);
  599. L4 ^= C2(K, 2);
  600. L5 ^= C3(K, 2);
  601. L6 ^= C4(K, 2);
  602. L7 ^= C5(K, 2);
  603. L0 ^= C6(K, 2);
  604. L1 ^= C7(K, 2);
  605. L3 ^= C0(K, 3);
  606. L4 ^= C1(K, 3);
  607. L5 ^= C2(K, 3);
  608. L6 ^= C3(K, 3);
  609. L7 ^= C4(K, 3);
  610. L0 ^= C5(K, 3);
  611. L1 ^= C6(K, 3);
  612. L2 ^= C7(K, 3);
  613. L4 ^= C0(K, 4);
  614. L5 ^= C1(K, 4);
  615. L6 ^= C2(K, 4);
  616. L7 ^= C3(K, 4);
  617. L0 ^= C4(K, 4);
  618. L1 ^= C5(K, 4);
  619. L2 ^= C6(K, 4);
  620. L3 ^= C7(K, 4);
  621. L5 ^= C0(K, 5);
  622. L6 ^= C1(K, 5);
  623. L7 ^= C2(K, 5);
  624. L0 ^= C3(K, 5);
  625. L1 ^= C4(K, 5);
  626. L2 ^= C5(K, 5);
  627. L3 ^= C6(K, 5);
  628. L4 ^= C7(K, 5);
  629. L6 ^= C0(K, 6);
  630. L7 ^= C1(K, 6);
  631. L0 ^= C2(K, 6);
  632. L1 ^= C3(K, 6);
  633. L2 ^= C4(K, 6);
  634. L3 ^= C5(K, 6);
  635. L4 ^= C6(K, 6);
  636. L5 ^= C7(K, 6);
  637. L7 ^= C0(K, 7);
  638. L0 ^= C1(K, 7);
  639. L1 ^= C2(K, 7);
  640. L2 ^= C3(K, 7);
  641. L3 ^= C4(K, 7);
  642. L4 ^= C5(K, 7);
  643. L5 ^= C6(K, 7);
  644. L6 ^= C7(K, 7);
  645. K.q[0] = L0;
  646. K.q[1] = L1;
  647. K.q[2] = L2;
  648. K.q[3] = L3;
  649. K.q[4] = L4;
  650. K.q[5] = L5;
  651. K.q[6] = L6;
  652. K.q[7] = L7;
  653. L0 ^= C0(S, 0);
  654. L1 ^= C1(S, 0);
  655. L2 ^= C2(S, 0);
  656. L3 ^= C3(S, 0);
  657. L4 ^= C4(S, 0);
  658. L5 ^= C5(S, 0);
  659. L6 ^= C6(S, 0);
  660. L7 ^= C7(S, 0);
  661. L1 ^= C0(S, 1);
  662. L2 ^= C1(S, 1);
  663. L3 ^= C2(S, 1);
  664. L4 ^= C3(S, 1);
  665. L5 ^= C4(S, 1);
  666. L6 ^= C5(S, 1);
  667. L7 ^= C6(S, 1);
  668. L0 ^= C7(S, 1);
  669. L2 ^= C0(S, 2);
  670. L3 ^= C1(S, 2);
  671. L4 ^= C2(S, 2);
  672. L5 ^= C3(S, 2);
  673. L6 ^= C4(S, 2);
  674. L7 ^= C5(S, 2);
  675. L0 ^= C6(S, 2);
  676. L1 ^= C7(S, 2);
  677. L3 ^= C0(S, 3);
  678. L4 ^= C1(S, 3);
  679. L5 ^= C2(S, 3);
  680. L6 ^= C3(S, 3);
  681. L7 ^= C4(S, 3);
  682. L0 ^= C5(S, 3);
  683. L1 ^= C6(S, 3);
  684. L2 ^= C7(S, 3);
  685. L4 ^= C0(S, 4);
  686. L5 ^= C1(S, 4);
  687. L6 ^= C2(S, 4);
  688. L7 ^= C3(S, 4);
  689. L0 ^= C4(S, 4);
  690. L1 ^= C5(S, 4);
  691. L2 ^= C6(S, 4);
  692. L3 ^= C7(S, 4);
  693. L5 ^= C0(S, 5);
  694. L6 ^= C1(S, 5);
  695. L7 ^= C2(S, 5);
  696. L0 ^= C3(S, 5);
  697. L1 ^= C4(S, 5);
  698. L2 ^= C5(S, 5);
  699. L3 ^= C6(S, 5);
  700. L4 ^= C7(S, 5);
  701. L6 ^= C0(S, 6);
  702. L7 ^= C1(S, 6);
  703. L0 ^= C2(S, 6);
  704. L1 ^= C3(S, 6);
  705. L2 ^= C4(S, 6);
  706. L3 ^= C5(S, 6);
  707. L4 ^= C6(S, 6);
  708. L5 ^= C7(S, 6);
  709. L7 ^= C0(S, 7);
  710. L0 ^= C1(S, 7);
  711. L1 ^= C2(S, 7);
  712. L2 ^= C3(S, 7);
  713. L3 ^= C4(S, 7);
  714. L4 ^= C5(S, 7);
  715. L5 ^= C6(S, 7);
  716. L6 ^= C7(S, 7);
  717. S.q[0] = L0;
  718. S.q[1] = L1;
  719. S.q[2] = L2;
  720. S.q[3] = L3;
  721. S.q[4] = L4;
  722. S.q[5] = L5;
  723. S.q[6] = L6;
  724. S.q[7] = L7;
  725. # endif
  726. }
  727. # ifdef STRICT_ALIGNMENT
  728. if ((size_t)p & 7) {
  729. int i;
  730. for (i = 0; i < 64; i++)
  731. H->c[i] ^= S.c[i] ^ p[i];
  732. } else
  733. # endif
  734. {
  735. const u64 *pa = (const u64 *)p;
  736. H->q[0] ^= S.q[0] ^ pa[0];
  737. H->q[1] ^= S.q[1] ^ pa[1];
  738. H->q[2] ^= S.q[2] ^ pa[2];
  739. H->q[3] ^= S.q[3] ^ pa[3];
  740. H->q[4] ^= S.q[4] ^ pa[4];
  741. H->q[5] ^= S.q[5] ^ pa[5];
  742. H->q[6] ^= S.q[6] ^ pa[6];
  743. H->q[7] ^= S.q[7] ^ pa[7];
  744. }
  745. #endif
  746. p += 64;
  747. } while (--n);
  748. }