sp_cortexm.c 1.8 MB


  1. /* sp.c
  2. *
  3. * Copyright (C) 2006-2022 wolfSSL Inc.
  4. *
  5. * This file is part of wolfSSL.
  6. *
  7. * wolfSSL is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU General Public License as published by
  9. * the Free Software Foundation; either version 2 of the License, or
  10. * (at your option) any later version.
  11. *
  12. * wolfSSL is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. * GNU General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU General Public License
  18. * along with this program; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1335, USA
  20. */
  21. /* Implementation by Sean Parkinson. */
  22. #ifdef HAVE_CONFIG_H
  23. #include <config.h>
  24. #endif
  25. #include <wolfssl/wolfcrypt/settings.h>
  26. #if defined(WOLFSSL_HAVE_SP_RSA) || defined(WOLFSSL_HAVE_SP_DH) || \
  27. defined(WOLFSSL_HAVE_SP_ECC)
  28. #include <wolfssl/wolfcrypt/error-crypt.h>
  29. #include <wolfssl/wolfcrypt/cpuid.h>
  30. #ifdef NO_INLINE
  31. #include <wolfssl/wolfcrypt/misc.h>
  32. #else
  33. #define WOLFSSL_MISC_INCLUDED
  34. #include <wolfcrypt/src/misc.c>
  35. #endif
  36. #ifdef RSA_LOW_MEM
  37. #ifndef WOLFSSL_SP_SMALL
  38. #define WOLFSSL_SP_SMALL
  39. #endif
  40. #endif
  41. #include <wolfssl/wolfcrypt/sp.h>
  42. #ifdef __IAR_SYSTEMS_ICC__
  43. #define __asm__ asm
  44. #define __volatile__ volatile
  45. #endif /* __IAR_SYSTEMS_ICC__ */
  46. #ifdef __KEIL__
  47. #define __asm__ __asm
  48. #define __volatile__ volatile
  49. #endif
  50. #ifdef WOLFSSL_SP_ARM_CORTEX_M_ASM
  51. #define SP_PRINT_NUM(var, name, total, words, bits) \
  52. do { \
  53. int ii; \
  54. fprintf(stderr, name "=0x"); \
  55. for (ii = ((bits + 31) / 32) - 1; ii >= 0; ii--) \
  56. fprintf(stderr, SP_PRINT_FMT, (var)[ii]); \
  57. fprintf(stderr, "\n"); \
  58. } while (0)
  59. #define SP_PRINT_VAL(var, name) \
  60. fprintf(stderr, name "=0x" SP_PRINT_FMT "\n", var)
  61. #define SP_PRINT_INT(var, name) \
  62. fprintf(stderr, name "=%d\n", var)
  63. #if defined(WOLFSSL_HAVE_SP_RSA) || defined(WOLFSSL_HAVE_SP_DH)
  64. #ifndef WOLFSSL_SP_NO_2048
  65. /* Read big endian unsigned byte array into r.
  66. *
  67. * r A single precision integer.
  68. * size Maximum number of bytes to convert
  69. * a Byte array.
  70. * n Number of bytes in array to read.
  71. */
  72. static void sp_2048_from_bin(sp_digit* r, int size, const byte* a, int n)
  73. {
  74. int i;
  75. int j;
  76. byte* d;
  77. for (i = n - 1,j = 0; i >= 3; i -= 4) {
  78. r[j] = ((sp_digit)a[i - 0] << 0) |
  79. ((sp_digit)a[i - 1] << 8) |
  80. ((sp_digit)a[i - 2] << 16) |
  81. ((sp_digit)a[i - 3] << 24);
  82. j++;
  83. }
  84. if (i >= 0) {
  85. r[j] = 0;
  86. d = (byte*)r;
  87. switch (i) {
  88. case 2: d[n - 1 - 2] = a[2]; //fallthrough
  89. case 1: d[n - 1 - 1] = a[1]; //fallthrough
  90. case 0: d[n - 1 - 0] = a[0]; //fallthrough
  91. }
  92. j++;
  93. }
  94. for (; j < size; j++) {
  95. r[j] = 0;
  96. }
  97. }
  98. /* Convert an mp_int to an array of sp_digit.
  99. *
  100. * r A single precision integer.
  101. * size Maximum number of bytes to convert
  102. * a A multi-precision integer.
  103. */
  104. static void sp_2048_from_mp(sp_digit* r, int size, const mp_int* a)
  105. {
  106. #if DIGIT_BIT == 32
  107. int j;
  108. XMEMCPY(r, a->dp, sizeof(sp_digit) * a->used);
  109. for (j = a->used; j < size; j++) {
  110. r[j] = 0;
  111. }
  112. #elif DIGIT_BIT > 32
  113. int i;
  114. int j = 0;
  115. word32 s = 0;
  116. r[0] = 0;
  117. for (i = 0; i < a->used && j < size; i++) {
  118. r[j] |= ((sp_digit)a->dp[i] << s);
  119. r[j] &= 0xffffffff;
  120. s = 32U - s;
  121. if (j + 1 >= size) {
  122. break;
  123. }
  124. /* lint allow cast of mismatch word32 and mp_digit */
  125. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  126. while ((s + 32U) <= (word32)DIGIT_BIT) {
  127. s += 32U;
  128. r[j] &= 0xffffffff;
  129. if (j + 1 >= size) {
  130. break;
  131. }
  132. if (s < (word32)DIGIT_BIT) {
  133. /* lint allow cast of mismatch word32 and mp_digit */
  134. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  135. }
  136. else {
  137. r[++j] = (sp_digit)0;
  138. }
  139. }
  140. s = (word32)DIGIT_BIT - s;
  141. }
  142. for (j++; j < size; j++) {
  143. r[j] = 0;
  144. }
  145. #else
  146. int i;
  147. int j = 0;
  148. int s = 0;
  149. r[0] = 0;
  150. for (i = 0; i < a->used && j < size; i++) {
  151. r[j] |= ((sp_digit)a->dp[i]) << s;
  152. if (s + DIGIT_BIT >= 32) {
  153. r[j] &= 0xffffffff;
  154. if (j + 1 >= size) {
  155. break;
  156. }
  157. s = 32 - s;
  158. if (s == DIGIT_BIT) {
  159. r[++j] = 0;
  160. s = 0;
  161. }
  162. else {
  163. r[++j] = a->dp[i] >> s;
  164. s = DIGIT_BIT - s;
  165. }
  166. }
  167. else {
  168. s += DIGIT_BIT;
  169. }
  170. }
  171. for (j++; j < size; j++) {
  172. r[j] = 0;
  173. }
  174. #endif
  175. }
  176. /* Write r as big endian to byte array.
  177. * Fixed length number of bytes written: 256
  178. *
  179. * r A single precision integer.
  180. * a Byte array.
  181. */
  182. static void sp_2048_to_bin_64(sp_digit* r, byte* a)
  183. {
  184. int i;
  185. int j = 0;
  186. for (i = 63; i >= 0; i--) {
  187. a[j++] = r[i] >> 24;
  188. a[j++] = r[i] >> 16;
  189. a[j++] = r[i] >> 8;
  190. a[j++] = r[i] >> 0;
  191. }
  192. }
  193. #if (defined(WOLFSSL_HAVE_SP_RSA) && (!defined(WOLFSSL_RSA_PUBLIC_ONLY) || !defined(WOLFSSL_SP_SMALL))) || defined(WOLFSSL_HAVE_SP_DH)
  194. /* Normalize the values in each word to 32 bits.
  195. * The macro has an empty replacement list, so using it generates no code.
  196. * a Array of sp_digit to normalize.
  197. */
  198. #define sp_2048_norm_64(a)
  199. #endif /* (WOLFSSL_HAVE_SP_RSA && (!WOLFSSL_RSA_PUBLIC_ONLY || !WOLFSSL_SP_SMALL)) || WOLFSSL_HAVE_SP_DH */
  200. /* Normalize the values in each word to 32 bits.
  201. * Unconditional definition with the same empty replacement list.
  202. * a Array of sp_digit to normalize.
  203. */
  204. #define sp_2048_norm_64(a)
  205. #ifndef WOLFSSL_SP_SMALL
  206. /* Multiply a and b into r. (r = a * b)
  207. *
 * Words 0..7 of a and of b are read and words 0..15 of r are written.
 * The partial products A[i] * B[j] are summed one result word (i + j) at a
 * time in a three-word accumulator that rotates through r3, r4 and r5;
 * r6 and r8 hold the operands and the two halves of each product.
 * Result words 0..7 are collected in a local buffer and copied to r only
 * after the last read of a and b; result words 8..15 are stored to r
 * directly.
 *
  208. * r A single precision integer. Receives the product.
  209. * a A single precision integer.
  210. * b A single precision integer.
  211. */
  212. SP_NOINLINE static void sp_2048_mul_8(sp_digit* r, const sp_digit* a,
  213. const sp_digit* b)
  214. {
  215. sp_digit tmp_arr[8];
  216. sp_digit* tmp = tmp_arr;
  217. __asm__ __volatile__ (
  218. /* A[0] * B[0] */
  219. "ldr r6, [%[a], #0]\n\t"
  220. "ldr r8, [%[b], #0]\n\t"
  221. "umull r3, r4, r6, r8\n\t"
  222. "mov r5, #0\n\t"
  223. "str r3, [%[tmp], #0]\n\t"
  224. "mov r3, #0\n\t"
  225. /* A[0] * B[1] */
  226. "ldr r8, [%[b], #4]\n\t"
  227. "umull r6, r8, r6, r8\n\t"
  228. "adds r4, r4, r6\n\t"
  229. "adc r5, r5, r8\n\t"
  230. /* A[1] * B[0] */
  231. "ldr r6, [%[a], #4]\n\t"
  232. "ldr r8, [%[b], #0]\n\t"
  233. "umull r6, r8, r6, r8\n\t"
  234. "adds r4, r4, r6\n\t"
  235. "adcs r5, r5, r8\n\t"
  236. "adc r3, r3, #0\n\t"
  237. "str r4, [%[tmp], #4]\n\t"
  238. "mov r4, #0\n\t"
  239. /* A[0] * B[2] */
  240. "ldr r6, [%[a], #0]\n\t"
  241. "ldr r8, [%[b], #8]\n\t"
  242. "umull r6, r8, r6, r8\n\t"
  243. "adds r5, r5, r6\n\t"
  244. "adcs r3, r3, r8\n\t"
  245. "adc r4, r4, #0\n\t"
  246. /* A[1] * B[1] */
  247. "ldr r6, [%[a], #4]\n\t"
  248. "ldr r8, [%[b], #4]\n\t"
  249. "umull r6, r8, r6, r8\n\t"
  250. "adds r5, r5, r6\n\t"
  251. "adcs r3, r3, r8\n\t"
  252. "adc r4, r4, #0\n\t"
  253. /* A[2] * B[0] */
  254. "ldr r6, [%[a], #8]\n\t"
  255. "ldr r8, [%[b], #0]\n\t"
  256. "umull r6, r8, r6, r8\n\t"
  257. "adds r5, r5, r6\n\t"
  258. "adcs r3, r3, r8\n\t"
  259. "adc r4, r4, #0\n\t"
  260. "str r5, [%[tmp], #8]\n\t"
  261. "mov r5, #0\n\t"
  262. /* A[0] * B[3] */
  263. "ldr r6, [%[a], #0]\n\t"
  264. "ldr r8, [%[b], #12]\n\t"
  265. "umull r6, r8, r6, r8\n\t"
  266. "adds r3, r3, r6\n\t"
  267. "adcs r4, r4, r8\n\t"
  268. "adc r5, r5, #0\n\t"
  269. /* A[1] * B[2] */
  270. "ldr r6, [%[a], #4]\n\t"
  271. "ldr r8, [%[b], #8]\n\t"
  272. "umull r6, r8, r6, r8\n\t"
  273. "adds r3, r3, r6\n\t"
  274. "adcs r4, r4, r8\n\t"
  275. "adc r5, r5, #0\n\t"
  276. /* A[2] * B[1] */
  277. "ldr r6, [%[a], #8]\n\t"
  278. "ldr r8, [%[b], #4]\n\t"
  279. "umull r6, r8, r6, r8\n\t"
  280. "adds r3, r3, r6\n\t"
  281. "adcs r4, r4, r8\n\t"
  282. "adc r5, r5, #0\n\t"
  283. /* A[3] * B[0] */
  284. "ldr r6, [%[a], #12]\n\t"
  285. "ldr r8, [%[b], #0]\n\t"
  286. "umull r6, r8, r6, r8\n\t"
  287. "adds r3, r3, r6\n\t"
  288. "adcs r4, r4, r8\n\t"
  289. "adc r5, r5, #0\n\t"
  290. "str r3, [%[tmp], #12]\n\t"
  291. "mov r3, #0\n\t"
  292. /* A[0] * B[4] */
  293. "ldr r6, [%[a], #0]\n\t"
  294. "ldr r8, [%[b], #16]\n\t"
  295. "umull r6, r8, r6, r8\n\t"
  296. "adds r4, r4, r6\n\t"
  297. "adcs r5, r5, r8\n\t"
  298. "adc r3, r3, #0\n\t"
  299. /* A[1] * B[3] */
  300. "ldr r6, [%[a], #4]\n\t"
  301. "ldr r8, [%[b], #12]\n\t"
  302. "umull r6, r8, r6, r8\n\t"
  303. "adds r4, r4, r6\n\t"
  304. "adcs r5, r5, r8\n\t"
  305. "adc r3, r3, #0\n\t"
  306. /* A[2] * B[2] */
  307. "ldr r6, [%[a], #8]\n\t"
  308. "ldr r8, [%[b], #8]\n\t"
  309. "umull r6, r8, r6, r8\n\t"
  310. "adds r4, r4, r6\n\t"
  311. "adcs r5, r5, r8\n\t"
  312. "adc r3, r3, #0\n\t"
  313. /* A[3] * B[1] */
  314. "ldr r6, [%[a], #12]\n\t"
  315. "ldr r8, [%[b], #4]\n\t"
  316. "umull r6, r8, r6, r8\n\t"
  317. "adds r4, r4, r6\n\t"
  318. "adcs r5, r5, r8\n\t"
  319. "adc r3, r3, #0\n\t"
  320. /* A[4] * B[0] */
  321. "ldr r6, [%[a], #16]\n\t"
  322. "ldr r8, [%[b], #0]\n\t"
  323. "umull r6, r8, r6, r8\n\t"
  324. "adds r4, r4, r6\n\t"
  325. "adcs r5, r5, r8\n\t"
  326. "adc r3, r3, #0\n\t"
  327. "str r4, [%[tmp], #16]\n\t"
  328. "mov r4, #0\n\t"
  329. /* A[0] * B[5] */
  330. "ldr r6, [%[a], #0]\n\t"
  331. "ldr r8, [%[b], #20]\n\t"
  332. "umull r6, r8, r6, r8\n\t"
  333. "adds r5, r5, r6\n\t"
  334. "adcs r3, r3, r8\n\t"
  335. "adc r4, r4, #0\n\t"
  336. /* A[1] * B[4] */
  337. "ldr r6, [%[a], #4]\n\t"
  338. "ldr r8, [%[b], #16]\n\t"
  339. "umull r6, r8, r6, r8\n\t"
  340. "adds r5, r5, r6\n\t"
  341. "adcs r3, r3, r8\n\t"
  342. "adc r4, r4, #0\n\t"
  343. /* A[2] * B[3] */
  344. "ldr r6, [%[a], #8]\n\t"
  345. "ldr r8, [%[b], #12]\n\t"
  346. "umull r6, r8, r6, r8\n\t"
  347. "adds r5, r5, r6\n\t"
  348. "adcs r3, r3, r8\n\t"
  349. "adc r4, r4, #0\n\t"
  350. /* A[3] * B[2] */
  351. "ldr r6, [%[a], #12]\n\t"
  352. "ldr r8, [%[b], #8]\n\t"
  353. "umull r6, r8, r6, r8\n\t"
  354. "adds r5, r5, r6\n\t"
  355. "adcs r3, r3, r8\n\t"
  356. "adc r4, r4, #0\n\t"
  357. /* A[4] * B[1] */
  358. "ldr r6, [%[a], #16]\n\t"
  359. "ldr r8, [%[b], #4]\n\t"
  360. "umull r6, r8, r6, r8\n\t"
  361. "adds r5, r5, r6\n\t"
  362. "adcs r3, r3, r8\n\t"
  363. "adc r4, r4, #0\n\t"
  364. /* A[5] * B[0] */
  365. "ldr r6, [%[a], #20]\n\t"
  366. "ldr r8, [%[b], #0]\n\t"
  367. "umull r6, r8, r6, r8\n\t"
  368. "adds r5, r5, r6\n\t"
  369. "adcs r3, r3, r8\n\t"
  370. "adc r4, r4, #0\n\t"
  371. "str r5, [%[tmp], #20]\n\t"
  372. "mov r5, #0\n\t"
  373. /* A[0] * B[6] */
  374. "ldr r6, [%[a], #0]\n\t"
  375. "ldr r8, [%[b], #24]\n\t"
  376. "umull r6, r8, r6, r8\n\t"
  377. "adds r3, r3, r6\n\t"
  378. "adcs r4, r4, r8\n\t"
  379. "adc r5, r5, #0\n\t"
  380. /* A[1] * B[5] */
  381. "ldr r6, [%[a], #4]\n\t"
  382. "ldr r8, [%[b], #20]\n\t"
  383. "umull r6, r8, r6, r8\n\t"
  384. "adds r3, r3, r6\n\t"
  385. "adcs r4, r4, r8\n\t"
  386. "adc r5, r5, #0\n\t"
  387. /* A[2] * B[4] */
  388. "ldr r6, [%[a], #8]\n\t"
  389. "ldr r8, [%[b], #16]\n\t"
  390. "umull r6, r8, r6, r8\n\t"
  391. "adds r3, r3, r6\n\t"
  392. "adcs r4, r4, r8\n\t"
  393. "adc r5, r5, #0\n\t"
  394. /* A[3] * B[3] */
  395. "ldr r6, [%[a], #12]\n\t"
  396. "ldr r8, [%[b], #12]\n\t"
  397. "umull r6, r8, r6, r8\n\t"
  398. "adds r3, r3, r6\n\t"
  399. "adcs r4, r4, r8\n\t"
  400. "adc r5, r5, #0\n\t"
  401. /* A[4] * B[2] */
  402. "ldr r6, [%[a], #16]\n\t"
  403. "ldr r8, [%[b], #8]\n\t"
  404. "umull r6, r8, r6, r8\n\t"
  405. "adds r3, r3, r6\n\t"
  406. "adcs r4, r4, r8\n\t"
  407. "adc r5, r5, #0\n\t"
  408. /* A[5] * B[1] */
  409. "ldr r6, [%[a], #20]\n\t"
  410. "ldr r8, [%[b], #4]\n\t"
  411. "umull r6, r8, r6, r8\n\t"
  412. "adds r3, r3, r6\n\t"
  413. "adcs r4, r4, r8\n\t"
  414. "adc r5, r5, #0\n\t"
  415. /* A[6] * B[0] */
  416. "ldr r6, [%[a], #24]\n\t"
  417. "ldr r8, [%[b], #0]\n\t"
  418. "umull r6, r8, r6, r8\n\t"
  419. "adds r3, r3, r6\n\t"
  420. "adcs r4, r4, r8\n\t"
  421. "adc r5, r5, #0\n\t"
  422. "str r3, [%[tmp], #24]\n\t"
  423. "mov r3, #0\n\t"
  424. /* A[0] * B[7] */
  425. "ldr r6, [%[a], #0]\n\t"
  426. "ldr r8, [%[b], #28]\n\t"
  427. "umull r6, r8, r6, r8\n\t"
  428. "adds r4, r4, r6\n\t"
  429. "adcs r5, r5, r8\n\t"
  430. "adc r3, r3, #0\n\t"
  431. /* A[1] * B[6] */
  432. "ldr r6, [%[a], #4]\n\t"
  433. "ldr r8, [%[b], #24]\n\t"
  434. "umull r6, r8, r6, r8\n\t"
  435. "adds r4, r4, r6\n\t"
  436. "adcs r5, r5, r8\n\t"
  437. "adc r3, r3, #0\n\t"
  438. /* A[2] * B[5] */
  439. "ldr r6, [%[a], #8]\n\t"
  440. "ldr r8, [%[b], #20]\n\t"
  441. "umull r6, r8, r6, r8\n\t"
  442. "adds r4, r4, r6\n\t"
  443. "adcs r5, r5, r8\n\t"
  444. "adc r3, r3, #0\n\t"
  445. /* A[3] * B[4] */
  446. "ldr r6, [%[a], #12]\n\t"
  447. "ldr r8, [%[b], #16]\n\t"
  448. "umull r6, r8, r6, r8\n\t"
  449. "adds r4, r4, r6\n\t"
  450. "adcs r5, r5, r8\n\t"
  451. "adc r3, r3, #0\n\t"
  452. /* A[4] * B[3] */
  453. "ldr r6, [%[a], #16]\n\t"
  454. "ldr r8, [%[b], #12]\n\t"
  455. "umull r6, r8, r6, r8\n\t"
  456. "adds r4, r4, r6\n\t"
  457. "adcs r5, r5, r8\n\t"
  458. "adc r3, r3, #0\n\t"
  459. /* A[5] * B[2] */
  460. "ldr r6, [%[a], #20]\n\t"
  461. "ldr r8, [%[b], #8]\n\t"
  462. "umull r6, r8, r6, r8\n\t"
  463. "adds r4, r4, r6\n\t"
  464. "adcs r5, r5, r8\n\t"
  465. "adc r3, r3, #0\n\t"
  466. /* A[6] * B[1] */
  467. "ldr r6, [%[a], #24]\n\t"
  468. "ldr r8, [%[b], #4]\n\t"
  469. "umull r6, r8, r6, r8\n\t"
  470. "adds r4, r4, r6\n\t"
  471. "adcs r5, r5, r8\n\t"
  472. "adc r3, r3, #0\n\t"
  473. /* A[7] * B[0] */
  474. "ldr r6, [%[a], #28]\n\t"
  475. "ldr r8, [%[b], #0]\n\t"
  476. "umull r6, r8, r6, r8\n\t"
  477. "adds r4, r4, r6\n\t"
  478. "adcs r5, r5, r8\n\t"
  479. "adc r3, r3, #0\n\t"
  480. "str r4, [%[tmp], #28]\n\t"
  481. "mov r4, #0\n\t"
  482. /* A[1] * B[7] */
  483. "ldr r6, [%[a], #4]\n\t"
  484. "ldr r8, [%[b], #28]\n\t"
  485. "umull r6, r8, r6, r8\n\t"
  486. "adds r5, r5, r6\n\t"
  487. "adcs r3, r3, r8\n\t"
  488. "adc r4, r4, #0\n\t"
  489. /* A[2] * B[6] */
  490. "ldr r6, [%[a], #8]\n\t"
  491. "ldr r8, [%[b], #24]\n\t"
  492. "umull r6, r8, r6, r8\n\t"
  493. "adds r5, r5, r6\n\t"
  494. "adcs r3, r3, r8\n\t"
  495. "adc r4, r4, #0\n\t"
  496. /* A[3] * B[5] */
  497. "ldr r6, [%[a], #12]\n\t"
  498. "ldr r8, [%[b], #20]\n\t"
  499. "umull r6, r8, r6, r8\n\t"
  500. "adds r5, r5, r6\n\t"
  501. "adcs r3, r3, r8\n\t"
  502. "adc r4, r4, #0\n\t"
  503. /* A[4] * B[4] */
  504. "ldr r6, [%[a], #16]\n\t"
  505. "ldr r8, [%[b], #16]\n\t"
  506. "umull r6, r8, r6, r8\n\t"
  507. "adds r5, r5, r6\n\t"
  508. "adcs r3, r3, r8\n\t"
  509. "adc r4, r4, #0\n\t"
  510. /* A[5] * B[3] */
  511. "ldr r6, [%[a], #20]\n\t"
  512. "ldr r8, [%[b], #12]\n\t"
  513. "umull r6, r8, r6, r8\n\t"
  514. "adds r5, r5, r6\n\t"
  515. "adcs r3, r3, r8\n\t"
  516. "adc r4, r4, #0\n\t"
  517. /* A[6] * B[2] */
  518. "ldr r6, [%[a], #24]\n\t"
  519. "ldr r8, [%[b], #8]\n\t"
  520. "umull r6, r8, r6, r8\n\t"
  521. "adds r5, r5, r6\n\t"
  522. "adcs r3, r3, r8\n\t"
  523. "adc r4, r4, #0\n\t"
  524. /* A[7] * B[1] */
  525. "ldr r6, [%[a], #28]\n\t"
  526. "ldr r8, [%[b], #4]\n\t"
  527. "umull r6, r8, r6, r8\n\t"
  528. "adds r5, r5, r6\n\t"
  529. "adcs r3, r3, r8\n\t"
  530. "adc r4, r4, #0\n\t"
/* From here on result words are stored to r (byte offsets 32..60), not tmp. */
  531. "str r5, [%[r], #32]\n\t"
  532. "mov r5, #0\n\t"
  533. /* A[2] * B[7] */
  534. "ldr r6, [%[a], #8]\n\t"
  535. "ldr r8, [%[b], #28]\n\t"
  536. "umull r6, r8, r6, r8\n\t"
  537. "adds r3, r3, r6\n\t"
  538. "adcs r4, r4, r8\n\t"
  539. "adc r5, r5, #0\n\t"
  540. /* A[3] * B[6] */
  541. "ldr r6, [%[a], #12]\n\t"
  542. "ldr r8, [%[b], #24]\n\t"
  543. "umull r6, r8, r6, r8\n\t"
  544. "adds r3, r3, r6\n\t"
  545. "adcs r4, r4, r8\n\t"
  546. "adc r5, r5, #0\n\t"
  547. /* A[4] * B[5] */
  548. "ldr r6, [%[a], #16]\n\t"
  549. "ldr r8, [%[b], #20]\n\t"
  550. "umull r6, r8, r6, r8\n\t"
  551. "adds r3, r3, r6\n\t"
  552. "adcs r4, r4, r8\n\t"
  553. "adc r5, r5, #0\n\t"
  554. /* A[5] * B[4] */
  555. "ldr r6, [%[a], #20]\n\t"
  556. "ldr r8, [%[b], #16]\n\t"
  557. "umull r6, r8, r6, r8\n\t"
  558. "adds r3, r3, r6\n\t"
  559. "adcs r4, r4, r8\n\t"
  560. "adc r5, r5, #0\n\t"
  561. /* A[6] * B[3] */
  562. "ldr r6, [%[a], #24]\n\t"
  563. "ldr r8, [%[b], #12]\n\t"
  564. "umull r6, r8, r6, r8\n\t"
  565. "adds r3, r3, r6\n\t"
  566. "adcs r4, r4, r8\n\t"
  567. "adc r5, r5, #0\n\t"
  568. /* A[7] * B[2] */
  569. "ldr r6, [%[a], #28]\n\t"
  570. "ldr r8, [%[b], #8]\n\t"
  571. "umull r6, r8, r6, r8\n\t"
  572. "adds r3, r3, r6\n\t"
  573. "adcs r4, r4, r8\n\t"
  574. "adc r5, r5, #0\n\t"
  575. "str r3, [%[r], #36]\n\t"
  576. "mov r3, #0\n\t"
  577. /* A[3] * B[7] */
  578. "ldr r6, [%[a], #12]\n\t"
  579. "ldr r8, [%[b], #28]\n\t"
  580. "umull r6, r8, r6, r8\n\t"
  581. "adds r4, r4, r6\n\t"
  582. "adcs r5, r5, r8\n\t"
  583. "adc r3, r3, #0\n\t"
  584. /* A[4] * B[6] */
  585. "ldr r6, [%[a], #16]\n\t"
  586. "ldr r8, [%[b], #24]\n\t"
  587. "umull r6, r8, r6, r8\n\t"
  588. "adds r4, r4, r6\n\t"
  589. "adcs r5, r5, r8\n\t"
  590. "adc r3, r3, #0\n\t"
  591. /* A[5] * B[5] */
  592. "ldr r6, [%[a], #20]\n\t"
  593. "ldr r8, [%[b], #20]\n\t"
  594. "umull r6, r8, r6, r8\n\t"
  595. "adds r4, r4, r6\n\t"
  596. "adcs r5, r5, r8\n\t"
  597. "adc r3, r3, #0\n\t"
  598. /* A[6] * B[4] */
  599. "ldr r6, [%[a], #24]\n\t"
  600. "ldr r8, [%[b], #16]\n\t"
  601. "umull r6, r8, r6, r8\n\t"
  602. "adds r4, r4, r6\n\t"
  603. "adcs r5, r5, r8\n\t"
  604. "adc r3, r3, #0\n\t"
  605. /* A[7] * B[3] */
  606. "ldr r6, [%[a], #28]\n\t"
  607. "ldr r8, [%[b], #12]\n\t"
  608. "umull r6, r8, r6, r8\n\t"
  609. "adds r4, r4, r6\n\t"
  610. "adcs r5, r5, r8\n\t"
  611. "adc r3, r3, #0\n\t"
  612. "str r4, [%[r], #40]\n\t"
  613. "mov r4, #0\n\t"
  614. /* A[4] * B[7] */
  615. "ldr r6, [%[a], #16]\n\t"
  616. "ldr r8, [%[b], #28]\n\t"
  617. "umull r6, r8, r6, r8\n\t"
  618. "adds r5, r5, r6\n\t"
  619. "adcs r3, r3, r8\n\t"
  620. "adc r4, r4, #0\n\t"
  621. /* A[5] * B[6] */
  622. "ldr r6, [%[a], #20]\n\t"
  623. "ldr r8, [%[b], #24]\n\t"
  624. "umull r6, r8, r6, r8\n\t"
  625. "adds r5, r5, r6\n\t"
  626. "adcs r3, r3, r8\n\t"
  627. "adc r4, r4, #0\n\t"
  628. /* A[6] * B[5] */
  629. "ldr r6, [%[a], #24]\n\t"
  630. "ldr r8, [%[b], #20]\n\t"
  631. "umull r6, r8, r6, r8\n\t"
  632. "adds r5, r5, r6\n\t"
  633. "adcs r3, r3, r8\n\t"
  634. "adc r4, r4, #0\n\t"
  635. /* A[7] * B[4] */
  636. "ldr r6, [%[a], #28]\n\t"
  637. "ldr r8, [%[b], #16]\n\t"
  638. "umull r6, r8, r6, r8\n\t"
  639. "adds r5, r5, r6\n\t"
  640. "adcs r3, r3, r8\n\t"
  641. "adc r4, r4, #0\n\t"
  642. "str r5, [%[r], #44]\n\t"
  643. "mov r5, #0\n\t"
  644. /* A[5] * B[7] */
  645. "ldr r6, [%[a], #20]\n\t"
  646. "ldr r8, [%[b], #28]\n\t"
  647. "umull r6, r8, r6, r8\n\t"
  648. "adds r3, r3, r6\n\t"
  649. "adcs r4, r4, r8\n\t"
  650. "adc r5, r5, #0\n\t"
  651. /* A[6] * B[6] */
  652. "ldr r6, [%[a], #24]\n\t"
  653. "ldr r8, [%[b], #24]\n\t"
  654. "umull r6, r8, r6, r8\n\t"
  655. "adds r3, r3, r6\n\t"
  656. "adcs r4, r4, r8\n\t"
  657. "adc r5, r5, #0\n\t"
  658. /* A[7] * B[5] */
  659. "ldr r6, [%[a], #28]\n\t"
  660. "ldr r8, [%[b], #20]\n\t"
  661. "umull r6, r8, r6, r8\n\t"
  662. "adds r3, r3, r6\n\t"
  663. "adcs r4, r4, r8\n\t"
  664. "adc r5, r5, #0\n\t"
  665. "str r3, [%[r], #48]\n\t"
  666. "mov r3, #0\n\t"
  667. /* A[6] * B[7] */
  668. "ldr r6, [%[a], #24]\n\t"
  669. "ldr r8, [%[b], #28]\n\t"
  670. "umull r6, r8, r6, r8\n\t"
  671. "adds r4, r4, r6\n\t"
  672. "adcs r5, r5, r8\n\t"
  673. "adc r3, r3, #0\n\t"
  674. /* A[7] * B[6] */
  675. "ldr r6, [%[a], #28]\n\t"
  676. "ldr r8, [%[b], #24]\n\t"
  677. "umull r6, r8, r6, r8\n\t"
  678. "adds r4, r4, r6\n\t"
  679. "adcs r5, r5, r8\n\t"
  680. "adc r3, r3, #0\n\t"
  681. "str r4, [%[r], #52]\n\t"
  682. "mov r4, #0\n\t"
  683. /* A[7] * B[7] */
  684. "ldr r6, [%[a], #28]\n\t"
  685. "ldr r8, [%[b], #28]\n\t"
  686. "umull r6, r8, r6, r8\n\t"
  687. "adds r5, r5, r6\n\t"
  688. "adc r3, r3, r8\n\t"
  689. "str r5, [%[r], #56]\n\t"
  690. "str r3, [%[r], #60]\n\t"
  691. /* Transfer tmp to r: all reads of a and b are done, so words 0..7 of r can be written. */
  692. "ldr r3, [%[tmp], #0]\n\t"
  693. "ldr r4, [%[tmp], #4]\n\t"
  694. "ldr r5, [%[tmp], #8]\n\t"
  695. "ldr r6, [%[tmp], #12]\n\t"
  696. "str r3, [%[r], #0]\n\t"
  697. "str r4, [%[r], #4]\n\t"
  698. "str r5, [%[r], #8]\n\t"
  699. "str r6, [%[r], #12]\n\t"
  700. "ldr r3, [%[tmp], #16]\n\t"
  701. "ldr r4, [%[tmp], #20]\n\t"
  702. "ldr r5, [%[tmp], #24]\n\t"
  703. "ldr r6, [%[tmp], #28]\n\t"
  704. "str r3, [%[r], #16]\n\t"
  705. "str r4, [%[r], #20]\n\t"
  706. "str r5, [%[r], #24]\n\t"
  707. "str r6, [%[r], #28]\n\t"
  708. :
  709. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [tmp] "r" (tmp)
  710. : "memory", "r3", "r4", "r5", "r6", "r8"
  711. );
  712. }
  713. /* Add b to a into r. (r = a + b)
  714. *
 * Adds eight words, two per load/store group, with the carry chained
 * through the whole sequence. The asm advances its own copies of the r, a
 * and b pointers as it goes.
 *
  715. * r A single precision integer. Receives the eight-word sum.
  716. * a A single precision integer.
  717. * b A single precision integer.
 *
 * Returns the carry out of the top word (0 or 1).
  718. */
  719. SP_NOINLINE static sp_digit sp_2048_add_8(sp_digit* r, const sp_digit* a,
  720. const sp_digit* b)
  721. {
  722. sp_digit c = 0;
  723. __asm__ __volatile__ (
  724. "ldm %[a]!, {r4, r5}\n\t"
  725. "ldm %[b]!, {r6, r8}\n\t"
  726. "adds r4, r4, r6\n\t"
  727. "adcs r5, r5, r8\n\t"
  728. "stm %[r]!, {r4, r5}\n\t"
  729. "ldm %[a]!, {r4, r5}\n\t"
  730. "ldm %[b]!, {r6, r8}\n\t"
  731. "adcs r4, r4, r6\n\t"
  732. "adcs r5, r5, r8\n\t"
  733. "stm %[r]!, {r4, r5}\n\t"
  734. "ldm %[a]!, {r4, r5}\n\t"
  735. "ldm %[b]!, {r6, r8}\n\t"
  736. "adcs r4, r4, r6\n\t"
  737. "adcs r5, r5, r8\n\t"
  738. "stm %[r]!, {r4, r5}\n\t"
  739. "ldm %[a]!, {r4, r5}\n\t"
  740. "ldm %[b]!, {r6, r8}\n\t"
  741. "adcs r4, r4, r6\n\t"
  742. "adcs r5, r5, r8\n\t"
  743. "stm %[r]!, {r4, r5}\n\t"
/* c = 0 + 0 + carry flag */
  744. "mov %[c], #0\n\t"
  745. "adc %[c], %[c], %[c]\n\t"
  746. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  747. :
  748. : "memory", "r4", "r5", "r6", "r8"
  749. );
  750. return c;
  751. }
  752. /* Sub b from a in place. (a = a - b)
  753. *
 * Subtracts sixteen words, two per load/store group, with the borrow
 * chained through the whole sequence. The asm advances its own copies of
 * the a and b pointers as it goes.
 *
  754. * a A single precision integer. Minuend on input; receives the difference.
  755. * b A single precision integer. The value subtracted.
  756. *
 * Returns c - c - borrow from the final sbc: 0 when the subtraction did not
 * borrow, otherwise a word with all bits set.
  757. */
  758. SP_NOINLINE static sp_digit sp_2048_sub_in_place_16(sp_digit* a,
  759. const sp_digit* b)
  760. {
  761. sp_digit c = 0;
  762. __asm__ __volatile__ (
  763. "ldm %[a], {r3, r4}\n\t"
  764. "ldm %[b]!, {r5, r6}\n\t"
  765. "subs r3, r3, r5\n\t"
  766. "sbcs r4, r4, r6\n\t"
  767. "stm %[a]!, {r3, r4}\n\t"
  768. "ldm %[a], {r3, r4}\n\t"
  769. "ldm %[b]!, {r5, r6}\n\t"
  770. "sbcs r3, r3, r5\n\t"
  771. "sbcs r4, r4, r6\n\t"
  772. "stm %[a]!, {r3, r4}\n\t"
  773. "ldm %[a], {r3, r4}\n\t"
  774. "ldm %[b]!, {r5, r6}\n\t"
  775. "sbcs r3, r3, r5\n\t"
  776. "sbcs r4, r4, r6\n\t"
  777. "stm %[a]!, {r3, r4}\n\t"
  778. "ldm %[a], {r3, r4}\n\t"
  779. "ldm %[b]!, {r5, r6}\n\t"
  780. "sbcs r3, r3, r5\n\t"
  781. "sbcs r4, r4, r6\n\t"
  782. "stm %[a]!, {r3, r4}\n\t"
  783. "ldm %[a], {r3, r4}\n\t"
  784. "ldm %[b]!, {r5, r6}\n\t"
  785. "sbcs r3, r3, r5\n\t"
  786. "sbcs r4, r4, r6\n\t"
  787. "stm %[a]!, {r3, r4}\n\t"
  788. "ldm %[a], {r3, r4}\n\t"
  789. "ldm %[b]!, {r5, r6}\n\t"
  790. "sbcs r3, r3, r5\n\t"
  791. "sbcs r4, r4, r6\n\t"
  792. "stm %[a]!, {r3, r4}\n\t"
  793. "ldm %[a], {r3, r4}\n\t"
  794. "ldm %[b]!, {r5, r6}\n\t"
  795. "sbcs r3, r3, r5\n\t"
  796. "sbcs r4, r4, r6\n\t"
  797. "stm %[a]!, {r3, r4}\n\t"
  798. "ldm %[a], {r3, r4}\n\t"
  799. "ldm %[b]!, {r5, r6}\n\t"
  800. "sbcs r3, r3, r5\n\t"
  801. "sbcs r4, r4, r6\n\t"
  802. "stm %[a]!, {r3, r4}\n\t"
  803. "sbc %[c], %[c], %[c]\n\t"
  804. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  805. :
  806. : "memory", "r3", "r4", "r5", "r6"
  807. );
  808. return c;
  809. }
  810. /* Add b to a into r. (r = a + b)
  811. *
 * Adds sixteen words, two per load/store group, with the carry chained
 * through the whole sequence. The asm advances its own copies of the r, a
 * and b pointers as it goes.
 *
  812. * r A single precision integer. Receives the sixteen-word sum.
  813. * a A single precision integer.
  814. * b A single precision integer.
 *
 * Returns the carry out of the top word (0 or 1).
  815. */
  816. SP_NOINLINE static sp_digit sp_2048_add_16(sp_digit* r, const sp_digit* a,
  817. const sp_digit* b)
  818. {
  819. sp_digit c = 0;
  820. __asm__ __volatile__ (
  821. "ldm %[a]!, {r4, r5}\n\t"
  822. "ldm %[b]!, {r6, r8}\n\t"
  823. "adds r4, r4, r6\n\t"
  824. "adcs r5, r5, r8\n\t"
  825. "stm %[r]!, {r4, r5}\n\t"
  826. "ldm %[a]!, {r4, r5}\n\t"
  827. "ldm %[b]!, {r6, r8}\n\t"
  828. "adcs r4, r4, r6\n\t"
  829. "adcs r5, r5, r8\n\t"
  830. "stm %[r]!, {r4, r5}\n\t"
  831. "ldm %[a]!, {r4, r5}\n\t"
  832. "ldm %[b]!, {r6, r8}\n\t"
  833. "adcs r4, r4, r6\n\t"
  834. "adcs r5, r5, r8\n\t"
  835. "stm %[r]!, {r4, r5}\n\t"
  836. "ldm %[a]!, {r4, r5}\n\t"
  837. "ldm %[b]!, {r6, r8}\n\t"
  838. "adcs r4, r4, r6\n\t"
  839. "adcs r5, r5, r8\n\t"
  840. "stm %[r]!, {r4, r5}\n\t"
  841. "ldm %[a]!, {r4, r5}\n\t"
  842. "ldm %[b]!, {r6, r8}\n\t"
  843. "adcs r4, r4, r6\n\t"
  844. "adcs r5, r5, r8\n\t"
  845. "stm %[r]!, {r4, r5}\n\t"
  846. "ldm %[a]!, {r4, r5}\n\t"
  847. "ldm %[b]!, {r6, r8}\n\t"
  848. "adcs r4, r4, r6\n\t"
  849. "adcs r5, r5, r8\n\t"
  850. "stm %[r]!, {r4, r5}\n\t"
  851. "ldm %[a]!, {r4, r5}\n\t"
  852. "ldm %[b]!, {r6, r8}\n\t"
  853. "adcs r4, r4, r6\n\t"
  854. "adcs r5, r5, r8\n\t"
  855. "stm %[r]!, {r4, r5}\n\t"
  856. "ldm %[a]!, {r4, r5}\n\t"
  857. "ldm %[b]!, {r6, r8}\n\t"
  858. "adcs r4, r4, r6\n\t"
  859. "adcs r5, r5, r8\n\t"
  860. "stm %[r]!, {r4, r5}\n\t"
/* c = 0 + 0 + carry flag */
  861. "mov %[c], #0\n\t"
  862. "adc %[c], %[c], %[c]\n\t"
  863. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  864. :
  865. : "memory", "r4", "r5", "r6", "r8"
  866. );
  867. return c;
  868. }
  869. /* AND m into each word of a and store in r.
  870. *
  871. * r A single precision integer.
  872. * a A single precision integer.
  873. * m Mask to AND against each digit.
  874. */
  875. static void sp_2048_mask_8(sp_digit* r, const sp_digit* a, sp_digit m)
  876. {
  877. #ifdef WOLFSSL_SP_SMALL
  878. int i;
  879. for (i=0; i<8; i++) {
  880. r[i] = a[i] & m;
  881. }
  882. #else
  883. r[0] = a[0] & m;
  884. r[1] = a[1] & m;
  885. r[2] = a[2] & m;
  886. r[3] = a[3] & m;
  887. r[4] = a[4] & m;
  888. r[5] = a[5] & m;
  889. r[6] = a[6] & m;
  890. r[7] = a[7] & m;
  891. #endif
  892. }
  893. /* Multiply a and b into r. (r = a * b)
  894. *
  895. * r A single precision integer.
  896. * a A single precision integer.
  897. * b A single precision integer.
  898. */
  899. SP_NOINLINE static void sp_2048_mul_16(sp_digit* r, const sp_digit* a,
  900. const sp_digit* b)
  901. {
  902. sp_digit* z0 = r;
  903. sp_digit z1[16];
  904. sp_digit a1[8];
  905. sp_digit b1[8];
  906. sp_digit* z2 = r + 16;
  907. sp_digit u;
  908. sp_digit ca;
  909. sp_digit cb;
  910. ca = sp_2048_add_8(a1, a, &a[8]);
  911. cb = sp_2048_add_8(b1, b, &b[8]);
  912. u = ca & cb;
  913. sp_2048_mul_8(z2, &a[8], &b[8]);
  914. sp_2048_mul_8(z0, a, b);
  915. sp_2048_mul_8(z1, a1, b1);
  916. u += sp_2048_sub_in_place_16(z1, z0);
  917. u += sp_2048_sub_in_place_16(z1, z2);
  918. sp_2048_mask_8(a1, a1, 0 - cb);
  919. u += sp_2048_add_8(z1 + 8, z1 + 8, a1);
  920. sp_2048_mask_8(b1, b1, 0 - ca);
  921. u += sp_2048_add_8(z1 + 8, z1 + 8, b1);
  922. u += sp_2048_add_16(r + 8, r + 8, z1);
  923. XMEMSET(a1 + 1, 0, sizeof(sp_digit) * (8 - 1));
  924. a1[0] = u;
  925. (void)sp_2048_add_8(r + 24, r + 24, a1);
  926. }
  927. /* Sub b from a in place. (a = a - b)
  928. *
 * Subtracts thirty-two words, two per load/store group, with the borrow
 * chained through the whole sequence. The asm advances its own copies of
 * the a and b pointers as it goes.
 *
  929. * a A single precision integer. Minuend on input; receives the difference.
  930. * b A single precision integer. The value subtracted.
  931. *
 * Returns c - c - borrow from the final sbc: 0 when the subtraction did not
 * borrow, otherwise a word with all bits set.
  932. */
  933. SP_NOINLINE static sp_digit sp_2048_sub_in_place_32(sp_digit* a,
  934. const sp_digit* b)
  935. {
  936. sp_digit c = 0;
  937. __asm__ __volatile__ (
  938. "ldm %[a], {r3, r4}\n\t"
  939. "ldm %[b]!, {r5, r6}\n\t"
  940. "subs r3, r3, r5\n\t"
  941. "sbcs r4, r4, r6\n\t"
  942. "stm %[a]!, {r3, r4}\n\t"
  943. "ldm %[a], {r3, r4}\n\t"
  944. "ldm %[b]!, {r5, r6}\n\t"
  945. "sbcs r3, r3, r5\n\t"
  946. "sbcs r4, r4, r6\n\t"
  947. "stm %[a]!, {r3, r4}\n\t"
  948. "ldm %[a], {r3, r4}\n\t"
  949. "ldm %[b]!, {r5, r6}\n\t"
  950. "sbcs r3, r3, r5\n\t"
  951. "sbcs r4, r4, r6\n\t"
  952. "stm %[a]!, {r3, r4}\n\t"
  953. "ldm %[a], {r3, r4}\n\t"
  954. "ldm %[b]!, {r5, r6}\n\t"
  955. "sbcs r3, r3, r5\n\t"
  956. "sbcs r4, r4, r6\n\t"
  957. "stm %[a]!, {r3, r4}\n\t"
  958. "ldm %[a], {r3, r4}\n\t"
  959. "ldm %[b]!, {r5, r6}\n\t"
  960. "sbcs r3, r3, r5\n\t"
  961. "sbcs r4, r4, r6\n\t"
  962. "stm %[a]!, {r3, r4}\n\t"
  963. "ldm %[a], {r3, r4}\n\t"
  964. "ldm %[b]!, {r5, r6}\n\t"
  965. "sbcs r3, r3, r5\n\t"
  966. "sbcs r4, r4, r6\n\t"
  967. "stm %[a]!, {r3, r4}\n\t"
  968. "ldm %[a], {r3, r4}\n\t"
  969. "ldm %[b]!, {r5, r6}\n\t"
  970. "sbcs r3, r3, r5\n\t"
  971. "sbcs r4, r4, r6\n\t"
  972. "stm %[a]!, {r3, r4}\n\t"
  973. "ldm %[a], {r3, r4}\n\t"
  974. "ldm %[b]!, {r5, r6}\n\t"
  975. "sbcs r3, r3, r5\n\t"
  976. "sbcs r4, r4, r6\n\t"
  977. "stm %[a]!, {r3, r4}\n\t"
  978. "ldm %[a], {r3, r4}\n\t"
  979. "ldm %[b]!, {r5, r6}\n\t"
  980. "sbcs r3, r3, r5\n\t"
  981. "sbcs r4, r4, r6\n\t"
  982. "stm %[a]!, {r3, r4}\n\t"
  983. "ldm %[a], {r3, r4}\n\t"
  984. "ldm %[b]!, {r5, r6}\n\t"
  985. "sbcs r3, r3, r5\n\t"
  986. "sbcs r4, r4, r6\n\t"
  987. "stm %[a]!, {r3, r4}\n\t"
  988. "ldm %[a], {r3, r4}\n\t"
  989. "ldm %[b]!, {r5, r6}\n\t"
  990. "sbcs r3, r3, r5\n\t"
  991. "sbcs r4, r4, r6\n\t"
  992. "stm %[a]!, {r3, r4}\n\t"
  993. "ldm %[a], {r3, r4}\n\t"
  994. "ldm %[b]!, {r5, r6}\n\t"
  995. "sbcs r3, r3, r5\n\t"
  996. "sbcs r4, r4, r6\n\t"
  997. "stm %[a]!, {r3, r4}\n\t"
  998. "ldm %[a], {r3, r4}\n\t"
  999. "ldm %[b]!, {r5, r6}\n\t"
  1000. "sbcs r3, r3, r5\n\t"
  1001. "sbcs r4, r4, r6\n\t"
  1002. "stm %[a]!, {r3, r4}\n\t"
  1003. "ldm %[a], {r3, r4}\n\t"
  1004. "ldm %[b]!, {r5, r6}\n\t"
  1005. "sbcs r3, r3, r5\n\t"
  1006. "sbcs r4, r4, r6\n\t"
  1007. "stm %[a]!, {r3, r4}\n\t"
  1008. "ldm %[a], {r3, r4}\n\t"
  1009. "ldm %[b]!, {r5, r6}\n\t"
  1010. "sbcs r3, r3, r5\n\t"
  1011. "sbcs r4, r4, r6\n\t"
  1012. "stm %[a]!, {r3, r4}\n\t"
  1013. "ldm %[a], {r3, r4}\n\t"
  1014. "ldm %[b]!, {r5, r6}\n\t"
  1015. "sbcs r3, r3, r5\n\t"
  1016. "sbcs r4, r4, r6\n\t"
  1017. "stm %[a]!, {r3, r4}\n\t"
  1018. "sbc %[c], %[c], %[c]\n\t"
  1019. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  1020. :
  1021. : "memory", "r3", "r4", "r5", "r6"
  1022. );
  1023. return c;
  1024. }
  1025. /* Add b to a into r. (r = a + b)
  1026. *
  1027. * r A single precision integer.
  1028. * a A single precision integer.
  1029. * b A single precision integer.
  1030. */
  1031. SP_NOINLINE static sp_digit sp_2048_add_32(sp_digit* r, const sp_digit* a,
  1032. const sp_digit* b)
  1033. {
  1034. sp_digit c = 0;
  1035. __asm__ __volatile__ (
  1036. "ldm %[a]!, {r4, r5}\n\t"
  1037. "ldm %[b]!, {r6, r8}\n\t"
  1038. "adds r4, r4, r6\n\t"
  1039. "adcs r5, r5, r8\n\t"
  1040. "stm %[r]!, {r4, r5}\n\t"
  1041. "ldm %[a]!, {r4, r5}\n\t"
  1042. "ldm %[b]!, {r6, r8}\n\t"
  1043. "adcs r4, r4, r6\n\t"
  1044. "adcs r5, r5, r8\n\t"
  1045. "stm %[r]!, {r4, r5}\n\t"
  1046. "ldm %[a]!, {r4, r5}\n\t"
  1047. "ldm %[b]!, {r6, r8}\n\t"
  1048. "adcs r4, r4, r6\n\t"
  1049. "adcs r5, r5, r8\n\t"
  1050. "stm %[r]!, {r4, r5}\n\t"
  1051. "ldm %[a]!, {r4, r5}\n\t"
  1052. "ldm %[b]!, {r6, r8}\n\t"
  1053. "adcs r4, r4, r6\n\t"
  1054. "adcs r5, r5, r8\n\t"
  1055. "stm %[r]!, {r4, r5}\n\t"
  1056. "ldm %[a]!, {r4, r5}\n\t"
  1057. "ldm %[b]!, {r6, r8}\n\t"
  1058. "adcs r4, r4, r6\n\t"
  1059. "adcs r5, r5, r8\n\t"
  1060. "stm %[r]!, {r4, r5}\n\t"
  1061. "ldm %[a]!, {r4, r5}\n\t"
  1062. "ldm %[b]!, {r6, r8}\n\t"
  1063. "adcs r4, r4, r6\n\t"
  1064. "adcs r5, r5, r8\n\t"
  1065. "stm %[r]!, {r4, r5}\n\t"
  1066. "ldm %[a]!, {r4, r5}\n\t"
  1067. "ldm %[b]!, {r6, r8}\n\t"
  1068. "adcs r4, r4, r6\n\t"
  1069. "adcs r5, r5, r8\n\t"
  1070. "stm %[r]!, {r4, r5}\n\t"
  1071. "ldm %[a]!, {r4, r5}\n\t"
  1072. "ldm %[b]!, {r6, r8}\n\t"
  1073. "adcs r4, r4, r6\n\t"
  1074. "adcs r5, r5, r8\n\t"
  1075. "stm %[r]!, {r4, r5}\n\t"
  1076. "ldm %[a]!, {r4, r5}\n\t"
  1077. "ldm %[b]!, {r6, r8}\n\t"
  1078. "adcs r4, r4, r6\n\t"
  1079. "adcs r5, r5, r8\n\t"
  1080. "stm %[r]!, {r4, r5}\n\t"
  1081. "ldm %[a]!, {r4, r5}\n\t"
  1082. "ldm %[b]!, {r6, r8}\n\t"
  1083. "adcs r4, r4, r6\n\t"
  1084. "adcs r5, r5, r8\n\t"
  1085. "stm %[r]!, {r4, r5}\n\t"
  1086. "ldm %[a]!, {r4, r5}\n\t"
  1087. "ldm %[b]!, {r6, r8}\n\t"
  1088. "adcs r4, r4, r6\n\t"
  1089. "adcs r5, r5, r8\n\t"
  1090. "stm %[r]!, {r4, r5}\n\t"
  1091. "ldm %[a]!, {r4, r5}\n\t"
  1092. "ldm %[b]!, {r6, r8}\n\t"
  1093. "adcs r4, r4, r6\n\t"
  1094. "adcs r5, r5, r8\n\t"
  1095. "stm %[r]!, {r4, r5}\n\t"
  1096. "ldm %[a]!, {r4, r5}\n\t"
  1097. "ldm %[b]!, {r6, r8}\n\t"
  1098. "adcs r4, r4, r6\n\t"
  1099. "adcs r5, r5, r8\n\t"
  1100. "stm %[r]!, {r4, r5}\n\t"
  1101. "ldm %[a]!, {r4, r5}\n\t"
  1102. "ldm %[b]!, {r6, r8}\n\t"
  1103. "adcs r4, r4, r6\n\t"
  1104. "adcs r5, r5, r8\n\t"
  1105. "stm %[r]!, {r4, r5}\n\t"
  1106. "ldm %[a]!, {r4, r5}\n\t"
  1107. "ldm %[b]!, {r6, r8}\n\t"
  1108. "adcs r4, r4, r6\n\t"
  1109. "adcs r5, r5, r8\n\t"
  1110. "stm %[r]!, {r4, r5}\n\t"
  1111. "ldm %[a]!, {r4, r5}\n\t"
  1112. "ldm %[b]!, {r6, r8}\n\t"
  1113. "adcs r4, r4, r6\n\t"
  1114. "adcs r5, r5, r8\n\t"
  1115. "stm %[r]!, {r4, r5}\n\t"
  1116. "mov %[c], #0\n\t"
  1117. "adc %[c], %[c], %[c]\n\t"
  1118. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  1119. :
  1120. : "memory", "r4", "r5", "r6", "r8"
  1121. );
  1122. return c;
  1123. }
  1124. /* AND m into each word of a and store in r.
  1125. *
  1126. * r A single precision integer.
  1127. * a A single precision integer.
  1128. * m Mask to AND against each digit.
  1129. */
  1130. static void sp_2048_mask_16(sp_digit* r, const sp_digit* a, sp_digit m)
  1131. {
  1132. #ifdef WOLFSSL_SP_SMALL
  1133. int i;
  1134. for (i=0; i<16; i++) {
  1135. r[i] = a[i] & m;
  1136. }
  1137. #else
  1138. int i;
  1139. for (i = 0; i < 16; i += 8) {
  1140. r[i+0] = a[i+0] & m;
  1141. r[i+1] = a[i+1] & m;
  1142. r[i+2] = a[i+2] & m;
  1143. r[i+3] = a[i+3] & m;
  1144. r[i+4] = a[i+4] & m;
  1145. r[i+5] = a[i+5] & m;
  1146. r[i+6] = a[i+6] & m;
  1147. r[i+7] = a[i+7] & m;
  1148. }
  1149. #endif
  1150. }
  1151. /* Multiply a and b into r. (r = a * b)
  1152. *
  1153. * r A single precision integer.
  1154. * a A single precision integer.
  1155. * b A single precision integer.
  1156. */
  1157. SP_NOINLINE static void sp_2048_mul_32(sp_digit* r, const sp_digit* a,
  1158. const sp_digit* b)
  1159. {
  1160. sp_digit* z0 = r;
  1161. sp_digit z1[32];
  1162. sp_digit a1[16];
  1163. sp_digit b1[16];
  1164. sp_digit* z2 = r + 32;
  1165. sp_digit u;
  1166. sp_digit ca;
  1167. sp_digit cb;
  1168. ca = sp_2048_add_16(a1, a, &a[16]);
  1169. cb = sp_2048_add_16(b1, b, &b[16]);
  1170. u = ca & cb;
  1171. sp_2048_mul_16(z2, &a[16], &b[16]);
  1172. sp_2048_mul_16(z0, a, b);
  1173. sp_2048_mul_16(z1, a1, b1);
  1174. u += sp_2048_sub_in_place_32(z1, z0);
  1175. u += sp_2048_sub_in_place_32(z1, z2);
  1176. sp_2048_mask_16(a1, a1, 0 - cb);
  1177. u += sp_2048_add_16(z1 + 16, z1 + 16, a1);
  1178. sp_2048_mask_16(b1, b1, 0 - ca);
  1179. u += sp_2048_add_16(z1 + 16, z1 + 16, b1);
  1180. u += sp_2048_add_32(r + 16, r + 16, z1);
  1181. XMEMSET(a1 + 1, 0, sizeof(sp_digit) * (16 - 1));
  1182. a1[0] = u;
  1183. (void)sp_2048_add_16(r + 48, r + 48, a1);
  1184. }
  1185. /* Sub b from a into r. (r = a - b)
  1186. *
  1187. * r A single precision integer.
  1188. * a A single precision integer.
  1189. * b A single precision integer.
  1190. */
  1191. SP_NOINLINE static sp_digit sp_2048_sub_in_place_64(sp_digit* a,
  1192. const sp_digit* b)
  1193. {
  1194. sp_digit c = 0;
  1195. __asm__ __volatile__ (
  1196. "ldm %[a], {r3, r4}\n\t"
  1197. "ldm %[b]!, {r5, r6}\n\t"
  1198. "subs r3, r3, r5\n\t"
  1199. "sbcs r4, r4, r6\n\t"
  1200. "stm %[a]!, {r3, r4}\n\t"
  1201. "ldm %[a], {r3, r4}\n\t"
  1202. "ldm %[b]!, {r5, r6}\n\t"
  1203. "sbcs r3, r3, r5\n\t"
  1204. "sbcs r4, r4, r6\n\t"
  1205. "stm %[a]!, {r3, r4}\n\t"
  1206. "ldm %[a], {r3, r4}\n\t"
  1207. "ldm %[b]!, {r5, r6}\n\t"
  1208. "sbcs r3, r3, r5\n\t"
  1209. "sbcs r4, r4, r6\n\t"
  1210. "stm %[a]!, {r3, r4}\n\t"
  1211. "ldm %[a], {r3, r4}\n\t"
  1212. "ldm %[b]!, {r5, r6}\n\t"
  1213. "sbcs r3, r3, r5\n\t"
  1214. "sbcs r4, r4, r6\n\t"
  1215. "stm %[a]!, {r3, r4}\n\t"
  1216. "ldm %[a], {r3, r4}\n\t"
  1217. "ldm %[b]!, {r5, r6}\n\t"
  1218. "sbcs r3, r3, r5\n\t"
  1219. "sbcs r4, r4, r6\n\t"
  1220. "stm %[a]!, {r3, r4}\n\t"
  1221. "ldm %[a], {r3, r4}\n\t"
  1222. "ldm %[b]!, {r5, r6}\n\t"
  1223. "sbcs r3, r3, r5\n\t"
  1224. "sbcs r4, r4, r6\n\t"
  1225. "stm %[a]!, {r3, r4}\n\t"
  1226. "ldm %[a], {r3, r4}\n\t"
  1227. "ldm %[b]!, {r5, r6}\n\t"
  1228. "sbcs r3, r3, r5\n\t"
  1229. "sbcs r4, r4, r6\n\t"
  1230. "stm %[a]!, {r3, r4}\n\t"
  1231. "ldm %[a], {r3, r4}\n\t"
  1232. "ldm %[b]!, {r5, r6}\n\t"
  1233. "sbcs r3, r3, r5\n\t"
  1234. "sbcs r4, r4, r6\n\t"
  1235. "stm %[a]!, {r3, r4}\n\t"
  1236. "ldm %[a], {r3, r4}\n\t"
  1237. "ldm %[b]!, {r5, r6}\n\t"
  1238. "sbcs r3, r3, r5\n\t"
  1239. "sbcs r4, r4, r6\n\t"
  1240. "stm %[a]!, {r3, r4}\n\t"
  1241. "ldm %[a], {r3, r4}\n\t"
  1242. "ldm %[b]!, {r5, r6}\n\t"
  1243. "sbcs r3, r3, r5\n\t"
  1244. "sbcs r4, r4, r6\n\t"
  1245. "stm %[a]!, {r3, r4}\n\t"
  1246. "ldm %[a], {r3, r4}\n\t"
  1247. "ldm %[b]!, {r5, r6}\n\t"
  1248. "sbcs r3, r3, r5\n\t"
  1249. "sbcs r4, r4, r6\n\t"
  1250. "stm %[a]!, {r3, r4}\n\t"
  1251. "ldm %[a], {r3, r4}\n\t"
  1252. "ldm %[b]!, {r5, r6}\n\t"
  1253. "sbcs r3, r3, r5\n\t"
  1254. "sbcs r4, r4, r6\n\t"
  1255. "stm %[a]!, {r3, r4}\n\t"
  1256. "ldm %[a], {r3, r4}\n\t"
  1257. "ldm %[b]!, {r5, r6}\n\t"
  1258. "sbcs r3, r3, r5\n\t"
  1259. "sbcs r4, r4, r6\n\t"
  1260. "stm %[a]!, {r3, r4}\n\t"
  1261. "ldm %[a], {r3, r4}\n\t"
  1262. "ldm %[b]!, {r5, r6}\n\t"
  1263. "sbcs r3, r3, r5\n\t"
  1264. "sbcs r4, r4, r6\n\t"
  1265. "stm %[a]!, {r3, r4}\n\t"
  1266. "ldm %[a], {r3, r4}\n\t"
  1267. "ldm %[b]!, {r5, r6}\n\t"
  1268. "sbcs r3, r3, r5\n\t"
  1269. "sbcs r4, r4, r6\n\t"
  1270. "stm %[a]!, {r3, r4}\n\t"
  1271. "ldm %[a], {r3, r4}\n\t"
  1272. "ldm %[b]!, {r5, r6}\n\t"
  1273. "sbcs r3, r3, r5\n\t"
  1274. "sbcs r4, r4, r6\n\t"
  1275. "stm %[a]!, {r3, r4}\n\t"
  1276. "ldm %[a], {r3, r4}\n\t"
  1277. "ldm %[b]!, {r5, r6}\n\t"
  1278. "sbcs r3, r3, r5\n\t"
  1279. "sbcs r4, r4, r6\n\t"
  1280. "stm %[a]!, {r3, r4}\n\t"
  1281. "ldm %[a], {r3, r4}\n\t"
  1282. "ldm %[b]!, {r5, r6}\n\t"
  1283. "sbcs r3, r3, r5\n\t"
  1284. "sbcs r4, r4, r6\n\t"
  1285. "stm %[a]!, {r3, r4}\n\t"
  1286. "ldm %[a], {r3, r4}\n\t"
  1287. "ldm %[b]!, {r5, r6}\n\t"
  1288. "sbcs r3, r3, r5\n\t"
  1289. "sbcs r4, r4, r6\n\t"
  1290. "stm %[a]!, {r3, r4}\n\t"
  1291. "ldm %[a], {r3, r4}\n\t"
  1292. "ldm %[b]!, {r5, r6}\n\t"
  1293. "sbcs r3, r3, r5\n\t"
  1294. "sbcs r4, r4, r6\n\t"
  1295. "stm %[a]!, {r3, r4}\n\t"
  1296. "ldm %[a], {r3, r4}\n\t"
  1297. "ldm %[b]!, {r5, r6}\n\t"
  1298. "sbcs r3, r3, r5\n\t"
  1299. "sbcs r4, r4, r6\n\t"
  1300. "stm %[a]!, {r3, r4}\n\t"
  1301. "ldm %[a], {r3, r4}\n\t"
  1302. "ldm %[b]!, {r5, r6}\n\t"
  1303. "sbcs r3, r3, r5\n\t"
  1304. "sbcs r4, r4, r6\n\t"
  1305. "stm %[a]!, {r3, r4}\n\t"
  1306. "ldm %[a], {r3, r4}\n\t"
  1307. "ldm %[b]!, {r5, r6}\n\t"
  1308. "sbcs r3, r3, r5\n\t"
  1309. "sbcs r4, r4, r6\n\t"
  1310. "stm %[a]!, {r3, r4}\n\t"
  1311. "ldm %[a], {r3, r4}\n\t"
  1312. "ldm %[b]!, {r5, r6}\n\t"
  1313. "sbcs r3, r3, r5\n\t"
  1314. "sbcs r4, r4, r6\n\t"
  1315. "stm %[a]!, {r3, r4}\n\t"
  1316. "ldm %[a], {r3, r4}\n\t"
  1317. "ldm %[b]!, {r5, r6}\n\t"
  1318. "sbcs r3, r3, r5\n\t"
  1319. "sbcs r4, r4, r6\n\t"
  1320. "stm %[a]!, {r3, r4}\n\t"
  1321. "ldm %[a], {r3, r4}\n\t"
  1322. "ldm %[b]!, {r5, r6}\n\t"
  1323. "sbcs r3, r3, r5\n\t"
  1324. "sbcs r4, r4, r6\n\t"
  1325. "stm %[a]!, {r3, r4}\n\t"
  1326. "ldm %[a], {r3, r4}\n\t"
  1327. "ldm %[b]!, {r5, r6}\n\t"
  1328. "sbcs r3, r3, r5\n\t"
  1329. "sbcs r4, r4, r6\n\t"
  1330. "stm %[a]!, {r3, r4}\n\t"
  1331. "ldm %[a], {r3, r4}\n\t"
  1332. "ldm %[b]!, {r5, r6}\n\t"
  1333. "sbcs r3, r3, r5\n\t"
  1334. "sbcs r4, r4, r6\n\t"
  1335. "stm %[a]!, {r3, r4}\n\t"
  1336. "ldm %[a], {r3, r4}\n\t"
  1337. "ldm %[b]!, {r5, r6}\n\t"
  1338. "sbcs r3, r3, r5\n\t"
  1339. "sbcs r4, r4, r6\n\t"
  1340. "stm %[a]!, {r3, r4}\n\t"
  1341. "ldm %[a], {r3, r4}\n\t"
  1342. "ldm %[b]!, {r5, r6}\n\t"
  1343. "sbcs r3, r3, r5\n\t"
  1344. "sbcs r4, r4, r6\n\t"
  1345. "stm %[a]!, {r3, r4}\n\t"
  1346. "ldm %[a], {r3, r4}\n\t"
  1347. "ldm %[b]!, {r5, r6}\n\t"
  1348. "sbcs r3, r3, r5\n\t"
  1349. "sbcs r4, r4, r6\n\t"
  1350. "stm %[a]!, {r3, r4}\n\t"
  1351. "ldm %[a], {r3, r4}\n\t"
  1352. "ldm %[b]!, {r5, r6}\n\t"
  1353. "sbcs r3, r3, r5\n\t"
  1354. "sbcs r4, r4, r6\n\t"
  1355. "stm %[a]!, {r3, r4}\n\t"
  1356. "sbc %[c], %[c], %[c]\n\t"
  1357. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  1358. :
  1359. : "memory", "r3", "r4", "r5", "r6"
  1360. );
  1361. return c;
  1362. }
  1363. /* Add b to a into r. (r = a + b)
  1364. *
  1365. * r A single precision integer.
  1366. * a A single precision integer.
  1367. * b A single precision integer.
  1368. */
  1369. SP_NOINLINE static sp_digit sp_2048_add_64(sp_digit* r, const sp_digit* a,
  1370. const sp_digit* b)
  1371. {
  1372. sp_digit c = 0;
  1373. __asm__ __volatile__ (
  1374. "ldm %[a]!, {r4, r5}\n\t"
  1375. "ldm %[b]!, {r6, r8}\n\t"
  1376. "adds r4, r4, r6\n\t"
  1377. "adcs r5, r5, r8\n\t"
  1378. "stm %[r]!, {r4, r5}\n\t"
  1379. "ldm %[a]!, {r4, r5}\n\t"
  1380. "ldm %[b]!, {r6, r8}\n\t"
  1381. "adcs r4, r4, r6\n\t"
  1382. "adcs r5, r5, r8\n\t"
  1383. "stm %[r]!, {r4, r5}\n\t"
  1384. "ldm %[a]!, {r4, r5}\n\t"
  1385. "ldm %[b]!, {r6, r8}\n\t"
  1386. "adcs r4, r4, r6\n\t"
  1387. "adcs r5, r5, r8\n\t"
  1388. "stm %[r]!, {r4, r5}\n\t"
  1389. "ldm %[a]!, {r4, r5}\n\t"
  1390. "ldm %[b]!, {r6, r8}\n\t"
  1391. "adcs r4, r4, r6\n\t"
  1392. "adcs r5, r5, r8\n\t"
  1393. "stm %[r]!, {r4, r5}\n\t"
  1394. "ldm %[a]!, {r4, r5}\n\t"
  1395. "ldm %[b]!, {r6, r8}\n\t"
  1396. "adcs r4, r4, r6\n\t"
  1397. "adcs r5, r5, r8\n\t"
  1398. "stm %[r]!, {r4, r5}\n\t"
  1399. "ldm %[a]!, {r4, r5}\n\t"
  1400. "ldm %[b]!, {r6, r8}\n\t"
  1401. "adcs r4, r4, r6\n\t"
  1402. "adcs r5, r5, r8\n\t"
  1403. "stm %[r]!, {r4, r5}\n\t"
  1404. "ldm %[a]!, {r4, r5}\n\t"
  1405. "ldm %[b]!, {r6, r8}\n\t"
  1406. "adcs r4, r4, r6\n\t"
  1407. "adcs r5, r5, r8\n\t"
  1408. "stm %[r]!, {r4, r5}\n\t"
  1409. "ldm %[a]!, {r4, r5}\n\t"
  1410. "ldm %[b]!, {r6, r8}\n\t"
  1411. "adcs r4, r4, r6\n\t"
  1412. "adcs r5, r5, r8\n\t"
  1413. "stm %[r]!, {r4, r5}\n\t"
  1414. "ldm %[a]!, {r4, r5}\n\t"
  1415. "ldm %[b]!, {r6, r8}\n\t"
  1416. "adcs r4, r4, r6\n\t"
  1417. "adcs r5, r5, r8\n\t"
  1418. "stm %[r]!, {r4, r5}\n\t"
  1419. "ldm %[a]!, {r4, r5}\n\t"
  1420. "ldm %[b]!, {r6, r8}\n\t"
  1421. "adcs r4, r4, r6\n\t"
  1422. "adcs r5, r5, r8\n\t"
  1423. "stm %[r]!, {r4, r5}\n\t"
  1424. "ldm %[a]!, {r4, r5}\n\t"
  1425. "ldm %[b]!, {r6, r8}\n\t"
  1426. "adcs r4, r4, r6\n\t"
  1427. "adcs r5, r5, r8\n\t"
  1428. "stm %[r]!, {r4, r5}\n\t"
  1429. "ldm %[a]!, {r4, r5}\n\t"
  1430. "ldm %[b]!, {r6, r8}\n\t"
  1431. "adcs r4, r4, r6\n\t"
  1432. "adcs r5, r5, r8\n\t"
  1433. "stm %[r]!, {r4, r5}\n\t"
  1434. "ldm %[a]!, {r4, r5}\n\t"
  1435. "ldm %[b]!, {r6, r8}\n\t"
  1436. "adcs r4, r4, r6\n\t"
  1437. "adcs r5, r5, r8\n\t"
  1438. "stm %[r]!, {r4, r5}\n\t"
  1439. "ldm %[a]!, {r4, r5}\n\t"
  1440. "ldm %[b]!, {r6, r8}\n\t"
  1441. "adcs r4, r4, r6\n\t"
  1442. "adcs r5, r5, r8\n\t"
  1443. "stm %[r]!, {r4, r5}\n\t"
  1444. "ldm %[a]!, {r4, r5}\n\t"
  1445. "ldm %[b]!, {r6, r8}\n\t"
  1446. "adcs r4, r4, r6\n\t"
  1447. "adcs r5, r5, r8\n\t"
  1448. "stm %[r]!, {r4, r5}\n\t"
  1449. "ldm %[a]!, {r4, r5}\n\t"
  1450. "ldm %[b]!, {r6, r8}\n\t"
  1451. "adcs r4, r4, r6\n\t"
  1452. "adcs r5, r5, r8\n\t"
  1453. "stm %[r]!, {r4, r5}\n\t"
  1454. "ldm %[a]!, {r4, r5}\n\t"
  1455. "ldm %[b]!, {r6, r8}\n\t"
  1456. "adcs r4, r4, r6\n\t"
  1457. "adcs r5, r5, r8\n\t"
  1458. "stm %[r]!, {r4, r5}\n\t"
  1459. "ldm %[a]!, {r4, r5}\n\t"
  1460. "ldm %[b]!, {r6, r8}\n\t"
  1461. "adcs r4, r4, r6\n\t"
  1462. "adcs r5, r5, r8\n\t"
  1463. "stm %[r]!, {r4, r5}\n\t"
  1464. "ldm %[a]!, {r4, r5}\n\t"
  1465. "ldm %[b]!, {r6, r8}\n\t"
  1466. "adcs r4, r4, r6\n\t"
  1467. "adcs r5, r5, r8\n\t"
  1468. "stm %[r]!, {r4, r5}\n\t"
  1469. "ldm %[a]!, {r4, r5}\n\t"
  1470. "ldm %[b]!, {r6, r8}\n\t"
  1471. "adcs r4, r4, r6\n\t"
  1472. "adcs r5, r5, r8\n\t"
  1473. "stm %[r]!, {r4, r5}\n\t"
  1474. "ldm %[a]!, {r4, r5}\n\t"
  1475. "ldm %[b]!, {r6, r8}\n\t"
  1476. "adcs r4, r4, r6\n\t"
  1477. "adcs r5, r5, r8\n\t"
  1478. "stm %[r]!, {r4, r5}\n\t"
  1479. "ldm %[a]!, {r4, r5}\n\t"
  1480. "ldm %[b]!, {r6, r8}\n\t"
  1481. "adcs r4, r4, r6\n\t"
  1482. "adcs r5, r5, r8\n\t"
  1483. "stm %[r]!, {r4, r5}\n\t"
  1484. "ldm %[a]!, {r4, r5}\n\t"
  1485. "ldm %[b]!, {r6, r8}\n\t"
  1486. "adcs r4, r4, r6\n\t"
  1487. "adcs r5, r5, r8\n\t"
  1488. "stm %[r]!, {r4, r5}\n\t"
  1489. "ldm %[a]!, {r4, r5}\n\t"
  1490. "ldm %[b]!, {r6, r8}\n\t"
  1491. "adcs r4, r4, r6\n\t"
  1492. "adcs r5, r5, r8\n\t"
  1493. "stm %[r]!, {r4, r5}\n\t"
  1494. "ldm %[a]!, {r4, r5}\n\t"
  1495. "ldm %[b]!, {r6, r8}\n\t"
  1496. "adcs r4, r4, r6\n\t"
  1497. "adcs r5, r5, r8\n\t"
  1498. "stm %[r]!, {r4, r5}\n\t"
  1499. "ldm %[a]!, {r4, r5}\n\t"
  1500. "ldm %[b]!, {r6, r8}\n\t"
  1501. "adcs r4, r4, r6\n\t"
  1502. "adcs r5, r5, r8\n\t"
  1503. "stm %[r]!, {r4, r5}\n\t"
  1504. "ldm %[a]!, {r4, r5}\n\t"
  1505. "ldm %[b]!, {r6, r8}\n\t"
  1506. "adcs r4, r4, r6\n\t"
  1507. "adcs r5, r5, r8\n\t"
  1508. "stm %[r]!, {r4, r5}\n\t"
  1509. "ldm %[a]!, {r4, r5}\n\t"
  1510. "ldm %[b]!, {r6, r8}\n\t"
  1511. "adcs r4, r4, r6\n\t"
  1512. "adcs r5, r5, r8\n\t"
  1513. "stm %[r]!, {r4, r5}\n\t"
  1514. "ldm %[a]!, {r4, r5}\n\t"
  1515. "ldm %[b]!, {r6, r8}\n\t"
  1516. "adcs r4, r4, r6\n\t"
  1517. "adcs r5, r5, r8\n\t"
  1518. "stm %[r]!, {r4, r5}\n\t"
  1519. "ldm %[a]!, {r4, r5}\n\t"
  1520. "ldm %[b]!, {r6, r8}\n\t"
  1521. "adcs r4, r4, r6\n\t"
  1522. "adcs r5, r5, r8\n\t"
  1523. "stm %[r]!, {r4, r5}\n\t"
  1524. "ldm %[a]!, {r4, r5}\n\t"
  1525. "ldm %[b]!, {r6, r8}\n\t"
  1526. "adcs r4, r4, r6\n\t"
  1527. "adcs r5, r5, r8\n\t"
  1528. "stm %[r]!, {r4, r5}\n\t"
  1529. "ldm %[a]!, {r4, r5}\n\t"
  1530. "ldm %[b]!, {r6, r8}\n\t"
  1531. "adcs r4, r4, r6\n\t"
  1532. "adcs r5, r5, r8\n\t"
  1533. "stm %[r]!, {r4, r5}\n\t"
  1534. "mov %[c], #0\n\t"
  1535. "adc %[c], %[c], %[c]\n\t"
  1536. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  1537. :
  1538. : "memory", "r4", "r5", "r6", "r8"
  1539. );
  1540. return c;
  1541. }
  1542. /* AND m into each word of a and store in r.
  1543. *
  1544. * r A single precision integer.
  1545. * a A single precision integer.
  1546. * m Mask to AND against each digit.
  1547. */
  1548. static void sp_2048_mask_32(sp_digit* r, const sp_digit* a, sp_digit m)
  1549. {
  1550. #ifdef WOLFSSL_SP_SMALL
  1551. int i;
  1552. for (i=0; i<32; i++) {
  1553. r[i] = a[i] & m;
  1554. }
  1555. #else
  1556. int i;
  1557. for (i = 0; i < 32; i += 8) {
  1558. r[i+0] = a[i+0] & m;
  1559. r[i+1] = a[i+1] & m;
  1560. r[i+2] = a[i+2] & m;
  1561. r[i+3] = a[i+3] & m;
  1562. r[i+4] = a[i+4] & m;
  1563. r[i+5] = a[i+5] & m;
  1564. r[i+6] = a[i+6] & m;
  1565. r[i+7] = a[i+7] & m;
  1566. }
  1567. #endif
  1568. }
  1569. /* Multiply a and b into r. (r = a * b)
  1570. *
  1571. * r A single precision integer.
  1572. * a A single precision integer.
  1573. * b A single precision integer.
  1574. */
  1575. SP_NOINLINE static void sp_2048_mul_64(sp_digit* r, const sp_digit* a,
  1576. const sp_digit* b)
  1577. {
  1578. sp_digit* z0 = r;
  1579. sp_digit z1[64];
  1580. sp_digit a1[32];
  1581. sp_digit b1[32];
  1582. sp_digit* z2 = r + 64;
  1583. sp_digit u;
  1584. sp_digit ca;
  1585. sp_digit cb;
  1586. ca = sp_2048_add_32(a1, a, &a[32]);
  1587. cb = sp_2048_add_32(b1, b, &b[32]);
  1588. u = ca & cb;
  1589. sp_2048_mul_32(z2, &a[32], &b[32]);
  1590. sp_2048_mul_32(z0, a, b);
  1591. sp_2048_mul_32(z1, a1, b1);
  1592. u += sp_2048_sub_in_place_64(z1, z0);
  1593. u += sp_2048_sub_in_place_64(z1, z2);
  1594. sp_2048_mask_32(a1, a1, 0 - cb);
  1595. u += sp_2048_add_32(z1 + 32, z1 + 32, a1);
  1596. sp_2048_mask_32(b1, b1, 0 - ca);
  1597. u += sp_2048_add_32(z1 + 32, z1 + 32, b1);
  1598. u += sp_2048_add_64(r + 32, r + 32, z1);
  1599. XMEMSET(a1 + 1, 0, sizeof(sp_digit) * (32 - 1));
  1600. a1[0] = u;
  1601. (void)sp_2048_add_32(r + 96, r + 96, a1);
  1602. }
  1603. /* Square a and put result in r. (r = a * a)
  1604. *
  1605. * r A single precision integer.
  1606. * a A single precision integer.
  1607. */
  1608. SP_NOINLINE static void sp_2048_sqr_8(sp_digit* r, const sp_digit* a)
  1609. {
  1610. sp_digit tmp_arr[8];
  1611. sp_digit* tmp = tmp_arr;
  1612. __asm__ __volatile__ (
  1613. /* A[0] * A[0] */
  1614. "ldr r6, [%[a], #0]\n\t"
  1615. "umull r3, r4, r6, r6\n\t"
  1616. "mov r5, #0\n\t"
  1617. "str r3, [%[tmp], #0]\n\t"
  1618. "mov r3, #0\n\t"
  1619. /* A[0] * A[1] */
  1620. "ldr r8, [%[a], #4]\n\t"
  1621. "umull r6, r8, r6, r8\n\t"
  1622. "adds r4, r4, r6\n\t"
  1623. "adc r5, r5, r8\n\t"
  1624. "adds r4, r4, r6\n\t"
  1625. "adcs r5, r5, r8\n\t"
  1626. "adc r3, r3, #0\n\t"
  1627. "str r4, [%[tmp], #4]\n\t"
  1628. "mov r4, #0\n\t"
  1629. /* A[0] * A[2] */
  1630. "ldr r6, [%[a], #0]\n\t"
  1631. "ldr r8, [%[a], #8]\n\t"
  1632. "umull r6, r8, r6, r8\n\t"
  1633. "adds r5, r5, r6\n\t"
  1634. "adc r3, r3, r8\n\t"
  1635. "adds r5, r5, r6\n\t"
  1636. "adcs r3, r3, r8\n\t"
  1637. "adc r4, r4, #0\n\t"
  1638. /* A[1] * A[1] */
  1639. "ldr r6, [%[a], #4]\n\t"
  1640. "umull r6, r8, r6, r6\n\t"
  1641. "adds r5, r5, r6\n\t"
  1642. "adcs r3, r3, r8\n\t"
  1643. "adc r4, r4, #0\n\t"
  1644. "str r5, [%[tmp], #8]\n\t"
  1645. "mov r5, #0\n\t"
  1646. /* A[0] * A[3] */
  1647. "ldr r6, [%[a], #0]\n\t"
  1648. "ldr r8, [%[a], #12]\n\t"
  1649. "umull r9, r10, r6, r8\n\t"
  1650. "mov r11, #0\n\t"
  1651. /* A[1] * A[2] */
  1652. "ldr r6, [%[a], #4]\n\t"
  1653. "ldr r8, [%[a], #8]\n\t"
  1654. "umull r6, r8, r6, r8\n\t"
  1655. "adds r9, r9, r6\n\t"
  1656. "adcs r10, r10, r8\n\t"
  1657. "adc r11, r11, #0\n\t"
  1658. "adds r9, r9, r9\n\t"
  1659. "adcs r10, r10, r10\n\t"
  1660. "adc r11, r11, r11\n\t"
  1661. "adds r3, r3, r9\n\t"
  1662. "adcs r4, r4, r10\n\t"
  1663. "adc r5, r5, r11\n\t"
  1664. "str r3, [%[tmp], #12]\n\t"
  1665. "mov r3, #0\n\t"
  1666. /* A[0] * A[4] */
  1667. "ldr r6, [%[a], #0]\n\t"
  1668. "ldr r8, [%[a], #16]\n\t"
  1669. "umull r9, r10, r6, r8\n\t"
  1670. "mov r11, #0\n\t"
  1671. /* A[1] * A[3] */
  1672. "ldr r6, [%[a], #4]\n\t"
  1673. "ldr r8, [%[a], #12]\n\t"
  1674. "umull r6, r8, r6, r8\n\t"
  1675. "adds r9, r9, r6\n\t"
  1676. "adcs r10, r10, r8\n\t"
  1677. "adc r11, r11, #0\n\t"
  1678. /* A[2] * A[2] */
  1679. "ldr r6, [%[a], #8]\n\t"
  1680. "umull r6, r8, r6, r6\n\t"
  1681. "adds r4, r4, r6\n\t"
  1682. "adcs r5, r5, r8\n\t"
  1683. "adc r3, r3, #0\n\t"
  1684. "adds r9, r9, r9\n\t"
  1685. "adcs r10, r10, r10\n\t"
  1686. "adc r11, r11, r11\n\t"
  1687. "adds r4, r4, r9\n\t"
  1688. "adcs r5, r5, r10\n\t"
  1689. "adc r3, r3, r11\n\t"
  1690. "str r4, [%[tmp], #16]\n\t"
  1691. "mov r4, #0\n\t"
  1692. /* A[0] * A[5] */
  1693. "ldr r6, [%[a], #0]\n\t"
  1694. "ldr r8, [%[a], #20]\n\t"
  1695. "umull r9, r10, r6, r8\n\t"
  1696. "mov r11, #0\n\t"
  1697. /* A[1] * A[4] */
  1698. "ldr r6, [%[a], #4]\n\t"
  1699. "ldr r8, [%[a], #16]\n\t"
  1700. "umull r6, r8, r6, r8\n\t"
  1701. "adds r9, r9, r6\n\t"
  1702. "adcs r10, r10, r8\n\t"
  1703. "adc r11, r11, #0\n\t"
  1704. /* A[2] * A[3] */
  1705. "ldr r6, [%[a], #8]\n\t"
  1706. "ldr r8, [%[a], #12]\n\t"
  1707. "umull r6, r8, r6, r8\n\t"
  1708. "adds r9, r9, r6\n\t"
  1709. "adcs r10, r10, r8\n\t"
  1710. "adc r11, r11, #0\n\t"
  1711. "adds r9, r9, r9\n\t"
  1712. "adcs r10, r10, r10\n\t"
  1713. "adc r11, r11, r11\n\t"
  1714. "adds r5, r5, r9\n\t"
  1715. "adcs r3, r3, r10\n\t"
  1716. "adc r4, r4, r11\n\t"
  1717. "str r5, [%[tmp], #20]\n\t"
  1718. "mov r5, #0\n\t"
  1719. /* A[0] * A[6] */
  1720. "ldr r6, [%[a], #0]\n\t"
  1721. "ldr r8, [%[a], #24]\n\t"
  1722. "umull r9, r10, r6, r8\n\t"
  1723. "mov r11, #0\n\t"
  1724. /* A[1] * A[5] */
  1725. "ldr r6, [%[a], #4]\n\t"
  1726. "ldr r8, [%[a], #20]\n\t"
  1727. "umull r6, r8, r6, r8\n\t"
  1728. "adds r9, r9, r6\n\t"
  1729. "adcs r10, r10, r8\n\t"
  1730. "adc r11, r11, #0\n\t"
  1731. /* A[2] * A[4] */
  1732. "ldr r6, [%[a], #8]\n\t"
  1733. "ldr r8, [%[a], #16]\n\t"
  1734. "umull r6, r8, r6, r8\n\t"
  1735. "adds r9, r9, r6\n\t"
  1736. "adcs r10, r10, r8\n\t"
  1737. "adc r11, r11, #0\n\t"
  1738. /* A[3] * A[3] */
  1739. "ldr r6, [%[a], #12]\n\t"
  1740. "umull r6, r8, r6, r6\n\t"
  1741. "adds r3, r3, r6\n\t"
  1742. "adcs r4, r4, r8\n\t"
  1743. "adc r5, r5, #0\n\t"
  1744. "adds r9, r9, r9\n\t"
  1745. "adcs r10, r10, r10\n\t"
  1746. "adc r11, r11, r11\n\t"
  1747. "adds r3, r3, r9\n\t"
  1748. "adcs r4, r4, r10\n\t"
  1749. "adc r5, r5, r11\n\t"
  1750. "str r3, [%[tmp], #24]\n\t"
  1751. "mov r3, #0\n\t"
  1752. /* A[0] * A[7] */
  1753. "ldr r6, [%[a], #0]\n\t"
  1754. "ldr r8, [%[a], #28]\n\t"
  1755. "umull r9, r10, r6, r8\n\t"
  1756. "mov r11, #0\n\t"
  1757. /* A[1] * A[6] */
  1758. "ldr r6, [%[a], #4]\n\t"
  1759. "ldr r8, [%[a], #24]\n\t"
  1760. "umull r6, r8, r6, r8\n\t"
  1761. "adds r9, r9, r6\n\t"
  1762. "adcs r10, r10, r8\n\t"
  1763. "adc r11, r11, #0\n\t"
  1764. /* A[2] * A[5] */
  1765. "ldr r6, [%[a], #8]\n\t"
  1766. "ldr r8, [%[a], #20]\n\t"
  1767. "umull r6, r8, r6, r8\n\t"
  1768. "adds r9, r9, r6\n\t"
  1769. "adcs r10, r10, r8\n\t"
  1770. "adc r11, r11, #0\n\t"
  1771. /* A[3] * A[4] */
  1772. "ldr r6, [%[a], #12]\n\t"
  1773. "ldr r8, [%[a], #16]\n\t"
  1774. "umull r6, r8, r6, r8\n\t"
  1775. "adds r9, r9, r6\n\t"
  1776. "adcs r10, r10, r8\n\t"
  1777. "adc r11, r11, #0\n\t"
  1778. "adds r9, r9, r9\n\t"
  1779. "adcs r10, r10, r10\n\t"
  1780. "adc r11, r11, r11\n\t"
  1781. "adds r4, r4, r9\n\t"
  1782. "adcs r5, r5, r10\n\t"
  1783. "adc r3, r3, r11\n\t"
  1784. "str r4, [%[tmp], #28]\n\t"
  1785. "mov r4, #0\n\t"
  1786. /* A[1] * A[7] */
  1787. "ldr r6, [%[a], #4]\n\t"
  1788. "ldr r8, [%[a], #28]\n\t"
  1789. "umull r9, r10, r6, r8\n\t"
  1790. "mov r11, #0\n\t"
  1791. /* A[2] * A[6] */
  1792. "ldr r6, [%[a], #8]\n\t"
  1793. "ldr r8, [%[a], #24]\n\t"
  1794. "umull r6, r8, r6, r8\n\t"
  1795. "adds r9, r9, r6\n\t"
  1796. "adcs r10, r10, r8\n\t"
  1797. "adc r11, r11, #0\n\t"
  1798. /* A[3] * A[5] */
  1799. "ldr r6, [%[a], #12]\n\t"
  1800. "ldr r8, [%[a], #20]\n\t"
  1801. "umull r6, r8, r6, r8\n\t"
  1802. "adds r9, r9, r6\n\t"
  1803. "adcs r10, r10, r8\n\t"
  1804. "adc r11, r11, #0\n\t"
  1805. /* A[4] * A[4] */
  1806. "ldr r6, [%[a], #16]\n\t"
  1807. "umull r6, r8, r6, r6\n\t"
  1808. "adds r5, r5, r6\n\t"
  1809. "adcs r3, r3, r8\n\t"
  1810. "adc r4, r4, #0\n\t"
  1811. "adds r9, r9, r9\n\t"
  1812. "adcs r10, r10, r10\n\t"
  1813. "adc r11, r11, r11\n\t"
  1814. "adds r5, r5, r9\n\t"
  1815. "adcs r3, r3, r10\n\t"
  1816. "adc r4, r4, r11\n\t"
  1817. "str r5, [%[r], #32]\n\t"
  1818. "mov r5, #0\n\t"
  1819. /* A[2] * A[7] */
  1820. "ldr r6, [%[a], #8]\n\t"
  1821. "ldr r8, [%[a], #28]\n\t"
  1822. "umull r9, r10, r6, r8\n\t"
  1823. "mov r11, #0\n\t"
  1824. /* A[3] * A[6] */
  1825. "ldr r6, [%[a], #12]\n\t"
  1826. "ldr r8, [%[a], #24]\n\t"
  1827. "umull r6, r8, r6, r8\n\t"
  1828. "adds r9, r9, r6\n\t"
  1829. "adcs r10, r10, r8\n\t"
  1830. "adc r11, r11, #0\n\t"
  1831. /* A[4] * A[5] */
  1832. "ldr r6, [%[a], #16]\n\t"
  1833. "ldr r8, [%[a], #20]\n\t"
  1834. "umull r6, r8, r6, r8\n\t"
  1835. "adds r9, r9, r6\n\t"
  1836. "adcs r10, r10, r8\n\t"
  1837. "adc r11, r11, #0\n\t"
  1838. "adds r9, r9, r9\n\t"
  1839. "adcs r10, r10, r10\n\t"
  1840. "adc r11, r11, r11\n\t"
  1841. "adds r3, r3, r9\n\t"
  1842. "adcs r4, r4, r10\n\t"
  1843. "adc r5, r5, r11\n\t"
  1844. "str r3, [%[r], #36]\n\t"
  1845. "mov r3, #0\n\t"
  1846. /* A[3] * A[7] */
  1847. "ldr r6, [%[a], #12]\n\t"
  1848. "ldr r8, [%[a], #28]\n\t"
  1849. "umull r9, r10, r6, r8\n\t"
  1850. "mov r11, #0\n\t"
  1851. /* A[4] * A[6] */
  1852. "ldr r6, [%[a], #16]\n\t"
  1853. "ldr r8, [%[a], #24]\n\t"
  1854. "umull r6, r8, r6, r8\n\t"
  1855. "adds r9, r9, r6\n\t"
  1856. "adcs r10, r10, r8\n\t"
  1857. "adc r11, r11, #0\n\t"
  1858. /* A[5] * A[5] */
  1859. "ldr r6, [%[a], #20]\n\t"
  1860. "umull r6, r8, r6, r6\n\t"
  1861. "adds r4, r4, r6\n\t"
  1862. "adcs r5, r5, r8\n\t"
  1863. "adc r3, r3, #0\n\t"
  1864. "adds r9, r9, r9\n\t"
  1865. "adcs r10, r10, r10\n\t"
  1866. "adc r11, r11, r11\n\t"
  1867. "adds r4, r4, r9\n\t"
  1868. "adcs r5, r5, r10\n\t"
  1869. "adc r3, r3, r11\n\t"
  1870. "str r4, [%[r], #40]\n\t"
  1871. "mov r4, #0\n\t"
  1872. /* A[4] * A[7] */
  1873. "ldr r6, [%[a], #16]\n\t"
  1874. "ldr r8, [%[a], #28]\n\t"
  1875. "umull r6, r8, r6, r8\n\t"
  1876. "adds r5, r5, r6\n\t"
  1877. "adcs r3, r3, r8\n\t"
  1878. "adc r4, r4, #0\n\t"
  1879. "adds r5, r5, r6\n\t"
  1880. "adcs r3, r3, r8\n\t"
  1881. "adc r4, r4, #0\n\t"
  1882. /* A[5] * A[6] */
  1883. "ldr r6, [%[a], #20]\n\t"
  1884. "ldr r8, [%[a], #24]\n\t"
  1885. "umull r6, r8, r6, r8\n\t"
  1886. "adds r5, r5, r6\n\t"
  1887. "adcs r3, r3, r8\n\t"
  1888. "adc r4, r4, #0\n\t"
  1889. "adds r5, r5, r6\n\t"
  1890. "adcs r3, r3, r8\n\t"
  1891. "adc r4, r4, #0\n\t"
  1892. "str r5, [%[r], #44]\n\t"
  1893. "mov r5, #0\n\t"
  1894. /* A[5] * A[7] */
  1895. "ldr r6, [%[a], #20]\n\t"
  1896. "ldr r8, [%[a], #28]\n\t"
  1897. "umull r6, r8, r6, r8\n\t"
  1898. "adds r3, r3, r6\n\t"
  1899. "adcs r4, r4, r8\n\t"
  1900. "adc r5, r5, #0\n\t"
  1901. "adds r3, r3, r6\n\t"
  1902. "adcs r4, r4, r8\n\t"
  1903. "adc r5, r5, #0\n\t"
  1904. /* A[6] * A[6] */
  1905. "ldr r6, [%[a], #24]\n\t"
  1906. "umull r6, r8, r6, r6\n\t"
  1907. "adds r3, r3, r6\n\t"
  1908. "adcs r4, r4, r8\n\t"
  1909. "adc r5, r5, #0\n\t"
  1910. "str r3, [%[r], #48]\n\t"
  1911. "mov r3, #0\n\t"
  1912. /* A[6] * A[7] */
  1913. "ldr r6, [%[a], #24]\n\t"
  1914. "ldr r8, [%[a], #28]\n\t"
  1915. "umull r6, r8, r6, r8\n\t"
  1916. "adds r4, r4, r6\n\t"
  1917. "adcs r5, r5, r8\n\t"
  1918. "adc r3, r3, #0\n\t"
  1919. "adds r4, r4, r6\n\t"
  1920. "adcs r5, r5, r8\n\t"
  1921. "adc r3, r3, #0\n\t"
  1922. "str r4, [%[r], #52]\n\t"
  1923. "mov r4, #0\n\t"
  1924. /* A[7] * A[7] */
  1925. "ldr r6, [%[a], #28]\n\t"
  1926. "umull r6, r8, r6, r6\n\t"
  1927. "adds r5, r5, r6\n\t"
  1928. "adc r3, r3, r8\n\t"
  1929. "str r5, [%[r], #56]\n\t"
  1930. "str r3, [%[r], #60]\n\t"
  1931. /* Transfer tmp to r */
  1932. "ldr r3, [%[tmp], #0]\n\t"
  1933. "ldr r4, [%[tmp], #4]\n\t"
  1934. "ldr r5, [%[tmp], #8]\n\t"
  1935. "ldr r6, [%[tmp], #12]\n\t"
  1936. "str r3, [%[r], #0]\n\t"
  1937. "str r4, [%[r], #4]\n\t"
  1938. "str r5, [%[r], #8]\n\t"
  1939. "str r6, [%[r], #12]\n\t"
  1940. "ldr r3, [%[tmp], #16]\n\t"
  1941. "ldr r4, [%[tmp], #20]\n\t"
  1942. "ldr r5, [%[tmp], #24]\n\t"
  1943. "ldr r6, [%[tmp], #28]\n\t"
  1944. "str r3, [%[r], #16]\n\t"
  1945. "str r4, [%[r], #20]\n\t"
  1946. "str r5, [%[r], #24]\n\t"
  1947. "str r6, [%[r], #28]\n\t"
  1948. :
  1949. : [r] "r" (r), [a] "r" (a), [tmp] "r" (tmp)
  1950. : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11"
  1951. );
  1952. }
  1953. /* Sub b from a into r. (r = a - b)
  1954. *
  1955. * r A single precision integer.
  1956. * a A single precision integer.
  1957. * b A single precision integer.
  1958. */
  1959. SP_NOINLINE static sp_digit sp_2048_sub_8(sp_digit* r, const sp_digit* a,
  1960. const sp_digit* b)
  1961. {
  1962. sp_digit c = 0;
  1963. __asm__ __volatile__ (
  1964. "ldm %[a]!, {r4, r5}\n\t"
  1965. "ldm %[b]!, {r6, r8}\n\t"
  1966. "subs r4, r4, r6\n\t"
  1967. "sbcs r5, r5, r8\n\t"
  1968. "stm %[r]!, {r4, r5}\n\t"
  1969. "ldm %[a]!, {r4, r5}\n\t"
  1970. "ldm %[b]!, {r6, r8}\n\t"
  1971. "sbcs r4, r4, r6\n\t"
  1972. "sbcs r5, r5, r8\n\t"
  1973. "stm %[r]!, {r4, r5}\n\t"
  1974. "ldm %[a]!, {r4, r5}\n\t"
  1975. "ldm %[b]!, {r6, r8}\n\t"
  1976. "sbcs r4, r4, r6\n\t"
  1977. "sbcs r5, r5, r8\n\t"
  1978. "stm %[r]!, {r4, r5}\n\t"
  1979. "ldm %[a]!, {r4, r5}\n\t"
  1980. "ldm %[b]!, {r6, r8}\n\t"
  1981. "sbcs r4, r4, r6\n\t"
  1982. "sbcs r5, r5, r8\n\t"
  1983. "stm %[r]!, {r4, r5}\n\t"
  1984. "sbc %[c], %[c], %[c]\n\t"
  1985. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  1986. :
  1987. : "memory", "r4", "r5", "r6", "r8"
  1988. );
  1989. return c;
  1990. }
  1991. /* Square a and put result in r. (r = a * a)
  1992. *
  1993. * r A single precision integer.
  1994. * a A single precision integer.
  1995. */
  1996. SP_NOINLINE static void sp_2048_sqr_16(sp_digit* r, const sp_digit* a)
  1997. {
  1998. sp_digit* z0 = r;
  1999. sp_digit* z2 = r + 16;
  2000. sp_digit z1[16];
  2001. sp_digit* a1 = z1;
  2002. sp_digit zero[8];
  2003. sp_digit u;
  2004. sp_digit mask;
  2005. sp_digit* p1;
  2006. sp_digit* p2;
  2007. XMEMSET(zero, 0, sizeof(sp_digit) * 8);
  2008. mask = sp_2048_sub_8(a1, a, &a[8]);
  2009. p1 = (sp_digit*)(((sp_digit)zero & mask ) | ((sp_digit)a1 & (~mask)));
  2010. p2 = (sp_digit*)(((sp_digit)zero & (~mask)) | ((sp_digit)a1 & mask ));
  2011. (void)sp_2048_sub_8(a1, p1, p2);
  2012. sp_2048_sqr_8(z2, &a[8]);
  2013. sp_2048_sqr_8(z0, a);
  2014. sp_2048_sqr_8(z1, a1);
  2015. u = 0;
  2016. u -= sp_2048_sub_in_place_16(z1, z2);
  2017. u -= sp_2048_sub_in_place_16(z1, z0);
  2018. u += sp_2048_sub_in_place_16(r + 8, z1);
  2019. zero[0] = u;
  2020. (void)sp_2048_add_8(r + 24, r + 24, zero);
  2021. }
  2022. /* Sub b from a into r. (r = a - b)
  2023. *
  2024. * r A single precision integer.
  2025. * a A single precision integer.
  2026. * b A single precision integer.
  2027. */
  2028. SP_NOINLINE static sp_digit sp_2048_sub_16(sp_digit* r, const sp_digit* a,
  2029. const sp_digit* b)
  2030. {
  2031. sp_digit c = 0;
  2032. __asm__ __volatile__ (
  2033. "ldm %[a]!, {r4, r5}\n\t"
  2034. "ldm %[b]!, {r6, r8}\n\t"
  2035. "subs r4, r4, r6\n\t"
  2036. "sbcs r5, r5, r8\n\t"
  2037. "stm %[r]!, {r4, r5}\n\t"
  2038. "ldm %[a]!, {r4, r5}\n\t"
  2039. "ldm %[b]!, {r6, r8}\n\t"
  2040. "sbcs r4, r4, r6\n\t"
  2041. "sbcs r5, r5, r8\n\t"
  2042. "stm %[r]!, {r4, r5}\n\t"
  2043. "ldm %[a]!, {r4, r5}\n\t"
  2044. "ldm %[b]!, {r6, r8}\n\t"
  2045. "sbcs r4, r4, r6\n\t"
  2046. "sbcs r5, r5, r8\n\t"
  2047. "stm %[r]!, {r4, r5}\n\t"
  2048. "ldm %[a]!, {r4, r5}\n\t"
  2049. "ldm %[b]!, {r6, r8}\n\t"
  2050. "sbcs r4, r4, r6\n\t"
  2051. "sbcs r5, r5, r8\n\t"
  2052. "stm %[r]!, {r4, r5}\n\t"
  2053. "ldm %[a]!, {r4, r5}\n\t"
  2054. "ldm %[b]!, {r6, r8}\n\t"
  2055. "sbcs r4, r4, r6\n\t"
  2056. "sbcs r5, r5, r8\n\t"
  2057. "stm %[r]!, {r4, r5}\n\t"
  2058. "ldm %[a]!, {r4, r5}\n\t"
  2059. "ldm %[b]!, {r6, r8}\n\t"
  2060. "sbcs r4, r4, r6\n\t"
  2061. "sbcs r5, r5, r8\n\t"
  2062. "stm %[r]!, {r4, r5}\n\t"
  2063. "ldm %[a]!, {r4, r5}\n\t"
  2064. "ldm %[b]!, {r6, r8}\n\t"
  2065. "sbcs r4, r4, r6\n\t"
  2066. "sbcs r5, r5, r8\n\t"
  2067. "stm %[r]!, {r4, r5}\n\t"
  2068. "ldm %[a]!, {r4, r5}\n\t"
  2069. "ldm %[b]!, {r6, r8}\n\t"
  2070. "sbcs r4, r4, r6\n\t"
  2071. "sbcs r5, r5, r8\n\t"
  2072. "stm %[r]!, {r4, r5}\n\t"
  2073. "sbc %[c], %[c], %[c]\n\t"
  2074. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  2075. :
  2076. : "memory", "r4", "r5", "r6", "r8"
  2077. );
  2078. return c;
  2079. }
  2080. /* Square a and put result in r. (r = a * a)
  2081. *
  2082. * r A single precision integer.
  2083. * a A single precision integer.
  2084. */
  2085. SP_NOINLINE static void sp_2048_sqr_32(sp_digit* r, const sp_digit* a)
  2086. {
  2087. sp_digit* z0 = r;
  2088. sp_digit* z2 = r + 32;
  2089. sp_digit z1[32];
  2090. sp_digit* a1 = z1;
  2091. sp_digit zero[16];
  2092. sp_digit u;
  2093. sp_digit mask;
  2094. sp_digit* p1;
  2095. sp_digit* p2;
  2096. XMEMSET(zero, 0, sizeof(sp_digit) * 16);
  2097. mask = sp_2048_sub_16(a1, a, &a[16]);
  2098. p1 = (sp_digit*)(((sp_digit)zero & mask ) | ((sp_digit)a1 & (~mask)));
  2099. p2 = (sp_digit*)(((sp_digit)zero & (~mask)) | ((sp_digit)a1 & mask ));
  2100. (void)sp_2048_sub_16(a1, p1, p2);
  2101. sp_2048_sqr_16(z2, &a[16]);
  2102. sp_2048_sqr_16(z0, a);
  2103. sp_2048_sqr_16(z1, a1);
  2104. u = 0;
  2105. u -= sp_2048_sub_in_place_32(z1, z2);
  2106. u -= sp_2048_sub_in_place_32(z1, z0);
  2107. u += sp_2048_sub_in_place_32(r + 16, z1);
  2108. zero[0] = u;
  2109. (void)sp_2048_add_16(r + 48, r + 48, zero);
  2110. }
  2111. /* Sub b from a into r. (r = a - b)
  2112. *
  2113. * r A single precision integer.
  2114. * a A single precision integer.
  2115. * b A single precision integer.
  2116. */
  2117. SP_NOINLINE static sp_digit sp_2048_sub_32(sp_digit* r, const sp_digit* a,
  2118. const sp_digit* b)
  2119. {
  2120. sp_digit c = 0;
  2121. __asm__ __volatile__ (
  2122. "ldm %[a]!, {r4, r5}\n\t"
  2123. "ldm %[b]!, {r6, r8}\n\t"
  2124. "subs r4, r4, r6\n\t"
  2125. "sbcs r5, r5, r8\n\t"
  2126. "stm %[r]!, {r4, r5}\n\t"
  2127. "ldm %[a]!, {r4, r5}\n\t"
  2128. "ldm %[b]!, {r6, r8}\n\t"
  2129. "sbcs r4, r4, r6\n\t"
  2130. "sbcs r5, r5, r8\n\t"
  2131. "stm %[r]!, {r4, r5}\n\t"
  2132. "ldm %[a]!, {r4, r5}\n\t"
  2133. "ldm %[b]!, {r6, r8}\n\t"
  2134. "sbcs r4, r4, r6\n\t"
  2135. "sbcs r5, r5, r8\n\t"
  2136. "stm %[r]!, {r4, r5}\n\t"
  2137. "ldm %[a]!, {r4, r5}\n\t"
  2138. "ldm %[b]!, {r6, r8}\n\t"
  2139. "sbcs r4, r4, r6\n\t"
  2140. "sbcs r5, r5, r8\n\t"
  2141. "stm %[r]!, {r4, r5}\n\t"
  2142. "ldm %[a]!, {r4, r5}\n\t"
  2143. "ldm %[b]!, {r6, r8}\n\t"
  2144. "sbcs r4, r4, r6\n\t"
  2145. "sbcs r5, r5, r8\n\t"
  2146. "stm %[r]!, {r4, r5}\n\t"
  2147. "ldm %[a]!, {r4, r5}\n\t"
  2148. "ldm %[b]!, {r6, r8}\n\t"
  2149. "sbcs r4, r4, r6\n\t"
  2150. "sbcs r5, r5, r8\n\t"
  2151. "stm %[r]!, {r4, r5}\n\t"
  2152. "ldm %[a]!, {r4, r5}\n\t"
  2153. "ldm %[b]!, {r6, r8}\n\t"
  2154. "sbcs r4, r4, r6\n\t"
  2155. "sbcs r5, r5, r8\n\t"
  2156. "stm %[r]!, {r4, r5}\n\t"
  2157. "ldm %[a]!, {r4, r5}\n\t"
  2158. "ldm %[b]!, {r6, r8}\n\t"
  2159. "sbcs r4, r4, r6\n\t"
  2160. "sbcs r5, r5, r8\n\t"
  2161. "stm %[r]!, {r4, r5}\n\t"
  2162. "ldm %[a]!, {r4, r5}\n\t"
  2163. "ldm %[b]!, {r6, r8}\n\t"
  2164. "sbcs r4, r4, r6\n\t"
  2165. "sbcs r5, r5, r8\n\t"
  2166. "stm %[r]!, {r4, r5}\n\t"
  2167. "ldm %[a]!, {r4, r5}\n\t"
  2168. "ldm %[b]!, {r6, r8}\n\t"
  2169. "sbcs r4, r4, r6\n\t"
  2170. "sbcs r5, r5, r8\n\t"
  2171. "stm %[r]!, {r4, r5}\n\t"
  2172. "ldm %[a]!, {r4, r5}\n\t"
  2173. "ldm %[b]!, {r6, r8}\n\t"
  2174. "sbcs r4, r4, r6\n\t"
  2175. "sbcs r5, r5, r8\n\t"
  2176. "stm %[r]!, {r4, r5}\n\t"
  2177. "ldm %[a]!, {r4, r5}\n\t"
  2178. "ldm %[b]!, {r6, r8}\n\t"
  2179. "sbcs r4, r4, r6\n\t"
  2180. "sbcs r5, r5, r8\n\t"
  2181. "stm %[r]!, {r4, r5}\n\t"
  2182. "ldm %[a]!, {r4, r5}\n\t"
  2183. "ldm %[b]!, {r6, r8}\n\t"
  2184. "sbcs r4, r4, r6\n\t"
  2185. "sbcs r5, r5, r8\n\t"
  2186. "stm %[r]!, {r4, r5}\n\t"
  2187. "ldm %[a]!, {r4, r5}\n\t"
  2188. "ldm %[b]!, {r6, r8}\n\t"
  2189. "sbcs r4, r4, r6\n\t"
  2190. "sbcs r5, r5, r8\n\t"
  2191. "stm %[r]!, {r4, r5}\n\t"
  2192. "ldm %[a]!, {r4, r5}\n\t"
  2193. "ldm %[b]!, {r6, r8}\n\t"
  2194. "sbcs r4, r4, r6\n\t"
  2195. "sbcs r5, r5, r8\n\t"
  2196. "stm %[r]!, {r4, r5}\n\t"
  2197. "ldm %[a]!, {r4, r5}\n\t"
  2198. "ldm %[b]!, {r6, r8}\n\t"
  2199. "sbcs r4, r4, r6\n\t"
  2200. "sbcs r5, r5, r8\n\t"
  2201. "stm %[r]!, {r4, r5}\n\t"
  2202. "sbc %[c], %[c], %[c]\n\t"
  2203. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  2204. :
  2205. : "memory", "r4", "r5", "r6", "r8"
  2206. );
  2207. return c;
  2208. }
  2209. /* Square a and put result in r. (r = a * a)
  2210. *
  2211. * r A single precision integer.
  2212. * a A single precision integer.
  2213. */
  2214. SP_NOINLINE static void sp_2048_sqr_64(sp_digit* r, const sp_digit* a)
  2215. {
  2216. sp_digit* z0 = r;
  2217. sp_digit* z2 = r + 64;
  2218. sp_digit z1[64];
  2219. sp_digit* a1 = z1;
  2220. sp_digit zero[32];
  2221. sp_digit u;
  2222. sp_digit mask;
  2223. sp_digit* p1;
  2224. sp_digit* p2;
  2225. XMEMSET(zero, 0, sizeof(sp_digit) * 32);
  2226. mask = sp_2048_sub_32(a1, a, &a[32]);
  2227. p1 = (sp_digit*)(((sp_digit)zero & mask ) | ((sp_digit)a1 & (~mask)));
  2228. p2 = (sp_digit*)(((sp_digit)zero & (~mask)) | ((sp_digit)a1 & mask ));
  2229. (void)sp_2048_sub_32(a1, p1, p2);
  2230. sp_2048_sqr_32(z2, &a[32]);
  2231. sp_2048_sqr_32(z0, a);
  2232. sp_2048_sqr_32(z1, a1);
  2233. u = 0;
  2234. u -= sp_2048_sub_in_place_64(z1, z2);
  2235. u -= sp_2048_sub_in_place_64(z1, z0);
  2236. u += sp_2048_sub_in_place_64(r + 32, z1);
  2237. zero[0] = u;
  2238. (void)sp_2048_add_32(r + 96, r + 96, zero);
  2239. }
  2240. #endif /* !WOLFSSL_SP_SMALL */
  2241. #ifdef WOLFSSL_SP_SMALL
  2242. /* Add b to a into r. (r = a + b)
  2243. *
  2244. * r A single precision integer.
  2245. * a A single precision integer.
  2246. * b A single precision integer.
  2247. */
  2248. SP_NOINLINE static sp_digit sp_2048_add_64(sp_digit* r, const sp_digit* a,
  2249. const sp_digit* b)
  2250. {
  2251. sp_digit c = 0;
  2252. __asm__ __volatile__ (
  2253. "mov r6, %[a]\n\t"
  2254. "mov r8, #0\n\t"
  2255. "add r6, r6, #256\n\t"
  2256. "sub r8, r8, #1\n\t"
  2257. "\n1:\n\t"
  2258. "adds %[c], %[c], r8\n\t"
  2259. "ldr r4, [%[a]]\n\t"
  2260. "ldr r5, [%[b]]\n\t"
  2261. "adcs r4, r4, r5\n\t"
  2262. "str r4, [%[r]]\n\t"
  2263. "mov %[c], #0\n\t"
  2264. "adc %[c], %[c], %[c]\n\t"
  2265. "add %[a], %[a], #4\n\t"
  2266. "add %[b], %[b], #4\n\t"
  2267. "add %[r], %[r], #4\n\t"
  2268. "cmp %[a], r6\n\t"
  2269. #ifdef __GNUC__
  2270. "bne 1b\n\t"
  2271. #else
  2272. "bne.n 1b\n\t"
  2273. #endif /* __GNUC__ */
  2274. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  2275. :
  2276. : "memory", "r4", "r5", "r6", "r8"
  2277. );
  2278. return c;
  2279. }
  2280. #endif /* WOLFSSL_SP_SMALL */
  2281. #ifdef WOLFSSL_SP_SMALL
  2282. /* Sub b from a into a. (a -= b)
  2283. *
  2284. * a A single precision integer.
  2285. * b A single precision integer.
  2286. */
  2287. SP_NOINLINE static sp_digit sp_2048_sub_in_place_64(sp_digit* a,
  2288. const sp_digit* b)
  2289. {
  2290. sp_digit c = 0;
  2291. __asm__ __volatile__ (
  2292. "mov r8, %[a]\n\t"
  2293. "add r8, r8, #256\n\t"
  2294. "\n1:\n\t"
  2295. "mov r5, #0\n\t"
  2296. "subs r5, r5, %[c]\n\t"
  2297. "ldr r3, [%[a]]\n\t"
  2298. "ldr r4, [%[a], #4]\n\t"
  2299. "ldr r5, [%[b]]\n\t"
  2300. "ldr r6, [%[b], #4]\n\t"
  2301. "sbcs r3, r3, r5\n\t"
  2302. "sbcs r4, r4, r6\n\t"
  2303. "str r3, [%[a]]\n\t"
  2304. "str r4, [%[a], #4]\n\t"
  2305. "sbc %[c], %[c], %[c]\n\t"
  2306. "add %[a], %[a], #8\n\t"
  2307. "add %[b], %[b], #8\n\t"
  2308. "cmp %[a], r8\n\t"
  2309. #ifdef __GNUC__
  2310. "bne 1b\n\t"
  2311. #else
  2312. "bne.n 1b\n\t"
  2313. #endif /* __GNUC__ */
  2314. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  2315. :
  2316. : "memory", "r3", "r4", "r5", "r6", "r8"
  2317. );
  2318. return c;
  2319. }
  2320. #endif /* WOLFSSL_SP_SMALL */
  2321. #ifdef WOLFSSL_SP_SMALL
  2322. /* Multiply a and b into r. (r = a * b)
  2323. *
  2324. * r A single precision integer.
  2325. * a A single precision integer.
  2326. * b A single precision integer.
  2327. */
  2328. SP_NOINLINE static void sp_2048_mul_64(sp_digit* r, const sp_digit* a,
  2329. const sp_digit* b)
  2330. {
  2331. sp_digit tmp_arr[64 * 2];
  2332. sp_digit* tmp = tmp_arr;
  2333. __asm__ __volatile__ (
  2334. "mov r3, #0\n\t"
  2335. "mov r4, #0\n\t"
  2336. "mov r9, r3\n\t"
  2337. "mov r12, %[r]\n\t"
  2338. "mov r10, %[a]\n\t"
  2339. "mov r11, %[b]\n\t"
  2340. "mov r6, #1\n\t"
  2341. "lsl r6, r6, #8\n\t"
  2342. "add r6, r6, r10\n\t"
  2343. "mov r14, r6\n\t"
  2344. "\n1:\n\t"
  2345. "mov %[r], #0\n\t"
  2346. "mov r5, #0\n\t"
  2347. "mov r6, #252\n\t"
  2348. "mov %[a], r9\n\t"
  2349. "subs %[a], %[a], r6\n\t"
  2350. "sbc r6, r6, r6\n\t"
  2351. "mvn r6, r6\n\t"
  2352. "and %[a], %[a], r6\n\t"
  2353. "mov %[b], r9\n\t"
  2354. "sub %[b], %[b], %[a]\n\t"
  2355. "add %[a], %[a], r10\n\t"
  2356. "add %[b], %[b], r11\n\t"
  2357. "\n2:\n\t"
  2358. /* Multiply Start */
  2359. "ldr r6, [%[a]]\n\t"
  2360. "ldr r8, [%[b]]\n\t"
  2361. "umull r6, r8, r6, r8\n\t"
  2362. "adds r3, r3, r6\n\t"
  2363. "adcs r4, r4, r8\n\t"
  2364. "adc r5, r5, %[r]\n\t"
  2365. /* Multiply Done */
  2366. "add %[a], %[a], #4\n\t"
  2367. "sub %[b], %[b], #4\n\t"
  2368. "cmp %[a], r14\n\t"
  2369. #ifdef __GNUC__
  2370. "beq 3f\n\t"
  2371. #else
  2372. "beq.n 3f\n\t"
  2373. #endif /* __GNUC__ */
  2374. "mov r6, r9\n\t"
  2375. "add r6, r6, r10\n\t"
  2376. "cmp %[a], r6\n\t"
  2377. #ifdef __GNUC__
  2378. "ble 2b\n\t"
  2379. #else
  2380. "ble.n 2b\n\t"
  2381. #endif /* __GNUC__ */
  2382. "\n3:\n\t"
  2383. "mov %[r], r12\n\t"
  2384. "mov r8, r9\n\t"
  2385. "str r3, [%[r], r8]\n\t"
  2386. "mov r3, r4\n\t"
  2387. "mov r4, r5\n\t"
  2388. "add r8, r8, #4\n\t"
  2389. "mov r9, r8\n\t"
  2390. "mov r6, #1\n\t"
  2391. "lsl r6, r6, #8\n\t"
  2392. "add r6, r6, #248\n\t"
  2393. "cmp r8, r6\n\t"
  2394. #ifdef __GNUC__
  2395. "ble 1b\n\t"
  2396. #else
  2397. "ble.n 1b\n\t"
  2398. #endif /* __GNUC__ */
  2399. "str r3, [%[r], r8]\n\t"
  2400. "mov %[a], r10\n\t"
  2401. "mov %[b], r11\n\t"
  2402. :
  2403. : [r] "r" (tmp), [a] "r" (a), [b] "r" (b)
  2404. : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  2405. );
  2406. XMEMCPY(r, tmp_arr, sizeof(tmp_arr));
  2407. }
  2408. /* Square a and put result in r. (r = a * a)
  2409. *
  2410. * r A single precision integer.
  2411. * a A single precision integer.
  2412. */
  2413. SP_NOINLINE static void sp_2048_sqr_64(sp_digit* r, const sp_digit* a)
  2414. {
  2415. __asm__ __volatile__ (
  2416. "mov r3, #0\n\t"
  2417. "mov r4, #0\n\t"
  2418. "mov r5, #0\n\t"
  2419. "mov r9, r3\n\t"
  2420. "mov r12, %[r]\n\t"
  2421. "mov r6, #2\n\t"
  2422. "lsl r6, r6, #8\n\t"
  2423. "neg r6, r6\n\t"
  2424. "add sp, sp, r6\n\t"
  2425. "mov r11, sp\n\t"
  2426. "mov r10, %[a]\n\t"
  2427. "\n1:\n\t"
  2428. "mov %[r], #0\n\t"
  2429. "mov r6, #252\n\t"
  2430. "mov %[a], r9\n\t"
  2431. "subs %[a], %[a], r6\n\t"
  2432. "sbc r6, r6, r6\n\t"
  2433. "mvn r6, r6\n\t"
  2434. "and %[a], %[a], r6\n\t"
  2435. "mov r2, r9\n\t"
  2436. "sub r2, r2, %[a]\n\t"
  2437. "add %[a], %[a], r10\n\t"
  2438. "add r2, r2, r10\n\t"
  2439. "\n2:\n\t"
  2440. "cmp r2, %[a]\n\t"
  2441. #ifdef __GNUC__
  2442. "beq 4f\n\t"
  2443. #else
  2444. "beq.n 4f\n\t"
  2445. #endif /* __GNUC__ */
  2446. /* Multiply * 2: Start */
  2447. "ldr r6, [%[a]]\n\t"
  2448. "ldr r8, [r2]\n\t"
  2449. "umull r6, r8, r6, r8\n\t"
  2450. "adds r3, r3, r6\n\t"
  2451. "adcs r4, r4, r8\n\t"
  2452. "adc r5, r5, %[r]\n\t"
  2453. "adds r3, r3, r6\n\t"
  2454. "adcs r4, r4, r8\n\t"
  2455. "adc r5, r5, %[r]\n\t"
  2456. /* Multiply * 2: Done */
  2457. #ifdef __GNUC__
  2458. "bal 5f\n\t"
  2459. #else
  2460. "bal.n 5f\n\t"
  2461. #endif /* __GNUC__ */
  2462. "\n4:\n\t"
  2463. /* Square: Start */
  2464. "ldr r6, [%[a]]\n\t"
  2465. "umull r6, r8, r6, r6\n\t"
  2466. "adds r3, r3, r6\n\t"
  2467. "adcs r4, r4, r8\n\t"
  2468. "adc r5, r5, %[r]\n\t"
  2469. /* Square: Done */
  2470. "\n5:\n\t"
  2471. "add %[a], %[a], #4\n\t"
  2472. "sub r2, r2, #4\n\t"
  2473. "mov r6, #1\n\t"
  2474. "lsl r6, r6, #8\n\t"
  2475. "add r6, r6, r10\n\t"
  2476. "cmp %[a], r6\n\t"
  2477. #ifdef __GNUC__
  2478. "beq 3f\n\t"
  2479. #else
  2480. "beq.n 3f\n\t"
  2481. #endif /* __GNUC__ */
  2482. "cmp %[a], r2\n\t"
  2483. #ifdef __GNUC__
  2484. "bgt 3f\n\t"
  2485. #else
  2486. "bgt.n 3f\n\t"
  2487. #endif /* __GNUC__ */
  2488. "mov r8, r9\n\t"
  2489. "add r8, r8, r10\n\t"
  2490. "cmp %[a], r8\n\t"
  2491. #ifdef __GNUC__
  2492. "ble 2b\n\t"
  2493. #else
  2494. "ble.n 2b\n\t"
  2495. #endif /* __GNUC__ */
  2496. "\n3:\n\t"
  2497. "mov %[r], r11\n\t"
  2498. "mov r8, r9\n\t"
  2499. "str r3, [%[r], r8]\n\t"
  2500. "mov r3, r4\n\t"
  2501. "mov r4, r5\n\t"
  2502. "mov r5, #0\n\t"
  2503. "add r8, r8, #4\n\t"
  2504. "mov r9, r8\n\t"
  2505. "mov r6, #1\n\t"
  2506. "lsl r6, r6, #8\n\t"
  2507. "add r6, r6, #248\n\t"
  2508. "cmp r8, r6\n\t"
  2509. #ifdef __GNUC__
  2510. "ble 1b\n\t"
  2511. #else
  2512. "ble.n 1b\n\t"
  2513. #endif /* __GNUC__ */
  2514. "mov %[a], r10\n\t"
  2515. "str r3, [%[r], r8]\n\t"
  2516. "mov %[r], r12\n\t"
  2517. "mov %[a], r11\n\t"
  2518. "mov r3, #1\n\t"
  2519. "lsl r3, r3, #8\n\t"
  2520. "add r3, r3, #252\n\t"
  2521. "\n4:\n\t"
  2522. "ldr r6, [%[a], r3]\n\t"
  2523. "str r6, [%[r], r3]\n\t"
  2524. "subs r3, r3, #4\n\t"
  2525. #ifdef __GNUC__
  2526. "bge 4b\n\t"
  2527. #else
  2528. "bge.n 4b\n\t"
  2529. #endif /* __GNUC__ */
  2530. "mov r6, #2\n\t"
  2531. "lsl r6, r6, #8\n\t"
  2532. "add sp, sp, r6\n\t"
  2533. :
  2534. : [r] "r" (r), [a] "r" (a)
  2535. : "memory", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12"
  2536. );
  2537. }
  2538. #endif /* WOLFSSL_SP_SMALL */
  2539. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || defined(WOLFSSL_HAVE_SP_DH)
  2540. #ifdef WOLFSSL_SP_SMALL
  2541. /* AND m into each word of a and store in r.
  2542. *
  2543. * r A single precision integer.
  2544. * a A single precision integer.
  2545. * m Mask to AND against each digit.
  2546. */
  2547. static void sp_2048_mask_32(sp_digit* r, const sp_digit* a, sp_digit m)
  2548. {
  2549. int i;
  2550. for (i=0; i<32; i++) {
  2551. r[i] = a[i] & m;
  2552. }
  2553. }
  2554. #endif /* WOLFSSL_SP_SMALL */
  2555. #ifdef WOLFSSL_SP_SMALL
  2556. /* Add b to a into r. (r = a + b)
  2557. *
  2558. * r A single precision integer.
  2559. * a A single precision integer.
  2560. * b A single precision integer.
  2561. */
  2562. SP_NOINLINE static sp_digit sp_2048_add_32(sp_digit* r, const sp_digit* a,
  2563. const sp_digit* b)
  2564. {
  2565. sp_digit c = 0;
  2566. __asm__ __volatile__ (
  2567. "mov r6, %[a]\n\t"
  2568. "mov r8, #0\n\t"
  2569. "add r6, r6, #128\n\t"
  2570. "sub r8, r8, #1\n\t"
  2571. "\n1:\n\t"
  2572. "adds %[c], %[c], r8\n\t"
  2573. "ldr r4, [%[a]]\n\t"
  2574. "ldr r5, [%[b]]\n\t"
  2575. "adcs r4, r4, r5\n\t"
  2576. "str r4, [%[r]]\n\t"
  2577. "mov %[c], #0\n\t"
  2578. "adc %[c], %[c], %[c]\n\t"
  2579. "add %[a], %[a], #4\n\t"
  2580. "add %[b], %[b], #4\n\t"
  2581. "add %[r], %[r], #4\n\t"
  2582. "cmp %[a], r6\n\t"
  2583. #ifdef __GNUC__
  2584. "bne 1b\n\t"
  2585. #else
  2586. "bne.n 1b\n\t"
  2587. #endif /* __GNUC__ */
  2588. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  2589. :
  2590. : "memory", "r4", "r5", "r6", "r8"
  2591. );
  2592. return c;
  2593. }
  2594. #endif /* WOLFSSL_SP_SMALL */
  2595. #ifdef WOLFSSL_SP_SMALL
  2596. /* Sub b from a into a. (a -= b)
  2597. *
  2598. * a A single precision integer.
  2599. * b A single precision integer.
  2600. */
  2601. SP_NOINLINE static sp_digit sp_2048_sub_in_place_32(sp_digit* a,
  2602. const sp_digit* b)
  2603. {
  2604. sp_digit c = 0;
  2605. __asm__ __volatile__ (
  2606. "mov r8, %[a]\n\t"
  2607. "add r8, r8, #128\n\t"
  2608. "\n1:\n\t"
  2609. "mov r5, #0\n\t"
  2610. "subs r5, r5, %[c]\n\t"
  2611. "ldr r3, [%[a]]\n\t"
  2612. "ldr r4, [%[a], #4]\n\t"
  2613. "ldr r5, [%[b]]\n\t"
  2614. "ldr r6, [%[b], #4]\n\t"
  2615. "sbcs r3, r3, r5\n\t"
  2616. "sbcs r4, r4, r6\n\t"
  2617. "str r3, [%[a]]\n\t"
  2618. "str r4, [%[a], #4]\n\t"
  2619. "sbc %[c], %[c], %[c]\n\t"
  2620. "add %[a], %[a], #8\n\t"
  2621. "add %[b], %[b], #8\n\t"
  2622. "cmp %[a], r8\n\t"
  2623. #ifdef __GNUC__
  2624. "bne 1b\n\t"
  2625. #else
  2626. "bne.n 1b\n\t"
  2627. #endif /* __GNUC__ */
  2628. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  2629. :
  2630. : "memory", "r3", "r4", "r5", "r6", "r8"
  2631. );
  2632. return c;
  2633. }
  2634. #endif /* WOLFSSL_SP_SMALL */
  2635. #ifdef WOLFSSL_SP_SMALL
  2636. /* Multiply a and b into r. (r = a * b)
  2637. *
  2638. * r A single precision integer.
  2639. * a A single precision integer.
  2640. * b A single precision integer.
  2641. */
  2642. SP_NOINLINE static void sp_2048_mul_32(sp_digit* r, const sp_digit* a,
  2643. const sp_digit* b)
  2644. {
  2645. sp_digit tmp_arr[32 * 2];
  2646. sp_digit* tmp = tmp_arr;
  2647. __asm__ __volatile__ (
  2648. "mov r3, #0\n\t"
  2649. "mov r4, #0\n\t"
  2650. "mov r9, r3\n\t"
  2651. "mov r12, %[r]\n\t"
  2652. "mov r10, %[a]\n\t"
  2653. "mov r11, %[b]\n\t"
  2654. "mov r6, #128\n\t"
  2655. "add r6, r6, r10\n\t"
  2656. "mov r14, r6\n\t"
  2657. "\n1:\n\t"
  2658. "mov %[r], #0\n\t"
  2659. "mov r5, #0\n\t"
  2660. "mov r6, #124\n\t"
  2661. "mov %[a], r9\n\t"
  2662. "subs %[a], %[a], r6\n\t"
  2663. "sbc r6, r6, r6\n\t"
  2664. "mvn r6, r6\n\t"
  2665. "and %[a], %[a], r6\n\t"
  2666. "mov %[b], r9\n\t"
  2667. "sub %[b], %[b], %[a]\n\t"
  2668. "add %[a], %[a], r10\n\t"
  2669. "add %[b], %[b], r11\n\t"
  2670. "\n2:\n\t"
  2671. /* Multiply Start */
  2672. "ldr r6, [%[a]]\n\t"
  2673. "ldr r8, [%[b]]\n\t"
  2674. "umull r6, r8, r6, r8\n\t"
  2675. "adds r3, r3, r6\n\t"
  2676. "adcs r4, r4, r8\n\t"
  2677. "adc r5, r5, %[r]\n\t"
  2678. /* Multiply Done */
  2679. "add %[a], %[a], #4\n\t"
  2680. "sub %[b], %[b], #4\n\t"
  2681. "cmp %[a], r14\n\t"
  2682. #ifdef __GNUC__
  2683. "beq 3f\n\t"
  2684. #else
  2685. "beq.n 3f\n\t"
  2686. #endif /* __GNUC__ */
  2687. "mov r6, r9\n\t"
  2688. "add r6, r6, r10\n\t"
  2689. "cmp %[a], r6\n\t"
  2690. #ifdef __GNUC__
  2691. "ble 2b\n\t"
  2692. #else
  2693. "ble.n 2b\n\t"
  2694. #endif /* __GNUC__ */
  2695. "\n3:\n\t"
  2696. "mov %[r], r12\n\t"
  2697. "mov r8, r9\n\t"
  2698. "str r3, [%[r], r8]\n\t"
  2699. "mov r3, r4\n\t"
  2700. "mov r4, r5\n\t"
  2701. "add r8, r8, #4\n\t"
  2702. "mov r9, r8\n\t"
  2703. "mov r6, #248\n\t"
  2704. "cmp r8, r6\n\t"
  2705. #ifdef __GNUC__
  2706. "ble 1b\n\t"
  2707. #else
  2708. "ble.n 1b\n\t"
  2709. #endif /* __GNUC__ */
  2710. "str r3, [%[r], r8]\n\t"
  2711. "mov %[a], r10\n\t"
  2712. "mov %[b], r11\n\t"
  2713. :
  2714. : [r] "r" (tmp), [a] "r" (a), [b] "r" (b)
  2715. : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  2716. );
  2717. XMEMCPY(r, tmp_arr, sizeof(tmp_arr));
  2718. }
  2719. /* Square a and put result in r. (r = a * a)
  2720. *
  2721. * r A single precision integer.
  2722. * a A single precision integer.
  2723. */
  2724. SP_NOINLINE static void sp_2048_sqr_32(sp_digit* r, const sp_digit* a)
  2725. {
  2726. __asm__ __volatile__ (
  2727. "mov r3, #0\n\t"
  2728. "mov r4, #0\n\t"
  2729. "mov r5, #0\n\t"
  2730. "mov r9, r3\n\t"
  2731. "mov r12, %[r]\n\t"
  2732. "mov r6, #1\n\t"
  2733. "lsl r6, r6, #8\n\t"
  2734. "neg r6, r6\n\t"
  2735. "add sp, sp, r6\n\t"
  2736. "mov r11, sp\n\t"
  2737. "mov r10, %[a]\n\t"
  2738. "\n1:\n\t"
  2739. "mov %[r], #0\n\t"
  2740. "mov r6, #124\n\t"
  2741. "mov %[a], r9\n\t"
  2742. "subs %[a], %[a], r6\n\t"
  2743. "sbc r6, r6, r6\n\t"
  2744. "mvn r6, r6\n\t"
  2745. "and %[a], %[a], r6\n\t"
  2746. "mov r2, r9\n\t"
  2747. "sub r2, r2, %[a]\n\t"
  2748. "add %[a], %[a], r10\n\t"
  2749. "add r2, r2, r10\n\t"
  2750. "\n2:\n\t"
  2751. "cmp r2, %[a]\n\t"
  2752. #ifdef __GNUC__
  2753. "beq 4f\n\t"
  2754. #else
  2755. "beq.n 4f\n\t"
  2756. #endif /* __GNUC__ */
  2757. /* Multiply * 2: Start */
  2758. "ldr r6, [%[a]]\n\t"
  2759. "ldr r8, [r2]\n\t"
  2760. "umull r6, r8, r6, r8\n\t"
  2761. "adds r3, r3, r6\n\t"
  2762. "adcs r4, r4, r8\n\t"
  2763. "adc r5, r5, %[r]\n\t"
  2764. "adds r3, r3, r6\n\t"
  2765. "adcs r4, r4, r8\n\t"
  2766. "adc r5, r5, %[r]\n\t"
  2767. /* Multiply * 2: Done */
  2768. #ifdef __GNUC__
  2769. "bal 5f\n\t"
  2770. #else
  2771. "bal.n 5f\n\t"
  2772. #endif /* __GNUC__ */
  2773. "\n4:\n\t"
  2774. /* Square: Start */
  2775. "ldr r6, [%[a]]\n\t"
  2776. "umull r6, r8, r6, r6\n\t"
  2777. "adds r3, r3, r6\n\t"
  2778. "adcs r4, r4, r8\n\t"
  2779. "adc r5, r5, %[r]\n\t"
  2780. /* Square: Done */
  2781. "\n5:\n\t"
  2782. "add %[a], %[a], #4\n\t"
  2783. "sub r2, r2, #4\n\t"
  2784. "mov r6, #128\n\t"
  2785. "add r6, r6, r10\n\t"
  2786. "cmp %[a], r6\n\t"
  2787. #ifdef __GNUC__
  2788. "beq 3f\n\t"
  2789. #else
  2790. "beq.n 3f\n\t"
  2791. #endif /* __GNUC__ */
  2792. "cmp %[a], r2\n\t"
  2793. #ifdef __GNUC__
  2794. "bgt 3f\n\t"
  2795. #else
  2796. "bgt.n 3f\n\t"
  2797. #endif /* __GNUC__ */
  2798. "mov r8, r9\n\t"
  2799. "add r8, r8, r10\n\t"
  2800. "cmp %[a], r8\n\t"
  2801. #ifdef __GNUC__
  2802. "ble 2b\n\t"
  2803. #else
  2804. "ble.n 2b\n\t"
  2805. #endif /* __GNUC__ */
  2806. "\n3:\n\t"
  2807. "mov %[r], r11\n\t"
  2808. "mov r8, r9\n\t"
  2809. "str r3, [%[r], r8]\n\t"
  2810. "mov r3, r4\n\t"
  2811. "mov r4, r5\n\t"
  2812. "mov r5, #0\n\t"
  2813. "add r8, r8, #4\n\t"
  2814. "mov r9, r8\n\t"
  2815. "mov r6, #248\n\t"
  2816. "cmp r8, r6\n\t"
  2817. #ifdef __GNUC__
  2818. "ble 1b\n\t"
  2819. #else
  2820. "ble.n 1b\n\t"
  2821. #endif /* __GNUC__ */
  2822. "mov %[a], r10\n\t"
  2823. "str r3, [%[r], r8]\n\t"
  2824. "mov %[r], r12\n\t"
  2825. "mov %[a], r11\n\t"
  2826. "mov r3, #252\n\t"
  2827. "\n4:\n\t"
  2828. "ldr r6, [%[a], r3]\n\t"
  2829. "str r6, [%[r], r3]\n\t"
  2830. "subs r3, r3, #4\n\t"
  2831. #ifdef __GNUC__
  2832. "bge 4b\n\t"
  2833. #else
  2834. "bge.n 4b\n\t"
  2835. #endif /* __GNUC__ */
  2836. "mov r6, #1\n\t"
  2837. "lsl r6, r6, #8\n\t"
  2838. "add sp, sp, r6\n\t"
  2839. :
  2840. : [r] "r" (r), [a] "r" (a)
  2841. : "memory", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12"
  2842. );
  2843. }
  2844. #endif /* WOLFSSL_SP_SMALL */
  2845. #endif /* (WOLFSSL_HAVE_SP_RSA & !WOLFSSL_RSA_PUBLIC_ONLY) | WOLFSSL_HAVE_SP_DH */
  2846. /* Caclulate the bottom digit of -1/a mod 2^n.
  2847. *
  2848. * a A single precision number.
  2849. * rho Bottom word of inverse.
  2850. */
  2851. static void sp_2048_mont_setup(const sp_digit* a, sp_digit* rho)
  2852. {
  2853. sp_digit x;
  2854. sp_digit b;
  2855. b = a[0];
  2856. x = (((b + 2) & 4) << 1) + b; /* here x*a==1 mod 2**4 */
  2857. x *= 2 - b * x; /* here x*a==1 mod 2**8 */
  2858. x *= 2 - b * x; /* here x*a==1 mod 2**16 */
  2859. x *= 2 - b * x; /* here x*a==1 mod 2**32 */
  2860. /* rho = -1/m mod b */
  2861. *rho = (sp_digit)0 - x;
  2862. }
  2863. /* Mul a by digit b into r. (r = a * b)
  2864. *
  2865. * r A single precision integer.
  2866. * a A single precision integer.
  2867. * b A single precision digit.
  2868. */
  2869. SP_NOINLINE static void sp_2048_mul_d_64(sp_digit* r, const sp_digit* a,
  2870. sp_digit b)
  2871. {
  2872. __asm__ __volatile__ (
  2873. "add r9, %[a], #256\n\t"
  2874. /* A[0] * B */
  2875. "ldr r6, [%[a]], #4\n\t"
  2876. "umull r5, r3, r6, %[b]\n\t"
  2877. "mov r4, #0\n\t"
  2878. "str r5, [%[r]], #4\n\t"
  2879. /* A[0] * B - Done */
  2880. "\n1:\n\t"
  2881. "mov r5, #0\n\t"
  2882. /* A[] * B */
  2883. "ldr r6, [%[a]], #4\n\t"
  2884. "umull r6, r8, r6, %[b]\n\t"
  2885. "adds r3, r3, r6\n\t"
  2886. "adcs r4, r4, r8\n\t"
  2887. "adc r5, r5, #0\n\t"
  2888. /* A[] * B - Done */
  2889. "str r3, [%[r]], #4\n\t"
  2890. "mov r3, r4\n\t"
  2891. "mov r4, r5\n\t"
  2892. "cmp %[a], r9\n\t"
  2893. #ifdef __GNUC__
  2894. "blt 1b\n\t"
  2895. #else
  2896. "blt.n 1b\n\t"
  2897. #endif /* __GNUC__ */
  2898. "str r3, [%[r]]\n\t"
  2899. : [r] "+r" (r), [a] "+r" (a)
  2900. : [b] "r" (b)
  2901. : "memory", "r3", "r4", "r5", "r6", "r8", "r9"
  2902. );
  2903. }
  2904. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || defined(WOLFSSL_HAVE_SP_DH)
  2905. /* r = 2^n mod m where n is the number of bits to reduce by.
  2906. * Given m must be 2048 bits, just need to subtract.
  2907. *
  2908. * r A single precision number.
  2909. * m A single precision number.
  2910. */
  2911. static void sp_2048_mont_norm_32(sp_digit* r, const sp_digit* m)
  2912. {
  2913. XMEMSET(r, 0, sizeof(sp_digit) * 32);
  2914. /* r = 2^n mod m */
  2915. sp_2048_sub_in_place_32(r, m);
  2916. }
  2917. /* Conditionally subtract b from a using the mask m.
  2918. * m is -1 to subtract and 0 when not copying.
  2919. *
  2920. * r A single precision number representing condition subtract result.
  2921. * a A single precision number to subtract from.
  2922. * b A single precision number to subtract.
  2923. * m Mask value to apply.
  2924. */
  2925. SP_NOINLINE static sp_digit sp_2048_cond_sub_32(sp_digit* r, const sp_digit* a,
  2926. const sp_digit* b, sp_digit m)
  2927. {
  2928. sp_digit c = 0;
  2929. __asm__ __volatile__ (
  2930. "mov r5, #128\n\t"
  2931. "mov r9, r5\n\t"
  2932. "mov r8, #0\n\t"
  2933. "\n1:\n\t"
  2934. "ldr r6, [%[b], r8]\n\t"
  2935. "and r6, r6, %[m]\n\t"
  2936. "mov r5, #0\n\t"
  2937. "subs r5, r5, %[c]\n\t"
  2938. "ldr r5, [%[a], r8]\n\t"
  2939. "sbcs r5, r5, r6\n\t"
  2940. "sbcs %[c], %[c], %[c]\n\t"
  2941. "str r5, [%[r], r8]\n\t"
  2942. "add r8, r8, #4\n\t"
  2943. "cmp r8, r9\n\t"
  2944. #ifdef __GNUC__
  2945. "blt 1b\n\t"
  2946. #else
  2947. "blt.n 1b\n\t"
  2948. #endif /* __GNUC__ */
  2949. : [c] "+r" (c)
  2950. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  2951. : "memory", "r5", "r6", "r8", "r9"
  2952. );
  2953. return c;
  2954. }
  2955. /* Reduce the number back to 2048 bits using Montgomery reduction.
  2956. *
  2957. * a A single precision number to reduce in place.
  2958. * m The single precision number representing the modulus.
  2959. * mp The digit representing the negative inverse of m mod 2^n.
  2960. */
  2961. SP_NOINLINE static void sp_2048_mont_reduce_32(sp_digit* a, const sp_digit* m,
  2962. sp_digit mp)
  2963. {
  2964. sp_digit ca = 0;
  2965. __asm__ __volatile__ (
  2966. "mov r9, %[mp]\n\t"
  2967. "mov r12, %[m]\n\t"
  2968. "mov r10, %[a]\n\t"
  2969. "mov r4, #0\n\t"
  2970. "add r11, r10, #128\n\t"
  2971. "\n1:\n\t"
  2972. /* mu = a[i] * mp */
  2973. "mov %[mp], r9\n\t"
  2974. "ldr %[a], [r10]\n\t"
  2975. "mul %[mp], %[mp], %[a]\n\t"
  2976. "mov %[m], r12\n\t"
  2977. "add r14, r10, #120\n\t"
  2978. "\n2:\n\t"
  2979. /* a[i+j] += m[j] * mu */
  2980. "ldr %[a], [r10]\n\t"
  2981. "mov r5, #0\n\t"
  2982. /* Multiply m[j] and mu - Start */
  2983. "ldr r8, [%[m]], #4\n\t"
  2984. "umull r6, r8, %[mp], r8\n\t"
  2985. "adds %[a], %[a], r6\n\t"
  2986. "adc r5, r5, r8\n\t"
  2987. /* Multiply m[j] and mu - Done */
  2988. "adds r4, r4, %[a]\n\t"
  2989. "adc r5, r5, #0\n\t"
  2990. "str r4, [r10], #4\n\t"
  2991. /* a[i+j+1] += m[j+1] * mu */
  2992. "ldr %[a], [r10]\n\t"
  2993. "mov r4, #0\n\t"
  2994. /* Multiply m[j] and mu - Start */
  2995. "ldr r8, [%[m]], #4\n\t"
  2996. "umull r6, r8, %[mp], r8\n\t"
  2997. "adds %[a], %[a], r6\n\t"
  2998. "adc r4, r4, r8\n\t"
  2999. /* Multiply m[j] and mu - Done */
  3000. "adds r5, r5, %[a]\n\t"
  3001. "adc r4, r4, #0\n\t"
  3002. "str r5, [r10], #4\n\t"
  3003. "cmp r10, r14\n\t"
  3004. #ifdef __GNUC__
  3005. "blt 2b\n\t"
  3006. #else
  3007. "blt.n 2b\n\t"
  3008. #endif /* __GNUC__ */
  3009. /* a[i+30] += m[30] * mu */
  3010. "ldr %[a], [r10]\n\t"
  3011. "mov r5, #0\n\t"
  3012. /* Multiply m[j] and mu - Start */
  3013. "ldr r8, [%[m]], #4\n\t"
  3014. "umull r6, r8, %[mp], r8\n\t"
  3015. "adds %[a], %[a], r6\n\t"
  3016. "adc r5, r5, r8\n\t"
  3017. /* Multiply m[j] and mu - Done */
  3018. "adds r4, r4, %[a]\n\t"
  3019. "adc r5, r5, #0\n\t"
  3020. "str r4, [r10], #4\n\t"
  3021. /* a[i+31] += m[31] * mu */
  3022. "mov r4, %[ca]\n\t"
  3023. "mov %[ca], #0\n\t"
  3024. /* Multiply m[31] and mu - Start */
  3025. "ldr r8, [%[m]]\n\t"
  3026. "umull r6, r8, %[mp], r8\n\t"
  3027. "adds r5, r5, r6\n\t"
  3028. "adcs r4, r4, r8\n\t"
  3029. "adc %[ca], %[ca], #0\n\t"
  3030. /* Multiply m[31] and mu - Done */
  3031. "ldr r6, [r10]\n\t"
  3032. "ldr r8, [r10, #4]\n\t"
  3033. "adds r6, r6, r5\n\t"
  3034. "adcs r8, r8, r4\n\t"
  3035. "adc %[ca], %[ca], #0\n\t"
  3036. "str r6, [r10]\n\t"
  3037. "str r8, [r10, #4]\n\t"
  3038. /* Next word in a */
  3039. "sub r10, r10, #120\n\t"
  3040. "cmp r10, r11\n\t"
  3041. #ifdef __GNUC__
  3042. "blt 1b\n\t"
  3043. #else
  3044. "blt.n 1b\n\t"
  3045. #endif /* __GNUC__ */
  3046. "mov %[a], r10\n\t"
  3047. "mov %[m], r12\n\t"
  3048. : [ca] "+r" (ca), [a] "+r" (a)
  3049. : [m] "r" (m), [mp] "r" (mp)
  3050. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  3051. );
  3052. sp_2048_cond_sub_32(a - 32, a, m, (sp_digit)0 - ca);
  3053. }
  3054. /* Multiply two Montgomery form numbers mod the modulus (prime).
  3055. * (r = a * b mod m)
  3056. *
  3057. * r Result of multiplication.
  3058. * a First number to multiply in Montgomery form.
  3059. * b Second number to multiply in Montgomery form.
  3060. * m Modulus (prime).
  3061. * mp Montgomery mulitplier.
  3062. */
  3063. SP_NOINLINE static void sp_2048_mont_mul_32(sp_digit* r, const sp_digit* a,
  3064. const sp_digit* b, const sp_digit* m, sp_digit mp)
  3065. {
  3066. sp_2048_mul_32(r, a, b);
  3067. sp_2048_mont_reduce_32(r, m, mp);
  3068. }
  3069. /* Square the Montgomery form number. (r = a * a mod m)
  3070. *
  3071. * r Result of squaring.
  3072. * a Number to square in Montgomery form.
  3073. * m Modulus (prime).
  3074. * mp Montgomery mulitplier.
  3075. */
  3076. SP_NOINLINE static void sp_2048_mont_sqr_32(sp_digit* r, const sp_digit* a,
  3077. const sp_digit* m, sp_digit mp)
  3078. {
  3079. sp_2048_sqr_32(r, a);
  3080. sp_2048_mont_reduce_32(r, m, mp);
  3081. }
  3082. /* Mul a by digit b into r. (r = a * b)
  3083. *
  3084. * r A single precision integer.
  3085. * a A single precision integer.
  3086. * b A single precision digit.
  3087. */
  3088. SP_NOINLINE static void sp_2048_mul_d_32(sp_digit* r, const sp_digit* a,
  3089. sp_digit b)
  3090. {
  3091. __asm__ __volatile__ (
  3092. "add r9, %[a], #128\n\t"
  3093. /* A[0] * B */
  3094. "ldr r6, [%[a]], #4\n\t"
  3095. "umull r5, r3, r6, %[b]\n\t"
  3096. "mov r4, #0\n\t"
  3097. "str r5, [%[r]], #4\n\t"
  3098. /* A[0] * B - Done */
  3099. "\n1:\n\t"
  3100. "mov r5, #0\n\t"
  3101. /* A[] * B */
  3102. "ldr r6, [%[a]], #4\n\t"
  3103. "umull r6, r8, r6, %[b]\n\t"
  3104. "adds r3, r3, r6\n\t"
  3105. "adcs r4, r4, r8\n\t"
  3106. "adc r5, r5, #0\n\t"
  3107. /* A[] * B - Done */
  3108. "str r3, [%[r]], #4\n\t"
  3109. "mov r3, r4\n\t"
  3110. "mov r4, r5\n\t"
  3111. "cmp %[a], r9\n\t"
  3112. #ifdef __GNUC__
  3113. "blt 1b\n\t"
  3114. #else
  3115. "blt.n 1b\n\t"
  3116. #endif /* __GNUC__ */
  3117. "str r3, [%[r]]\n\t"
  3118. : [r] "+r" (r), [a] "+r" (a)
  3119. : [b] "r" (b)
  3120. : "memory", "r3", "r4", "r5", "r6", "r8", "r9"
  3121. );
  3122. }
  3123. /* Divide the double width number (d1|d0) by the divisor. (d1|d0 / div)
  3124. *
  3125. * d1 The high order half of the number to divide.
  3126. * d0 The low order half of the number to divide.
  3127. * div The divisor.
  3128. * returns the result of the division.
  3129. *
  3130. * Note that this is an approximate div. It may give an answer 1 larger.
        *
        * The quotient is built up in r8 from a series of estimates made with the
        * trial divisor (div >> 16) + 1; after each estimate the matching multiple
        * of div is subtracted from d1|d0.
        *
        * The assembly overwrites d1 and d0 and changes the condition flags, so both
        * values are declared as read/write operands and "cc" is listed as a
        * clobber.
  3131. */
  3132. SP_NOINLINE static sp_digit div_2048_word_32(sp_digit d1, sp_digit d0,
  3133. sp_digit div)
  3134. {
  3135. sp_digit r = 0;
  3136. __asm__ __volatile__ (
        /* r6 = trial divisor: top 16 bits of div, plus one. */
  3137. "lsr r6, %[div], #16\n\t"
  3138. "add r6, r6, #1\n\t"
        /* First estimate from d1, placed in the upper 16 bits of r8. */
  3139. "udiv r4, %[d1], r6\n\t"
  3140. "lsl r8, r4, #16\n\t"
        /* d1|d0 -= div * estimate */
  3141. "umull r4, r5, %[div], r8\n\t"
  3142. "subs %[d0], %[d0], r4\n\t"
  3143. "sbc %[d1], %[d1], r5\n\t"
        /* Second estimate from the reduced d1, again shifted up 16 bits. */
  3144. "udiv r5, %[d1], r6\n\t"
  3145. "lsl r4, r5, #16\n\t"
  3146. "add r8, r8, r4\n\t"
  3147. "umull r4, r5, %[div], r4\n\t"
  3148. "subs %[d0], %[d0], r4\n\t"
  3149. "sbc %[d1], %[d1], r5\n\t"
        /* Third estimate from the middle 32 bits of d1|d0. */
  3150. "lsl r4, %[d1], #16\n\t"
  3151. "orr r4, r4, %[d0], lsr #16\n\t"
  3152. "udiv r4, r4, r6\n\t"
  3153. "add r8, r8, r4\n\t"
  3154. "umull r4, r5, %[div], r4\n\t"
  3155. "subs %[d0], %[d0], r4\n\t"
  3156. "sbc %[d1], %[d1], r5\n\t"
        /* Fourth estimate, same form as the third. */
  3157. "lsl r4, %[d1], #16\n\t"
  3158. "orr r4, r4, %[d0], lsr #16\n\t"
  3159. "udiv r4, r4, r6\n\t"
  3160. "add r8, r8, r4\n\t"
  3161. "umull r4, r5, %[div], r4\n\t"
  3162. "subs %[d0], %[d0], r4\n\t"
  3163. "sbc %[d1], %[d1], r5\n\t"
        /* Last step divides what is left in d0 by the full divisor. */
  3164. "udiv r4, %[d0], %[div]\n\t"
  3165. "add r8, r8, r4\n\t"
  3166. "mov %[r], r8\n\t"
  3167. : [r] "+r" (r), [d1] "+r" (d1), [d0] "+r" (d0)
  3168. : [div] "r" (div)
  3169. : "r4", "r5", "r6", "r8", "cc"
  3170. );
  3171. return r;
  3172. }
  3173. /* Compare a with b in constant time.
  3174. *
  3175. * a A single precision integer.
  3176. * b A single precision integer.
  3177. * return -ve, 0 or +ve if a is less than, equal to or greater than b
  3178. * respectively.
        *
        * All 32 words are always visited, from the most significant (byte offset
        * 124) down to offset 0. r3 is a mask that starts as all ones and is cleared
        * at the first word where a and b differ, so later words compare as equal.
        *
        * The assembly reads memory through a and b and changes the condition flags,
        * so "memory" and "cc" are listed as clobbers.
  3179. */
  3180. SP_NOINLINE static sp_int32 sp_2048_cmp_32(const sp_digit* a, const sp_digit* b)
  3181. {
  3182. sp_digit r = 0;
  3183. __asm__ __volatile__ (
        /* r3 = all ones: no difference found yet. */
  3184. "mov r3, #0\n\t"
  3185. "mvn r3, r3\n\t"
  3186. "mov r6, #124\n\t"
  3187. "\n1:\n\t"
  3188. "ldr r8, [%[a], r6]\n\t"
  3189. "ldr r5, [%[b], r6]\n\t"
  3190. "and r8, r8, r3\n\t"
  3191. "and r5, r5, r3\n\t"
  3192. "mov r4, r8\n\t"
        /* r8 = -1 when the a word is below the b word, else 0; added to r. */
  3193. "subs r8, r8, r5\n\t"
  3194. "sbc r8, r8, r8\n\t"
  3195. "add %[r], %[r], r8\n\t"
  3196. "mvn r8, r8\n\t"
  3197. "and r3, r3, r8\n\t"
        /* r8 = -1 when the b word is below the a word, else 0; subtracted from r. */
  3198. "subs r5, r5, r4\n\t"
  3199. "sbc r8, r8, r8\n\t"
  3200. "sub %[r], %[r], r8\n\t"
  3201. "mvn r8, r8\n\t"
  3202. "and r3, r3, r8\n\t"
  3203. "sub r6, r6, #4\n\t"
  3204. "cmp r6, #0\n\t"
  3205. #ifdef __GNUC__
  3206. "bge 1b\n\t"
  3207. #else
  3208. "bge.n 1b\n\t"
  3209. #endif /* __GNUC__ */
  3210. : [r] "+r" (r)
  3211. : [a] "r" (a), [b] "r" (b)
  3212. : "memory", "r3", "r4", "r5", "r6", "r8", "cc"
  3213. );
  3214. return r;
  3215. }
  3216. /* Divide d in a and put remainder into r (m*d + r = a)
  3217. * m is not calculated as it is not needed at this time.
  3218. *
  3219. * a Number to be divided.
        *   64 words are read.
  3220. * d Number to divide with.
        *   32 words; d[31] is used as the divisor word for quotient estimates.
  3221. * m Multiplier result.
        *   Unused.
  3222. * r Remainder from the division.
        *   32 words are written.
  3223. * returns MP_OKAY indicating success.
        *
        * Corrections are applied with masks and conditional subtract/add helpers
        * rather than with branches on the data.
  3224. */
  3225. static WC_INLINE int sp_2048_div_32(const sp_digit* a, const sp_digit* d, sp_digit* m,
  3226. sp_digit* r)
  3227. {
  3228. sp_digit t1[64], t2[33];
  3229. sp_digit div, r1;
  3230. int i;
  3231. (void)m;
  3232. div = d[31];
        /* Work on a copy of a so the input is left untouched. */
  3233. XMEMCPY(t1, a, sizeof(*t1) * 2 * 32);
        /* Subtract d from the top half when the top half is not below d. */
  3234. r1 = sp_2048_cmp_32(&t1[32], d) >= 0;
  3235. sp_2048_cond_sub_32(&t1[32], &t1[32], d, (sp_digit)0 - r1);
  3236. for (i = 31; i >= 0; i--) {
        /* mask is all ones when the top word equals div; in that case the
         * estimate is made from top word - 1 and then forced to all ones. */
  3237. sp_digit mask = 0 - (t1[32 + i] == div);
  3238. sp_digit hi = t1[32 + i] + mask;
  3239. r1 = div_2048_word_32(hi, t1[32 + i - 1], div);
  3240. r1 |= mask;
        /* t2 = d * r1 (33 words), subtracted from the current window of t1. */
  3241. sp_2048_mul_d_32(t2, d, r1);
  3242. t1[32 + i] += sp_2048_sub_in_place_32(&t1[i], t2);
  3243. t1[32 + i] -= t2[32];
        /* Add d back, selected by the top word used as a mask; done twice.
         * NOTE(review): presumably the top word is 0 or all ones here -
         * sp_2048_sub_in_place_32 is not visible, confirm its return value. */
  3244. sp_2048_mask_32(t2, d, t1[32 + i]);
  3245. t1[32 + i] += sp_2048_add_32(&t1[i], &t1[i], t2);
  3246. sp_2048_mask_32(t2, d, t1[32 + i]);
  3247. t1[32 + i] += sp_2048_add_32(&t1[i], &t1[i], t2);
  3248. }
        /* Final conditional subtract of d, with the result written to r. */
  3249. r1 = sp_2048_cmp_32(t1, d) >= 0;
  3250. sp_2048_cond_sub_32(r, t1, d, (sp_digit)0 - r1);
  3251. return MP_OKAY;
  3252. }
  3253. /* Reduce a modulo m into r. (r = a mod m)
  3254. *
  3255. * r A single precision number that is the reduced result.
  3256. * a A single precision number that is to be reduced.
        *   Passed straight to sp_2048_div_32, which reads 64 words from it.
  3257. * m A single precision number that is the modulus to reduce with.
  3258. * returns MP_OKAY indicating success.
  3259. */
  3260. static WC_INLINE int sp_2048_mod_32(sp_digit* r, const sp_digit* a, const sp_digit* m)
  3261. {
        /* Only the remainder is wanted, so no quotient buffer is supplied. */
  3262. return sp_2048_div_32(a, m, NULL, r);
  3263. }
  3264. #ifdef WOLFSSL_SP_SMALL
  3265. /* Modular exponentiate a to the e mod m. (r = a^e mod m)
  3266. *
  3267. * r A single precision number that is the result of the operation.
        *   Used as a 64 word work area; the result is in the low 32 words.
  3268. * a A single precision number being exponentiated.
        *   64 words are read when reduceA is not 0, otherwise 32 words.
  3269. * e A single precision number that is the exponent.
  3270. * bits The number of bits in the exponent.
  3271. * m A single precision number that is the modulus.
        * reduceA When not 0, a is reduced modulo m before use.
  3272. * returns 0 on success.
  3273. * returns MEMORY_E on dynamic memory allocation failure.
  3274. * returns MP_VAL when bits is 0.
        *
        * Uses a table of 16 powers of a in Montgomery form and consumes the
        * exponent 4 bits at a time, most significant bits first.
  3275. */
  3276. static int sp_2048_mod_exp_32(sp_digit* r, const sp_digit* a, const sp_digit* e,
  3277. int bits, const sp_digit* m, int reduceA)
  3278. {
  3279. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  3280. sp_digit* td = NULL;
  3281. #else
  3282. sp_digit td[16 * 64];
  3283. #endif
  3284. sp_digit* t[16];
  3285. sp_digit* norm = NULL;
  3286. sp_digit mp = 1;
  3287. sp_digit n;
  3288. sp_digit mask;
  3289. int i;
  3290. int c;
  3291. byte y;
  3292. int err = MP_OKAY;
  3293. if (bits == 0) {
  3294. err = MP_VAL;
  3295. }
  3296. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  3297. if (err == MP_OKAY) {
  3298. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * (16 * 64), NULL,
  3299. DYNAMIC_TYPE_TMP_BUFFER);
  3300. if (td == NULL)
  3301. err = MEMORY_E;
  3302. }
  3303. #endif
  3304. if (err == MP_OKAY) {
        /* t[i] is the i-th 64 word slot of td; norm shares slot 0. */
  3305. norm = td;
  3306. for (i=0; i<16; i++) {
  3307. t[i] = td + i * 64;
  3308. }
  3309. sp_2048_mont_setup(m, &mp);
  3310. sp_2048_mont_norm_32(norm, m);
        /* t[1] = (a with 32 zero words below it) mod m. */
  3311. XMEMSET(t[1], 0, sizeof(sp_digit) * 32U);
  3312. if (reduceA != 0) {
  3313. err = sp_2048_mod_32(t[1] + 32, a, m);
  3314. if (err == MP_OKAY) {
  3315. err = sp_2048_mod_32(t[1], t[1], m);
  3316. }
  3317. }
  3318. else {
  3319. XMEMCPY(t[1] + 32, a, sizeof(sp_digit) * 32);
  3320. err = sp_2048_mod_32(t[1], t[1], m);
  3321. }
  3322. }
  3323. if (err == MP_OKAY) {
        /* Fill the table: t[k] is built from lower entries so that it holds the
         * k-th power of t[1]. */
  3324. sp_2048_mont_sqr_32(t[ 2], t[ 1], m, mp);
  3325. sp_2048_mont_mul_32(t[ 3], t[ 2], t[ 1], m, mp);
  3326. sp_2048_mont_sqr_32(t[ 4], t[ 2], m, mp);
  3327. sp_2048_mont_mul_32(t[ 5], t[ 3], t[ 2], m, mp);
  3328. sp_2048_mont_sqr_32(t[ 6], t[ 3], m, mp);
  3329. sp_2048_mont_mul_32(t[ 7], t[ 4], t[ 3], m, mp);
  3330. sp_2048_mont_sqr_32(t[ 8], t[ 4], m, mp);
  3331. sp_2048_mont_mul_32(t[ 9], t[ 5], t[ 4], m, mp);
  3332. sp_2048_mont_sqr_32(t[10], t[ 5], m, mp);
  3333. sp_2048_mont_mul_32(t[11], t[ 6], t[ 5], m, mp);
  3334. sp_2048_mont_sqr_32(t[12], t[ 6], m, mp);
  3335. sp_2048_mont_mul_32(t[13], t[ 7], t[ 6], m, mp);
  3336. sp_2048_mont_sqr_32(t[14], t[ 7], m, mp);
  3337. sp_2048_mont_mul_32(t[15], t[ 8], t[ 7], m, mp);
        /* Start at the top exponent word. c becomes the number of bits of n
         * still to be used after the first window is taken. */
  3338. i = (bits - 1) / 32;
  3339. n = e[i--];
  3340. c = bits & 31;
  3341. if (c == 0) {
  3342. c = 32;
  3343. }
  3344. c -= bits % 4;
  3345. if (c == 32) {
  3346. c = 28;
  3347. }
  3348. if (c < 0) {
  3349. /* Number of bits in top word is less than number needed. */
        /* Exponent words are 32 bits wide, so the part taken from the next
         * word is shifted by 32 - c, as in the loop below. With a 4-bit
         * window this branch is not expected to be taken (32 is a multiple
         * of 4), but it is kept correct for 32-bit words. */
  3350. c = -c;
  3351. y = (byte)(n << c);
  3352. n = e[i--];
  3353. y |= (byte)(n >> (32 - c));
  3354. n <<= c;
  3355. c = 32 - c;
  3356. }
  3357. else if (c == 0) {
  3358. /* All bits in top word used. */
  3359. y = (byte)n;
  3360. }
  3361. else {
  3362. y = (byte)(n >> c);
  3363. n <<= 32 - c;
  3364. }
  3365. XMEMCPY(r, t[y], sizeof(sp_digit) * 32);
  3366. for (; i>=0 || c>=4; ) {
        /* Pick the next 4-bit window y; it may straddle two exponent words. */
  3367. if (c == 0) {
  3368. n = e[i--];
  3369. y = (byte)(n >> 28);
  3370. n <<= 4;
  3371. c = 28;
  3372. }
  3373. else if (c < 4) {
  3374. y = (byte)(n >> 28);
  3375. n = e[i--];
  3376. c = 4 - c;
  3377. y |= (byte)(n >> (32 - c));
  3378. n <<= c;
  3379. c = 32 - c;
  3380. }
  3381. else {
  3382. y = (byte)((n >> 28) & 0xf);
  3383. n <<= 4;
  3384. c -= 4;
  3385. }
        /* Four squarings, then one multiply by the table entry for y. */
  3386. sp_2048_mont_sqr_32(r, r, m, mp);
  3387. sp_2048_mont_sqr_32(r, r, m, mp);
  3388. sp_2048_mont_sqr_32(r, r, m, mp);
  3389. sp_2048_mont_sqr_32(r, r, m, mp);
  3390. sp_2048_mont_mul_32(r, r, t[y], m, mp);
  3391. }
        /* Clear the top half and run one more Montgomery reduction, then make
         * sure the result is below m. */
  3392. XMEMSET(&r[32], 0, sizeof(sp_digit) * 32U);
  3393. sp_2048_mont_reduce_32(r, m, mp);
  3394. mask = 0 - (sp_2048_cmp_32(r, m) >= 0);
  3395. sp_2048_cond_sub_32(r, r, m, mask);
  3396. }
  3397. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  3398. if (td != NULL)
  3399. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  3400. #endif
  3401. return err;
  3402. }
  3403. #else
  3404. /* Modular exponentiate a to the e mod m. (r = a^e mod m)
  3405. *
  3406. * r A single precision number that is the result of the operation.
        *   Used as a 64 word work area; the result is in the low 32 words.
  3407. * a A single precision number being exponentiated.
        *   64 words are read when reduceA is not 0, otherwise 32 words.
  3408. * e A single precision number that is the exponent.
  3409. * bits The number of bits in the exponent.
  3410. * m A single precision number that is the modulus.
        * reduceA When not 0, a is reduced modulo m before use.
  3411. * returns 0 on success.
  3412. * returns MEMORY_E on dynamic memory allocation failure.
  3413. * returns MP_VAL when bits is 0.
        *
        * Uses a table of 32 powers of a in Montgomery form and consumes the
        * exponent 5 bits at a time, most significant bits first.
  3414. */
  3415. static int sp_2048_mod_exp_32(sp_digit* r, const sp_digit* a, const sp_digit* e,
  3416. int bits, const sp_digit* m, int reduceA)
  3417. {
  3418. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  3419. sp_digit* td = NULL;
  3420. #else
  3421. sp_digit td[32 * 64];
  3422. #endif
  3423. sp_digit* t[32];
  3424. sp_digit* norm = NULL;
  3425. sp_digit mp = 1;
  3426. sp_digit n;
  3427. sp_digit mask;
  3428. int i;
  3429. int c;
  3430. byte y;
  3431. int err = MP_OKAY;
  3432. if (bits == 0) {
  3433. err = MP_VAL;
  3434. }
  3435. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  3436. if (err == MP_OKAY) {
  3437. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * (32 * 64), NULL,
  3438. DYNAMIC_TYPE_TMP_BUFFER);
  3439. if (td == NULL)
  3440. err = MEMORY_E;
  3441. }
  3442. #endif
  3443. if (err == MP_OKAY) {
        /* t[i] is the i-th 64 word slot of td; norm shares slot 0. */
  3444. norm = td;
  3445. for (i=0; i<32; i++) {
  3446. t[i] = td + i * 64;
  3447. }
  3448. sp_2048_mont_setup(m, &mp);
  3449. sp_2048_mont_norm_32(norm, m);
        /* t[1] = (a with 32 zero words below it) mod m. */
  3450. XMEMSET(t[1], 0, sizeof(sp_digit) * 32U);
  3451. if (reduceA != 0) {
  3452. err = sp_2048_mod_32(t[1] + 32, a, m);
  3453. if (err == MP_OKAY) {
  3454. err = sp_2048_mod_32(t[1], t[1], m);
  3455. }
  3456. }
  3457. else {
  3458. XMEMCPY(t[1] + 32, a, sizeof(sp_digit) * 32);
  3459. err = sp_2048_mod_32(t[1], t[1], m);
  3460. }
  3461. }
  3462. if (err == MP_OKAY) {
        /* Fill the table: t[k] is built from lower entries so that it holds the
         * k-th power of t[1]. */
  3463. sp_2048_mont_sqr_32(t[ 2], t[ 1], m, mp);
  3464. sp_2048_mont_mul_32(t[ 3], t[ 2], t[ 1], m, mp);
  3465. sp_2048_mont_sqr_32(t[ 4], t[ 2], m, mp);
  3466. sp_2048_mont_mul_32(t[ 5], t[ 3], t[ 2], m, mp);
  3467. sp_2048_mont_sqr_32(t[ 6], t[ 3], m, mp);
  3468. sp_2048_mont_mul_32(t[ 7], t[ 4], t[ 3], m, mp);
  3469. sp_2048_mont_sqr_32(t[ 8], t[ 4], m, mp);
  3470. sp_2048_mont_mul_32(t[ 9], t[ 5], t[ 4], m, mp);
  3471. sp_2048_mont_sqr_32(t[10], t[ 5], m, mp);
  3472. sp_2048_mont_mul_32(t[11], t[ 6], t[ 5], m, mp);
  3473. sp_2048_mont_sqr_32(t[12], t[ 6], m, mp);
  3474. sp_2048_mont_mul_32(t[13], t[ 7], t[ 6], m, mp);
  3475. sp_2048_mont_sqr_32(t[14], t[ 7], m, mp);
  3476. sp_2048_mont_mul_32(t[15], t[ 8], t[ 7], m, mp);
  3477. sp_2048_mont_sqr_32(t[16], t[ 8], m, mp);
  3478. sp_2048_mont_mul_32(t[17], t[ 9], t[ 8], m, mp);
  3479. sp_2048_mont_sqr_32(t[18], t[ 9], m, mp);
  3480. sp_2048_mont_mul_32(t[19], t[10], t[ 9], m, mp);
  3481. sp_2048_mont_sqr_32(t[20], t[10], m, mp);
  3482. sp_2048_mont_mul_32(t[21], t[11], t[10], m, mp);
  3483. sp_2048_mont_sqr_32(t[22], t[11], m, mp);
  3484. sp_2048_mont_mul_32(t[23], t[12], t[11], m, mp);
  3485. sp_2048_mont_sqr_32(t[24], t[12], m, mp);
  3486. sp_2048_mont_mul_32(t[25], t[13], t[12], m, mp);
  3487. sp_2048_mont_sqr_32(t[26], t[13], m, mp);
  3488. sp_2048_mont_mul_32(t[27], t[14], t[13], m, mp);
  3489. sp_2048_mont_sqr_32(t[28], t[14], m, mp);
  3490. sp_2048_mont_mul_32(t[29], t[15], t[14], m, mp);
  3491. sp_2048_mont_sqr_32(t[30], t[15], m, mp);
  3492. sp_2048_mont_mul_32(t[31], t[16], t[15], m, mp);
        /* Start at the top exponent word. c becomes the number of bits of n
         * still to be used after the first window is taken. */
  3493. i = (bits - 1) / 32;
  3494. n = e[i--];
  3495. c = bits & 31;
  3496. if (c == 0) {
  3497. c = 32;
  3498. }
  3499. c -= bits % 5;
  3500. if (c == 32) {
  3501. c = 27;
  3502. }
  3503. if (c < 0) {
  3504. /* Number of bits in top word is less than number needed. */
        /* Reached for example with bits = 33 (1 bit in the top word, first
         * window of 3 bits). Exponent words are 32 bits wide, so the part
         * taken from the next word is shifted by 32 - c and 32 - c bits of
         * that word remain, as in the loop below. */
  3505. c = -c;
  3506. y = (byte)(n << c);
  3507. n = e[i--];
  3508. y |= (byte)(n >> (32 - c));
  3509. n <<= c;
  3510. c = 32 - c;
  3511. }
  3512. else if (c == 0) {
  3513. /* All bits in top word used. */
  3514. y = (byte)n;
  3515. }
  3516. else {
  3517. y = (byte)(n >> c);
  3518. n <<= 32 - c;
  3519. }
  3520. XMEMCPY(r, t[y], sizeof(sp_digit) * 32);
  3521. for (; i>=0 || c>=5; ) {
        /* Pick the next 5-bit window y; it may straddle two exponent words. */
  3522. if (c == 0) {
  3523. n = e[i--];
  3524. y = (byte)(n >> 27);
  3525. n <<= 5;
  3526. c = 27;
  3527. }
  3528. else if (c < 5) {
  3529. y = (byte)(n >> 27);
  3530. n = e[i--];
  3531. c = 5 - c;
  3532. y |= (byte)(n >> (32 - c));
  3533. n <<= c;
  3534. c = 32 - c;
  3535. }
  3536. else {
  3537. y = (byte)((n >> 27) & 0x1f);
  3538. n <<= 5;
  3539. c -= 5;
  3540. }
        /* Five squarings, then one multiply by the table entry for y. */
  3541. sp_2048_mont_sqr_32(r, r, m, mp);
  3542. sp_2048_mont_sqr_32(r, r, m, mp);
  3543. sp_2048_mont_sqr_32(r, r, m, mp);
  3544. sp_2048_mont_sqr_32(r, r, m, mp);
  3545. sp_2048_mont_sqr_32(r, r, m, mp);
  3546. sp_2048_mont_mul_32(r, r, t[y], m, mp);
  3547. }
        /* Clear the top half and run one more Montgomery reduction, then make
         * sure the result is below m. */
  3548. XMEMSET(&r[32], 0, sizeof(sp_digit) * 32U);
  3549. sp_2048_mont_reduce_32(r, m, mp);
  3550. mask = 0 - (sp_2048_cmp_32(r, m) >= 0);
  3551. sp_2048_cond_sub_32(r, r, m, mask);
  3552. }
  3553. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  3554. if (td != NULL)
  3555. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  3556. #endif
  3557. return err;
  3558. }
  3559. #endif /* WOLFSSL_SP_SMALL */
  3560. #endif /* (WOLFSSL_HAVE_SP_RSA & !WOLFSSL_RSA_PUBLIC_ONLY) | WOLFSSL_HAVE_SP_DH */
  3561. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || defined(WOLFSSL_HAVE_SP_DH)
  3562. /* r = 2^n mod m where n is the number of bits to reduce by.
  3563. * Given m must be 2048 bits, just need to subtract.
  3564. *
  3565. * r A single precision number.
        *   64 words are written.
  3566. * m A single precision number.
  3567. */
  3568. static void sp_2048_mont_norm_64(sp_digit* r, const sp_digit* m)
  3569. {
        /* Start from zero so the in-place subtract leaves 0 - m in the 64 words. */
  3570. XMEMSET(r, 0, sizeof(sp_digit) * 64);
  3571. /* r = 2^n mod m */
  3572. sp_2048_sub_in_place_64(r, m);
  3573. }
  3574. #endif /* (WOLFSSL_HAVE_SP_RSA & !WOLFSSL_RSA_PUBLIC_ONLY) | WOLFSSL_HAVE_SP_DH */
  3575. /* Conditionally subtract b from a using the mask m.
  3576. * m is -1 to subtract and 0 to leave a unchanged (r is then a copy of a).
  3577. *
  3578. * r A single precision number representing condition subtract result.
  3579. * a A single precision number to subtract from.
  3580. * b A single precision number to subtract.
  3581. * m Mask value to apply.
        * returns 0 when there was no borrow out of the top word, all ones otherwise.
        *
        * 64 words (256 bytes) are processed. The borrow is kept in c between
        * iterations because the loop compare overwrites the flags. The condition
        * flags are changed, so "cc" is listed as a clobber.
  3582. */
  3583. SP_NOINLINE static sp_digit sp_2048_cond_sub_64(sp_digit* r, const sp_digit* a,
  3584. const sp_digit* b, sp_digit m)
  3585. {
  3586. sp_digit c = 0;
  3587. __asm__ __volatile__ (
        /* r9 = 256, the byte length to process; r8 = running byte offset. */
  3588. "mov r5, #1\n\t"
  3589. "lsl r5, r5, #8\n\t"
  3590. "mov r9, r5\n\t"
  3591. "mov r8, #0\n\t"
  3592. "\n1:\n\t"
        /* r6 = word of b, or 0 when the mask is 0. */
  3593. "ldr r6, [%[b], r8]\n\t"
  3594. "and r6, r6, %[m]\n\t"
        /* 0 - c puts the saved borrow back into the carry flag. */
  3595. "mov r5, #0\n\t"
  3596. "subs r5, r5, %[c]\n\t"
  3597. "ldr r5, [%[a], r8]\n\t"
  3598. "sbcs r5, r5, r6\n\t"
        /* c = 0 when no borrow, all ones when there was a borrow. */
  3599. "sbcs %[c], %[c], %[c]\n\t"
  3600. "str r5, [%[r], r8]\n\t"
  3601. "add r8, r8, #4\n\t"
  3602. "cmp r8, r9\n\t"
  3603. #ifdef __GNUC__
  3604. "blt 1b\n\t"
  3605. #else
  3606. "blt.n 1b\n\t"
  3607. #endif /* __GNUC__ */
  3608. : [c] "+r" (c)
  3609. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  3610. : "memory", "r5", "r6", "r8", "r9", "cc"
  3611. );
  3612. return c;
  3613. }
  3614. /* Reduce the number back to 2048 bits using Montgomery reduction.
  3615. *
  3616. * a A single precision number to reduce in place.
        *   128 words on entry; the result is left in the first 64 words.
  3617. * m The single precision number representing the modulus.
  3618. * mp The digit representing the negative inverse of m mod 2^n.
        *
        * The assembly uses the registers holding m and mp as scratch (m is put
        * back from r12 at the end, mp is not) and changes the condition flags.
        * Both are therefore declared as read/write operands and "cc" is listed as
        * a clobber.
  3619. */
  3620. SP_NOINLINE static void sp_2048_mont_reduce_64(sp_digit* a, const sp_digit* m,
  3621. sp_digit mp)
  3622. {
  3623. sp_digit ca = 0;
  3624. __asm__ __volatile__ (
        /* Keep mp, m and a in r9, r12 and r10; r11 = end of the low 64 words. */
  3625. "mov r9, %[mp]\n\t"
  3626. "mov r12, %[m]\n\t"
  3627. "mov r10, %[a]\n\t"
  3628. "mov r4, #0\n\t"
  3629. "add r11, r10, #256\n\t"
  3630. "\n1:\n\t"
  3631. /* mu = a[i] * mp */
  3632. "mov %[mp], r9\n\t"
  3633. "ldr %[a], [r10]\n\t"
  3634. "mul %[mp], %[mp], %[a]\n\t"
  3635. "mov %[m], r12\n\t"
        /* r14 = bound for the inner loop: 62 words, handled two per pass. */
  3636. "add r14, r10, #248\n\t"
  3637. "\n2:\n\t"
  3638. /* a[i+j] += m[j] * mu */
  3639. "ldr %[a], [r10]\n\t"
  3640. "mov r5, #0\n\t"
  3641. /* Multiply m[j] and mu - Start */
  3642. "ldr r8, [%[m]], #4\n\t"
  3643. "umull r6, r8, %[mp], r8\n\t"
  3644. "adds %[a], %[a], r6\n\t"
  3645. "adc r5, r5, r8\n\t"
  3646. /* Multiply m[j] and mu - Done */
  3647. "adds r4, r4, %[a]\n\t"
  3648. "adc r5, r5, #0\n\t"
  3649. "str r4, [r10], #4\n\t"
  3650. /* a[i+j+1] += m[j+1] * mu */
  3651. "ldr %[a], [r10]\n\t"
  3652. "mov r4, #0\n\t"
  3653. /* Multiply m[j] and mu - Start */
  3654. "ldr r8, [%[m]], #4\n\t"
  3655. "umull r6, r8, %[mp], r8\n\t"
  3656. "adds %[a], %[a], r6\n\t"
  3657. "adc r4, r4, r8\n\t"
  3658. /* Multiply m[j] and mu - Done */
  3659. "adds r5, r5, %[a]\n\t"
  3660. "adc r4, r4, #0\n\t"
  3661. "str r5, [r10], #4\n\t"
  3662. "cmp r10, r14\n\t"
  3663. #ifdef __GNUC__
  3664. "blt 2b\n\t"
  3665. #else
  3666. "blt.n 2b\n\t"
  3667. #endif /* __GNUC__ */
  3668. /* a[i+62] += m[62] * mu */
  3669. "ldr %[a], [r10]\n\t"
  3670. "mov r5, #0\n\t"
  3671. /* Multiply m[j] and mu - Start */
  3672. "ldr r8, [%[m]], #4\n\t"
  3673. "umull r6, r8, %[mp], r8\n\t"
  3674. "adds %[a], %[a], r6\n\t"
  3675. "adc r5, r5, r8\n\t"
  3676. /* Multiply m[j] and mu - Done */
  3677. "adds r4, r4, %[a]\n\t"
  3678. "adc r5, r5, #0\n\t"
  3679. "str r4, [r10], #4\n\t"
  3680. /* a[i+63] += m[63] * mu */
        /* The carry kept in ca from the previous pass is folded in here and ca
         * is rebuilt from the carries of this pass. */
  3681. "mov r4, %[ca]\n\t"
  3682. "mov %[ca], #0\n\t"
  3683. /* Multiply m[63] and mu - Start */
  3684. "ldr r8, [%[m]]\n\t"
  3685. "umull r6, r8, %[mp], r8\n\t"
  3686. "adds r5, r5, r6\n\t"
  3687. "adcs r4, r4, r8\n\t"
  3688. "adc %[ca], %[ca], #0\n\t"
  3689. /* Multiply m[63] and mu - Done */
  3690. "ldr r6, [r10]\n\t"
  3691. "ldr r8, [r10, #4]\n\t"
  3692. "adds r6, r6, r5\n\t"
  3693. "adcs r8, r8, r4\n\t"
  3694. "adc %[ca], %[ca], #0\n\t"
  3695. "str r6, [r10]\n\t"
  3696. "str r8, [r10, #4]\n\t"
  3697. /* Next word in a */
  3698. "sub r10, r10, #248\n\t"
  3699. "cmp r10, r11\n\t"
  3700. #ifdef __GNUC__
  3701. "blt 1b\n\t"
  3702. #else
  3703. "blt.n 1b\n\t"
  3704. #endif /* __GNUC__ */
        /* On exit a points at the upper 64 words and m is restored. */
  3705. "mov %[a], r10\n\t"
  3706. "mov %[m], r12\n\t"
  3707. : [ca] "+r" (ca), [a] "+r" (a), [m] "+r" (m), [mp] "+r" (mp)
  3708. :
  3709. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14", "cc"
  3710. );
        /* a now points 64 words in: subtract m when ca is set, writing the result
         * back to the start of the original buffer. */
  3711. sp_2048_cond_sub_64(a - 64, a, m, (sp_digit)0 - ca);
  3712. }
  3713. /* Multiply two Montgomery form numbers mod the modulus (prime).
  3714. * (r = a * b mod m)
  3715. *
  3716. * r Result of multiplication.
  3717. * a First number to multiply in Montgomery form.
  3718. * b Second number to multiply in Montgomery form.
  3719. * m Modulus (prime).
  3720. * mp Montgomery multiplier.
        *
        * Implemented as a multiply of a by b into r followed by an in-place
        * Montgomery reduction of r.
  3721. */
  3722. SP_NOINLINE static void sp_2048_mont_mul_64(sp_digit* r, const sp_digit* a,
  3723. const sp_digit* b, const sp_digit* m, sp_digit mp)
  3724. {
        /* Step 1: multiply a by b; the result is written to r. */
  3725. sp_2048_mul_64(r, a, b);
        /* Step 2: Montgomery reduce r in place using modulus m and mp. */
  3726. sp_2048_mont_reduce_64(r, m, mp);
  3727. }
  3728. /* Square the Montgomery form number. (r = a * a mod m)
  3729. *
  3730. * r Result of squaring.
  3731. * a Number to square in Montgomery form.
  3732. * m Modulus (prime).
  3733. * mp Montgomery multiplier.
        *
        * Implemented as a square of a into r followed by an in-place Montgomery
        * reduction of r.
  3734. */
  3735. SP_NOINLINE static void sp_2048_mont_sqr_64(sp_digit* r, const sp_digit* a,
  3736. const sp_digit* m, sp_digit mp)
  3737. {
        /* Step 1: square a; the result is written to r. */
  3738. sp_2048_sqr_64(r, a);
        /* Step 2: Montgomery reduce r in place using modulus m and mp. */
  3739. sp_2048_mont_reduce_64(r, m, mp);
  3740. }
  3741. #ifdef WOLFSSL_SP_SMALL
  3742. /* Sub b from a into r. (r = a - b)
  3743. *
  3744. * r A single precision integer.
  3745. * a A single precision integer.
  3746. * b A single precision integer.
        * returns 0 when there was no borrow out of the top word, all ones otherwise.
        *
        * Loop form: one word per iteration over 64 words (256 bytes). The borrow is
        * kept in c between iterations because the loop compare overwrites the
        * flags. The condition flags are changed, so "cc" is listed as a clobber.
  3747. */
  3748. SP_NOINLINE static sp_digit sp_2048_sub_64(sp_digit* r, const sp_digit* a,
  3749. const sp_digit* b)
  3750. {
  3751. sp_digit c = 0;
  3752. __asm__ __volatile__ (
        /* r6 = a + 256: address just past the last word of a. */
  3753. "mov r6, %[a]\n\t"
  3754. "mov r5, #1\n\t"
  3755. "lsl r5, r5, #8\n\t"
  3756. "add r6, r6, r5\n\t"
  3757. "\n1:\n\t"
        /* 0 - c puts the saved borrow back into the carry flag. */
  3758. "mov r5, #0\n\t"
  3759. "subs r5, r5, %[c]\n\t"
  3760. "ldr r4, [%[a]]\n\t"
  3761. "ldr r5, [%[b]]\n\t"
  3762. "sbcs r4, r4, r5\n\t"
  3763. "str r4, [%[r]]\n\t"
        /* c = 0 when no borrow, all ones when there was a borrow. */
  3764. "sbc %[c], %[c], %[c]\n\t"
  3765. "add %[a], %[a], #4\n\t"
  3766. "add %[b], %[b], #4\n\t"
  3767. "add %[r], %[r], #4\n\t"
  3768. "cmp %[a], r6\n\t"
  3769. #ifdef __GNUC__
  3770. "bne 1b\n\t"
  3771. #else
  3772. "bne.n 1b\n\t"
  3773. #endif /* __GNUC__ */
  3774. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  3775. :
  3776. : "memory", "r4", "r5", "r6", "cc"
  3777. );
  3778. return c;
  3779. }
  3780. #else
  3781. /* Sub b from a into r. (r = a - b)
  3782. *
  3783. * r A single precision integer.
  3784. * a A single precision integer.
  3785. * b A single precision integer.
        * returns 0 when there was no borrow out of the top word, all ones otherwise.
        *
        * Fully unrolled form: 32 groups of two words each (64 words). The borrow
        * stays in the carry flag from the first subs to the final sbc. The
        * condition flags are changed, so "cc" is listed as a clobber.
  3786. */
  3787. SP_NOINLINE static sp_digit sp_2048_sub_64(sp_digit* r, const sp_digit* a,
  3788. const sp_digit* b)
  3789. {
  3790. sp_digit c = 0;
  3791. __asm__ __volatile__ (
        /* First pair starts the chain with subs; every later pair uses sbcs. */
  3792. "ldm %[a]!, {r4, r5}\n\t"
  3793. "ldm %[b]!, {r6, r8}\n\t"
  3794. "subs r4, r4, r6\n\t"
  3795. "sbcs r5, r5, r8\n\t"
  3796. "stm %[r]!, {r4, r5}\n\t"
  3797. "ldm %[a]!, {r4, r5}\n\t"
  3798. "ldm %[b]!, {r6, r8}\n\t"
  3799. "sbcs r4, r4, r6\n\t"
  3800. "sbcs r5, r5, r8\n\t"
  3801. "stm %[r]!, {r4, r5}\n\t"
  3802. "ldm %[a]!, {r4, r5}\n\t"
  3803. "ldm %[b]!, {r6, r8}\n\t"
  3804. "sbcs r4, r4, r6\n\t"
  3805. "sbcs r5, r5, r8\n\t"
  3806. "stm %[r]!, {r4, r5}\n\t"
  3807. "ldm %[a]!, {r4, r5}\n\t"
  3808. "ldm %[b]!, {r6, r8}\n\t"
  3809. "sbcs r4, r4, r6\n\t"
  3810. "sbcs r5, r5, r8\n\t"
  3811. "stm %[r]!, {r4, r5}\n\t"
  3812. "ldm %[a]!, {r4, r5}\n\t"
  3813. "ldm %[b]!, {r6, r8}\n\t"
  3814. "sbcs r4, r4, r6\n\t"
  3815. "sbcs r5, r5, r8\n\t"
  3816. "stm %[r]!, {r4, r5}\n\t"
  3817. "ldm %[a]!, {r4, r5}\n\t"
  3818. "ldm %[b]!, {r6, r8}\n\t"
  3819. "sbcs r4, r4, r6\n\t"
  3820. "sbcs r5, r5, r8\n\t"
  3821. "stm %[r]!, {r4, r5}\n\t"
  3822. "ldm %[a]!, {r4, r5}\n\t"
  3823. "ldm %[b]!, {r6, r8}\n\t"
  3824. "sbcs r4, r4, r6\n\t"
  3825. "sbcs r5, r5, r8\n\t"
  3826. "stm %[r]!, {r4, r5}\n\t"
  3827. "ldm %[a]!, {r4, r5}\n\t"
  3828. "ldm %[b]!, {r6, r8}\n\t"
  3829. "sbcs r4, r4, r6\n\t"
  3830. "sbcs r5, r5, r8\n\t"
  3831. "stm %[r]!, {r4, r5}\n\t"
  3832. "ldm %[a]!, {r4, r5}\n\t"
  3833. "ldm %[b]!, {r6, r8}\n\t"
  3834. "sbcs r4, r4, r6\n\t"
  3835. "sbcs r5, r5, r8\n\t"
  3836. "stm %[r]!, {r4, r5}\n\t"
  3837. "ldm %[a]!, {r4, r5}\n\t"
  3838. "ldm %[b]!, {r6, r8}\n\t"
  3839. "sbcs r4, r4, r6\n\t"
  3840. "sbcs r5, r5, r8\n\t"
  3841. "stm %[r]!, {r4, r5}\n\t"
  3842. "ldm %[a]!, {r4, r5}\n\t"
  3843. "ldm %[b]!, {r6, r8}\n\t"
  3844. "sbcs r4, r4, r6\n\t"
  3845. "sbcs r5, r5, r8\n\t"
  3846. "stm %[r]!, {r4, r5}\n\t"
  3847. "ldm %[a]!, {r4, r5}\n\t"
  3848. "ldm %[b]!, {r6, r8}\n\t"
  3849. "sbcs r4, r4, r6\n\t"
  3850. "sbcs r5, r5, r8\n\t"
  3851. "stm %[r]!, {r4, r5}\n\t"
  3852. "ldm %[a]!, {r4, r5}\n\t"
  3853. "ldm %[b]!, {r6, r8}\n\t"
  3854. "sbcs r4, r4, r6\n\t"
  3855. "sbcs r5, r5, r8\n\t"
  3856. "stm %[r]!, {r4, r5}\n\t"
  3857. "ldm %[a]!, {r4, r5}\n\t"
  3858. "ldm %[b]!, {r6, r8}\n\t"
  3859. "sbcs r4, r4, r6\n\t"
  3860. "sbcs r5, r5, r8\n\t"
  3861. "stm %[r]!, {r4, r5}\n\t"
  3862. "ldm %[a]!, {r4, r5}\n\t"
  3863. "ldm %[b]!, {r6, r8}\n\t"
  3864. "sbcs r4, r4, r6\n\t"
  3865. "sbcs r5, r5, r8\n\t"
  3866. "stm %[r]!, {r4, r5}\n\t"
  3867. "ldm %[a]!, {r4, r5}\n\t"
  3868. "ldm %[b]!, {r6, r8}\n\t"
  3869. "sbcs r4, r4, r6\n\t"
  3870. "sbcs r5, r5, r8\n\t"
  3871. "stm %[r]!, {r4, r5}\n\t"
  3872. "ldm %[a]!, {r4, r5}\n\t"
  3873. "ldm %[b]!, {r6, r8}\n\t"
  3874. "sbcs r4, r4, r6\n\t"
  3875. "sbcs r5, r5, r8\n\t"
  3876. "stm %[r]!, {r4, r5}\n\t"
  3877. "ldm %[a]!, {r4, r5}\n\t"
  3878. "ldm %[b]!, {r6, r8}\n\t"
  3879. "sbcs r4, r4, r6\n\t"
  3880. "sbcs r5, r5, r8\n\t"
  3881. "stm %[r]!, {r4, r5}\n\t"
  3882. "ldm %[a]!, {r4, r5}\n\t"
  3883. "ldm %[b]!, {r6, r8}\n\t"
  3884. "sbcs r4, r4, r6\n\t"
  3885. "sbcs r5, r5, r8\n\t"
  3886. "stm %[r]!, {r4, r5}\n\t"
  3887. "ldm %[a]!, {r4, r5}\n\t"
  3888. "ldm %[b]!, {r6, r8}\n\t"
  3889. "sbcs r4, r4, r6\n\t"
  3890. "sbcs r5, r5, r8\n\t"
  3891. "stm %[r]!, {r4, r5}\n\t"
  3892. "ldm %[a]!, {r4, r5}\n\t"
  3893. "ldm %[b]!, {r6, r8}\n\t"
  3894. "sbcs r4, r4, r6\n\t"
  3895. "sbcs r5, r5, r8\n\t"
  3896. "stm %[r]!, {r4, r5}\n\t"
  3897. "ldm %[a]!, {r4, r5}\n\t"
  3898. "ldm %[b]!, {r6, r8}\n\t"
  3899. "sbcs r4, r4, r6\n\t"
  3900. "sbcs r5, r5, r8\n\t"
  3901. "stm %[r]!, {r4, r5}\n\t"
  3902. "ldm %[a]!, {r4, r5}\n\t"
  3903. "ldm %[b]!, {r6, r8}\n\t"
  3904. "sbcs r4, r4, r6\n\t"
  3905. "sbcs r5, r5, r8\n\t"
  3906. "stm %[r]!, {r4, r5}\n\t"
  3907. "ldm %[a]!, {r4, r5}\n\t"
  3908. "ldm %[b]!, {r6, r8}\n\t"
  3909. "sbcs r4, r4, r6\n\t"
  3910. "sbcs r5, r5, r8\n\t"
  3911. "stm %[r]!, {r4, r5}\n\t"
  3912. "ldm %[a]!, {r4, r5}\n\t"
  3913. "ldm %[b]!, {r6, r8}\n\t"
  3914. "sbcs r4, r4, r6\n\t"
  3915. "sbcs r5, r5, r8\n\t"
  3916. "stm %[r]!, {r4, r5}\n\t"
  3917. "ldm %[a]!, {r4, r5}\n\t"
  3918. "ldm %[b]!, {r6, r8}\n\t"
  3919. "sbcs r4, r4, r6\n\t"
  3920. "sbcs r5, r5, r8\n\t"
  3921. "stm %[r]!, {r4, r5}\n\t"
  3922. "ldm %[a]!, {r4, r5}\n\t"
  3923. "ldm %[b]!, {r6, r8}\n\t"
  3924. "sbcs r4, r4, r6\n\t"
  3925. "sbcs r5, r5, r8\n\t"
  3926. "stm %[r]!, {r4, r5}\n\t"
  3927. "ldm %[a]!, {r4, r5}\n\t"
  3928. "ldm %[b]!, {r6, r8}\n\t"
  3929. "sbcs r4, r4, r6\n\t"
  3930. "sbcs r5, r5, r8\n\t"
  3931. "stm %[r]!, {r4, r5}\n\t"
  3932. "ldm %[a]!, {r4, r5}\n\t"
  3933. "ldm %[b]!, {r6, r8}\n\t"
  3934. "sbcs r4, r4, r6\n\t"
  3935. "sbcs r5, r5, r8\n\t"
  3936. "stm %[r]!, {r4, r5}\n\t"
  3937. "ldm %[a]!, {r4, r5}\n\t"
  3938. "ldm %[b]!, {r6, r8}\n\t"
  3939. "sbcs r4, r4, r6\n\t"
  3940. "sbcs r5, r5, r8\n\t"
  3941. "stm %[r]!, {r4, r5}\n\t"
  3942. "ldm %[a]!, {r4, r5}\n\t"
  3943. "ldm %[b]!, {r6, r8}\n\t"
  3944. "sbcs r4, r4, r6\n\t"
  3945. "sbcs r5, r5, r8\n\t"
  3946. "stm %[r]!, {r4, r5}\n\t"
  3947. "ldm %[a]!, {r4, r5}\n\t"
  3948. "ldm %[b]!, {r6, r8}\n\t"
  3949. "sbcs r4, r4, r6\n\t"
  3950. "sbcs r5, r5, r8\n\t"
  3951. "stm %[r]!, {r4, r5}\n\t"
        /* c = 0 when no borrow, all ones when there was a borrow. */
  3952. "sbc %[c], %[c], %[c]\n\t"
  3953. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  3954. :
  3955. : "memory", "r4", "r5", "r6", "r8", "cc"
  3956. );
  3957. return c;
  3958. }
  3959. #endif /* WOLFSSL_SP_SMALL */
  3960. /* Divide the double width number (d1|d0) by the divisor. (d1|d0 / div)
  3961. *
  3962. * d1 The high order half of the number to divide.
  3963. * d0 The low order half of the number to divide.
  3964. * div The divisor.
  3965. * returns the result of the division.
  3966. *
  3967. * Note that this is an approximate div. It may give an answer 1 larger.
        *
        * The quotient is built up in r8 from a series of estimates made with the
        * trial divisor (div >> 16) + 1; after each estimate the matching multiple
        * of div is subtracted from d1|d0.
        *
        * The assembly overwrites d1 and d0 and changes the condition flags, so both
        * values are declared as read/write operands and "cc" is listed as a
        * clobber.
  3968. */
  3969. SP_NOINLINE static sp_digit div_2048_word_64(sp_digit d1, sp_digit d0,
  3970. sp_digit div)
  3971. {
  3972. sp_digit r = 0;
  3973. __asm__ __volatile__ (
        /* r6 = trial divisor: top 16 bits of div, plus one. */
  3974. "lsr r6, %[div], #16\n\t"
  3975. "add r6, r6, #1\n\t"
        /* First estimate from d1, placed in the upper 16 bits of r8. */
  3976. "udiv r4, %[d1], r6\n\t"
  3977. "lsl r8, r4, #16\n\t"
        /* d1|d0 -= div * estimate */
  3978. "umull r4, r5, %[div], r8\n\t"
  3979. "subs %[d0], %[d0], r4\n\t"
  3980. "sbc %[d1], %[d1], r5\n\t"
        /* Second estimate from the reduced d1, again shifted up 16 bits. */
  3981. "udiv r5, %[d1], r6\n\t"
  3982. "lsl r4, r5, #16\n\t"
  3983. "add r8, r8, r4\n\t"
  3984. "umull r4, r5, %[div], r4\n\t"
  3985. "subs %[d0], %[d0], r4\n\t"
  3986. "sbc %[d1], %[d1], r5\n\t"
        /* Third estimate from the middle 32 bits of d1|d0. */
  3987. "lsl r4, %[d1], #16\n\t"
  3988. "orr r4, r4, %[d0], lsr #16\n\t"
  3989. "udiv r4, r4, r6\n\t"
  3990. "add r8, r8, r4\n\t"
  3991. "umull r4, r5, %[div], r4\n\t"
  3992. "subs %[d0], %[d0], r4\n\t"
  3993. "sbc %[d1], %[d1], r5\n\t"
        /* Fourth estimate, same form as the third. */
  3994. "lsl r4, %[d1], #16\n\t"
  3995. "orr r4, r4, %[d0], lsr #16\n\t"
  3996. "udiv r4, r4, r6\n\t"
  3997. "add r8, r8, r4\n\t"
  3998. "umull r4, r5, %[div], r4\n\t"
  3999. "subs %[d0], %[d0], r4\n\t"
  4000. "sbc %[d1], %[d1], r5\n\t"
        /* Last step divides what is left in d0 by the full divisor. */
  4001. "udiv r4, %[d0], %[div]\n\t"
  4002. "add r8, r8, r4\n\t"
  4003. "mov %[r], r8\n\t"
  4004. : [r] "+r" (r), [d1] "+r" (d1), [d0] "+r" (d0)
  4005. : [div] "r" (div)
  4006. : "r4", "r5", "r6", "r8", "cc"
  4007. );
  4008. return r;
  4009. }
  4010. /* Divide d in a and put remainder into r (m*d + r = a)
  4011. * m is not calculated as it is not needed at this time.
  4012. *
  4013. * a Number to be divided.
        *   128 words are read.
  4014. * d Number to divide with.
        *   64 words; d[63] is used as the divisor word for quotient estimates.
  4015. * m Multiplier result.
        *   Unused.
  4016. * r Remainder from the division.
        *   64 words are written.
  4017. * returns MP_OKAY indicating success.
        *
        * This variant branches on the values being processed (early loop exits and
        * if statements on words of t1 and d).
  4018. */
  4019. static WC_INLINE int sp_2048_div_64_cond(const sp_digit* a, const sp_digit* d, sp_digit* m,
  4020. sp_digit* r)
  4021. {
  4022. sp_digit t1[128], t2[65];
  4023. sp_digit div, r1;
  4024. int i;
  4025. (void)m;
  4026. div = d[63];
        /* Work on a copy of a so the input is left untouched. */
  4027. XMEMCPY(t1, a, sizeof(*t1) * 2 * 64);
        /* Find the highest word where the top half of t1 differs from d and
         * subtract d from the top half when the top half is not below d. */
  4028. for (i = 63; i > 0; i--) {
  4029. if (t1[i + 64] != d[i])
  4030. break;
  4031. }
  4032. if (t1[i + 64] >= d[i]) {
  4033. sp_2048_sub_in_place_64(&t1[64], d);
  4034. }
  4035. for (i = 63; i >= 0; i--) {
        /* Quotient word estimate: all ones when the top word equals div,
         * otherwise from the word division helper. */
  4036. if (t1[64 + i] == div) {
  4037. r1 = SP_DIGIT_MAX;
  4038. }
  4039. else {
  4040. r1 = div_2048_word_64(t1[64 + i], t1[64 + i - 1], div);
  4041. }
        /* t2 = d * r1, subtracted from the current window of t1. */
  4042. sp_2048_mul_d_64(t2, d, r1);
  4043. t1[64 + i] += sp_2048_sub_in_place_64(&t1[i], t2);
  4044. t1[64 + i] -= t2[64];
        /* Add d back, at most twice, while the top word is not zero. */
  4045. if (t1[64 + i] != 0) {
  4046. t1[64 + i] += sp_2048_add_64(&t1[i], &t1[i], d);
  4047. if (t1[64 + i] != 0)
  4048. t1[64 + i] += sp_2048_add_64(&t1[i], &t1[i], d);
  4049. }
  4050. }
        /* Final step: write t1 - d to r when t1 is not below d, else copy t1. */
  4051. for (i = 63; i > 0; i--) {
  4052. if (t1[i] != d[i])
  4053. break;
  4054. }
  4055. if (t1[i] >= d[i]) {
  4056. sp_2048_sub_64(r, t1, d);
  4057. }
  4058. else {
  4059. XMEMCPY(r, t1, sizeof(*t1) * 64);
  4060. }
  4061. return MP_OKAY;
  4062. }
  4063. /* Reduce a modulo m into r. (r = a mod m)
  4064. *
  4065. * r A single precision number that is the reduced result.
  4066. * a A single precision number that is to be reduced.
        *   Passed straight to sp_2048_div_64_cond, which reads 128 words from it.
  4067. * m A single precision number that is the modulus to reduce with.
  4068. * returns MP_OKAY indicating success.
  4069. */
  4070. static WC_INLINE int sp_2048_mod_64_cond(sp_digit* r, const sp_digit* a, const sp_digit* m)
  4071. {
        /* Only the remainder is wanted, so no quotient buffer is supplied. */
  4072. return sp_2048_div_64_cond(a, m, NULL, r);
  4073. }
  4074. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || defined(WOLFSSL_HAVE_SP_DH)
  4075. /* AND m into each word of a and store in r.
  4076. *
  4077. * r A single precision integer.
        *   64 words are written.
  4078. * a A single precision integer.
        *   64 words are read.
  4079. * m Mask to AND against each digit.
  4080. */
  4081. static void sp_2048_mask_64(sp_digit* r, const sp_digit* a, sp_digit m)
  4082. {
  4083. #ifdef WOLFSSL_SP_SMALL
        /* Small build: one word per iteration. */
  4084. int i;
  4085. for (i=0; i<64; i++) {
  4086. r[i] = a[i] & m;
  4087. }
  4088. #else
        /* Default build: same result, eight words per iteration. */
  4089. int i;
  4090. for (i = 0; i < 64; i += 8) {
  4091. r[i+0] = a[i+0] & m;
  4092. r[i+1] = a[i+1] & m;
  4093. r[i+2] = a[i+2] & m;
  4094. r[i+3] = a[i+3] & m;
  4095. r[i+4] = a[i+4] & m;
  4096. r[i+5] = a[i+5] & m;
  4097. r[i+6] = a[i+6] & m;
  4098. r[i+7] = a[i+7] & m;
  4099. }
  4100. #endif
  4101. }
  4102. /* Compare a with b in constant time.
  4103. *
  4104. * a A single precision integer.
  4105. * b A single precision integer.
  4106. * return -ve, 0 or +ve if a is less than, equal to or greater than b
  4107. * respectively.
  4108. */
  4109. SP_NOINLINE static sp_int32 sp_2048_cmp_64(const sp_digit* a, const sp_digit* b)
  4110. {
  4111. sp_digit r = 0;
  4112. __asm__ __volatile__ (
  4113. "mov r3, #0\n\t"
  4114. "mvn r3, r3\n\t"
  4115. "mov r6, #252\n\t"
  4116. "\n1:\n\t"
  4117. "ldr r8, [%[a], r6]\n\t"
  4118. "ldr r5, [%[b], r6]\n\t"
  4119. "and r8, r8, r3\n\t"
  4120. "and r5, r5, r3\n\t"
  4121. "mov r4, r8\n\t"
  4122. "subs r8, r8, r5\n\t"
  4123. "sbc r8, r8, r8\n\t"
  4124. "add %[r], %[r], r8\n\t"
  4125. "mvn r8, r8\n\t"
  4126. "and r3, r3, r8\n\t"
  4127. "subs r5, r5, r4\n\t"
  4128. "sbc r8, r8, r8\n\t"
  4129. "sub %[r], %[r], r8\n\t"
  4130. "mvn r8, r8\n\t"
  4131. "and r3, r3, r8\n\t"
  4132. "sub r6, r6, #4\n\t"
  4133. "cmp r6, #0\n\t"
  4134. #ifdef __GNUC__
  4135. "bge 1b\n\t"
  4136. #else
  4137. "bge.n 1b\n\t"
  4138. #endif /* __GNUC__ */
  4139. : [r] "+r" (r)
  4140. : [a] "r" (a), [b] "r" (b)
  4141. : "r3", "r4", "r5", "r6", "r8"
  4142. );
  4143. return r;
  4144. }
  4145. /* Divide d in a and put remainder into r (m*d + r = a)
  4146. * m is not calculated as it is not needed at this time.
  4147. *
  4148. * a Number to be divided.
  4149. * d Number to divide with.
  4150. * m Multiplier result.
  4151. * r Remainder from the division.
  4152. * returns MP_OKAY indicating success.
  4153. */
  4154. static WC_INLINE int sp_2048_div_64(const sp_digit* a, const sp_digit* d, sp_digit* m,
  4155. sp_digit* r)
  4156. {
  4157. sp_digit t1[128], t2[65];
  4158. sp_digit div, r1;
  4159. int i;
  4160. (void)m;
  4161. div = d[63];
  4162. XMEMCPY(t1, a, sizeof(*t1) * 2 * 64);
  4163. r1 = sp_2048_cmp_64(&t1[64], d) >= 0;
  4164. sp_2048_cond_sub_64(&t1[64], &t1[64], d, (sp_digit)0 - r1);
  4165. for (i = 63; i >= 0; i--) {
  4166. sp_digit mask = 0 - (t1[64 + i] == div);
  4167. sp_digit hi = t1[64 + i] + mask;
  4168. r1 = div_2048_word_64(hi, t1[64 + i - 1], div);
  4169. r1 |= mask;
  4170. sp_2048_mul_d_64(t2, d, r1);
  4171. t1[64 + i] += sp_2048_sub_in_place_64(&t1[i], t2);
  4172. t1[64 + i] -= t2[64];
  4173. sp_2048_mask_64(t2, d, t1[64 + i]);
  4174. t1[64 + i] += sp_2048_add_64(&t1[i], &t1[i], t2);
  4175. sp_2048_mask_64(t2, d, t1[64 + i]);
  4176. t1[64 + i] += sp_2048_add_64(&t1[i], &t1[i], t2);
  4177. }
  4178. r1 = sp_2048_cmp_64(t1, d) >= 0;
  4179. sp_2048_cond_sub_64(r, t1, d, (sp_digit)0 - r1);
  4180. return MP_OKAY;
  4181. }
  4182. /* Reduce a modulo m into r. (r = a mod m)
  4183. *
  4184. * r A single precision number that is the reduced result.
  4185. * a A single precision number that is to be reduced.
  4186. * m A single precision number that is the modulus to reduce with.
  4187. * returns MP_OKAY indicating success.
  4188. */
  4189. static WC_INLINE int sp_2048_mod_64(sp_digit* r, const sp_digit* a, const sp_digit* m)
  4190. {
  4191. return sp_2048_div_64(a, m, NULL, r);
  4192. }
  4193. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || \
  4194. defined(WOLFSSL_HAVE_SP_DH)
  4195. #ifdef WOLFSSL_SP_SMALL
  4196. /* Modular exponentiate a to the e mod m. (r = a^e mod m)
  4197. *
  4198. * r A single precision number that is the result of the operation.
  4199. * a A single precision number being exponentiated.
  4200. * e A single precision number that is the exponent.
  4201. * bits The number of bits in the exponent.
  4202. * m A single precision number that is the modulus.
  4203. * returns 0 on success.
  4204. * returns MEMORY_E on dynamic memory allocation failure.
  4205. * returns MP_VAL when base is even or exponent is 0.
  4206. */
  4207. static int sp_2048_mod_exp_64(sp_digit* r, const sp_digit* a, const sp_digit* e,
  4208. int bits, const sp_digit* m, int reduceA)
  4209. {
  4210. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4211. sp_digit* td = NULL;
  4212. #else
  4213. sp_digit td[8 * 128];
  4214. #endif
  4215. sp_digit* t[8];
  4216. sp_digit* norm = NULL;
  4217. sp_digit mp = 1;
  4218. sp_digit n;
  4219. sp_digit mask;
  4220. int i;
  4221. int c;
  4222. byte y;
  4223. int err = MP_OKAY;
  4224. if (bits == 0) {
  4225. err = MP_VAL;
  4226. }
  4227. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4228. if (err == MP_OKAY) {
  4229. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * (8 * 128), NULL,
  4230. DYNAMIC_TYPE_TMP_BUFFER);
  4231. if (td == NULL)
  4232. err = MEMORY_E;
  4233. }
  4234. #endif
  4235. if (err == MP_OKAY) {
  4236. norm = td;
  4237. for (i=0; i<8; i++) {
  4238. t[i] = td + i * 128;
  4239. }
  4240. sp_2048_mont_setup(m, &mp);
  4241. sp_2048_mont_norm_64(norm, m);
  4242. XMEMSET(t[1], 0, sizeof(sp_digit) * 64U);
  4243. if (reduceA != 0) {
  4244. err = sp_2048_mod_64(t[1] + 64, a, m);
  4245. if (err == MP_OKAY) {
  4246. err = sp_2048_mod_64(t[1], t[1], m);
  4247. }
  4248. }
  4249. else {
  4250. XMEMCPY(t[1] + 64, a, sizeof(sp_digit) * 64);
  4251. err = sp_2048_mod_64(t[1], t[1], m);
  4252. }
  4253. }
  4254. if (err == MP_OKAY) {
  4255. sp_2048_mont_sqr_64(t[ 2], t[ 1], m, mp);
  4256. sp_2048_mont_mul_64(t[ 3], t[ 2], t[ 1], m, mp);
  4257. sp_2048_mont_sqr_64(t[ 4], t[ 2], m, mp);
  4258. sp_2048_mont_mul_64(t[ 5], t[ 3], t[ 2], m, mp);
  4259. sp_2048_mont_sqr_64(t[ 6], t[ 3], m, mp);
  4260. sp_2048_mont_mul_64(t[ 7], t[ 4], t[ 3], m, mp);
  4261. i = (bits - 1) / 32;
  4262. n = e[i--];
  4263. c = bits & 31;
  4264. if (c == 0) {
  4265. c = 32;
  4266. }
  4267. c -= bits % 3;
  4268. if (c == 32) {
  4269. c = 29;
  4270. }
  4271. if (c < 0) {
  4272. /* Number of bits in top word is less than number needed. */
  4273. c = -c;
  4274. y = (byte)(n << c);
  4275. n = e[i--];
  4276. y |= (byte)(n >> (64 - c));
  4277. n <<= c;
  4278. c = 64 - c;
  4279. }
  4280. else if (c == 0) {
  4281. /* All bits in top word used. */
  4282. y = (byte)n;
  4283. }
  4284. else {
  4285. y = (byte)(n >> c);
  4286. n <<= 32 - c;
  4287. }
  4288. XMEMCPY(r, t[y], sizeof(sp_digit) * 64);
  4289. for (; i>=0 || c>=3; ) {
  4290. if (c == 0) {
  4291. n = e[i--];
  4292. y = (byte)(n >> 29);
  4293. n <<= 3;
  4294. c = 29;
  4295. }
  4296. else if (c < 3) {
  4297. y = (byte)(n >> 29);
  4298. n = e[i--];
  4299. c = 3 - c;
  4300. y |= (byte)(n >> (32 - c));
  4301. n <<= c;
  4302. c = 32 - c;
  4303. }
  4304. else {
  4305. y = (byte)((n >> 29) & 0x7);
  4306. n <<= 3;
  4307. c -= 3;
  4308. }
  4309. sp_2048_mont_sqr_64(r, r, m, mp);
  4310. sp_2048_mont_sqr_64(r, r, m, mp);
  4311. sp_2048_mont_sqr_64(r, r, m, mp);
  4312. sp_2048_mont_mul_64(r, r, t[y], m, mp);
  4313. }
  4314. XMEMSET(&r[64], 0, sizeof(sp_digit) * 64U);
  4315. sp_2048_mont_reduce_64(r, m, mp);
  4316. mask = 0 - (sp_2048_cmp_64(r, m) >= 0);
  4317. sp_2048_cond_sub_64(r, r, m, mask);
  4318. }
  4319. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4320. if (td != NULL)
  4321. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  4322. #endif
  4323. return err;
  4324. }
  4325. #else
  4326. /* Modular exponentiate a to the e mod m. (r = a^e mod m)
  4327. *
  4328. * r A single precision number that is the result of the operation.
  4329. * a A single precision number being exponentiated.
  4330. * e A single precision number that is the exponent.
  4331. * bits The number of bits in the exponent.
  4332. * m A single precision number that is the modulus.
  4333. * returns 0 on success.
  4334. * returns MEMORY_E on dynamic memory allocation failure.
  4335. * returns MP_VAL when base is even or exponent is 0.
  4336. */
  4337. static int sp_2048_mod_exp_64(sp_digit* r, const sp_digit* a, const sp_digit* e,
  4338. int bits, const sp_digit* m, int reduceA)
  4339. {
  4340. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4341. sp_digit* td = NULL;
  4342. #else
  4343. sp_digit td[16 * 128];
  4344. #endif
  4345. sp_digit* t[16];
  4346. sp_digit* norm = NULL;
  4347. sp_digit mp = 1;
  4348. sp_digit n;
  4349. sp_digit mask;
  4350. int i;
  4351. int c;
  4352. byte y;
  4353. int err = MP_OKAY;
  4354. if (bits == 0) {
  4355. err = MP_VAL;
  4356. }
  4357. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4358. if (err == MP_OKAY) {
  4359. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * (16 * 128), NULL,
  4360. DYNAMIC_TYPE_TMP_BUFFER);
  4361. if (td == NULL)
  4362. err = MEMORY_E;
  4363. }
  4364. #endif
  4365. if (err == MP_OKAY) {
  4366. norm = td;
  4367. for (i=0; i<16; i++) {
  4368. t[i] = td + i * 128;
  4369. }
  4370. sp_2048_mont_setup(m, &mp);
  4371. sp_2048_mont_norm_64(norm, m);
  4372. XMEMSET(t[1], 0, sizeof(sp_digit) * 64U);
  4373. if (reduceA != 0) {
  4374. err = sp_2048_mod_64(t[1] + 64, a, m);
  4375. if (err == MP_OKAY) {
  4376. err = sp_2048_mod_64(t[1], t[1], m);
  4377. }
  4378. }
  4379. else {
  4380. XMEMCPY(t[1] + 64, a, sizeof(sp_digit) * 64);
  4381. err = sp_2048_mod_64(t[1], t[1], m);
  4382. }
  4383. }
  4384. if (err == MP_OKAY) {
  4385. sp_2048_mont_sqr_64(t[ 2], t[ 1], m, mp);
  4386. sp_2048_mont_mul_64(t[ 3], t[ 2], t[ 1], m, mp);
  4387. sp_2048_mont_sqr_64(t[ 4], t[ 2], m, mp);
  4388. sp_2048_mont_mul_64(t[ 5], t[ 3], t[ 2], m, mp);
  4389. sp_2048_mont_sqr_64(t[ 6], t[ 3], m, mp);
  4390. sp_2048_mont_mul_64(t[ 7], t[ 4], t[ 3], m, mp);
  4391. sp_2048_mont_sqr_64(t[ 8], t[ 4], m, mp);
  4392. sp_2048_mont_mul_64(t[ 9], t[ 5], t[ 4], m, mp);
  4393. sp_2048_mont_sqr_64(t[10], t[ 5], m, mp);
  4394. sp_2048_mont_mul_64(t[11], t[ 6], t[ 5], m, mp);
  4395. sp_2048_mont_sqr_64(t[12], t[ 6], m, mp);
  4396. sp_2048_mont_mul_64(t[13], t[ 7], t[ 6], m, mp);
  4397. sp_2048_mont_sqr_64(t[14], t[ 7], m, mp);
  4398. sp_2048_mont_mul_64(t[15], t[ 8], t[ 7], m, mp);
  4399. i = (bits - 1) / 32;
  4400. n = e[i--];
  4401. c = bits & 31;
  4402. if (c == 0) {
  4403. c = 32;
  4404. }
  4405. c -= bits % 4;
  4406. if (c == 32) {
  4407. c = 28;
  4408. }
  4409. if (c < 0) {
  4410. /* Number of bits in top word is less than number needed. */
  4411. c = -c;
  4412. y = (byte)(n << c);
  4413. n = e[i--];
  4414. y |= (byte)(n >> (64 - c));
  4415. n <<= c;
  4416. c = 64 - c;
  4417. }
  4418. else if (c == 0) {
  4419. /* All bits in top word used. */
  4420. y = (byte)n;
  4421. }
  4422. else {
  4423. y = (byte)(n >> c);
  4424. n <<= 32 - c;
  4425. }
  4426. XMEMCPY(r, t[y], sizeof(sp_digit) * 64);
  4427. for (; i>=0 || c>=4; ) {
  4428. if (c == 0) {
  4429. n = e[i--];
  4430. y = (byte)(n >> 28);
  4431. n <<= 4;
  4432. c = 28;
  4433. }
  4434. else if (c < 4) {
  4435. y = (byte)(n >> 28);
  4436. n = e[i--];
  4437. c = 4 - c;
  4438. y |= (byte)(n >> (32 - c));
  4439. n <<= c;
  4440. c = 32 - c;
  4441. }
  4442. else {
  4443. y = (byte)((n >> 28) & 0xf);
  4444. n <<= 4;
  4445. c -= 4;
  4446. }
  4447. sp_2048_mont_sqr_64(r, r, m, mp);
  4448. sp_2048_mont_sqr_64(r, r, m, mp);
  4449. sp_2048_mont_sqr_64(r, r, m, mp);
  4450. sp_2048_mont_sqr_64(r, r, m, mp);
  4451. sp_2048_mont_mul_64(r, r, t[y], m, mp);
  4452. }
  4453. XMEMSET(&r[64], 0, sizeof(sp_digit) * 64U);
  4454. sp_2048_mont_reduce_64(r, m, mp);
  4455. mask = 0 - (sp_2048_cmp_64(r, m) >= 0);
  4456. sp_2048_cond_sub_64(r, r, m, mask);
  4457. }
  4458. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4459. if (td != NULL)
  4460. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  4461. #endif
  4462. return err;
  4463. }
  4464. #endif /* WOLFSSL_SP_SMALL */
  4465. #endif /* (WOLFSSL_HAVE_SP_RSA && !WOLFSSL_RSA_PUBLIC_ONLY) || WOLFSSL_HAVE_SP_DH */
  4466. #endif /* (WOLFSSL_HAVE_SP_RSA && !WOLFSSL_RSA_PUBLIC_ONLY) || WOLFSSL_HAVE_SP_DH */
  4467. #ifdef WOLFSSL_HAVE_SP_RSA
  4468. /* RSA public key operation.
  4469. *
  4470. * in Array of bytes representing the number to exponentiate, base.
  4471. * inLen Number of bytes in base.
  4472. * em Public exponent.
  4473. * mm Modulus.
  4474. * out Buffer to hold big-endian bytes of exponentiation result.
  4475. * Must be at least 256 bytes long.
  4476. * outLen Number of bytes in result.
  4477. * returns 0 on success, MP_TO_E when the outLen is too small, MP_READ_E when
  4478. * an array is too long and MEMORY_E when dynamic memory allocation fails.
  4479. */
  4480. int sp_RsaPublic_2048(const byte* in, word32 inLen, const mp_int* em,
  4481. const mp_int* mm, byte* out, word32* outLen)
  4482. {
  4483. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4484. sp_digit* a = NULL;
  4485. #else
  4486. sp_digit a[64 * 5];
  4487. #endif
  4488. sp_digit* m = NULL;
  4489. sp_digit* r = NULL;
  4490. sp_digit *ah = NULL;
  4491. sp_digit e[1] = {0};
  4492. int err = MP_OKAY;
  4493. if (*outLen < 256) {
  4494. err = MP_TO_E;
  4495. }
  4496. else if (mp_count_bits(em) > 32 || inLen > 256 ||
  4497. mp_count_bits(mm) != 2048) {
  4498. err = MP_READ_E;
  4499. }
  4500. else if (mp_iseven(mm)) {
  4501. err = MP_VAL;
  4502. }
  4503. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4504. if (err == MP_OKAY) {
  4505. a = (sp_digit*)XMALLOC(sizeof(sp_digit) * 64 * 5, NULL,
  4506. DYNAMIC_TYPE_RSA);
  4507. if (a == NULL)
  4508. err = MEMORY_E;
  4509. }
  4510. #endif
  4511. if (err == MP_OKAY) {
  4512. ah = a + 64;
  4513. r = a + 64 * 2;
  4514. m = r + 64 * 2;
  4515. sp_2048_from_bin(ah, 64, in, inLen);
  4516. #if DIGIT_BIT >= 32
  4517. e[0] = em->dp[0];
  4518. #else
  4519. e[0] = em->dp[0];
  4520. if (em->used > 1) {
  4521. e[0] |= ((sp_digit)em->dp[1]) << DIGIT_BIT;
  4522. }
  4523. #endif
  4524. if (e[0] == 0) {
  4525. err = MP_EXPTMOD_E;
  4526. }
  4527. }
  4528. if (err == MP_OKAY) {
  4529. sp_2048_from_mp(m, 64, mm);
  4530. if (e[0] == 0x10001) {
  4531. int i;
  4532. sp_digit mp;
  4533. sp_2048_mont_setup(m, &mp);
  4534. /* Convert to Montgomery form. */
  4535. XMEMSET(a, 0, sizeof(sp_digit) * 64);
  4536. err = sp_2048_mod_64_cond(r, a, m);
  4537. /* Montgomery form: r = a.R mod m */
  4538. if (err == MP_OKAY) {
  4539. /* r = a ^ 0x10000 => r = a squared 16 times */
  4540. for (i = 15; i >= 0; i--) {
  4541. sp_2048_mont_sqr_64(r, r, m, mp);
  4542. }
  4543. /* mont_red(r.R.R) = (r.R.R / R) mod m = r.R mod m
  4544. * mont_red(r.R * a) = (r.R.a / R) mod m = r.a mod m
  4545. */
  4546. sp_2048_mont_mul_64(r, r, ah, m, mp);
  4547. for (i = 63; i > 0; i--) {
  4548. if (r[i] != m[i]) {
  4549. break;
  4550. }
  4551. }
  4552. if (r[i] >= m[i]) {
  4553. sp_2048_sub_in_place_64(r, m);
  4554. }
  4555. }
  4556. }
  4557. else if (e[0] == 0x3) {
  4558. if (err == MP_OKAY) {
  4559. sp_2048_sqr_64(r, ah);
  4560. err = sp_2048_mod_64_cond(r, r, m);
  4561. }
  4562. if (err == MP_OKAY) {
  4563. sp_2048_mul_64(r, ah, r);
  4564. err = sp_2048_mod_64_cond(r, r, m);
  4565. }
  4566. }
  4567. else {
  4568. int i;
  4569. sp_digit mp;
  4570. sp_2048_mont_setup(m, &mp);
  4571. /* Convert to Montgomery form. */
  4572. XMEMSET(a, 0, sizeof(sp_digit) * 64);
  4573. err = sp_2048_mod_64_cond(a, a, m);
  4574. if (err == MP_OKAY) {
  4575. for (i = 31; i >= 0; i--) {
  4576. if (e[0] >> i) {
  4577. break;
  4578. }
  4579. }
  4580. XMEMCPY(r, a, sizeof(sp_digit) * 64);
  4581. for (i--; i >= 0; i--) {
  4582. sp_2048_mont_sqr_64(r, r, m, mp);
  4583. if (((e[0] >> i) & 1) == 1) {
  4584. sp_2048_mont_mul_64(r, r, a, m, mp);
  4585. }
  4586. }
  4587. XMEMSET(&r[64], 0, sizeof(sp_digit) * 64);
  4588. sp_2048_mont_reduce_64(r, m, mp);
  4589. for (i = 63; i > 0; i--) {
  4590. if (r[i] != m[i]) {
  4591. break;
  4592. }
  4593. }
  4594. if (r[i] >= m[i]) {
  4595. sp_2048_sub_in_place_64(r, m);
  4596. }
  4597. }
  4598. }
  4599. }
  4600. if (err == MP_OKAY) {
  4601. sp_2048_to_bin_64(r, out);
  4602. *outLen = 256;
  4603. }
  4604. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4605. if (a != NULL)
  4606. XFREE(a, NULL, DYNAMIC_TYPE_RSA);
  4607. #endif
  4608. return err;
  4609. }
  4610. #ifndef WOLFSSL_RSA_PUBLIC_ONLY
  4611. /* Conditionally add a and b using the mask m.
  4612. * m is -1 to add and 0 when not.
  4613. *
  4614. * r A single precision number representing conditional add result.
  4615. * a A single precision number to add with.
  4616. * b A single precision number to add.
  4617. * m Mask value to apply.
  4618. */
  4619. SP_NOINLINE static sp_digit sp_2048_cond_add_32(sp_digit* r, const sp_digit* a, const sp_digit* b,
  4620. sp_digit m)
  4621. {
  4622. sp_digit c = 0;
  4623. __asm__ __volatile__ (
  4624. "mov r5, #128\n\t"
  4625. "mov r9, r5\n\t"
  4626. "mov r8, #0\n\t"
  4627. "\n1:\n\t"
  4628. "ldr r6, [%[b], r8]\n\t"
  4629. "and r6, r6, %[m]\n\t"
  4630. "adds r5, %[c], #-1\n\t"
  4631. "ldr r5, [%[a], r8]\n\t"
  4632. "adcs r5, r5, r6\n\t"
  4633. "mov %[c], #0\n\t"
  4634. "adcs %[c], %[c], %[c]\n\t"
  4635. "str r5, [%[r], r8]\n\t"
  4636. "add r8, r8, #4\n\t"
  4637. "cmp r8, r9\n\t"
  4638. #ifdef __GNUC__
  4639. "blt 1b\n\t"
  4640. #else
  4641. "blt.n 1b\n\t"
  4642. #endif /* __GNUC__ */
  4643. : [c] "+r" (c)
  4644. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  4645. : "memory", "r5", "r6", "r8", "r9"
  4646. );
  4647. return c;
  4648. }
  4649. /* RSA private key operation.
  4650. *
  4651. * in Array of bytes representing the number to exponentiate, base.
  4652. * inLen Number of bytes in base.
  4653. * dm Private exponent.
  4654. * pm First prime.
  4655. * qm Second prime.
  4656. * dpm First prime's CRT exponent.
  4657. * dqm Second prime's CRT exponent.
  4658. * qim Inverse of second prime mod p.
  4659. * mm Modulus.
  4660. * out Buffer to hold big-endian bytes of exponentiation result.
  4661. * Must be at least 256 bytes long.
  4662. * outLen Number of bytes in result.
  4663. * returns 0 on success, MP_TO_E when the outLen is too small, MP_READ_E when
  4664. * an array is too long and MEMORY_E when dynamic memory allocation fails.
  4665. */
  4666. int sp_RsaPrivate_2048(const byte* in, word32 inLen, const mp_int* dm,
  4667. const mp_int* pm, const mp_int* qm, const mp_int* dpm, const mp_int* dqm,
  4668. const mp_int* qim, const mp_int* mm, byte* out, word32* outLen)
  4669. {
  4670. #if defined(SP_RSA_PRIVATE_EXP_D) || defined(RSA_LOW_MEM)
  4671. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4672. sp_digit* d = NULL;
  4673. #else
  4674. sp_digit d[64 * 4];
  4675. #endif
  4676. sp_digit* a = NULL;
  4677. sp_digit* m = NULL;
  4678. sp_digit* r = NULL;
  4679. int err = MP_OKAY;
  4680. (void)pm;
  4681. (void)qm;
  4682. (void)dpm;
  4683. (void)dqm;
  4684. (void)qim;
  4685. if (*outLen < 256U) {
  4686. err = MP_TO_E;
  4687. }
  4688. if (err == MP_OKAY) {
  4689. if (mp_count_bits(dm) > 2048) {
  4690. err = MP_READ_E;
  4691. }
  4692. else if (inLen > 256) {
  4693. err = MP_READ_E;
  4694. }
  4695. else if (mp_count_bits(mm) != 2048) {
  4696. err = MP_READ_E;
  4697. }
  4698. else if (mp_iseven(mm)) {
  4699. err = MP_VAL;
  4700. }
  4701. }
  4702. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4703. if (err == MP_OKAY) {
  4704. d = (sp_digit*)XMALLOC(sizeof(sp_digit) * 64 * 4, NULL,
  4705. DYNAMIC_TYPE_RSA);
  4706. if (d == NULL)
  4707. err = MEMORY_E;
  4708. }
  4709. #endif
  4710. if (err == MP_OKAY) {
  4711. a = d + 64;
  4712. m = a + 128;
  4713. r = a;
  4714. sp_2048_from_bin(a, 64, in, inLen);
  4715. sp_2048_from_mp(d, 64, dm);
  4716. sp_2048_from_mp(m, 64, mm);
  4717. err = sp_2048_mod_exp_64(r, a, d, 2048, m, 0);
  4718. }
  4719. if (err == MP_OKAY) {
  4720. sp_2048_to_bin_64(r, out);
  4721. *outLen = 256;
  4722. }
  4723. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4724. if (d != NULL)
  4725. #endif
  4726. {
  4727. /* only "a" and "r" are sensitive and need zeroized (same pointer) */
  4728. if (a != NULL)
  4729. ForceZero(a, sizeof(sp_digit) * 64);
  4730. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4731. XFREE(d, NULL, DYNAMIC_TYPE_RSA);
  4732. #endif
  4733. }
  4734. return err;
  4735. #else
  4736. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4737. sp_digit* a = NULL;
  4738. #else
  4739. sp_digit a[32 * 11];
  4740. #endif
  4741. sp_digit* p = NULL;
  4742. sp_digit* q = NULL;
  4743. sp_digit* dp = NULL;
  4744. sp_digit* tmpa = NULL;
  4745. sp_digit* tmpb = NULL;
  4746. sp_digit* r = NULL;
  4747. sp_digit* qi = NULL;
  4748. sp_digit* dq = NULL;
  4749. sp_digit c;
  4750. int err = MP_OKAY;
  4751. (void)dm;
  4752. (void)mm;
  4753. if (*outLen < 256) {
  4754. err = MP_TO_E;
  4755. }
  4756. else if (inLen > 256 || mp_count_bits(mm) != 2048) {
  4757. err = MP_READ_E;
  4758. }
  4759. else if (mp_iseven(mm)) {
  4760. err = MP_VAL;
  4761. }
  4762. else if (mp_iseven(pm)) {
  4763. err = MP_VAL;
  4764. }
  4765. else if (mp_iseven(qm)) {
  4766. err = MP_VAL;
  4767. }
  4768. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4769. if (err == MP_OKAY) {
  4770. a = (sp_digit*)XMALLOC(sizeof(sp_digit) * 32 * 11, NULL,
  4771. DYNAMIC_TYPE_RSA);
  4772. if (a == NULL)
  4773. err = MEMORY_E;
  4774. }
  4775. #endif
  4776. if (err == MP_OKAY) {
  4777. p = a + 64 * 2;
  4778. q = p + 32;
  4779. qi = dq = dp = q + 32;
  4780. tmpa = qi + 32;
  4781. tmpb = tmpa + 64;
  4782. r = a;
  4783. sp_2048_from_bin(a, 64, in, inLen);
  4784. sp_2048_from_mp(p, 32, pm);
  4785. sp_2048_from_mp(q, 32, qm);
  4786. sp_2048_from_mp(dp, 32, dpm);
  4787. err = sp_2048_mod_exp_32(tmpa, a, dp, 1024, p, 1);
  4788. }
  4789. if (err == MP_OKAY) {
  4790. sp_2048_from_mp(dq, 32, dqm);
  4791. err = sp_2048_mod_exp_32(tmpb, a, dq, 1024, q, 1);
  4792. }
  4793. if (err == MP_OKAY) {
  4794. c = sp_2048_sub_in_place_32(tmpa, tmpb);
  4795. c += sp_2048_cond_add_32(tmpa, tmpa, p, c);
  4796. sp_2048_cond_add_32(tmpa, tmpa, p, c);
  4797. sp_2048_from_mp(qi, 32, qim);
  4798. sp_2048_mul_32(tmpa, tmpa, qi);
  4799. err = sp_2048_mod_32(tmpa, tmpa, p);
  4800. }
  4801. if (err == MP_OKAY) {
  4802. sp_2048_mul_32(tmpa, q, tmpa);
  4803. XMEMSET(&tmpb[32], 0, sizeof(sp_digit) * 32);
  4804. sp_2048_add_64(r, tmpb, tmpa);
  4805. sp_2048_to_bin_64(r, out);
  4806. *outLen = 256;
  4807. }
  4808. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4809. if (a != NULL)
  4810. #endif
  4811. {
  4812. ForceZero(a, sizeof(sp_digit) * 32 * 11);
  4813. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  4814. XFREE(a, NULL, DYNAMIC_TYPE_RSA);
  4815. #endif
  4816. }
  4817. #endif /* SP_RSA_PRIVATE_EXP_D || RSA_LOW_MEM */
  4818. return err;
  4819. }
  4820. #endif /* WOLFSSL_RSA_PUBLIC_ONLY */
  4821. #endif /* WOLFSSL_HAVE_SP_RSA */
  4822. #if defined(WOLFSSL_HAVE_SP_DH) || (defined(WOLFSSL_HAVE_SP_RSA) && \
  4823. !defined(WOLFSSL_RSA_PUBLIC_ONLY))
  4824. /* Convert an array of sp_digit to an mp_int.
  4825. *
  4826. * a A single precision integer.
  4827. * r A multi-precision integer.
  4828. */
  4829. static int sp_2048_to_mp(const sp_digit* a, mp_int* r)
  4830. {
  4831. int err;
  4832. err = mp_grow(r, (2048 + DIGIT_BIT - 1) / DIGIT_BIT);
  4833. if (err == MP_OKAY) { /*lint !e774 case where err is always MP_OKAY*/
  4834. #if DIGIT_BIT == 32
  4835. XMEMCPY(r->dp, a, sizeof(sp_digit) * 64);
  4836. r->used = 64;
  4837. mp_clamp(r);
  4838. #elif DIGIT_BIT < 32
  4839. int i;
  4840. int j = 0;
  4841. int s = 0;
  4842. r->dp[0] = 0;
  4843. for (i = 0; i < 64; i++) {
  4844. r->dp[j] |= (mp_digit)(a[i] << s);
  4845. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  4846. s = DIGIT_BIT - s;
  4847. r->dp[++j] = (mp_digit)(a[i] >> s);
  4848. while (s + DIGIT_BIT <= 32) {
  4849. s += DIGIT_BIT;
  4850. r->dp[j++] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  4851. if (s == SP_WORD_SIZE) {
  4852. r->dp[j] = 0;
  4853. }
  4854. else {
  4855. r->dp[j] = (mp_digit)(a[i] >> s);
  4856. }
  4857. }
  4858. s = 32 - s;
  4859. }
  4860. r->used = (2048 + DIGIT_BIT - 1) / DIGIT_BIT;
  4861. mp_clamp(r);
  4862. #else
  4863. int i;
  4864. int j = 0;
  4865. int s = 0;
  4866. r->dp[0] = 0;
  4867. for (i = 0; i < 64; i++) {
  4868. r->dp[j] |= ((mp_digit)a[i]) << s;
  4869. if (s + 32 >= DIGIT_BIT) {
  4870. #if DIGIT_BIT != 32 && DIGIT_BIT != 64
  4871. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  4872. #endif
  4873. s = DIGIT_BIT - s;
  4874. r->dp[++j] = a[i] >> s;
  4875. s = 32 - s;
  4876. }
  4877. else {
  4878. s += 32;
  4879. }
  4880. }
  4881. r->used = (2048 + DIGIT_BIT - 1) / DIGIT_BIT;
  4882. mp_clamp(r);
  4883. #endif
  4884. }
  4885. return err;
  4886. }
  4887. /* Perform the modular exponentiation for Diffie-Hellman.
  4888. *
  4889. * base Base. MP integer.
  4890. * exp Exponent. MP integer.
  4891. * mod Modulus. MP integer.
  4892. * res Result. MP integer.
  4893. * returns 0 on success, MP_READ_E if there are too many bytes in an array
  4894. * and MEMORY_E if memory allocation fails.
  4895. */
  4896. int sp_ModExp_2048(const mp_int* base, const mp_int* exp, const mp_int* mod,
  4897. mp_int* res)
  4898. {
  4899. int err = MP_OKAY;
  4900. sp_digit b[128];
  4901. sp_digit e[64];
  4902. sp_digit m[64];
  4903. sp_digit* r = b;
  4904. int expBits = mp_count_bits(exp);
  4905. if (mp_count_bits(base) > 2048) {
  4906. err = MP_READ_E;
  4907. }
  4908. else if (expBits > 2048) {
  4909. err = MP_READ_E;
  4910. }
  4911. else if (mp_count_bits(mod) != 2048) {
  4912. err = MP_READ_E;
  4913. }
  4914. else if (mp_iseven(mod)) {
  4915. err = MP_VAL;
  4916. }
  4917. if (err == MP_OKAY) {
  4918. sp_2048_from_mp(b, 64, base);
  4919. sp_2048_from_mp(e, 64, exp);
  4920. sp_2048_from_mp(m, 64, mod);
  4921. err = sp_2048_mod_exp_64(r, b, e, expBits, m, 0);
  4922. }
  4923. if (err == MP_OKAY) {
  4924. err = sp_2048_to_mp(r, res);
  4925. }
  4926. XMEMSET(e, 0, sizeof(e));
  4927. return err;
  4928. }
  4929. #ifdef WOLFSSL_HAVE_SP_DH
  4930. #ifdef HAVE_FFDHE_2048
  4931. static void sp_2048_lshift_64(sp_digit* r, const sp_digit* a, byte n)
  4932. {
  4933. __asm__ __volatile__ (
  4934. "mov r6, #31\n\t"
  4935. "sub r6, r6, %[n]\n\t"
  4936. "add %[a], %[a], #192\n\t"
  4937. "add %[r], %[r], #192\n\t"
  4938. "ldr r3, [%[a], #60]\n\t"
  4939. "lsr r4, r3, #1\n\t"
  4940. "lsl r3, r3, %[n]\n\t"
  4941. "lsr r4, r4, r6\n\t"
  4942. "ldr r2, [%[a], #56]\n\t"
  4943. "str r4, [%[r], #64]\n\t"
  4944. "lsr r5, r2, #1\n\t"
  4945. "lsl r2, r2, %[n]\n\t"
  4946. "lsr r5, r5, r6\n\t"
  4947. "orr r3, r3, r5\n\t"
  4948. "ldr r4, [%[a], #52]\n\t"
  4949. "str r3, [%[r], #60]\n\t"
  4950. "lsr r5, r4, #1\n\t"
  4951. "lsl r4, r4, %[n]\n\t"
  4952. "lsr r5, r5, r6\n\t"
  4953. "orr r2, r2, r5\n\t"
  4954. "ldr r3, [%[a], #48]\n\t"
  4955. "str r2, [%[r], #56]\n\t"
  4956. "lsr r5, r3, #1\n\t"
  4957. "lsl r3, r3, %[n]\n\t"
  4958. "lsr r5, r5, r6\n\t"
  4959. "orr r4, r4, r5\n\t"
  4960. "ldr r2, [%[a], #44]\n\t"
  4961. "str r4, [%[r], #52]\n\t"
  4962. "lsr r5, r2, #1\n\t"
  4963. "lsl r2, r2, %[n]\n\t"
  4964. "lsr r5, r5, r6\n\t"
  4965. "orr r3, r3, r5\n\t"
  4966. "ldr r4, [%[a], #40]\n\t"
  4967. "str r3, [%[r], #48]\n\t"
  4968. "lsr r5, r4, #1\n\t"
  4969. "lsl r4, r4, %[n]\n\t"
  4970. "lsr r5, r5, r6\n\t"
  4971. "orr r2, r2, r5\n\t"
  4972. "ldr r3, [%[a], #36]\n\t"
  4973. "str r2, [%[r], #44]\n\t"
  4974. "lsr r5, r3, #1\n\t"
  4975. "lsl r3, r3, %[n]\n\t"
  4976. "lsr r5, r5, r6\n\t"
  4977. "orr r4, r4, r5\n\t"
  4978. "ldr r2, [%[a], #32]\n\t"
  4979. "str r4, [%[r], #40]\n\t"
  4980. "lsr r5, r2, #1\n\t"
  4981. "lsl r2, r2, %[n]\n\t"
  4982. "lsr r5, r5, r6\n\t"
  4983. "orr r3, r3, r5\n\t"
  4984. "ldr r4, [%[a], #28]\n\t"
  4985. "str r3, [%[r], #36]\n\t"
  4986. "lsr r5, r4, #1\n\t"
  4987. "lsl r4, r4, %[n]\n\t"
  4988. "lsr r5, r5, r6\n\t"
  4989. "orr r2, r2, r5\n\t"
  4990. "ldr r3, [%[a], #24]\n\t"
  4991. "str r2, [%[r], #32]\n\t"
  4992. "lsr r5, r3, #1\n\t"
  4993. "lsl r3, r3, %[n]\n\t"
  4994. "lsr r5, r5, r6\n\t"
  4995. "orr r4, r4, r5\n\t"
  4996. "ldr r2, [%[a], #20]\n\t"
  4997. "str r4, [%[r], #28]\n\t"
  4998. "lsr r5, r2, #1\n\t"
  4999. "lsl r2, r2, %[n]\n\t"
  5000. "lsr r5, r5, r6\n\t"
  5001. "orr r3, r3, r5\n\t"
  5002. "ldr r4, [%[a], #16]\n\t"
  5003. "str r3, [%[r], #24]\n\t"
  5004. "lsr r5, r4, #1\n\t"
  5005. "lsl r4, r4, %[n]\n\t"
  5006. "lsr r5, r5, r6\n\t"
  5007. "orr r2, r2, r5\n\t"
  5008. "ldr r3, [%[a], #12]\n\t"
  5009. "str r2, [%[r], #20]\n\t"
  5010. "lsr r5, r3, #1\n\t"
  5011. "lsl r3, r3, %[n]\n\t"
  5012. "lsr r5, r5, r6\n\t"
  5013. "orr r4, r4, r5\n\t"
  5014. "ldr r2, [%[a], #8]\n\t"
  5015. "str r4, [%[r], #16]\n\t"
  5016. "lsr r5, r2, #1\n\t"
  5017. "lsl r2, r2, %[n]\n\t"
  5018. "lsr r5, r5, r6\n\t"
  5019. "orr r3, r3, r5\n\t"
  5020. "ldr r4, [%[a], #4]\n\t"
  5021. "str r3, [%[r], #12]\n\t"
  5022. "lsr r5, r4, #1\n\t"
  5023. "lsl r4, r4, %[n]\n\t"
  5024. "lsr r5, r5, r6\n\t"
  5025. "orr r2, r2, r5\n\t"
  5026. "ldr r3, [%[a], #0]\n\t"
  5027. "str r2, [%[r], #8]\n\t"
  5028. "lsr r5, r3, #1\n\t"
  5029. "lsl r3, r3, %[n]\n\t"
  5030. "lsr r5, r5, r6\n\t"
  5031. "orr r4, r4, r5\n\t"
  5032. "sub %[a], %[a], #64\n\t"
  5033. "sub %[r], %[r], #64\n\t"
  5034. "ldr r2, [%[a], #60]\n\t"
  5035. "str r4, [%[r], #68]\n\t"
  5036. "lsr r5, r2, #1\n\t"
  5037. "lsl r2, r2, %[n]\n\t"
  5038. "lsr r5, r5, r6\n\t"
  5039. "orr r3, r3, r5\n\t"
  5040. "ldr r4, [%[a], #56]\n\t"
  5041. "str r3, [%[r], #64]\n\t"
  5042. "lsr r5, r4, #1\n\t"
  5043. "lsl r4, r4, %[n]\n\t"
  5044. "lsr r5, r5, r6\n\t"
  5045. "orr r2, r2, r5\n\t"
  5046. "ldr r3, [%[a], #52]\n\t"
  5047. "str r2, [%[r], #60]\n\t"
  5048. "lsr r5, r3, #1\n\t"
  5049. "lsl r3, r3, %[n]\n\t"
  5050. "lsr r5, r5, r6\n\t"
  5051. "orr r4, r4, r5\n\t"
  5052. "ldr r2, [%[a], #48]\n\t"
  5053. "str r4, [%[r], #56]\n\t"
  5054. "lsr r5, r2, #1\n\t"
  5055. "lsl r2, r2, %[n]\n\t"
  5056. "lsr r5, r5, r6\n\t"
  5057. "orr r3, r3, r5\n\t"
  5058. "ldr r4, [%[a], #44]\n\t"
  5059. "str r3, [%[r], #52]\n\t"
  5060. "lsr r5, r4, #1\n\t"
  5061. "lsl r4, r4, %[n]\n\t"
  5062. "lsr r5, r5, r6\n\t"
  5063. "orr r2, r2, r5\n\t"
  5064. "ldr r3, [%[a], #40]\n\t"
  5065. "str r2, [%[r], #48]\n\t"
  5066. "lsr r5, r3, #1\n\t"
  5067. "lsl r3, r3, %[n]\n\t"
  5068. "lsr r5, r5, r6\n\t"
  5069. "orr r4, r4, r5\n\t"
  5070. "ldr r2, [%[a], #36]\n\t"
  5071. "str r4, [%[r], #44]\n\t"
  5072. "lsr r5, r2, #1\n\t"
  5073. "lsl r2, r2, %[n]\n\t"
  5074. "lsr r5, r5, r6\n\t"
  5075. "orr r3, r3, r5\n\t"
  5076. "ldr r4, [%[a], #32]\n\t"
  5077. "str r3, [%[r], #40]\n\t"
  5078. "lsr r5, r4, #1\n\t"
  5079. "lsl r4, r4, %[n]\n\t"
  5080. "lsr r5, r5, r6\n\t"
  5081. "orr r2, r2, r5\n\t"
  5082. "ldr r3, [%[a], #28]\n\t"
  5083. "str r2, [%[r], #36]\n\t"
  5084. "lsr r5, r3, #1\n\t"
  5085. "lsl r3, r3, %[n]\n\t"
  5086. "lsr r5, r5, r6\n\t"
  5087. "orr r4, r4, r5\n\t"
  5088. "ldr r2, [%[a], #24]\n\t"
  5089. "str r4, [%[r], #32]\n\t"
  5090. "lsr r5, r2, #1\n\t"
  5091. "lsl r2, r2, %[n]\n\t"
  5092. "lsr r5, r5, r6\n\t"
  5093. "orr r3, r3, r5\n\t"
  5094. "ldr r4, [%[a], #20]\n\t"
  5095. "str r3, [%[r], #28]\n\t"
  5096. "lsr r5, r4, #1\n\t"
  5097. "lsl r4, r4, %[n]\n\t"
  5098. "lsr r5, r5, r6\n\t"
  5099. "orr r2, r2, r5\n\t"
  5100. "ldr r3, [%[a], #16]\n\t"
  5101. "str r2, [%[r], #24]\n\t"
  5102. "lsr r5, r3, #1\n\t"
  5103. "lsl r3, r3, %[n]\n\t"
  5104. "lsr r5, r5, r6\n\t"
  5105. "orr r4, r4, r5\n\t"
  5106. "ldr r2, [%[a], #12]\n\t"
  5107. "str r4, [%[r], #20]\n\t"
  5108. "lsr r5, r2, #1\n\t"
  5109. "lsl r2, r2, %[n]\n\t"
  5110. "lsr r5, r5, r6\n\t"
  5111. "orr r3, r3, r5\n\t"
  5112. "ldr r4, [%[a], #8]\n\t"
  5113. "str r3, [%[r], #16]\n\t"
  5114. "lsr r5, r4, #1\n\t"
  5115. "lsl r4, r4, %[n]\n\t"
  5116. "lsr r5, r5, r6\n\t"
  5117. "orr r2, r2, r5\n\t"
  5118. "ldr r3, [%[a], #4]\n\t"
  5119. "str r2, [%[r], #12]\n\t"
  5120. "lsr r5, r3, #1\n\t"
  5121. "lsl r3, r3, %[n]\n\t"
  5122. "lsr r5, r5, r6\n\t"
  5123. "orr r4, r4, r5\n\t"
  5124. "ldr r2, [%[a], #0]\n\t"
  5125. "str r4, [%[r], #8]\n\t"
  5126. "lsr r5, r2, #1\n\t"
  5127. "lsl r2, r2, %[n]\n\t"
  5128. "lsr r5, r5, r6\n\t"
  5129. "orr r3, r3, r5\n\t"
  5130. "sub %[a], %[a], #64\n\t"
  5131. "sub %[r], %[r], #64\n\t"
  5132. "ldr r4, [%[a], #60]\n\t"
  5133. "str r3, [%[r], #68]\n\t"
  5134. "lsr r5, r4, #1\n\t"
  5135. "lsl r4, r4, %[n]\n\t"
  5136. "lsr r5, r5, r6\n\t"
  5137. "orr r2, r2, r5\n\t"
  5138. "ldr r3, [%[a], #56]\n\t"
  5139. "str r2, [%[r], #64]\n\t"
  5140. "lsr r5, r3, #1\n\t"
  5141. "lsl r3, r3, %[n]\n\t"
  5142. "lsr r5, r5, r6\n\t"
  5143. "orr r4, r4, r5\n\t"
  5144. "ldr r2, [%[a], #52]\n\t"
  5145. "str r4, [%[r], #60]\n\t"
  5146. "lsr r5, r2, #1\n\t"
  5147. "lsl r2, r2, %[n]\n\t"
  5148. "lsr r5, r5, r6\n\t"
  5149. "orr r3, r3, r5\n\t"
  5150. "ldr r4, [%[a], #48]\n\t"
  5151. "str r3, [%[r], #56]\n\t"
  5152. "lsr r5, r4, #1\n\t"
  5153. "lsl r4, r4, %[n]\n\t"
  5154. "lsr r5, r5, r6\n\t"
  5155. "orr r2, r2, r5\n\t"
  5156. "ldr r3, [%[a], #44]\n\t"
  5157. "str r2, [%[r], #52]\n\t"
  5158. "lsr r5, r3, #1\n\t"
  5159. "lsl r3, r3, %[n]\n\t"
  5160. "lsr r5, r5, r6\n\t"
  5161. "orr r4, r4, r5\n\t"
  5162. "ldr r2, [%[a], #40]\n\t"
  5163. "str r4, [%[r], #48]\n\t"
  5164. "lsr r5, r2, #1\n\t"
  5165. "lsl r2, r2, %[n]\n\t"
  5166. "lsr r5, r5, r6\n\t"
  5167. "orr r3, r3, r5\n\t"
  5168. "ldr r4, [%[a], #36]\n\t"
  5169. "str r3, [%[r], #44]\n\t"
  5170. "lsr r5, r4, #1\n\t"
  5171. "lsl r4, r4, %[n]\n\t"
  5172. "lsr r5, r5, r6\n\t"
  5173. "orr r2, r2, r5\n\t"
  5174. "ldr r3, [%[a], #32]\n\t"
  5175. "str r2, [%[r], #40]\n\t"
  5176. "lsr r5, r3, #1\n\t"
  5177. "lsl r3, r3, %[n]\n\t"
  5178. "lsr r5, r5, r6\n\t"
  5179. "orr r4, r4, r5\n\t"
  5180. "ldr r2, [%[a], #28]\n\t"
  5181. "str r4, [%[r], #36]\n\t"
  5182. "lsr r5, r2, #1\n\t"
  5183. "lsl r2, r2, %[n]\n\t"
  5184. "lsr r5, r5, r6\n\t"
  5185. "orr r3, r3, r5\n\t"
  5186. "ldr r4, [%[a], #24]\n\t"
  5187. "str r3, [%[r], #32]\n\t"
  5188. "lsr r5, r4, #1\n\t"
  5189. "lsl r4, r4, %[n]\n\t"
  5190. "lsr r5, r5, r6\n\t"
  5191. "orr r2, r2, r5\n\t"
  5192. "ldr r3, [%[a], #20]\n\t"
  5193. "str r2, [%[r], #28]\n\t"
  5194. "lsr r5, r3, #1\n\t"
  5195. "lsl r3, r3, %[n]\n\t"
  5196. "lsr r5, r5, r6\n\t"
  5197. "orr r4, r4, r5\n\t"
  5198. "ldr r2, [%[a], #16]\n\t"
  5199. "str r4, [%[r], #24]\n\t"
  5200. "lsr r5, r2, #1\n\t"
  5201. "lsl r2, r2, %[n]\n\t"
  5202. "lsr r5, r5, r6\n\t"
  5203. "orr r3, r3, r5\n\t"
  5204. "ldr r4, [%[a], #12]\n\t"
  5205. "str r3, [%[r], #20]\n\t"
  5206. "lsr r5, r4, #1\n\t"
  5207. "lsl r4, r4, %[n]\n\t"
  5208. "lsr r5, r5, r6\n\t"
  5209. "orr r2, r2, r5\n\t"
  5210. "ldr r3, [%[a], #8]\n\t"
  5211. "str r2, [%[r], #16]\n\t"
  5212. "lsr r5, r3, #1\n\t"
  5213. "lsl r3, r3, %[n]\n\t"
  5214. "lsr r5, r5, r6\n\t"
  5215. "orr r4, r4, r5\n\t"
  5216. "ldr r2, [%[a], #4]\n\t"
  5217. "str r4, [%[r], #12]\n\t"
  5218. "lsr r5, r2, #1\n\t"
  5219. "lsl r2, r2, %[n]\n\t"
  5220. "lsr r5, r5, r6\n\t"
  5221. "orr r3, r3, r5\n\t"
  5222. "ldr r4, [%[a], #0]\n\t"
  5223. "str r3, [%[r], #8]\n\t"
  5224. "lsr r5, r4, #1\n\t"
  5225. "lsl r4, r4, %[n]\n\t"
  5226. "lsr r5, r5, r6\n\t"
  5227. "orr r2, r2, r5\n\t"
  5228. "sub %[a], %[a], #64\n\t"
  5229. "sub %[r], %[r], #64\n\t"
  5230. "ldr r3, [%[a], #60]\n\t"
  5231. "str r2, [%[r], #68]\n\t"
  5232. "lsr r5, r3, #1\n\t"
  5233. "lsl r3, r3, %[n]\n\t"
  5234. "lsr r5, r5, r6\n\t"
  5235. "orr r4, r4, r5\n\t"
  5236. "ldr r2, [%[a], #56]\n\t"
  5237. "str r4, [%[r], #64]\n\t"
  5238. "lsr r5, r2, #1\n\t"
  5239. "lsl r2, r2, %[n]\n\t"
  5240. "lsr r5, r5, r6\n\t"
  5241. "orr r3, r3, r5\n\t"
  5242. "ldr r4, [%[a], #52]\n\t"
  5243. "str r3, [%[r], #60]\n\t"
  5244. "lsr r5, r4, #1\n\t"
  5245. "lsl r4, r4, %[n]\n\t"
  5246. "lsr r5, r5, r6\n\t"
  5247. "orr r2, r2, r5\n\t"
  5248. "ldr r3, [%[a], #48]\n\t"
  5249. "str r2, [%[r], #56]\n\t"
  5250. "lsr r5, r3, #1\n\t"
  5251. "lsl r3, r3, %[n]\n\t"
  5252. "lsr r5, r5, r6\n\t"
  5253. "orr r4, r4, r5\n\t"
  5254. "ldr r2, [%[a], #44]\n\t"
  5255. "str r4, [%[r], #52]\n\t"
  5256. "lsr r5, r2, #1\n\t"
  5257. "lsl r2, r2, %[n]\n\t"
  5258. "lsr r5, r5, r6\n\t"
  5259. "orr r3, r3, r5\n\t"
  5260. "ldr r4, [%[a], #40]\n\t"
  5261. "str r3, [%[r], #48]\n\t"
  5262. "lsr r5, r4, #1\n\t"
  5263. "lsl r4, r4, %[n]\n\t"
  5264. "lsr r5, r5, r6\n\t"
  5265. "orr r2, r2, r5\n\t"
  5266. "ldr r3, [%[a], #36]\n\t"
  5267. "str r2, [%[r], #44]\n\t"
  5268. "lsr r5, r3, #1\n\t"
  5269. "lsl r3, r3, %[n]\n\t"
  5270. "lsr r5, r5, r6\n\t"
  5271. "orr r4, r4, r5\n\t"
  5272. "ldr r2, [%[a], #32]\n\t"
  5273. "str r4, [%[r], #40]\n\t"
  5274. "lsr r5, r2, #1\n\t"
  5275. "lsl r2, r2, %[n]\n\t"
  5276. "lsr r5, r5, r6\n\t"
  5277. "orr r3, r3, r5\n\t"
  5278. "ldr r4, [%[a], #28]\n\t"
  5279. "str r3, [%[r], #36]\n\t"
  5280. "lsr r5, r4, #1\n\t"
  5281. "lsl r4, r4, %[n]\n\t"
  5282. "lsr r5, r5, r6\n\t"
  5283. "orr r2, r2, r5\n\t"
  5284. "ldr r3, [%[a], #24]\n\t"
  5285. "str r2, [%[r], #32]\n\t"
  5286. "lsr r5, r3, #1\n\t"
  5287. "lsl r3, r3, %[n]\n\t"
  5288. "lsr r5, r5, r6\n\t"
  5289. "orr r4, r4, r5\n\t"
  5290. "ldr r2, [%[a], #20]\n\t"
  5291. "str r4, [%[r], #28]\n\t"
  5292. "lsr r5, r2, #1\n\t"
  5293. "lsl r2, r2, %[n]\n\t"
  5294. "lsr r5, r5, r6\n\t"
  5295. "orr r3, r3, r5\n\t"
  5296. "ldr r4, [%[a], #16]\n\t"
  5297. "str r3, [%[r], #24]\n\t"
  5298. "lsr r5, r4, #1\n\t"
  5299. "lsl r4, r4, %[n]\n\t"
  5300. "lsr r5, r5, r6\n\t"
  5301. "orr r2, r2, r5\n\t"
  5302. "ldr r3, [%[a], #12]\n\t"
  5303. "str r2, [%[r], #20]\n\t"
  5304. "lsr r5, r3, #1\n\t"
  5305. "lsl r3, r3, %[n]\n\t"
  5306. "lsr r5, r5, r6\n\t"
  5307. "orr r4, r4, r5\n\t"
  5308. "ldr r2, [%[a], #8]\n\t"
  5309. "str r4, [%[r], #16]\n\t"
  5310. "lsr r5, r2, #1\n\t"
  5311. "lsl r2, r2, %[n]\n\t"
  5312. "lsr r5, r5, r6\n\t"
  5313. "orr r3, r3, r5\n\t"
  5314. "ldr r4, [%[a], #4]\n\t"
  5315. "str r3, [%[r], #12]\n\t"
  5316. "lsr r5, r4, #1\n\t"
  5317. "lsl r4, r4, %[n]\n\t"
  5318. "lsr r5, r5, r6\n\t"
  5319. "orr r2, r2, r5\n\t"
  5320. "ldr r3, [%[a], #0]\n\t"
  5321. "str r2, [%[r], #8]\n\t"
  5322. "lsr r5, r3, #1\n\t"
  5323. "lsl r3, r3, %[n]\n\t"
  5324. "lsr r5, r5, r6\n\t"
  5325. "orr r4, r4, r5\n\t"
  5326. "str r3, [%[r]]\n\t"
  5327. "str r4, [%[r], #4]\n\t"
  5328. :
  5329. : [r] "r" (r), [a] "r" (a), [n] "r" (n)
  5330. : "memory", "r2", "r3", "r4", "r5", "r6"
  5331. );
  5332. }
  5333. /* Modular exponentiate 2 to the e mod m. (r = 2^e mod m)
  5334. *
  5335. * r A single precision number that is the result of the operation.
  5336. * e A single precision number that is the exponent.
  5337. * bits The number of bits in the exponent.
  5338. * m A single precision number that is the modulus.
  5339. * returns 0 on success.
  5340. * returns MEMORY_E on dynamic memory allocation failure.
  5341. * returns MP_VAL when base is even.
  5342. */
  5343. static int sp_2048_mod_exp_2_64(sp_digit* r, const sp_digit* e, int bits,
  5344. const sp_digit* m)
  5345. {
  5346. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  5347. sp_digit* td = NULL;
  5348. #else
  5349. sp_digit td[193];
  5350. #endif
  5351. sp_digit* norm = NULL;
  5352. sp_digit* tmp = NULL;
  5353. sp_digit mp = 1;
  5354. sp_digit n;
  5355. sp_digit o;
  5356. sp_digit mask;
  5357. int i;
  5358. int c;
  5359. byte y;
  5360. int err = MP_OKAY;
  5361. if (bits == 0) {
  5362. err = MP_VAL;
  5363. }
  5364. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  5365. if (err == MP_OKAY) {
  5366. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * 193, NULL,
  5367. DYNAMIC_TYPE_TMP_BUFFER);
  5368. if (td == NULL)
  5369. err = MEMORY_E;
  5370. }
  5371. #endif
  5372. if (err == MP_OKAY) {
  5373. norm = td;
  5374. tmp = td + 128;
  5375. sp_2048_mont_setup(m, &mp);
  5376. sp_2048_mont_norm_64(norm, m);
  5377. i = (bits - 1) / 32;
  5378. n = e[i--];
  5379. c = bits & 31;
  5380. if (c == 0) {
  5381. c = 32;
  5382. }
  5383. c -= bits % 5;
  5384. if (c == 32) {
  5385. c = 27;
  5386. }
  5387. if (c < 0) {
  5388. /* Number of bits in top word is less than number needed. */
  5389. c = -c;
  5390. y = (byte)(n << c);
  5391. n = e[i--];
  5392. y |= (byte)(n >> (64 - c));
  5393. n <<= c;
  5394. c = 64 - c;
  5395. }
  5396. else if (c == 0) {
  5397. /* All bits in top word used. */
  5398. y = (byte)n;
  5399. }
  5400. else {
  5401. y = (byte)(n >> c);
  5402. n <<= 32 - c;
  5403. }
  5404. sp_2048_lshift_64(r, norm, y);
  5405. for (; i>=0 || c>=5; ) {
  5406. if (c == 0) {
  5407. n = e[i--];
  5408. y = (byte)(n >> 27);
  5409. n <<= 5;
  5410. c = 27;
  5411. }
  5412. else if (c < 5) {
  5413. y = (byte)(n >> 27);
  5414. n = e[i--];
  5415. c = 5 - c;
  5416. y |= (byte)(n >> (32 - c));
  5417. n <<= c;
  5418. c = 32 - c;
  5419. }
  5420. else {
  5421. y = (byte)((n >> 27) & 0x1f);
  5422. n <<= 5;
  5423. c -= 5;
  5424. }
  5425. sp_2048_mont_sqr_64(r, r, m, mp);
  5426. sp_2048_mont_sqr_64(r, r, m, mp);
  5427. sp_2048_mont_sqr_64(r, r, m, mp);
  5428. sp_2048_mont_sqr_64(r, r, m, mp);
  5429. sp_2048_mont_sqr_64(r, r, m, mp);
  5430. sp_2048_lshift_64(r, r, y);
  5431. sp_2048_mul_d_64(tmp, norm, r[64]);
  5432. r[64] = 0;
  5433. o = sp_2048_add_64(r, r, tmp);
  5434. sp_2048_cond_sub_64(r, r, m, (sp_digit)0 - o);
  5435. }
  5436. XMEMSET(&r[64], 0, sizeof(sp_digit) * 64U);
  5437. sp_2048_mont_reduce_64(r, m, mp);
  5438. mask = 0 - (sp_2048_cmp_64(r, m) >= 0);
  5439. sp_2048_cond_sub_64(r, r, m, mask);
  5440. }
  5441. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  5442. if (td != NULL)
  5443. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  5444. #endif
  5445. return err;
  5446. }
  5447. #endif /* HAVE_FFDHE_2048 */
  5448. /* Perform the modular exponentiation for Diffie-Hellman.
  5449. *
  5450. * base Base.
  5451. * exp Array of bytes that is the exponent.
  5452. * expLen Length of data, in bytes, in exponent.
  5453. * mod Modulus.
  5454. * out Buffer to hold big-endian bytes of exponentiation result.
  5455. * Must be at least 256 bytes long.
  5456. * outLen Length, in bytes, of exponentiation result.
  5457. * returns 0 on success, MP_READ_E if there are too many bytes in an array
  5458. * and MEMORY_E if memory allocation fails.
  5459. */
  5460. int sp_DhExp_2048(const mp_int* base, const byte* exp, word32 expLen,
  5461. const mp_int* mod, byte* out, word32* outLen)
  5462. {
  5463. int err = MP_OKAY;
  5464. sp_digit b[128];
  5465. sp_digit e[64];
  5466. sp_digit m[64];
  5467. sp_digit* r = b;
  5468. word32 i;
  5469. if (mp_count_bits(base) > 2048) {
  5470. err = MP_READ_E;
  5471. }
  5472. else if (expLen > 256) {
  5473. err = MP_READ_E;
  5474. }
  5475. else if (mp_count_bits(mod) != 2048) {
  5476. err = MP_READ_E;
  5477. }
  5478. else if (mp_iseven(mod)) {
  5479. err = MP_VAL;
  5480. }
  5481. if (err == MP_OKAY) {
  5482. sp_2048_from_mp(b, 64, base);
  5483. sp_2048_from_bin(e, 64, exp, expLen);
  5484. sp_2048_from_mp(m, 64, mod);
  5485. #ifdef HAVE_FFDHE_2048
  5486. if (base->used == 1 && base->dp[0] == 2 && m[63] == (sp_digit)-1)
  5487. err = sp_2048_mod_exp_2_64(r, e, expLen * 8, m);
  5488. else
  5489. #endif
  5490. err = sp_2048_mod_exp_64(r, b, e, expLen * 8, m, 0);
  5491. }
  5492. if (err == MP_OKAY) {
  5493. sp_2048_to_bin_64(r, out);
  5494. *outLen = 256;
  5495. for (i=0; i<256 && out[i] == 0; i++) {
  5496. /* Search for first non-zero. */
  5497. }
  5498. *outLen -= i;
  5499. XMEMMOVE(out, out + i, *outLen);
  5500. }
  5501. XMEMSET(e, 0, sizeof(e));
  5502. return err;
  5503. }
  5504. #endif /* WOLFSSL_HAVE_SP_DH */
  5505. /* Perform the modular exponentiation for Diffie-Hellman.
  5506. *
  5507. * base Base. MP integer.
  5508. * exp Exponent. MP integer.
  5509. * mod Modulus. MP integer.
  5510. * res Result. MP integer.
  5511. * returns 0 on success, MP_READ_E if there are too many bytes in an array
  5512. * and MEMORY_E if memory allocation fails.
  5513. */
  5514. int sp_ModExp_1024(const mp_int* base, const mp_int* exp, const mp_int* mod,
  5515. mp_int* res)
  5516. {
  5517. int err = MP_OKAY;
  5518. sp_digit b[64];
  5519. sp_digit e[32];
  5520. sp_digit m[32];
  5521. sp_digit* r = b;
  5522. int expBits = mp_count_bits(exp);
  5523. if (mp_count_bits(base) > 1024) {
  5524. err = MP_READ_E;
  5525. }
  5526. else if (expBits > 1024) {
  5527. err = MP_READ_E;
  5528. }
  5529. else if (mp_count_bits(mod) != 1024) {
  5530. err = MP_READ_E;
  5531. }
  5532. else if (mp_iseven(mod)) {
  5533. err = MP_VAL;
  5534. }
  5535. if (err == MP_OKAY) {
  5536. sp_2048_from_mp(b, 32, base);
  5537. sp_2048_from_mp(e, 32, exp);
  5538. sp_2048_from_mp(m, 32, mod);
  5539. err = sp_2048_mod_exp_32(r, b, e, expBits, m, 0);
  5540. }
  5541. if (err == MP_OKAY) {
  5542. XMEMSET(r + 32, 0, sizeof(*r) * 32U);
  5543. err = sp_2048_to_mp(r, res);
  5544. res->used = mod->used;
  5545. mp_clamp(res);
  5546. }
  5547. XMEMSET(e, 0, sizeof(e));
  5548. return err;
  5549. }
  5550. #endif /* WOLFSSL_HAVE_SP_DH | (WOLFSSL_HAVE_SP_RSA & !WOLFSSL_RSA_PUBLIC_ONLY) */
  5551. #endif /* !WOLFSSL_SP_NO_2048 */
  5552. #ifndef WOLFSSL_SP_NO_3072
  5553. /* Read big endian unsigned byte array into r.
  5554. *
  5555. * r A single precision integer.
  5556. * size Maximum number of bytes to convert
  5557. * a Byte array.
  5558. * n Number of bytes in array to read.
  5559. */
  5560. static void sp_3072_from_bin(sp_digit* r, int size, const byte* a, int n)
  5561. {
  5562. int i;
  5563. int j;
  5564. byte* d;
  5565. for (i = n - 1,j = 0; i >= 3; i -= 4) {
  5566. r[j] = ((sp_digit)a[i - 0] << 0) |
  5567. ((sp_digit)a[i - 1] << 8) |
  5568. ((sp_digit)a[i - 2] << 16) |
  5569. ((sp_digit)a[i - 3] << 24);
  5570. j++;
  5571. }
  5572. if (i >= 0) {
  5573. r[j] = 0;
  5574. d = (byte*)r;
  5575. switch (i) {
  5576. case 2: d[n - 1 - 2] = a[2]; //fallthrough
  5577. case 1: d[n - 1 - 1] = a[1]; //fallthrough
  5578. case 0: d[n - 1 - 0] = a[0]; //fallthrough
  5579. }
  5580. j++;
  5581. }
  5582. for (; j < size; j++) {
  5583. r[j] = 0;
  5584. }
  5585. }
  5586. /* Convert an mp_int to an array of sp_digit.
  5587. *
  5588. * r A single precision integer.
  5589. * size Maximum number of bytes to convert
  5590. * a A multi-precision integer.
  5591. */
  5592. static void sp_3072_from_mp(sp_digit* r, int size, const mp_int* a)
  5593. {
  5594. #if DIGIT_BIT == 32
  5595. int j;
  5596. XMEMCPY(r, a->dp, sizeof(sp_digit) * a->used);
  5597. for (j = a->used; j < size; j++) {
  5598. r[j] = 0;
  5599. }
  5600. #elif DIGIT_BIT > 32
  5601. int i;
  5602. int j = 0;
  5603. word32 s = 0;
  5604. r[0] = 0;
  5605. for (i = 0; i < a->used && j < size; i++) {
  5606. r[j] |= ((sp_digit)a->dp[i] << s);
  5607. r[j] &= 0xffffffff;
  5608. s = 32U - s;
  5609. if (j + 1 >= size) {
  5610. break;
  5611. }
  5612. /* lint allow cast of mismatch word32 and mp_digit */
  5613. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  5614. while ((s + 32U) <= (word32)DIGIT_BIT) {
  5615. s += 32U;
  5616. r[j] &= 0xffffffff;
  5617. if (j + 1 >= size) {
  5618. break;
  5619. }
  5620. if (s < (word32)DIGIT_BIT) {
  5621. /* lint allow cast of mismatch word32 and mp_digit */
  5622. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  5623. }
  5624. else {
  5625. r[++j] = (sp_digit)0;
  5626. }
  5627. }
  5628. s = (word32)DIGIT_BIT - s;
  5629. }
  5630. for (j++; j < size; j++) {
  5631. r[j] = 0;
  5632. }
  5633. #else
  5634. int i;
  5635. int j = 0;
  5636. int s = 0;
  5637. r[0] = 0;
  5638. for (i = 0; i < a->used && j < size; i++) {
  5639. r[j] |= ((sp_digit)a->dp[i]) << s;
  5640. if (s + DIGIT_BIT >= 32) {
  5641. r[j] &= 0xffffffff;
  5642. if (j + 1 >= size) {
  5643. break;
  5644. }
  5645. s = 32 - s;
  5646. if (s == DIGIT_BIT) {
  5647. r[++j] = 0;
  5648. s = 0;
  5649. }
  5650. else {
  5651. r[++j] = a->dp[i] >> s;
  5652. s = DIGIT_BIT - s;
  5653. }
  5654. }
  5655. else {
  5656. s += DIGIT_BIT;
  5657. }
  5658. }
  5659. for (j++; j < size; j++) {
  5660. r[j] = 0;
  5661. }
  5662. #endif
  5663. }
  5664. /* Write r as big endian to byte array.
  5665. * Fixed length number of bytes written: 384
  5666. *
  5667. * r A single precision integer.
  5668. * a Byte array.
  5669. */
  5670. static void sp_3072_to_bin_96(sp_digit* r, byte* a)
  5671. {
  5672. int i;
  5673. int j = 0;
  5674. for (i = 95; i >= 0; i--) {
  5675. a[j++] = r[i] >> 24;
  5676. a[j++] = r[i] >> 16;
  5677. a[j++] = r[i] >> 8;
  5678. a[j++] = r[i] >> 0;
  5679. }
  5680. }
#if (defined(WOLFSSL_HAVE_SP_RSA) && (!defined(WOLFSSL_RSA_PUBLIC_ONLY) || !defined(WOLFSSL_SP_SMALL))) || defined(WOLFSSL_HAVE_SP_DH)
/* Normalize the values in each word to 32 bits.
 *
 * Expands to nothing in this implementation.
 *
 * a  Array of sp_digit to normalize.
 */
#define sp_3072_norm_96(a)

#endif /* (WOLFSSL_HAVE_SP_RSA && (!WOLFSSL_RSA_PUBLIC_ONLY || !WOLFSSL_SP_SMALL)) || WOLFSSL_HAVE_SP_DH */
/* Normalize the values in each word to 32 bits.
 *
 * Unconditional definition with the same (empty) replacement as the guarded
 * one, so it is an identical redefinition when both are active.
 *
 * a  Array of sp_digit to normalize.
 */
#define sp_3072_norm_96(a)
  5693. #ifndef WOLFSSL_SP_SMALL
  5694. /* Multiply a and b into r. (r = a * b)
  5695. *
  5696. * r A single precision integer.
  5697. * a A single precision integer.
  5698. * b A single precision integer.
  5699. */
  5700. SP_NOINLINE static void sp_3072_mul_12(sp_digit* r, const sp_digit* a,
  5701. const sp_digit* b)
  5702. {
  5703. sp_digit tmp_arr[12 * 2];
  5704. sp_digit* tmp = tmp_arr;
  5705. __asm__ __volatile__ (
  5706. "mov r3, #0\n\t"
  5707. "mov r4, #0\n\t"
  5708. "mov r9, r3\n\t"
  5709. "mov r12, %[r]\n\t"
  5710. "mov r10, %[a]\n\t"
  5711. "mov r11, %[b]\n\t"
  5712. "mov r6, #48\n\t"
  5713. "add r6, r6, r10\n\t"
  5714. "mov r14, r6\n\t"
  5715. "\n1:\n\t"
  5716. "mov %[r], #0\n\t"
  5717. "mov r5, #0\n\t"
  5718. "mov r6, #44\n\t"
  5719. "mov %[a], r9\n\t"
  5720. "subs %[a], %[a], r6\n\t"
  5721. "sbc r6, r6, r6\n\t"
  5722. "mvn r6, r6\n\t"
  5723. "and %[a], %[a], r6\n\t"
  5724. "mov %[b], r9\n\t"
  5725. "sub %[b], %[b], %[a]\n\t"
  5726. "add %[a], %[a], r10\n\t"
  5727. "add %[b], %[b], r11\n\t"
  5728. "\n2:\n\t"
  5729. /* Multiply Start */
  5730. "ldr r6, [%[a]]\n\t"
  5731. "ldr r8, [%[b]]\n\t"
  5732. "umull r6, r8, r6, r8\n\t"
  5733. "adds r3, r3, r6\n\t"
  5734. "adcs r4, r4, r8\n\t"
  5735. "adc r5, r5, %[r]\n\t"
  5736. /* Multiply Done */
  5737. "add %[a], %[a], #4\n\t"
  5738. "sub %[b], %[b], #4\n\t"
  5739. "cmp %[a], r14\n\t"
  5740. #ifdef __GNUC__
  5741. "beq 3f\n\t"
  5742. #else
  5743. "beq.n 3f\n\t"
  5744. #endif /* __GNUC__ */
  5745. "mov r6, r9\n\t"
  5746. "add r6, r6, r10\n\t"
  5747. "cmp %[a], r6\n\t"
  5748. #ifdef __GNUC__
  5749. "ble 2b\n\t"
  5750. #else
  5751. "ble.n 2b\n\t"
  5752. #endif /* __GNUC__ */
  5753. "\n3:\n\t"
  5754. "mov %[r], r12\n\t"
  5755. "mov r8, r9\n\t"
  5756. "str r3, [%[r], r8]\n\t"
  5757. "mov r3, r4\n\t"
  5758. "mov r4, r5\n\t"
  5759. "add r8, r8, #4\n\t"
  5760. "mov r9, r8\n\t"
  5761. "mov r6, #88\n\t"
  5762. "cmp r8, r6\n\t"
  5763. #ifdef __GNUC__
  5764. "ble 1b\n\t"
  5765. #else
  5766. "ble.n 1b\n\t"
  5767. #endif /* __GNUC__ */
  5768. "str r3, [%[r], r8]\n\t"
  5769. "mov %[a], r10\n\t"
  5770. "mov %[b], r11\n\t"
  5771. :
  5772. : [r] "r" (tmp), [a] "r" (a), [b] "r" (b)
  5773. : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  5774. );
  5775. XMEMCPY(r, tmp_arr, sizeof(tmp_arr));
  5776. }
  5777. /* Add b to a into r. (r = a + b)
  5778. *
  5779. * r A single precision integer.
  5780. * a A single precision integer.
  5781. * b A single precision integer.
  5782. */
  5783. SP_NOINLINE static sp_digit sp_3072_add_12(sp_digit* r, const sp_digit* a,
  5784. const sp_digit* b)
  5785. {
  5786. sp_digit c = 0;
  5787. __asm__ __volatile__ (
  5788. "ldm %[a]!, {r4, r5}\n\t"
  5789. "ldm %[b]!, {r6, r8}\n\t"
  5790. "adds r4, r4, r6\n\t"
  5791. "adcs r5, r5, r8\n\t"
  5792. "stm %[r]!, {r4, r5}\n\t"
  5793. "ldm %[a]!, {r4, r5}\n\t"
  5794. "ldm %[b]!, {r6, r8}\n\t"
  5795. "adcs r4, r4, r6\n\t"
  5796. "adcs r5, r5, r8\n\t"
  5797. "stm %[r]!, {r4, r5}\n\t"
  5798. "ldm %[a]!, {r4, r5}\n\t"
  5799. "ldm %[b]!, {r6, r8}\n\t"
  5800. "adcs r4, r4, r6\n\t"
  5801. "adcs r5, r5, r8\n\t"
  5802. "stm %[r]!, {r4, r5}\n\t"
  5803. "ldm %[a]!, {r4, r5}\n\t"
  5804. "ldm %[b]!, {r6, r8}\n\t"
  5805. "adcs r4, r4, r6\n\t"
  5806. "adcs r5, r5, r8\n\t"
  5807. "stm %[r]!, {r4, r5}\n\t"
  5808. "ldm %[a]!, {r4, r5}\n\t"
  5809. "ldm %[b]!, {r6, r8}\n\t"
  5810. "adcs r4, r4, r6\n\t"
  5811. "adcs r5, r5, r8\n\t"
  5812. "stm %[r]!, {r4, r5}\n\t"
  5813. "ldm %[a]!, {r4, r5}\n\t"
  5814. "ldm %[b]!, {r6, r8}\n\t"
  5815. "adcs r4, r4, r6\n\t"
  5816. "adcs r5, r5, r8\n\t"
  5817. "stm %[r]!, {r4, r5}\n\t"
  5818. "mov %[c], #0\n\t"
  5819. "adc %[c], %[c], %[c]\n\t"
  5820. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  5821. :
  5822. : "memory", "r4", "r5", "r6", "r8"
  5823. );
  5824. return c;
  5825. }
  5826. /* Sub b from a into r. (r = a - b)
  5827. *
  5828. * r A single precision integer.
  5829. * a A single precision integer.
  5830. * b A single precision integer.
  5831. */
  5832. SP_NOINLINE static sp_digit sp_3072_sub_in_place_24(sp_digit* a,
  5833. const sp_digit* b)
  5834. {
  5835. sp_digit c = 0;
  5836. __asm__ __volatile__ (
  5837. "ldm %[a], {r3, r4}\n\t"
  5838. "ldm %[b]!, {r5, r6}\n\t"
  5839. "subs r3, r3, r5\n\t"
  5840. "sbcs r4, r4, r6\n\t"
  5841. "stm %[a]!, {r3, r4}\n\t"
  5842. "ldm %[a], {r3, r4}\n\t"
  5843. "ldm %[b]!, {r5, r6}\n\t"
  5844. "sbcs r3, r3, r5\n\t"
  5845. "sbcs r4, r4, r6\n\t"
  5846. "stm %[a]!, {r3, r4}\n\t"
  5847. "ldm %[a], {r3, r4}\n\t"
  5848. "ldm %[b]!, {r5, r6}\n\t"
  5849. "sbcs r3, r3, r5\n\t"
  5850. "sbcs r4, r4, r6\n\t"
  5851. "stm %[a]!, {r3, r4}\n\t"
  5852. "ldm %[a], {r3, r4}\n\t"
  5853. "ldm %[b]!, {r5, r6}\n\t"
  5854. "sbcs r3, r3, r5\n\t"
  5855. "sbcs r4, r4, r6\n\t"
  5856. "stm %[a]!, {r3, r4}\n\t"
  5857. "ldm %[a], {r3, r4}\n\t"
  5858. "ldm %[b]!, {r5, r6}\n\t"
  5859. "sbcs r3, r3, r5\n\t"
  5860. "sbcs r4, r4, r6\n\t"
  5861. "stm %[a]!, {r3, r4}\n\t"
  5862. "ldm %[a], {r3, r4}\n\t"
  5863. "ldm %[b]!, {r5, r6}\n\t"
  5864. "sbcs r3, r3, r5\n\t"
  5865. "sbcs r4, r4, r6\n\t"
  5866. "stm %[a]!, {r3, r4}\n\t"
  5867. "ldm %[a], {r3, r4}\n\t"
  5868. "ldm %[b]!, {r5, r6}\n\t"
  5869. "sbcs r3, r3, r5\n\t"
  5870. "sbcs r4, r4, r6\n\t"
  5871. "stm %[a]!, {r3, r4}\n\t"
  5872. "ldm %[a], {r3, r4}\n\t"
  5873. "ldm %[b]!, {r5, r6}\n\t"
  5874. "sbcs r3, r3, r5\n\t"
  5875. "sbcs r4, r4, r6\n\t"
  5876. "stm %[a]!, {r3, r4}\n\t"
  5877. "ldm %[a], {r3, r4}\n\t"
  5878. "ldm %[b]!, {r5, r6}\n\t"
  5879. "sbcs r3, r3, r5\n\t"
  5880. "sbcs r4, r4, r6\n\t"
  5881. "stm %[a]!, {r3, r4}\n\t"
  5882. "ldm %[a], {r3, r4}\n\t"
  5883. "ldm %[b]!, {r5, r6}\n\t"
  5884. "sbcs r3, r3, r5\n\t"
  5885. "sbcs r4, r4, r6\n\t"
  5886. "stm %[a]!, {r3, r4}\n\t"
  5887. "ldm %[a], {r3, r4}\n\t"
  5888. "ldm %[b]!, {r5, r6}\n\t"
  5889. "sbcs r3, r3, r5\n\t"
  5890. "sbcs r4, r4, r6\n\t"
  5891. "stm %[a]!, {r3, r4}\n\t"
  5892. "ldm %[a], {r3, r4}\n\t"
  5893. "ldm %[b]!, {r5, r6}\n\t"
  5894. "sbcs r3, r3, r5\n\t"
  5895. "sbcs r4, r4, r6\n\t"
  5896. "stm %[a]!, {r3, r4}\n\t"
  5897. "sbc %[c], %[c], %[c]\n\t"
  5898. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  5899. :
  5900. : "memory", "r3", "r4", "r5", "r6"
  5901. );
  5902. return c;
  5903. }
  5904. /* Add b to a into r. (r = a + b)
  5905. *
  5906. * r A single precision integer.
  5907. * a A single precision integer.
  5908. * b A single precision integer.
  5909. */
  5910. SP_NOINLINE static sp_digit sp_3072_add_24(sp_digit* r, const sp_digit* a,
  5911. const sp_digit* b)
  5912. {
  5913. sp_digit c = 0;
  5914. __asm__ __volatile__ (
  5915. "ldm %[a]!, {r4, r5}\n\t"
  5916. "ldm %[b]!, {r6, r8}\n\t"
  5917. "adds r4, r4, r6\n\t"
  5918. "adcs r5, r5, r8\n\t"
  5919. "stm %[r]!, {r4, r5}\n\t"
  5920. "ldm %[a]!, {r4, r5}\n\t"
  5921. "ldm %[b]!, {r6, r8}\n\t"
  5922. "adcs r4, r4, r6\n\t"
  5923. "adcs r5, r5, r8\n\t"
  5924. "stm %[r]!, {r4, r5}\n\t"
  5925. "ldm %[a]!, {r4, r5}\n\t"
  5926. "ldm %[b]!, {r6, r8}\n\t"
  5927. "adcs r4, r4, r6\n\t"
  5928. "adcs r5, r5, r8\n\t"
  5929. "stm %[r]!, {r4, r5}\n\t"
  5930. "ldm %[a]!, {r4, r5}\n\t"
  5931. "ldm %[b]!, {r6, r8}\n\t"
  5932. "adcs r4, r4, r6\n\t"
  5933. "adcs r5, r5, r8\n\t"
  5934. "stm %[r]!, {r4, r5}\n\t"
  5935. "ldm %[a]!, {r4, r5}\n\t"
  5936. "ldm %[b]!, {r6, r8}\n\t"
  5937. "adcs r4, r4, r6\n\t"
  5938. "adcs r5, r5, r8\n\t"
  5939. "stm %[r]!, {r4, r5}\n\t"
  5940. "ldm %[a]!, {r4, r5}\n\t"
  5941. "ldm %[b]!, {r6, r8}\n\t"
  5942. "adcs r4, r4, r6\n\t"
  5943. "adcs r5, r5, r8\n\t"
  5944. "stm %[r]!, {r4, r5}\n\t"
  5945. "ldm %[a]!, {r4, r5}\n\t"
  5946. "ldm %[b]!, {r6, r8}\n\t"
  5947. "adcs r4, r4, r6\n\t"
  5948. "adcs r5, r5, r8\n\t"
  5949. "stm %[r]!, {r4, r5}\n\t"
  5950. "ldm %[a]!, {r4, r5}\n\t"
  5951. "ldm %[b]!, {r6, r8}\n\t"
  5952. "adcs r4, r4, r6\n\t"
  5953. "adcs r5, r5, r8\n\t"
  5954. "stm %[r]!, {r4, r5}\n\t"
  5955. "ldm %[a]!, {r4, r5}\n\t"
  5956. "ldm %[b]!, {r6, r8}\n\t"
  5957. "adcs r4, r4, r6\n\t"
  5958. "adcs r5, r5, r8\n\t"
  5959. "stm %[r]!, {r4, r5}\n\t"
  5960. "ldm %[a]!, {r4, r5}\n\t"
  5961. "ldm %[b]!, {r6, r8}\n\t"
  5962. "adcs r4, r4, r6\n\t"
  5963. "adcs r5, r5, r8\n\t"
  5964. "stm %[r]!, {r4, r5}\n\t"
  5965. "ldm %[a]!, {r4, r5}\n\t"
  5966. "ldm %[b]!, {r6, r8}\n\t"
  5967. "adcs r4, r4, r6\n\t"
  5968. "adcs r5, r5, r8\n\t"
  5969. "stm %[r]!, {r4, r5}\n\t"
  5970. "ldm %[a]!, {r4, r5}\n\t"
  5971. "ldm %[b]!, {r6, r8}\n\t"
  5972. "adcs r4, r4, r6\n\t"
  5973. "adcs r5, r5, r8\n\t"
  5974. "stm %[r]!, {r4, r5}\n\t"
  5975. "mov %[c], #0\n\t"
  5976. "adc %[c], %[c], %[c]\n\t"
  5977. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  5978. :
  5979. : "memory", "r4", "r5", "r6", "r8"
  5980. );
  5981. return c;
  5982. }
  5983. /* AND m into each word of a and store in r.
  5984. *
  5985. * r A single precision integer.
  5986. * a A single precision integer.
  5987. * m Mask to AND against each digit.
  5988. */
  5989. static void sp_3072_mask_12(sp_digit* r, const sp_digit* a, sp_digit m)
  5990. {
  5991. #ifdef WOLFSSL_SP_SMALL
  5992. int i;
  5993. for (i=0; i<12; i++) {
  5994. r[i] = a[i] & m;
  5995. }
  5996. #else
  5997. r[0] = a[0] & m;
  5998. r[1] = a[1] & m;
  5999. r[2] = a[2] & m;
  6000. r[3] = a[3] & m;
  6001. r[4] = a[4] & m;
  6002. r[5] = a[5] & m;
  6003. r[6] = a[6] & m;
  6004. r[7] = a[7] & m;
  6005. r[8] = a[8] & m;
  6006. r[9] = a[9] & m;
  6007. r[10] = a[10] & m;
  6008. r[11] = a[11] & m;
  6009. #endif
  6010. }
  6011. /* Multiply a and b into r. (r = a * b)
  6012. *
  6013. * r A single precision integer.
  6014. * a A single precision integer.
  6015. * b A single precision integer.
  6016. */
  6017. SP_NOINLINE static void sp_3072_mul_24(sp_digit* r, const sp_digit* a,
  6018. const sp_digit* b)
  6019. {
  6020. sp_digit* z0 = r;
  6021. sp_digit z1[24];
  6022. sp_digit a1[12];
  6023. sp_digit b1[12];
  6024. sp_digit* z2 = r + 24;
  6025. sp_digit u;
  6026. sp_digit ca;
  6027. sp_digit cb;
  6028. ca = sp_3072_add_12(a1, a, &a[12]);
  6029. cb = sp_3072_add_12(b1, b, &b[12]);
  6030. u = ca & cb;
  6031. sp_3072_mul_12(z2, &a[12], &b[12]);
  6032. sp_3072_mul_12(z0, a, b);
  6033. sp_3072_mul_12(z1, a1, b1);
  6034. u += sp_3072_sub_in_place_24(z1, z0);
  6035. u += sp_3072_sub_in_place_24(z1, z2);
  6036. sp_3072_mask_12(a1, a1, 0 - cb);
  6037. u += sp_3072_add_12(z1 + 12, z1 + 12, a1);
  6038. sp_3072_mask_12(b1, b1, 0 - ca);
  6039. u += sp_3072_add_12(z1 + 12, z1 + 12, b1);
  6040. u += sp_3072_add_24(r + 12, r + 12, z1);
  6041. XMEMSET(a1 + 1, 0, sizeof(sp_digit) * (12 - 1));
  6042. a1[0] = u;
  6043. (void)sp_3072_add_12(r + 36, r + 36, a1);
  6044. }
  6045. /* Sub b from a into r. (r = a - b)
  6046. *
  6047. * r A single precision integer.
  6048. * a A single precision integer.
  6049. * b A single precision integer.
  6050. */
  6051. SP_NOINLINE static sp_digit sp_3072_sub_in_place_48(sp_digit* a,
  6052. const sp_digit* b)
  6053. {
  6054. sp_digit c = 0;
  6055. __asm__ __volatile__ (
  6056. "ldm %[a], {r3, r4}\n\t"
  6057. "ldm %[b]!, {r5, r6}\n\t"
  6058. "subs r3, r3, r5\n\t"
  6059. "sbcs r4, r4, r6\n\t"
  6060. "stm %[a]!, {r3, r4}\n\t"
  6061. "ldm %[a], {r3, r4}\n\t"
  6062. "ldm %[b]!, {r5, r6}\n\t"
  6063. "sbcs r3, r3, r5\n\t"
  6064. "sbcs r4, r4, r6\n\t"
  6065. "stm %[a]!, {r3, r4}\n\t"
  6066. "ldm %[a], {r3, r4}\n\t"
  6067. "ldm %[b]!, {r5, r6}\n\t"
  6068. "sbcs r3, r3, r5\n\t"
  6069. "sbcs r4, r4, r6\n\t"
  6070. "stm %[a]!, {r3, r4}\n\t"
  6071. "ldm %[a], {r3, r4}\n\t"
  6072. "ldm %[b]!, {r5, r6}\n\t"
  6073. "sbcs r3, r3, r5\n\t"
  6074. "sbcs r4, r4, r6\n\t"
  6075. "stm %[a]!, {r3, r4}\n\t"
  6076. "ldm %[a], {r3, r4}\n\t"
  6077. "ldm %[b]!, {r5, r6}\n\t"
  6078. "sbcs r3, r3, r5\n\t"
  6079. "sbcs r4, r4, r6\n\t"
  6080. "stm %[a]!, {r3, r4}\n\t"
  6081. "ldm %[a], {r3, r4}\n\t"
  6082. "ldm %[b]!, {r5, r6}\n\t"
  6083. "sbcs r3, r3, r5\n\t"
  6084. "sbcs r4, r4, r6\n\t"
  6085. "stm %[a]!, {r3, r4}\n\t"
  6086. "ldm %[a], {r3, r4}\n\t"
  6087. "ldm %[b]!, {r5, r6}\n\t"
  6088. "sbcs r3, r3, r5\n\t"
  6089. "sbcs r4, r4, r6\n\t"
  6090. "stm %[a]!, {r3, r4}\n\t"
  6091. "ldm %[a], {r3, r4}\n\t"
  6092. "ldm %[b]!, {r5, r6}\n\t"
  6093. "sbcs r3, r3, r5\n\t"
  6094. "sbcs r4, r4, r6\n\t"
  6095. "stm %[a]!, {r3, r4}\n\t"
  6096. "ldm %[a], {r3, r4}\n\t"
  6097. "ldm %[b]!, {r5, r6}\n\t"
  6098. "sbcs r3, r3, r5\n\t"
  6099. "sbcs r4, r4, r6\n\t"
  6100. "stm %[a]!, {r3, r4}\n\t"
  6101. "ldm %[a], {r3, r4}\n\t"
  6102. "ldm %[b]!, {r5, r6}\n\t"
  6103. "sbcs r3, r3, r5\n\t"
  6104. "sbcs r4, r4, r6\n\t"
  6105. "stm %[a]!, {r3, r4}\n\t"
  6106. "ldm %[a], {r3, r4}\n\t"
  6107. "ldm %[b]!, {r5, r6}\n\t"
  6108. "sbcs r3, r3, r5\n\t"
  6109. "sbcs r4, r4, r6\n\t"
  6110. "stm %[a]!, {r3, r4}\n\t"
  6111. "ldm %[a], {r3, r4}\n\t"
  6112. "ldm %[b]!, {r5, r6}\n\t"
  6113. "sbcs r3, r3, r5\n\t"
  6114. "sbcs r4, r4, r6\n\t"
  6115. "stm %[a]!, {r3, r4}\n\t"
  6116. "ldm %[a], {r3, r4}\n\t"
  6117. "ldm %[b]!, {r5, r6}\n\t"
  6118. "sbcs r3, r3, r5\n\t"
  6119. "sbcs r4, r4, r6\n\t"
  6120. "stm %[a]!, {r3, r4}\n\t"
  6121. "ldm %[a], {r3, r4}\n\t"
  6122. "ldm %[b]!, {r5, r6}\n\t"
  6123. "sbcs r3, r3, r5\n\t"
  6124. "sbcs r4, r4, r6\n\t"
  6125. "stm %[a]!, {r3, r4}\n\t"
  6126. "ldm %[a], {r3, r4}\n\t"
  6127. "ldm %[b]!, {r5, r6}\n\t"
  6128. "sbcs r3, r3, r5\n\t"
  6129. "sbcs r4, r4, r6\n\t"
  6130. "stm %[a]!, {r3, r4}\n\t"
  6131. "ldm %[a], {r3, r4}\n\t"
  6132. "ldm %[b]!, {r5, r6}\n\t"
  6133. "sbcs r3, r3, r5\n\t"
  6134. "sbcs r4, r4, r6\n\t"
  6135. "stm %[a]!, {r3, r4}\n\t"
  6136. "ldm %[a], {r3, r4}\n\t"
  6137. "ldm %[b]!, {r5, r6}\n\t"
  6138. "sbcs r3, r3, r5\n\t"
  6139. "sbcs r4, r4, r6\n\t"
  6140. "stm %[a]!, {r3, r4}\n\t"
  6141. "ldm %[a], {r3, r4}\n\t"
  6142. "ldm %[b]!, {r5, r6}\n\t"
  6143. "sbcs r3, r3, r5\n\t"
  6144. "sbcs r4, r4, r6\n\t"
  6145. "stm %[a]!, {r3, r4}\n\t"
  6146. "ldm %[a], {r3, r4}\n\t"
  6147. "ldm %[b]!, {r5, r6}\n\t"
  6148. "sbcs r3, r3, r5\n\t"
  6149. "sbcs r4, r4, r6\n\t"
  6150. "stm %[a]!, {r3, r4}\n\t"
  6151. "ldm %[a], {r3, r4}\n\t"
  6152. "ldm %[b]!, {r5, r6}\n\t"
  6153. "sbcs r3, r3, r5\n\t"
  6154. "sbcs r4, r4, r6\n\t"
  6155. "stm %[a]!, {r3, r4}\n\t"
  6156. "ldm %[a], {r3, r4}\n\t"
  6157. "ldm %[b]!, {r5, r6}\n\t"
  6158. "sbcs r3, r3, r5\n\t"
  6159. "sbcs r4, r4, r6\n\t"
  6160. "stm %[a]!, {r3, r4}\n\t"
  6161. "ldm %[a], {r3, r4}\n\t"
  6162. "ldm %[b]!, {r5, r6}\n\t"
  6163. "sbcs r3, r3, r5\n\t"
  6164. "sbcs r4, r4, r6\n\t"
  6165. "stm %[a]!, {r3, r4}\n\t"
  6166. "ldm %[a], {r3, r4}\n\t"
  6167. "ldm %[b]!, {r5, r6}\n\t"
  6168. "sbcs r3, r3, r5\n\t"
  6169. "sbcs r4, r4, r6\n\t"
  6170. "stm %[a]!, {r3, r4}\n\t"
  6171. "ldm %[a], {r3, r4}\n\t"
  6172. "ldm %[b]!, {r5, r6}\n\t"
  6173. "sbcs r3, r3, r5\n\t"
  6174. "sbcs r4, r4, r6\n\t"
  6175. "stm %[a]!, {r3, r4}\n\t"
  6176. "sbc %[c], %[c], %[c]\n\t"
  6177. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  6178. :
  6179. : "memory", "r3", "r4", "r5", "r6"
  6180. );
  6181. return c;
  6182. }
  6183. /* Add b to a into r. (r = a + b)
  6184. *
  6185. * r A single precision integer.
  6186. * a A single precision integer.
  6187. * b A single precision integer.
  6188. */
  6189. SP_NOINLINE static sp_digit sp_3072_add_48(sp_digit* r, const sp_digit* a,
  6190. const sp_digit* b)
  6191. {
  6192. sp_digit c = 0;
  6193. __asm__ __volatile__ (
  6194. "ldm %[a]!, {r4, r5}\n\t"
  6195. "ldm %[b]!, {r6, r8}\n\t"
  6196. "adds r4, r4, r6\n\t"
  6197. "adcs r5, r5, r8\n\t"
  6198. "stm %[r]!, {r4, r5}\n\t"
  6199. "ldm %[a]!, {r4, r5}\n\t"
  6200. "ldm %[b]!, {r6, r8}\n\t"
  6201. "adcs r4, r4, r6\n\t"
  6202. "adcs r5, r5, r8\n\t"
  6203. "stm %[r]!, {r4, r5}\n\t"
  6204. "ldm %[a]!, {r4, r5}\n\t"
  6205. "ldm %[b]!, {r6, r8}\n\t"
  6206. "adcs r4, r4, r6\n\t"
  6207. "adcs r5, r5, r8\n\t"
  6208. "stm %[r]!, {r4, r5}\n\t"
  6209. "ldm %[a]!, {r4, r5}\n\t"
  6210. "ldm %[b]!, {r6, r8}\n\t"
  6211. "adcs r4, r4, r6\n\t"
  6212. "adcs r5, r5, r8\n\t"
  6213. "stm %[r]!, {r4, r5}\n\t"
  6214. "ldm %[a]!, {r4, r5}\n\t"
  6215. "ldm %[b]!, {r6, r8}\n\t"
  6216. "adcs r4, r4, r6\n\t"
  6217. "adcs r5, r5, r8\n\t"
  6218. "stm %[r]!, {r4, r5}\n\t"
  6219. "ldm %[a]!, {r4, r5}\n\t"
  6220. "ldm %[b]!, {r6, r8}\n\t"
  6221. "adcs r4, r4, r6\n\t"
  6222. "adcs r5, r5, r8\n\t"
  6223. "stm %[r]!, {r4, r5}\n\t"
  6224. "ldm %[a]!, {r4, r5}\n\t"
  6225. "ldm %[b]!, {r6, r8}\n\t"
  6226. "adcs r4, r4, r6\n\t"
  6227. "adcs r5, r5, r8\n\t"
  6228. "stm %[r]!, {r4, r5}\n\t"
  6229. "ldm %[a]!, {r4, r5}\n\t"
  6230. "ldm %[b]!, {r6, r8}\n\t"
  6231. "adcs r4, r4, r6\n\t"
  6232. "adcs r5, r5, r8\n\t"
  6233. "stm %[r]!, {r4, r5}\n\t"
  6234. "ldm %[a]!, {r4, r5}\n\t"
  6235. "ldm %[b]!, {r6, r8}\n\t"
  6236. "adcs r4, r4, r6\n\t"
  6237. "adcs r5, r5, r8\n\t"
  6238. "stm %[r]!, {r4, r5}\n\t"
  6239. "ldm %[a]!, {r4, r5}\n\t"
  6240. "ldm %[b]!, {r6, r8}\n\t"
  6241. "adcs r4, r4, r6\n\t"
  6242. "adcs r5, r5, r8\n\t"
  6243. "stm %[r]!, {r4, r5}\n\t"
  6244. "ldm %[a]!, {r4, r5}\n\t"
  6245. "ldm %[b]!, {r6, r8}\n\t"
  6246. "adcs r4, r4, r6\n\t"
  6247. "adcs r5, r5, r8\n\t"
  6248. "stm %[r]!, {r4, r5}\n\t"
  6249. "ldm %[a]!, {r4, r5}\n\t"
  6250. "ldm %[b]!, {r6, r8}\n\t"
  6251. "adcs r4, r4, r6\n\t"
  6252. "adcs r5, r5, r8\n\t"
  6253. "stm %[r]!, {r4, r5}\n\t"
  6254. "ldm %[a]!, {r4, r5}\n\t"
  6255. "ldm %[b]!, {r6, r8}\n\t"
  6256. "adcs r4, r4, r6\n\t"
  6257. "adcs r5, r5, r8\n\t"
  6258. "stm %[r]!, {r4, r5}\n\t"
  6259. "ldm %[a]!, {r4, r5}\n\t"
  6260. "ldm %[b]!, {r6, r8}\n\t"
  6261. "adcs r4, r4, r6\n\t"
  6262. "adcs r5, r5, r8\n\t"
  6263. "stm %[r]!, {r4, r5}\n\t"
  6264. "ldm %[a]!, {r4, r5}\n\t"
  6265. "ldm %[b]!, {r6, r8}\n\t"
  6266. "adcs r4, r4, r6\n\t"
  6267. "adcs r5, r5, r8\n\t"
  6268. "stm %[r]!, {r4, r5}\n\t"
  6269. "ldm %[a]!, {r4, r5}\n\t"
  6270. "ldm %[b]!, {r6, r8}\n\t"
  6271. "adcs r4, r4, r6\n\t"
  6272. "adcs r5, r5, r8\n\t"
  6273. "stm %[r]!, {r4, r5}\n\t"
  6274. "ldm %[a]!, {r4, r5}\n\t"
  6275. "ldm %[b]!, {r6, r8}\n\t"
  6276. "adcs r4, r4, r6\n\t"
  6277. "adcs r5, r5, r8\n\t"
  6278. "stm %[r]!, {r4, r5}\n\t"
  6279. "ldm %[a]!, {r4, r5}\n\t"
  6280. "ldm %[b]!, {r6, r8}\n\t"
  6281. "adcs r4, r4, r6\n\t"
  6282. "adcs r5, r5, r8\n\t"
  6283. "stm %[r]!, {r4, r5}\n\t"
  6284. "ldm %[a]!, {r4, r5}\n\t"
  6285. "ldm %[b]!, {r6, r8}\n\t"
  6286. "adcs r4, r4, r6\n\t"
  6287. "adcs r5, r5, r8\n\t"
  6288. "stm %[r]!, {r4, r5}\n\t"
  6289. "ldm %[a]!, {r4, r5}\n\t"
  6290. "ldm %[b]!, {r6, r8}\n\t"
  6291. "adcs r4, r4, r6\n\t"
  6292. "adcs r5, r5, r8\n\t"
  6293. "stm %[r]!, {r4, r5}\n\t"
  6294. "ldm %[a]!, {r4, r5}\n\t"
  6295. "ldm %[b]!, {r6, r8}\n\t"
  6296. "adcs r4, r4, r6\n\t"
  6297. "adcs r5, r5, r8\n\t"
  6298. "stm %[r]!, {r4, r5}\n\t"
  6299. "ldm %[a]!, {r4, r5}\n\t"
  6300. "ldm %[b]!, {r6, r8}\n\t"
  6301. "adcs r4, r4, r6\n\t"
  6302. "adcs r5, r5, r8\n\t"
  6303. "stm %[r]!, {r4, r5}\n\t"
  6304. "ldm %[a]!, {r4, r5}\n\t"
  6305. "ldm %[b]!, {r6, r8}\n\t"
  6306. "adcs r4, r4, r6\n\t"
  6307. "adcs r5, r5, r8\n\t"
  6308. "stm %[r]!, {r4, r5}\n\t"
  6309. "ldm %[a]!, {r4, r5}\n\t"
  6310. "ldm %[b]!, {r6, r8}\n\t"
  6311. "adcs r4, r4, r6\n\t"
  6312. "adcs r5, r5, r8\n\t"
  6313. "stm %[r]!, {r4, r5}\n\t"
  6314. "mov %[c], #0\n\t"
  6315. "adc %[c], %[c], %[c]\n\t"
  6316. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  6317. :
  6318. : "memory", "r4", "r5", "r6", "r8"
  6319. );
  6320. return c;
  6321. }
  6322. /* AND m into each word of a and store in r.
  6323. *
  6324. * r A single precision integer.
  6325. * a A single precision integer.
  6326. * m Mask to AND against each digit.
  6327. */
  6328. static void sp_3072_mask_24(sp_digit* r, const sp_digit* a, sp_digit m)
  6329. {
  6330. #ifdef WOLFSSL_SP_SMALL
  6331. int i;
  6332. for (i=0; i<24; i++) {
  6333. r[i] = a[i] & m;
  6334. }
  6335. #else
  6336. int i;
  6337. for (i = 0; i < 24; i += 8) {
  6338. r[i+0] = a[i+0] & m;
  6339. r[i+1] = a[i+1] & m;
  6340. r[i+2] = a[i+2] & m;
  6341. r[i+3] = a[i+3] & m;
  6342. r[i+4] = a[i+4] & m;
  6343. r[i+5] = a[i+5] & m;
  6344. r[i+6] = a[i+6] & m;
  6345. r[i+7] = a[i+7] & m;
  6346. }
  6347. #endif
  6348. }
  6349. /* Multiply a and b into r. (r = a * b)
  6350. *
  6351. * r A single precision integer.
  6352. * a A single precision integer.
  6353. * b A single precision integer.
  6354. */
  6355. SP_NOINLINE static void sp_3072_mul_48(sp_digit* r, const sp_digit* a,
  6356. const sp_digit* b)
  6357. {
  6358. sp_digit* z0 = r;
  6359. sp_digit z1[48];
  6360. sp_digit a1[24];
  6361. sp_digit b1[24];
  6362. sp_digit* z2 = r + 48;
  6363. sp_digit u;
  6364. sp_digit ca;
  6365. sp_digit cb;
  6366. ca = sp_3072_add_24(a1, a, &a[24]);
  6367. cb = sp_3072_add_24(b1, b, &b[24]);
  6368. u = ca & cb;
  6369. sp_3072_mul_24(z2, &a[24], &b[24]);
  6370. sp_3072_mul_24(z0, a, b);
  6371. sp_3072_mul_24(z1, a1, b1);
  6372. u += sp_3072_sub_in_place_48(z1, z0);
  6373. u += sp_3072_sub_in_place_48(z1, z2);
  6374. sp_3072_mask_24(a1, a1, 0 - cb);
  6375. u += sp_3072_add_24(z1 + 24, z1 + 24, a1);
  6376. sp_3072_mask_24(b1, b1, 0 - ca);
  6377. u += sp_3072_add_24(z1 + 24, z1 + 24, b1);
  6378. u += sp_3072_add_48(r + 24, r + 24, z1);
  6379. XMEMSET(a1 + 1, 0, sizeof(sp_digit) * (24 - 1));
  6380. a1[0] = u;
  6381. (void)sp_3072_add_24(r + 72, r + 72, a1);
  6382. }
  6383. /* Sub b from a into r. (r = a - b)
  6384. *
  6385. * r A single precision integer.
  6386. * a A single precision integer.
  6387. * b A single precision integer.
  6388. */
  6389. SP_NOINLINE static sp_digit sp_3072_sub_in_place_96(sp_digit* a,
  6390. const sp_digit* b)
  6391. {
  6392. sp_digit c = 0;
  6393. __asm__ __volatile__ (
  6394. "ldm %[a], {r3, r4}\n\t"
  6395. "ldm %[b]!, {r5, r6}\n\t"
  6396. "subs r3, r3, r5\n\t"
  6397. "sbcs r4, r4, r6\n\t"
  6398. "stm %[a]!, {r3, r4}\n\t"
  6399. "ldm %[a], {r3, r4}\n\t"
  6400. "ldm %[b]!, {r5, r6}\n\t"
  6401. "sbcs r3, r3, r5\n\t"
  6402. "sbcs r4, r4, r6\n\t"
  6403. "stm %[a]!, {r3, r4}\n\t"
  6404. "ldm %[a], {r3, r4}\n\t"
  6405. "ldm %[b]!, {r5, r6}\n\t"
  6406. "sbcs r3, r3, r5\n\t"
  6407. "sbcs r4, r4, r6\n\t"
  6408. "stm %[a]!, {r3, r4}\n\t"
  6409. "ldm %[a], {r3, r4}\n\t"
  6410. "ldm %[b]!, {r5, r6}\n\t"
  6411. "sbcs r3, r3, r5\n\t"
  6412. "sbcs r4, r4, r6\n\t"
  6413. "stm %[a]!, {r3, r4}\n\t"
  6414. "ldm %[a], {r3, r4}\n\t"
  6415. "ldm %[b]!, {r5, r6}\n\t"
  6416. "sbcs r3, r3, r5\n\t"
  6417. "sbcs r4, r4, r6\n\t"
  6418. "stm %[a]!, {r3, r4}\n\t"
  6419. "ldm %[a], {r3, r4}\n\t"
  6420. "ldm %[b]!, {r5, r6}\n\t"
  6421. "sbcs r3, r3, r5\n\t"
  6422. "sbcs r4, r4, r6\n\t"
  6423. "stm %[a]!, {r3, r4}\n\t"
  6424. "ldm %[a], {r3, r4}\n\t"
  6425. "ldm %[b]!, {r5, r6}\n\t"
  6426. "sbcs r3, r3, r5\n\t"
  6427. "sbcs r4, r4, r6\n\t"
  6428. "stm %[a]!, {r3, r4}\n\t"
  6429. "ldm %[a], {r3, r4}\n\t"
  6430. "ldm %[b]!, {r5, r6}\n\t"
  6431. "sbcs r3, r3, r5\n\t"
  6432. "sbcs r4, r4, r6\n\t"
  6433. "stm %[a]!, {r3, r4}\n\t"
  6434. "ldm %[a], {r3, r4}\n\t"
  6435. "ldm %[b]!, {r5, r6}\n\t"
  6436. "sbcs r3, r3, r5\n\t"
  6437. "sbcs r4, r4, r6\n\t"
  6438. "stm %[a]!, {r3, r4}\n\t"
  6439. "ldm %[a], {r3, r4}\n\t"
  6440. "ldm %[b]!, {r5, r6}\n\t"
  6441. "sbcs r3, r3, r5\n\t"
  6442. "sbcs r4, r4, r6\n\t"
  6443. "stm %[a]!, {r3, r4}\n\t"
  6444. "ldm %[a], {r3, r4}\n\t"
  6445. "ldm %[b]!, {r5, r6}\n\t"
  6446. "sbcs r3, r3, r5\n\t"
  6447. "sbcs r4, r4, r6\n\t"
  6448. "stm %[a]!, {r3, r4}\n\t"
  6449. "ldm %[a], {r3, r4}\n\t"
  6450. "ldm %[b]!, {r5, r6}\n\t"
  6451. "sbcs r3, r3, r5\n\t"
  6452. "sbcs r4, r4, r6\n\t"
  6453. "stm %[a]!, {r3, r4}\n\t"
  6454. "ldm %[a], {r3, r4}\n\t"
  6455. "ldm %[b]!, {r5, r6}\n\t"
  6456. "sbcs r3, r3, r5\n\t"
  6457. "sbcs r4, r4, r6\n\t"
  6458. "stm %[a]!, {r3, r4}\n\t"
  6459. "ldm %[a], {r3, r4}\n\t"
  6460. "ldm %[b]!, {r5, r6}\n\t"
  6461. "sbcs r3, r3, r5\n\t"
  6462. "sbcs r4, r4, r6\n\t"
  6463. "stm %[a]!, {r3, r4}\n\t"
  6464. "ldm %[a], {r3, r4}\n\t"
  6465. "ldm %[b]!, {r5, r6}\n\t"
  6466. "sbcs r3, r3, r5\n\t"
  6467. "sbcs r4, r4, r6\n\t"
  6468. "stm %[a]!, {r3, r4}\n\t"
  6469. "ldm %[a], {r3, r4}\n\t"
  6470. "ldm %[b]!, {r5, r6}\n\t"
  6471. "sbcs r3, r3, r5\n\t"
  6472. "sbcs r4, r4, r6\n\t"
  6473. "stm %[a]!, {r3, r4}\n\t"
  6474. "ldm %[a], {r3, r4}\n\t"
  6475. "ldm %[b]!, {r5, r6}\n\t"
  6476. "sbcs r3, r3, r5\n\t"
  6477. "sbcs r4, r4, r6\n\t"
  6478. "stm %[a]!, {r3, r4}\n\t"
  6479. "ldm %[a], {r3, r4}\n\t"
  6480. "ldm %[b]!, {r5, r6}\n\t"
  6481. "sbcs r3, r3, r5\n\t"
  6482. "sbcs r4, r4, r6\n\t"
  6483. "stm %[a]!, {r3, r4}\n\t"
  6484. "ldm %[a], {r3, r4}\n\t"
  6485. "ldm %[b]!, {r5, r6}\n\t"
  6486. "sbcs r3, r3, r5\n\t"
  6487. "sbcs r4, r4, r6\n\t"
  6488. "stm %[a]!, {r3, r4}\n\t"
  6489. "ldm %[a], {r3, r4}\n\t"
  6490. "ldm %[b]!, {r5, r6}\n\t"
  6491. "sbcs r3, r3, r5\n\t"
  6492. "sbcs r4, r4, r6\n\t"
  6493. "stm %[a]!, {r3, r4}\n\t"
  6494. "ldm %[a], {r3, r4}\n\t"
  6495. "ldm %[b]!, {r5, r6}\n\t"
  6496. "sbcs r3, r3, r5\n\t"
  6497. "sbcs r4, r4, r6\n\t"
  6498. "stm %[a]!, {r3, r4}\n\t"
  6499. "ldm %[a], {r3, r4}\n\t"
  6500. "ldm %[b]!, {r5, r6}\n\t"
  6501. "sbcs r3, r3, r5\n\t"
  6502. "sbcs r4, r4, r6\n\t"
  6503. "stm %[a]!, {r3, r4}\n\t"
  6504. "ldm %[a], {r3, r4}\n\t"
  6505. "ldm %[b]!, {r5, r6}\n\t"
  6506. "sbcs r3, r3, r5\n\t"
  6507. "sbcs r4, r4, r6\n\t"
  6508. "stm %[a]!, {r3, r4}\n\t"
  6509. "ldm %[a], {r3, r4}\n\t"
  6510. "ldm %[b]!, {r5, r6}\n\t"
  6511. "sbcs r3, r3, r5\n\t"
  6512. "sbcs r4, r4, r6\n\t"
  6513. "stm %[a]!, {r3, r4}\n\t"
  6514. "ldm %[a], {r3, r4}\n\t"
  6515. "ldm %[b]!, {r5, r6}\n\t"
  6516. "sbcs r3, r3, r5\n\t"
  6517. "sbcs r4, r4, r6\n\t"
  6518. "stm %[a]!, {r3, r4}\n\t"
  6519. "ldm %[a], {r3, r4}\n\t"
  6520. "ldm %[b]!, {r5, r6}\n\t"
  6521. "sbcs r3, r3, r5\n\t"
  6522. "sbcs r4, r4, r6\n\t"
  6523. "stm %[a]!, {r3, r4}\n\t"
  6524. "ldm %[a], {r3, r4}\n\t"
  6525. "ldm %[b]!, {r5, r6}\n\t"
  6526. "sbcs r3, r3, r5\n\t"
  6527. "sbcs r4, r4, r6\n\t"
  6528. "stm %[a]!, {r3, r4}\n\t"
  6529. "ldm %[a], {r3, r4}\n\t"
  6530. "ldm %[b]!, {r5, r6}\n\t"
  6531. "sbcs r3, r3, r5\n\t"
  6532. "sbcs r4, r4, r6\n\t"
  6533. "stm %[a]!, {r3, r4}\n\t"
  6534. "ldm %[a], {r3, r4}\n\t"
  6535. "ldm %[b]!, {r5, r6}\n\t"
  6536. "sbcs r3, r3, r5\n\t"
  6537. "sbcs r4, r4, r6\n\t"
  6538. "stm %[a]!, {r3, r4}\n\t"
  6539. "ldm %[a], {r3, r4}\n\t"
  6540. "ldm %[b]!, {r5, r6}\n\t"
  6541. "sbcs r3, r3, r5\n\t"
  6542. "sbcs r4, r4, r6\n\t"
  6543. "stm %[a]!, {r3, r4}\n\t"
  6544. "ldm %[a], {r3, r4}\n\t"
  6545. "ldm %[b]!, {r5, r6}\n\t"
  6546. "sbcs r3, r3, r5\n\t"
  6547. "sbcs r4, r4, r6\n\t"
  6548. "stm %[a]!, {r3, r4}\n\t"
  6549. "ldm %[a], {r3, r4}\n\t"
  6550. "ldm %[b]!, {r5, r6}\n\t"
  6551. "sbcs r3, r3, r5\n\t"
  6552. "sbcs r4, r4, r6\n\t"
  6553. "stm %[a]!, {r3, r4}\n\t"
  6554. "ldm %[a], {r3, r4}\n\t"
  6555. "ldm %[b]!, {r5, r6}\n\t"
  6556. "sbcs r3, r3, r5\n\t"
  6557. "sbcs r4, r4, r6\n\t"
  6558. "stm %[a]!, {r3, r4}\n\t"
  6559. "ldm %[a], {r3, r4}\n\t"
  6560. "ldm %[b]!, {r5, r6}\n\t"
  6561. "sbcs r3, r3, r5\n\t"
  6562. "sbcs r4, r4, r6\n\t"
  6563. "stm %[a]!, {r3, r4}\n\t"
  6564. "ldm %[a], {r3, r4}\n\t"
  6565. "ldm %[b]!, {r5, r6}\n\t"
  6566. "sbcs r3, r3, r5\n\t"
  6567. "sbcs r4, r4, r6\n\t"
  6568. "stm %[a]!, {r3, r4}\n\t"
  6569. "ldm %[a], {r3, r4}\n\t"
  6570. "ldm %[b]!, {r5, r6}\n\t"
  6571. "sbcs r3, r3, r5\n\t"
  6572. "sbcs r4, r4, r6\n\t"
  6573. "stm %[a]!, {r3, r4}\n\t"
  6574. "ldm %[a], {r3, r4}\n\t"
  6575. "ldm %[b]!, {r5, r6}\n\t"
  6576. "sbcs r3, r3, r5\n\t"
  6577. "sbcs r4, r4, r6\n\t"
  6578. "stm %[a]!, {r3, r4}\n\t"
  6579. "ldm %[a], {r3, r4}\n\t"
  6580. "ldm %[b]!, {r5, r6}\n\t"
  6581. "sbcs r3, r3, r5\n\t"
  6582. "sbcs r4, r4, r6\n\t"
  6583. "stm %[a]!, {r3, r4}\n\t"
  6584. "ldm %[a], {r3, r4}\n\t"
  6585. "ldm %[b]!, {r5, r6}\n\t"
  6586. "sbcs r3, r3, r5\n\t"
  6587. "sbcs r4, r4, r6\n\t"
  6588. "stm %[a]!, {r3, r4}\n\t"
  6589. "ldm %[a], {r3, r4}\n\t"
  6590. "ldm %[b]!, {r5, r6}\n\t"
  6591. "sbcs r3, r3, r5\n\t"
  6592. "sbcs r4, r4, r6\n\t"
  6593. "stm %[a]!, {r3, r4}\n\t"
  6594. "ldm %[a], {r3, r4}\n\t"
  6595. "ldm %[b]!, {r5, r6}\n\t"
  6596. "sbcs r3, r3, r5\n\t"
  6597. "sbcs r4, r4, r6\n\t"
  6598. "stm %[a]!, {r3, r4}\n\t"
  6599. "ldm %[a], {r3, r4}\n\t"
  6600. "ldm %[b]!, {r5, r6}\n\t"
  6601. "sbcs r3, r3, r5\n\t"
  6602. "sbcs r4, r4, r6\n\t"
  6603. "stm %[a]!, {r3, r4}\n\t"
  6604. "ldm %[a], {r3, r4}\n\t"
  6605. "ldm %[b]!, {r5, r6}\n\t"
  6606. "sbcs r3, r3, r5\n\t"
  6607. "sbcs r4, r4, r6\n\t"
  6608. "stm %[a]!, {r3, r4}\n\t"
  6609. "ldm %[a], {r3, r4}\n\t"
  6610. "ldm %[b]!, {r5, r6}\n\t"
  6611. "sbcs r3, r3, r5\n\t"
  6612. "sbcs r4, r4, r6\n\t"
  6613. "stm %[a]!, {r3, r4}\n\t"
  6614. "ldm %[a], {r3, r4}\n\t"
  6615. "ldm %[b]!, {r5, r6}\n\t"
  6616. "sbcs r3, r3, r5\n\t"
  6617. "sbcs r4, r4, r6\n\t"
  6618. "stm %[a]!, {r3, r4}\n\t"
  6619. "ldm %[a], {r3, r4}\n\t"
  6620. "ldm %[b]!, {r5, r6}\n\t"
  6621. "sbcs r3, r3, r5\n\t"
  6622. "sbcs r4, r4, r6\n\t"
  6623. "stm %[a]!, {r3, r4}\n\t"
  6624. "ldm %[a], {r3, r4}\n\t"
  6625. "ldm %[b]!, {r5, r6}\n\t"
  6626. "sbcs r3, r3, r5\n\t"
  6627. "sbcs r4, r4, r6\n\t"
  6628. "stm %[a]!, {r3, r4}\n\t"
  6629. "ldm %[a], {r3, r4}\n\t"
  6630. "ldm %[b]!, {r5, r6}\n\t"
  6631. "sbcs r3, r3, r5\n\t"
  6632. "sbcs r4, r4, r6\n\t"
  6633. "stm %[a]!, {r3, r4}\n\t"
  6634. "sbc %[c], %[c], %[c]\n\t"
  6635. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  6636. :
  6637. : "memory", "r3", "r4", "r5", "r6"
  6638. );
  6639. return c;
  6640. }
  6641. /* Add b to a into r. (r = a + b)
  6642. *
  6643. * r A single precision integer.
  6644. * a A single precision integer.
  6645. * b A single precision integer.
  6646. */
  6647. SP_NOINLINE static sp_digit sp_3072_add_96(sp_digit* r, const sp_digit* a,
  6648. const sp_digit* b)
  6649. {
  6650. sp_digit c = 0;
  6651. __asm__ __volatile__ (
  6652. "ldm %[a]!, {r4, r5}\n\t"
  6653. "ldm %[b]!, {r6, r8}\n\t"
  6654. "adds r4, r4, r6\n\t"
  6655. "adcs r5, r5, r8\n\t"
  6656. "stm %[r]!, {r4, r5}\n\t"
  6657. "ldm %[a]!, {r4, r5}\n\t"
  6658. "ldm %[b]!, {r6, r8}\n\t"
  6659. "adcs r4, r4, r6\n\t"
  6660. "adcs r5, r5, r8\n\t"
  6661. "stm %[r]!, {r4, r5}\n\t"
  6662. "ldm %[a]!, {r4, r5}\n\t"
  6663. "ldm %[b]!, {r6, r8}\n\t"
  6664. "adcs r4, r4, r6\n\t"
  6665. "adcs r5, r5, r8\n\t"
  6666. "stm %[r]!, {r4, r5}\n\t"
  6667. "ldm %[a]!, {r4, r5}\n\t"
  6668. "ldm %[b]!, {r6, r8}\n\t"
  6669. "adcs r4, r4, r6\n\t"
  6670. "adcs r5, r5, r8\n\t"
  6671. "stm %[r]!, {r4, r5}\n\t"
  6672. "ldm %[a]!, {r4, r5}\n\t"
  6673. "ldm %[b]!, {r6, r8}\n\t"
  6674. "adcs r4, r4, r6\n\t"
  6675. "adcs r5, r5, r8\n\t"
  6676. "stm %[r]!, {r4, r5}\n\t"
  6677. "ldm %[a]!, {r4, r5}\n\t"
  6678. "ldm %[b]!, {r6, r8}\n\t"
  6679. "adcs r4, r4, r6\n\t"
  6680. "adcs r5, r5, r8\n\t"
  6681. "stm %[r]!, {r4, r5}\n\t"
  6682. "ldm %[a]!, {r4, r5}\n\t"
  6683. "ldm %[b]!, {r6, r8}\n\t"
  6684. "adcs r4, r4, r6\n\t"
  6685. "adcs r5, r5, r8\n\t"
  6686. "stm %[r]!, {r4, r5}\n\t"
  6687. "ldm %[a]!, {r4, r5}\n\t"
  6688. "ldm %[b]!, {r6, r8}\n\t"
  6689. "adcs r4, r4, r6\n\t"
  6690. "adcs r5, r5, r8\n\t"
  6691. "stm %[r]!, {r4, r5}\n\t"
  6692. "ldm %[a]!, {r4, r5}\n\t"
  6693. "ldm %[b]!, {r6, r8}\n\t"
  6694. "adcs r4, r4, r6\n\t"
  6695. "adcs r5, r5, r8\n\t"
  6696. "stm %[r]!, {r4, r5}\n\t"
  6697. "ldm %[a]!, {r4, r5}\n\t"
  6698. "ldm %[b]!, {r6, r8}\n\t"
  6699. "adcs r4, r4, r6\n\t"
  6700. "adcs r5, r5, r8\n\t"
  6701. "stm %[r]!, {r4, r5}\n\t"
  6702. "ldm %[a]!, {r4, r5}\n\t"
  6703. "ldm %[b]!, {r6, r8}\n\t"
  6704. "adcs r4, r4, r6\n\t"
  6705. "adcs r5, r5, r8\n\t"
  6706. "stm %[r]!, {r4, r5}\n\t"
  6707. "ldm %[a]!, {r4, r5}\n\t"
  6708. "ldm %[b]!, {r6, r8}\n\t"
  6709. "adcs r4, r4, r6\n\t"
  6710. "adcs r5, r5, r8\n\t"
  6711. "stm %[r]!, {r4, r5}\n\t"
  6712. "ldm %[a]!, {r4, r5}\n\t"
  6713. "ldm %[b]!, {r6, r8}\n\t"
  6714. "adcs r4, r4, r6\n\t"
  6715. "adcs r5, r5, r8\n\t"
  6716. "stm %[r]!, {r4, r5}\n\t"
  6717. "ldm %[a]!, {r4, r5}\n\t"
  6718. "ldm %[b]!, {r6, r8}\n\t"
  6719. "adcs r4, r4, r6\n\t"
  6720. "adcs r5, r5, r8\n\t"
  6721. "stm %[r]!, {r4, r5}\n\t"
  6722. "ldm %[a]!, {r4, r5}\n\t"
  6723. "ldm %[b]!, {r6, r8}\n\t"
  6724. "adcs r4, r4, r6\n\t"
  6725. "adcs r5, r5, r8\n\t"
  6726. "stm %[r]!, {r4, r5}\n\t"
  6727. "ldm %[a]!, {r4, r5}\n\t"
  6728. "ldm %[b]!, {r6, r8}\n\t"
  6729. "adcs r4, r4, r6\n\t"
  6730. "adcs r5, r5, r8\n\t"
  6731. "stm %[r]!, {r4, r5}\n\t"
  6732. "ldm %[a]!, {r4, r5}\n\t"
  6733. "ldm %[b]!, {r6, r8}\n\t"
  6734. "adcs r4, r4, r6\n\t"
  6735. "adcs r5, r5, r8\n\t"
  6736. "stm %[r]!, {r4, r5}\n\t"
  6737. "ldm %[a]!, {r4, r5}\n\t"
  6738. "ldm %[b]!, {r6, r8}\n\t"
  6739. "adcs r4, r4, r6\n\t"
  6740. "adcs r5, r5, r8\n\t"
  6741. "stm %[r]!, {r4, r5}\n\t"
  6742. "ldm %[a]!, {r4, r5}\n\t"
  6743. "ldm %[b]!, {r6, r8}\n\t"
  6744. "adcs r4, r4, r6\n\t"
  6745. "adcs r5, r5, r8\n\t"
  6746. "stm %[r]!, {r4, r5}\n\t"
  6747. "ldm %[a]!, {r4, r5}\n\t"
  6748. "ldm %[b]!, {r6, r8}\n\t"
  6749. "adcs r4, r4, r6\n\t"
  6750. "adcs r5, r5, r8\n\t"
  6751. "stm %[r]!, {r4, r5}\n\t"
  6752. "ldm %[a]!, {r4, r5}\n\t"
  6753. "ldm %[b]!, {r6, r8}\n\t"
  6754. "adcs r4, r4, r6\n\t"
  6755. "adcs r5, r5, r8\n\t"
  6756. "stm %[r]!, {r4, r5}\n\t"
  6757. "ldm %[a]!, {r4, r5}\n\t"
  6758. "ldm %[b]!, {r6, r8}\n\t"
  6759. "adcs r4, r4, r6\n\t"
  6760. "adcs r5, r5, r8\n\t"
  6761. "stm %[r]!, {r4, r5}\n\t"
  6762. "ldm %[a]!, {r4, r5}\n\t"
  6763. "ldm %[b]!, {r6, r8}\n\t"
  6764. "adcs r4, r4, r6\n\t"
  6765. "adcs r5, r5, r8\n\t"
  6766. "stm %[r]!, {r4, r5}\n\t"
  6767. "ldm %[a]!, {r4, r5}\n\t"
  6768. "ldm %[b]!, {r6, r8}\n\t"
  6769. "adcs r4, r4, r6\n\t"
  6770. "adcs r5, r5, r8\n\t"
  6771. "stm %[r]!, {r4, r5}\n\t"
  6772. "ldm %[a]!, {r4, r5}\n\t"
  6773. "ldm %[b]!, {r6, r8}\n\t"
  6774. "adcs r4, r4, r6\n\t"
  6775. "adcs r5, r5, r8\n\t"
  6776. "stm %[r]!, {r4, r5}\n\t"
  6777. "ldm %[a]!, {r4, r5}\n\t"
  6778. "ldm %[b]!, {r6, r8}\n\t"
  6779. "adcs r4, r4, r6\n\t"
  6780. "adcs r5, r5, r8\n\t"
  6781. "stm %[r]!, {r4, r5}\n\t"
  6782. "ldm %[a]!, {r4, r5}\n\t"
  6783. "ldm %[b]!, {r6, r8}\n\t"
  6784. "adcs r4, r4, r6\n\t"
  6785. "adcs r5, r5, r8\n\t"
  6786. "stm %[r]!, {r4, r5}\n\t"
  6787. "ldm %[a]!, {r4, r5}\n\t"
  6788. "ldm %[b]!, {r6, r8}\n\t"
  6789. "adcs r4, r4, r6\n\t"
  6790. "adcs r5, r5, r8\n\t"
  6791. "stm %[r]!, {r4, r5}\n\t"
  6792. "ldm %[a]!, {r4, r5}\n\t"
  6793. "ldm %[b]!, {r6, r8}\n\t"
  6794. "adcs r4, r4, r6\n\t"
  6795. "adcs r5, r5, r8\n\t"
  6796. "stm %[r]!, {r4, r5}\n\t"
  6797. "ldm %[a]!, {r4, r5}\n\t"
  6798. "ldm %[b]!, {r6, r8}\n\t"
  6799. "adcs r4, r4, r6\n\t"
  6800. "adcs r5, r5, r8\n\t"
  6801. "stm %[r]!, {r4, r5}\n\t"
  6802. "ldm %[a]!, {r4, r5}\n\t"
  6803. "ldm %[b]!, {r6, r8}\n\t"
  6804. "adcs r4, r4, r6\n\t"
  6805. "adcs r5, r5, r8\n\t"
  6806. "stm %[r]!, {r4, r5}\n\t"
  6807. "ldm %[a]!, {r4, r5}\n\t"
  6808. "ldm %[b]!, {r6, r8}\n\t"
  6809. "adcs r4, r4, r6\n\t"
  6810. "adcs r5, r5, r8\n\t"
  6811. "stm %[r]!, {r4, r5}\n\t"
  6812. "ldm %[a]!, {r4, r5}\n\t"
  6813. "ldm %[b]!, {r6, r8}\n\t"
  6814. "adcs r4, r4, r6\n\t"
  6815. "adcs r5, r5, r8\n\t"
  6816. "stm %[r]!, {r4, r5}\n\t"
  6817. "ldm %[a]!, {r4, r5}\n\t"
  6818. "ldm %[b]!, {r6, r8}\n\t"
  6819. "adcs r4, r4, r6\n\t"
  6820. "adcs r5, r5, r8\n\t"
  6821. "stm %[r]!, {r4, r5}\n\t"
  6822. "ldm %[a]!, {r4, r5}\n\t"
  6823. "ldm %[b]!, {r6, r8}\n\t"
  6824. "adcs r4, r4, r6\n\t"
  6825. "adcs r5, r5, r8\n\t"
  6826. "stm %[r]!, {r4, r5}\n\t"
  6827. "ldm %[a]!, {r4, r5}\n\t"
  6828. "ldm %[b]!, {r6, r8}\n\t"
  6829. "adcs r4, r4, r6\n\t"
  6830. "adcs r5, r5, r8\n\t"
  6831. "stm %[r]!, {r4, r5}\n\t"
  6832. "ldm %[a]!, {r4, r5}\n\t"
  6833. "ldm %[b]!, {r6, r8}\n\t"
  6834. "adcs r4, r4, r6\n\t"
  6835. "adcs r5, r5, r8\n\t"
  6836. "stm %[r]!, {r4, r5}\n\t"
  6837. "ldm %[a]!, {r4, r5}\n\t"
  6838. "ldm %[b]!, {r6, r8}\n\t"
  6839. "adcs r4, r4, r6\n\t"
  6840. "adcs r5, r5, r8\n\t"
  6841. "stm %[r]!, {r4, r5}\n\t"
  6842. "ldm %[a]!, {r4, r5}\n\t"
  6843. "ldm %[b]!, {r6, r8}\n\t"
  6844. "adcs r4, r4, r6\n\t"
  6845. "adcs r5, r5, r8\n\t"
  6846. "stm %[r]!, {r4, r5}\n\t"
  6847. "ldm %[a]!, {r4, r5}\n\t"
  6848. "ldm %[b]!, {r6, r8}\n\t"
  6849. "adcs r4, r4, r6\n\t"
  6850. "adcs r5, r5, r8\n\t"
  6851. "stm %[r]!, {r4, r5}\n\t"
  6852. "ldm %[a]!, {r4, r5}\n\t"
  6853. "ldm %[b]!, {r6, r8}\n\t"
  6854. "adcs r4, r4, r6\n\t"
  6855. "adcs r5, r5, r8\n\t"
  6856. "stm %[r]!, {r4, r5}\n\t"
  6857. "ldm %[a]!, {r4, r5}\n\t"
  6858. "ldm %[b]!, {r6, r8}\n\t"
  6859. "adcs r4, r4, r6\n\t"
  6860. "adcs r5, r5, r8\n\t"
  6861. "stm %[r]!, {r4, r5}\n\t"
  6862. "ldm %[a]!, {r4, r5}\n\t"
  6863. "ldm %[b]!, {r6, r8}\n\t"
  6864. "adcs r4, r4, r6\n\t"
  6865. "adcs r5, r5, r8\n\t"
  6866. "stm %[r]!, {r4, r5}\n\t"
  6867. "ldm %[a]!, {r4, r5}\n\t"
  6868. "ldm %[b]!, {r6, r8}\n\t"
  6869. "adcs r4, r4, r6\n\t"
  6870. "adcs r5, r5, r8\n\t"
  6871. "stm %[r]!, {r4, r5}\n\t"
  6872. "ldm %[a]!, {r4, r5}\n\t"
  6873. "ldm %[b]!, {r6, r8}\n\t"
  6874. "adcs r4, r4, r6\n\t"
  6875. "adcs r5, r5, r8\n\t"
  6876. "stm %[r]!, {r4, r5}\n\t"
  6877. "ldm %[a]!, {r4, r5}\n\t"
  6878. "ldm %[b]!, {r6, r8}\n\t"
  6879. "adcs r4, r4, r6\n\t"
  6880. "adcs r5, r5, r8\n\t"
  6881. "stm %[r]!, {r4, r5}\n\t"
  6882. "ldm %[a]!, {r4, r5}\n\t"
  6883. "ldm %[b]!, {r6, r8}\n\t"
  6884. "adcs r4, r4, r6\n\t"
  6885. "adcs r5, r5, r8\n\t"
  6886. "stm %[r]!, {r4, r5}\n\t"
  6887. "ldm %[a]!, {r4, r5}\n\t"
  6888. "ldm %[b]!, {r6, r8}\n\t"
  6889. "adcs r4, r4, r6\n\t"
  6890. "adcs r5, r5, r8\n\t"
  6891. "stm %[r]!, {r4, r5}\n\t"
  6892. "mov %[c], #0\n\t"
  6893. "adc %[c], %[c], %[c]\n\t"
  6894. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  6895. :
  6896. : "memory", "r4", "r5", "r6", "r8"
  6897. );
  6898. return c;
  6899. }
  6900. /* AND m into each word of a and store in r.
  6901. *
  6902. * r A single precision integer.
  6903. * a A single precision integer.
  6904. * m Mask to AND against each digit.
  6905. */
  6906. static void sp_3072_mask_48(sp_digit* r, const sp_digit* a, sp_digit m)
  6907. {
  6908. #ifdef WOLFSSL_SP_SMALL
  6909. int i;
  6910. for (i=0; i<48; i++) {
  6911. r[i] = a[i] & m;
  6912. }
  6913. #else
  6914. int i;
  6915. for (i = 0; i < 48; i += 8) {
  6916. r[i+0] = a[i+0] & m;
  6917. r[i+1] = a[i+1] & m;
  6918. r[i+2] = a[i+2] & m;
  6919. r[i+3] = a[i+3] & m;
  6920. r[i+4] = a[i+4] & m;
  6921. r[i+5] = a[i+5] & m;
  6922. r[i+6] = a[i+6] & m;
  6923. r[i+7] = a[i+7] & m;
  6924. }
  6925. #endif
  6926. }
  6927. /* Multiply a and b into r. (r = a * b)
  6928. *
  6929. * r A single precision integer.
  6930. * a A single precision integer.
  6931. * b A single precision integer.
  6932. */
  6933. SP_NOINLINE static void sp_3072_mul_96(sp_digit* r, const sp_digit* a,
  6934. const sp_digit* b)
  6935. {
  6936. sp_digit* z0 = r;
  6937. sp_digit z1[96];
  6938. sp_digit a1[48];
  6939. sp_digit b1[48];
  6940. sp_digit* z2 = r + 96;
  6941. sp_digit u;
  6942. sp_digit ca;
  6943. sp_digit cb;
  6944. ca = sp_3072_add_48(a1, a, &a[48]);
  6945. cb = sp_3072_add_48(b1, b, &b[48]);
  6946. u = ca & cb;
  6947. sp_3072_mul_48(z2, &a[48], &b[48]);
  6948. sp_3072_mul_48(z0, a, b);
  6949. sp_3072_mul_48(z1, a1, b1);
  6950. u += sp_3072_sub_in_place_96(z1, z0);
  6951. u += sp_3072_sub_in_place_96(z1, z2);
  6952. sp_3072_mask_48(a1, a1, 0 - cb);
  6953. u += sp_3072_add_48(z1 + 48, z1 + 48, a1);
  6954. sp_3072_mask_48(b1, b1, 0 - ca);
  6955. u += sp_3072_add_48(z1 + 48, z1 + 48, b1);
  6956. u += sp_3072_add_96(r + 48, r + 48, z1);
  6957. XMEMSET(a1 + 1, 0, sizeof(sp_digit) * (48 - 1));
  6958. a1[0] = u;
  6959. (void)sp_3072_add_48(r + 144, r + 144, a1);
  6960. }
  6961. /* Square a and put result in r. (r = a * a)
  6962. *
  6963. * r A single precision integer.
  6964. * a A single precision integer.
  6965. */
  6966. SP_NOINLINE static void sp_3072_sqr_12(sp_digit* r, const sp_digit* a)
  6967. {
  6968. __asm__ __volatile__ (
  6969. "mov r3, #0\n\t"
  6970. "mov r4, #0\n\t"
  6971. "mov r5, #0\n\t"
  6972. "mov r9, r3\n\t"
  6973. "mov r12, %[r]\n\t"
  6974. "mov r6, #96\n\t"
  6975. "neg r6, r6\n\t"
  6976. "add sp, sp, r6\n\t"
  6977. "mov r11, sp\n\t"
  6978. "mov r10, %[a]\n\t"
  6979. "\n1:\n\t"
  6980. "mov %[r], #0\n\t"
  6981. "mov r6, #44\n\t"
  6982. "mov %[a], r9\n\t"
  6983. "subs %[a], %[a], r6\n\t"
  6984. "sbc r6, r6, r6\n\t"
  6985. "mvn r6, r6\n\t"
  6986. "and %[a], %[a], r6\n\t"
  6987. "mov r2, r9\n\t"
  6988. "sub r2, r2, %[a]\n\t"
  6989. "add %[a], %[a], r10\n\t"
  6990. "add r2, r2, r10\n\t"
  6991. "\n2:\n\t"
  6992. "cmp r2, %[a]\n\t"
  6993. #ifdef __GNUC__
  6994. "beq 4f\n\t"
  6995. #else
  6996. "beq.n 4f\n\t"
  6997. #endif /* __GNUC__ */
  6998. /* Multiply * 2: Start */
  6999. "ldr r6, [%[a]]\n\t"
  7000. "ldr r8, [r2]\n\t"
  7001. "umull r6, r8, r6, r8\n\t"
  7002. "adds r3, r3, r6\n\t"
  7003. "adcs r4, r4, r8\n\t"
  7004. "adc r5, r5, %[r]\n\t"
  7005. "adds r3, r3, r6\n\t"
  7006. "adcs r4, r4, r8\n\t"
  7007. "adc r5, r5, %[r]\n\t"
  7008. /* Multiply * 2: Done */
  7009. #ifdef __GNUC__
  7010. "bal 5f\n\t"
  7011. #else
  7012. "bal.n 5f\n\t"
  7013. #endif /* __GNUC__ */
  7014. "\n4:\n\t"
  7015. /* Square: Start */
  7016. "ldr r6, [%[a]]\n\t"
  7017. "umull r6, r8, r6, r6\n\t"
  7018. "adds r3, r3, r6\n\t"
  7019. "adcs r4, r4, r8\n\t"
  7020. "adc r5, r5, %[r]\n\t"
  7021. /* Square: Done */
  7022. "\n5:\n\t"
  7023. "add %[a], %[a], #4\n\t"
  7024. "sub r2, r2, #4\n\t"
  7025. "mov r6, #48\n\t"
  7026. "add r6, r6, r10\n\t"
  7027. "cmp %[a], r6\n\t"
  7028. #ifdef __GNUC__
  7029. "beq 3f\n\t"
  7030. #else
  7031. "beq.n 3f\n\t"
  7032. #endif /* __GNUC__ */
  7033. "cmp %[a], r2\n\t"
  7034. #ifdef __GNUC__
  7035. "bgt 3f\n\t"
  7036. #else
  7037. "bgt.n 3f\n\t"
  7038. #endif /* __GNUC__ */
  7039. "mov r8, r9\n\t"
  7040. "add r8, r8, r10\n\t"
  7041. "cmp %[a], r8\n\t"
  7042. #ifdef __GNUC__
  7043. "ble 2b\n\t"
  7044. #else
  7045. "ble.n 2b\n\t"
  7046. #endif /* __GNUC__ */
  7047. "\n3:\n\t"
  7048. "mov %[r], r11\n\t"
  7049. "mov r8, r9\n\t"
  7050. "str r3, [%[r], r8]\n\t"
  7051. "mov r3, r4\n\t"
  7052. "mov r4, r5\n\t"
  7053. "mov r5, #0\n\t"
  7054. "add r8, r8, #4\n\t"
  7055. "mov r9, r8\n\t"
  7056. "mov r6, #88\n\t"
  7057. "cmp r8, r6\n\t"
  7058. #ifdef __GNUC__
  7059. "ble 1b\n\t"
  7060. #else
  7061. "ble.n 1b\n\t"
  7062. #endif /* __GNUC__ */
  7063. "mov %[a], r10\n\t"
  7064. "str r3, [%[r], r8]\n\t"
  7065. "mov %[r], r12\n\t"
  7066. "mov %[a], r11\n\t"
  7067. "mov r3, #92\n\t"
  7068. "\n4:\n\t"
  7069. "ldr r6, [%[a], r3]\n\t"
  7070. "str r6, [%[r], r3]\n\t"
  7071. "subs r3, r3, #4\n\t"
  7072. #ifdef __GNUC__
  7073. "bge 4b\n\t"
  7074. #else
  7075. "bge.n 4b\n\t"
  7076. #endif /* __GNUC__ */
  7077. "mov r6, #96\n\t"
  7078. "add sp, sp, r6\n\t"
  7079. :
  7080. : [r] "r" (r), [a] "r" (a)
  7081. : "memory", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12"
  7082. );
  7083. }
  7084. /* Sub b from a into r. (r = a - b)
  7085. *
  7086. * r A single precision integer.
  7087. * a A single precision integer.
  7088. * b A single precision integer.
  7089. */
  7090. SP_NOINLINE static sp_digit sp_3072_sub_12(sp_digit* r, const sp_digit* a,
  7091. const sp_digit* b)
  7092. {
  7093. sp_digit c = 0;
  7094. __asm__ __volatile__ (
  7095. "ldm %[a]!, {r4, r5}\n\t"
  7096. "ldm %[b]!, {r6, r8}\n\t"
  7097. "subs r4, r4, r6\n\t"
  7098. "sbcs r5, r5, r8\n\t"
  7099. "stm %[r]!, {r4, r5}\n\t"
  7100. "ldm %[a]!, {r4, r5}\n\t"
  7101. "ldm %[b]!, {r6, r8}\n\t"
  7102. "sbcs r4, r4, r6\n\t"
  7103. "sbcs r5, r5, r8\n\t"
  7104. "stm %[r]!, {r4, r5}\n\t"
  7105. "ldm %[a]!, {r4, r5}\n\t"
  7106. "ldm %[b]!, {r6, r8}\n\t"
  7107. "sbcs r4, r4, r6\n\t"
  7108. "sbcs r5, r5, r8\n\t"
  7109. "stm %[r]!, {r4, r5}\n\t"
  7110. "ldm %[a]!, {r4, r5}\n\t"
  7111. "ldm %[b]!, {r6, r8}\n\t"
  7112. "sbcs r4, r4, r6\n\t"
  7113. "sbcs r5, r5, r8\n\t"
  7114. "stm %[r]!, {r4, r5}\n\t"
  7115. "ldm %[a]!, {r4, r5}\n\t"
  7116. "ldm %[b]!, {r6, r8}\n\t"
  7117. "sbcs r4, r4, r6\n\t"
  7118. "sbcs r5, r5, r8\n\t"
  7119. "stm %[r]!, {r4, r5}\n\t"
  7120. "ldm %[a]!, {r4, r5}\n\t"
  7121. "ldm %[b]!, {r6, r8}\n\t"
  7122. "sbcs r4, r4, r6\n\t"
  7123. "sbcs r5, r5, r8\n\t"
  7124. "stm %[r]!, {r4, r5}\n\t"
  7125. "sbc %[c], %[c], %[c]\n\t"
  7126. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  7127. :
  7128. : "memory", "r4", "r5", "r6", "r8"
  7129. );
  7130. return c;
  7131. }
  7132. /* Square a and put result in r. (r = a * a)
  7133. *
  7134. * r A single precision integer.
  7135. * a A single precision integer.
  7136. */
  7137. SP_NOINLINE static void sp_3072_sqr_24(sp_digit* r, const sp_digit* a)
  7138. {
  7139. sp_digit* z0 = r;
  7140. sp_digit* z2 = r + 24;
  7141. sp_digit z1[24];
  7142. sp_digit* a1 = z1;
  7143. sp_digit zero[12];
  7144. sp_digit u;
  7145. sp_digit mask;
  7146. sp_digit* p1;
  7147. sp_digit* p2;
  7148. XMEMSET(zero, 0, sizeof(sp_digit) * 12);
  7149. mask = sp_3072_sub_12(a1, a, &a[12]);
  7150. p1 = (sp_digit*)(((sp_digit)zero & mask ) | ((sp_digit)a1 & (~mask)));
  7151. p2 = (sp_digit*)(((sp_digit)zero & (~mask)) | ((sp_digit)a1 & mask ));
  7152. (void)sp_3072_sub_12(a1, p1, p2);
  7153. sp_3072_sqr_12(z2, &a[12]);
  7154. sp_3072_sqr_12(z0, a);
  7155. sp_3072_sqr_12(z1, a1);
  7156. u = 0;
  7157. u -= sp_3072_sub_in_place_24(z1, z2);
  7158. u -= sp_3072_sub_in_place_24(z1, z0);
  7159. u += sp_3072_sub_in_place_24(r + 12, z1);
  7160. zero[0] = u;
  7161. (void)sp_3072_add_12(r + 36, r + 36, zero);
  7162. }
  7163. /* Sub b from a into r. (r = a - b)
  7164. *
  7165. * r A single precision integer.
  7166. * a A single precision integer.
  7167. * b A single precision integer.
  7168. */
  7169. SP_NOINLINE static sp_digit sp_3072_sub_24(sp_digit* r, const sp_digit* a,
  7170. const sp_digit* b)
  7171. {
  7172. sp_digit c = 0;
  7173. __asm__ __volatile__ (
  7174. "ldm %[a]!, {r4, r5}\n\t"
  7175. "ldm %[b]!, {r6, r8}\n\t"
  7176. "subs r4, r4, r6\n\t"
  7177. "sbcs r5, r5, r8\n\t"
  7178. "stm %[r]!, {r4, r5}\n\t"
  7179. "ldm %[a]!, {r4, r5}\n\t"
  7180. "ldm %[b]!, {r6, r8}\n\t"
  7181. "sbcs r4, r4, r6\n\t"
  7182. "sbcs r5, r5, r8\n\t"
  7183. "stm %[r]!, {r4, r5}\n\t"
  7184. "ldm %[a]!, {r4, r5}\n\t"
  7185. "ldm %[b]!, {r6, r8}\n\t"
  7186. "sbcs r4, r4, r6\n\t"
  7187. "sbcs r5, r5, r8\n\t"
  7188. "stm %[r]!, {r4, r5}\n\t"
  7189. "ldm %[a]!, {r4, r5}\n\t"
  7190. "ldm %[b]!, {r6, r8}\n\t"
  7191. "sbcs r4, r4, r6\n\t"
  7192. "sbcs r5, r5, r8\n\t"
  7193. "stm %[r]!, {r4, r5}\n\t"
  7194. "ldm %[a]!, {r4, r5}\n\t"
  7195. "ldm %[b]!, {r6, r8}\n\t"
  7196. "sbcs r4, r4, r6\n\t"
  7197. "sbcs r5, r5, r8\n\t"
  7198. "stm %[r]!, {r4, r5}\n\t"
  7199. "ldm %[a]!, {r4, r5}\n\t"
  7200. "ldm %[b]!, {r6, r8}\n\t"
  7201. "sbcs r4, r4, r6\n\t"
  7202. "sbcs r5, r5, r8\n\t"
  7203. "stm %[r]!, {r4, r5}\n\t"
  7204. "ldm %[a]!, {r4, r5}\n\t"
  7205. "ldm %[b]!, {r6, r8}\n\t"
  7206. "sbcs r4, r4, r6\n\t"
  7207. "sbcs r5, r5, r8\n\t"
  7208. "stm %[r]!, {r4, r5}\n\t"
  7209. "ldm %[a]!, {r4, r5}\n\t"
  7210. "ldm %[b]!, {r6, r8}\n\t"
  7211. "sbcs r4, r4, r6\n\t"
  7212. "sbcs r5, r5, r8\n\t"
  7213. "stm %[r]!, {r4, r5}\n\t"
  7214. "ldm %[a]!, {r4, r5}\n\t"
  7215. "ldm %[b]!, {r6, r8}\n\t"
  7216. "sbcs r4, r4, r6\n\t"
  7217. "sbcs r5, r5, r8\n\t"
  7218. "stm %[r]!, {r4, r5}\n\t"
  7219. "ldm %[a]!, {r4, r5}\n\t"
  7220. "ldm %[b]!, {r6, r8}\n\t"
  7221. "sbcs r4, r4, r6\n\t"
  7222. "sbcs r5, r5, r8\n\t"
  7223. "stm %[r]!, {r4, r5}\n\t"
  7224. "ldm %[a]!, {r4, r5}\n\t"
  7225. "ldm %[b]!, {r6, r8}\n\t"
  7226. "sbcs r4, r4, r6\n\t"
  7227. "sbcs r5, r5, r8\n\t"
  7228. "stm %[r]!, {r4, r5}\n\t"
  7229. "ldm %[a]!, {r4, r5}\n\t"
  7230. "ldm %[b]!, {r6, r8}\n\t"
  7231. "sbcs r4, r4, r6\n\t"
  7232. "sbcs r5, r5, r8\n\t"
  7233. "stm %[r]!, {r4, r5}\n\t"
  7234. "sbc %[c], %[c], %[c]\n\t"
  7235. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  7236. :
  7237. : "memory", "r4", "r5", "r6", "r8"
  7238. );
  7239. return c;
  7240. }
  7241. /* Square a and put result in r. (r = a * a)
  7242. *
  7243. * r A single precision integer.
  7244. * a A single precision integer.
  7245. */
  7246. SP_NOINLINE static void sp_3072_sqr_48(sp_digit* r, const sp_digit* a)
  7247. {
  7248. sp_digit* z0 = r;
  7249. sp_digit* z2 = r + 48;
  7250. sp_digit z1[48];
  7251. sp_digit* a1 = z1;
  7252. sp_digit zero[24];
  7253. sp_digit u;
  7254. sp_digit mask;
  7255. sp_digit* p1;
  7256. sp_digit* p2;
  7257. XMEMSET(zero, 0, sizeof(sp_digit) * 24);
  7258. mask = sp_3072_sub_24(a1, a, &a[24]);
  7259. p1 = (sp_digit*)(((sp_digit)zero & mask ) | ((sp_digit)a1 & (~mask)));
  7260. p2 = (sp_digit*)(((sp_digit)zero & (~mask)) | ((sp_digit)a1 & mask ));
  7261. (void)sp_3072_sub_24(a1, p1, p2);
  7262. sp_3072_sqr_24(z2, &a[24]);
  7263. sp_3072_sqr_24(z0, a);
  7264. sp_3072_sqr_24(z1, a1);
  7265. u = 0;
  7266. u -= sp_3072_sub_in_place_48(z1, z2);
  7267. u -= sp_3072_sub_in_place_48(z1, z0);
  7268. u += sp_3072_sub_in_place_48(r + 24, z1);
  7269. zero[0] = u;
  7270. (void)sp_3072_add_24(r + 72, r + 72, zero);
  7271. }
  7272. /* Sub b from a into r. (r = a - b)
  7273. *
  7274. * r A single precision integer.
  7275. * a A single precision integer.
  7276. * b A single precision integer.
  7277. */
  7278. SP_NOINLINE static sp_digit sp_3072_sub_48(sp_digit* r, const sp_digit* a,
  7279. const sp_digit* b)
  7280. {
  7281. sp_digit c = 0;
  7282. __asm__ __volatile__ (
  7283. "ldm %[a]!, {r4, r5}\n\t"
  7284. "ldm %[b]!, {r6, r8}\n\t"
  7285. "subs r4, r4, r6\n\t"
  7286. "sbcs r5, r5, r8\n\t"
  7287. "stm %[r]!, {r4, r5}\n\t"
  7288. "ldm %[a]!, {r4, r5}\n\t"
  7289. "ldm %[b]!, {r6, r8}\n\t"
  7290. "sbcs r4, r4, r6\n\t"
  7291. "sbcs r5, r5, r8\n\t"
  7292. "stm %[r]!, {r4, r5}\n\t"
  7293. "ldm %[a]!, {r4, r5}\n\t"
  7294. "ldm %[b]!, {r6, r8}\n\t"
  7295. "sbcs r4, r4, r6\n\t"
  7296. "sbcs r5, r5, r8\n\t"
  7297. "stm %[r]!, {r4, r5}\n\t"
  7298. "ldm %[a]!, {r4, r5}\n\t"
  7299. "ldm %[b]!, {r6, r8}\n\t"
  7300. "sbcs r4, r4, r6\n\t"
  7301. "sbcs r5, r5, r8\n\t"
  7302. "stm %[r]!, {r4, r5}\n\t"
  7303. "ldm %[a]!, {r4, r5}\n\t"
  7304. "ldm %[b]!, {r6, r8}\n\t"
  7305. "sbcs r4, r4, r6\n\t"
  7306. "sbcs r5, r5, r8\n\t"
  7307. "stm %[r]!, {r4, r5}\n\t"
  7308. "ldm %[a]!, {r4, r5}\n\t"
  7309. "ldm %[b]!, {r6, r8}\n\t"
  7310. "sbcs r4, r4, r6\n\t"
  7311. "sbcs r5, r5, r8\n\t"
  7312. "stm %[r]!, {r4, r5}\n\t"
  7313. "ldm %[a]!, {r4, r5}\n\t"
  7314. "ldm %[b]!, {r6, r8}\n\t"
  7315. "sbcs r4, r4, r6\n\t"
  7316. "sbcs r5, r5, r8\n\t"
  7317. "stm %[r]!, {r4, r5}\n\t"
  7318. "ldm %[a]!, {r4, r5}\n\t"
  7319. "ldm %[b]!, {r6, r8}\n\t"
  7320. "sbcs r4, r4, r6\n\t"
  7321. "sbcs r5, r5, r8\n\t"
  7322. "stm %[r]!, {r4, r5}\n\t"
  7323. "ldm %[a]!, {r4, r5}\n\t"
  7324. "ldm %[b]!, {r6, r8}\n\t"
  7325. "sbcs r4, r4, r6\n\t"
  7326. "sbcs r5, r5, r8\n\t"
  7327. "stm %[r]!, {r4, r5}\n\t"
  7328. "ldm %[a]!, {r4, r5}\n\t"
  7329. "ldm %[b]!, {r6, r8}\n\t"
  7330. "sbcs r4, r4, r6\n\t"
  7331. "sbcs r5, r5, r8\n\t"
  7332. "stm %[r]!, {r4, r5}\n\t"
  7333. "ldm %[a]!, {r4, r5}\n\t"
  7334. "ldm %[b]!, {r6, r8}\n\t"
  7335. "sbcs r4, r4, r6\n\t"
  7336. "sbcs r5, r5, r8\n\t"
  7337. "stm %[r]!, {r4, r5}\n\t"
  7338. "ldm %[a]!, {r4, r5}\n\t"
  7339. "ldm %[b]!, {r6, r8}\n\t"
  7340. "sbcs r4, r4, r6\n\t"
  7341. "sbcs r5, r5, r8\n\t"
  7342. "stm %[r]!, {r4, r5}\n\t"
  7343. "ldm %[a]!, {r4, r5}\n\t"
  7344. "ldm %[b]!, {r6, r8}\n\t"
  7345. "sbcs r4, r4, r6\n\t"
  7346. "sbcs r5, r5, r8\n\t"
  7347. "stm %[r]!, {r4, r5}\n\t"
  7348. "ldm %[a]!, {r4, r5}\n\t"
  7349. "ldm %[b]!, {r6, r8}\n\t"
  7350. "sbcs r4, r4, r6\n\t"
  7351. "sbcs r5, r5, r8\n\t"
  7352. "stm %[r]!, {r4, r5}\n\t"
  7353. "ldm %[a]!, {r4, r5}\n\t"
  7354. "ldm %[b]!, {r6, r8}\n\t"
  7355. "sbcs r4, r4, r6\n\t"
  7356. "sbcs r5, r5, r8\n\t"
  7357. "stm %[r]!, {r4, r5}\n\t"
  7358. "ldm %[a]!, {r4, r5}\n\t"
  7359. "ldm %[b]!, {r6, r8}\n\t"
  7360. "sbcs r4, r4, r6\n\t"
  7361. "sbcs r5, r5, r8\n\t"
  7362. "stm %[r]!, {r4, r5}\n\t"
  7363. "ldm %[a]!, {r4, r5}\n\t"
  7364. "ldm %[b]!, {r6, r8}\n\t"
  7365. "sbcs r4, r4, r6\n\t"
  7366. "sbcs r5, r5, r8\n\t"
  7367. "stm %[r]!, {r4, r5}\n\t"
  7368. "ldm %[a]!, {r4, r5}\n\t"
  7369. "ldm %[b]!, {r6, r8}\n\t"
  7370. "sbcs r4, r4, r6\n\t"
  7371. "sbcs r5, r5, r8\n\t"
  7372. "stm %[r]!, {r4, r5}\n\t"
  7373. "ldm %[a]!, {r4, r5}\n\t"
  7374. "ldm %[b]!, {r6, r8}\n\t"
  7375. "sbcs r4, r4, r6\n\t"
  7376. "sbcs r5, r5, r8\n\t"
  7377. "stm %[r]!, {r4, r5}\n\t"
  7378. "ldm %[a]!, {r4, r5}\n\t"
  7379. "ldm %[b]!, {r6, r8}\n\t"
  7380. "sbcs r4, r4, r6\n\t"
  7381. "sbcs r5, r5, r8\n\t"
  7382. "stm %[r]!, {r4, r5}\n\t"
  7383. "ldm %[a]!, {r4, r5}\n\t"
  7384. "ldm %[b]!, {r6, r8}\n\t"
  7385. "sbcs r4, r4, r6\n\t"
  7386. "sbcs r5, r5, r8\n\t"
  7387. "stm %[r]!, {r4, r5}\n\t"
  7388. "ldm %[a]!, {r4, r5}\n\t"
  7389. "ldm %[b]!, {r6, r8}\n\t"
  7390. "sbcs r4, r4, r6\n\t"
  7391. "sbcs r5, r5, r8\n\t"
  7392. "stm %[r]!, {r4, r5}\n\t"
  7393. "ldm %[a]!, {r4, r5}\n\t"
  7394. "ldm %[b]!, {r6, r8}\n\t"
  7395. "sbcs r4, r4, r6\n\t"
  7396. "sbcs r5, r5, r8\n\t"
  7397. "stm %[r]!, {r4, r5}\n\t"
  7398. "ldm %[a]!, {r4, r5}\n\t"
  7399. "ldm %[b]!, {r6, r8}\n\t"
  7400. "sbcs r4, r4, r6\n\t"
  7401. "sbcs r5, r5, r8\n\t"
  7402. "stm %[r]!, {r4, r5}\n\t"
  7403. "sbc %[c], %[c], %[c]\n\t"
  7404. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  7405. :
  7406. : "memory", "r4", "r5", "r6", "r8"
  7407. );
  7408. return c;
  7409. }
  7410. /* Square a and put result in r. (r = a * a)
  7411. *
  7412. * r A single precision integer.
  7413. * a A single precision integer.
  7414. */
  7415. SP_NOINLINE static void sp_3072_sqr_96(sp_digit* r, const sp_digit* a)
  7416. {
  7417. sp_digit* z0 = r;
  7418. sp_digit* z2 = r + 96;
  7419. sp_digit z1[96];
  7420. sp_digit* a1 = z1;
  7421. sp_digit zero[48];
  7422. sp_digit u;
  7423. sp_digit mask;
  7424. sp_digit* p1;
  7425. sp_digit* p2;
  7426. XMEMSET(zero, 0, sizeof(sp_digit) * 48);
  7427. mask = sp_3072_sub_48(a1, a, &a[48]);
  7428. p1 = (sp_digit*)(((sp_digit)zero & mask ) | ((sp_digit)a1 & (~mask)));
  7429. p2 = (sp_digit*)(((sp_digit)zero & (~mask)) | ((sp_digit)a1 & mask ));
  7430. (void)sp_3072_sub_48(a1, p1, p2);
  7431. sp_3072_sqr_48(z2, &a[48]);
  7432. sp_3072_sqr_48(z0, a);
  7433. sp_3072_sqr_48(z1, a1);
  7434. u = 0;
  7435. u -= sp_3072_sub_in_place_96(z1, z2);
  7436. u -= sp_3072_sub_in_place_96(z1, z0);
  7437. u += sp_3072_sub_in_place_96(r + 48, z1);
  7438. zero[0] = u;
  7439. (void)sp_3072_add_48(r + 144, r + 144, zero);
  7440. }
  7441. #endif /* !WOLFSSL_SP_SMALL */
  7442. #ifdef WOLFSSL_SP_SMALL
  7443. /* Add b to a into r. (r = a + b)
  7444. *
  7445. * r A single precision integer.
  7446. * a A single precision integer.
  7447. * b A single precision integer.
  7448. */
  7449. SP_NOINLINE static sp_digit sp_3072_add_96(sp_digit* r, const sp_digit* a,
  7450. const sp_digit* b)
  7451. {
  7452. sp_digit c = 0;
  7453. __asm__ __volatile__ (
  7454. "mov r6, %[a]\n\t"
  7455. "mov r8, #0\n\t"
  7456. "add r6, r6, #384\n\t"
  7457. "sub r8, r8, #1\n\t"
  7458. "\n1:\n\t"
  7459. "adds %[c], %[c], r8\n\t"
  7460. "ldr r4, [%[a]]\n\t"
  7461. "ldr r5, [%[b]]\n\t"
  7462. "adcs r4, r4, r5\n\t"
  7463. "str r4, [%[r]]\n\t"
  7464. "mov %[c], #0\n\t"
  7465. "adc %[c], %[c], %[c]\n\t"
  7466. "add %[a], %[a], #4\n\t"
  7467. "add %[b], %[b], #4\n\t"
  7468. "add %[r], %[r], #4\n\t"
  7469. "cmp %[a], r6\n\t"
  7470. #ifdef __GNUC__
  7471. "bne 1b\n\t"
  7472. #else
  7473. "bne.n 1b\n\t"
  7474. #endif /* __GNUC__ */
  7475. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  7476. :
  7477. : "memory", "r4", "r5", "r6", "r8"
  7478. );
  7479. return c;
  7480. }
  7481. #endif /* WOLFSSL_SP_SMALL */
  7482. #ifdef WOLFSSL_SP_SMALL
  7483. /* Sub b from a into a. (a -= b)
  7484. *
  7485. * a A single precision integer.
  7486. * b A single precision integer.
  7487. */
  7488. SP_NOINLINE static sp_digit sp_3072_sub_in_place_96(sp_digit* a,
  7489. const sp_digit* b)
  7490. {
  7491. sp_digit c = 0;
  7492. __asm__ __volatile__ (
  7493. "mov r8, %[a]\n\t"
  7494. "add r8, r8, #384\n\t"
  7495. "\n1:\n\t"
  7496. "mov r5, #0\n\t"
  7497. "subs r5, r5, %[c]\n\t"
  7498. "ldr r3, [%[a]]\n\t"
  7499. "ldr r4, [%[a], #4]\n\t"
  7500. "ldr r5, [%[b]]\n\t"
  7501. "ldr r6, [%[b], #4]\n\t"
  7502. "sbcs r3, r3, r5\n\t"
  7503. "sbcs r4, r4, r6\n\t"
  7504. "str r3, [%[a]]\n\t"
  7505. "str r4, [%[a], #4]\n\t"
  7506. "sbc %[c], %[c], %[c]\n\t"
  7507. "add %[a], %[a], #8\n\t"
  7508. "add %[b], %[b], #8\n\t"
  7509. "cmp %[a], r8\n\t"
  7510. #ifdef __GNUC__
  7511. "bne 1b\n\t"
  7512. #else
  7513. "bne.n 1b\n\t"
  7514. #endif /* __GNUC__ */
  7515. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  7516. :
  7517. : "memory", "r3", "r4", "r5", "r6", "r8"
  7518. );
  7519. return c;
  7520. }
  7521. #endif /* WOLFSSL_SP_SMALL */
  7522. #ifdef WOLFSSL_SP_SMALL
  7523. /* Multiply a and b into r. (r = a * b)
  7524. *
  7525. * r A single precision integer.
  7526. * a A single precision integer.
  7527. * b A single precision integer.
  7528. */
  7529. SP_NOINLINE static void sp_3072_mul_96(sp_digit* r, const sp_digit* a,
  7530. const sp_digit* b)
  7531. {
  7532. sp_digit tmp_arr[96 * 2];
  7533. sp_digit* tmp = tmp_arr;
  7534. __asm__ __volatile__ (
  7535. "mov r3, #0\n\t"
  7536. "mov r4, #0\n\t"
  7537. "mov r9, r3\n\t"
  7538. "mov r12, %[r]\n\t"
  7539. "mov r10, %[a]\n\t"
  7540. "mov r11, %[b]\n\t"
  7541. "mov r6, #1\n\t"
  7542. "lsl r6, r6, #8\n\t"
  7543. "add r6, r6, #128\n\t"
  7544. "add r6, r6, r10\n\t"
  7545. "mov r14, r6\n\t"
  7546. "\n1:\n\t"
  7547. "mov %[r], #0\n\t"
  7548. "mov r5, #0\n\t"
  7549. "mov r6, #1\n\t"
  7550. "lsl r6, r6, #8\n\t"
  7551. "add r6, r6, #124\n\t"
  7552. "mov %[a], r9\n\t"
  7553. "subs %[a], %[a], r6\n\t"
  7554. "sbc r6, r6, r6\n\t"
  7555. "mvn r6, r6\n\t"
  7556. "and %[a], %[a], r6\n\t"
  7557. "mov %[b], r9\n\t"
  7558. "sub %[b], %[b], %[a]\n\t"
  7559. "add %[a], %[a], r10\n\t"
  7560. "add %[b], %[b], r11\n\t"
  7561. "\n2:\n\t"
  7562. /* Multiply Start */
  7563. "ldr r6, [%[a]]\n\t"
  7564. "ldr r8, [%[b]]\n\t"
  7565. "umull r6, r8, r6, r8\n\t"
  7566. "adds r3, r3, r6\n\t"
  7567. "adcs r4, r4, r8\n\t"
  7568. "adc r5, r5, %[r]\n\t"
  7569. /* Multiply Done */
  7570. "add %[a], %[a], #4\n\t"
  7571. "sub %[b], %[b], #4\n\t"
  7572. "cmp %[a], r14\n\t"
  7573. #ifdef __GNUC__
  7574. "beq 3f\n\t"
  7575. #else
  7576. "beq.n 3f\n\t"
  7577. #endif /* __GNUC__ */
  7578. "mov r6, r9\n\t"
  7579. "add r6, r6, r10\n\t"
  7580. "cmp %[a], r6\n\t"
  7581. #ifdef __GNUC__
  7582. "ble 2b\n\t"
  7583. #else
  7584. "ble.n 2b\n\t"
  7585. #endif /* __GNUC__ */
  7586. "\n3:\n\t"
  7587. "mov %[r], r12\n\t"
  7588. "mov r8, r9\n\t"
  7589. "str r3, [%[r], r8]\n\t"
  7590. "mov r3, r4\n\t"
  7591. "mov r4, r5\n\t"
  7592. "add r8, r8, #4\n\t"
  7593. "mov r9, r8\n\t"
  7594. "mov r6, #2\n\t"
  7595. "lsl r6, r6, #8\n\t"
  7596. "add r6, r6, #248\n\t"
  7597. "cmp r8, r6\n\t"
  7598. #ifdef __GNUC__
  7599. "ble 1b\n\t"
  7600. #else
  7601. "ble.n 1b\n\t"
  7602. #endif /* __GNUC__ */
  7603. "str r3, [%[r], r8]\n\t"
  7604. "mov %[a], r10\n\t"
  7605. "mov %[b], r11\n\t"
  7606. :
  7607. : [r] "r" (tmp), [a] "r" (a), [b] "r" (b)
  7608. : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  7609. );
  7610. XMEMCPY(r, tmp_arr, sizeof(tmp_arr));
  7611. }
  7612. /* Square a and put result in r. (r = a * a)
  7613. *
  7614. * r A single precision integer.
  7615. * a A single precision integer.
  7616. */
  7617. SP_NOINLINE static void sp_3072_sqr_96(sp_digit* r, const sp_digit* a)
  7618. {
  7619. __asm__ __volatile__ (
  7620. "mov r3, #0\n\t"
  7621. "mov r4, #0\n\t"
  7622. "mov r5, #0\n\t"
  7623. "mov r9, r3\n\t"
  7624. "mov r12, %[r]\n\t"
  7625. "mov r6, #3\n\t"
  7626. "lsl r6, r6, #8\n\t"
  7627. "neg r6, r6\n\t"
  7628. "add sp, sp, r6\n\t"
  7629. "mov r11, sp\n\t"
  7630. "mov r10, %[a]\n\t"
  7631. "\n1:\n\t"
  7632. "mov %[r], #0\n\t"
  7633. "mov r6, #1\n\t"
  7634. "lsl r6, r6, #8\n\t"
  7635. "add r6, r6, #124\n\t"
  7636. "mov %[a], r9\n\t"
  7637. "subs %[a], %[a], r6\n\t"
  7638. "sbc r6, r6, r6\n\t"
  7639. "mvn r6, r6\n\t"
  7640. "and %[a], %[a], r6\n\t"
  7641. "mov r2, r9\n\t"
  7642. "sub r2, r2, %[a]\n\t"
  7643. "add %[a], %[a], r10\n\t"
  7644. "add r2, r2, r10\n\t"
  7645. "\n2:\n\t"
  7646. "cmp r2, %[a]\n\t"
  7647. #ifdef __GNUC__
  7648. "beq 4f\n\t"
  7649. #else
  7650. "beq.n 4f\n\t"
  7651. #endif /* __GNUC__ */
  7652. /* Multiply * 2: Start */
  7653. "ldr r6, [%[a]]\n\t"
  7654. "ldr r8, [r2]\n\t"
  7655. "umull r6, r8, r6, r8\n\t"
  7656. "adds r3, r3, r6\n\t"
  7657. "adcs r4, r4, r8\n\t"
  7658. "adc r5, r5, %[r]\n\t"
  7659. "adds r3, r3, r6\n\t"
  7660. "adcs r4, r4, r8\n\t"
  7661. "adc r5, r5, %[r]\n\t"
  7662. /* Multiply * 2: Done */
  7663. #ifdef __GNUC__
  7664. "bal 5f\n\t"
  7665. #else
  7666. "bal.n 5f\n\t"
  7667. #endif /* __GNUC__ */
  7668. "\n4:\n\t"
  7669. /* Square: Start */
  7670. "ldr r6, [%[a]]\n\t"
  7671. "umull r6, r8, r6, r6\n\t"
  7672. "adds r3, r3, r6\n\t"
  7673. "adcs r4, r4, r8\n\t"
  7674. "adc r5, r5, %[r]\n\t"
  7675. /* Square: Done */
  7676. "\n5:\n\t"
  7677. "add %[a], %[a], #4\n\t"
  7678. "sub r2, r2, #4\n\t"
  7679. "mov r6, #1\n\t"
  7680. "lsl r6, r6, #8\n\t"
  7681. "add r6, r6, #128\n\t"
  7682. "add r6, r6, r10\n\t"
  7683. "cmp %[a], r6\n\t"
  7684. #ifdef __GNUC__
  7685. "beq 3f\n\t"
  7686. #else
  7687. "beq.n 3f\n\t"
  7688. #endif /* __GNUC__ */
  7689. "cmp %[a], r2\n\t"
  7690. #ifdef __GNUC__
  7691. "bgt 3f\n\t"
  7692. #else
  7693. "bgt.n 3f\n\t"
  7694. #endif /* __GNUC__ */
  7695. "mov r8, r9\n\t"
  7696. "add r8, r8, r10\n\t"
  7697. "cmp %[a], r8\n\t"
  7698. #ifdef __GNUC__
  7699. "ble 2b\n\t"
  7700. #else
  7701. "ble.n 2b\n\t"
  7702. #endif /* __GNUC__ */
  7703. "\n3:\n\t"
  7704. "mov %[r], r11\n\t"
  7705. "mov r8, r9\n\t"
  7706. "str r3, [%[r], r8]\n\t"
  7707. "mov r3, r4\n\t"
  7708. "mov r4, r5\n\t"
  7709. "mov r5, #0\n\t"
  7710. "add r8, r8, #4\n\t"
  7711. "mov r9, r8\n\t"
  7712. "mov r6, #2\n\t"
  7713. "lsl r6, r6, #8\n\t"
  7714. "add r6, r6, #248\n\t"
  7715. "cmp r8, r6\n\t"
  7716. #ifdef __GNUC__
  7717. "ble 1b\n\t"
  7718. #else
  7719. "ble.n 1b\n\t"
  7720. #endif /* __GNUC__ */
  7721. "mov %[a], r10\n\t"
  7722. "str r3, [%[r], r8]\n\t"
  7723. "mov %[r], r12\n\t"
  7724. "mov %[a], r11\n\t"
  7725. "mov r3, #2\n\t"
  7726. "lsl r3, r3, #8\n\t"
  7727. "add r3, r3, #252\n\t"
  7728. "\n4:\n\t"
  7729. "ldr r6, [%[a], r3]\n\t"
  7730. "str r6, [%[r], r3]\n\t"
  7731. "subs r3, r3, #4\n\t"
  7732. #ifdef __GNUC__
  7733. "bge 4b\n\t"
  7734. #else
  7735. "bge.n 4b\n\t"
  7736. #endif /* __GNUC__ */
  7737. "mov r6, #3\n\t"
  7738. "lsl r6, r6, #8\n\t"
  7739. "add sp, sp, r6\n\t"
  7740. :
  7741. : [r] "r" (r), [a] "r" (a)
  7742. : "memory", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12"
  7743. );
  7744. }
  7745. #endif /* WOLFSSL_SP_SMALL */
  7746. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || defined(WOLFSSL_HAVE_SP_DH)
  7747. #ifdef WOLFSSL_SP_SMALL
  7748. /* AND m into each word of a and store in r.
  7749. *
  7750. * r A single precision integer.
  7751. * a A single precision integer.
  7752. * m Mask to AND against each digit.
  7753. */
  7754. static void sp_3072_mask_48(sp_digit* r, const sp_digit* a, sp_digit m)
  7755. {
  7756. int i;
  7757. for (i=0; i<48; i++) {
  7758. r[i] = a[i] & m;
  7759. }
  7760. }
  7761. #endif /* WOLFSSL_SP_SMALL */
  7762. #ifdef WOLFSSL_SP_SMALL
  7763. /* Add b to a into r. (r = a + b)
  7764. *
  7765. * r A single precision integer.
  7766. * a A single precision integer.
  7767. * b A single precision integer.
  7768. */
  7769. SP_NOINLINE static sp_digit sp_3072_add_48(sp_digit* r, const sp_digit* a,
  7770. const sp_digit* b)
  7771. {
  7772. sp_digit c = 0;
  7773. __asm__ __volatile__ (
  7774. "mov r6, %[a]\n\t"
  7775. "mov r8, #0\n\t"
  7776. "add r6, r6, #192\n\t"
  7777. "sub r8, r8, #1\n\t"
  7778. "\n1:\n\t"
  7779. "adds %[c], %[c], r8\n\t"
  7780. "ldr r4, [%[a]]\n\t"
  7781. "ldr r5, [%[b]]\n\t"
  7782. "adcs r4, r4, r5\n\t"
  7783. "str r4, [%[r]]\n\t"
  7784. "mov %[c], #0\n\t"
  7785. "adc %[c], %[c], %[c]\n\t"
  7786. "add %[a], %[a], #4\n\t"
  7787. "add %[b], %[b], #4\n\t"
  7788. "add %[r], %[r], #4\n\t"
  7789. "cmp %[a], r6\n\t"
  7790. #ifdef __GNUC__
  7791. "bne 1b\n\t"
  7792. #else
  7793. "bne.n 1b\n\t"
  7794. #endif /* __GNUC__ */
  7795. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  7796. :
  7797. : "memory", "r4", "r5", "r6", "r8"
  7798. );
  7799. return c;
  7800. }
  7801. #endif /* WOLFSSL_SP_SMALL */
  7802. #ifdef WOLFSSL_SP_SMALL
  7803. /* Sub b from a into a. (a -= b)
  7804. *
  7805. * a A single precision integer.
  7806. * b A single precision integer.
  7807. */
  7808. SP_NOINLINE static sp_digit sp_3072_sub_in_place_48(sp_digit* a,
  7809. const sp_digit* b)
  7810. {
  7811. sp_digit c = 0;
  7812. __asm__ __volatile__ (
  7813. "mov r8, %[a]\n\t"
  7814. "add r8, r8, #192\n\t"
  7815. "\n1:\n\t"
  7816. "mov r5, #0\n\t"
  7817. "subs r5, r5, %[c]\n\t"
  7818. "ldr r3, [%[a]]\n\t"
  7819. "ldr r4, [%[a], #4]\n\t"
  7820. "ldr r5, [%[b]]\n\t"
  7821. "ldr r6, [%[b], #4]\n\t"
  7822. "sbcs r3, r3, r5\n\t"
  7823. "sbcs r4, r4, r6\n\t"
  7824. "str r3, [%[a]]\n\t"
  7825. "str r4, [%[a], #4]\n\t"
  7826. "sbc %[c], %[c], %[c]\n\t"
  7827. "add %[a], %[a], #8\n\t"
  7828. "add %[b], %[b], #8\n\t"
  7829. "cmp %[a], r8\n\t"
  7830. #ifdef __GNUC__
  7831. "bne 1b\n\t"
  7832. #else
  7833. "bne.n 1b\n\t"
  7834. #endif /* __GNUC__ */
  7835. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  7836. :
  7837. : "memory", "r3", "r4", "r5", "r6", "r8"
  7838. );
  7839. return c;
  7840. }
  7841. #endif /* WOLFSSL_SP_SMALL */
  7842. #ifdef WOLFSSL_SP_SMALL
  7843. /* Multiply a and b into r. (r = a * b)
  7844. *
  7845. * r A single precision integer.
  7846. * a A single precision integer.
  7847. * b A single precision integer.
  7848. */
  7849. SP_NOINLINE static void sp_3072_mul_48(sp_digit* r, const sp_digit* a,
  7850. const sp_digit* b)
  7851. {
  7852. sp_digit tmp_arr[48 * 2];
  7853. sp_digit* tmp = tmp_arr;
  7854. __asm__ __volatile__ (
  7855. "mov r3, #0\n\t"
  7856. "mov r4, #0\n\t"
  7857. "mov r9, r3\n\t"
  7858. "mov r12, %[r]\n\t"
  7859. "mov r10, %[a]\n\t"
  7860. "mov r11, %[b]\n\t"
  7861. "mov r6, #192\n\t"
  7862. "add r6, r6, r10\n\t"
  7863. "mov r14, r6\n\t"
  7864. "\n1:\n\t"
  7865. "mov %[r], #0\n\t"
  7866. "mov r5, #0\n\t"
  7867. "mov r6, #188\n\t"
  7868. "mov %[a], r9\n\t"
  7869. "subs %[a], %[a], r6\n\t"
  7870. "sbc r6, r6, r6\n\t"
  7871. "mvn r6, r6\n\t"
  7872. "and %[a], %[a], r6\n\t"
  7873. "mov %[b], r9\n\t"
  7874. "sub %[b], %[b], %[a]\n\t"
  7875. "add %[a], %[a], r10\n\t"
  7876. "add %[b], %[b], r11\n\t"
  7877. "\n2:\n\t"
  7878. /* Multiply Start */
  7879. "ldr r6, [%[a]]\n\t"
  7880. "ldr r8, [%[b]]\n\t"
  7881. "umull r6, r8, r6, r8\n\t"
  7882. "adds r3, r3, r6\n\t"
  7883. "adcs r4, r4, r8\n\t"
  7884. "adc r5, r5, %[r]\n\t"
  7885. /* Multiply Done */
  7886. "add %[a], %[a], #4\n\t"
  7887. "sub %[b], %[b], #4\n\t"
  7888. "cmp %[a], r14\n\t"
  7889. #ifdef __GNUC__
  7890. "beq 3f\n\t"
  7891. #else
  7892. "beq.n 3f\n\t"
  7893. #endif /* __GNUC__ */
  7894. "mov r6, r9\n\t"
  7895. "add r6, r6, r10\n\t"
  7896. "cmp %[a], r6\n\t"
  7897. #ifdef __GNUC__
  7898. "ble 2b\n\t"
  7899. #else
  7900. "ble.n 2b\n\t"
  7901. #endif /* __GNUC__ */
  7902. "\n3:\n\t"
  7903. "mov %[r], r12\n\t"
  7904. "mov r8, r9\n\t"
  7905. "str r3, [%[r], r8]\n\t"
  7906. "mov r3, r4\n\t"
  7907. "mov r4, r5\n\t"
  7908. "add r8, r8, #4\n\t"
  7909. "mov r9, r8\n\t"
  7910. "mov r6, #1\n\t"
  7911. "lsl r6, r6, #8\n\t"
  7912. "add r6, r6, #120\n\t"
  7913. "cmp r8, r6\n\t"
  7914. #ifdef __GNUC__
  7915. "ble 1b\n\t"
  7916. #else
  7917. "ble.n 1b\n\t"
  7918. #endif /* __GNUC__ */
  7919. "str r3, [%[r], r8]\n\t"
  7920. "mov %[a], r10\n\t"
  7921. "mov %[b], r11\n\t"
  7922. :
  7923. : [r] "r" (tmp), [a] "r" (a), [b] "r" (b)
  7924. : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  7925. );
  7926. XMEMCPY(r, tmp_arr, sizeof(tmp_arr));
  7927. }
  7928. /* Square a and put result in r. (r = a * a)
  7929. *
  7930. * r A single precision integer.
  7931. * a A single precision integer.
  7932. */
  7933. SP_NOINLINE static void sp_3072_sqr_48(sp_digit* r, const sp_digit* a)
  7934. {
  7935. __asm__ __volatile__ (
  7936. "mov r3, #0\n\t"
  7937. "mov r4, #0\n\t"
  7938. "mov r5, #0\n\t"
  7939. "mov r9, r3\n\t"
  7940. "mov r12, %[r]\n\t"
  7941. "mov r6, #1\n\t"
  7942. "lsl r6, r6, #8\n\t"
  7943. "add r6, r6, #128\n\t"
  7944. "neg r6, r6\n\t"
  7945. "add sp, sp, r6\n\t"
  7946. "mov r11, sp\n\t"
  7947. "mov r10, %[a]\n\t"
  7948. "\n1:\n\t"
  7949. "mov %[r], #0\n\t"
  7950. "mov r6, #188\n\t"
  7951. "mov %[a], r9\n\t"
  7952. "subs %[a], %[a], r6\n\t"
  7953. "sbc r6, r6, r6\n\t"
  7954. "mvn r6, r6\n\t"
  7955. "and %[a], %[a], r6\n\t"
  7956. "mov r2, r9\n\t"
  7957. "sub r2, r2, %[a]\n\t"
  7958. "add %[a], %[a], r10\n\t"
  7959. "add r2, r2, r10\n\t"
  7960. "\n2:\n\t"
  7961. "cmp r2, %[a]\n\t"
  7962. #ifdef __GNUC__
  7963. "beq 4f\n\t"
  7964. #else
  7965. "beq.n 4f\n\t"
  7966. #endif /* __GNUC__ */
  7967. /* Multiply * 2: Start */
  7968. "ldr r6, [%[a]]\n\t"
  7969. "ldr r8, [r2]\n\t"
  7970. "umull r6, r8, r6, r8\n\t"
  7971. "adds r3, r3, r6\n\t"
  7972. "adcs r4, r4, r8\n\t"
  7973. "adc r5, r5, %[r]\n\t"
  7974. "adds r3, r3, r6\n\t"
  7975. "adcs r4, r4, r8\n\t"
  7976. "adc r5, r5, %[r]\n\t"
  7977. /* Multiply * 2: Done */
  7978. #ifdef __GNUC__
  7979. "bal 5f\n\t"
  7980. #else
  7981. "bal.n 5f\n\t"
  7982. #endif /* __GNUC__ */
  7983. "\n4:\n\t"
  7984. /* Square: Start */
  7985. "ldr r6, [%[a]]\n\t"
  7986. "umull r6, r8, r6, r6\n\t"
  7987. "adds r3, r3, r6\n\t"
  7988. "adcs r4, r4, r8\n\t"
  7989. "adc r5, r5, %[r]\n\t"
  7990. /* Square: Done */
  7991. "\n5:\n\t"
  7992. "add %[a], %[a], #4\n\t"
  7993. "sub r2, r2, #4\n\t"
  7994. "mov r6, #192\n\t"
  7995. "add r6, r6, r10\n\t"
  7996. "cmp %[a], r6\n\t"
  7997. #ifdef __GNUC__
  7998. "beq 3f\n\t"
  7999. #else
  8000. "beq.n 3f\n\t"
  8001. #endif /* __GNUC__ */
  8002. "cmp %[a], r2\n\t"
  8003. #ifdef __GNUC__
  8004. "bgt 3f\n\t"
  8005. #else
  8006. "bgt.n 3f\n\t"
  8007. #endif /* __GNUC__ */
  8008. "mov r8, r9\n\t"
  8009. "add r8, r8, r10\n\t"
  8010. "cmp %[a], r8\n\t"
  8011. #ifdef __GNUC__
  8012. "ble 2b\n\t"
  8013. #else
  8014. "ble.n 2b\n\t"
  8015. #endif /* __GNUC__ */
  8016. "\n3:\n\t"
  8017. "mov %[r], r11\n\t"
  8018. "mov r8, r9\n\t"
  8019. "str r3, [%[r], r8]\n\t"
  8020. "mov r3, r4\n\t"
  8021. "mov r4, r5\n\t"
  8022. "mov r5, #0\n\t"
  8023. "add r8, r8, #4\n\t"
  8024. "mov r9, r8\n\t"
  8025. "mov r6, #1\n\t"
  8026. "lsl r6, r6, #8\n\t"
  8027. "add r6, r6, #120\n\t"
  8028. "cmp r8, r6\n\t"
  8029. #ifdef __GNUC__
  8030. "ble 1b\n\t"
  8031. #else
  8032. "ble.n 1b\n\t"
  8033. #endif /* __GNUC__ */
  8034. "mov %[a], r10\n\t"
  8035. "str r3, [%[r], r8]\n\t"
  8036. "mov %[r], r12\n\t"
  8037. "mov %[a], r11\n\t"
  8038. "mov r3, #1\n\t"
  8039. "lsl r3, r3, #8\n\t"
  8040. "add r3, r3, #124\n\t"
  8041. "\n4:\n\t"
  8042. "ldr r6, [%[a], r3]\n\t"
  8043. "str r6, [%[r], r3]\n\t"
  8044. "subs r3, r3, #4\n\t"
  8045. #ifdef __GNUC__
  8046. "bge 4b\n\t"
  8047. #else
  8048. "bge.n 4b\n\t"
  8049. #endif /* __GNUC__ */
  8050. "mov r6, #1\n\t"
  8051. "lsl r6, r6, #8\n\t"
  8052. "add r6, r6, #128\n\t"
  8053. "add sp, sp, r6\n\t"
  8054. :
  8055. : [r] "r" (r), [a] "r" (a)
  8056. : "memory", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12"
  8057. );
  8058. }
  8059. #endif /* WOLFSSL_SP_SMALL */
  8060. #endif /* (WOLFSSL_HAVE_SP_RSA & !WOLFSSL_RSA_PUBLIC_ONLY) | WOLFSSL_HAVE_SP_DH */
  8061. /* Caclulate the bottom digit of -1/a mod 2^n.
  8062. *
  8063. * a A single precision number.
  8064. * rho Bottom word of inverse.
  8065. */
  8066. static void sp_3072_mont_setup(const sp_digit* a, sp_digit* rho)
  8067. {
  8068. sp_digit x;
  8069. sp_digit b;
  8070. b = a[0];
  8071. x = (((b + 2) & 4) << 1) + b; /* here x*a==1 mod 2**4 */
  8072. x *= 2 - b * x; /* here x*a==1 mod 2**8 */
  8073. x *= 2 - b * x; /* here x*a==1 mod 2**16 */
  8074. x *= 2 - b * x; /* here x*a==1 mod 2**32 */
  8075. /* rho = -1/m mod b */
  8076. *rho = (sp_digit)0 - x;
  8077. }
  8078. /* Mul a by digit b into r. (r = a * b)
  8079. *
  8080. * r A single precision integer.
  8081. * a A single precision integer.
  8082. * b A single precision digit.
  8083. */
  8084. SP_NOINLINE static void sp_3072_mul_d_96(sp_digit* r, const sp_digit* a,
  8085. sp_digit b)
  8086. {
  8087. __asm__ __volatile__ (
  8088. "add r9, %[a], #384\n\t"
  8089. /* A[0] * B */
  8090. "ldr r6, [%[a]], #4\n\t"
  8091. "umull r5, r3, r6, %[b]\n\t"
  8092. "mov r4, #0\n\t"
  8093. "str r5, [%[r]], #4\n\t"
  8094. /* A[0] * B - Done */
  8095. "\n1:\n\t"
  8096. "mov r5, #0\n\t"
  8097. /* A[] * B */
  8098. "ldr r6, [%[a]], #4\n\t"
  8099. "umull r6, r8, r6, %[b]\n\t"
  8100. "adds r3, r3, r6\n\t"
  8101. "adcs r4, r4, r8\n\t"
  8102. "adc r5, r5, #0\n\t"
  8103. /* A[] * B - Done */
  8104. "str r3, [%[r]], #4\n\t"
  8105. "mov r3, r4\n\t"
  8106. "mov r4, r5\n\t"
  8107. "cmp %[a], r9\n\t"
  8108. #ifdef __GNUC__
  8109. "blt 1b\n\t"
  8110. #else
  8111. "blt.n 1b\n\t"
  8112. #endif /* __GNUC__ */
  8113. "str r3, [%[r]]\n\t"
  8114. : [r] "+r" (r), [a] "+r" (a)
  8115. : [b] "r" (b)
  8116. : "memory", "r3", "r4", "r5", "r6", "r8", "r9"
  8117. );
  8118. }
  8119. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || defined(WOLFSSL_HAVE_SP_DH)
  8120. /* r = 2^n mod m where n is the number of bits to reduce by.
  8121. * Given m must be 3072 bits, just need to subtract.
  8122. *
  8123. * r A single precision number.
  8124. * m A single precision number.
  8125. */
  8126. static void sp_3072_mont_norm_48(sp_digit* r, const sp_digit* m)
  8127. {
  8128. XMEMSET(r, 0, sizeof(sp_digit) * 48);
  8129. /* r = 2^n mod m */
  8130. sp_3072_sub_in_place_48(r, m);
  8131. }
  8132. /* Conditionally subtract b from a using the mask m.
  8133. * m is -1 to subtract and 0 when not copying.
  8134. *
  8135. * r A single precision number representing condition subtract result.
  8136. * a A single precision number to subtract from.
  8137. * b A single precision number to subtract.
  8138. * m Mask value to apply.
  8139. */
  8140. SP_NOINLINE static sp_digit sp_3072_cond_sub_48(sp_digit* r, const sp_digit* a,
  8141. const sp_digit* b, sp_digit m)
  8142. {
  8143. sp_digit c = 0;
  8144. __asm__ __volatile__ (
  8145. "mov r5, #192\n\t"
  8146. "mov r9, r5\n\t"
  8147. "mov r8, #0\n\t"
  8148. "\n1:\n\t"
  8149. "ldr r6, [%[b], r8]\n\t"
  8150. "and r6, r6, %[m]\n\t"
  8151. "mov r5, #0\n\t"
  8152. "subs r5, r5, %[c]\n\t"
  8153. "ldr r5, [%[a], r8]\n\t"
  8154. "sbcs r5, r5, r6\n\t"
  8155. "sbcs %[c], %[c], %[c]\n\t"
  8156. "str r5, [%[r], r8]\n\t"
  8157. "add r8, r8, #4\n\t"
  8158. "cmp r8, r9\n\t"
  8159. #ifdef __GNUC__
  8160. "blt 1b\n\t"
  8161. #else
  8162. "blt.n 1b\n\t"
  8163. #endif /* __GNUC__ */
  8164. : [c] "+r" (c)
  8165. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  8166. : "memory", "r5", "r6", "r8", "r9"
  8167. );
  8168. return c;
  8169. }
  8170. /* Reduce the number back to 3072 bits using Montgomery reduction.
  8171. *
  8172. * a A single precision number to reduce in place.
  8173. * m The single precision number representing the modulus.
  8174. * mp The digit representing the negative inverse of m mod 2^n.
  8175. */
  8176. SP_NOINLINE static void sp_3072_mont_reduce_48(sp_digit* a, const sp_digit* m,
  8177. sp_digit mp)
  8178. {
  8179. sp_digit ca = 0;
  8180. __asm__ __volatile__ (
  8181. "mov r9, %[mp]\n\t"
  8182. "mov r12, %[m]\n\t"
  8183. "mov r10, %[a]\n\t"
  8184. "mov r4, #0\n\t"
  8185. "add r11, r10, #192\n\t"
  8186. "\n1:\n\t"
  8187. /* mu = a[i] * mp */
  8188. "mov %[mp], r9\n\t"
  8189. "ldr %[a], [r10]\n\t"
  8190. "mul %[mp], %[mp], %[a]\n\t"
  8191. "mov %[m], r12\n\t"
  8192. "add r14, r10, #184\n\t"
  8193. "\n2:\n\t"
  8194. /* a[i+j] += m[j] * mu */
  8195. "ldr %[a], [r10]\n\t"
  8196. "mov r5, #0\n\t"
  8197. /* Multiply m[j] and mu - Start */
  8198. "ldr r8, [%[m]], #4\n\t"
  8199. "umull r6, r8, %[mp], r8\n\t"
  8200. "adds %[a], %[a], r6\n\t"
  8201. "adc r5, r5, r8\n\t"
  8202. /* Multiply m[j] and mu - Done */
  8203. "adds r4, r4, %[a]\n\t"
  8204. "adc r5, r5, #0\n\t"
  8205. "str r4, [r10], #4\n\t"
  8206. /* a[i+j+1] += m[j+1] * mu */
  8207. "ldr %[a], [r10]\n\t"
  8208. "mov r4, #0\n\t"
  8209. /* Multiply m[j] and mu - Start */
  8210. "ldr r8, [%[m]], #4\n\t"
  8211. "umull r6, r8, %[mp], r8\n\t"
  8212. "adds %[a], %[a], r6\n\t"
  8213. "adc r4, r4, r8\n\t"
  8214. /* Multiply m[j] and mu - Done */
  8215. "adds r5, r5, %[a]\n\t"
  8216. "adc r4, r4, #0\n\t"
  8217. "str r5, [r10], #4\n\t"
  8218. "cmp r10, r14\n\t"
  8219. #ifdef __GNUC__
  8220. "blt 2b\n\t"
  8221. #else
  8222. "blt.n 2b\n\t"
  8223. #endif /* __GNUC__ */
  8224. /* a[i+46] += m[46] * mu */
  8225. "ldr %[a], [r10]\n\t"
  8226. "mov r5, #0\n\t"
  8227. /* Multiply m[j] and mu - Start */
  8228. "ldr r8, [%[m]], #4\n\t"
  8229. "umull r6, r8, %[mp], r8\n\t"
  8230. "adds %[a], %[a], r6\n\t"
  8231. "adc r5, r5, r8\n\t"
  8232. /* Multiply m[j] and mu - Done */
  8233. "adds r4, r4, %[a]\n\t"
  8234. "adc r5, r5, #0\n\t"
  8235. "str r4, [r10], #4\n\t"
  8236. /* a[i+47] += m[47] * mu */
  8237. "mov r4, %[ca]\n\t"
  8238. "mov %[ca], #0\n\t"
  8239. /* Multiply m[47] and mu - Start */
  8240. "ldr r8, [%[m]]\n\t"
  8241. "umull r6, r8, %[mp], r8\n\t"
  8242. "adds r5, r5, r6\n\t"
  8243. "adcs r4, r4, r8\n\t"
  8244. "adc %[ca], %[ca], #0\n\t"
  8245. /* Multiply m[47] and mu - Done */
  8246. "ldr r6, [r10]\n\t"
  8247. "ldr r8, [r10, #4]\n\t"
  8248. "adds r6, r6, r5\n\t"
  8249. "adcs r8, r8, r4\n\t"
  8250. "adc %[ca], %[ca], #0\n\t"
  8251. "str r6, [r10]\n\t"
  8252. "str r8, [r10, #4]\n\t"
  8253. /* Next word in a */
  8254. "sub r10, r10, #184\n\t"
  8255. "cmp r10, r11\n\t"
  8256. #ifdef __GNUC__
  8257. "blt 1b\n\t"
  8258. #else
  8259. "blt.n 1b\n\t"
  8260. #endif /* __GNUC__ */
  8261. "mov %[a], r10\n\t"
  8262. "mov %[m], r12\n\t"
  8263. : [ca] "+r" (ca), [a] "+r" (a)
  8264. : [m] "r" (m), [mp] "r" (mp)
  8265. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  8266. );
  8267. sp_3072_cond_sub_48(a - 48, a, m, (sp_digit)0 - ca);
  8268. }
  8269. /* Multiply two Montgomery form numbers mod the modulus (prime).
  8270. * (r = a * b mod m)
  8271. *
  8272. * r Result of multiplication.
  8273. * a First number to multiply in Montgomery form.
  8274. * b Second number to multiply in Montgomery form.
  8275. * m Modulus (prime).
  8276. * mp Montgomery mulitplier.
  8277. */
  8278. SP_NOINLINE static void sp_3072_mont_mul_48(sp_digit* r, const sp_digit* a,
  8279. const sp_digit* b, const sp_digit* m, sp_digit mp)
  8280. {
  8281. sp_3072_mul_48(r, a, b);
  8282. sp_3072_mont_reduce_48(r, m, mp);
  8283. }
  8284. /* Square the Montgomery form number. (r = a * a mod m)
  8285. *
  8286. * r Result of squaring.
  8287. * a Number to square in Montgomery form.
  8288. * m Modulus (prime).
  8289. * mp Montgomery mulitplier.
  8290. */
  8291. SP_NOINLINE static void sp_3072_mont_sqr_48(sp_digit* r, const sp_digit* a,
  8292. const sp_digit* m, sp_digit mp)
  8293. {
  8294. sp_3072_sqr_48(r, a);
  8295. sp_3072_mont_reduce_48(r, m, mp);
  8296. }
  8297. /* Mul a by digit b into r. (r = a * b)
  8298. *
  8299. * r A single precision integer.
  8300. * a A single precision integer.
  8301. * b A single precision digit.
  8302. */
  8303. SP_NOINLINE static void sp_3072_mul_d_48(sp_digit* r, const sp_digit* a,
  8304. sp_digit b)
  8305. {
  8306. __asm__ __volatile__ (
  8307. "add r9, %[a], #192\n\t"
  8308. /* A[0] * B */
  8309. "ldr r6, [%[a]], #4\n\t"
  8310. "umull r5, r3, r6, %[b]\n\t"
  8311. "mov r4, #0\n\t"
  8312. "str r5, [%[r]], #4\n\t"
  8313. /* A[0] * B - Done */
  8314. "\n1:\n\t"
  8315. "mov r5, #0\n\t"
  8316. /* A[] * B */
  8317. "ldr r6, [%[a]], #4\n\t"
  8318. "umull r6, r8, r6, %[b]\n\t"
  8319. "adds r3, r3, r6\n\t"
  8320. "adcs r4, r4, r8\n\t"
  8321. "adc r5, r5, #0\n\t"
  8322. /* A[] * B - Done */
  8323. "str r3, [%[r]], #4\n\t"
  8324. "mov r3, r4\n\t"
  8325. "mov r4, r5\n\t"
  8326. "cmp %[a], r9\n\t"
  8327. #ifdef __GNUC__
  8328. "blt 1b\n\t"
  8329. #else
  8330. "blt.n 1b\n\t"
  8331. #endif /* __GNUC__ */
  8332. "str r3, [%[r]]\n\t"
  8333. : [r] "+r" (r), [a] "+r" (a)
  8334. : [b] "r" (b)
  8335. : "memory", "r3", "r4", "r5", "r6", "r8", "r9"
  8336. );
  8337. }
  8338. /* Divide the double width number (d1|d0) by the divisor. (d1|d0 / div)
  8339. *
  8340. * d1 The high order half of the number to divide.
  8341. * d0 The low order half of the number to divide.
  8342. * div The divisor.
  8343. * returns the result of the division.
  8344. *
  8345. * Note that this is an approximate div. It may give an answer 1 larger.
  8346. */
  8347. SP_NOINLINE static sp_digit div_3072_word_48(sp_digit d1, sp_digit d0,
  8348. sp_digit div)
  8349. {
  8350. sp_digit r = 0;
  8351. __asm__ __volatile__ (
  8352. "lsr r6, %[div], #16\n\t"
  8353. "add r6, r6, #1\n\t"
  8354. "udiv r4, %[d1], r6\n\t"
  8355. "lsl r8, r4, #16\n\t"
  8356. "umull r4, r5, %[div], r8\n\t"
  8357. "subs %[d0], %[d0], r4\n\t"
  8358. "sbc %[d1], %[d1], r5\n\t"
  8359. "udiv r5, %[d1], r6\n\t"
  8360. "lsl r4, r5, #16\n\t"
  8361. "add r8, r8, r4\n\t"
  8362. "umull r4, r5, %[div], r4\n\t"
  8363. "subs %[d0], %[d0], r4\n\t"
  8364. "sbc %[d1], %[d1], r5\n\t"
  8365. "lsl r4, %[d1], #16\n\t"
  8366. "orr r4, r4, %[d0], lsr #16\n\t"
  8367. "udiv r4, r4, r6\n\t"
  8368. "add r8, r8, r4\n\t"
  8369. "umull r4, r5, %[div], r4\n\t"
  8370. "subs %[d0], %[d0], r4\n\t"
  8371. "sbc %[d1], %[d1], r5\n\t"
  8372. "lsl r4, %[d1], #16\n\t"
  8373. "orr r4, r4, %[d0], lsr #16\n\t"
  8374. "udiv r4, r4, r6\n\t"
  8375. "add r8, r8, r4\n\t"
  8376. "umull r4, r5, %[div], r4\n\t"
  8377. "subs %[d0], %[d0], r4\n\t"
  8378. "sbc %[d1], %[d1], r5\n\t"
  8379. "udiv r4, %[d0], %[div]\n\t"
  8380. "add r8, r8, r4\n\t"
  8381. "mov %[r], r8\n\t"
  8382. : [r] "+r" (r)
  8383. : [d1] "r" (d1), [d0] "r" (d0), [div] "r" (div)
  8384. : "r4", "r5", "r6", "r8"
  8385. );
  8386. return r;
  8387. }
  8388. /* Compare a with b in constant time.
  8389. *
  8390. * a A single precision integer.
  8391. * b A single precision integer.
  8392. * return -ve, 0 or +ve if a is less than, equal to or greater than b
  8393. * respectively.
  8394. */
  8395. SP_NOINLINE static sp_int32 sp_3072_cmp_48(const sp_digit* a, const sp_digit* b)
  8396. {
  8397. sp_digit r = 0;
  8398. __asm__ __volatile__ (
  8399. "mov r3, #0\n\t"
  8400. "mvn r3, r3\n\t"
  8401. "mov r6, #188\n\t"
  8402. "\n1:\n\t"
  8403. "ldr r8, [%[a], r6]\n\t"
  8404. "ldr r5, [%[b], r6]\n\t"
  8405. "and r8, r8, r3\n\t"
  8406. "and r5, r5, r3\n\t"
  8407. "mov r4, r8\n\t"
  8408. "subs r8, r8, r5\n\t"
  8409. "sbc r8, r8, r8\n\t"
  8410. "add %[r], %[r], r8\n\t"
  8411. "mvn r8, r8\n\t"
  8412. "and r3, r3, r8\n\t"
  8413. "subs r5, r5, r4\n\t"
  8414. "sbc r8, r8, r8\n\t"
  8415. "sub %[r], %[r], r8\n\t"
  8416. "mvn r8, r8\n\t"
  8417. "and r3, r3, r8\n\t"
  8418. "sub r6, r6, #4\n\t"
  8419. "cmp r6, #0\n\t"
  8420. #ifdef __GNUC__
  8421. "bge 1b\n\t"
  8422. #else
  8423. "bge.n 1b\n\t"
  8424. #endif /* __GNUC__ */
  8425. : [r] "+r" (r)
  8426. : [a] "r" (a), [b] "r" (b)
  8427. : "r3", "r4", "r5", "r6", "r8"
  8428. );
  8429. return r;
  8430. }
  8431. /* Divide d in a and put remainder into r (m*d + r = a)
  8432. * m is not calculated as it is not needed at this time.
  8433. *
  8434. * a Number to be divided.
  8435. * d Number to divide with.
  8436. * m Multiplier result.
  8437. * r Remainder from the division.
  8438. * returns MP_OKAY indicating success.
  8439. */
  8440. static WC_INLINE int sp_3072_div_48(const sp_digit* a, const sp_digit* d, sp_digit* m,
  8441. sp_digit* r)
  8442. {
  8443. sp_digit t1[96], t2[49];
  8444. sp_digit div, r1;
  8445. int i;
  8446. (void)m;
  8447. div = d[47];
  8448. XMEMCPY(t1, a, sizeof(*t1) * 2 * 48);
  8449. r1 = sp_3072_cmp_48(&t1[48], d) >= 0;
  8450. sp_3072_cond_sub_48(&t1[48], &t1[48], d, (sp_digit)0 - r1);
  8451. for (i = 47; i >= 0; i--) {
  8452. sp_digit mask = 0 - (t1[48 + i] == div);
  8453. sp_digit hi = t1[48 + i] + mask;
  8454. r1 = div_3072_word_48(hi, t1[48 + i - 1], div);
  8455. r1 |= mask;
  8456. sp_3072_mul_d_48(t2, d, r1);
  8457. t1[48 + i] += sp_3072_sub_in_place_48(&t1[i], t2);
  8458. t1[48 + i] -= t2[48];
  8459. sp_3072_mask_48(t2, d, t1[48 + i]);
  8460. t1[48 + i] += sp_3072_add_48(&t1[i], &t1[i], t2);
  8461. sp_3072_mask_48(t2, d, t1[48 + i]);
  8462. t1[48 + i] += sp_3072_add_48(&t1[i], &t1[i], t2);
  8463. }
  8464. r1 = sp_3072_cmp_48(t1, d) >= 0;
  8465. sp_3072_cond_sub_48(r, t1, d, (sp_digit)0 - r1);
  8466. return MP_OKAY;
  8467. }
  8468. /* Reduce a modulo m into r. (r = a mod m)
  8469. *
  8470. * r A single precision number that is the reduced result.
  8471. * a A single precision number that is to be reduced.
  8472. * m A single precision number that is the modulus to reduce with.
  8473. * returns MP_OKAY indicating success.
  8474. */
  8475. static WC_INLINE int sp_3072_mod_48(sp_digit* r, const sp_digit* a, const sp_digit* m)
  8476. {
  8477. return sp_3072_div_48(a, m, NULL, r);
  8478. }
  8479. #ifdef WOLFSSL_SP_SMALL
  8480. /* Modular exponentiate a to the e mod m. (r = a^e mod m)
  8481. *
  8482. * r A single precision number that is the result of the operation.
  8483. * a A single precision number being exponentiated.
  8484. * e A single precision number that is the exponent.
  8485. * bits The number of bits in the exponent.
  8486. * m A single precision number that is the modulus.
  8487. * returns 0 on success.
  8488. * returns MEMORY_E on dynamic memory allocation failure.
  8489. * returns MP_VAL when base is even or exponent is 0.
  8490. */
  8491. static int sp_3072_mod_exp_48(sp_digit* r, const sp_digit* a, const sp_digit* e,
  8492. int bits, const sp_digit* m, int reduceA)
  8493. {
  8494. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  8495. sp_digit* td = NULL;
  8496. #else
  8497. sp_digit td[16 * 96];
  8498. #endif
  8499. sp_digit* t[16];
  8500. sp_digit* norm = NULL;
  8501. sp_digit mp = 1;
  8502. sp_digit n;
  8503. sp_digit mask;
  8504. int i;
  8505. int c;
  8506. byte y;
  8507. int err = MP_OKAY;
  8508. if (bits == 0) {
  8509. err = MP_VAL;
  8510. }
  8511. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  8512. if (err == MP_OKAY) {
  8513. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * (16 * 96), NULL,
  8514. DYNAMIC_TYPE_TMP_BUFFER);
  8515. if (td == NULL)
  8516. err = MEMORY_E;
  8517. }
  8518. #endif
  8519. if (err == MP_OKAY) {
  8520. norm = td;
  8521. for (i=0; i<16; i++) {
  8522. t[i] = td + i * 96;
  8523. }
  8524. sp_3072_mont_setup(m, &mp);
  8525. sp_3072_mont_norm_48(norm, m);
  8526. XMEMSET(t[1], 0, sizeof(sp_digit) * 48U);
  8527. if (reduceA != 0) {
  8528. err = sp_3072_mod_48(t[1] + 48, a, m);
  8529. if (err == MP_OKAY) {
  8530. err = sp_3072_mod_48(t[1], t[1], m);
  8531. }
  8532. }
  8533. else {
  8534. XMEMCPY(t[1] + 48, a, sizeof(sp_digit) * 48);
  8535. err = sp_3072_mod_48(t[1], t[1], m);
  8536. }
  8537. }
  8538. if (err == MP_OKAY) {
  8539. sp_3072_mont_sqr_48(t[ 2], t[ 1], m, mp);
  8540. sp_3072_mont_mul_48(t[ 3], t[ 2], t[ 1], m, mp);
  8541. sp_3072_mont_sqr_48(t[ 4], t[ 2], m, mp);
  8542. sp_3072_mont_mul_48(t[ 5], t[ 3], t[ 2], m, mp);
  8543. sp_3072_mont_sqr_48(t[ 6], t[ 3], m, mp);
  8544. sp_3072_mont_mul_48(t[ 7], t[ 4], t[ 3], m, mp);
  8545. sp_3072_mont_sqr_48(t[ 8], t[ 4], m, mp);
  8546. sp_3072_mont_mul_48(t[ 9], t[ 5], t[ 4], m, mp);
  8547. sp_3072_mont_sqr_48(t[10], t[ 5], m, mp);
  8548. sp_3072_mont_mul_48(t[11], t[ 6], t[ 5], m, mp);
  8549. sp_3072_mont_sqr_48(t[12], t[ 6], m, mp);
  8550. sp_3072_mont_mul_48(t[13], t[ 7], t[ 6], m, mp);
  8551. sp_3072_mont_sqr_48(t[14], t[ 7], m, mp);
  8552. sp_3072_mont_mul_48(t[15], t[ 8], t[ 7], m, mp);
  8553. i = (bits - 1) / 32;
  8554. n = e[i--];
  8555. c = bits & 31;
  8556. if (c == 0) {
  8557. c = 32;
  8558. }
  8559. c -= bits % 4;
  8560. if (c == 32) {
  8561. c = 28;
  8562. }
  8563. if (c < 0) {
  8564. /* Number of bits in top word is less than number needed. */
  8565. c = -c;
  8566. y = (byte)(n << c);
  8567. n = e[i--];
  8568. y |= (byte)(n >> (64 - c));
  8569. n <<= c;
  8570. c = 64 - c;
  8571. }
  8572. else if (c == 0) {
  8573. /* All bits in top word used. */
  8574. y = (byte)n;
  8575. }
  8576. else {
  8577. y = (byte)(n >> c);
  8578. n <<= 32 - c;
  8579. }
  8580. XMEMCPY(r, t[y], sizeof(sp_digit) * 48);
  8581. for (; i>=0 || c>=4; ) {
  8582. if (c == 0) {
  8583. n = e[i--];
  8584. y = (byte)(n >> 28);
  8585. n <<= 4;
  8586. c = 28;
  8587. }
  8588. else if (c < 4) {
  8589. y = (byte)(n >> 28);
  8590. n = e[i--];
  8591. c = 4 - c;
  8592. y |= (byte)(n >> (32 - c));
  8593. n <<= c;
  8594. c = 32 - c;
  8595. }
  8596. else {
  8597. y = (byte)((n >> 28) & 0xf);
  8598. n <<= 4;
  8599. c -= 4;
  8600. }
  8601. sp_3072_mont_sqr_48(r, r, m, mp);
  8602. sp_3072_mont_sqr_48(r, r, m, mp);
  8603. sp_3072_mont_sqr_48(r, r, m, mp);
  8604. sp_3072_mont_sqr_48(r, r, m, mp);
  8605. sp_3072_mont_mul_48(r, r, t[y], m, mp);
  8606. }
  8607. XMEMSET(&r[48], 0, sizeof(sp_digit) * 48U);
  8608. sp_3072_mont_reduce_48(r, m, mp);
  8609. mask = 0 - (sp_3072_cmp_48(r, m) >= 0);
  8610. sp_3072_cond_sub_48(r, r, m, mask);
  8611. }
  8612. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  8613. if (td != NULL)
  8614. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  8615. #endif
  8616. return err;
  8617. }
  8618. #else
  8619. /* Modular exponentiate a to the e mod m. (r = a^e mod m)
  8620. *
  8621. * r A single precision number that is the result of the operation.
  8622. * a A single precision number being exponentiated.
  8623. * e A single precision number that is the exponent.
  8624. * bits The number of bits in the exponent.
  8625. * m A single precision number that is the modulus.
  8626. * returns 0 on success.
  8627. * returns MEMORY_E on dynamic memory allocation failure.
  8628. * returns MP_VAL when base is even or exponent is 0.
  8629. */
  8630. static int sp_3072_mod_exp_48(sp_digit* r, const sp_digit* a, const sp_digit* e,
  8631. int bits, const sp_digit* m, int reduceA)
  8632. {
  8633. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  8634. sp_digit* td = NULL;
  8635. #else
  8636. sp_digit td[32 * 96];
  8637. #endif
  8638. sp_digit* t[32];
  8639. sp_digit* norm = NULL;
  8640. sp_digit mp = 1;
  8641. sp_digit n;
  8642. sp_digit mask;
  8643. int i;
  8644. int c;
  8645. byte y;
  8646. int err = MP_OKAY;
  8647. if (bits == 0) {
  8648. err = MP_VAL;
  8649. }
  8650. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  8651. if (err == MP_OKAY) {
  8652. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * (32 * 96), NULL,
  8653. DYNAMIC_TYPE_TMP_BUFFER);
  8654. if (td == NULL)
  8655. err = MEMORY_E;
  8656. }
  8657. #endif
  8658. if (err == MP_OKAY) {
  8659. norm = td;
  8660. for (i=0; i<32; i++) {
  8661. t[i] = td + i * 96;
  8662. }
  8663. sp_3072_mont_setup(m, &mp);
  8664. sp_3072_mont_norm_48(norm, m);
  8665. XMEMSET(t[1], 0, sizeof(sp_digit) * 48U);
  8666. if (reduceA != 0) {
  8667. err = sp_3072_mod_48(t[1] + 48, a, m);
  8668. if (err == MP_OKAY) {
  8669. err = sp_3072_mod_48(t[1], t[1], m);
  8670. }
  8671. }
  8672. else {
  8673. XMEMCPY(t[1] + 48, a, sizeof(sp_digit) * 48);
  8674. err = sp_3072_mod_48(t[1], t[1], m);
  8675. }
  8676. }
  8677. if (err == MP_OKAY) {
  8678. sp_3072_mont_sqr_48(t[ 2], t[ 1], m, mp);
  8679. sp_3072_mont_mul_48(t[ 3], t[ 2], t[ 1], m, mp);
  8680. sp_3072_mont_sqr_48(t[ 4], t[ 2], m, mp);
  8681. sp_3072_mont_mul_48(t[ 5], t[ 3], t[ 2], m, mp);
  8682. sp_3072_mont_sqr_48(t[ 6], t[ 3], m, mp);
  8683. sp_3072_mont_mul_48(t[ 7], t[ 4], t[ 3], m, mp);
  8684. sp_3072_mont_sqr_48(t[ 8], t[ 4], m, mp);
  8685. sp_3072_mont_mul_48(t[ 9], t[ 5], t[ 4], m, mp);
  8686. sp_3072_mont_sqr_48(t[10], t[ 5], m, mp);
  8687. sp_3072_mont_mul_48(t[11], t[ 6], t[ 5], m, mp);
  8688. sp_3072_mont_sqr_48(t[12], t[ 6], m, mp);
  8689. sp_3072_mont_mul_48(t[13], t[ 7], t[ 6], m, mp);
  8690. sp_3072_mont_sqr_48(t[14], t[ 7], m, mp);
  8691. sp_3072_mont_mul_48(t[15], t[ 8], t[ 7], m, mp);
  8692. sp_3072_mont_sqr_48(t[16], t[ 8], m, mp);
  8693. sp_3072_mont_mul_48(t[17], t[ 9], t[ 8], m, mp);
  8694. sp_3072_mont_sqr_48(t[18], t[ 9], m, mp);
  8695. sp_3072_mont_mul_48(t[19], t[10], t[ 9], m, mp);
  8696. sp_3072_mont_sqr_48(t[20], t[10], m, mp);
  8697. sp_3072_mont_mul_48(t[21], t[11], t[10], m, mp);
  8698. sp_3072_mont_sqr_48(t[22], t[11], m, mp);
  8699. sp_3072_mont_mul_48(t[23], t[12], t[11], m, mp);
  8700. sp_3072_mont_sqr_48(t[24], t[12], m, mp);
  8701. sp_3072_mont_mul_48(t[25], t[13], t[12], m, mp);
  8702. sp_3072_mont_sqr_48(t[26], t[13], m, mp);
  8703. sp_3072_mont_mul_48(t[27], t[14], t[13], m, mp);
  8704. sp_3072_mont_sqr_48(t[28], t[14], m, mp);
  8705. sp_3072_mont_mul_48(t[29], t[15], t[14], m, mp);
  8706. sp_3072_mont_sqr_48(t[30], t[15], m, mp);
  8707. sp_3072_mont_mul_48(t[31], t[16], t[15], m, mp);
  8708. i = (bits - 1) / 32;
  8709. n = e[i--];
  8710. c = bits & 31;
  8711. if (c == 0) {
  8712. c = 32;
  8713. }
  8714. c -= bits % 5;
  8715. if (c == 32) {
  8716. c = 27;
  8717. }
  8718. if (c < 0) {
  8719. /* Number of bits in top word is less than number needed. */
  8720. c = -c;
  8721. y = (byte)(n << c);
  8722. n = e[i--];
  8723. y |= (byte)(n >> (64 - c));
  8724. n <<= c;
  8725. c = 64 - c;
  8726. }
  8727. else if (c == 0) {
  8728. /* All bits in top word used. */
  8729. y = (byte)n;
  8730. }
  8731. else {
  8732. y = (byte)(n >> c);
  8733. n <<= 32 - c;
  8734. }
  8735. XMEMCPY(r, t[y], sizeof(sp_digit) * 48);
  8736. for (; i>=0 || c>=5; ) {
  8737. if (c == 0) {
  8738. n = e[i--];
  8739. y = (byte)(n >> 27);
  8740. n <<= 5;
  8741. c = 27;
  8742. }
  8743. else if (c < 5) {
  8744. y = (byte)(n >> 27);
  8745. n = e[i--];
  8746. c = 5 - c;
  8747. y |= (byte)(n >> (32 - c));
  8748. n <<= c;
  8749. c = 32 - c;
  8750. }
  8751. else {
  8752. y = (byte)((n >> 27) & 0x1f);
  8753. n <<= 5;
  8754. c -= 5;
  8755. }
  8756. sp_3072_mont_sqr_48(r, r, m, mp);
  8757. sp_3072_mont_sqr_48(r, r, m, mp);
  8758. sp_3072_mont_sqr_48(r, r, m, mp);
  8759. sp_3072_mont_sqr_48(r, r, m, mp);
  8760. sp_3072_mont_sqr_48(r, r, m, mp);
  8761. sp_3072_mont_mul_48(r, r, t[y], m, mp);
  8762. }
  8763. XMEMSET(&r[48], 0, sizeof(sp_digit) * 48U);
  8764. sp_3072_mont_reduce_48(r, m, mp);
  8765. mask = 0 - (sp_3072_cmp_48(r, m) >= 0);
  8766. sp_3072_cond_sub_48(r, r, m, mask);
  8767. }
  8768. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  8769. if (td != NULL)
  8770. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  8771. #endif
  8772. return err;
  8773. }
  8774. #endif /* WOLFSSL_SP_SMALL */
  8775. #endif /* (WOLFSSL_HAVE_SP_RSA & !WOLFSSL_RSA_PUBLIC_ONLY) | WOLFSSL_HAVE_SP_DH */
  8776. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || defined(WOLFSSL_HAVE_SP_DH)
  8777. /* r = 2^n mod m where n is the number of bits to reduce by.
  8778. * Given m must be 3072 bits, just need to subtract.
  8779. *
  8780. * r A single precision number.
  8781. * m A single precision number.
  8782. */
  8783. static void sp_3072_mont_norm_96(sp_digit* r, const sp_digit* m)
  8784. {
  8785. XMEMSET(r, 0, sizeof(sp_digit) * 96);
  8786. /* r = 2^n mod m */
  8787. sp_3072_sub_in_place_96(r, m);
  8788. }
  8789. #endif /* (WOLFSSL_HAVE_SP_RSA & !WOLFSSL_RSA_PUBLIC_ONLY) | WOLFSSL_HAVE_SP_DH */
  8790. /* Conditionally subtract b from a using the mask m.
  8791. * m is -1 to subtract and 0 when not copying.
  8792. *
  8793. * r A single precision number representing condition subtract result.
  8794. * a A single precision number to subtract from.
  8795. * b A single precision number to subtract.
  8796. * m Mask value to apply.
  8797. */
  8798. SP_NOINLINE static sp_digit sp_3072_cond_sub_96(sp_digit* r, const sp_digit* a,
  8799. const sp_digit* b, sp_digit m)
  8800. {
  8801. sp_digit c = 0;
  8802. __asm__ __volatile__ (
  8803. "mov r5, #1\n\t"
  8804. "lsl r5, r5, #8\n\t"
  8805. "add r5, r5, #128\n\t"
  8806. "mov r9, r5\n\t"
  8807. "mov r8, #0\n\t"
  8808. "\n1:\n\t"
  8809. "ldr r6, [%[b], r8]\n\t"
  8810. "and r6, r6, %[m]\n\t"
  8811. "mov r5, #0\n\t"
  8812. "subs r5, r5, %[c]\n\t"
  8813. "ldr r5, [%[a], r8]\n\t"
  8814. "sbcs r5, r5, r6\n\t"
  8815. "sbcs %[c], %[c], %[c]\n\t"
  8816. "str r5, [%[r], r8]\n\t"
  8817. "add r8, r8, #4\n\t"
  8818. "cmp r8, r9\n\t"
  8819. #ifdef __GNUC__
  8820. "blt 1b\n\t"
  8821. #else
  8822. "blt.n 1b\n\t"
  8823. #endif /* __GNUC__ */
  8824. : [c] "+r" (c)
  8825. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  8826. : "memory", "r5", "r6", "r8", "r9"
  8827. );
  8828. return c;
  8829. }
  8830. /* Reduce the number back to 3072 bits using Montgomery reduction.
  8831. *
  8832. * a A single precision number to reduce in place.
  8833. * m The single precision number representing the modulus.
  8834. * mp The digit representing the negative inverse of m mod 2^n.
  8835. */
  8836. SP_NOINLINE static void sp_3072_mont_reduce_96(sp_digit* a, const sp_digit* m,
  8837. sp_digit mp)
  8838. {
  8839. sp_digit ca = 0;
  8840. __asm__ __volatile__ (
  8841. "mov r9, %[mp]\n\t"
  8842. "mov r12, %[m]\n\t"
  8843. "mov r10, %[a]\n\t"
  8844. "mov r4, #0\n\t"
  8845. "add r11, r10, #384\n\t"
  8846. "\n1:\n\t"
  8847. /* mu = a[i] * mp */
  8848. "mov %[mp], r9\n\t"
  8849. "ldr %[a], [r10]\n\t"
  8850. "mul %[mp], %[mp], %[a]\n\t"
  8851. "mov %[m], r12\n\t"
  8852. "add r14, r10, #376\n\t"
  8853. "\n2:\n\t"
  8854. /* a[i+j] += m[j] * mu */
  8855. "ldr %[a], [r10]\n\t"
  8856. "mov r5, #0\n\t"
  8857. /* Multiply m[j] and mu - Start */
  8858. "ldr r8, [%[m]], #4\n\t"
  8859. "umull r6, r8, %[mp], r8\n\t"
  8860. "adds %[a], %[a], r6\n\t"
  8861. "adc r5, r5, r8\n\t"
  8862. /* Multiply m[j] and mu - Done */
  8863. "adds r4, r4, %[a]\n\t"
  8864. "adc r5, r5, #0\n\t"
  8865. "str r4, [r10], #4\n\t"
  8866. /* a[i+j+1] += m[j+1] * mu */
  8867. "ldr %[a], [r10]\n\t"
  8868. "mov r4, #0\n\t"
  8869. /* Multiply m[j] and mu - Start */
  8870. "ldr r8, [%[m]], #4\n\t"
  8871. "umull r6, r8, %[mp], r8\n\t"
  8872. "adds %[a], %[a], r6\n\t"
  8873. "adc r4, r4, r8\n\t"
  8874. /* Multiply m[j] and mu - Done */
  8875. "adds r5, r5, %[a]\n\t"
  8876. "adc r4, r4, #0\n\t"
  8877. "str r5, [r10], #4\n\t"
  8878. "cmp r10, r14\n\t"
  8879. #ifdef __GNUC__
  8880. "blt 2b\n\t"
  8881. #else
  8882. "blt.n 2b\n\t"
  8883. #endif /* __GNUC__ */
  8884. /* a[i+94] += m[94] * mu */
  8885. "ldr %[a], [r10]\n\t"
  8886. "mov r5, #0\n\t"
  8887. /* Multiply m[j] and mu - Start */
  8888. "ldr r8, [%[m]], #4\n\t"
  8889. "umull r6, r8, %[mp], r8\n\t"
  8890. "adds %[a], %[a], r6\n\t"
  8891. "adc r5, r5, r8\n\t"
  8892. /* Multiply m[j] and mu - Done */
  8893. "adds r4, r4, %[a]\n\t"
  8894. "adc r5, r5, #0\n\t"
  8895. "str r4, [r10], #4\n\t"
  8896. /* a[i+95] += m[95] * mu */
  8897. "mov r4, %[ca]\n\t"
  8898. "mov %[ca], #0\n\t"
  8899. /* Multiply m[95] and mu - Start */
  8900. "ldr r8, [%[m]]\n\t"
  8901. "umull r6, r8, %[mp], r8\n\t"
  8902. "adds r5, r5, r6\n\t"
  8903. "adcs r4, r4, r8\n\t"
  8904. "adc %[ca], %[ca], #0\n\t"
  8905. /* Multiply m[95] and mu - Done */
  8906. "ldr r6, [r10]\n\t"
  8907. "ldr r8, [r10, #4]\n\t"
  8908. "adds r6, r6, r5\n\t"
  8909. "adcs r8, r8, r4\n\t"
  8910. "adc %[ca], %[ca], #0\n\t"
  8911. "str r6, [r10]\n\t"
  8912. "str r8, [r10, #4]\n\t"
  8913. /* Next word in a */
  8914. "sub r10, r10, #376\n\t"
  8915. "cmp r10, r11\n\t"
  8916. #ifdef __GNUC__
  8917. "blt 1b\n\t"
  8918. #else
  8919. "blt.n 1b\n\t"
  8920. #endif /* __GNUC__ */
  8921. "mov %[a], r10\n\t"
  8922. "mov %[m], r12\n\t"
  8923. : [ca] "+r" (ca), [a] "+r" (a)
  8924. : [m] "r" (m), [mp] "r" (mp)
  8925. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  8926. );
  8927. sp_3072_cond_sub_96(a - 96, a, m, (sp_digit)0 - ca);
  8928. }
  8929. /* Multiply two Montgomery form numbers mod the modulus (prime).
  8930. * (r = a * b mod m)
  8931. *
  8932. * r Result of multiplication.
  8933. * a First number to multiply in Montgomery form.
  8934. * b Second number to multiply in Montgomery form.
  8935. * m Modulus (prime).
  8936. * mp Montgomery mulitplier.
  8937. */
  8938. SP_NOINLINE static void sp_3072_mont_mul_96(sp_digit* r, const sp_digit* a,
  8939. const sp_digit* b, const sp_digit* m, sp_digit mp)
  8940. {
  8941. sp_3072_mul_96(r, a, b);
  8942. sp_3072_mont_reduce_96(r, m, mp);
  8943. }
  8944. /* Square the Montgomery form number. (r = a * a mod m)
  8945. *
  8946. * r Result of squaring.
  8947. * a Number to square in Montgomery form.
  8948. * m Modulus (prime).
  8949. * mp Montgomery mulitplier.
  8950. */
  8951. SP_NOINLINE static void sp_3072_mont_sqr_96(sp_digit* r, const sp_digit* a,
  8952. const sp_digit* m, sp_digit mp)
  8953. {
  8954. sp_3072_sqr_96(r, a);
  8955. sp_3072_mont_reduce_96(r, m, mp);
  8956. }
  8957. #ifdef WOLFSSL_SP_SMALL
  8958. /* Sub b from a into r. (r = a - b)
  8959. *
  8960. * r A single precision integer.
  8961. * a A single precision integer.
  8962. * b A single precision integer.
  8963. */
  8964. SP_NOINLINE static sp_digit sp_3072_sub_96(sp_digit* r, const sp_digit* a,
  8965. const sp_digit* b)
  8966. {
  8967. sp_digit c = 0;
  8968. __asm__ __volatile__ (
  8969. "mov r6, %[a]\n\t"
  8970. "mov r5, #1\n\t"
  8971. "lsl r5, r5, #8\n\t"
  8972. "add r5, r5, #128\n\t"
  8973. "add r6, r6, r5\n\t"
  8974. "\n1:\n\t"
  8975. "mov r5, #0\n\t"
  8976. "subs r5, r5, %[c]\n\t"
  8977. "ldr r4, [%[a]]\n\t"
  8978. "ldr r5, [%[b]]\n\t"
  8979. "sbcs r4, r4, r5\n\t"
  8980. "str r4, [%[r]]\n\t"
  8981. "sbc %[c], %[c], %[c]\n\t"
  8982. "add %[a], %[a], #4\n\t"
  8983. "add %[b], %[b], #4\n\t"
  8984. "add %[r], %[r], #4\n\t"
  8985. "cmp %[a], r6\n\t"
  8986. #ifdef __GNUC__
  8987. "bne 1b\n\t"
  8988. #else
  8989. "bne.n 1b\n\t"
  8990. #endif /* __GNUC__ */
  8991. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  8992. :
  8993. : "memory", "r4", "r5", "r6"
  8994. );
  8995. return c;
  8996. }
  8997. #else
  8998. /* Sub b from a into r. (r = a - b)
  8999. *
  9000. * r A single precision integer.
  9001. * a A single precision integer.
  9002. * b A single precision integer.
  9003. */
  9004. SP_NOINLINE static sp_digit sp_3072_sub_96(sp_digit* r, const sp_digit* a,
  9005. const sp_digit* b)
  9006. {
  9007. sp_digit c = 0;
  9008. __asm__ __volatile__ (
  9009. "ldm %[a]!, {r4, r5}\n\t"
  9010. "ldm %[b]!, {r6, r8}\n\t"
  9011. "subs r4, r4, r6\n\t"
  9012. "sbcs r5, r5, r8\n\t"
  9013. "stm %[r]!, {r4, r5}\n\t"
  9014. "ldm %[a]!, {r4, r5}\n\t"
  9015. "ldm %[b]!, {r6, r8}\n\t"
  9016. "sbcs r4, r4, r6\n\t"
  9017. "sbcs r5, r5, r8\n\t"
  9018. "stm %[r]!, {r4, r5}\n\t"
  9019. "ldm %[a]!, {r4, r5}\n\t"
  9020. "ldm %[b]!, {r6, r8}\n\t"
  9021. "sbcs r4, r4, r6\n\t"
  9022. "sbcs r5, r5, r8\n\t"
  9023. "stm %[r]!, {r4, r5}\n\t"
  9024. "ldm %[a]!, {r4, r5}\n\t"
  9025. "ldm %[b]!, {r6, r8}\n\t"
  9026. "sbcs r4, r4, r6\n\t"
  9027. "sbcs r5, r5, r8\n\t"
  9028. "stm %[r]!, {r4, r5}\n\t"
  9029. "ldm %[a]!, {r4, r5}\n\t"
  9030. "ldm %[b]!, {r6, r8}\n\t"
  9031. "sbcs r4, r4, r6\n\t"
  9032. "sbcs r5, r5, r8\n\t"
  9033. "stm %[r]!, {r4, r5}\n\t"
  9034. "ldm %[a]!, {r4, r5}\n\t"
  9035. "ldm %[b]!, {r6, r8}\n\t"
  9036. "sbcs r4, r4, r6\n\t"
  9037. "sbcs r5, r5, r8\n\t"
  9038. "stm %[r]!, {r4, r5}\n\t"
  9039. "ldm %[a]!, {r4, r5}\n\t"
  9040. "ldm %[b]!, {r6, r8}\n\t"
  9041. "sbcs r4, r4, r6\n\t"
  9042. "sbcs r5, r5, r8\n\t"
  9043. "stm %[r]!, {r4, r5}\n\t"
  9044. "ldm %[a]!, {r4, r5}\n\t"
  9045. "ldm %[b]!, {r6, r8}\n\t"
  9046. "sbcs r4, r4, r6\n\t"
  9047. "sbcs r5, r5, r8\n\t"
  9048. "stm %[r]!, {r4, r5}\n\t"
  9049. "ldm %[a]!, {r4, r5}\n\t"
  9050. "ldm %[b]!, {r6, r8}\n\t"
  9051. "sbcs r4, r4, r6\n\t"
  9052. "sbcs r5, r5, r8\n\t"
  9053. "stm %[r]!, {r4, r5}\n\t"
  9054. "ldm %[a]!, {r4, r5}\n\t"
  9055. "ldm %[b]!, {r6, r8}\n\t"
  9056. "sbcs r4, r4, r6\n\t"
  9057. "sbcs r5, r5, r8\n\t"
  9058. "stm %[r]!, {r4, r5}\n\t"
  9059. "ldm %[a]!, {r4, r5}\n\t"
  9060. "ldm %[b]!, {r6, r8}\n\t"
  9061. "sbcs r4, r4, r6\n\t"
  9062. "sbcs r5, r5, r8\n\t"
  9063. "stm %[r]!, {r4, r5}\n\t"
  9064. "ldm %[a]!, {r4, r5}\n\t"
  9065. "ldm %[b]!, {r6, r8}\n\t"
  9066. "sbcs r4, r4, r6\n\t"
  9067. "sbcs r5, r5, r8\n\t"
  9068. "stm %[r]!, {r4, r5}\n\t"
  9069. "ldm %[a]!, {r4, r5}\n\t"
  9070. "ldm %[b]!, {r6, r8}\n\t"
  9071. "sbcs r4, r4, r6\n\t"
  9072. "sbcs r5, r5, r8\n\t"
  9073. "stm %[r]!, {r4, r5}\n\t"
  9074. "ldm %[a]!, {r4, r5}\n\t"
  9075. "ldm %[b]!, {r6, r8}\n\t"
  9076. "sbcs r4, r4, r6\n\t"
  9077. "sbcs r5, r5, r8\n\t"
  9078. "stm %[r]!, {r4, r5}\n\t"
  9079. "ldm %[a]!, {r4, r5}\n\t"
  9080. "ldm %[b]!, {r6, r8}\n\t"
  9081. "sbcs r4, r4, r6\n\t"
  9082. "sbcs r5, r5, r8\n\t"
  9083. "stm %[r]!, {r4, r5}\n\t"
  9084. "ldm %[a]!, {r4, r5}\n\t"
  9085. "ldm %[b]!, {r6, r8}\n\t"
  9086. "sbcs r4, r4, r6\n\t"
  9087. "sbcs r5, r5, r8\n\t"
  9088. "stm %[r]!, {r4, r5}\n\t"
  9089. "ldm %[a]!, {r4, r5}\n\t"
  9090. "ldm %[b]!, {r6, r8}\n\t"
  9091. "sbcs r4, r4, r6\n\t"
  9092. "sbcs r5, r5, r8\n\t"
  9093. "stm %[r]!, {r4, r5}\n\t"
  9094. "ldm %[a]!, {r4, r5}\n\t"
  9095. "ldm %[b]!, {r6, r8}\n\t"
  9096. "sbcs r4, r4, r6\n\t"
  9097. "sbcs r5, r5, r8\n\t"
  9098. "stm %[r]!, {r4, r5}\n\t"
  9099. "ldm %[a]!, {r4, r5}\n\t"
  9100. "ldm %[b]!, {r6, r8}\n\t"
  9101. "sbcs r4, r4, r6\n\t"
  9102. "sbcs r5, r5, r8\n\t"
  9103. "stm %[r]!, {r4, r5}\n\t"
  9104. "ldm %[a]!, {r4, r5}\n\t"
  9105. "ldm %[b]!, {r6, r8}\n\t"
  9106. "sbcs r4, r4, r6\n\t"
  9107. "sbcs r5, r5, r8\n\t"
  9108. "stm %[r]!, {r4, r5}\n\t"
  9109. "ldm %[a]!, {r4, r5}\n\t"
  9110. "ldm %[b]!, {r6, r8}\n\t"
  9111. "sbcs r4, r4, r6\n\t"
  9112. "sbcs r5, r5, r8\n\t"
  9113. "stm %[r]!, {r4, r5}\n\t"
  9114. "ldm %[a]!, {r4, r5}\n\t"
  9115. "ldm %[b]!, {r6, r8}\n\t"
  9116. "sbcs r4, r4, r6\n\t"
  9117. "sbcs r5, r5, r8\n\t"
  9118. "stm %[r]!, {r4, r5}\n\t"
  9119. "ldm %[a]!, {r4, r5}\n\t"
  9120. "ldm %[b]!, {r6, r8}\n\t"
  9121. "sbcs r4, r4, r6\n\t"
  9122. "sbcs r5, r5, r8\n\t"
  9123. "stm %[r]!, {r4, r5}\n\t"
  9124. "ldm %[a]!, {r4, r5}\n\t"
  9125. "ldm %[b]!, {r6, r8}\n\t"
  9126. "sbcs r4, r4, r6\n\t"
  9127. "sbcs r5, r5, r8\n\t"
  9128. "stm %[r]!, {r4, r5}\n\t"
  9129. "ldm %[a]!, {r4, r5}\n\t"
  9130. "ldm %[b]!, {r6, r8}\n\t"
  9131. "sbcs r4, r4, r6\n\t"
  9132. "sbcs r5, r5, r8\n\t"
  9133. "stm %[r]!, {r4, r5}\n\t"
  9134. "ldm %[a]!, {r4, r5}\n\t"
  9135. "ldm %[b]!, {r6, r8}\n\t"
  9136. "sbcs r4, r4, r6\n\t"
  9137. "sbcs r5, r5, r8\n\t"
  9138. "stm %[r]!, {r4, r5}\n\t"
  9139. "ldm %[a]!, {r4, r5}\n\t"
  9140. "ldm %[b]!, {r6, r8}\n\t"
  9141. "sbcs r4, r4, r6\n\t"
  9142. "sbcs r5, r5, r8\n\t"
  9143. "stm %[r]!, {r4, r5}\n\t"
  9144. "ldm %[a]!, {r4, r5}\n\t"
  9145. "ldm %[b]!, {r6, r8}\n\t"
  9146. "sbcs r4, r4, r6\n\t"
  9147. "sbcs r5, r5, r8\n\t"
  9148. "stm %[r]!, {r4, r5}\n\t"
  9149. "ldm %[a]!, {r4, r5}\n\t"
  9150. "ldm %[b]!, {r6, r8}\n\t"
  9151. "sbcs r4, r4, r6\n\t"
  9152. "sbcs r5, r5, r8\n\t"
  9153. "stm %[r]!, {r4, r5}\n\t"
  9154. "ldm %[a]!, {r4, r5}\n\t"
  9155. "ldm %[b]!, {r6, r8}\n\t"
  9156. "sbcs r4, r4, r6\n\t"
  9157. "sbcs r5, r5, r8\n\t"
  9158. "stm %[r]!, {r4, r5}\n\t"
  9159. "ldm %[a]!, {r4, r5}\n\t"
  9160. "ldm %[b]!, {r6, r8}\n\t"
  9161. "sbcs r4, r4, r6\n\t"
  9162. "sbcs r5, r5, r8\n\t"
  9163. "stm %[r]!, {r4, r5}\n\t"
  9164. "ldm %[a]!, {r4, r5}\n\t"
  9165. "ldm %[b]!, {r6, r8}\n\t"
  9166. "sbcs r4, r4, r6\n\t"
  9167. "sbcs r5, r5, r8\n\t"
  9168. "stm %[r]!, {r4, r5}\n\t"
  9169. "ldm %[a]!, {r4, r5}\n\t"
  9170. "ldm %[b]!, {r6, r8}\n\t"
  9171. "sbcs r4, r4, r6\n\t"
  9172. "sbcs r5, r5, r8\n\t"
  9173. "stm %[r]!, {r4, r5}\n\t"
  9174. "ldm %[a]!, {r4, r5}\n\t"
  9175. "ldm %[b]!, {r6, r8}\n\t"
  9176. "sbcs r4, r4, r6\n\t"
  9177. "sbcs r5, r5, r8\n\t"
  9178. "stm %[r]!, {r4, r5}\n\t"
  9179. "ldm %[a]!, {r4, r5}\n\t"
  9180. "ldm %[b]!, {r6, r8}\n\t"
  9181. "sbcs r4, r4, r6\n\t"
  9182. "sbcs r5, r5, r8\n\t"
  9183. "stm %[r]!, {r4, r5}\n\t"
  9184. "ldm %[a]!, {r4, r5}\n\t"
  9185. "ldm %[b]!, {r6, r8}\n\t"
  9186. "sbcs r4, r4, r6\n\t"
  9187. "sbcs r5, r5, r8\n\t"
  9188. "stm %[r]!, {r4, r5}\n\t"
  9189. "ldm %[a]!, {r4, r5}\n\t"
  9190. "ldm %[b]!, {r6, r8}\n\t"
  9191. "sbcs r4, r4, r6\n\t"
  9192. "sbcs r5, r5, r8\n\t"
  9193. "stm %[r]!, {r4, r5}\n\t"
  9194. "ldm %[a]!, {r4, r5}\n\t"
  9195. "ldm %[b]!, {r6, r8}\n\t"
  9196. "sbcs r4, r4, r6\n\t"
  9197. "sbcs r5, r5, r8\n\t"
  9198. "stm %[r]!, {r4, r5}\n\t"
  9199. "ldm %[a]!, {r4, r5}\n\t"
  9200. "ldm %[b]!, {r6, r8}\n\t"
  9201. "sbcs r4, r4, r6\n\t"
  9202. "sbcs r5, r5, r8\n\t"
  9203. "stm %[r]!, {r4, r5}\n\t"
  9204. "ldm %[a]!, {r4, r5}\n\t"
  9205. "ldm %[b]!, {r6, r8}\n\t"
  9206. "sbcs r4, r4, r6\n\t"
  9207. "sbcs r5, r5, r8\n\t"
  9208. "stm %[r]!, {r4, r5}\n\t"
  9209. "ldm %[a]!, {r4, r5}\n\t"
  9210. "ldm %[b]!, {r6, r8}\n\t"
  9211. "sbcs r4, r4, r6\n\t"
  9212. "sbcs r5, r5, r8\n\t"
  9213. "stm %[r]!, {r4, r5}\n\t"
  9214. "ldm %[a]!, {r4, r5}\n\t"
  9215. "ldm %[b]!, {r6, r8}\n\t"
  9216. "sbcs r4, r4, r6\n\t"
  9217. "sbcs r5, r5, r8\n\t"
  9218. "stm %[r]!, {r4, r5}\n\t"
  9219. "ldm %[a]!, {r4, r5}\n\t"
  9220. "ldm %[b]!, {r6, r8}\n\t"
  9221. "sbcs r4, r4, r6\n\t"
  9222. "sbcs r5, r5, r8\n\t"
  9223. "stm %[r]!, {r4, r5}\n\t"
  9224. "ldm %[a]!, {r4, r5}\n\t"
  9225. "ldm %[b]!, {r6, r8}\n\t"
  9226. "sbcs r4, r4, r6\n\t"
  9227. "sbcs r5, r5, r8\n\t"
  9228. "stm %[r]!, {r4, r5}\n\t"
  9229. "ldm %[a]!, {r4, r5}\n\t"
  9230. "ldm %[b]!, {r6, r8}\n\t"
  9231. "sbcs r4, r4, r6\n\t"
  9232. "sbcs r5, r5, r8\n\t"
  9233. "stm %[r]!, {r4, r5}\n\t"
  9234. "ldm %[a]!, {r4, r5}\n\t"
  9235. "ldm %[b]!, {r6, r8}\n\t"
  9236. "sbcs r4, r4, r6\n\t"
  9237. "sbcs r5, r5, r8\n\t"
  9238. "stm %[r]!, {r4, r5}\n\t"
  9239. "ldm %[a]!, {r4, r5}\n\t"
  9240. "ldm %[b]!, {r6, r8}\n\t"
  9241. "sbcs r4, r4, r6\n\t"
  9242. "sbcs r5, r5, r8\n\t"
  9243. "stm %[r]!, {r4, r5}\n\t"
  9244. "ldm %[a]!, {r4, r5}\n\t"
  9245. "ldm %[b]!, {r6, r8}\n\t"
  9246. "sbcs r4, r4, r6\n\t"
  9247. "sbcs r5, r5, r8\n\t"
  9248. "stm %[r]!, {r4, r5}\n\t"
  9249. "sbc %[c], %[c], %[c]\n\t"
  9250. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  9251. :
  9252. : "memory", "r4", "r5", "r6", "r8"
  9253. );
  9254. return c;
  9255. }
  9256. #endif /* WOLFSSL_SP_SMALL */
  9257. /* Divide the double width number (d1|d0) by the divisor. (d1|d0 / div)
  9258. *
  9259. * d1 The high order half of the number to divide.
  9260. * d0 The low order half of the number to divide.
  9261. * div The divisor.
  9262. * returns the result of the division.
  9263. *
  9264. * Note that this is an approximate div. It may give an answer 1 larger.
  9265. */
  9266. SP_NOINLINE static sp_digit div_3072_word_96(sp_digit d1, sp_digit d0,
  9267. sp_digit div)
  9268. {
  9269. sp_digit r = 0;
  9270. __asm__ __volatile__ (
  9271. "lsr r6, %[div], #16\n\t"
  9272. "add r6, r6, #1\n\t"
  9273. "udiv r4, %[d1], r6\n\t"
  9274. "lsl r8, r4, #16\n\t"
  9275. "umull r4, r5, %[div], r8\n\t"
  9276. "subs %[d0], %[d0], r4\n\t"
  9277. "sbc %[d1], %[d1], r5\n\t"
  9278. "udiv r5, %[d1], r6\n\t"
  9279. "lsl r4, r5, #16\n\t"
  9280. "add r8, r8, r4\n\t"
  9281. "umull r4, r5, %[div], r4\n\t"
  9282. "subs %[d0], %[d0], r4\n\t"
  9283. "sbc %[d1], %[d1], r5\n\t"
  9284. "lsl r4, %[d1], #16\n\t"
  9285. "orr r4, r4, %[d0], lsr #16\n\t"
  9286. "udiv r4, r4, r6\n\t"
  9287. "add r8, r8, r4\n\t"
  9288. "umull r4, r5, %[div], r4\n\t"
  9289. "subs %[d0], %[d0], r4\n\t"
  9290. "sbc %[d1], %[d1], r5\n\t"
  9291. "lsl r4, %[d1], #16\n\t"
  9292. "orr r4, r4, %[d0], lsr #16\n\t"
  9293. "udiv r4, r4, r6\n\t"
  9294. "add r8, r8, r4\n\t"
  9295. "umull r4, r5, %[div], r4\n\t"
  9296. "subs %[d0], %[d0], r4\n\t"
  9297. "sbc %[d1], %[d1], r5\n\t"
  9298. "udiv r4, %[d0], %[div]\n\t"
  9299. "add r8, r8, r4\n\t"
  9300. "mov %[r], r8\n\t"
  9301. : [r] "+r" (r)
  9302. : [d1] "r" (d1), [d0] "r" (d0), [div] "r" (div)
  9303. : "r4", "r5", "r6", "r8"
  9304. );
  9305. return r;
  9306. }
  9307. /* Divide d in a and put remainder into r (m*d + r = a)
  9308. * m is not calculated as it is not needed at this time.
  9309. *
  9310. * a Number to be divided.
  9311. * d Number to divide with.
  9312. * m Multiplier result.
  9313. * r Remainder from the division.
  9314. * returns MP_OKAY indicating success.
  9315. */
  9316. static WC_INLINE int sp_3072_div_96_cond(const sp_digit* a, const sp_digit* d, sp_digit* m,
  9317. sp_digit* r)
  9318. {
  9319. sp_digit t1[192], t2[97];
  9320. sp_digit div, r1;
  9321. int i;
  9322. (void)m;
  9323. div = d[95];
  9324. XMEMCPY(t1, a, sizeof(*t1) * 2 * 96);
  9325. for (i = 95; i > 0; i--) {
  9326. if (t1[i + 96] != d[i])
  9327. break;
  9328. }
  9329. if (t1[i + 96] >= d[i]) {
  9330. sp_3072_sub_in_place_96(&t1[96], d);
  9331. }
  9332. for (i = 95; i >= 0; i--) {
  9333. if (t1[96 + i] == div) {
  9334. r1 = SP_DIGIT_MAX;
  9335. }
  9336. else {
  9337. r1 = div_3072_word_96(t1[96 + i], t1[96 + i - 1], div);
  9338. }
  9339. sp_3072_mul_d_96(t2, d, r1);
  9340. t1[96 + i] += sp_3072_sub_in_place_96(&t1[i], t2);
  9341. t1[96 + i] -= t2[96];
  9342. if (t1[96 + i] != 0) {
  9343. t1[96 + i] += sp_3072_add_96(&t1[i], &t1[i], d);
  9344. if (t1[96 + i] != 0)
  9345. t1[96 + i] += sp_3072_add_96(&t1[i], &t1[i], d);
  9346. }
  9347. }
  9348. for (i = 95; i > 0; i--) {
  9349. if (t1[i] != d[i])
  9350. break;
  9351. }
  9352. if (t1[i] >= d[i]) {
  9353. sp_3072_sub_96(r, t1, d);
  9354. }
  9355. else {
  9356. XMEMCPY(r, t1, sizeof(*t1) * 96);
  9357. }
  9358. return MP_OKAY;
  9359. }
  9360. /* Reduce a modulo m into r. (r = a mod m)
  9361. *
  9362. * r A single precision number that is the reduced result.
  9363. * a A single precision number that is to be reduced.
  9364. * m A single precision number that is the modulus to reduce with.
  9365. * returns MP_OKAY indicating success.
  9366. */
  9367. static WC_INLINE int sp_3072_mod_96_cond(sp_digit* r, const sp_digit* a, const sp_digit* m)
  9368. {
  9369. return sp_3072_div_96_cond(a, m, NULL, r);
  9370. }
  9371. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || defined(WOLFSSL_HAVE_SP_DH)
  9372. /* AND m into each word of a and store in r.
  9373. *
  9374. * r A single precision integer.
  9375. * a A single precision integer.
  9376. * m Mask to AND against each digit.
  9377. */
  9378. static void sp_3072_mask_96(sp_digit* r, const sp_digit* a, sp_digit m)
  9379. {
  9380. #ifdef WOLFSSL_SP_SMALL
  9381. int i;
  9382. for (i=0; i<96; i++) {
  9383. r[i] = a[i] & m;
  9384. }
  9385. #else
  9386. int i;
  9387. for (i = 0; i < 96; i += 8) {
  9388. r[i+0] = a[i+0] & m;
  9389. r[i+1] = a[i+1] & m;
  9390. r[i+2] = a[i+2] & m;
  9391. r[i+3] = a[i+3] & m;
  9392. r[i+4] = a[i+4] & m;
  9393. r[i+5] = a[i+5] & m;
  9394. r[i+6] = a[i+6] & m;
  9395. r[i+7] = a[i+7] & m;
  9396. }
  9397. #endif
  9398. }
  9399. /* Compare a with b in constant time.
  9400. *
  9401. * a A single precision integer.
  9402. * b A single precision integer.
  9403. * return -ve, 0 or +ve if a is less than, equal to or greater than b
  9404. * respectively.
  9405. */
  9406. SP_NOINLINE static sp_int32 sp_3072_cmp_96(const sp_digit* a, const sp_digit* b)
  9407. {
  9408. sp_digit r = 0;
  9409. __asm__ __volatile__ (
  9410. "mov r3, #0\n\t"
  9411. "mvn r3, r3\n\t"
  9412. "mov r6, #1\n\t"
  9413. "lsl r6, r6, #8\n\t"
  9414. "add r6, r6, #124\n\t"
  9415. "\n1:\n\t"
  9416. "ldr r8, [%[a], r6]\n\t"
  9417. "ldr r5, [%[b], r6]\n\t"
  9418. "and r8, r8, r3\n\t"
  9419. "and r5, r5, r3\n\t"
  9420. "mov r4, r8\n\t"
  9421. "subs r8, r8, r5\n\t"
  9422. "sbc r8, r8, r8\n\t"
  9423. "add %[r], %[r], r8\n\t"
  9424. "mvn r8, r8\n\t"
  9425. "and r3, r3, r8\n\t"
  9426. "subs r5, r5, r4\n\t"
  9427. "sbc r8, r8, r8\n\t"
  9428. "sub %[r], %[r], r8\n\t"
  9429. "mvn r8, r8\n\t"
  9430. "and r3, r3, r8\n\t"
  9431. "sub r6, r6, #4\n\t"
  9432. "cmp r6, #0\n\t"
  9433. #ifdef __GNUC__
  9434. "bge 1b\n\t"
  9435. #else
  9436. "bge.n 1b\n\t"
  9437. #endif /* __GNUC__ */
  9438. : [r] "+r" (r)
  9439. : [a] "r" (a), [b] "r" (b)
  9440. : "r3", "r4", "r5", "r6", "r8"
  9441. );
  9442. return r;
  9443. }
  9444. /* Divide d in a and put remainder into r (m*d + r = a)
  9445. * m is not calculated as it is not needed at this time.
  9446. *
  9447. * a Number to be divided.
  9448. * d Number to divide with.
  9449. * m Multiplier result.
  9450. * r Remainder from the division.
  9451. * returns MP_OKAY indicating success.
  9452. */
  9453. static WC_INLINE int sp_3072_div_96(const sp_digit* a, const sp_digit* d, sp_digit* m,
  9454. sp_digit* r)
  9455. {
  9456. sp_digit t1[192], t2[97];
  9457. sp_digit div, r1;
  9458. int i;
  9459. (void)m;
  9460. div = d[95];
  9461. XMEMCPY(t1, a, sizeof(*t1) * 2 * 96);
  9462. r1 = sp_3072_cmp_96(&t1[96], d) >= 0;
  9463. sp_3072_cond_sub_96(&t1[96], &t1[96], d, (sp_digit)0 - r1);
  9464. for (i = 95; i >= 0; i--) {
  9465. sp_digit mask = 0 - (t1[96 + i] == div);
  9466. sp_digit hi = t1[96 + i] + mask;
  9467. r1 = div_3072_word_96(hi, t1[96 + i - 1], div);
  9468. r1 |= mask;
  9469. sp_3072_mul_d_96(t2, d, r1);
  9470. t1[96 + i] += sp_3072_sub_in_place_96(&t1[i], t2);
  9471. t1[96 + i] -= t2[96];
  9472. sp_3072_mask_96(t2, d, t1[96 + i]);
  9473. t1[96 + i] += sp_3072_add_96(&t1[i], &t1[i], t2);
  9474. sp_3072_mask_96(t2, d, t1[96 + i]);
  9475. t1[96 + i] += sp_3072_add_96(&t1[i], &t1[i], t2);
  9476. }
  9477. r1 = sp_3072_cmp_96(t1, d) >= 0;
  9478. sp_3072_cond_sub_96(r, t1, d, (sp_digit)0 - r1);
  9479. return MP_OKAY;
  9480. }
  9481. /* Reduce a modulo m into r. (r = a mod m)
  9482. *
  9483. * r A single precision number that is the reduced result.
  9484. * a A single precision number that is to be reduced.
  9485. * m A single precision number that is the modulus to reduce with.
  9486. * returns MP_OKAY indicating success.
  9487. */
  9488. static WC_INLINE int sp_3072_mod_96(sp_digit* r, const sp_digit* a, const sp_digit* m)
  9489. {
  9490. return sp_3072_div_96(a, m, NULL, r);
  9491. }
  9492. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || \
  9493. defined(WOLFSSL_HAVE_SP_DH)
  9494. #ifdef WOLFSSL_SP_SMALL
  9495. /* Modular exponentiate a to the e mod m. (r = a^e mod m)
  9496. *
  9497. * r A single precision number that is the result of the operation.
  9498. * a A single precision number being exponentiated.
  9499. * e A single precision number that is the exponent.
  9500. * bits The number of bits in the exponent.
  9501. * m A single precision number that is the modulus.
  9502. * returns 0 on success.
  9503. * returns MEMORY_E on dynamic memory allocation failure.
  9504. * returns MP_VAL when base is even or exponent is 0.
  9505. */
  9506. static int sp_3072_mod_exp_96(sp_digit* r, const sp_digit* a, const sp_digit* e,
  9507. int bits, const sp_digit* m, int reduceA)
  9508. {
  9509. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  9510. sp_digit* td = NULL;
  9511. #else
  9512. sp_digit td[8 * 192];
  9513. #endif
  9514. sp_digit* t[8];
  9515. sp_digit* norm = NULL;
  9516. sp_digit mp = 1;
  9517. sp_digit n;
  9518. sp_digit mask;
  9519. int i;
  9520. int c;
  9521. byte y;
  9522. int err = MP_OKAY;
  9523. if (bits == 0) {
  9524. err = MP_VAL;
  9525. }
  9526. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  9527. if (err == MP_OKAY) {
  9528. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * (8 * 192), NULL,
  9529. DYNAMIC_TYPE_TMP_BUFFER);
  9530. if (td == NULL)
  9531. err = MEMORY_E;
  9532. }
  9533. #endif
  9534. if (err == MP_OKAY) {
  9535. norm = td;
  9536. for (i=0; i<8; i++) {
  9537. t[i] = td + i * 192;
  9538. }
  9539. sp_3072_mont_setup(m, &mp);
  9540. sp_3072_mont_norm_96(norm, m);
  9541. XMEMSET(t[1], 0, sizeof(sp_digit) * 96U);
  9542. if (reduceA != 0) {
  9543. err = sp_3072_mod_96(t[1] + 96, a, m);
  9544. if (err == MP_OKAY) {
  9545. err = sp_3072_mod_96(t[1], t[1], m);
  9546. }
  9547. }
  9548. else {
  9549. XMEMCPY(t[1] + 96, a, sizeof(sp_digit) * 96);
  9550. err = sp_3072_mod_96(t[1], t[1], m);
  9551. }
  9552. }
  9553. if (err == MP_OKAY) {
  9554. sp_3072_mont_sqr_96(t[ 2], t[ 1], m, mp);
  9555. sp_3072_mont_mul_96(t[ 3], t[ 2], t[ 1], m, mp);
  9556. sp_3072_mont_sqr_96(t[ 4], t[ 2], m, mp);
  9557. sp_3072_mont_mul_96(t[ 5], t[ 3], t[ 2], m, mp);
  9558. sp_3072_mont_sqr_96(t[ 6], t[ 3], m, mp);
  9559. sp_3072_mont_mul_96(t[ 7], t[ 4], t[ 3], m, mp);
  9560. i = (bits - 1) / 32;
  9561. n = e[i--];
  9562. c = bits & 31;
  9563. if (c == 0) {
  9564. c = 32;
  9565. }
  9566. c -= bits % 3;
  9567. if (c == 32) {
  9568. c = 29;
  9569. }
  9570. if (c < 0) {
  9571. /* Number of bits in top word is less than number needed. */
  9572. c = -c;
  9573. y = (byte)(n << c);
  9574. n = e[i--];
  9575. y |= (byte)(n >> (64 - c));
  9576. n <<= c;
  9577. c = 64 - c;
  9578. }
  9579. else if (c == 0) {
  9580. /* All bits in top word used. */
  9581. y = (byte)n;
  9582. }
  9583. else {
  9584. y = (byte)(n >> c);
  9585. n <<= 32 - c;
  9586. }
  9587. XMEMCPY(r, t[y], sizeof(sp_digit) * 96);
  9588. for (; i>=0 || c>=3; ) {
  9589. if (c == 0) {
  9590. n = e[i--];
  9591. y = (byte)(n >> 29);
  9592. n <<= 3;
  9593. c = 29;
  9594. }
  9595. else if (c < 3) {
  9596. y = (byte)(n >> 29);
  9597. n = e[i--];
  9598. c = 3 - c;
  9599. y |= (byte)(n >> (32 - c));
  9600. n <<= c;
  9601. c = 32 - c;
  9602. }
  9603. else {
  9604. y = (byte)((n >> 29) & 0x7);
  9605. n <<= 3;
  9606. c -= 3;
  9607. }
  9608. sp_3072_mont_sqr_96(r, r, m, mp);
  9609. sp_3072_mont_sqr_96(r, r, m, mp);
  9610. sp_3072_mont_sqr_96(r, r, m, mp);
  9611. sp_3072_mont_mul_96(r, r, t[y], m, mp);
  9612. }
  9613. XMEMSET(&r[96], 0, sizeof(sp_digit) * 96U);
  9614. sp_3072_mont_reduce_96(r, m, mp);
  9615. mask = 0 - (sp_3072_cmp_96(r, m) >= 0);
  9616. sp_3072_cond_sub_96(r, r, m, mask);
  9617. }
  9618. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  9619. if (td != NULL)
  9620. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  9621. #endif
  9622. return err;
  9623. }
  9624. #else
  9625. /* Modular exponentiate a to the e mod m. (r = a^e mod m)
  9626. *
  9627. * r A single precision number that is the result of the operation.
  9628. * a A single precision number being exponentiated.
  9629. * e A single precision number that is the exponent.
  9630. * bits The number of bits in the exponent.
  9631. * m A single precision number that is the modulus.
  9632. * returns 0 on success.
  9633. * returns MEMORY_E on dynamic memory allocation failure.
  9634. * returns MP_VAL when base is even or exponent is 0.
  9635. */
  9636. static int sp_3072_mod_exp_96(sp_digit* r, const sp_digit* a, const sp_digit* e,
  9637. int bits, const sp_digit* m, int reduceA)
  9638. {
  9639. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  9640. sp_digit* td = NULL;
  9641. #else
  9642. sp_digit td[16 * 192];
  9643. #endif
  9644. sp_digit* t[16];
  9645. sp_digit* norm = NULL;
  9646. sp_digit mp = 1;
  9647. sp_digit n;
  9648. sp_digit mask;
  9649. int i;
  9650. int c;
  9651. byte y;
  9652. int err = MP_OKAY;
  9653. if (bits == 0) {
  9654. err = MP_VAL;
  9655. }
  9656. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  9657. if (err == MP_OKAY) {
  9658. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * (16 * 192), NULL,
  9659. DYNAMIC_TYPE_TMP_BUFFER);
  9660. if (td == NULL)
  9661. err = MEMORY_E;
  9662. }
  9663. #endif
  9664. if (err == MP_OKAY) {
  9665. norm = td;
  9666. for (i=0; i<16; i++) {
  9667. t[i] = td + i * 192;
  9668. }
  9669. sp_3072_mont_setup(m, &mp);
  9670. sp_3072_mont_norm_96(norm, m);
  9671. XMEMSET(t[1], 0, sizeof(sp_digit) * 96U);
  9672. if (reduceA != 0) {
  9673. err = sp_3072_mod_96(t[1] + 96, a, m);
  9674. if (err == MP_OKAY) {
  9675. err = sp_3072_mod_96(t[1], t[1], m);
  9676. }
  9677. }
  9678. else {
  9679. XMEMCPY(t[1] + 96, a, sizeof(sp_digit) * 96);
  9680. err = sp_3072_mod_96(t[1], t[1], m);
  9681. }
  9682. }
  9683. if (err == MP_OKAY) {
  9684. sp_3072_mont_sqr_96(t[ 2], t[ 1], m, mp);
  9685. sp_3072_mont_mul_96(t[ 3], t[ 2], t[ 1], m, mp);
  9686. sp_3072_mont_sqr_96(t[ 4], t[ 2], m, mp);
  9687. sp_3072_mont_mul_96(t[ 5], t[ 3], t[ 2], m, mp);
  9688. sp_3072_mont_sqr_96(t[ 6], t[ 3], m, mp);
  9689. sp_3072_mont_mul_96(t[ 7], t[ 4], t[ 3], m, mp);
  9690. sp_3072_mont_sqr_96(t[ 8], t[ 4], m, mp);
  9691. sp_3072_mont_mul_96(t[ 9], t[ 5], t[ 4], m, mp);
  9692. sp_3072_mont_sqr_96(t[10], t[ 5], m, mp);
  9693. sp_3072_mont_mul_96(t[11], t[ 6], t[ 5], m, mp);
  9694. sp_3072_mont_sqr_96(t[12], t[ 6], m, mp);
  9695. sp_3072_mont_mul_96(t[13], t[ 7], t[ 6], m, mp);
  9696. sp_3072_mont_sqr_96(t[14], t[ 7], m, mp);
  9697. sp_3072_mont_mul_96(t[15], t[ 8], t[ 7], m, mp);
  9698. i = (bits - 1) / 32;
  9699. n = e[i--];
  9700. c = bits & 31;
  9701. if (c == 0) {
  9702. c = 32;
  9703. }
  9704. c -= bits % 4;
  9705. if (c == 32) {
  9706. c = 28;
  9707. }
  9708. if (c < 0) {
  9709. /* Number of bits in top word is less than number needed. */
  9710. c = -c;
  9711. y = (byte)(n << c);
  9712. n = e[i--];
  9713. y |= (byte)(n >> (64 - c));
  9714. n <<= c;
  9715. c = 64 - c;
  9716. }
  9717. else if (c == 0) {
  9718. /* All bits in top word used. */
  9719. y = (byte)n;
  9720. }
  9721. else {
  9722. y = (byte)(n >> c);
  9723. n <<= 32 - c;
  9724. }
  9725. XMEMCPY(r, t[y], sizeof(sp_digit) * 96);
  9726. for (; i>=0 || c>=4; ) {
  9727. if (c == 0) {
  9728. n = e[i--];
  9729. y = (byte)(n >> 28);
  9730. n <<= 4;
  9731. c = 28;
  9732. }
  9733. else if (c < 4) {
  9734. y = (byte)(n >> 28);
  9735. n = e[i--];
  9736. c = 4 - c;
  9737. y |= (byte)(n >> (32 - c));
  9738. n <<= c;
  9739. c = 32 - c;
  9740. }
  9741. else {
  9742. y = (byte)((n >> 28) & 0xf);
  9743. n <<= 4;
  9744. c -= 4;
  9745. }
  9746. sp_3072_mont_sqr_96(r, r, m, mp);
  9747. sp_3072_mont_sqr_96(r, r, m, mp);
  9748. sp_3072_mont_sqr_96(r, r, m, mp);
  9749. sp_3072_mont_sqr_96(r, r, m, mp);
  9750. sp_3072_mont_mul_96(r, r, t[y], m, mp);
  9751. }
  9752. XMEMSET(&r[96], 0, sizeof(sp_digit) * 96U);
  9753. sp_3072_mont_reduce_96(r, m, mp);
  9754. mask = 0 - (sp_3072_cmp_96(r, m) >= 0);
  9755. sp_3072_cond_sub_96(r, r, m, mask);
  9756. }
  9757. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  9758. if (td != NULL)
  9759. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  9760. #endif
  9761. return err;
  9762. }
  9763. #endif /* WOLFSSL_SP_SMALL */
  9764. #endif /* (WOLFSSL_HAVE_SP_RSA && !WOLFSSL_RSA_PUBLIC_ONLY) || WOLFSSL_HAVE_SP_DH */
  9765. #endif /* (WOLFSSL_HAVE_SP_RSA && !WOLFSSL_RSA_PUBLIC_ONLY) || WOLFSSL_HAVE_SP_DH */
  9766. #ifdef WOLFSSL_HAVE_SP_RSA
  9767. /* RSA public key operation.
  9768. *
  9769. * in Array of bytes representing the number to exponentiate, base.
  9770. * inLen Number of bytes in base.
  9771. * em Public exponent.
  9772. * mm Modulus.
  9773. * out Buffer to hold big-endian bytes of exponentiation result.
  9774. * Must be at least 384 bytes long.
  9775. * outLen Number of bytes in result.
  9776. * returns 0 on success, MP_TO_E when the outLen is too small, MP_READ_E when
  9777. * an array is too long and MEMORY_E when dynamic memory allocation fails.
  9778. */
  9779. int sp_RsaPublic_3072(const byte* in, word32 inLen, const mp_int* em,
  9780. const mp_int* mm, byte* out, word32* outLen)
  9781. {
  9782. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  9783. sp_digit* a = NULL;
  9784. #else
  9785. sp_digit a[96 * 5];
  9786. #endif
  9787. sp_digit* m = NULL;
  9788. sp_digit* r = NULL;
  9789. sp_digit *ah = NULL;
  9790. sp_digit e[1] = {0};
  9791. int err = MP_OKAY;
  9792. if (*outLen < 384) {
  9793. err = MP_TO_E;
  9794. }
  9795. else if (mp_count_bits(em) > 32 || inLen > 384 ||
  9796. mp_count_bits(mm) != 3072) {
  9797. err = MP_READ_E;
  9798. }
  9799. else if (mp_iseven(mm)) {
  9800. err = MP_VAL;
  9801. }
  9802. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  9803. if (err == MP_OKAY) {
  9804. a = (sp_digit*)XMALLOC(sizeof(sp_digit) * 96 * 5, NULL,
  9805. DYNAMIC_TYPE_RSA);
  9806. if (a == NULL)
  9807. err = MEMORY_E;
  9808. }
  9809. #endif
  9810. if (err == MP_OKAY) {
  9811. ah = a + 96;
  9812. r = a + 96 * 2;
  9813. m = r + 96 * 2;
  9814. sp_3072_from_bin(ah, 96, in, inLen);
  9815. #if DIGIT_BIT >= 32
  9816. e[0] = em->dp[0];
  9817. #else
  9818. e[0] = em->dp[0];
  9819. if (em->used > 1) {
  9820. e[0] |= ((sp_digit)em->dp[1]) << DIGIT_BIT;
  9821. }
  9822. #endif
  9823. if (e[0] == 0) {
  9824. err = MP_EXPTMOD_E;
  9825. }
  9826. }
  9827. if (err == MP_OKAY) {
  9828. sp_3072_from_mp(m, 96, mm);
  9829. if (e[0] == 0x10001) {
  9830. int i;
  9831. sp_digit mp;
  9832. sp_3072_mont_setup(m, &mp);
  9833. /* Convert to Montgomery form. */
  9834. XMEMSET(a, 0, sizeof(sp_digit) * 96);
  9835. err = sp_3072_mod_96_cond(r, a, m);
  9836. /* Montgomery form: r = a.R mod m */
  9837. if (err == MP_OKAY) {
  9838. /* r = a ^ 0x10000 => r = a squared 16 times */
  9839. for (i = 15; i >= 0; i--) {
  9840. sp_3072_mont_sqr_96(r, r, m, mp);
  9841. }
  9842. /* mont_red(r.R.R) = (r.R.R / R) mod m = r.R mod m
  9843. * mont_red(r.R * a) = (r.R.a / R) mod m = r.a mod m
  9844. */
  9845. sp_3072_mont_mul_96(r, r, ah, m, mp);
  9846. for (i = 95; i > 0; i--) {
  9847. if (r[i] != m[i]) {
  9848. break;
  9849. }
  9850. }
  9851. if (r[i] >= m[i]) {
  9852. sp_3072_sub_in_place_96(r, m);
  9853. }
  9854. }
  9855. }
  9856. else if (e[0] == 0x3) {
  9857. if (err == MP_OKAY) {
  9858. sp_3072_sqr_96(r, ah);
  9859. err = sp_3072_mod_96_cond(r, r, m);
  9860. }
  9861. if (err == MP_OKAY) {
  9862. sp_3072_mul_96(r, ah, r);
  9863. err = sp_3072_mod_96_cond(r, r, m);
  9864. }
  9865. }
  9866. else {
  9867. int i;
  9868. sp_digit mp;
  9869. sp_3072_mont_setup(m, &mp);
  9870. /* Convert to Montgomery form. */
  9871. XMEMSET(a, 0, sizeof(sp_digit) * 96);
  9872. err = sp_3072_mod_96_cond(a, a, m);
  9873. if (err == MP_OKAY) {
  9874. for (i = 31; i >= 0; i--) {
  9875. if (e[0] >> i) {
  9876. break;
  9877. }
  9878. }
  9879. XMEMCPY(r, a, sizeof(sp_digit) * 96);
  9880. for (i--; i >= 0; i--) {
  9881. sp_3072_mont_sqr_96(r, r, m, mp);
  9882. if (((e[0] >> i) & 1) == 1) {
  9883. sp_3072_mont_mul_96(r, r, a, m, mp);
  9884. }
  9885. }
  9886. XMEMSET(&r[96], 0, sizeof(sp_digit) * 96);
  9887. sp_3072_mont_reduce_96(r, m, mp);
  9888. for (i = 95; i > 0; i--) {
  9889. if (r[i] != m[i]) {
  9890. break;
  9891. }
  9892. }
  9893. if (r[i] >= m[i]) {
  9894. sp_3072_sub_in_place_96(r, m);
  9895. }
  9896. }
  9897. }
  9898. }
  9899. if (err == MP_OKAY) {
  9900. sp_3072_to_bin_96(r, out);
  9901. *outLen = 384;
  9902. }
  9903. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  9904. if (a != NULL)
  9905. XFREE(a, NULL, DYNAMIC_TYPE_RSA);
  9906. #endif
  9907. return err;
  9908. }
  9909. #ifndef WOLFSSL_RSA_PUBLIC_ONLY
  9910. /* Conditionally add a and b using the mask m.
  9911. * m is -1 to add and 0 when not.
  9912. *
  9913. * r A single precision number representing conditional add result.
  9914. * a A single precision number to add with.
  9915. * b A single precision number to add.
  9916. * m Mask value to apply.
  9917. */
  9918. SP_NOINLINE static sp_digit sp_3072_cond_add_48(sp_digit* r, const sp_digit* a, const sp_digit* b,
  9919. sp_digit m)
  9920. {
  9921. sp_digit c = 0;
  9922. __asm__ __volatile__ (
  9923. "mov r5, #192\n\t"
  9924. "mov r9, r5\n\t"
  9925. "mov r8, #0\n\t"
  9926. "\n1:\n\t"
  9927. "ldr r6, [%[b], r8]\n\t"
  9928. "and r6, r6, %[m]\n\t"
  9929. "adds r5, %[c], #-1\n\t"
  9930. "ldr r5, [%[a], r8]\n\t"
  9931. "adcs r5, r5, r6\n\t"
  9932. "mov %[c], #0\n\t"
  9933. "adcs %[c], %[c], %[c]\n\t"
  9934. "str r5, [%[r], r8]\n\t"
  9935. "add r8, r8, #4\n\t"
  9936. "cmp r8, r9\n\t"
  9937. #ifdef __GNUC__
  9938. "blt 1b\n\t"
  9939. #else
  9940. "blt.n 1b\n\t"
  9941. #endif /* __GNUC__ */
  9942. : [c] "+r" (c)
  9943. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  9944. : "memory", "r5", "r6", "r8", "r9"
  9945. );
  9946. return c;
  9947. }
  9948. /* RSA private key operation.
  9949. *
  9950. * in Array of bytes representing the number to exponentiate, base.
  9951. * inLen Number of bytes in base.
  9952. * dm Private exponent.
  9953. * pm First prime.
  9954. * qm Second prime.
  9955. * dpm First prime's CRT exponent.
  9956. * dqm Second prime's CRT exponent.
  9957. * qim Inverse of second prime mod p.
  9958. * mm Modulus.
  9959. * out Buffer to hold big-endian bytes of exponentiation result.
  9960. * Must be at least 384 bytes long.
  9961. * outLen Number of bytes in result.
  9962. * returns 0 on success, MP_TO_E when the outLen is too small, MP_READ_E when
  9963. * an array is too long and MEMORY_E when dynamic memory allocation fails.
  9964. */
  9965. int sp_RsaPrivate_3072(const byte* in, word32 inLen, const mp_int* dm,
  9966. const mp_int* pm, const mp_int* qm, const mp_int* dpm, const mp_int* dqm,
  9967. const mp_int* qim, const mp_int* mm, byte* out, word32* outLen)
  9968. {
  9969. #if defined(SP_RSA_PRIVATE_EXP_D) || defined(RSA_LOW_MEM)
  9970. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  9971. sp_digit* d = NULL;
  9972. #else
  9973. sp_digit d[96 * 4];
  9974. #endif
  9975. sp_digit* a = NULL;
  9976. sp_digit* m = NULL;
  9977. sp_digit* r = NULL;
  9978. int err = MP_OKAY;
  9979. (void)pm;
  9980. (void)qm;
  9981. (void)dpm;
  9982. (void)dqm;
  9983. (void)qim;
  9984. if (*outLen < 384U) {
  9985. err = MP_TO_E;
  9986. }
  9987. if (err == MP_OKAY) {
  9988. if (mp_count_bits(dm) > 3072) {
  9989. err = MP_READ_E;
  9990. }
  9991. else if (inLen > 384) {
  9992. err = MP_READ_E;
  9993. }
  9994. else if (mp_count_bits(mm) != 3072) {
  9995. err = MP_READ_E;
  9996. }
  9997. else if (mp_iseven(mm)) {
  9998. err = MP_VAL;
  9999. }
  10000. }
  10001. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  10002. if (err == MP_OKAY) {
  10003. d = (sp_digit*)XMALLOC(sizeof(sp_digit) * 96 * 4, NULL,
  10004. DYNAMIC_TYPE_RSA);
  10005. if (d == NULL)
  10006. err = MEMORY_E;
  10007. }
  10008. #endif
  10009. if (err == MP_OKAY) {
  10010. a = d + 96;
  10011. m = a + 192;
  10012. r = a;
  10013. sp_3072_from_bin(a, 96, in, inLen);
  10014. sp_3072_from_mp(d, 96, dm);
  10015. sp_3072_from_mp(m, 96, mm);
  10016. err = sp_3072_mod_exp_96(r, a, d, 3072, m, 0);
  10017. }
  10018. if (err == MP_OKAY) {
  10019. sp_3072_to_bin_96(r, out);
  10020. *outLen = 384;
  10021. }
  10022. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  10023. if (d != NULL)
  10024. #endif
  10025. {
  10026. /* only "a" and "r" are sensitive and need zeroized (same pointer) */
  10027. if (a != NULL)
  10028. ForceZero(a, sizeof(sp_digit) * 96);
  10029. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  10030. XFREE(d, NULL, DYNAMIC_TYPE_RSA);
  10031. #endif
  10032. }
  10033. return err;
  10034. #else
  10035. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  10036. sp_digit* a = NULL;
  10037. #else
  10038. sp_digit a[48 * 11];
  10039. #endif
  10040. sp_digit* p = NULL;
  10041. sp_digit* q = NULL;
  10042. sp_digit* dp = NULL;
  10043. sp_digit* tmpa = NULL;
  10044. sp_digit* tmpb = NULL;
  10045. sp_digit* r = NULL;
  10046. sp_digit* qi = NULL;
  10047. sp_digit* dq = NULL;
  10048. sp_digit c;
  10049. int err = MP_OKAY;
  10050. (void)dm;
  10051. (void)mm;
  10052. if (*outLen < 384) {
  10053. err = MP_TO_E;
  10054. }
  10055. else if (inLen > 384 || mp_count_bits(mm) != 3072) {
  10056. err = MP_READ_E;
  10057. }
  10058. else if (mp_iseven(mm)) {
  10059. err = MP_VAL;
  10060. }
  10061. else if (mp_iseven(pm)) {
  10062. err = MP_VAL;
  10063. }
  10064. else if (mp_iseven(qm)) {
  10065. err = MP_VAL;
  10066. }
  10067. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  10068. if (err == MP_OKAY) {
  10069. a = (sp_digit*)XMALLOC(sizeof(sp_digit) * 48 * 11, NULL,
  10070. DYNAMIC_TYPE_RSA);
  10071. if (a == NULL)
  10072. err = MEMORY_E;
  10073. }
  10074. #endif
  10075. if (err == MP_OKAY) {
  10076. p = a + 96 * 2;
  10077. q = p + 48;
  10078. qi = dq = dp = q + 48;
  10079. tmpa = qi + 48;
  10080. tmpb = tmpa + 96;
  10081. r = a;
  10082. sp_3072_from_bin(a, 96, in, inLen);
  10083. sp_3072_from_mp(p, 48, pm);
  10084. sp_3072_from_mp(q, 48, qm);
  10085. sp_3072_from_mp(dp, 48, dpm);
  10086. err = sp_3072_mod_exp_48(tmpa, a, dp, 1536, p, 1);
  10087. }
  10088. if (err == MP_OKAY) {
  10089. sp_3072_from_mp(dq, 48, dqm);
  10090. err = sp_3072_mod_exp_48(tmpb, a, dq, 1536, q, 1);
  10091. }
  10092. if (err == MP_OKAY) {
  10093. c = sp_3072_sub_in_place_48(tmpa, tmpb);
  10094. c += sp_3072_cond_add_48(tmpa, tmpa, p, c);
  10095. sp_3072_cond_add_48(tmpa, tmpa, p, c);
  10096. sp_3072_from_mp(qi, 48, qim);
  10097. sp_3072_mul_48(tmpa, tmpa, qi);
  10098. err = sp_3072_mod_48(tmpa, tmpa, p);
  10099. }
  10100. if (err == MP_OKAY) {
  10101. sp_3072_mul_48(tmpa, q, tmpa);
  10102. XMEMSET(&tmpb[48], 0, sizeof(sp_digit) * 48);
  10103. sp_3072_add_96(r, tmpb, tmpa);
  10104. sp_3072_to_bin_96(r, out);
  10105. *outLen = 384;
  10106. }
  10107. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  10108. if (a != NULL)
  10109. #endif
  10110. {
  10111. ForceZero(a, sizeof(sp_digit) * 48 * 11);
  10112. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  10113. XFREE(a, NULL, DYNAMIC_TYPE_RSA);
  10114. #endif
  10115. }
  10116. #endif /* SP_RSA_PRIVATE_EXP_D || RSA_LOW_MEM */
  10117. return err;
  10118. }
  10119. #endif /* WOLFSSL_RSA_PUBLIC_ONLY */
  10120. #endif /* WOLFSSL_HAVE_SP_RSA */
  10121. #if defined(WOLFSSL_HAVE_SP_DH) || (defined(WOLFSSL_HAVE_SP_RSA) && \
  10122. !defined(WOLFSSL_RSA_PUBLIC_ONLY))
  10123. /* Convert an array of sp_digit to an mp_int.
  10124. *
  10125. * a A single precision integer.
  10126. * r A multi-precision integer.
  10127. */
  10128. static int sp_3072_to_mp(const sp_digit* a, mp_int* r)
  10129. {
  10130. int err;
  10131. err = mp_grow(r, (3072 + DIGIT_BIT - 1) / DIGIT_BIT);
  10132. if (err == MP_OKAY) { /*lint !e774 case where err is always MP_OKAY*/
  10133. #if DIGIT_BIT == 32
  10134. XMEMCPY(r->dp, a, sizeof(sp_digit) * 96);
  10135. r->used = 96;
  10136. mp_clamp(r);
  10137. #elif DIGIT_BIT < 32
  10138. int i;
  10139. int j = 0;
  10140. int s = 0;
  10141. r->dp[0] = 0;
  10142. for (i = 0; i < 96; i++) {
  10143. r->dp[j] |= (mp_digit)(a[i] << s);
  10144. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  10145. s = DIGIT_BIT - s;
  10146. r->dp[++j] = (mp_digit)(a[i] >> s);
  10147. while (s + DIGIT_BIT <= 32) {
  10148. s += DIGIT_BIT;
  10149. r->dp[j++] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  10150. if (s == SP_WORD_SIZE) {
  10151. r->dp[j] = 0;
  10152. }
  10153. else {
  10154. r->dp[j] = (mp_digit)(a[i] >> s);
  10155. }
  10156. }
  10157. s = 32 - s;
  10158. }
  10159. r->used = (3072 + DIGIT_BIT - 1) / DIGIT_BIT;
  10160. mp_clamp(r);
  10161. #else
  10162. int i;
  10163. int j = 0;
  10164. int s = 0;
  10165. r->dp[0] = 0;
  10166. for (i = 0; i < 96; i++) {
  10167. r->dp[j] |= ((mp_digit)a[i]) << s;
  10168. if (s + 32 >= DIGIT_BIT) {
  10169. #if DIGIT_BIT != 32 && DIGIT_BIT != 64
  10170. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  10171. #endif
  10172. s = DIGIT_BIT - s;
  10173. r->dp[++j] = a[i] >> s;
  10174. s = 32 - s;
  10175. }
  10176. else {
  10177. s += 32;
  10178. }
  10179. }
  10180. r->used = (3072 + DIGIT_BIT - 1) / DIGIT_BIT;
  10181. mp_clamp(r);
  10182. #endif
  10183. }
  10184. return err;
  10185. }
  10186. /* Perform the modular exponentiation for Diffie-Hellman.
  10187. *
  10188. * base Base. MP integer.
  10189. * exp Exponent. MP integer.
  10190. * mod Modulus. MP integer.
  10191. * res Result. MP integer.
  10192. * returns 0 on success, MP_READ_E if there are too many bytes in an array
  10193. * and MEMORY_E if memory allocation fails.
  10194. */
  10195. int sp_ModExp_3072(const mp_int* base, const mp_int* exp, const mp_int* mod,
  10196. mp_int* res)
  10197. {
  10198. int err = MP_OKAY;
  10199. sp_digit b[192];
  10200. sp_digit e[96];
  10201. sp_digit m[96];
  10202. sp_digit* r = b;
  10203. int expBits = mp_count_bits(exp);
  10204. if (mp_count_bits(base) > 3072) {
  10205. err = MP_READ_E;
  10206. }
  10207. else if (expBits > 3072) {
  10208. err = MP_READ_E;
  10209. }
  10210. else if (mp_count_bits(mod) != 3072) {
  10211. err = MP_READ_E;
  10212. }
  10213. else if (mp_iseven(mod)) {
  10214. err = MP_VAL;
  10215. }
  10216. if (err == MP_OKAY) {
  10217. sp_3072_from_mp(b, 96, base);
  10218. sp_3072_from_mp(e, 96, exp);
  10219. sp_3072_from_mp(m, 96, mod);
  10220. err = sp_3072_mod_exp_96(r, b, e, expBits, m, 0);
  10221. }
  10222. if (err == MP_OKAY) {
  10223. err = sp_3072_to_mp(r, res);
  10224. }
  10225. XMEMSET(e, 0, sizeof(e));
  10226. return err;
  10227. }
  10228. #ifdef WOLFSSL_HAVE_SP_DH
  10229. #ifdef HAVE_FFDHE_3072
  10230. static void sp_3072_lshift_96(sp_digit* r, const sp_digit* a, byte n)
  10231. {
  10232. __asm__ __volatile__ (
  10233. "mov r6, #31\n\t"
  10234. "sub r6, r6, %[n]\n\t"
  10235. "add %[a], %[a], #320\n\t"
  10236. "add %[r], %[r], #320\n\t"
  10237. "ldr r3, [%[a], #60]\n\t"
  10238. "lsr r4, r3, #1\n\t"
  10239. "lsl r3, r3, %[n]\n\t"
  10240. "lsr r4, r4, r6\n\t"
  10241. "ldr r2, [%[a], #56]\n\t"
  10242. "str r4, [%[r], #64]\n\t"
  10243. "lsr r5, r2, #1\n\t"
  10244. "lsl r2, r2, %[n]\n\t"
  10245. "lsr r5, r5, r6\n\t"
  10246. "orr r3, r3, r5\n\t"
  10247. "ldr r4, [%[a], #52]\n\t"
  10248. "str r3, [%[r], #60]\n\t"
  10249. "lsr r5, r4, #1\n\t"
  10250. "lsl r4, r4, %[n]\n\t"
  10251. "lsr r5, r5, r6\n\t"
  10252. "orr r2, r2, r5\n\t"
  10253. "ldr r3, [%[a], #48]\n\t"
  10254. "str r2, [%[r], #56]\n\t"
  10255. "lsr r5, r3, #1\n\t"
  10256. "lsl r3, r3, %[n]\n\t"
  10257. "lsr r5, r5, r6\n\t"
  10258. "orr r4, r4, r5\n\t"
  10259. "ldr r2, [%[a], #44]\n\t"
  10260. "str r4, [%[r], #52]\n\t"
  10261. "lsr r5, r2, #1\n\t"
  10262. "lsl r2, r2, %[n]\n\t"
  10263. "lsr r5, r5, r6\n\t"
  10264. "orr r3, r3, r5\n\t"
  10265. "ldr r4, [%[a], #40]\n\t"
  10266. "str r3, [%[r], #48]\n\t"
  10267. "lsr r5, r4, #1\n\t"
  10268. "lsl r4, r4, %[n]\n\t"
  10269. "lsr r5, r5, r6\n\t"
  10270. "orr r2, r2, r5\n\t"
  10271. "ldr r3, [%[a], #36]\n\t"
  10272. "str r2, [%[r], #44]\n\t"
  10273. "lsr r5, r3, #1\n\t"
  10274. "lsl r3, r3, %[n]\n\t"
  10275. "lsr r5, r5, r6\n\t"
  10276. "orr r4, r4, r5\n\t"
  10277. "ldr r2, [%[a], #32]\n\t"
  10278. "str r4, [%[r], #40]\n\t"
  10279. "lsr r5, r2, #1\n\t"
  10280. "lsl r2, r2, %[n]\n\t"
  10281. "lsr r5, r5, r6\n\t"
  10282. "orr r3, r3, r5\n\t"
  10283. "ldr r4, [%[a], #28]\n\t"
  10284. "str r3, [%[r], #36]\n\t"
  10285. "lsr r5, r4, #1\n\t"
  10286. "lsl r4, r4, %[n]\n\t"
  10287. "lsr r5, r5, r6\n\t"
  10288. "orr r2, r2, r5\n\t"
  10289. "ldr r3, [%[a], #24]\n\t"
  10290. "str r2, [%[r], #32]\n\t"
  10291. "lsr r5, r3, #1\n\t"
  10292. "lsl r3, r3, %[n]\n\t"
  10293. "lsr r5, r5, r6\n\t"
  10294. "orr r4, r4, r5\n\t"
  10295. "ldr r2, [%[a], #20]\n\t"
  10296. "str r4, [%[r], #28]\n\t"
  10297. "lsr r5, r2, #1\n\t"
  10298. "lsl r2, r2, %[n]\n\t"
  10299. "lsr r5, r5, r6\n\t"
  10300. "orr r3, r3, r5\n\t"
  10301. "ldr r4, [%[a], #16]\n\t"
  10302. "str r3, [%[r], #24]\n\t"
  10303. "lsr r5, r4, #1\n\t"
  10304. "lsl r4, r4, %[n]\n\t"
  10305. "lsr r5, r5, r6\n\t"
  10306. "orr r2, r2, r5\n\t"
  10307. "ldr r3, [%[a], #12]\n\t"
  10308. "str r2, [%[r], #20]\n\t"
  10309. "lsr r5, r3, #1\n\t"
  10310. "lsl r3, r3, %[n]\n\t"
  10311. "lsr r5, r5, r6\n\t"
  10312. "orr r4, r4, r5\n\t"
  10313. "ldr r2, [%[a], #8]\n\t"
  10314. "str r4, [%[r], #16]\n\t"
  10315. "lsr r5, r2, #1\n\t"
  10316. "lsl r2, r2, %[n]\n\t"
  10317. "lsr r5, r5, r6\n\t"
  10318. "orr r3, r3, r5\n\t"
  10319. "ldr r4, [%[a], #4]\n\t"
  10320. "str r3, [%[r], #12]\n\t"
  10321. "lsr r5, r4, #1\n\t"
  10322. "lsl r4, r4, %[n]\n\t"
  10323. "lsr r5, r5, r6\n\t"
  10324. "orr r2, r2, r5\n\t"
  10325. "ldr r3, [%[a], #0]\n\t"
  10326. "str r2, [%[r], #8]\n\t"
  10327. "lsr r5, r3, #1\n\t"
  10328. "lsl r3, r3, %[n]\n\t"
  10329. "lsr r5, r5, r6\n\t"
  10330. "orr r4, r4, r5\n\t"
  10331. "sub %[a], %[a], #64\n\t"
  10332. "sub %[r], %[r], #64\n\t"
  10333. "ldr r2, [%[a], #60]\n\t"
  10334. "str r4, [%[r], #68]\n\t"
  10335. "lsr r5, r2, #1\n\t"
  10336. "lsl r2, r2, %[n]\n\t"
  10337. "lsr r5, r5, r6\n\t"
  10338. "orr r3, r3, r5\n\t"
  10339. "ldr r4, [%[a], #56]\n\t"
  10340. "str r3, [%[r], #64]\n\t"
  10341. "lsr r5, r4, #1\n\t"
  10342. "lsl r4, r4, %[n]\n\t"
  10343. "lsr r5, r5, r6\n\t"
  10344. "orr r2, r2, r5\n\t"
  10345. "ldr r3, [%[a], #52]\n\t"
  10346. "str r2, [%[r], #60]\n\t"
  10347. "lsr r5, r3, #1\n\t"
  10348. "lsl r3, r3, %[n]\n\t"
  10349. "lsr r5, r5, r6\n\t"
  10350. "orr r4, r4, r5\n\t"
  10351. "ldr r2, [%[a], #48]\n\t"
  10352. "str r4, [%[r], #56]\n\t"
  10353. "lsr r5, r2, #1\n\t"
  10354. "lsl r2, r2, %[n]\n\t"
  10355. "lsr r5, r5, r6\n\t"
  10356. "orr r3, r3, r5\n\t"
  10357. "ldr r4, [%[a], #44]\n\t"
  10358. "str r3, [%[r], #52]\n\t"
  10359. "lsr r5, r4, #1\n\t"
  10360. "lsl r4, r4, %[n]\n\t"
  10361. "lsr r5, r5, r6\n\t"
  10362. "orr r2, r2, r5\n\t"
  10363. "ldr r3, [%[a], #40]\n\t"
  10364. "str r2, [%[r], #48]\n\t"
  10365. "lsr r5, r3, #1\n\t"
  10366. "lsl r3, r3, %[n]\n\t"
  10367. "lsr r5, r5, r6\n\t"
  10368. "orr r4, r4, r5\n\t"
  10369. "ldr r2, [%[a], #36]\n\t"
  10370. "str r4, [%[r], #44]\n\t"
  10371. "lsr r5, r2, #1\n\t"
  10372. "lsl r2, r2, %[n]\n\t"
  10373. "lsr r5, r5, r6\n\t"
  10374. "orr r3, r3, r5\n\t"
  10375. "ldr r4, [%[a], #32]\n\t"
  10376. "str r3, [%[r], #40]\n\t"
  10377. "lsr r5, r4, #1\n\t"
  10378. "lsl r4, r4, %[n]\n\t"
  10379. "lsr r5, r5, r6\n\t"
  10380. "orr r2, r2, r5\n\t"
  10381. "ldr r3, [%[a], #28]\n\t"
  10382. "str r2, [%[r], #36]\n\t"
  10383. "lsr r5, r3, #1\n\t"
  10384. "lsl r3, r3, %[n]\n\t"
  10385. "lsr r5, r5, r6\n\t"
  10386. "orr r4, r4, r5\n\t"
  10387. "ldr r2, [%[a], #24]\n\t"
  10388. "str r4, [%[r], #32]\n\t"
  10389. "lsr r5, r2, #1\n\t"
  10390. "lsl r2, r2, %[n]\n\t"
  10391. "lsr r5, r5, r6\n\t"
  10392. "orr r3, r3, r5\n\t"
  10393. "ldr r4, [%[a], #20]\n\t"
  10394. "str r3, [%[r], #28]\n\t"
  10395. "lsr r5, r4, #1\n\t"
  10396. "lsl r4, r4, %[n]\n\t"
  10397. "lsr r5, r5, r6\n\t"
  10398. "orr r2, r2, r5\n\t"
  10399. "ldr r3, [%[a], #16]\n\t"
  10400. "str r2, [%[r], #24]\n\t"
  10401. "lsr r5, r3, #1\n\t"
  10402. "lsl r3, r3, %[n]\n\t"
  10403. "lsr r5, r5, r6\n\t"
  10404. "orr r4, r4, r5\n\t"
  10405. "ldr r2, [%[a], #12]\n\t"
  10406. "str r4, [%[r], #20]\n\t"
  10407. "lsr r5, r2, #1\n\t"
  10408. "lsl r2, r2, %[n]\n\t"
  10409. "lsr r5, r5, r6\n\t"
  10410. "orr r3, r3, r5\n\t"
  10411. "ldr r4, [%[a], #8]\n\t"
  10412. "str r3, [%[r], #16]\n\t"
  10413. "lsr r5, r4, #1\n\t"
  10414. "lsl r4, r4, %[n]\n\t"
  10415. "lsr r5, r5, r6\n\t"
  10416. "orr r2, r2, r5\n\t"
  10417. "ldr r3, [%[a], #4]\n\t"
  10418. "str r2, [%[r], #12]\n\t"
  10419. "lsr r5, r3, #1\n\t"
  10420. "lsl r3, r3, %[n]\n\t"
  10421. "lsr r5, r5, r6\n\t"
  10422. "orr r4, r4, r5\n\t"
  10423. "ldr r2, [%[a], #0]\n\t"
  10424. "str r4, [%[r], #8]\n\t"
  10425. "lsr r5, r2, #1\n\t"
  10426. "lsl r2, r2, %[n]\n\t"
  10427. "lsr r5, r5, r6\n\t"
  10428. "orr r3, r3, r5\n\t"
  10429. "sub %[a], %[a], #64\n\t"
  10430. "sub %[r], %[r], #64\n\t"
  10431. "ldr r4, [%[a], #60]\n\t"
  10432. "str r3, [%[r], #68]\n\t"
  10433. "lsr r5, r4, #1\n\t"
  10434. "lsl r4, r4, %[n]\n\t"
  10435. "lsr r5, r5, r6\n\t"
  10436. "orr r2, r2, r5\n\t"
  10437. "ldr r3, [%[a], #56]\n\t"
  10438. "str r2, [%[r], #64]\n\t"
  10439. "lsr r5, r3, #1\n\t"
  10440. "lsl r3, r3, %[n]\n\t"
  10441. "lsr r5, r5, r6\n\t"
  10442. "orr r4, r4, r5\n\t"
  10443. "ldr r2, [%[a], #52]\n\t"
  10444. "str r4, [%[r], #60]\n\t"
  10445. "lsr r5, r2, #1\n\t"
  10446. "lsl r2, r2, %[n]\n\t"
  10447. "lsr r5, r5, r6\n\t"
  10448. "orr r3, r3, r5\n\t"
  10449. "ldr r4, [%[a], #48]\n\t"
  10450. "str r3, [%[r], #56]\n\t"
  10451. "lsr r5, r4, #1\n\t"
  10452. "lsl r4, r4, %[n]\n\t"
  10453. "lsr r5, r5, r6\n\t"
  10454. "orr r2, r2, r5\n\t"
  10455. "ldr r3, [%[a], #44]\n\t"
  10456. "str r2, [%[r], #52]\n\t"
  10457. "lsr r5, r3, #1\n\t"
  10458. "lsl r3, r3, %[n]\n\t"
  10459. "lsr r5, r5, r6\n\t"
  10460. "orr r4, r4, r5\n\t"
  10461. "ldr r2, [%[a], #40]\n\t"
  10462. "str r4, [%[r], #48]\n\t"
  10463. "lsr r5, r2, #1\n\t"
  10464. "lsl r2, r2, %[n]\n\t"
  10465. "lsr r5, r5, r6\n\t"
  10466. "orr r3, r3, r5\n\t"
  10467. "ldr r4, [%[a], #36]\n\t"
  10468. "str r3, [%[r], #44]\n\t"
  10469. "lsr r5, r4, #1\n\t"
  10470. "lsl r4, r4, %[n]\n\t"
  10471. "lsr r5, r5, r6\n\t"
  10472. "orr r2, r2, r5\n\t"
  10473. "ldr r3, [%[a], #32]\n\t"
  10474. "str r2, [%[r], #40]\n\t"
  10475. "lsr r5, r3, #1\n\t"
  10476. "lsl r3, r3, %[n]\n\t"
  10477. "lsr r5, r5, r6\n\t"
  10478. "orr r4, r4, r5\n\t"
  10479. "ldr r2, [%[a], #28]\n\t"
  10480. "str r4, [%[r], #36]\n\t"
  10481. "lsr r5, r2, #1\n\t"
  10482. "lsl r2, r2, %[n]\n\t"
  10483. "lsr r5, r5, r6\n\t"
  10484. "orr r3, r3, r5\n\t"
  10485. "ldr r4, [%[a], #24]\n\t"
  10486. "str r3, [%[r], #32]\n\t"
  10487. "lsr r5, r4, #1\n\t"
  10488. "lsl r4, r4, %[n]\n\t"
  10489. "lsr r5, r5, r6\n\t"
  10490. "orr r2, r2, r5\n\t"
  10491. "ldr r3, [%[a], #20]\n\t"
  10492. "str r2, [%[r], #28]\n\t"
  10493. "lsr r5, r3, #1\n\t"
  10494. "lsl r3, r3, %[n]\n\t"
  10495. "lsr r5, r5, r6\n\t"
  10496. "orr r4, r4, r5\n\t"
  10497. "ldr r2, [%[a], #16]\n\t"
  10498. "str r4, [%[r], #24]\n\t"
  10499. "lsr r5, r2, #1\n\t"
  10500. "lsl r2, r2, %[n]\n\t"
  10501. "lsr r5, r5, r6\n\t"
  10502. "orr r3, r3, r5\n\t"
  10503. "ldr r4, [%[a], #12]\n\t"
  10504. "str r3, [%[r], #20]\n\t"
  10505. "lsr r5, r4, #1\n\t"
  10506. "lsl r4, r4, %[n]\n\t"
  10507. "lsr r5, r5, r6\n\t"
  10508. "orr r2, r2, r5\n\t"
  10509. "ldr r3, [%[a], #8]\n\t"
  10510. "str r2, [%[r], #16]\n\t"
  10511. "lsr r5, r3, #1\n\t"
  10512. "lsl r3, r3, %[n]\n\t"
  10513. "lsr r5, r5, r6\n\t"
  10514. "orr r4, r4, r5\n\t"
  10515. "ldr r2, [%[a], #4]\n\t"
  10516. "str r4, [%[r], #12]\n\t"
  10517. "lsr r5, r2, #1\n\t"
  10518. "lsl r2, r2, %[n]\n\t"
  10519. "lsr r5, r5, r6\n\t"
  10520. "orr r3, r3, r5\n\t"
  10521. "ldr r4, [%[a], #0]\n\t"
  10522. "str r3, [%[r], #8]\n\t"
  10523. "lsr r5, r4, #1\n\t"
  10524. "lsl r4, r4, %[n]\n\t"
  10525. "lsr r5, r5, r6\n\t"
  10526. "orr r2, r2, r5\n\t"
  10527. "sub %[a], %[a], #64\n\t"
  10528. "sub %[r], %[r], #64\n\t"
  10529. "ldr r3, [%[a], #60]\n\t"
  10530. "str r2, [%[r], #68]\n\t"
  10531. "lsr r5, r3, #1\n\t"
  10532. "lsl r3, r3, %[n]\n\t"
  10533. "lsr r5, r5, r6\n\t"
  10534. "orr r4, r4, r5\n\t"
  10535. "ldr r2, [%[a], #56]\n\t"
  10536. "str r4, [%[r], #64]\n\t"
  10537. "lsr r5, r2, #1\n\t"
  10538. "lsl r2, r2, %[n]\n\t"
  10539. "lsr r5, r5, r6\n\t"
  10540. "orr r3, r3, r5\n\t"
  10541. "ldr r4, [%[a], #52]\n\t"
  10542. "str r3, [%[r], #60]\n\t"
  10543. "lsr r5, r4, #1\n\t"
  10544. "lsl r4, r4, %[n]\n\t"
  10545. "lsr r5, r5, r6\n\t"
  10546. "orr r2, r2, r5\n\t"
  10547. "ldr r3, [%[a], #48]\n\t"
  10548. "str r2, [%[r], #56]\n\t"
  10549. "lsr r5, r3, #1\n\t"
  10550. "lsl r3, r3, %[n]\n\t"
  10551. "lsr r5, r5, r6\n\t"
  10552. "orr r4, r4, r5\n\t"
  10553. "ldr r2, [%[a], #44]\n\t"
  10554. "str r4, [%[r], #52]\n\t"
  10555. "lsr r5, r2, #1\n\t"
  10556. "lsl r2, r2, %[n]\n\t"
  10557. "lsr r5, r5, r6\n\t"
  10558. "orr r3, r3, r5\n\t"
  10559. "ldr r4, [%[a], #40]\n\t"
  10560. "str r3, [%[r], #48]\n\t"
  10561. "lsr r5, r4, #1\n\t"
  10562. "lsl r4, r4, %[n]\n\t"
  10563. "lsr r5, r5, r6\n\t"
  10564. "orr r2, r2, r5\n\t"
  10565. "ldr r3, [%[a], #36]\n\t"
  10566. "str r2, [%[r], #44]\n\t"
  10567. "lsr r5, r3, #1\n\t"
  10568. "lsl r3, r3, %[n]\n\t"
  10569. "lsr r5, r5, r6\n\t"
  10570. "orr r4, r4, r5\n\t"
  10571. "ldr r2, [%[a], #32]\n\t"
  10572. "str r4, [%[r], #40]\n\t"
  10573. "lsr r5, r2, #1\n\t"
  10574. "lsl r2, r2, %[n]\n\t"
  10575. "lsr r5, r5, r6\n\t"
  10576. "orr r3, r3, r5\n\t"
  10577. "ldr r4, [%[a], #28]\n\t"
  10578. "str r3, [%[r], #36]\n\t"
  10579. "lsr r5, r4, #1\n\t"
  10580. "lsl r4, r4, %[n]\n\t"
  10581. "lsr r5, r5, r6\n\t"
  10582. "orr r2, r2, r5\n\t"
  10583. "ldr r3, [%[a], #24]\n\t"
  10584. "str r2, [%[r], #32]\n\t"
  10585. "lsr r5, r3, #1\n\t"
  10586. "lsl r3, r3, %[n]\n\t"
  10587. "lsr r5, r5, r6\n\t"
  10588. "orr r4, r4, r5\n\t"
  10589. "ldr r2, [%[a], #20]\n\t"
  10590. "str r4, [%[r], #28]\n\t"
  10591. "lsr r5, r2, #1\n\t"
  10592. "lsl r2, r2, %[n]\n\t"
  10593. "lsr r5, r5, r6\n\t"
  10594. "orr r3, r3, r5\n\t"
  10595. "ldr r4, [%[a], #16]\n\t"
  10596. "str r3, [%[r], #24]\n\t"
  10597. "lsr r5, r4, #1\n\t"
  10598. "lsl r4, r4, %[n]\n\t"
  10599. "lsr r5, r5, r6\n\t"
  10600. "orr r2, r2, r5\n\t"
  10601. "ldr r3, [%[a], #12]\n\t"
  10602. "str r2, [%[r], #20]\n\t"
  10603. "lsr r5, r3, #1\n\t"
  10604. "lsl r3, r3, %[n]\n\t"
  10605. "lsr r5, r5, r6\n\t"
  10606. "orr r4, r4, r5\n\t"
  10607. "ldr r2, [%[a], #8]\n\t"
  10608. "str r4, [%[r], #16]\n\t"
  10609. "lsr r5, r2, #1\n\t"
  10610. "lsl r2, r2, %[n]\n\t"
  10611. "lsr r5, r5, r6\n\t"
  10612. "orr r3, r3, r5\n\t"
  10613. "ldr r4, [%[a], #4]\n\t"
  10614. "str r3, [%[r], #12]\n\t"
  10615. "lsr r5, r4, #1\n\t"
  10616. "lsl r4, r4, %[n]\n\t"
  10617. "lsr r5, r5, r6\n\t"
  10618. "orr r2, r2, r5\n\t"
  10619. "ldr r3, [%[a], #0]\n\t"
  10620. "str r2, [%[r], #8]\n\t"
  10621. "lsr r5, r3, #1\n\t"
  10622. "lsl r3, r3, %[n]\n\t"
  10623. "lsr r5, r5, r6\n\t"
  10624. "orr r4, r4, r5\n\t"
  10625. "sub %[a], %[a], #64\n\t"
  10626. "sub %[r], %[r], #64\n\t"
  10627. "ldr r2, [%[a], #60]\n\t"
  10628. "str r4, [%[r], #68]\n\t"
  10629. "lsr r5, r2, #1\n\t"
  10630. "lsl r2, r2, %[n]\n\t"
  10631. "lsr r5, r5, r6\n\t"
  10632. "orr r3, r3, r5\n\t"
  10633. "ldr r4, [%[a], #56]\n\t"
  10634. "str r3, [%[r], #64]\n\t"
  10635. "lsr r5, r4, #1\n\t"
  10636. "lsl r4, r4, %[n]\n\t"
  10637. "lsr r5, r5, r6\n\t"
  10638. "orr r2, r2, r5\n\t"
  10639. "ldr r3, [%[a], #52]\n\t"
  10640. "str r2, [%[r], #60]\n\t"
  10641. "lsr r5, r3, #1\n\t"
  10642. "lsl r3, r3, %[n]\n\t"
  10643. "lsr r5, r5, r6\n\t"
  10644. "orr r4, r4, r5\n\t"
  10645. "ldr r2, [%[a], #48]\n\t"
  10646. "str r4, [%[r], #56]\n\t"
  10647. "lsr r5, r2, #1\n\t"
  10648. "lsl r2, r2, %[n]\n\t"
  10649. "lsr r5, r5, r6\n\t"
  10650. "orr r3, r3, r5\n\t"
  10651. "ldr r4, [%[a], #44]\n\t"
  10652. "str r3, [%[r], #52]\n\t"
  10653. "lsr r5, r4, #1\n\t"
  10654. "lsl r4, r4, %[n]\n\t"
  10655. "lsr r5, r5, r6\n\t"
  10656. "orr r2, r2, r5\n\t"
  10657. "ldr r3, [%[a], #40]\n\t"
  10658. "str r2, [%[r], #48]\n\t"
  10659. "lsr r5, r3, #1\n\t"
  10660. "lsl r3, r3, %[n]\n\t"
  10661. "lsr r5, r5, r6\n\t"
  10662. "orr r4, r4, r5\n\t"
  10663. "ldr r2, [%[a], #36]\n\t"
  10664. "str r4, [%[r], #44]\n\t"
  10665. "lsr r5, r2, #1\n\t"
  10666. "lsl r2, r2, %[n]\n\t"
  10667. "lsr r5, r5, r6\n\t"
  10668. "orr r3, r3, r5\n\t"
  10669. "ldr r4, [%[a], #32]\n\t"
  10670. "str r3, [%[r], #40]\n\t"
  10671. "lsr r5, r4, #1\n\t"
  10672. "lsl r4, r4, %[n]\n\t"
  10673. "lsr r5, r5, r6\n\t"
  10674. "orr r2, r2, r5\n\t"
  10675. "ldr r3, [%[a], #28]\n\t"
  10676. "str r2, [%[r], #36]\n\t"
  10677. "lsr r5, r3, #1\n\t"
  10678. "lsl r3, r3, %[n]\n\t"
  10679. "lsr r5, r5, r6\n\t"
  10680. "orr r4, r4, r5\n\t"
  10681. "ldr r2, [%[a], #24]\n\t"
  10682. "str r4, [%[r], #32]\n\t"
  10683. "lsr r5, r2, #1\n\t"
  10684. "lsl r2, r2, %[n]\n\t"
  10685. "lsr r5, r5, r6\n\t"
  10686. "orr r3, r3, r5\n\t"
  10687. "ldr r4, [%[a], #20]\n\t"
  10688. "str r3, [%[r], #28]\n\t"
  10689. "lsr r5, r4, #1\n\t"
  10690. "lsl r4, r4, %[n]\n\t"
  10691. "lsr r5, r5, r6\n\t"
  10692. "orr r2, r2, r5\n\t"
  10693. "ldr r3, [%[a], #16]\n\t"
  10694. "str r2, [%[r], #24]\n\t"
  10695. "lsr r5, r3, #1\n\t"
  10696. "lsl r3, r3, %[n]\n\t"
  10697. "lsr r5, r5, r6\n\t"
  10698. "orr r4, r4, r5\n\t"
  10699. "ldr r2, [%[a], #12]\n\t"
  10700. "str r4, [%[r], #20]\n\t"
  10701. "lsr r5, r2, #1\n\t"
  10702. "lsl r2, r2, %[n]\n\t"
  10703. "lsr r5, r5, r6\n\t"
  10704. "orr r3, r3, r5\n\t"
  10705. "ldr r4, [%[a], #8]\n\t"
  10706. "str r3, [%[r], #16]\n\t"
  10707. "lsr r5, r4, #1\n\t"
  10708. "lsl r4, r4, %[n]\n\t"
  10709. "lsr r5, r5, r6\n\t"
  10710. "orr r2, r2, r5\n\t"
  10711. "ldr r3, [%[a], #4]\n\t"
  10712. "str r2, [%[r], #12]\n\t"
  10713. "lsr r5, r3, #1\n\t"
  10714. "lsl r3, r3, %[n]\n\t"
  10715. "lsr r5, r5, r6\n\t"
  10716. "orr r4, r4, r5\n\t"
  10717. "ldr r2, [%[a], #0]\n\t"
  10718. "str r4, [%[r], #8]\n\t"
  10719. "lsr r5, r2, #1\n\t"
  10720. "lsl r2, r2, %[n]\n\t"
  10721. "lsr r5, r5, r6\n\t"
  10722. "orr r3, r3, r5\n\t"
  10723. "sub %[a], %[a], #64\n\t"
  10724. "sub %[r], %[r], #64\n\t"
  10725. "ldr r4, [%[a], #60]\n\t"
  10726. "str r3, [%[r], #68]\n\t"
  10727. "lsr r5, r4, #1\n\t"
  10728. "lsl r4, r4, %[n]\n\t"
  10729. "lsr r5, r5, r6\n\t"
  10730. "orr r2, r2, r5\n\t"
  10731. "ldr r3, [%[a], #56]\n\t"
  10732. "str r2, [%[r], #64]\n\t"
  10733. "lsr r5, r3, #1\n\t"
  10734. "lsl r3, r3, %[n]\n\t"
  10735. "lsr r5, r5, r6\n\t"
  10736. "orr r4, r4, r5\n\t"
  10737. "ldr r2, [%[a], #52]\n\t"
  10738. "str r4, [%[r], #60]\n\t"
  10739. "lsr r5, r2, #1\n\t"
  10740. "lsl r2, r2, %[n]\n\t"
  10741. "lsr r5, r5, r6\n\t"
  10742. "orr r3, r3, r5\n\t"
  10743. "ldr r4, [%[a], #48]\n\t"
  10744. "str r3, [%[r], #56]\n\t"
  10745. "lsr r5, r4, #1\n\t"
  10746. "lsl r4, r4, %[n]\n\t"
  10747. "lsr r5, r5, r6\n\t"
  10748. "orr r2, r2, r5\n\t"
  10749. "ldr r3, [%[a], #44]\n\t"
  10750. "str r2, [%[r], #52]\n\t"
  10751. "lsr r5, r3, #1\n\t"
  10752. "lsl r3, r3, %[n]\n\t"
  10753. "lsr r5, r5, r6\n\t"
  10754. "orr r4, r4, r5\n\t"
  10755. "ldr r2, [%[a], #40]\n\t"
  10756. "str r4, [%[r], #48]\n\t"
  10757. "lsr r5, r2, #1\n\t"
  10758. "lsl r2, r2, %[n]\n\t"
  10759. "lsr r5, r5, r6\n\t"
  10760. "orr r3, r3, r5\n\t"
  10761. "ldr r4, [%[a], #36]\n\t"
  10762. "str r3, [%[r], #44]\n\t"
  10763. "lsr r5, r4, #1\n\t"
  10764. "lsl r4, r4, %[n]\n\t"
  10765. "lsr r5, r5, r6\n\t"
  10766. "orr r2, r2, r5\n\t"
  10767. "ldr r3, [%[a], #32]\n\t"
  10768. "str r2, [%[r], #40]\n\t"
  10769. "lsr r5, r3, #1\n\t"
  10770. "lsl r3, r3, %[n]\n\t"
  10771. "lsr r5, r5, r6\n\t"
  10772. "orr r4, r4, r5\n\t"
  10773. "ldr r2, [%[a], #28]\n\t"
  10774. "str r4, [%[r], #36]\n\t"
  10775. "lsr r5, r2, #1\n\t"
  10776. "lsl r2, r2, %[n]\n\t"
  10777. "lsr r5, r5, r6\n\t"
  10778. "orr r3, r3, r5\n\t"
  10779. "ldr r4, [%[a], #24]\n\t"
  10780. "str r3, [%[r], #32]\n\t"
  10781. "lsr r5, r4, #1\n\t"
  10782. "lsl r4, r4, %[n]\n\t"
  10783. "lsr r5, r5, r6\n\t"
  10784. "orr r2, r2, r5\n\t"
  10785. "ldr r3, [%[a], #20]\n\t"
  10786. "str r2, [%[r], #28]\n\t"
  10787. "lsr r5, r3, #1\n\t"
  10788. "lsl r3, r3, %[n]\n\t"
  10789. "lsr r5, r5, r6\n\t"
  10790. "orr r4, r4, r5\n\t"
  10791. "ldr r2, [%[a], #16]\n\t"
  10792. "str r4, [%[r], #24]\n\t"
  10793. "lsr r5, r2, #1\n\t"
  10794. "lsl r2, r2, %[n]\n\t"
  10795. "lsr r5, r5, r6\n\t"
  10796. "orr r3, r3, r5\n\t"
  10797. "ldr r4, [%[a], #12]\n\t"
  10798. "str r3, [%[r], #20]\n\t"
  10799. "lsr r5, r4, #1\n\t"
  10800. "lsl r4, r4, %[n]\n\t"
  10801. "lsr r5, r5, r6\n\t"
  10802. "orr r2, r2, r5\n\t"
  10803. "ldr r3, [%[a], #8]\n\t"
  10804. "str r2, [%[r], #16]\n\t"
  10805. "lsr r5, r3, #1\n\t"
  10806. "lsl r3, r3, %[n]\n\t"
  10807. "lsr r5, r5, r6\n\t"
  10808. "orr r4, r4, r5\n\t"
  10809. "ldr r2, [%[a], #4]\n\t"
  10810. "str r4, [%[r], #12]\n\t"
  10811. "lsr r5, r2, #1\n\t"
  10812. "lsl r2, r2, %[n]\n\t"
  10813. "lsr r5, r5, r6\n\t"
  10814. "orr r3, r3, r5\n\t"
  10815. "ldr r4, [%[a], #0]\n\t"
  10816. "str r3, [%[r], #8]\n\t"
  10817. "lsr r5, r4, #1\n\t"
  10818. "lsl r4, r4, %[n]\n\t"
  10819. "lsr r5, r5, r6\n\t"
  10820. "orr r2, r2, r5\n\t"
  10821. "str r4, [%[r]]\n\t"
  10822. "str r2, [%[r], #4]\n\t"
  10823. :
  10824. : [r] "r" (r), [a] "r" (a), [n] "r" (n)
  10825. : "memory", "r2", "r3", "r4", "r5", "r6"
  10826. );
  10827. }
  10828. /* Modular exponentiate 2 to the e mod m. (r = 2^e mod m)
  10829. *
  10830. * r A single precision number that is the result of the operation.
  10831. * e A single precision number that is the exponent.
  10832. * bits The number of bits in the exponent.
  10833. * m A single precision number that is the modulus.
  10834. * returns 0 on success.
  10835. * returns MEMORY_E on dynamic memory allocation failure.
  10836. * returns MP_VAL when base is even.
  10837. */
  10838. static int sp_3072_mod_exp_2_96(sp_digit* r, const sp_digit* e, int bits,
  10839. const sp_digit* m)
  10840. {
  10841. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  10842. sp_digit* td = NULL;
  10843. #else
  10844. sp_digit td[289];
  10845. #endif
  10846. sp_digit* norm = NULL;
  10847. sp_digit* tmp = NULL;
  10848. sp_digit mp = 1;
  10849. sp_digit n;
  10850. sp_digit o;
  10851. sp_digit mask;
  10852. int i;
  10853. int c;
  10854. byte y;
  10855. int err = MP_OKAY;
  10856. if (bits == 0) {
  10857. err = MP_VAL;
  10858. }
  10859. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  10860. if (err == MP_OKAY) {
  10861. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * 289, NULL,
  10862. DYNAMIC_TYPE_TMP_BUFFER);
  10863. if (td == NULL)
  10864. err = MEMORY_E;
  10865. }
  10866. #endif
  10867. if (err == MP_OKAY) {
  10868. norm = td;
  10869. tmp = td + 192;
  10870. sp_3072_mont_setup(m, &mp);
  10871. sp_3072_mont_norm_96(norm, m);
  10872. i = (bits - 1) / 32;
  10873. n = e[i--];
  10874. c = bits & 31;
  10875. if (c == 0) {
  10876. c = 32;
  10877. }
  10878. c -= bits % 5;
  10879. if (c == 32) {
  10880. c = 27;
  10881. }
  10882. if (c < 0) {
  10883. /* Number of bits in top word is less than number needed. */
  10884. c = -c;
  10885. y = (byte)(n << c);
  10886. n = e[i--];
  10887. y |= (byte)(n >> (64 - c));
  10888. n <<= c;
  10889. c = 64 - c;
  10890. }
  10891. else if (c == 0) {
  10892. /* All bits in top word used. */
  10893. y = (byte)n;
  10894. }
  10895. else {
  10896. y = (byte)(n >> c);
  10897. n <<= 32 - c;
  10898. }
  10899. sp_3072_lshift_96(r, norm, y);
  10900. for (; i>=0 || c>=5; ) {
  10901. if (c == 0) {
  10902. n = e[i--];
  10903. y = (byte)(n >> 27);
  10904. n <<= 5;
  10905. c = 27;
  10906. }
  10907. else if (c < 5) {
  10908. y = (byte)(n >> 27);
  10909. n = e[i--];
  10910. c = 5 - c;
  10911. y |= (byte)(n >> (32 - c));
  10912. n <<= c;
  10913. c = 32 - c;
  10914. }
  10915. else {
  10916. y = (byte)((n >> 27) & 0x1f);
  10917. n <<= 5;
  10918. c -= 5;
  10919. }
  10920. sp_3072_mont_sqr_96(r, r, m, mp);
  10921. sp_3072_mont_sqr_96(r, r, m, mp);
  10922. sp_3072_mont_sqr_96(r, r, m, mp);
  10923. sp_3072_mont_sqr_96(r, r, m, mp);
  10924. sp_3072_mont_sqr_96(r, r, m, mp);
  10925. sp_3072_lshift_96(r, r, y);
  10926. sp_3072_mul_d_96(tmp, norm, r[96]);
  10927. r[96] = 0;
  10928. o = sp_3072_add_96(r, r, tmp);
  10929. sp_3072_cond_sub_96(r, r, m, (sp_digit)0 - o);
  10930. }
  10931. XMEMSET(&r[96], 0, sizeof(sp_digit) * 96U);
  10932. sp_3072_mont_reduce_96(r, m, mp);
  10933. mask = 0 - (sp_3072_cmp_96(r, m) >= 0);
  10934. sp_3072_cond_sub_96(r, r, m, mask);
  10935. }
  10936. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  10937. if (td != NULL)
  10938. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  10939. #endif
  10940. return err;
  10941. }
  10942. #endif /* HAVE_FFDHE_3072 */
  10943. /* Perform the modular exponentiation for Diffie-Hellman.
  10944. *
  10945. * base Base.
  10946. * exp Array of bytes that is the exponent.
  10947. * expLen Length of data, in bytes, in exponent.
  10948. * mod Modulus.
  10949. * out Buffer to hold big-endian bytes of exponentiation result.
  10950. * Must be at least 384 bytes long.
  10951. * outLen Length, in bytes, of exponentiation result.
  10952. * returns 0 on success, MP_READ_E if there are too many bytes in an array
  10953. * and MEMORY_E if memory allocation fails.
  10954. */
  10955. int sp_DhExp_3072(const mp_int* base, const byte* exp, word32 expLen,
  10956. const mp_int* mod, byte* out, word32* outLen)
  10957. {
  10958. int err = MP_OKAY;
  10959. sp_digit b[192];
  10960. sp_digit e[96];
  10961. sp_digit m[96];
  10962. sp_digit* r = b;
  10963. word32 i;
  10964. if (mp_count_bits(base) > 3072) {
  10965. err = MP_READ_E;
  10966. }
  10967. else if (expLen > 384) {
  10968. err = MP_READ_E;
  10969. }
  10970. else if (mp_count_bits(mod) != 3072) {
  10971. err = MP_READ_E;
  10972. }
  10973. else if (mp_iseven(mod)) {
  10974. err = MP_VAL;
  10975. }
  10976. if (err == MP_OKAY) {
  10977. sp_3072_from_mp(b, 96, base);
  10978. sp_3072_from_bin(e, 96, exp, expLen);
  10979. sp_3072_from_mp(m, 96, mod);
  10980. #ifdef HAVE_FFDHE_3072
  10981. if (base->used == 1 && base->dp[0] == 2 && m[95] == (sp_digit)-1)
  10982. err = sp_3072_mod_exp_2_96(r, e, expLen * 8, m);
  10983. else
  10984. #endif
  10985. err = sp_3072_mod_exp_96(r, b, e, expLen * 8, m, 0);
  10986. }
  10987. if (err == MP_OKAY) {
  10988. sp_3072_to_bin_96(r, out);
  10989. *outLen = 384;
  10990. for (i=0; i<384 && out[i] == 0; i++) {
  10991. /* Search for first non-zero. */
  10992. }
  10993. *outLen -= i;
  10994. XMEMMOVE(out, out + i, *outLen);
  10995. }
  10996. XMEMSET(e, 0, sizeof(e));
  10997. return err;
  10998. }
  10999. #endif /* WOLFSSL_HAVE_SP_DH */
  11000. /* Perform the modular exponentiation for Diffie-Hellman.
  11001. *
  11002. * base Base. MP integer.
  11003. * exp Exponent. MP integer.
  11004. * mod Modulus. MP integer.
  11005. * res Result. MP integer.
  11006. * returns 0 on success, MP_READ_E if there are too many bytes in an array
  11007. * and MEMORY_E if memory allocation fails.
  11008. */
  11009. int sp_ModExp_1536(const mp_int* base, const mp_int* exp, const mp_int* mod,
  11010. mp_int* res)
  11011. {
  11012. int err = MP_OKAY;
  11013. sp_digit b[96];
  11014. sp_digit e[48];
  11015. sp_digit m[48];
  11016. sp_digit* r = b;
  11017. int expBits = mp_count_bits(exp);
  11018. if (mp_count_bits(base) > 1536) {
  11019. err = MP_READ_E;
  11020. }
  11021. else if (expBits > 1536) {
  11022. err = MP_READ_E;
  11023. }
  11024. else if (mp_count_bits(mod) != 1536) {
  11025. err = MP_READ_E;
  11026. }
  11027. else if (mp_iseven(mod)) {
  11028. err = MP_VAL;
  11029. }
  11030. if (err == MP_OKAY) {
  11031. sp_3072_from_mp(b, 48, base);
  11032. sp_3072_from_mp(e, 48, exp);
  11033. sp_3072_from_mp(m, 48, mod);
  11034. err = sp_3072_mod_exp_48(r, b, e, expBits, m, 0);
  11035. }
  11036. if (err == MP_OKAY) {
  11037. XMEMSET(r + 48, 0, sizeof(*r) * 48U);
  11038. err = sp_3072_to_mp(r, res);
  11039. res->used = mod->used;
  11040. mp_clamp(res);
  11041. }
  11042. XMEMSET(e, 0, sizeof(e));
  11043. return err;
  11044. }
  11045. #endif /* WOLFSSL_HAVE_SP_DH | (WOLFSSL_HAVE_SP_RSA & !WOLFSSL_RSA_PUBLIC_ONLY) */
  11046. #endif /* !WOLFSSL_SP_NO_3072 */
  11047. #ifdef WOLFSSL_SP_4096
  11048. /* Read big endian unsigned byte array into r.
  11049. *
  11050. * r A single precision integer.
  11051. * size Maximum number of bytes to convert
  11052. * a Byte array.
  11053. * n Number of bytes in array to read.
  11054. */
  11055. static void sp_4096_from_bin(sp_digit* r, int size, const byte* a, int n)
  11056. {
  11057. int i;
  11058. int j;
  11059. byte* d;
  11060. for (i = n - 1,j = 0; i >= 3; i -= 4) {
  11061. r[j] = ((sp_digit)a[i - 0] << 0) |
  11062. ((sp_digit)a[i - 1] << 8) |
  11063. ((sp_digit)a[i - 2] << 16) |
  11064. ((sp_digit)a[i - 3] << 24);
  11065. j++;
  11066. }
  11067. if (i >= 0) {
  11068. r[j] = 0;
  11069. d = (byte*)r;
  11070. switch (i) {
  11071. case 2: d[n - 1 - 2] = a[2]; //fallthrough
  11072. case 1: d[n - 1 - 1] = a[1]; //fallthrough
  11073. case 0: d[n - 1 - 0] = a[0]; //fallthrough
  11074. }
  11075. j++;
  11076. }
  11077. for (; j < size; j++) {
  11078. r[j] = 0;
  11079. }
  11080. }
  11081. /* Convert an mp_int to an array of sp_digit.
  11082. *
  11083. * r A single precision integer.
  11084. * size Maximum number of bytes to convert
  11085. * a A multi-precision integer.
  11086. */
  11087. static void sp_4096_from_mp(sp_digit* r, int size, const mp_int* a)
  11088. {
  11089. #if DIGIT_BIT == 32
  11090. int j;
  11091. XMEMCPY(r, a->dp, sizeof(sp_digit) * a->used);
  11092. for (j = a->used; j < size; j++) {
  11093. r[j] = 0;
  11094. }
  11095. #elif DIGIT_BIT > 32
  11096. int i;
  11097. int j = 0;
  11098. word32 s = 0;
  11099. r[0] = 0;
  11100. for (i = 0; i < a->used && j < size; i++) {
  11101. r[j] |= ((sp_digit)a->dp[i] << s);
  11102. r[j] &= 0xffffffff;
  11103. s = 32U - s;
  11104. if (j + 1 >= size) {
  11105. break;
  11106. }
  11107. /* lint allow cast of mismatch word32 and mp_digit */
  11108. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  11109. while ((s + 32U) <= (word32)DIGIT_BIT) {
  11110. s += 32U;
  11111. r[j] &= 0xffffffff;
  11112. if (j + 1 >= size) {
  11113. break;
  11114. }
  11115. if (s < (word32)DIGIT_BIT) {
  11116. /* lint allow cast of mismatch word32 and mp_digit */
  11117. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  11118. }
  11119. else {
  11120. r[++j] = (sp_digit)0;
  11121. }
  11122. }
  11123. s = (word32)DIGIT_BIT - s;
  11124. }
  11125. for (j++; j < size; j++) {
  11126. r[j] = 0;
  11127. }
  11128. #else
  11129. int i;
  11130. int j = 0;
  11131. int s = 0;
  11132. r[0] = 0;
  11133. for (i = 0; i < a->used && j < size; i++) {
  11134. r[j] |= ((sp_digit)a->dp[i]) << s;
  11135. if (s + DIGIT_BIT >= 32) {
  11136. r[j] &= 0xffffffff;
  11137. if (j + 1 >= size) {
  11138. break;
  11139. }
  11140. s = 32 - s;
  11141. if (s == DIGIT_BIT) {
  11142. r[++j] = 0;
  11143. s = 0;
  11144. }
  11145. else {
  11146. r[++j] = a->dp[i] >> s;
  11147. s = DIGIT_BIT - s;
  11148. }
  11149. }
  11150. else {
  11151. s += DIGIT_BIT;
  11152. }
  11153. }
  11154. for (j++; j < size; j++) {
  11155. r[j] = 0;
  11156. }
  11157. #endif
  11158. }
  11159. /* Write r as big endian to byte array.
  11160. * Fixed length number of bytes written: 512
  11161. *
  11162. * r A single precision integer.
  11163. * a Byte array.
  11164. */
  11165. static void sp_4096_to_bin_128(sp_digit* r, byte* a)
  11166. {
  11167. int i;
  11168. int j = 0;
  11169. for (i = 127; i >= 0; i--) {
  11170. a[j++] = r[i] >> 24;
  11171. a[j++] = r[i] >> 16;
  11172. a[j++] = r[i] >> 8;
  11173. a[j++] = r[i] >> 0;
  11174. }
  11175. }
  11176. #if (defined(WOLFSSL_HAVE_SP_RSA) && (!defined(WOLFSSL_RSA_PUBLIC_ONLY) || !defined(WOLFSSL_SP_SMALL))) || defined(WOLFSSL_HAVE_SP_DH)
/* Normalize the values in each word to 32 bits.
 * Expands to nothing in this implementation.
 *
 * a  Array of sp_digit to normalize.
 */
  11181. #define sp_4096_norm_128(a)
  11182. #endif /* (WOLFSSL_HAVE_SP_RSA && (!WOLFSSL_RSA_PUBLIC_ONLY || !WOLFSSL_SP_SMALL)) || WOLFSSL_HAVE_SP_DH */
/* Normalize the values in each word to 32 bits.
 * Expands to nothing in this implementation.
 *
 * a  Array of sp_digit to normalize.
 */
  11187. #define sp_4096_norm_128(a)
  11188. #ifndef WOLFSSL_SP_SMALL
  11189. /* Sub b from a into r. (r = a - b)
  11190. *
  11191. * r A single precision integer.
  11192. * a A single precision integer.
  11193. * b A single precision integer.
  11194. */
  11195. SP_NOINLINE static sp_digit sp_4096_sub_in_place_128(sp_digit* a,
  11196. const sp_digit* b)
  11197. {
  11198. sp_digit c = 0;
  11199. __asm__ __volatile__ (
  11200. "ldm %[a], {r3, r4}\n\t"
  11201. "ldm %[b]!, {r5, r6}\n\t"
  11202. "subs r3, r3, r5\n\t"
  11203. "sbcs r4, r4, r6\n\t"
  11204. "stm %[a]!, {r3, r4}\n\t"
  11205. "ldm %[a], {r3, r4}\n\t"
  11206. "ldm %[b]!, {r5, r6}\n\t"
  11207. "sbcs r3, r3, r5\n\t"
  11208. "sbcs r4, r4, r6\n\t"
  11209. "stm %[a]!, {r3, r4}\n\t"
  11210. "ldm %[a], {r3, r4}\n\t"
  11211. "ldm %[b]!, {r5, r6}\n\t"
  11212. "sbcs r3, r3, r5\n\t"
  11213. "sbcs r4, r4, r6\n\t"
  11214. "stm %[a]!, {r3, r4}\n\t"
  11215. "ldm %[a], {r3, r4}\n\t"
  11216. "ldm %[b]!, {r5, r6}\n\t"
  11217. "sbcs r3, r3, r5\n\t"
  11218. "sbcs r4, r4, r6\n\t"
  11219. "stm %[a]!, {r3, r4}\n\t"
  11220. "ldm %[a], {r3, r4}\n\t"
  11221. "ldm %[b]!, {r5, r6}\n\t"
  11222. "sbcs r3, r3, r5\n\t"
  11223. "sbcs r4, r4, r6\n\t"
  11224. "stm %[a]!, {r3, r4}\n\t"
  11225. "ldm %[a], {r3, r4}\n\t"
  11226. "ldm %[b]!, {r5, r6}\n\t"
  11227. "sbcs r3, r3, r5\n\t"
  11228. "sbcs r4, r4, r6\n\t"
  11229. "stm %[a]!, {r3, r4}\n\t"
  11230. "ldm %[a], {r3, r4}\n\t"
  11231. "ldm %[b]!, {r5, r6}\n\t"
  11232. "sbcs r3, r3, r5\n\t"
  11233. "sbcs r4, r4, r6\n\t"
  11234. "stm %[a]!, {r3, r4}\n\t"
  11235. "ldm %[a], {r3, r4}\n\t"
  11236. "ldm %[b]!, {r5, r6}\n\t"
  11237. "sbcs r3, r3, r5\n\t"
  11238. "sbcs r4, r4, r6\n\t"
  11239. "stm %[a]!, {r3, r4}\n\t"
  11240. "ldm %[a], {r3, r4}\n\t"
  11241. "ldm %[b]!, {r5, r6}\n\t"
  11242. "sbcs r3, r3, r5\n\t"
  11243. "sbcs r4, r4, r6\n\t"
  11244. "stm %[a]!, {r3, r4}\n\t"
  11245. "ldm %[a], {r3, r4}\n\t"
  11246. "ldm %[b]!, {r5, r6}\n\t"
  11247. "sbcs r3, r3, r5\n\t"
  11248. "sbcs r4, r4, r6\n\t"
  11249. "stm %[a]!, {r3, r4}\n\t"
  11250. "ldm %[a], {r3, r4}\n\t"
  11251. "ldm %[b]!, {r5, r6}\n\t"
  11252. "sbcs r3, r3, r5\n\t"
  11253. "sbcs r4, r4, r6\n\t"
  11254. "stm %[a]!, {r3, r4}\n\t"
  11255. "ldm %[a], {r3, r4}\n\t"
  11256. "ldm %[b]!, {r5, r6}\n\t"
  11257. "sbcs r3, r3, r5\n\t"
  11258. "sbcs r4, r4, r6\n\t"
  11259. "stm %[a]!, {r3, r4}\n\t"
  11260. "ldm %[a], {r3, r4}\n\t"
  11261. "ldm %[b]!, {r5, r6}\n\t"
  11262. "sbcs r3, r3, r5\n\t"
  11263. "sbcs r4, r4, r6\n\t"
  11264. "stm %[a]!, {r3, r4}\n\t"
  11265. "ldm %[a], {r3, r4}\n\t"
  11266. "ldm %[b]!, {r5, r6}\n\t"
  11267. "sbcs r3, r3, r5\n\t"
  11268. "sbcs r4, r4, r6\n\t"
  11269. "stm %[a]!, {r3, r4}\n\t"
  11270. "ldm %[a], {r3, r4}\n\t"
  11271. "ldm %[b]!, {r5, r6}\n\t"
  11272. "sbcs r3, r3, r5\n\t"
  11273. "sbcs r4, r4, r6\n\t"
  11274. "stm %[a]!, {r3, r4}\n\t"
  11275. "ldm %[a], {r3, r4}\n\t"
  11276. "ldm %[b]!, {r5, r6}\n\t"
  11277. "sbcs r3, r3, r5\n\t"
  11278. "sbcs r4, r4, r6\n\t"
  11279. "stm %[a]!, {r3, r4}\n\t"
  11280. "ldm %[a], {r3, r4}\n\t"
  11281. "ldm %[b]!, {r5, r6}\n\t"
  11282. "sbcs r3, r3, r5\n\t"
  11283. "sbcs r4, r4, r6\n\t"
  11284. "stm %[a]!, {r3, r4}\n\t"
  11285. "ldm %[a], {r3, r4}\n\t"
  11286. "ldm %[b]!, {r5, r6}\n\t"
  11287. "sbcs r3, r3, r5\n\t"
  11288. "sbcs r4, r4, r6\n\t"
  11289. "stm %[a]!, {r3, r4}\n\t"
  11290. "ldm %[a], {r3, r4}\n\t"
  11291. "ldm %[b]!, {r5, r6}\n\t"
  11292. "sbcs r3, r3, r5\n\t"
  11293. "sbcs r4, r4, r6\n\t"
  11294. "stm %[a]!, {r3, r4}\n\t"
  11295. "ldm %[a], {r3, r4}\n\t"
  11296. "ldm %[b]!, {r5, r6}\n\t"
  11297. "sbcs r3, r3, r5\n\t"
  11298. "sbcs r4, r4, r6\n\t"
  11299. "stm %[a]!, {r3, r4}\n\t"
  11300. "ldm %[a], {r3, r4}\n\t"
  11301. "ldm %[b]!, {r5, r6}\n\t"
  11302. "sbcs r3, r3, r5\n\t"
  11303. "sbcs r4, r4, r6\n\t"
  11304. "stm %[a]!, {r3, r4}\n\t"
  11305. "ldm %[a], {r3, r4}\n\t"
  11306. "ldm %[b]!, {r5, r6}\n\t"
  11307. "sbcs r3, r3, r5\n\t"
  11308. "sbcs r4, r4, r6\n\t"
  11309. "stm %[a]!, {r3, r4}\n\t"
  11310. "ldm %[a], {r3, r4}\n\t"
  11311. "ldm %[b]!, {r5, r6}\n\t"
  11312. "sbcs r3, r3, r5\n\t"
  11313. "sbcs r4, r4, r6\n\t"
  11314. "stm %[a]!, {r3, r4}\n\t"
  11315. "ldm %[a], {r3, r4}\n\t"
  11316. "ldm %[b]!, {r5, r6}\n\t"
  11317. "sbcs r3, r3, r5\n\t"
  11318. "sbcs r4, r4, r6\n\t"
  11319. "stm %[a]!, {r3, r4}\n\t"
  11320. "ldm %[a], {r3, r4}\n\t"
  11321. "ldm %[b]!, {r5, r6}\n\t"
  11322. "sbcs r3, r3, r5\n\t"
  11323. "sbcs r4, r4, r6\n\t"
  11324. "stm %[a]!, {r3, r4}\n\t"
  11325. "ldm %[a], {r3, r4}\n\t"
  11326. "ldm %[b]!, {r5, r6}\n\t"
  11327. "sbcs r3, r3, r5\n\t"
  11328. "sbcs r4, r4, r6\n\t"
  11329. "stm %[a]!, {r3, r4}\n\t"
  11330. "ldm %[a], {r3, r4}\n\t"
  11331. "ldm %[b]!, {r5, r6}\n\t"
  11332. "sbcs r3, r3, r5\n\t"
  11333. "sbcs r4, r4, r6\n\t"
  11334. "stm %[a]!, {r3, r4}\n\t"
  11335. "ldm %[a], {r3, r4}\n\t"
  11336. "ldm %[b]!, {r5, r6}\n\t"
  11337. "sbcs r3, r3, r5\n\t"
  11338. "sbcs r4, r4, r6\n\t"
  11339. "stm %[a]!, {r3, r4}\n\t"
  11340. "ldm %[a], {r3, r4}\n\t"
  11341. "ldm %[b]!, {r5, r6}\n\t"
  11342. "sbcs r3, r3, r5\n\t"
  11343. "sbcs r4, r4, r6\n\t"
  11344. "stm %[a]!, {r3, r4}\n\t"
  11345. "ldm %[a], {r3, r4}\n\t"
  11346. "ldm %[b]!, {r5, r6}\n\t"
  11347. "sbcs r3, r3, r5\n\t"
  11348. "sbcs r4, r4, r6\n\t"
  11349. "stm %[a]!, {r3, r4}\n\t"
  11350. "ldm %[a], {r3, r4}\n\t"
  11351. "ldm %[b]!, {r5, r6}\n\t"
  11352. "sbcs r3, r3, r5\n\t"
  11353. "sbcs r4, r4, r6\n\t"
  11354. "stm %[a]!, {r3, r4}\n\t"
  11355. "ldm %[a], {r3, r4}\n\t"
  11356. "ldm %[b]!, {r5, r6}\n\t"
  11357. "sbcs r3, r3, r5\n\t"
  11358. "sbcs r4, r4, r6\n\t"
  11359. "stm %[a]!, {r3, r4}\n\t"
  11360. "ldm %[a], {r3, r4}\n\t"
  11361. "ldm %[b]!, {r5, r6}\n\t"
  11362. "sbcs r3, r3, r5\n\t"
  11363. "sbcs r4, r4, r6\n\t"
  11364. "stm %[a]!, {r3, r4}\n\t"
  11365. "ldm %[a], {r3, r4}\n\t"
  11366. "ldm %[b]!, {r5, r6}\n\t"
  11367. "sbcs r3, r3, r5\n\t"
  11368. "sbcs r4, r4, r6\n\t"
  11369. "stm %[a]!, {r3, r4}\n\t"
  11370. "ldm %[a], {r3, r4}\n\t"
  11371. "ldm %[b]!, {r5, r6}\n\t"
  11372. "sbcs r3, r3, r5\n\t"
  11373. "sbcs r4, r4, r6\n\t"
  11374. "stm %[a]!, {r3, r4}\n\t"
  11375. "ldm %[a], {r3, r4}\n\t"
  11376. "ldm %[b]!, {r5, r6}\n\t"
  11377. "sbcs r3, r3, r5\n\t"
  11378. "sbcs r4, r4, r6\n\t"
  11379. "stm %[a]!, {r3, r4}\n\t"
  11380. "ldm %[a], {r3, r4}\n\t"
  11381. "ldm %[b]!, {r5, r6}\n\t"
  11382. "sbcs r3, r3, r5\n\t"
  11383. "sbcs r4, r4, r6\n\t"
  11384. "stm %[a]!, {r3, r4}\n\t"
  11385. "ldm %[a], {r3, r4}\n\t"
  11386. "ldm %[b]!, {r5, r6}\n\t"
  11387. "sbcs r3, r3, r5\n\t"
  11388. "sbcs r4, r4, r6\n\t"
  11389. "stm %[a]!, {r3, r4}\n\t"
  11390. "ldm %[a], {r3, r4}\n\t"
  11391. "ldm %[b]!, {r5, r6}\n\t"
  11392. "sbcs r3, r3, r5\n\t"
  11393. "sbcs r4, r4, r6\n\t"
  11394. "stm %[a]!, {r3, r4}\n\t"
  11395. "ldm %[a], {r3, r4}\n\t"
  11396. "ldm %[b]!, {r5, r6}\n\t"
  11397. "sbcs r3, r3, r5\n\t"
  11398. "sbcs r4, r4, r6\n\t"
  11399. "stm %[a]!, {r3, r4}\n\t"
  11400. "ldm %[a], {r3, r4}\n\t"
  11401. "ldm %[b]!, {r5, r6}\n\t"
  11402. "sbcs r3, r3, r5\n\t"
  11403. "sbcs r4, r4, r6\n\t"
  11404. "stm %[a]!, {r3, r4}\n\t"
  11405. "ldm %[a], {r3, r4}\n\t"
  11406. "ldm %[b]!, {r5, r6}\n\t"
  11407. "sbcs r3, r3, r5\n\t"
  11408. "sbcs r4, r4, r6\n\t"
  11409. "stm %[a]!, {r3, r4}\n\t"
  11410. "ldm %[a], {r3, r4}\n\t"
  11411. "ldm %[b]!, {r5, r6}\n\t"
  11412. "sbcs r3, r3, r5\n\t"
  11413. "sbcs r4, r4, r6\n\t"
  11414. "stm %[a]!, {r3, r4}\n\t"
  11415. "ldm %[a], {r3, r4}\n\t"
  11416. "ldm %[b]!, {r5, r6}\n\t"
  11417. "sbcs r3, r3, r5\n\t"
  11418. "sbcs r4, r4, r6\n\t"
  11419. "stm %[a]!, {r3, r4}\n\t"
  11420. "ldm %[a], {r3, r4}\n\t"
  11421. "ldm %[b]!, {r5, r6}\n\t"
  11422. "sbcs r3, r3, r5\n\t"
  11423. "sbcs r4, r4, r6\n\t"
  11424. "stm %[a]!, {r3, r4}\n\t"
  11425. "ldm %[a], {r3, r4}\n\t"
  11426. "ldm %[b]!, {r5, r6}\n\t"
  11427. "sbcs r3, r3, r5\n\t"
  11428. "sbcs r4, r4, r6\n\t"
  11429. "stm %[a]!, {r3, r4}\n\t"
  11430. "ldm %[a], {r3, r4}\n\t"
  11431. "ldm %[b]!, {r5, r6}\n\t"
  11432. "sbcs r3, r3, r5\n\t"
  11433. "sbcs r4, r4, r6\n\t"
  11434. "stm %[a]!, {r3, r4}\n\t"
  11435. "ldm %[a], {r3, r4}\n\t"
  11436. "ldm %[b]!, {r5, r6}\n\t"
  11437. "sbcs r3, r3, r5\n\t"
  11438. "sbcs r4, r4, r6\n\t"
  11439. "stm %[a]!, {r3, r4}\n\t"
  11440. "ldm %[a], {r3, r4}\n\t"
  11441. "ldm %[b]!, {r5, r6}\n\t"
  11442. "sbcs r3, r3, r5\n\t"
  11443. "sbcs r4, r4, r6\n\t"
  11444. "stm %[a]!, {r3, r4}\n\t"
  11445. "ldm %[a], {r3, r4}\n\t"
  11446. "ldm %[b]!, {r5, r6}\n\t"
  11447. "sbcs r3, r3, r5\n\t"
  11448. "sbcs r4, r4, r6\n\t"
  11449. "stm %[a]!, {r3, r4}\n\t"
  11450. "ldm %[a], {r3, r4}\n\t"
  11451. "ldm %[b]!, {r5, r6}\n\t"
  11452. "sbcs r3, r3, r5\n\t"
  11453. "sbcs r4, r4, r6\n\t"
  11454. "stm %[a]!, {r3, r4}\n\t"
  11455. "ldm %[a], {r3, r4}\n\t"
  11456. "ldm %[b]!, {r5, r6}\n\t"
  11457. "sbcs r3, r3, r5\n\t"
  11458. "sbcs r4, r4, r6\n\t"
  11459. "stm %[a]!, {r3, r4}\n\t"
  11460. "ldm %[a], {r3, r4}\n\t"
  11461. "ldm %[b]!, {r5, r6}\n\t"
  11462. "sbcs r3, r3, r5\n\t"
  11463. "sbcs r4, r4, r6\n\t"
  11464. "stm %[a]!, {r3, r4}\n\t"
  11465. "ldm %[a], {r3, r4}\n\t"
  11466. "ldm %[b]!, {r5, r6}\n\t"
  11467. "sbcs r3, r3, r5\n\t"
  11468. "sbcs r4, r4, r6\n\t"
  11469. "stm %[a]!, {r3, r4}\n\t"
  11470. "ldm %[a], {r3, r4}\n\t"
  11471. "ldm %[b]!, {r5, r6}\n\t"
  11472. "sbcs r3, r3, r5\n\t"
  11473. "sbcs r4, r4, r6\n\t"
  11474. "stm %[a]!, {r3, r4}\n\t"
  11475. "ldm %[a], {r3, r4}\n\t"
  11476. "ldm %[b]!, {r5, r6}\n\t"
  11477. "sbcs r3, r3, r5\n\t"
  11478. "sbcs r4, r4, r6\n\t"
  11479. "stm %[a]!, {r3, r4}\n\t"
  11480. "ldm %[a], {r3, r4}\n\t"
  11481. "ldm %[b]!, {r5, r6}\n\t"
  11482. "sbcs r3, r3, r5\n\t"
  11483. "sbcs r4, r4, r6\n\t"
  11484. "stm %[a]!, {r3, r4}\n\t"
  11485. "ldm %[a], {r3, r4}\n\t"
  11486. "ldm %[b]!, {r5, r6}\n\t"
  11487. "sbcs r3, r3, r5\n\t"
  11488. "sbcs r4, r4, r6\n\t"
  11489. "stm %[a]!, {r3, r4}\n\t"
  11490. "ldm %[a], {r3, r4}\n\t"
  11491. "ldm %[b]!, {r5, r6}\n\t"
  11492. "sbcs r3, r3, r5\n\t"
  11493. "sbcs r4, r4, r6\n\t"
  11494. "stm %[a]!, {r3, r4}\n\t"
  11495. "ldm %[a], {r3, r4}\n\t"
  11496. "ldm %[b]!, {r5, r6}\n\t"
  11497. "sbcs r3, r3, r5\n\t"
  11498. "sbcs r4, r4, r6\n\t"
  11499. "stm %[a]!, {r3, r4}\n\t"
  11500. "ldm %[a], {r3, r4}\n\t"
  11501. "ldm %[b]!, {r5, r6}\n\t"
  11502. "sbcs r3, r3, r5\n\t"
  11503. "sbcs r4, r4, r6\n\t"
  11504. "stm %[a]!, {r3, r4}\n\t"
  11505. "ldm %[a], {r3, r4}\n\t"
  11506. "ldm %[b]!, {r5, r6}\n\t"
  11507. "sbcs r3, r3, r5\n\t"
  11508. "sbcs r4, r4, r6\n\t"
  11509. "stm %[a]!, {r3, r4}\n\t"
  11510. "ldm %[a], {r3, r4}\n\t"
  11511. "ldm %[b]!, {r5, r6}\n\t"
  11512. "sbcs r3, r3, r5\n\t"
  11513. "sbcs r4, r4, r6\n\t"
  11514. "stm %[a]!, {r3, r4}\n\t"
  11515. "ldm %[a], {r3, r4}\n\t"
  11516. "ldm %[b]!, {r5, r6}\n\t"
  11517. "sbcs r3, r3, r5\n\t"
  11518. "sbcs r4, r4, r6\n\t"
  11519. "stm %[a]!, {r3, r4}\n\t"
  11520. "sbc %[c], %[c], %[c]\n\t"
  11521. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  11522. :
  11523. : "memory", "r3", "r4", "r5", "r6"
  11524. );
  11525. return c;
  11526. }
  11527. /* Add b to a into r. (r = a + b)
  11528. *
  11529. * r A single precision integer.
  11530. * a A single precision integer.
  11531. * b A single precision integer.
  11532. */
  11533. SP_NOINLINE static sp_digit sp_4096_add_128(sp_digit* r, const sp_digit* a,
  11534. const sp_digit* b)
  11535. {
  11536. sp_digit c = 0;
  11537. __asm__ __volatile__ (
  11538. "ldm %[a]!, {r4, r5}\n\t"
  11539. "ldm %[b]!, {r6, r8}\n\t"
  11540. "adds r4, r4, r6\n\t"
  11541. "adcs r5, r5, r8\n\t"
  11542. "stm %[r]!, {r4, r5}\n\t"
  11543. "ldm %[a]!, {r4, r5}\n\t"
  11544. "ldm %[b]!, {r6, r8}\n\t"
  11545. "adcs r4, r4, r6\n\t"
  11546. "adcs r5, r5, r8\n\t"
  11547. "stm %[r]!, {r4, r5}\n\t"
  11548. "ldm %[a]!, {r4, r5}\n\t"
  11549. "ldm %[b]!, {r6, r8}\n\t"
  11550. "adcs r4, r4, r6\n\t"
  11551. "adcs r5, r5, r8\n\t"
  11552. "stm %[r]!, {r4, r5}\n\t"
  11553. "ldm %[a]!, {r4, r5}\n\t"
  11554. "ldm %[b]!, {r6, r8}\n\t"
  11555. "adcs r4, r4, r6\n\t"
  11556. "adcs r5, r5, r8\n\t"
  11557. "stm %[r]!, {r4, r5}\n\t"
  11558. "ldm %[a]!, {r4, r5}\n\t"
  11559. "ldm %[b]!, {r6, r8}\n\t"
  11560. "adcs r4, r4, r6\n\t"
  11561. "adcs r5, r5, r8\n\t"
  11562. "stm %[r]!, {r4, r5}\n\t"
  11563. "ldm %[a]!, {r4, r5}\n\t"
  11564. "ldm %[b]!, {r6, r8}\n\t"
  11565. "adcs r4, r4, r6\n\t"
  11566. "adcs r5, r5, r8\n\t"
  11567. "stm %[r]!, {r4, r5}\n\t"
  11568. "ldm %[a]!, {r4, r5}\n\t"
  11569. "ldm %[b]!, {r6, r8}\n\t"
  11570. "adcs r4, r4, r6\n\t"
  11571. "adcs r5, r5, r8\n\t"
  11572. "stm %[r]!, {r4, r5}\n\t"
  11573. "ldm %[a]!, {r4, r5}\n\t"
  11574. "ldm %[b]!, {r6, r8}\n\t"
  11575. "adcs r4, r4, r6\n\t"
  11576. "adcs r5, r5, r8\n\t"
  11577. "stm %[r]!, {r4, r5}\n\t"
  11578. "ldm %[a]!, {r4, r5}\n\t"
  11579. "ldm %[b]!, {r6, r8}\n\t"
  11580. "adcs r4, r4, r6\n\t"
  11581. "adcs r5, r5, r8\n\t"
  11582. "stm %[r]!, {r4, r5}\n\t"
  11583. "ldm %[a]!, {r4, r5}\n\t"
  11584. "ldm %[b]!, {r6, r8}\n\t"
  11585. "adcs r4, r4, r6\n\t"
  11586. "adcs r5, r5, r8\n\t"
  11587. "stm %[r]!, {r4, r5}\n\t"
  11588. "ldm %[a]!, {r4, r5}\n\t"
  11589. "ldm %[b]!, {r6, r8}\n\t"
  11590. "adcs r4, r4, r6\n\t"
  11591. "adcs r5, r5, r8\n\t"
  11592. "stm %[r]!, {r4, r5}\n\t"
  11593. "ldm %[a]!, {r4, r5}\n\t"
  11594. "ldm %[b]!, {r6, r8}\n\t"
  11595. "adcs r4, r4, r6\n\t"
  11596. "adcs r5, r5, r8\n\t"
  11597. "stm %[r]!, {r4, r5}\n\t"
  11598. "ldm %[a]!, {r4, r5}\n\t"
  11599. "ldm %[b]!, {r6, r8}\n\t"
  11600. "adcs r4, r4, r6\n\t"
  11601. "adcs r5, r5, r8\n\t"
  11602. "stm %[r]!, {r4, r5}\n\t"
  11603. "ldm %[a]!, {r4, r5}\n\t"
  11604. "ldm %[b]!, {r6, r8}\n\t"
  11605. "adcs r4, r4, r6\n\t"
  11606. "adcs r5, r5, r8\n\t"
  11607. "stm %[r]!, {r4, r5}\n\t"
  11608. "ldm %[a]!, {r4, r5}\n\t"
  11609. "ldm %[b]!, {r6, r8}\n\t"
  11610. "adcs r4, r4, r6\n\t"
  11611. "adcs r5, r5, r8\n\t"
  11612. "stm %[r]!, {r4, r5}\n\t"
  11613. "ldm %[a]!, {r4, r5}\n\t"
  11614. "ldm %[b]!, {r6, r8}\n\t"
  11615. "adcs r4, r4, r6\n\t"
  11616. "adcs r5, r5, r8\n\t"
  11617. "stm %[r]!, {r4, r5}\n\t"
  11618. "ldm %[a]!, {r4, r5}\n\t"
  11619. "ldm %[b]!, {r6, r8}\n\t"
  11620. "adcs r4, r4, r6\n\t"
  11621. "adcs r5, r5, r8\n\t"
  11622. "stm %[r]!, {r4, r5}\n\t"
  11623. "ldm %[a]!, {r4, r5}\n\t"
  11624. "ldm %[b]!, {r6, r8}\n\t"
  11625. "adcs r4, r4, r6\n\t"
  11626. "adcs r5, r5, r8\n\t"
  11627. "stm %[r]!, {r4, r5}\n\t"
  11628. "ldm %[a]!, {r4, r5}\n\t"
  11629. "ldm %[b]!, {r6, r8}\n\t"
  11630. "adcs r4, r4, r6\n\t"
  11631. "adcs r5, r5, r8\n\t"
  11632. "stm %[r]!, {r4, r5}\n\t"
  11633. "ldm %[a]!, {r4, r5}\n\t"
  11634. "ldm %[b]!, {r6, r8}\n\t"
  11635. "adcs r4, r4, r6\n\t"
  11636. "adcs r5, r5, r8\n\t"
  11637. "stm %[r]!, {r4, r5}\n\t"
  11638. "ldm %[a]!, {r4, r5}\n\t"
  11639. "ldm %[b]!, {r6, r8}\n\t"
  11640. "adcs r4, r4, r6\n\t"
  11641. "adcs r5, r5, r8\n\t"
  11642. "stm %[r]!, {r4, r5}\n\t"
  11643. "ldm %[a]!, {r4, r5}\n\t"
  11644. "ldm %[b]!, {r6, r8}\n\t"
  11645. "adcs r4, r4, r6\n\t"
  11646. "adcs r5, r5, r8\n\t"
  11647. "stm %[r]!, {r4, r5}\n\t"
  11648. "ldm %[a]!, {r4, r5}\n\t"
  11649. "ldm %[b]!, {r6, r8}\n\t"
  11650. "adcs r4, r4, r6\n\t"
  11651. "adcs r5, r5, r8\n\t"
  11652. "stm %[r]!, {r4, r5}\n\t"
  11653. "ldm %[a]!, {r4, r5}\n\t"
  11654. "ldm %[b]!, {r6, r8}\n\t"
  11655. "adcs r4, r4, r6\n\t"
  11656. "adcs r5, r5, r8\n\t"
  11657. "stm %[r]!, {r4, r5}\n\t"
  11658. "ldm %[a]!, {r4, r5}\n\t"
  11659. "ldm %[b]!, {r6, r8}\n\t"
  11660. "adcs r4, r4, r6\n\t"
  11661. "adcs r5, r5, r8\n\t"
  11662. "stm %[r]!, {r4, r5}\n\t"
  11663. "ldm %[a]!, {r4, r5}\n\t"
  11664. "ldm %[b]!, {r6, r8}\n\t"
  11665. "adcs r4, r4, r6\n\t"
  11666. "adcs r5, r5, r8\n\t"
  11667. "stm %[r]!, {r4, r5}\n\t"
  11668. "ldm %[a]!, {r4, r5}\n\t"
  11669. "ldm %[b]!, {r6, r8}\n\t"
  11670. "adcs r4, r4, r6\n\t"
  11671. "adcs r5, r5, r8\n\t"
  11672. "stm %[r]!, {r4, r5}\n\t"
  11673. "ldm %[a]!, {r4, r5}\n\t"
  11674. "ldm %[b]!, {r6, r8}\n\t"
  11675. "adcs r4, r4, r6\n\t"
  11676. "adcs r5, r5, r8\n\t"
  11677. "stm %[r]!, {r4, r5}\n\t"
  11678. "ldm %[a]!, {r4, r5}\n\t"
  11679. "ldm %[b]!, {r6, r8}\n\t"
  11680. "adcs r4, r4, r6\n\t"
  11681. "adcs r5, r5, r8\n\t"
  11682. "stm %[r]!, {r4, r5}\n\t"
  11683. "ldm %[a]!, {r4, r5}\n\t"
  11684. "ldm %[b]!, {r6, r8}\n\t"
  11685. "adcs r4, r4, r6\n\t"
  11686. "adcs r5, r5, r8\n\t"
  11687. "stm %[r]!, {r4, r5}\n\t"
  11688. "ldm %[a]!, {r4, r5}\n\t"
  11689. "ldm %[b]!, {r6, r8}\n\t"
  11690. "adcs r4, r4, r6\n\t"
  11691. "adcs r5, r5, r8\n\t"
  11692. "stm %[r]!, {r4, r5}\n\t"
  11693. "ldm %[a]!, {r4, r5}\n\t"
  11694. "ldm %[b]!, {r6, r8}\n\t"
  11695. "adcs r4, r4, r6\n\t"
  11696. "adcs r5, r5, r8\n\t"
  11697. "stm %[r]!, {r4, r5}\n\t"
  11698. "ldm %[a]!, {r4, r5}\n\t"
  11699. "ldm %[b]!, {r6, r8}\n\t"
  11700. "adcs r4, r4, r6\n\t"
  11701. "adcs r5, r5, r8\n\t"
  11702. "stm %[r]!, {r4, r5}\n\t"
  11703. "ldm %[a]!, {r4, r5}\n\t"
  11704. "ldm %[b]!, {r6, r8}\n\t"
  11705. "adcs r4, r4, r6\n\t"
  11706. "adcs r5, r5, r8\n\t"
  11707. "stm %[r]!, {r4, r5}\n\t"
  11708. "ldm %[a]!, {r4, r5}\n\t"
  11709. "ldm %[b]!, {r6, r8}\n\t"
  11710. "adcs r4, r4, r6\n\t"
  11711. "adcs r5, r5, r8\n\t"
  11712. "stm %[r]!, {r4, r5}\n\t"
  11713. "ldm %[a]!, {r4, r5}\n\t"
  11714. "ldm %[b]!, {r6, r8}\n\t"
  11715. "adcs r4, r4, r6\n\t"
  11716. "adcs r5, r5, r8\n\t"
  11717. "stm %[r]!, {r4, r5}\n\t"
  11718. "ldm %[a]!, {r4, r5}\n\t"
  11719. "ldm %[b]!, {r6, r8}\n\t"
  11720. "adcs r4, r4, r6\n\t"
  11721. "adcs r5, r5, r8\n\t"
  11722. "stm %[r]!, {r4, r5}\n\t"
  11723. "ldm %[a]!, {r4, r5}\n\t"
  11724. "ldm %[b]!, {r6, r8}\n\t"
  11725. "adcs r4, r4, r6\n\t"
  11726. "adcs r5, r5, r8\n\t"
  11727. "stm %[r]!, {r4, r5}\n\t"
  11728. "ldm %[a]!, {r4, r5}\n\t"
  11729. "ldm %[b]!, {r6, r8}\n\t"
  11730. "adcs r4, r4, r6\n\t"
  11731. "adcs r5, r5, r8\n\t"
  11732. "stm %[r]!, {r4, r5}\n\t"
  11733. "ldm %[a]!, {r4, r5}\n\t"
  11734. "ldm %[b]!, {r6, r8}\n\t"
  11735. "adcs r4, r4, r6\n\t"
  11736. "adcs r5, r5, r8\n\t"
  11737. "stm %[r]!, {r4, r5}\n\t"
  11738. "ldm %[a]!, {r4, r5}\n\t"
  11739. "ldm %[b]!, {r6, r8}\n\t"
  11740. "adcs r4, r4, r6\n\t"
  11741. "adcs r5, r5, r8\n\t"
  11742. "stm %[r]!, {r4, r5}\n\t"
  11743. "ldm %[a]!, {r4, r5}\n\t"
  11744. "ldm %[b]!, {r6, r8}\n\t"
  11745. "adcs r4, r4, r6\n\t"
  11746. "adcs r5, r5, r8\n\t"
  11747. "stm %[r]!, {r4, r5}\n\t"
  11748. "ldm %[a]!, {r4, r5}\n\t"
  11749. "ldm %[b]!, {r6, r8}\n\t"
  11750. "adcs r4, r4, r6\n\t"
  11751. "adcs r5, r5, r8\n\t"
  11752. "stm %[r]!, {r4, r5}\n\t"
  11753. "ldm %[a]!, {r4, r5}\n\t"
  11754. "ldm %[b]!, {r6, r8}\n\t"
  11755. "adcs r4, r4, r6\n\t"
  11756. "adcs r5, r5, r8\n\t"
  11757. "stm %[r]!, {r4, r5}\n\t"
  11758. "ldm %[a]!, {r4, r5}\n\t"
  11759. "ldm %[b]!, {r6, r8}\n\t"
  11760. "adcs r4, r4, r6\n\t"
  11761. "adcs r5, r5, r8\n\t"
  11762. "stm %[r]!, {r4, r5}\n\t"
  11763. "ldm %[a]!, {r4, r5}\n\t"
  11764. "ldm %[b]!, {r6, r8}\n\t"
  11765. "adcs r4, r4, r6\n\t"
  11766. "adcs r5, r5, r8\n\t"
  11767. "stm %[r]!, {r4, r5}\n\t"
  11768. "ldm %[a]!, {r4, r5}\n\t"
  11769. "ldm %[b]!, {r6, r8}\n\t"
  11770. "adcs r4, r4, r6\n\t"
  11771. "adcs r5, r5, r8\n\t"
  11772. "stm %[r]!, {r4, r5}\n\t"
  11773. "ldm %[a]!, {r4, r5}\n\t"
  11774. "ldm %[b]!, {r6, r8}\n\t"
  11775. "adcs r4, r4, r6\n\t"
  11776. "adcs r5, r5, r8\n\t"
  11777. "stm %[r]!, {r4, r5}\n\t"
  11778. "ldm %[a]!, {r4, r5}\n\t"
  11779. "ldm %[b]!, {r6, r8}\n\t"
  11780. "adcs r4, r4, r6\n\t"
  11781. "adcs r5, r5, r8\n\t"
  11782. "stm %[r]!, {r4, r5}\n\t"
  11783. "ldm %[a]!, {r4, r5}\n\t"
  11784. "ldm %[b]!, {r6, r8}\n\t"
  11785. "adcs r4, r4, r6\n\t"
  11786. "adcs r5, r5, r8\n\t"
  11787. "stm %[r]!, {r4, r5}\n\t"
  11788. "ldm %[a]!, {r4, r5}\n\t"
  11789. "ldm %[b]!, {r6, r8}\n\t"
  11790. "adcs r4, r4, r6\n\t"
  11791. "adcs r5, r5, r8\n\t"
  11792. "stm %[r]!, {r4, r5}\n\t"
  11793. "ldm %[a]!, {r4, r5}\n\t"
  11794. "ldm %[b]!, {r6, r8}\n\t"
  11795. "adcs r4, r4, r6\n\t"
  11796. "adcs r5, r5, r8\n\t"
  11797. "stm %[r]!, {r4, r5}\n\t"
  11798. "ldm %[a]!, {r4, r5}\n\t"
  11799. "ldm %[b]!, {r6, r8}\n\t"
  11800. "adcs r4, r4, r6\n\t"
  11801. "adcs r5, r5, r8\n\t"
  11802. "stm %[r]!, {r4, r5}\n\t"
  11803. "ldm %[a]!, {r4, r5}\n\t"
  11804. "ldm %[b]!, {r6, r8}\n\t"
  11805. "adcs r4, r4, r6\n\t"
  11806. "adcs r5, r5, r8\n\t"
  11807. "stm %[r]!, {r4, r5}\n\t"
  11808. "ldm %[a]!, {r4, r5}\n\t"
  11809. "ldm %[b]!, {r6, r8}\n\t"
  11810. "adcs r4, r4, r6\n\t"
  11811. "adcs r5, r5, r8\n\t"
  11812. "stm %[r]!, {r4, r5}\n\t"
  11813. "ldm %[a]!, {r4, r5}\n\t"
  11814. "ldm %[b]!, {r6, r8}\n\t"
  11815. "adcs r4, r4, r6\n\t"
  11816. "adcs r5, r5, r8\n\t"
  11817. "stm %[r]!, {r4, r5}\n\t"
  11818. "ldm %[a]!, {r4, r5}\n\t"
  11819. "ldm %[b]!, {r6, r8}\n\t"
  11820. "adcs r4, r4, r6\n\t"
  11821. "adcs r5, r5, r8\n\t"
  11822. "stm %[r]!, {r4, r5}\n\t"
  11823. "ldm %[a]!, {r4, r5}\n\t"
  11824. "ldm %[b]!, {r6, r8}\n\t"
  11825. "adcs r4, r4, r6\n\t"
  11826. "adcs r5, r5, r8\n\t"
  11827. "stm %[r]!, {r4, r5}\n\t"
  11828. "ldm %[a]!, {r4, r5}\n\t"
  11829. "ldm %[b]!, {r6, r8}\n\t"
  11830. "adcs r4, r4, r6\n\t"
  11831. "adcs r5, r5, r8\n\t"
  11832. "stm %[r]!, {r4, r5}\n\t"
  11833. "ldm %[a]!, {r4, r5}\n\t"
  11834. "ldm %[b]!, {r6, r8}\n\t"
  11835. "adcs r4, r4, r6\n\t"
  11836. "adcs r5, r5, r8\n\t"
  11837. "stm %[r]!, {r4, r5}\n\t"
  11838. "ldm %[a]!, {r4, r5}\n\t"
  11839. "ldm %[b]!, {r6, r8}\n\t"
  11840. "adcs r4, r4, r6\n\t"
  11841. "adcs r5, r5, r8\n\t"
  11842. "stm %[r]!, {r4, r5}\n\t"
  11843. "ldm %[a]!, {r4, r5}\n\t"
  11844. "ldm %[b]!, {r6, r8}\n\t"
  11845. "adcs r4, r4, r6\n\t"
  11846. "adcs r5, r5, r8\n\t"
  11847. "stm %[r]!, {r4, r5}\n\t"
  11848. "ldm %[a]!, {r4, r5}\n\t"
  11849. "ldm %[b]!, {r6, r8}\n\t"
  11850. "adcs r4, r4, r6\n\t"
  11851. "adcs r5, r5, r8\n\t"
  11852. "stm %[r]!, {r4, r5}\n\t"
  11853. "ldm %[a]!, {r4, r5}\n\t"
  11854. "ldm %[b]!, {r6, r8}\n\t"
  11855. "adcs r4, r4, r6\n\t"
  11856. "adcs r5, r5, r8\n\t"
  11857. "stm %[r]!, {r4, r5}\n\t"
  11858. "mov %[c], #0\n\t"
  11859. "adc %[c], %[c], %[c]\n\t"
  11860. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  11861. :
  11862. : "memory", "r4", "r5", "r6", "r8"
  11863. );
  11864. return c;
  11865. }
  11866. /* Multiply a and b into r. (r = a * b)
  11867. *
  11868. * r A single precision integer.
  11869. * a A single precision integer.
  11870. * b A single precision integer.
  11871. */
  11872. SP_NOINLINE static void sp_4096_mul_128(sp_digit* r, const sp_digit* a,
  11873. const sp_digit* b)
  11874. {
  11875. sp_digit* z0 = r;
  11876. sp_digit z1[128];
  11877. sp_digit a1[64];
  11878. sp_digit b1[64];
  11879. sp_digit* z2 = r + 128;
  11880. sp_digit u;
  11881. sp_digit ca;
  11882. sp_digit cb;
  11883. ca = sp_2048_add_64(a1, a, &a[64]);
  11884. cb = sp_2048_add_64(b1, b, &b[64]);
  11885. u = ca & cb;
  11886. sp_2048_mul_64(z2, &a[64], &b[64]);
  11887. sp_2048_mul_64(z0, a, b);
  11888. sp_2048_mul_64(z1, a1, b1);
  11889. u += sp_4096_sub_in_place_128(z1, z0);
  11890. u += sp_4096_sub_in_place_128(z1, z2);
  11891. sp_2048_mask_64(a1, a1, 0 - cb);
  11892. u += sp_2048_add_64(z1 + 64, z1 + 64, a1);
  11893. sp_2048_mask_64(b1, b1, 0 - ca);
  11894. u += sp_2048_add_64(z1 + 64, z1 + 64, b1);
  11895. u += sp_4096_add_128(r + 64, r + 64, z1);
  11896. XMEMSET(a1 + 1, 0, sizeof(sp_digit) * (64 - 1));
  11897. a1[0] = u;
  11898. (void)sp_2048_add_64(r + 192, r + 192, a1);
  11899. }
  11900. /* Square a and put result in r. (r = a * a)
  11901. *
  11902. * r A single precision integer.
  11903. * a A single precision integer.
  11904. */
  11905. SP_NOINLINE static void sp_4096_sqr_128(sp_digit* r, const sp_digit* a)
  11906. {
  11907. sp_digit* z0 = r;
  11908. sp_digit* z2 = r + 128;
  11909. sp_digit z1[128];
  11910. sp_digit* a1 = z1;
  11911. sp_digit zero[64];
  11912. sp_digit u;
  11913. sp_digit mask;
  11914. sp_digit* p1;
  11915. sp_digit* p2;
  11916. XMEMSET(zero, 0, sizeof(sp_digit) * 64);
  11917. mask = sp_2048_sub_64(a1, a, &a[64]);
  11918. p1 = (sp_digit*)(((sp_digit)zero & mask ) | ((sp_digit)a1 & (~mask)));
  11919. p2 = (sp_digit*)(((sp_digit)zero & (~mask)) | ((sp_digit)a1 & mask ));
  11920. (void)sp_2048_sub_64(a1, p1, p2);
  11921. sp_2048_sqr_64(z2, &a[64]);
  11922. sp_2048_sqr_64(z0, a);
  11923. sp_2048_sqr_64(z1, a1);
  11924. u = 0;
  11925. u -= sp_4096_sub_in_place_128(z1, z2);
  11926. u -= sp_4096_sub_in_place_128(z1, z0);
  11927. u += sp_4096_sub_in_place_128(r + 64, z1);
  11928. zero[0] = u;
  11929. (void)sp_2048_add_64(r + 192, r + 192, zero);
  11930. }
  11931. #endif /* !WOLFSSL_SP_SMALL */
  11932. #ifdef WOLFSSL_SP_SMALL
  11933. /* Add b to a into r. (r = a + b)
  11934. *
  11935. * r A single precision integer.
  11936. * a A single precision integer.
  11937. * b A single precision integer.
  11938. */
  11939. SP_NOINLINE static sp_digit sp_4096_add_128(sp_digit* r, const sp_digit* a,
  11940. const sp_digit* b)
  11941. {
  11942. sp_digit c = 0;
  11943. __asm__ __volatile__ (
  11944. "mov r6, %[a]\n\t"
  11945. "mov r8, #0\n\t"
  11946. "add r6, r6, #512\n\t"
  11947. "sub r8, r8, #1\n\t"
  11948. "\n1:\n\t"
  11949. "adds %[c], %[c], r8\n\t"
  11950. "ldr r4, [%[a]]\n\t"
  11951. "ldr r5, [%[b]]\n\t"
  11952. "adcs r4, r4, r5\n\t"
  11953. "str r4, [%[r]]\n\t"
  11954. "mov %[c], #0\n\t"
  11955. "adc %[c], %[c], %[c]\n\t"
  11956. "add %[a], %[a], #4\n\t"
  11957. "add %[b], %[b], #4\n\t"
  11958. "add %[r], %[r], #4\n\t"
  11959. "cmp %[a], r6\n\t"
  11960. #ifdef __GNUC__
  11961. "bne 1b\n\t"
  11962. #else
  11963. "bne.n 1b\n\t"
  11964. #endif /* __GNUC__ */
  11965. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  11966. :
  11967. : "memory", "r4", "r5", "r6", "r8"
  11968. );
  11969. return c;
  11970. }
  11971. #endif /* WOLFSSL_SP_SMALL */
  11972. #ifdef WOLFSSL_SP_SMALL
  11973. /* Sub b from a into a. (a -= b)
  11974. *
  11975. * a A single precision integer.
  11976. * b A single precision integer.
  11977. */
  11978. SP_NOINLINE static sp_digit sp_4096_sub_in_place_128(sp_digit* a,
  11979. const sp_digit* b)
  11980. {
  11981. sp_digit c = 0;
  11982. __asm__ __volatile__ (
  11983. "mov r8, %[a]\n\t"
  11984. "add r8, r8, #512\n\t"
  11985. "\n1:\n\t"
  11986. "mov r5, #0\n\t"
  11987. "subs r5, r5, %[c]\n\t"
  11988. "ldr r3, [%[a]]\n\t"
  11989. "ldr r4, [%[a], #4]\n\t"
  11990. "ldr r5, [%[b]]\n\t"
  11991. "ldr r6, [%[b], #4]\n\t"
  11992. "sbcs r3, r3, r5\n\t"
  11993. "sbcs r4, r4, r6\n\t"
  11994. "str r3, [%[a]]\n\t"
  11995. "str r4, [%[a], #4]\n\t"
  11996. "sbc %[c], %[c], %[c]\n\t"
  11997. "add %[a], %[a], #8\n\t"
  11998. "add %[b], %[b], #8\n\t"
  11999. "cmp %[a], r8\n\t"
  12000. #ifdef __GNUC__
  12001. "bne 1b\n\t"
  12002. #else
  12003. "bne.n 1b\n\t"
  12004. #endif /* __GNUC__ */
  12005. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  12006. :
  12007. : "memory", "r3", "r4", "r5", "r6", "r8"
  12008. );
  12009. return c;
  12010. }
  12011. #endif /* WOLFSSL_SP_SMALL */
  12012. #ifdef WOLFSSL_SP_SMALL
  12013. /* Multiply a and b into r. (r = a * b)
  12014. *
  12015. * r A single precision integer.
  12016. * a A single precision integer.
  12017. * b A single precision integer.
  12018. */
  12019. SP_NOINLINE static void sp_4096_mul_128(sp_digit* r, const sp_digit* a,
  12020. const sp_digit* b)
  12021. {
  12022. sp_digit tmp_arr[128 * 2];
  12023. sp_digit* tmp = tmp_arr;
  12024. __asm__ __volatile__ (
  12025. "mov r3, #0\n\t"
  12026. "mov r4, #0\n\t"
  12027. "mov r9, r3\n\t"
  12028. "mov r12, %[r]\n\t"
  12029. "mov r10, %[a]\n\t"
  12030. "mov r11, %[b]\n\t"
  12031. "mov r6, #2\n\t"
  12032. "lsl r6, r6, #8\n\t"
  12033. "add r6, r6, r10\n\t"
  12034. "mov r14, r6\n\t"
  12035. "\n1:\n\t"
  12036. "mov %[r], #0\n\t"
  12037. "mov r5, #0\n\t"
  12038. "mov r6, #1\n\t"
  12039. "lsl r6, r6, #8\n\t"
  12040. "add r6, r6, #252\n\t"
  12041. "mov %[a], r9\n\t"
  12042. "subs %[a], %[a], r6\n\t"
  12043. "sbc r6, r6, r6\n\t"
  12044. "mvn r6, r6\n\t"
  12045. "and %[a], %[a], r6\n\t"
  12046. "mov %[b], r9\n\t"
  12047. "sub %[b], %[b], %[a]\n\t"
  12048. "add %[a], %[a], r10\n\t"
  12049. "add %[b], %[b], r11\n\t"
  12050. "\n2:\n\t"
  12051. /* Multiply Start */
  12052. "ldr r6, [%[a]]\n\t"
  12053. "ldr r8, [%[b]]\n\t"
  12054. "umull r6, r8, r6, r8\n\t"
  12055. "adds r3, r3, r6\n\t"
  12056. "adcs r4, r4, r8\n\t"
  12057. "adc r5, r5, %[r]\n\t"
  12058. /* Multiply Done */
  12059. "add %[a], %[a], #4\n\t"
  12060. "sub %[b], %[b], #4\n\t"
  12061. "cmp %[a], r14\n\t"
  12062. #ifdef __GNUC__
  12063. "beq 3f\n\t"
  12064. #else
  12065. "beq.n 3f\n\t"
  12066. #endif /* __GNUC__ */
  12067. "mov r6, r9\n\t"
  12068. "add r6, r6, r10\n\t"
  12069. "cmp %[a], r6\n\t"
  12070. #ifdef __GNUC__
  12071. "ble 2b\n\t"
  12072. #else
  12073. "ble.n 2b\n\t"
  12074. #endif /* __GNUC__ */
  12075. "\n3:\n\t"
  12076. "mov %[r], r12\n\t"
  12077. "mov r8, r9\n\t"
  12078. "str r3, [%[r], r8]\n\t"
  12079. "mov r3, r4\n\t"
  12080. "mov r4, r5\n\t"
  12081. "add r8, r8, #4\n\t"
  12082. "mov r9, r8\n\t"
  12083. "mov r6, #3\n\t"
  12084. "lsl r6, r6, #8\n\t"
  12085. "add r6, r6, #248\n\t"
  12086. "cmp r8, r6\n\t"
  12087. #ifdef __GNUC__
  12088. "ble 1b\n\t"
  12089. #else
  12090. "ble.n 1b\n\t"
  12091. #endif /* __GNUC__ */
  12092. "str r3, [%[r], r8]\n\t"
  12093. "mov %[a], r10\n\t"
  12094. "mov %[b], r11\n\t"
  12095. :
  12096. : [r] "r" (tmp), [a] "r" (a), [b] "r" (b)
  12097. : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  12098. );
  12099. XMEMCPY(r, tmp_arr, sizeof(tmp_arr));
  12100. }
  12101. /* Square a and put result in r. (r = a * a)
  12102. *
  12103. * r A single precision integer.
  12104. * a A single precision integer.
  12105. */
  12106. SP_NOINLINE static void sp_4096_sqr_128(sp_digit* r, const sp_digit* a)
  12107. {
  12108. __asm__ __volatile__ (
  12109. "mov r3, #0\n\t"
  12110. "mov r4, #0\n\t"
  12111. "mov r5, #0\n\t"
  12112. "mov r9, r3\n\t"
  12113. "mov r12, %[r]\n\t"
  12114. "mov r6, #4\n\t"
  12115. "lsl r6, r6, #8\n\t"
  12116. "neg r6, r6\n\t"
  12117. "add sp, sp, r6\n\t"
  12118. "mov r11, sp\n\t"
  12119. "mov r10, %[a]\n\t"
  12120. "\n1:\n\t"
  12121. "mov %[r], #0\n\t"
  12122. "mov r6, #1\n\t"
  12123. "lsl r6, r6, #8\n\t"
  12124. "add r6, r6, #252\n\t"
  12125. "mov %[a], r9\n\t"
  12126. "subs %[a], %[a], r6\n\t"
  12127. "sbc r6, r6, r6\n\t"
  12128. "mvn r6, r6\n\t"
  12129. "and %[a], %[a], r6\n\t"
  12130. "mov r2, r9\n\t"
  12131. "sub r2, r2, %[a]\n\t"
  12132. "add %[a], %[a], r10\n\t"
  12133. "add r2, r2, r10\n\t"
  12134. "\n2:\n\t"
  12135. "cmp r2, %[a]\n\t"
  12136. #ifdef __GNUC__
  12137. "beq 4f\n\t"
  12138. #else
  12139. "beq.n 4f\n\t"
  12140. #endif /* __GNUC__ */
  12141. /* Multiply * 2: Start */
  12142. "ldr r6, [%[a]]\n\t"
  12143. "ldr r8, [r2]\n\t"
  12144. "umull r6, r8, r6, r8\n\t"
  12145. "adds r3, r3, r6\n\t"
  12146. "adcs r4, r4, r8\n\t"
  12147. "adc r5, r5, %[r]\n\t"
  12148. "adds r3, r3, r6\n\t"
  12149. "adcs r4, r4, r8\n\t"
  12150. "adc r5, r5, %[r]\n\t"
  12151. /* Multiply * 2: Done */
  12152. #ifdef __GNUC__
  12153. "bal 5f\n\t"
  12154. #else
  12155. "bal.n 5f\n\t"
  12156. #endif /* __GNUC__ */
  12157. "\n4:\n\t"
  12158. /* Square: Start */
  12159. "ldr r6, [%[a]]\n\t"
  12160. "umull r6, r8, r6, r6\n\t"
  12161. "adds r3, r3, r6\n\t"
  12162. "adcs r4, r4, r8\n\t"
  12163. "adc r5, r5, %[r]\n\t"
  12164. /* Square: Done */
  12165. "\n5:\n\t"
  12166. "add %[a], %[a], #4\n\t"
  12167. "sub r2, r2, #4\n\t"
  12168. "mov r6, #2\n\t"
  12169. "lsl r6, r6, #8\n\t"
  12170. "add r6, r6, r10\n\t"
  12171. "cmp %[a], r6\n\t"
  12172. #ifdef __GNUC__
  12173. "beq 3f\n\t"
  12174. #else
  12175. "beq.n 3f\n\t"
  12176. #endif /* __GNUC__ */
  12177. "cmp %[a], r2\n\t"
  12178. #ifdef __GNUC__
  12179. "bgt 3f\n\t"
  12180. #else
  12181. "bgt.n 3f\n\t"
  12182. #endif /* __GNUC__ */
  12183. "mov r8, r9\n\t"
  12184. "add r8, r8, r10\n\t"
  12185. "cmp %[a], r8\n\t"
  12186. #ifdef __GNUC__
  12187. "ble 2b\n\t"
  12188. #else
  12189. "ble.n 2b\n\t"
  12190. #endif /* __GNUC__ */
  12191. "\n3:\n\t"
  12192. "mov %[r], r11\n\t"
  12193. "mov r8, r9\n\t"
  12194. "str r3, [%[r], r8]\n\t"
  12195. "mov r3, r4\n\t"
  12196. "mov r4, r5\n\t"
  12197. "mov r5, #0\n\t"
  12198. "add r8, r8, #4\n\t"
  12199. "mov r9, r8\n\t"
  12200. "mov r6, #3\n\t"
  12201. "lsl r6, r6, #8\n\t"
  12202. "add r6, r6, #248\n\t"
  12203. "cmp r8, r6\n\t"
  12204. #ifdef __GNUC__
  12205. "ble 1b\n\t"
  12206. #else
  12207. "ble.n 1b\n\t"
  12208. #endif /* __GNUC__ */
  12209. "mov %[a], r10\n\t"
  12210. "str r3, [%[r], r8]\n\t"
  12211. "mov %[r], r12\n\t"
  12212. "mov %[a], r11\n\t"
  12213. "mov r3, #3\n\t"
  12214. "lsl r3, r3, #8\n\t"
  12215. "add r3, r3, #252\n\t"
  12216. "\n4:\n\t"
  12217. "ldr r6, [%[a], r3]\n\t"
  12218. "str r6, [%[r], r3]\n\t"
  12219. "subs r3, r3, #4\n\t"
  12220. #ifdef __GNUC__
  12221. "bge 4b\n\t"
  12222. #else
  12223. "bge.n 4b\n\t"
  12224. #endif /* __GNUC__ */
  12225. "mov r6, #4\n\t"
  12226. "lsl r6, r6, #8\n\t"
  12227. "add sp, sp, r6\n\t"
  12228. :
  12229. : [r] "r" (r), [a] "r" (a)
  12230. : "memory", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12"
  12231. );
  12232. }
  12233. #endif /* WOLFSSL_SP_SMALL */
  12234. /* Caclulate the bottom digit of -1/a mod 2^n.
  12235. *
  12236. * a A single precision number.
  12237. * rho Bottom word of inverse.
  12238. */
  12239. static void sp_4096_mont_setup(const sp_digit* a, sp_digit* rho)
  12240. {
  12241. sp_digit x;
  12242. sp_digit b;
  12243. b = a[0];
  12244. x = (((b + 2) & 4) << 1) + b; /* here x*a==1 mod 2**4 */
  12245. x *= 2 - b * x; /* here x*a==1 mod 2**8 */
  12246. x *= 2 - b * x; /* here x*a==1 mod 2**16 */
  12247. x *= 2 - b * x; /* here x*a==1 mod 2**32 */
  12248. /* rho = -1/m mod b */
  12249. *rho = (sp_digit)0 - x;
  12250. }
  12251. /* Mul a by digit b into r. (r = a * b)
  12252. *
  12253. * r A single precision integer.
  12254. * a A single precision integer.
  12255. * b A single precision digit.
  12256. */
  12257. SP_NOINLINE static void sp_4096_mul_d_128(sp_digit* r, const sp_digit* a,
  12258. sp_digit b)
  12259. {
  12260. __asm__ __volatile__ (
  12261. "add r9, %[a], #512\n\t"
  12262. /* A[0] * B */
  12263. "ldr r6, [%[a]], #4\n\t"
  12264. "umull r5, r3, r6, %[b]\n\t"
  12265. "mov r4, #0\n\t"
  12266. "str r5, [%[r]], #4\n\t"
  12267. /* A[0] * B - Done */
  12268. "\n1:\n\t"
  12269. "mov r5, #0\n\t"
  12270. /* A[] * B */
  12271. "ldr r6, [%[a]], #4\n\t"
  12272. "umull r6, r8, r6, %[b]\n\t"
  12273. "adds r3, r3, r6\n\t"
  12274. "adcs r4, r4, r8\n\t"
  12275. "adc r5, r5, #0\n\t"
  12276. /* A[] * B - Done */
  12277. "str r3, [%[r]], #4\n\t"
  12278. "mov r3, r4\n\t"
  12279. "mov r4, r5\n\t"
  12280. "cmp %[a], r9\n\t"
  12281. #ifdef __GNUC__
  12282. "blt 1b\n\t"
  12283. #else
  12284. "blt.n 1b\n\t"
  12285. #endif /* __GNUC__ */
  12286. "str r3, [%[r]]\n\t"
  12287. : [r] "+r" (r), [a] "+r" (a)
  12288. : [b] "r" (b)
  12289. : "memory", "r3", "r4", "r5", "r6", "r8", "r9"
  12290. );
  12291. }
  12292. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || defined(WOLFSSL_HAVE_SP_DH)
  12293. /* r = 2^n mod m where n is the number of bits to reduce by.
  12294. * Given m must be 4096 bits, just need to subtract.
  12295. *
  12296. * r A single precision number.
  12297. * m A single precision number.
  12298. */
  12299. static void sp_4096_mont_norm_128(sp_digit* r, const sp_digit* m)
  12300. {
  12301. XMEMSET(r, 0, sizeof(sp_digit) * 128);
  12302. /* r = 2^n mod m */
  12303. sp_4096_sub_in_place_128(r, m);
  12304. }
  12305. #endif /* (WOLFSSL_HAVE_SP_RSA & !WOLFSSL_RSA_PUBLIC_ONLY) | WOLFSSL_HAVE_SP_DH */
  12306. /* Conditionally subtract b from a using the mask m.
  12307. * m is -1 to subtract and 0 when not copying.
  12308. *
  12309. * r A single precision number representing condition subtract result.
  12310. * a A single precision number to subtract from.
  12311. * b A single precision number to subtract.
  12312. * m Mask value to apply.
  12313. */
  12314. SP_NOINLINE static sp_digit sp_4096_cond_sub_128(sp_digit* r, const sp_digit* a,
  12315. const sp_digit* b, sp_digit m)
  12316. {
  12317. sp_digit c = 0;
  12318. __asm__ __volatile__ (
  12319. "mov r5, #2\n\t"
  12320. "lsl r5, r5, #8\n\t"
  12321. "mov r9, r5\n\t"
  12322. "mov r8, #0\n\t"
  12323. "\n1:\n\t"
  12324. "ldr r6, [%[b], r8]\n\t"
  12325. "and r6, r6, %[m]\n\t"
  12326. "mov r5, #0\n\t"
  12327. "subs r5, r5, %[c]\n\t"
  12328. "ldr r5, [%[a], r8]\n\t"
  12329. "sbcs r5, r5, r6\n\t"
  12330. "sbcs %[c], %[c], %[c]\n\t"
  12331. "str r5, [%[r], r8]\n\t"
  12332. "add r8, r8, #4\n\t"
  12333. "cmp r8, r9\n\t"
  12334. #ifdef __GNUC__
  12335. "blt 1b\n\t"
  12336. #else
  12337. "blt.n 1b\n\t"
  12338. #endif /* __GNUC__ */
  12339. : [c] "+r" (c)
  12340. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  12341. : "memory", "r5", "r6", "r8", "r9"
  12342. );
  12343. return c;
  12344. }
  12345. /* Reduce the number back to 4096 bits using Montgomery reduction.
  12346. *
  12347. * a A single precision number to reduce in place.
  12348. * m The single precision number representing the modulus.
  12349. * mp The digit representing the negative inverse of m mod 2^n.
  12350. */
  12351. SP_NOINLINE static void sp_4096_mont_reduce_128(sp_digit* a, const sp_digit* m,
  12352. sp_digit mp)
  12353. {
  12354. sp_digit ca = 0;
  12355. __asm__ __volatile__ (
  12356. "mov r9, %[mp]\n\t"
  12357. "mov r12, %[m]\n\t"
  12358. "mov r10, %[a]\n\t"
  12359. "mov r4, #0\n\t"
  12360. "add r11, r10, #512\n\t"
  12361. "\n1:\n\t"
  12362. /* mu = a[i] * mp */
  12363. "mov %[mp], r9\n\t"
  12364. "ldr %[a], [r10]\n\t"
  12365. "mul %[mp], %[mp], %[a]\n\t"
  12366. "mov %[m], r12\n\t"
  12367. "add r14, r10, #504\n\t"
  12368. "\n2:\n\t"
  12369. /* a[i+j] += m[j] * mu */
  12370. "ldr %[a], [r10]\n\t"
  12371. "mov r5, #0\n\t"
  12372. /* Multiply m[j] and mu - Start */
  12373. "ldr r8, [%[m]], #4\n\t"
  12374. "umull r6, r8, %[mp], r8\n\t"
  12375. "adds %[a], %[a], r6\n\t"
  12376. "adc r5, r5, r8\n\t"
  12377. /* Multiply m[j] and mu - Done */
  12378. "adds r4, r4, %[a]\n\t"
  12379. "adc r5, r5, #0\n\t"
  12380. "str r4, [r10], #4\n\t"
  12381. /* a[i+j+1] += m[j+1] * mu */
  12382. "ldr %[a], [r10]\n\t"
  12383. "mov r4, #0\n\t"
  12384. /* Multiply m[j] and mu - Start */
  12385. "ldr r8, [%[m]], #4\n\t"
  12386. "umull r6, r8, %[mp], r8\n\t"
  12387. "adds %[a], %[a], r6\n\t"
  12388. "adc r4, r4, r8\n\t"
  12389. /* Multiply m[j] and mu - Done */
  12390. "adds r5, r5, %[a]\n\t"
  12391. "adc r4, r4, #0\n\t"
  12392. "str r5, [r10], #4\n\t"
  12393. "cmp r10, r14\n\t"
  12394. #ifdef __GNUC__
  12395. "blt 2b\n\t"
  12396. #else
  12397. "blt.n 2b\n\t"
  12398. #endif /* __GNUC__ */
  12399. /* a[i+126] += m[126] * mu */
  12400. "ldr %[a], [r10]\n\t"
  12401. "mov r5, #0\n\t"
  12402. /* Multiply m[j] and mu - Start */
  12403. "ldr r8, [%[m]], #4\n\t"
  12404. "umull r6, r8, %[mp], r8\n\t"
  12405. "adds %[a], %[a], r6\n\t"
  12406. "adc r5, r5, r8\n\t"
  12407. /* Multiply m[j] and mu - Done */
  12408. "adds r4, r4, %[a]\n\t"
  12409. "adc r5, r5, #0\n\t"
  12410. "str r4, [r10], #4\n\t"
  12411. /* a[i+127] += m[127] * mu */
  12412. "mov r4, %[ca]\n\t"
  12413. "mov %[ca], #0\n\t"
  12414. /* Multiply m[127] and mu - Start */
  12415. "ldr r8, [%[m]]\n\t"
  12416. "umull r6, r8, %[mp], r8\n\t"
  12417. "adds r5, r5, r6\n\t"
  12418. "adcs r4, r4, r8\n\t"
  12419. "adc %[ca], %[ca], #0\n\t"
  12420. /* Multiply m[127] and mu - Done */
  12421. "ldr r6, [r10]\n\t"
  12422. "ldr r8, [r10, #4]\n\t"
  12423. "adds r6, r6, r5\n\t"
  12424. "adcs r8, r8, r4\n\t"
  12425. "adc %[ca], %[ca], #0\n\t"
  12426. "str r6, [r10]\n\t"
  12427. "str r8, [r10, #4]\n\t"
  12428. /* Next word in a */
  12429. "sub r10, r10, #504\n\t"
  12430. "cmp r10, r11\n\t"
  12431. #ifdef __GNUC__
  12432. "blt 1b\n\t"
  12433. #else
  12434. "blt.n 1b\n\t"
  12435. #endif /* __GNUC__ */
  12436. "mov %[a], r10\n\t"
  12437. "mov %[m], r12\n\t"
  12438. : [ca] "+r" (ca), [a] "+r" (a)
  12439. : [m] "r" (m), [mp] "r" (mp)
  12440. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  12441. );
  12442. sp_4096_cond_sub_128(a - 128, a, m, (sp_digit)0 - ca);
  12443. }
  12444. /* Multiply two Montgomery form numbers mod the modulus (prime).
  12445. * (r = a * b mod m)
  12446. *
  12447. * r Result of multiplication.
  12448. * a First number to multiply in Montgomery form.
  12449. * b Second number to multiply in Montgomery form.
  12450. * m Modulus (prime).
  12451. * mp Montgomery mulitplier.
  12452. */
  12453. SP_NOINLINE static void sp_4096_mont_mul_128(sp_digit* r, const sp_digit* a,
  12454. const sp_digit* b, const sp_digit* m, sp_digit mp)
  12455. {
  12456. sp_4096_mul_128(r, a, b);
  12457. sp_4096_mont_reduce_128(r, m, mp);
  12458. }
  12459. /* Square the Montgomery form number. (r = a * a mod m)
  12460. *
  12461. * r Result of squaring.
  12462. * a Number to square in Montgomery form.
  12463. * m Modulus (prime).
  12464. * mp Montgomery mulitplier.
  12465. */
  12466. SP_NOINLINE static void sp_4096_mont_sqr_128(sp_digit* r, const sp_digit* a,
  12467. const sp_digit* m, sp_digit mp)
  12468. {
  12469. sp_4096_sqr_128(r, a);
  12470. sp_4096_mont_reduce_128(r, m, mp);
  12471. }
  12472. #ifdef WOLFSSL_SP_SMALL
  12473. /* Sub b from a into r. (r = a - b)
  12474. *
  12475. * r A single precision integer.
  12476. * a A single precision integer.
  12477. * b A single precision integer.
  12478. */
  12479. SP_NOINLINE static sp_digit sp_4096_sub_128(sp_digit* r, const sp_digit* a,
  12480. const sp_digit* b)
  12481. {
  12482. sp_digit c = 0;
  12483. __asm__ __volatile__ (
  12484. "mov r6, %[a]\n\t"
  12485. "mov r5, #2\n\t"
  12486. "lsl r5, r5, #8\n\t"
  12487. "add r6, r6, r5\n\t"
  12488. "\n1:\n\t"
  12489. "mov r5, #0\n\t"
  12490. "subs r5, r5, %[c]\n\t"
  12491. "ldr r4, [%[a]]\n\t"
  12492. "ldr r5, [%[b]]\n\t"
  12493. "sbcs r4, r4, r5\n\t"
  12494. "str r4, [%[r]]\n\t"
  12495. "sbc %[c], %[c], %[c]\n\t"
  12496. "add %[a], %[a], #4\n\t"
  12497. "add %[b], %[b], #4\n\t"
  12498. "add %[r], %[r], #4\n\t"
  12499. "cmp %[a], r6\n\t"
  12500. #ifdef __GNUC__
  12501. "bne 1b\n\t"
  12502. #else
  12503. "bne.n 1b\n\t"
  12504. #endif /* __GNUC__ */
  12505. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  12506. :
  12507. : "memory", "r4", "r5", "r6"
  12508. );
  12509. return c;
  12510. }
  12511. #else
  12512. /* Sub b from a into r. (r = a - b)
  12513. *
  12514. * r A single precision integer.
  12515. * a A single precision integer.
  12516. * b A single precision integer.
  12517. */
  12518. SP_NOINLINE static sp_digit sp_4096_sub_128(sp_digit* r, const sp_digit* a,
  12519. const sp_digit* b)
  12520. {
  12521. sp_digit c = 0;
  12522. __asm__ __volatile__ (
  12523. "ldm %[a]!, {r4, r5}\n\t"
  12524. "ldm %[b]!, {r6, r8}\n\t"
  12525. "subs r4, r4, r6\n\t"
  12526. "sbcs r5, r5, r8\n\t"
  12527. "stm %[r]!, {r4, r5}\n\t"
  12528. "ldm %[a]!, {r4, r5}\n\t"
  12529. "ldm %[b]!, {r6, r8}\n\t"
  12530. "sbcs r4, r4, r6\n\t"
  12531. "sbcs r5, r5, r8\n\t"
  12532. "stm %[r]!, {r4, r5}\n\t"
  12533. "ldm %[a]!, {r4, r5}\n\t"
  12534. "ldm %[b]!, {r6, r8}\n\t"
  12535. "sbcs r4, r4, r6\n\t"
  12536. "sbcs r5, r5, r8\n\t"
  12537. "stm %[r]!, {r4, r5}\n\t"
  12538. "ldm %[a]!, {r4, r5}\n\t"
  12539. "ldm %[b]!, {r6, r8}\n\t"
  12540. "sbcs r4, r4, r6\n\t"
  12541. "sbcs r5, r5, r8\n\t"
  12542. "stm %[r]!, {r4, r5}\n\t"
  12543. "ldm %[a]!, {r4, r5}\n\t"
  12544. "ldm %[b]!, {r6, r8}\n\t"
  12545. "sbcs r4, r4, r6\n\t"
  12546. "sbcs r5, r5, r8\n\t"
  12547. "stm %[r]!, {r4, r5}\n\t"
  12548. "ldm %[a]!, {r4, r5}\n\t"
  12549. "ldm %[b]!, {r6, r8}\n\t"
  12550. "sbcs r4, r4, r6\n\t"
  12551. "sbcs r5, r5, r8\n\t"
  12552. "stm %[r]!, {r4, r5}\n\t"
  12553. "ldm %[a]!, {r4, r5}\n\t"
  12554. "ldm %[b]!, {r6, r8}\n\t"
  12555. "sbcs r4, r4, r6\n\t"
  12556. "sbcs r5, r5, r8\n\t"
  12557. "stm %[r]!, {r4, r5}\n\t"
  12558. "ldm %[a]!, {r4, r5}\n\t"
  12559. "ldm %[b]!, {r6, r8}\n\t"
  12560. "sbcs r4, r4, r6\n\t"
  12561. "sbcs r5, r5, r8\n\t"
  12562. "stm %[r]!, {r4, r5}\n\t"
  12563. "ldm %[a]!, {r4, r5}\n\t"
  12564. "ldm %[b]!, {r6, r8}\n\t"
  12565. "sbcs r4, r4, r6\n\t"
  12566. "sbcs r5, r5, r8\n\t"
  12567. "stm %[r]!, {r4, r5}\n\t"
  12568. "ldm %[a]!, {r4, r5}\n\t"
  12569. "ldm %[b]!, {r6, r8}\n\t"
  12570. "sbcs r4, r4, r6\n\t"
  12571. "sbcs r5, r5, r8\n\t"
  12572. "stm %[r]!, {r4, r5}\n\t"
  12573. "ldm %[a]!, {r4, r5}\n\t"
  12574. "ldm %[b]!, {r6, r8}\n\t"
  12575. "sbcs r4, r4, r6\n\t"
  12576. "sbcs r5, r5, r8\n\t"
  12577. "stm %[r]!, {r4, r5}\n\t"
  12578. "ldm %[a]!, {r4, r5}\n\t"
  12579. "ldm %[b]!, {r6, r8}\n\t"
  12580. "sbcs r4, r4, r6\n\t"
  12581. "sbcs r5, r5, r8\n\t"
  12582. "stm %[r]!, {r4, r5}\n\t"
  12583. "ldm %[a]!, {r4, r5}\n\t"
  12584. "ldm %[b]!, {r6, r8}\n\t"
  12585. "sbcs r4, r4, r6\n\t"
  12586. "sbcs r5, r5, r8\n\t"
  12587. "stm %[r]!, {r4, r5}\n\t"
  12588. "ldm %[a]!, {r4, r5}\n\t"
  12589. "ldm %[b]!, {r6, r8}\n\t"
  12590. "sbcs r4, r4, r6\n\t"
  12591. "sbcs r5, r5, r8\n\t"
  12592. "stm %[r]!, {r4, r5}\n\t"
  12593. "ldm %[a]!, {r4, r5}\n\t"
  12594. "ldm %[b]!, {r6, r8}\n\t"
  12595. "sbcs r4, r4, r6\n\t"
  12596. "sbcs r5, r5, r8\n\t"
  12597. "stm %[r]!, {r4, r5}\n\t"
  12598. "ldm %[a]!, {r4, r5}\n\t"
  12599. "ldm %[b]!, {r6, r8}\n\t"
  12600. "sbcs r4, r4, r6\n\t"
  12601. "sbcs r5, r5, r8\n\t"
  12602. "stm %[r]!, {r4, r5}\n\t"
  12603. "ldm %[a]!, {r4, r5}\n\t"
  12604. "ldm %[b]!, {r6, r8}\n\t"
  12605. "sbcs r4, r4, r6\n\t"
  12606. "sbcs r5, r5, r8\n\t"
  12607. "stm %[r]!, {r4, r5}\n\t"
  12608. "ldm %[a]!, {r4, r5}\n\t"
  12609. "ldm %[b]!, {r6, r8}\n\t"
  12610. "sbcs r4, r4, r6\n\t"
  12611. "sbcs r5, r5, r8\n\t"
  12612. "stm %[r]!, {r4, r5}\n\t"
  12613. "ldm %[a]!, {r4, r5}\n\t"
  12614. "ldm %[b]!, {r6, r8}\n\t"
  12615. "sbcs r4, r4, r6\n\t"
  12616. "sbcs r5, r5, r8\n\t"
  12617. "stm %[r]!, {r4, r5}\n\t"
  12618. "ldm %[a]!, {r4, r5}\n\t"
  12619. "ldm %[b]!, {r6, r8}\n\t"
  12620. "sbcs r4, r4, r6\n\t"
  12621. "sbcs r5, r5, r8\n\t"
  12622. "stm %[r]!, {r4, r5}\n\t"
  12623. "ldm %[a]!, {r4, r5}\n\t"
  12624. "ldm %[b]!, {r6, r8}\n\t"
  12625. "sbcs r4, r4, r6\n\t"
  12626. "sbcs r5, r5, r8\n\t"
  12627. "stm %[r]!, {r4, r5}\n\t"
  12628. "ldm %[a]!, {r4, r5}\n\t"
  12629. "ldm %[b]!, {r6, r8}\n\t"
  12630. "sbcs r4, r4, r6\n\t"
  12631. "sbcs r5, r5, r8\n\t"
  12632. "stm %[r]!, {r4, r5}\n\t"
  12633. "ldm %[a]!, {r4, r5}\n\t"
  12634. "ldm %[b]!, {r6, r8}\n\t"
  12635. "sbcs r4, r4, r6\n\t"
  12636. "sbcs r5, r5, r8\n\t"
  12637. "stm %[r]!, {r4, r5}\n\t"
  12638. "ldm %[a]!, {r4, r5}\n\t"
  12639. "ldm %[b]!, {r6, r8}\n\t"
  12640. "sbcs r4, r4, r6\n\t"
  12641. "sbcs r5, r5, r8\n\t"
  12642. "stm %[r]!, {r4, r5}\n\t"
  12643. "ldm %[a]!, {r4, r5}\n\t"
  12644. "ldm %[b]!, {r6, r8}\n\t"
  12645. "sbcs r4, r4, r6\n\t"
  12646. "sbcs r5, r5, r8\n\t"
  12647. "stm %[r]!, {r4, r5}\n\t"
  12648. "ldm %[a]!, {r4, r5}\n\t"
  12649. "ldm %[b]!, {r6, r8}\n\t"
  12650. "sbcs r4, r4, r6\n\t"
  12651. "sbcs r5, r5, r8\n\t"
  12652. "stm %[r]!, {r4, r5}\n\t"
  12653. "ldm %[a]!, {r4, r5}\n\t"
  12654. "ldm %[b]!, {r6, r8}\n\t"
  12655. "sbcs r4, r4, r6\n\t"
  12656. "sbcs r5, r5, r8\n\t"
  12657. "stm %[r]!, {r4, r5}\n\t"
  12658. "ldm %[a]!, {r4, r5}\n\t"
  12659. "ldm %[b]!, {r6, r8}\n\t"
  12660. "sbcs r4, r4, r6\n\t"
  12661. "sbcs r5, r5, r8\n\t"
  12662. "stm %[r]!, {r4, r5}\n\t"
  12663. "ldm %[a]!, {r4, r5}\n\t"
  12664. "ldm %[b]!, {r6, r8}\n\t"
  12665. "sbcs r4, r4, r6\n\t"
  12666. "sbcs r5, r5, r8\n\t"
  12667. "stm %[r]!, {r4, r5}\n\t"
  12668. "ldm %[a]!, {r4, r5}\n\t"
  12669. "ldm %[b]!, {r6, r8}\n\t"
  12670. "sbcs r4, r4, r6\n\t"
  12671. "sbcs r5, r5, r8\n\t"
  12672. "stm %[r]!, {r4, r5}\n\t"
  12673. "ldm %[a]!, {r4, r5}\n\t"
  12674. "ldm %[b]!, {r6, r8}\n\t"
  12675. "sbcs r4, r4, r6\n\t"
  12676. "sbcs r5, r5, r8\n\t"
  12677. "stm %[r]!, {r4, r5}\n\t"
  12678. "ldm %[a]!, {r4, r5}\n\t"
  12679. "ldm %[b]!, {r6, r8}\n\t"
  12680. "sbcs r4, r4, r6\n\t"
  12681. "sbcs r5, r5, r8\n\t"
  12682. "stm %[r]!, {r4, r5}\n\t"
  12683. "ldm %[a]!, {r4, r5}\n\t"
  12684. "ldm %[b]!, {r6, r8}\n\t"
  12685. "sbcs r4, r4, r6\n\t"
  12686. "sbcs r5, r5, r8\n\t"
  12687. "stm %[r]!, {r4, r5}\n\t"
  12688. "ldm %[a]!, {r4, r5}\n\t"
  12689. "ldm %[b]!, {r6, r8}\n\t"
  12690. "sbcs r4, r4, r6\n\t"
  12691. "sbcs r5, r5, r8\n\t"
  12692. "stm %[r]!, {r4, r5}\n\t"
  12693. "ldm %[a]!, {r4, r5}\n\t"
  12694. "ldm %[b]!, {r6, r8}\n\t"
  12695. "sbcs r4, r4, r6\n\t"
  12696. "sbcs r5, r5, r8\n\t"
  12697. "stm %[r]!, {r4, r5}\n\t"
  12698. "ldm %[a]!, {r4, r5}\n\t"
  12699. "ldm %[b]!, {r6, r8}\n\t"
  12700. "sbcs r4, r4, r6\n\t"
  12701. "sbcs r5, r5, r8\n\t"
  12702. "stm %[r]!, {r4, r5}\n\t"
  12703. "ldm %[a]!, {r4, r5}\n\t"
  12704. "ldm %[b]!, {r6, r8}\n\t"
  12705. "sbcs r4, r4, r6\n\t"
  12706. "sbcs r5, r5, r8\n\t"
  12707. "stm %[r]!, {r4, r5}\n\t"
  12708. "ldm %[a]!, {r4, r5}\n\t"
  12709. "ldm %[b]!, {r6, r8}\n\t"
  12710. "sbcs r4, r4, r6\n\t"
  12711. "sbcs r5, r5, r8\n\t"
  12712. "stm %[r]!, {r4, r5}\n\t"
  12713. "ldm %[a]!, {r4, r5}\n\t"
  12714. "ldm %[b]!, {r6, r8}\n\t"
  12715. "sbcs r4, r4, r6\n\t"
  12716. "sbcs r5, r5, r8\n\t"
  12717. "stm %[r]!, {r4, r5}\n\t"
  12718. "ldm %[a]!, {r4, r5}\n\t"
  12719. "ldm %[b]!, {r6, r8}\n\t"
  12720. "sbcs r4, r4, r6\n\t"
  12721. "sbcs r5, r5, r8\n\t"
  12722. "stm %[r]!, {r4, r5}\n\t"
  12723. "ldm %[a]!, {r4, r5}\n\t"
  12724. "ldm %[b]!, {r6, r8}\n\t"
  12725. "sbcs r4, r4, r6\n\t"
  12726. "sbcs r5, r5, r8\n\t"
  12727. "stm %[r]!, {r4, r5}\n\t"
  12728. "ldm %[a]!, {r4, r5}\n\t"
  12729. "ldm %[b]!, {r6, r8}\n\t"
  12730. "sbcs r4, r4, r6\n\t"
  12731. "sbcs r5, r5, r8\n\t"
  12732. "stm %[r]!, {r4, r5}\n\t"
  12733. "ldm %[a]!, {r4, r5}\n\t"
  12734. "ldm %[b]!, {r6, r8}\n\t"
  12735. "sbcs r4, r4, r6\n\t"
  12736. "sbcs r5, r5, r8\n\t"
  12737. "stm %[r]!, {r4, r5}\n\t"
  12738. "ldm %[a]!, {r4, r5}\n\t"
  12739. "ldm %[b]!, {r6, r8}\n\t"
  12740. "sbcs r4, r4, r6\n\t"
  12741. "sbcs r5, r5, r8\n\t"
  12742. "stm %[r]!, {r4, r5}\n\t"
  12743. "ldm %[a]!, {r4, r5}\n\t"
  12744. "ldm %[b]!, {r6, r8}\n\t"
  12745. "sbcs r4, r4, r6\n\t"
  12746. "sbcs r5, r5, r8\n\t"
  12747. "stm %[r]!, {r4, r5}\n\t"
  12748. "ldm %[a]!, {r4, r5}\n\t"
  12749. "ldm %[b]!, {r6, r8}\n\t"
  12750. "sbcs r4, r4, r6\n\t"
  12751. "sbcs r5, r5, r8\n\t"
  12752. "stm %[r]!, {r4, r5}\n\t"
  12753. "ldm %[a]!, {r4, r5}\n\t"
  12754. "ldm %[b]!, {r6, r8}\n\t"
  12755. "sbcs r4, r4, r6\n\t"
  12756. "sbcs r5, r5, r8\n\t"
  12757. "stm %[r]!, {r4, r5}\n\t"
  12758. "ldm %[a]!, {r4, r5}\n\t"
  12759. "ldm %[b]!, {r6, r8}\n\t"
  12760. "sbcs r4, r4, r6\n\t"
  12761. "sbcs r5, r5, r8\n\t"
  12762. "stm %[r]!, {r4, r5}\n\t"
  12763. "ldm %[a]!, {r4, r5}\n\t"
  12764. "ldm %[b]!, {r6, r8}\n\t"
  12765. "sbcs r4, r4, r6\n\t"
  12766. "sbcs r5, r5, r8\n\t"
  12767. "stm %[r]!, {r4, r5}\n\t"
  12768. "ldm %[a]!, {r4, r5}\n\t"
  12769. "ldm %[b]!, {r6, r8}\n\t"
  12770. "sbcs r4, r4, r6\n\t"
  12771. "sbcs r5, r5, r8\n\t"
  12772. "stm %[r]!, {r4, r5}\n\t"
  12773. "ldm %[a]!, {r4, r5}\n\t"
  12774. "ldm %[b]!, {r6, r8}\n\t"
  12775. "sbcs r4, r4, r6\n\t"
  12776. "sbcs r5, r5, r8\n\t"
  12777. "stm %[r]!, {r4, r5}\n\t"
  12778. "ldm %[a]!, {r4, r5}\n\t"
  12779. "ldm %[b]!, {r6, r8}\n\t"
  12780. "sbcs r4, r4, r6\n\t"
  12781. "sbcs r5, r5, r8\n\t"
  12782. "stm %[r]!, {r4, r5}\n\t"
  12783. "ldm %[a]!, {r4, r5}\n\t"
  12784. "ldm %[b]!, {r6, r8}\n\t"
  12785. "sbcs r4, r4, r6\n\t"
  12786. "sbcs r5, r5, r8\n\t"
  12787. "stm %[r]!, {r4, r5}\n\t"
  12788. "ldm %[a]!, {r4, r5}\n\t"
  12789. "ldm %[b]!, {r6, r8}\n\t"
  12790. "sbcs r4, r4, r6\n\t"
  12791. "sbcs r5, r5, r8\n\t"
  12792. "stm %[r]!, {r4, r5}\n\t"
  12793. "ldm %[a]!, {r4, r5}\n\t"
  12794. "ldm %[b]!, {r6, r8}\n\t"
  12795. "sbcs r4, r4, r6\n\t"
  12796. "sbcs r5, r5, r8\n\t"
  12797. "stm %[r]!, {r4, r5}\n\t"
  12798. "ldm %[a]!, {r4, r5}\n\t"
  12799. "ldm %[b]!, {r6, r8}\n\t"
  12800. "sbcs r4, r4, r6\n\t"
  12801. "sbcs r5, r5, r8\n\t"
  12802. "stm %[r]!, {r4, r5}\n\t"
  12803. "ldm %[a]!, {r4, r5}\n\t"
  12804. "ldm %[b]!, {r6, r8}\n\t"
  12805. "sbcs r4, r4, r6\n\t"
  12806. "sbcs r5, r5, r8\n\t"
  12807. "stm %[r]!, {r4, r5}\n\t"
  12808. "ldm %[a]!, {r4, r5}\n\t"
  12809. "ldm %[b]!, {r6, r8}\n\t"
  12810. "sbcs r4, r4, r6\n\t"
  12811. "sbcs r5, r5, r8\n\t"
  12812. "stm %[r]!, {r4, r5}\n\t"
  12813. "ldm %[a]!, {r4, r5}\n\t"
  12814. "ldm %[b]!, {r6, r8}\n\t"
  12815. "sbcs r4, r4, r6\n\t"
  12816. "sbcs r5, r5, r8\n\t"
  12817. "stm %[r]!, {r4, r5}\n\t"
  12818. "ldm %[a]!, {r4, r5}\n\t"
  12819. "ldm %[b]!, {r6, r8}\n\t"
  12820. "sbcs r4, r4, r6\n\t"
  12821. "sbcs r5, r5, r8\n\t"
  12822. "stm %[r]!, {r4, r5}\n\t"
  12823. "ldm %[a]!, {r4, r5}\n\t"
  12824. "ldm %[b]!, {r6, r8}\n\t"
  12825. "sbcs r4, r4, r6\n\t"
  12826. "sbcs r5, r5, r8\n\t"
  12827. "stm %[r]!, {r4, r5}\n\t"
  12828. "ldm %[a]!, {r4, r5}\n\t"
  12829. "ldm %[b]!, {r6, r8}\n\t"
  12830. "sbcs r4, r4, r6\n\t"
  12831. "sbcs r5, r5, r8\n\t"
  12832. "stm %[r]!, {r4, r5}\n\t"
  12833. "ldm %[a]!, {r4, r5}\n\t"
  12834. "ldm %[b]!, {r6, r8}\n\t"
  12835. "sbcs r4, r4, r6\n\t"
  12836. "sbcs r5, r5, r8\n\t"
  12837. "stm %[r]!, {r4, r5}\n\t"
  12838. "ldm %[a]!, {r4, r5}\n\t"
  12839. "ldm %[b]!, {r6, r8}\n\t"
  12840. "sbcs r4, r4, r6\n\t"
  12841. "sbcs r5, r5, r8\n\t"
  12842. "stm %[r]!, {r4, r5}\n\t"
  12843. "sbc %[c], %[c], %[c]\n\t"
  12844. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  12845. :
  12846. : "memory", "r4", "r5", "r6", "r8"
  12847. );
  12848. return c;
  12849. }
  12850. #endif /* WOLFSSL_SP_SMALL */
  12851. /* Divide the double width number (d1|d0) by the divisor. (d1|d0 / div)
  12852. *
  12853. * d1 The high order half of the number to divide.
  12854. * d0 The low order half of the number to divide.
  12855. * div The divisor.
  12856. * returns the result of the division.
  12857. *
  12858. * Note that this is an approximate div. It may give an answer 1 larger.
  12859. */
  12860. SP_NOINLINE static sp_digit div_4096_word_128(sp_digit d1, sp_digit d0,
  12861. sp_digit div)
  12862. {
  12863. sp_digit r = 0;
  12864. __asm__ __volatile__ (
  12865. "lsr r6, %[div], #16\n\t"
  12866. "add r6, r6, #1\n\t"
  12867. "udiv r4, %[d1], r6\n\t"
  12868. "lsl r8, r4, #16\n\t"
  12869. "umull r4, r5, %[div], r8\n\t"
  12870. "subs %[d0], %[d0], r4\n\t"
  12871. "sbc %[d1], %[d1], r5\n\t"
  12872. "udiv r5, %[d1], r6\n\t"
  12873. "lsl r4, r5, #16\n\t"
  12874. "add r8, r8, r4\n\t"
  12875. "umull r4, r5, %[div], r4\n\t"
  12876. "subs %[d0], %[d0], r4\n\t"
  12877. "sbc %[d1], %[d1], r5\n\t"
  12878. "lsl r4, %[d1], #16\n\t"
  12879. "orr r4, r4, %[d0], lsr #16\n\t"
  12880. "udiv r4, r4, r6\n\t"
  12881. "add r8, r8, r4\n\t"
  12882. "umull r4, r5, %[div], r4\n\t"
  12883. "subs %[d0], %[d0], r4\n\t"
  12884. "sbc %[d1], %[d1], r5\n\t"
  12885. "lsl r4, %[d1], #16\n\t"
  12886. "orr r4, r4, %[d0], lsr #16\n\t"
  12887. "udiv r4, r4, r6\n\t"
  12888. "add r8, r8, r4\n\t"
  12889. "umull r4, r5, %[div], r4\n\t"
  12890. "subs %[d0], %[d0], r4\n\t"
  12891. "sbc %[d1], %[d1], r5\n\t"
  12892. "udiv r4, %[d0], %[div]\n\t"
  12893. "add r8, r8, r4\n\t"
  12894. "mov %[r], r8\n\t"
  12895. : [r] "+r" (r)
  12896. : [d1] "r" (d1), [d0] "r" (d0), [div] "r" (div)
  12897. : "r4", "r5", "r6", "r8"
  12898. );
  12899. return r;
  12900. }
  12901. /* Divide d in a and put remainder into r (m*d + r = a)
  12902. * m is not calculated as it is not needed at this time.
  12903. *
  12904. * a Number to be divided.
  12905. * d Number to divide with.
  12906. * m Multiplier result.
  12907. * r Remainder from the division.
  12908. * returns MP_OKAY indicating success.
  12909. */
  12910. static WC_INLINE int sp_4096_div_128_cond(const sp_digit* a, const sp_digit* d, sp_digit* m,
  12911. sp_digit* r)
  12912. {
  12913. sp_digit t1[256], t2[129];
  12914. sp_digit div, r1;
  12915. int i;
  12916. (void)m;
  12917. div = d[127];
  12918. XMEMCPY(t1, a, sizeof(*t1) * 2 * 128);
  12919. for (i = 127; i > 0; i--) {
  12920. if (t1[i + 128] != d[i])
  12921. break;
  12922. }
  12923. if (t1[i + 128] >= d[i]) {
  12924. sp_4096_sub_in_place_128(&t1[128], d);
  12925. }
  12926. for (i = 127; i >= 0; i--) {
  12927. if (t1[128 + i] == div) {
  12928. r1 = SP_DIGIT_MAX;
  12929. }
  12930. else {
  12931. r1 = div_4096_word_128(t1[128 + i], t1[128 + i - 1], div);
  12932. }
  12933. sp_4096_mul_d_128(t2, d, r1);
  12934. t1[128 + i] += sp_4096_sub_in_place_128(&t1[i], t2);
  12935. t1[128 + i] -= t2[128];
  12936. if (t1[128 + i] != 0) {
  12937. t1[128 + i] += sp_4096_add_128(&t1[i], &t1[i], d);
  12938. if (t1[128 + i] != 0)
  12939. t1[128 + i] += sp_4096_add_128(&t1[i], &t1[i], d);
  12940. }
  12941. }
  12942. for (i = 127; i > 0; i--) {
  12943. if (t1[i] != d[i])
  12944. break;
  12945. }
  12946. if (t1[i] >= d[i]) {
  12947. sp_4096_sub_128(r, t1, d);
  12948. }
  12949. else {
  12950. XMEMCPY(r, t1, sizeof(*t1) * 128);
  12951. }
  12952. return MP_OKAY;
  12953. }
  12954. /* Reduce a modulo m into r. (r = a mod m)
  12955. *
  12956. * r A single precision number that is the reduced result.
  12957. * a A single precision number that is to be reduced.
  12958. * m A single precision number that is the modulus to reduce with.
  12959. * returns MP_OKAY indicating success.
  12960. */
  12961. static WC_INLINE int sp_4096_mod_128_cond(sp_digit* r, const sp_digit* a, const sp_digit* m)
  12962. {
  12963. return sp_4096_div_128_cond(a, m, NULL, r);
  12964. }
  12965. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || defined(WOLFSSL_HAVE_SP_DH)
  12966. /* AND m into each word of a and store in r.
  12967. *
  12968. * r A single precision integer.
  12969. * a A single precision integer.
  12970. * m Mask to AND against each digit.
  12971. */
  12972. static void sp_4096_mask_128(sp_digit* r, const sp_digit* a, sp_digit m)
  12973. {
  12974. #ifdef WOLFSSL_SP_SMALL
  12975. int i;
  12976. for (i=0; i<128; i++) {
  12977. r[i] = a[i] & m;
  12978. }
  12979. #else
  12980. int i;
  12981. for (i = 0; i < 128; i += 8) {
  12982. r[i+0] = a[i+0] & m;
  12983. r[i+1] = a[i+1] & m;
  12984. r[i+2] = a[i+2] & m;
  12985. r[i+3] = a[i+3] & m;
  12986. r[i+4] = a[i+4] & m;
  12987. r[i+5] = a[i+5] & m;
  12988. r[i+6] = a[i+6] & m;
  12989. r[i+7] = a[i+7] & m;
  12990. }
  12991. #endif
  12992. }
  12993. /* Compare a with b in constant time.
  12994. *
  12995. * a A single precision integer.
  12996. * b A single precision integer.
  12997. * return -ve, 0 or +ve if a is less than, equal to or greater than b
  12998. * respectively.
  12999. */
  13000. SP_NOINLINE static sp_int32 sp_4096_cmp_128(const sp_digit* a, const sp_digit* b)
  13001. {
  13002. sp_digit r = 0;
  13003. __asm__ __volatile__ (
  13004. "mov r3, #0\n\t"
  13005. "mvn r3, r3\n\t"
  13006. "mov r6, #1\n\t"
  13007. "lsl r6, r6, #8\n\t"
  13008. "add r6, r6, #252\n\t"
  13009. "\n1:\n\t"
  13010. "ldr r8, [%[a], r6]\n\t"
  13011. "ldr r5, [%[b], r6]\n\t"
  13012. "and r8, r8, r3\n\t"
  13013. "and r5, r5, r3\n\t"
  13014. "mov r4, r8\n\t"
  13015. "subs r8, r8, r5\n\t"
  13016. "sbc r8, r8, r8\n\t"
  13017. "add %[r], %[r], r8\n\t"
  13018. "mvn r8, r8\n\t"
  13019. "and r3, r3, r8\n\t"
  13020. "subs r5, r5, r4\n\t"
  13021. "sbc r8, r8, r8\n\t"
  13022. "sub %[r], %[r], r8\n\t"
  13023. "mvn r8, r8\n\t"
  13024. "and r3, r3, r8\n\t"
  13025. "sub r6, r6, #4\n\t"
  13026. "cmp r6, #0\n\t"
  13027. #ifdef __GNUC__
  13028. "bge 1b\n\t"
  13029. #else
  13030. "bge.n 1b\n\t"
  13031. #endif /* __GNUC__ */
  13032. : [r] "+r" (r)
  13033. : [a] "r" (a), [b] "r" (b)
  13034. : "r3", "r4", "r5", "r6", "r8"
  13035. );
  13036. return r;
  13037. }
  13038. /* Divide d in a and put remainder into r (m*d + r = a)
  13039. * m is not calculated as it is not needed at this time.
  13040. *
  13041. * a Number to be divided.
  13042. * d Number to divide with.
  13043. * m Multiplier result.
  13044. * r Remainder from the division.
  13045. * returns MP_OKAY indicating success.
  13046. */
  13047. static WC_INLINE int sp_4096_div_128(const sp_digit* a, const sp_digit* d, sp_digit* m,
  13048. sp_digit* r)
  13049. {
  13050. sp_digit t1[256], t2[129];
  13051. sp_digit div, r1;
  13052. int i;
  13053. (void)m;
  13054. div = d[127];
  13055. XMEMCPY(t1, a, sizeof(*t1) * 2 * 128);
  13056. r1 = sp_4096_cmp_128(&t1[128], d) >= 0;
  13057. sp_4096_cond_sub_128(&t1[128], &t1[128], d, (sp_digit)0 - r1);
  13058. for (i = 127; i >= 0; i--) {
  13059. sp_digit mask = 0 - (t1[128 + i] == div);
  13060. sp_digit hi = t1[128 + i] + mask;
  13061. r1 = div_4096_word_128(hi, t1[128 + i - 1], div);
  13062. r1 |= mask;
  13063. sp_4096_mul_d_128(t2, d, r1);
  13064. t1[128 + i] += sp_4096_sub_in_place_128(&t1[i], t2);
  13065. t1[128 + i] -= t2[128];
  13066. sp_4096_mask_128(t2, d, t1[128 + i]);
  13067. t1[128 + i] += sp_4096_add_128(&t1[i], &t1[i], t2);
  13068. sp_4096_mask_128(t2, d, t1[128 + i]);
  13069. t1[128 + i] += sp_4096_add_128(&t1[i], &t1[i], t2);
  13070. }
  13071. r1 = sp_4096_cmp_128(t1, d) >= 0;
  13072. sp_4096_cond_sub_128(r, t1, d, (sp_digit)0 - r1);
  13073. return MP_OKAY;
  13074. }
  13075. /* Reduce a modulo m into r. (r = a mod m)
  13076. *
  13077. * r A single precision number that is the reduced result.
  13078. * a A single precision number that is to be reduced.
  13079. * m A single precision number that is the modulus to reduce with.
  13080. * returns MP_OKAY indicating success.
  13081. */
  13082. static WC_INLINE int sp_4096_mod_128(sp_digit* r, const sp_digit* a, const sp_digit* m)
  13083. {
  13084. return sp_4096_div_128(a, m, NULL, r);
  13085. }
  13086. #if (defined(WOLFSSL_HAVE_SP_RSA) && !defined(WOLFSSL_RSA_PUBLIC_ONLY)) || \
  13087. defined(WOLFSSL_HAVE_SP_DH)
  13088. #ifdef WOLFSSL_SP_SMALL
  13089. /* Modular exponentiate a to the e mod m. (r = a^e mod m)
  13090. *
  13091. * r A single precision number that is the result of the operation.
  13092. * a A single precision number being exponentiated.
  13093. * e A single precision number that is the exponent.
  13094. * bits The number of bits in the exponent.
  13095. * m A single precision number that is the modulus.
  13096. * returns 0 on success.
  13097. * returns MEMORY_E on dynamic memory allocation failure.
  13098. * returns MP_VAL when base is even or exponent is 0.
  13099. */
  13100. static int sp_4096_mod_exp_128(sp_digit* r, const sp_digit* a, const sp_digit* e,
  13101. int bits, const sp_digit* m, int reduceA)
  13102. {
  13103. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13104. sp_digit* td = NULL;
  13105. #else
  13106. sp_digit td[8 * 256];
  13107. #endif
  13108. sp_digit* t[8];
  13109. sp_digit* norm = NULL;
  13110. sp_digit mp = 1;
  13111. sp_digit n;
  13112. sp_digit mask;
  13113. int i;
  13114. int c;
  13115. byte y;
  13116. int err = MP_OKAY;
  13117. if (bits == 0) {
  13118. err = MP_VAL;
  13119. }
  13120. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13121. if (err == MP_OKAY) {
  13122. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * (8 * 256), NULL,
  13123. DYNAMIC_TYPE_TMP_BUFFER);
  13124. if (td == NULL)
  13125. err = MEMORY_E;
  13126. }
  13127. #endif
  13128. if (err == MP_OKAY) {
  13129. norm = td;
  13130. for (i=0; i<8; i++) {
  13131. t[i] = td + i * 256;
  13132. }
  13133. sp_4096_mont_setup(m, &mp);
  13134. sp_4096_mont_norm_128(norm, m);
  13135. XMEMSET(t[1], 0, sizeof(sp_digit) * 128U);
  13136. if (reduceA != 0) {
  13137. err = sp_4096_mod_128(t[1] + 128, a, m);
  13138. if (err == MP_OKAY) {
  13139. err = sp_4096_mod_128(t[1], t[1], m);
  13140. }
  13141. }
  13142. else {
  13143. XMEMCPY(t[1] + 128, a, sizeof(sp_digit) * 128);
  13144. err = sp_4096_mod_128(t[1], t[1], m);
  13145. }
  13146. }
  13147. if (err == MP_OKAY) {
  13148. sp_4096_mont_sqr_128(t[ 2], t[ 1], m, mp);
  13149. sp_4096_mont_mul_128(t[ 3], t[ 2], t[ 1], m, mp);
  13150. sp_4096_mont_sqr_128(t[ 4], t[ 2], m, mp);
  13151. sp_4096_mont_mul_128(t[ 5], t[ 3], t[ 2], m, mp);
  13152. sp_4096_mont_sqr_128(t[ 6], t[ 3], m, mp);
  13153. sp_4096_mont_mul_128(t[ 7], t[ 4], t[ 3], m, mp);
  13154. i = (bits - 1) / 32;
  13155. n = e[i--];
  13156. c = bits & 31;
  13157. if (c == 0) {
  13158. c = 32;
  13159. }
  13160. c -= bits % 3;
  13161. if (c == 32) {
  13162. c = 29;
  13163. }
  13164. if (c < 0) {
  13165. /* Number of bits in top word is less than number needed. */
  13166. c = -c;
  13167. y = (byte)(n << c);
  13168. n = e[i--];
  13169. y |= (byte)(n >> (64 - c));
  13170. n <<= c;
  13171. c = 64 - c;
  13172. }
  13173. else if (c == 0) {
  13174. /* All bits in top word used. */
  13175. y = (byte)n;
  13176. }
  13177. else {
  13178. y = (byte)(n >> c);
  13179. n <<= 32 - c;
  13180. }
  13181. XMEMCPY(r, t[y], sizeof(sp_digit) * 128);
  13182. for (; i>=0 || c>=3; ) {
  13183. if (c == 0) {
  13184. n = e[i--];
  13185. y = (byte)(n >> 29);
  13186. n <<= 3;
  13187. c = 29;
  13188. }
  13189. else if (c < 3) {
  13190. y = (byte)(n >> 29);
  13191. n = e[i--];
  13192. c = 3 - c;
  13193. y |= (byte)(n >> (32 - c));
  13194. n <<= c;
  13195. c = 32 - c;
  13196. }
  13197. else {
  13198. y = (byte)((n >> 29) & 0x7);
  13199. n <<= 3;
  13200. c -= 3;
  13201. }
  13202. sp_4096_mont_sqr_128(r, r, m, mp);
  13203. sp_4096_mont_sqr_128(r, r, m, mp);
  13204. sp_4096_mont_sqr_128(r, r, m, mp);
  13205. sp_4096_mont_mul_128(r, r, t[y], m, mp);
  13206. }
  13207. XMEMSET(&r[128], 0, sizeof(sp_digit) * 128U);
  13208. sp_4096_mont_reduce_128(r, m, mp);
  13209. mask = 0 - (sp_4096_cmp_128(r, m) >= 0);
  13210. sp_4096_cond_sub_128(r, r, m, mask);
  13211. }
  13212. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13213. if (td != NULL)
  13214. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  13215. #endif
  13216. return err;
  13217. }
  13218. #else
  13219. /* Modular exponentiate a to the e mod m. (r = a^e mod m)
  13220. *
  13221. * r A single precision number that is the result of the operation.
  13222. * a A single precision number being exponentiated.
  13223. * e A single precision number that is the exponent.
  13224. * bits The number of bits in the exponent.
  13225. * m A single precision number that is the modulus.
  13226. * returns 0 on success.
  13227. * returns MEMORY_E on dynamic memory allocation failure.
  13228. * returns MP_VAL when base is even or exponent is 0.
  13229. */
  13230. static int sp_4096_mod_exp_128(sp_digit* r, const sp_digit* a, const sp_digit* e,
  13231. int bits, const sp_digit* m, int reduceA)
  13232. {
  13233. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13234. sp_digit* td = NULL;
  13235. #else
  13236. sp_digit td[16 * 256];
  13237. #endif
  13238. sp_digit* t[16];
  13239. sp_digit* norm = NULL;
  13240. sp_digit mp = 1;
  13241. sp_digit n;
  13242. sp_digit mask;
  13243. int i;
  13244. int c;
  13245. byte y;
  13246. int err = MP_OKAY;
  13247. if (bits == 0) {
  13248. err = MP_VAL;
  13249. }
  13250. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13251. if (err == MP_OKAY) {
  13252. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * (16 * 256), NULL,
  13253. DYNAMIC_TYPE_TMP_BUFFER);
  13254. if (td == NULL)
  13255. err = MEMORY_E;
  13256. }
  13257. #endif
  13258. if (err == MP_OKAY) {
  13259. norm = td;
  13260. for (i=0; i<16; i++) {
  13261. t[i] = td + i * 256;
  13262. }
  13263. sp_4096_mont_setup(m, &mp);
  13264. sp_4096_mont_norm_128(norm, m);
  13265. XMEMSET(t[1], 0, sizeof(sp_digit) * 128U);
  13266. if (reduceA != 0) {
  13267. err = sp_4096_mod_128(t[1] + 128, a, m);
  13268. if (err == MP_OKAY) {
  13269. err = sp_4096_mod_128(t[1], t[1], m);
  13270. }
  13271. }
  13272. else {
  13273. XMEMCPY(t[1] + 128, a, sizeof(sp_digit) * 128);
  13274. err = sp_4096_mod_128(t[1], t[1], m);
  13275. }
  13276. }
  13277. if (err == MP_OKAY) {
  13278. sp_4096_mont_sqr_128(t[ 2], t[ 1], m, mp);
  13279. sp_4096_mont_mul_128(t[ 3], t[ 2], t[ 1], m, mp);
  13280. sp_4096_mont_sqr_128(t[ 4], t[ 2], m, mp);
  13281. sp_4096_mont_mul_128(t[ 5], t[ 3], t[ 2], m, mp);
  13282. sp_4096_mont_sqr_128(t[ 6], t[ 3], m, mp);
  13283. sp_4096_mont_mul_128(t[ 7], t[ 4], t[ 3], m, mp);
  13284. sp_4096_mont_sqr_128(t[ 8], t[ 4], m, mp);
  13285. sp_4096_mont_mul_128(t[ 9], t[ 5], t[ 4], m, mp);
  13286. sp_4096_mont_sqr_128(t[10], t[ 5], m, mp);
  13287. sp_4096_mont_mul_128(t[11], t[ 6], t[ 5], m, mp);
  13288. sp_4096_mont_sqr_128(t[12], t[ 6], m, mp);
  13289. sp_4096_mont_mul_128(t[13], t[ 7], t[ 6], m, mp);
  13290. sp_4096_mont_sqr_128(t[14], t[ 7], m, mp);
  13291. sp_4096_mont_mul_128(t[15], t[ 8], t[ 7], m, mp);
  13292. i = (bits - 1) / 32;
  13293. n = e[i--];
  13294. c = bits & 31;
  13295. if (c == 0) {
  13296. c = 32;
  13297. }
  13298. c -= bits % 4;
  13299. if (c == 32) {
  13300. c = 28;
  13301. }
  13302. if (c < 0) {
  13303. /* Number of bits in top word is less than number needed. */
  13304. c = -c;
  13305. y = (byte)(n << c);
  13306. n = e[i--];
  13307. y |= (byte)(n >> (64 - c));
  13308. n <<= c;
  13309. c = 64 - c;
  13310. }
  13311. else if (c == 0) {
  13312. /* All bits in top word used. */
  13313. y = (byte)n;
  13314. }
  13315. else {
  13316. y = (byte)(n >> c);
  13317. n <<= 32 - c;
  13318. }
  13319. XMEMCPY(r, t[y], sizeof(sp_digit) * 128);
  13320. for (; i>=0 || c>=4; ) {
  13321. if (c == 0) {
  13322. n = e[i--];
  13323. y = (byte)(n >> 28);
  13324. n <<= 4;
  13325. c = 28;
  13326. }
  13327. else if (c < 4) {
  13328. y = (byte)(n >> 28);
  13329. n = e[i--];
  13330. c = 4 - c;
  13331. y |= (byte)(n >> (32 - c));
  13332. n <<= c;
  13333. c = 32 - c;
  13334. }
  13335. else {
  13336. y = (byte)((n >> 28) & 0xf);
  13337. n <<= 4;
  13338. c -= 4;
  13339. }
  13340. sp_4096_mont_sqr_128(r, r, m, mp);
  13341. sp_4096_mont_sqr_128(r, r, m, mp);
  13342. sp_4096_mont_sqr_128(r, r, m, mp);
  13343. sp_4096_mont_sqr_128(r, r, m, mp);
  13344. sp_4096_mont_mul_128(r, r, t[y], m, mp);
  13345. }
  13346. XMEMSET(&r[128], 0, sizeof(sp_digit) * 128U);
  13347. sp_4096_mont_reduce_128(r, m, mp);
  13348. mask = 0 - (sp_4096_cmp_128(r, m) >= 0);
  13349. sp_4096_cond_sub_128(r, r, m, mask);
  13350. }
  13351. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13352. if (td != NULL)
  13353. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  13354. #endif
  13355. return err;
  13356. }
  13357. #endif /* WOLFSSL_SP_SMALL */
  13358. #endif /* (WOLFSSL_HAVE_SP_RSA && !WOLFSSL_RSA_PUBLIC_ONLY) || WOLFSSL_HAVE_SP_DH */
  13359. #endif /* (WOLFSSL_HAVE_SP_RSA && !WOLFSSL_RSA_PUBLIC_ONLY) || WOLFSSL_HAVE_SP_DH */
  13360. #ifdef WOLFSSL_HAVE_SP_RSA
  13361. /* RSA public key operation.
  13362. *
  13363. * in Array of bytes representing the number to exponentiate, base.
  13364. * inLen Number of bytes in base.
  13365. * em Public exponent.
  13366. * mm Modulus.
  13367. * out Buffer to hold big-endian bytes of exponentiation result.
  13368. * Must be at least 512 bytes long.
  13369. * outLen Number of bytes in result.
  13370. * returns 0 on success, MP_TO_E when the outLen is too small, MP_READ_E when
  13371. * an array is too long and MEMORY_E when dynamic memory allocation fails.
  13372. */
  13373. int sp_RsaPublic_4096(const byte* in, word32 inLen, const mp_int* em,
  13374. const mp_int* mm, byte* out, word32* outLen)
  13375. {
  13376. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13377. sp_digit* a = NULL;
  13378. #else
  13379. sp_digit a[128 * 5];
  13380. #endif
  13381. sp_digit* m = NULL;
  13382. sp_digit* r = NULL;
  13383. sp_digit *ah = NULL;
  13384. sp_digit e[1] = {0};
  13385. int err = MP_OKAY;
  13386. if (*outLen < 512) {
  13387. err = MP_TO_E;
  13388. }
  13389. else if (mp_count_bits(em) > 32 || inLen > 512 ||
  13390. mp_count_bits(mm) != 4096) {
  13391. err = MP_READ_E;
  13392. }
  13393. else if (mp_iseven(mm)) {
  13394. err = MP_VAL;
  13395. }
  13396. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13397. if (err == MP_OKAY) {
  13398. a = (sp_digit*)XMALLOC(sizeof(sp_digit) * 128 * 5, NULL,
  13399. DYNAMIC_TYPE_RSA);
  13400. if (a == NULL)
  13401. err = MEMORY_E;
  13402. }
  13403. #endif
  13404. if (err == MP_OKAY) {
  13405. ah = a + 128;
  13406. r = a + 128 * 2;
  13407. m = r + 128 * 2;
  13408. sp_4096_from_bin(ah, 128, in, inLen);
  13409. #if DIGIT_BIT >= 32
  13410. e[0] = em->dp[0];
  13411. #else
  13412. e[0] = em->dp[0];
  13413. if (em->used > 1) {
  13414. e[0] |= ((sp_digit)em->dp[1]) << DIGIT_BIT;
  13415. }
  13416. #endif
  13417. if (e[0] == 0) {
  13418. err = MP_EXPTMOD_E;
  13419. }
  13420. }
  13421. if (err == MP_OKAY) {
  13422. sp_4096_from_mp(m, 128, mm);
  13423. if (e[0] == 0x10001) {
  13424. int i;
  13425. sp_digit mp;
  13426. sp_4096_mont_setup(m, &mp);
  13427. /* Convert to Montgomery form. */
  13428. XMEMSET(a, 0, sizeof(sp_digit) * 128);
  13429. err = sp_4096_mod_128_cond(r, a, m);
  13430. /* Montgomery form: r = a.R mod m */
  13431. if (err == MP_OKAY) {
  13432. /* r = a ^ 0x10000 => r = a squared 16 times */
  13433. for (i = 15; i >= 0; i--) {
  13434. sp_4096_mont_sqr_128(r, r, m, mp);
  13435. }
  13436. /* mont_red(r.R.R) = (r.R.R / R) mod m = r.R mod m
  13437. * mont_red(r.R * a) = (r.R.a / R) mod m = r.a mod m
  13438. */
  13439. sp_4096_mont_mul_128(r, r, ah, m, mp);
  13440. for (i = 127; i > 0; i--) {
  13441. if (r[i] != m[i]) {
  13442. break;
  13443. }
  13444. }
  13445. if (r[i] >= m[i]) {
  13446. sp_4096_sub_in_place_128(r, m);
  13447. }
  13448. }
  13449. }
  13450. else if (e[0] == 0x3) {
  13451. if (err == MP_OKAY) {
  13452. sp_4096_sqr_128(r, ah);
  13453. err = sp_4096_mod_128_cond(r, r, m);
  13454. }
  13455. if (err == MP_OKAY) {
  13456. sp_4096_mul_128(r, ah, r);
  13457. err = sp_4096_mod_128_cond(r, r, m);
  13458. }
  13459. }
  13460. else {
  13461. int i;
  13462. sp_digit mp;
  13463. sp_4096_mont_setup(m, &mp);
  13464. /* Convert to Montgomery form. */
  13465. XMEMSET(a, 0, sizeof(sp_digit) * 128);
  13466. err = sp_4096_mod_128_cond(a, a, m);
  13467. if (err == MP_OKAY) {
  13468. for (i = 31; i >= 0; i--) {
  13469. if (e[0] >> i) {
  13470. break;
  13471. }
  13472. }
  13473. XMEMCPY(r, a, sizeof(sp_digit) * 128);
  13474. for (i--; i >= 0; i--) {
  13475. sp_4096_mont_sqr_128(r, r, m, mp);
  13476. if (((e[0] >> i) & 1) == 1) {
  13477. sp_4096_mont_mul_128(r, r, a, m, mp);
  13478. }
  13479. }
  13480. XMEMSET(&r[128], 0, sizeof(sp_digit) * 128);
  13481. sp_4096_mont_reduce_128(r, m, mp);
  13482. for (i = 127; i > 0; i--) {
  13483. if (r[i] != m[i]) {
  13484. break;
  13485. }
  13486. }
  13487. if (r[i] >= m[i]) {
  13488. sp_4096_sub_in_place_128(r, m);
  13489. }
  13490. }
  13491. }
  13492. }
  13493. if (err == MP_OKAY) {
  13494. sp_4096_to_bin_128(r, out);
  13495. *outLen = 512;
  13496. }
  13497. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13498. if (a != NULL)
  13499. XFREE(a, NULL, DYNAMIC_TYPE_RSA);
  13500. #endif
  13501. return err;
  13502. }
  13503. #ifndef WOLFSSL_RSA_PUBLIC_ONLY
  13504. /* Conditionally add a and b using the mask m.
  13505. * m is -1 to add and 0 when not.
  13506. *
  13507. * r A single precision number representing conditional add result.
  13508. * a A single precision number to add with.
  13509. * b A single precision number to add.
  13510. * m Mask value to apply.
  13511. */
  13512. SP_NOINLINE static sp_digit sp_4096_cond_add_64(sp_digit* r, const sp_digit* a, const sp_digit* b,
  13513. sp_digit m)
  13514. {
  13515. sp_digit c = 0;
  13516. __asm__ __volatile__ (
  13517. "mov r5, #1\n\t"
  13518. "lsl r5, r5, #8\n\t"
  13519. "mov r9, r5\n\t"
  13520. "mov r8, #0\n\t"
  13521. "\n1:\n\t"
  13522. "ldr r6, [%[b], r8]\n\t"
  13523. "and r6, r6, %[m]\n\t"
  13524. "adds r5, %[c], #-1\n\t"
  13525. "ldr r5, [%[a], r8]\n\t"
  13526. "adcs r5, r5, r6\n\t"
  13527. "mov %[c], #0\n\t"
  13528. "adcs %[c], %[c], %[c]\n\t"
  13529. "str r5, [%[r], r8]\n\t"
  13530. "add r8, r8, #4\n\t"
  13531. "cmp r8, r9\n\t"
  13532. #ifdef __GNUC__
  13533. "blt 1b\n\t"
  13534. #else
  13535. "blt.n 1b\n\t"
  13536. #endif /* __GNUC__ */
  13537. : [c] "+r" (c)
  13538. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  13539. : "memory", "r5", "r6", "r8", "r9"
  13540. );
  13541. return c;
  13542. }
  13543. /* RSA private key operation.
  13544. *
  13545. * in Array of bytes representing the number to exponentiate, base.
  13546. * inLen Number of bytes in base.
  13547. * dm Private exponent.
  13548. * pm First prime.
  13549. * qm Second prime.
  13550. * dpm First prime's CRT exponent.
  13551. * dqm Second prime's CRT exponent.
  13552. * qim Inverse of second prime mod p.
  13553. * mm Modulus.
  13554. * out Buffer to hold big-endian bytes of exponentiation result.
  13555. * Must be at least 512 bytes long.
  13556. * outLen Number of bytes in result.
  13557. * returns 0 on success, MP_TO_E when the outLen is too small, MP_READ_E when
  13558. * an array is too long and MEMORY_E when dynamic memory allocation fails.
  13559. */
  13560. int sp_RsaPrivate_4096(const byte* in, word32 inLen, const mp_int* dm,
  13561. const mp_int* pm, const mp_int* qm, const mp_int* dpm, const mp_int* dqm,
  13562. const mp_int* qim, const mp_int* mm, byte* out, word32* outLen)
  13563. {
  13564. #if defined(SP_RSA_PRIVATE_EXP_D) || defined(RSA_LOW_MEM)
  13565. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13566. sp_digit* d = NULL;
  13567. #else
  13568. sp_digit d[128 * 4];
  13569. #endif
  13570. sp_digit* a = NULL;
  13571. sp_digit* m = NULL;
  13572. sp_digit* r = NULL;
  13573. int err = MP_OKAY;
  13574. (void)pm;
  13575. (void)qm;
  13576. (void)dpm;
  13577. (void)dqm;
  13578. (void)qim;
  13579. if (*outLen < 512U) {
  13580. err = MP_TO_E;
  13581. }
  13582. if (err == MP_OKAY) {
  13583. if (mp_count_bits(dm) > 4096) {
  13584. err = MP_READ_E;
  13585. }
  13586. else if (inLen > 512) {
  13587. err = MP_READ_E;
  13588. }
  13589. else if (mp_count_bits(mm) != 4096) {
  13590. err = MP_READ_E;
  13591. }
  13592. else if (mp_iseven(mm)) {
  13593. err = MP_VAL;
  13594. }
  13595. }
  13596. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13597. if (err == MP_OKAY) {
  13598. d = (sp_digit*)XMALLOC(sizeof(sp_digit) * 128 * 4, NULL,
  13599. DYNAMIC_TYPE_RSA);
  13600. if (d == NULL)
  13601. err = MEMORY_E;
  13602. }
  13603. #endif
  13604. if (err == MP_OKAY) {
  13605. a = d + 128;
  13606. m = a + 256;
  13607. r = a;
  13608. sp_4096_from_bin(a, 128, in, inLen);
  13609. sp_4096_from_mp(d, 128, dm);
  13610. sp_4096_from_mp(m, 128, mm);
  13611. err = sp_4096_mod_exp_128(r, a, d, 4096, m, 0);
  13612. }
  13613. if (err == MP_OKAY) {
  13614. sp_4096_to_bin_128(r, out);
  13615. *outLen = 512;
  13616. }
  13617. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13618. if (d != NULL)
  13619. #endif
  13620. {
  13621. /* only "a" and "r" are sensitive and need zeroized (same pointer) */
  13622. if (a != NULL)
  13623. ForceZero(a, sizeof(sp_digit) * 128);
  13624. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13625. XFREE(d, NULL, DYNAMIC_TYPE_RSA);
  13626. #endif
  13627. }
  13628. return err;
  13629. #else
  13630. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13631. sp_digit* a = NULL;
  13632. #else
  13633. sp_digit a[64 * 11];
  13634. #endif
  13635. sp_digit* p = NULL;
  13636. sp_digit* q = NULL;
  13637. sp_digit* dp = NULL;
  13638. sp_digit* tmpa = NULL;
  13639. sp_digit* tmpb = NULL;
  13640. sp_digit* r = NULL;
  13641. sp_digit* qi = NULL;
  13642. sp_digit* dq = NULL;
  13643. sp_digit c;
  13644. int err = MP_OKAY;
  13645. (void)dm;
  13646. (void)mm;
  13647. if (*outLen < 512) {
  13648. err = MP_TO_E;
  13649. }
  13650. else if (inLen > 512 || mp_count_bits(mm) != 4096) {
  13651. err = MP_READ_E;
  13652. }
  13653. else if (mp_iseven(mm)) {
  13654. err = MP_VAL;
  13655. }
  13656. else if (mp_iseven(pm)) {
  13657. err = MP_VAL;
  13658. }
  13659. else if (mp_iseven(qm)) {
  13660. err = MP_VAL;
  13661. }
  13662. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13663. if (err == MP_OKAY) {
  13664. a = (sp_digit*)XMALLOC(sizeof(sp_digit) * 64 * 11, NULL,
  13665. DYNAMIC_TYPE_RSA);
  13666. if (a == NULL)
  13667. err = MEMORY_E;
  13668. }
  13669. #endif
  13670. if (err == MP_OKAY) {
  13671. p = a + 128 * 2;
  13672. q = p + 64;
  13673. qi = dq = dp = q + 64;
  13674. tmpa = qi + 64;
  13675. tmpb = tmpa + 128;
  13676. r = a;
  13677. sp_4096_from_bin(a, 128, in, inLen);
  13678. sp_4096_from_mp(p, 64, pm);
  13679. sp_4096_from_mp(q, 64, qm);
  13680. sp_4096_from_mp(dp, 64, dpm);
  13681. err = sp_2048_mod_exp_64(tmpa, a, dp, 2048, p, 1);
  13682. }
  13683. if (err == MP_OKAY) {
  13684. sp_4096_from_mp(dq, 64, dqm);
  13685. err = sp_2048_mod_exp_64(tmpb, a, dq, 2048, q, 1);
  13686. }
  13687. if (err == MP_OKAY) {
  13688. c = sp_2048_sub_in_place_64(tmpa, tmpb);
  13689. c += sp_4096_cond_add_64(tmpa, tmpa, p, c);
  13690. sp_4096_cond_add_64(tmpa, tmpa, p, c);
  13691. sp_2048_from_mp(qi, 64, qim);
  13692. sp_2048_mul_64(tmpa, tmpa, qi);
  13693. err = sp_2048_mod_64(tmpa, tmpa, p);
  13694. }
  13695. if (err == MP_OKAY) {
  13696. sp_2048_mul_64(tmpa, q, tmpa);
  13697. XMEMSET(&tmpb[64], 0, sizeof(sp_digit) * 64);
  13698. sp_4096_add_128(r, tmpb, tmpa);
  13699. sp_4096_to_bin_128(r, out);
  13700. *outLen = 512;
  13701. }
  13702. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13703. if (a != NULL)
  13704. #endif
  13705. {
  13706. ForceZero(a, sizeof(sp_digit) * 64 * 11);
  13707. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  13708. XFREE(a, NULL, DYNAMIC_TYPE_RSA);
  13709. #endif
  13710. }
  13711. #endif /* SP_RSA_PRIVATE_EXP_D || RSA_LOW_MEM */
  13712. return err;
  13713. }
  13714. #endif /* WOLFSSL_RSA_PUBLIC_ONLY */
  13715. #endif /* WOLFSSL_HAVE_SP_RSA */
  13716. #if defined(WOLFSSL_HAVE_SP_DH) || (defined(WOLFSSL_HAVE_SP_RSA) && \
  13717. !defined(WOLFSSL_RSA_PUBLIC_ONLY))
  13718. /* Convert an array of sp_digit to an mp_int.
  13719. *
  13720. * a A single precision integer.
  13721. * r A multi-precision integer.
  13722. */
  13723. static int sp_4096_to_mp(const sp_digit* a, mp_int* r)
  13724. {
  13725. int err;
  13726. err = mp_grow(r, (4096 + DIGIT_BIT - 1) / DIGIT_BIT);
  13727. if (err == MP_OKAY) { /*lint !e774 case where err is always MP_OKAY*/
  13728. #if DIGIT_BIT == 32
  13729. XMEMCPY(r->dp, a, sizeof(sp_digit) * 128);
  13730. r->used = 128;
  13731. mp_clamp(r);
  13732. #elif DIGIT_BIT < 32
  13733. int i;
  13734. int j = 0;
  13735. int s = 0;
  13736. r->dp[0] = 0;
  13737. for (i = 0; i < 128; i++) {
  13738. r->dp[j] |= (mp_digit)(a[i] << s);
  13739. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  13740. s = DIGIT_BIT - s;
  13741. r->dp[++j] = (mp_digit)(a[i] >> s);
  13742. while (s + DIGIT_BIT <= 32) {
  13743. s += DIGIT_BIT;
  13744. r->dp[j++] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  13745. if (s == SP_WORD_SIZE) {
  13746. r->dp[j] = 0;
  13747. }
  13748. else {
  13749. r->dp[j] = (mp_digit)(a[i] >> s);
  13750. }
  13751. }
  13752. s = 32 - s;
  13753. }
  13754. r->used = (4096 + DIGIT_BIT - 1) / DIGIT_BIT;
  13755. mp_clamp(r);
  13756. #else
  13757. int i;
  13758. int j = 0;
  13759. int s = 0;
  13760. r->dp[0] = 0;
  13761. for (i = 0; i < 128; i++) {
  13762. r->dp[j] |= ((mp_digit)a[i]) << s;
  13763. if (s + 32 >= DIGIT_BIT) {
  13764. #if DIGIT_BIT != 32 && DIGIT_BIT != 64
  13765. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  13766. #endif
  13767. s = DIGIT_BIT - s;
  13768. r->dp[++j] = a[i] >> s;
  13769. s = 32 - s;
  13770. }
  13771. else {
  13772. s += 32;
  13773. }
  13774. }
  13775. r->used = (4096 + DIGIT_BIT - 1) / DIGIT_BIT;
  13776. mp_clamp(r);
  13777. #endif
  13778. }
  13779. return err;
  13780. }
  13781. /* Perform the modular exponentiation for Diffie-Hellman.
  13782. *
  13783. * base Base. MP integer.
  13784. * exp Exponent. MP integer.
  13785. * mod Modulus. MP integer.
  13786. * res Result. MP integer.
  13787. * returns 0 on success, MP_READ_E if there are too many bytes in an array
  13788. * and MEMORY_E if memory allocation fails.
  13789. */
  13790. int sp_ModExp_4096(const mp_int* base, const mp_int* exp, const mp_int* mod,
  13791. mp_int* res)
  13792. {
  13793. int err = MP_OKAY;
  13794. sp_digit b[256];
  13795. sp_digit e[128];
  13796. sp_digit m[128];
  13797. sp_digit* r = b;
  13798. int expBits = mp_count_bits(exp);
  13799. if (mp_count_bits(base) > 4096) {
  13800. err = MP_READ_E;
  13801. }
  13802. else if (expBits > 4096) {
  13803. err = MP_READ_E;
  13804. }
  13805. else if (mp_count_bits(mod) != 4096) {
  13806. err = MP_READ_E;
  13807. }
  13808. else if (mp_iseven(mod)) {
  13809. err = MP_VAL;
  13810. }
  13811. if (err == MP_OKAY) {
  13812. sp_4096_from_mp(b, 128, base);
  13813. sp_4096_from_mp(e, 128, exp);
  13814. sp_4096_from_mp(m, 128, mod);
  13815. err = sp_4096_mod_exp_128(r, b, e, expBits, m, 0);
  13816. }
  13817. if (err == MP_OKAY) {
  13818. err = sp_4096_to_mp(r, res);
  13819. }
  13820. XMEMSET(e, 0, sizeof(e));
  13821. return err;
  13822. }
  13823. #ifdef WOLFSSL_HAVE_SP_DH
  13824. #ifdef HAVE_FFDHE_4096
  13825. static void sp_4096_lshift_128(sp_digit* r, const sp_digit* a, byte n)
  13826. {
  13827. __asm__ __volatile__ (
  13828. "mov r6, #31\n\t"
  13829. "sub r6, r6, %[n]\n\t"
  13830. "add %[a], %[a], #448\n\t"
  13831. "add %[r], %[r], #448\n\t"
  13832. "ldr r3, [%[a], #60]\n\t"
  13833. "lsr r4, r3, #1\n\t"
  13834. "lsl r3, r3, %[n]\n\t"
  13835. "lsr r4, r4, r6\n\t"
  13836. "ldr r2, [%[a], #56]\n\t"
  13837. "str r4, [%[r], #64]\n\t"
  13838. "lsr r5, r2, #1\n\t"
  13839. "lsl r2, r2, %[n]\n\t"
  13840. "lsr r5, r5, r6\n\t"
  13841. "orr r3, r3, r5\n\t"
  13842. "ldr r4, [%[a], #52]\n\t"
  13843. "str r3, [%[r], #60]\n\t"
  13844. "lsr r5, r4, #1\n\t"
  13845. "lsl r4, r4, %[n]\n\t"
  13846. "lsr r5, r5, r6\n\t"
  13847. "orr r2, r2, r5\n\t"
  13848. "ldr r3, [%[a], #48]\n\t"
  13849. "str r2, [%[r], #56]\n\t"
  13850. "lsr r5, r3, #1\n\t"
  13851. "lsl r3, r3, %[n]\n\t"
  13852. "lsr r5, r5, r6\n\t"
  13853. "orr r4, r4, r5\n\t"
  13854. "ldr r2, [%[a], #44]\n\t"
  13855. "str r4, [%[r], #52]\n\t"
  13856. "lsr r5, r2, #1\n\t"
  13857. "lsl r2, r2, %[n]\n\t"
  13858. "lsr r5, r5, r6\n\t"
  13859. "orr r3, r3, r5\n\t"
  13860. "ldr r4, [%[a], #40]\n\t"
  13861. "str r3, [%[r], #48]\n\t"
  13862. "lsr r5, r4, #1\n\t"
  13863. "lsl r4, r4, %[n]\n\t"
  13864. "lsr r5, r5, r6\n\t"
  13865. "orr r2, r2, r5\n\t"
  13866. "ldr r3, [%[a], #36]\n\t"
  13867. "str r2, [%[r], #44]\n\t"
  13868. "lsr r5, r3, #1\n\t"
  13869. "lsl r3, r3, %[n]\n\t"
  13870. "lsr r5, r5, r6\n\t"
  13871. "orr r4, r4, r5\n\t"
  13872. "ldr r2, [%[a], #32]\n\t"
  13873. "str r4, [%[r], #40]\n\t"
  13874. "lsr r5, r2, #1\n\t"
  13875. "lsl r2, r2, %[n]\n\t"
  13876. "lsr r5, r5, r6\n\t"
  13877. "orr r3, r3, r5\n\t"
  13878. "ldr r4, [%[a], #28]\n\t"
  13879. "str r3, [%[r], #36]\n\t"
  13880. "lsr r5, r4, #1\n\t"
  13881. "lsl r4, r4, %[n]\n\t"
  13882. "lsr r5, r5, r6\n\t"
  13883. "orr r2, r2, r5\n\t"
  13884. "ldr r3, [%[a], #24]\n\t"
  13885. "str r2, [%[r], #32]\n\t"
  13886. "lsr r5, r3, #1\n\t"
  13887. "lsl r3, r3, %[n]\n\t"
  13888. "lsr r5, r5, r6\n\t"
  13889. "orr r4, r4, r5\n\t"
  13890. "ldr r2, [%[a], #20]\n\t"
  13891. "str r4, [%[r], #28]\n\t"
  13892. "lsr r5, r2, #1\n\t"
  13893. "lsl r2, r2, %[n]\n\t"
  13894. "lsr r5, r5, r6\n\t"
  13895. "orr r3, r3, r5\n\t"
  13896. "ldr r4, [%[a], #16]\n\t"
  13897. "str r3, [%[r], #24]\n\t"
  13898. "lsr r5, r4, #1\n\t"
  13899. "lsl r4, r4, %[n]\n\t"
  13900. "lsr r5, r5, r6\n\t"
  13901. "orr r2, r2, r5\n\t"
  13902. "ldr r3, [%[a], #12]\n\t"
  13903. "str r2, [%[r], #20]\n\t"
  13904. "lsr r5, r3, #1\n\t"
  13905. "lsl r3, r3, %[n]\n\t"
  13906. "lsr r5, r5, r6\n\t"
  13907. "orr r4, r4, r5\n\t"
  13908. "ldr r2, [%[a], #8]\n\t"
  13909. "str r4, [%[r], #16]\n\t"
  13910. "lsr r5, r2, #1\n\t"
  13911. "lsl r2, r2, %[n]\n\t"
  13912. "lsr r5, r5, r6\n\t"
  13913. "orr r3, r3, r5\n\t"
  13914. "ldr r4, [%[a], #4]\n\t"
  13915. "str r3, [%[r], #12]\n\t"
  13916. "lsr r5, r4, #1\n\t"
  13917. "lsl r4, r4, %[n]\n\t"
  13918. "lsr r5, r5, r6\n\t"
  13919. "orr r2, r2, r5\n\t"
  13920. "ldr r3, [%[a], #0]\n\t"
  13921. "str r2, [%[r], #8]\n\t"
  13922. "lsr r5, r3, #1\n\t"
  13923. "lsl r3, r3, %[n]\n\t"
  13924. "lsr r5, r5, r6\n\t"
  13925. "orr r4, r4, r5\n\t"
  13926. "sub %[a], %[a], #64\n\t"
  13927. "sub %[r], %[r], #64\n\t"
  13928. "ldr r2, [%[a], #60]\n\t"
  13929. "str r4, [%[r], #68]\n\t"
  13930. "lsr r5, r2, #1\n\t"
  13931. "lsl r2, r2, %[n]\n\t"
  13932. "lsr r5, r5, r6\n\t"
  13933. "orr r3, r3, r5\n\t"
  13934. "ldr r4, [%[a], #56]\n\t"
  13935. "str r3, [%[r], #64]\n\t"
  13936. "lsr r5, r4, #1\n\t"
  13937. "lsl r4, r4, %[n]\n\t"
  13938. "lsr r5, r5, r6\n\t"
  13939. "orr r2, r2, r5\n\t"
  13940. "ldr r3, [%[a], #52]\n\t"
  13941. "str r2, [%[r], #60]\n\t"
  13942. "lsr r5, r3, #1\n\t"
  13943. "lsl r3, r3, %[n]\n\t"
  13944. "lsr r5, r5, r6\n\t"
  13945. "orr r4, r4, r5\n\t"
  13946. "ldr r2, [%[a], #48]\n\t"
  13947. "str r4, [%[r], #56]\n\t"
  13948. "lsr r5, r2, #1\n\t"
  13949. "lsl r2, r2, %[n]\n\t"
  13950. "lsr r5, r5, r6\n\t"
  13951. "orr r3, r3, r5\n\t"
  13952. "ldr r4, [%[a], #44]\n\t"
  13953. "str r3, [%[r], #52]\n\t"
  13954. "lsr r5, r4, #1\n\t"
  13955. "lsl r4, r4, %[n]\n\t"
  13956. "lsr r5, r5, r6\n\t"
  13957. "orr r2, r2, r5\n\t"
  13958. "ldr r3, [%[a], #40]\n\t"
  13959. "str r2, [%[r], #48]\n\t"
  13960. "lsr r5, r3, #1\n\t"
  13961. "lsl r3, r3, %[n]\n\t"
  13962. "lsr r5, r5, r6\n\t"
  13963. "orr r4, r4, r5\n\t"
  13964. "ldr r2, [%[a], #36]\n\t"
  13965. "str r4, [%[r], #44]\n\t"
  13966. "lsr r5, r2, #1\n\t"
  13967. "lsl r2, r2, %[n]\n\t"
  13968. "lsr r5, r5, r6\n\t"
  13969. "orr r3, r3, r5\n\t"
  13970. "ldr r4, [%[a], #32]\n\t"
  13971. "str r3, [%[r], #40]\n\t"
  13972. "lsr r5, r4, #1\n\t"
  13973. "lsl r4, r4, %[n]\n\t"
  13974. "lsr r5, r5, r6\n\t"
  13975. "orr r2, r2, r5\n\t"
  13976. "ldr r3, [%[a], #28]\n\t"
  13977. "str r2, [%[r], #36]\n\t"
  13978. "lsr r5, r3, #1\n\t"
  13979. "lsl r3, r3, %[n]\n\t"
  13980. "lsr r5, r5, r6\n\t"
  13981. "orr r4, r4, r5\n\t"
  13982. "ldr r2, [%[a], #24]\n\t"
  13983. "str r4, [%[r], #32]\n\t"
  13984. "lsr r5, r2, #1\n\t"
  13985. "lsl r2, r2, %[n]\n\t"
  13986. "lsr r5, r5, r6\n\t"
  13987. "orr r3, r3, r5\n\t"
  13988. "ldr r4, [%[a], #20]\n\t"
  13989. "str r3, [%[r], #28]\n\t"
  13990. "lsr r5, r4, #1\n\t"
  13991. "lsl r4, r4, %[n]\n\t"
  13992. "lsr r5, r5, r6\n\t"
  13993. "orr r2, r2, r5\n\t"
  13994. "ldr r3, [%[a], #16]\n\t"
  13995. "str r2, [%[r], #24]\n\t"
  13996. "lsr r5, r3, #1\n\t"
  13997. "lsl r3, r3, %[n]\n\t"
  13998. "lsr r5, r5, r6\n\t"
  13999. "orr r4, r4, r5\n\t"
  14000. "ldr r2, [%[a], #12]\n\t"
  14001. "str r4, [%[r], #20]\n\t"
  14002. "lsr r5, r2, #1\n\t"
  14003. "lsl r2, r2, %[n]\n\t"
  14004. "lsr r5, r5, r6\n\t"
  14005. "orr r3, r3, r5\n\t"
  14006. "ldr r4, [%[a], #8]\n\t"
  14007. "str r3, [%[r], #16]\n\t"
  14008. "lsr r5, r4, #1\n\t"
  14009. "lsl r4, r4, %[n]\n\t"
  14010. "lsr r5, r5, r6\n\t"
  14011. "orr r2, r2, r5\n\t"
  14012. "ldr r3, [%[a], #4]\n\t"
  14013. "str r2, [%[r], #12]\n\t"
  14014. "lsr r5, r3, #1\n\t"
  14015. "lsl r3, r3, %[n]\n\t"
  14016. "lsr r5, r5, r6\n\t"
  14017. "orr r4, r4, r5\n\t"
  14018. "ldr r2, [%[a], #0]\n\t"
  14019. "str r4, [%[r], #8]\n\t"
  14020. "lsr r5, r2, #1\n\t"
  14021. "lsl r2, r2, %[n]\n\t"
  14022. "lsr r5, r5, r6\n\t"
  14023. "orr r3, r3, r5\n\t"
  14024. "sub %[a], %[a], #64\n\t"
  14025. "sub %[r], %[r], #64\n\t"
  14026. "ldr r4, [%[a], #60]\n\t"
  14027. "str r3, [%[r], #68]\n\t"
  14028. "lsr r5, r4, #1\n\t"
  14029. "lsl r4, r4, %[n]\n\t"
  14030. "lsr r5, r5, r6\n\t"
  14031. "orr r2, r2, r5\n\t"
  14032. "ldr r3, [%[a], #56]\n\t"
  14033. "str r2, [%[r], #64]\n\t"
  14034. "lsr r5, r3, #1\n\t"
  14035. "lsl r3, r3, %[n]\n\t"
  14036. "lsr r5, r5, r6\n\t"
  14037. "orr r4, r4, r5\n\t"
  14038. "ldr r2, [%[a], #52]\n\t"
  14039. "str r4, [%[r], #60]\n\t"
  14040. "lsr r5, r2, #1\n\t"
  14041. "lsl r2, r2, %[n]\n\t"
  14042. "lsr r5, r5, r6\n\t"
  14043. "orr r3, r3, r5\n\t"
  14044. "ldr r4, [%[a], #48]\n\t"
  14045. "str r3, [%[r], #56]\n\t"
  14046. "lsr r5, r4, #1\n\t"
  14047. "lsl r4, r4, %[n]\n\t"
  14048. "lsr r5, r5, r6\n\t"
  14049. "orr r2, r2, r5\n\t"
  14050. "ldr r3, [%[a], #44]\n\t"
  14051. "str r2, [%[r], #52]\n\t"
  14052. "lsr r5, r3, #1\n\t"
  14053. "lsl r3, r3, %[n]\n\t"
  14054. "lsr r5, r5, r6\n\t"
  14055. "orr r4, r4, r5\n\t"
  14056. "ldr r2, [%[a], #40]\n\t"
  14057. "str r4, [%[r], #48]\n\t"
  14058. "lsr r5, r2, #1\n\t"
  14059. "lsl r2, r2, %[n]\n\t"
  14060. "lsr r5, r5, r6\n\t"
  14061. "orr r3, r3, r5\n\t"
  14062. "ldr r4, [%[a], #36]\n\t"
  14063. "str r3, [%[r], #44]\n\t"
  14064. "lsr r5, r4, #1\n\t"
  14065. "lsl r4, r4, %[n]\n\t"
  14066. "lsr r5, r5, r6\n\t"
  14067. "orr r2, r2, r5\n\t"
  14068. "ldr r3, [%[a], #32]\n\t"
  14069. "str r2, [%[r], #40]\n\t"
  14070. "lsr r5, r3, #1\n\t"
  14071. "lsl r3, r3, %[n]\n\t"
  14072. "lsr r5, r5, r6\n\t"
  14073. "orr r4, r4, r5\n\t"
  14074. "ldr r2, [%[a], #28]\n\t"
  14075. "str r4, [%[r], #36]\n\t"
  14076. "lsr r5, r2, #1\n\t"
  14077. "lsl r2, r2, %[n]\n\t"
  14078. "lsr r5, r5, r6\n\t"
  14079. "orr r3, r3, r5\n\t"
  14080. "ldr r4, [%[a], #24]\n\t"
  14081. "str r3, [%[r], #32]\n\t"
  14082. "lsr r5, r4, #1\n\t"
  14083. "lsl r4, r4, %[n]\n\t"
  14084. "lsr r5, r5, r6\n\t"
  14085. "orr r2, r2, r5\n\t"
  14086. "ldr r3, [%[a], #20]\n\t"
  14087. "str r2, [%[r], #28]\n\t"
  14088. "lsr r5, r3, #1\n\t"
  14089. "lsl r3, r3, %[n]\n\t"
  14090. "lsr r5, r5, r6\n\t"
  14091. "orr r4, r4, r5\n\t"
  14092. "ldr r2, [%[a], #16]\n\t"
  14093. "str r4, [%[r], #24]\n\t"
  14094. "lsr r5, r2, #1\n\t"
  14095. "lsl r2, r2, %[n]\n\t"
  14096. "lsr r5, r5, r6\n\t"
  14097. "orr r3, r3, r5\n\t"
  14098. "ldr r4, [%[a], #12]\n\t"
  14099. "str r3, [%[r], #20]\n\t"
  14100. "lsr r5, r4, #1\n\t"
  14101. "lsl r4, r4, %[n]\n\t"
  14102. "lsr r5, r5, r6\n\t"
  14103. "orr r2, r2, r5\n\t"
  14104. "ldr r3, [%[a], #8]\n\t"
  14105. "str r2, [%[r], #16]\n\t"
  14106. "lsr r5, r3, #1\n\t"
  14107. "lsl r3, r3, %[n]\n\t"
  14108. "lsr r5, r5, r6\n\t"
  14109. "orr r4, r4, r5\n\t"
  14110. "ldr r2, [%[a], #4]\n\t"
  14111. "str r4, [%[r], #12]\n\t"
  14112. "lsr r5, r2, #1\n\t"
  14113. "lsl r2, r2, %[n]\n\t"
  14114. "lsr r5, r5, r6\n\t"
  14115. "orr r3, r3, r5\n\t"
  14116. "ldr r4, [%[a], #0]\n\t"
  14117. "str r3, [%[r], #8]\n\t"
  14118. "lsr r5, r4, #1\n\t"
  14119. "lsl r4, r4, %[n]\n\t"
  14120. "lsr r5, r5, r6\n\t"
  14121. "orr r2, r2, r5\n\t"
  14122. "sub %[a], %[a], #64\n\t"
  14123. "sub %[r], %[r], #64\n\t"
  14124. "ldr r3, [%[a], #60]\n\t"
  14125. "str r2, [%[r], #68]\n\t"
  14126. "lsr r5, r3, #1\n\t"
  14127. "lsl r3, r3, %[n]\n\t"
  14128. "lsr r5, r5, r6\n\t"
  14129. "orr r4, r4, r5\n\t"
  14130. "ldr r2, [%[a], #56]\n\t"
  14131. "str r4, [%[r], #64]\n\t"
  14132. "lsr r5, r2, #1\n\t"
  14133. "lsl r2, r2, %[n]\n\t"
  14134. "lsr r5, r5, r6\n\t"
  14135. "orr r3, r3, r5\n\t"
  14136. "ldr r4, [%[a], #52]\n\t"
  14137. "str r3, [%[r], #60]\n\t"
  14138. "lsr r5, r4, #1\n\t"
  14139. "lsl r4, r4, %[n]\n\t"
  14140. "lsr r5, r5, r6\n\t"
  14141. "orr r2, r2, r5\n\t"
  14142. "ldr r3, [%[a], #48]\n\t"
  14143. "str r2, [%[r], #56]\n\t"
  14144. "lsr r5, r3, #1\n\t"
  14145. "lsl r3, r3, %[n]\n\t"
  14146. "lsr r5, r5, r6\n\t"
  14147. "orr r4, r4, r5\n\t"
  14148. "ldr r2, [%[a], #44]\n\t"
  14149. "str r4, [%[r], #52]\n\t"
  14150. "lsr r5, r2, #1\n\t"
  14151. "lsl r2, r2, %[n]\n\t"
  14152. "lsr r5, r5, r6\n\t"
  14153. "orr r3, r3, r5\n\t"
  14154. "ldr r4, [%[a], #40]\n\t"
  14155. "str r3, [%[r], #48]\n\t"
  14156. "lsr r5, r4, #1\n\t"
  14157. "lsl r4, r4, %[n]\n\t"
  14158. "lsr r5, r5, r6\n\t"
  14159. "orr r2, r2, r5\n\t"
  14160. "ldr r3, [%[a], #36]\n\t"
  14161. "str r2, [%[r], #44]\n\t"
  14162. "lsr r5, r3, #1\n\t"
  14163. "lsl r3, r3, %[n]\n\t"
  14164. "lsr r5, r5, r6\n\t"
  14165. "orr r4, r4, r5\n\t"
  14166. "ldr r2, [%[a], #32]\n\t"
  14167. "str r4, [%[r], #40]\n\t"
  14168. "lsr r5, r2, #1\n\t"
  14169. "lsl r2, r2, %[n]\n\t"
  14170. "lsr r5, r5, r6\n\t"
  14171. "orr r3, r3, r5\n\t"
  14172. "ldr r4, [%[a], #28]\n\t"
  14173. "str r3, [%[r], #36]\n\t"
  14174. "lsr r5, r4, #1\n\t"
  14175. "lsl r4, r4, %[n]\n\t"
  14176. "lsr r5, r5, r6\n\t"
  14177. "orr r2, r2, r5\n\t"
  14178. "ldr r3, [%[a], #24]\n\t"
  14179. "str r2, [%[r], #32]\n\t"
  14180. "lsr r5, r3, #1\n\t"
  14181. "lsl r3, r3, %[n]\n\t"
  14182. "lsr r5, r5, r6\n\t"
  14183. "orr r4, r4, r5\n\t"
  14184. "ldr r2, [%[a], #20]\n\t"
  14185. "str r4, [%[r], #28]\n\t"
  14186. "lsr r5, r2, #1\n\t"
  14187. "lsl r2, r2, %[n]\n\t"
  14188. "lsr r5, r5, r6\n\t"
  14189. "orr r3, r3, r5\n\t"
  14190. "ldr r4, [%[a], #16]\n\t"
  14191. "str r3, [%[r], #24]\n\t"
  14192. "lsr r5, r4, #1\n\t"
  14193. "lsl r4, r4, %[n]\n\t"
  14194. "lsr r5, r5, r6\n\t"
  14195. "orr r2, r2, r5\n\t"
  14196. "ldr r3, [%[a], #12]\n\t"
  14197. "str r2, [%[r], #20]\n\t"
  14198. "lsr r5, r3, #1\n\t"
  14199. "lsl r3, r3, %[n]\n\t"
  14200. "lsr r5, r5, r6\n\t"
  14201. "orr r4, r4, r5\n\t"
  14202. "ldr r2, [%[a], #8]\n\t"
  14203. "str r4, [%[r], #16]\n\t"
  14204. "lsr r5, r2, #1\n\t"
  14205. "lsl r2, r2, %[n]\n\t"
  14206. "lsr r5, r5, r6\n\t"
  14207. "orr r3, r3, r5\n\t"
  14208. "ldr r4, [%[a], #4]\n\t"
  14209. "str r3, [%[r], #12]\n\t"
  14210. "lsr r5, r4, #1\n\t"
  14211. "lsl r4, r4, %[n]\n\t"
  14212. "lsr r5, r5, r6\n\t"
  14213. "orr r2, r2, r5\n\t"
  14214. "ldr r3, [%[a], #0]\n\t"
  14215. "str r2, [%[r], #8]\n\t"
  14216. "lsr r5, r3, #1\n\t"
  14217. "lsl r3, r3, %[n]\n\t"
  14218. "lsr r5, r5, r6\n\t"
  14219. "orr r4, r4, r5\n\t"
  14220. "sub %[a], %[a], #64\n\t"
  14221. "sub %[r], %[r], #64\n\t"
  14222. "ldr r2, [%[a], #60]\n\t"
  14223. "str r4, [%[r], #68]\n\t"
  14224. "lsr r5, r2, #1\n\t"
  14225. "lsl r2, r2, %[n]\n\t"
  14226. "lsr r5, r5, r6\n\t"
  14227. "orr r3, r3, r5\n\t"
  14228. "ldr r4, [%[a], #56]\n\t"
  14229. "str r3, [%[r], #64]\n\t"
  14230. "lsr r5, r4, #1\n\t"
  14231. "lsl r4, r4, %[n]\n\t"
  14232. "lsr r5, r5, r6\n\t"
  14233. "orr r2, r2, r5\n\t"
  14234. "ldr r3, [%[a], #52]\n\t"
  14235. "str r2, [%[r], #60]\n\t"
  14236. "lsr r5, r3, #1\n\t"
  14237. "lsl r3, r3, %[n]\n\t"
  14238. "lsr r5, r5, r6\n\t"
  14239. "orr r4, r4, r5\n\t"
  14240. "ldr r2, [%[a], #48]\n\t"
  14241. "str r4, [%[r], #56]\n\t"
  14242. "lsr r5, r2, #1\n\t"
  14243. "lsl r2, r2, %[n]\n\t"
  14244. "lsr r5, r5, r6\n\t"
  14245. "orr r3, r3, r5\n\t"
  14246. "ldr r4, [%[a], #44]\n\t"
  14247. "str r3, [%[r], #52]\n\t"
  14248. "lsr r5, r4, #1\n\t"
  14249. "lsl r4, r4, %[n]\n\t"
  14250. "lsr r5, r5, r6\n\t"
  14251. "orr r2, r2, r5\n\t"
  14252. "ldr r3, [%[a], #40]\n\t"
  14253. "str r2, [%[r], #48]\n\t"
  14254. "lsr r5, r3, #1\n\t"
  14255. "lsl r3, r3, %[n]\n\t"
  14256. "lsr r5, r5, r6\n\t"
  14257. "orr r4, r4, r5\n\t"
  14258. "ldr r2, [%[a], #36]\n\t"
  14259. "str r4, [%[r], #44]\n\t"
  14260. "lsr r5, r2, #1\n\t"
  14261. "lsl r2, r2, %[n]\n\t"
  14262. "lsr r5, r5, r6\n\t"
  14263. "orr r3, r3, r5\n\t"
  14264. "ldr r4, [%[a], #32]\n\t"
  14265. "str r3, [%[r], #40]\n\t"
  14266. "lsr r5, r4, #1\n\t"
  14267. "lsl r4, r4, %[n]\n\t"
  14268. "lsr r5, r5, r6\n\t"
  14269. "orr r2, r2, r5\n\t"
  14270. "ldr r3, [%[a], #28]\n\t"
  14271. "str r2, [%[r], #36]\n\t"
  14272. "lsr r5, r3, #1\n\t"
  14273. "lsl r3, r3, %[n]\n\t"
  14274. "lsr r5, r5, r6\n\t"
  14275. "orr r4, r4, r5\n\t"
  14276. "ldr r2, [%[a], #24]\n\t"
  14277. "str r4, [%[r], #32]\n\t"
  14278. "lsr r5, r2, #1\n\t"
  14279. "lsl r2, r2, %[n]\n\t"
  14280. "lsr r5, r5, r6\n\t"
  14281. "orr r3, r3, r5\n\t"
  14282. "ldr r4, [%[a], #20]\n\t"
  14283. "str r3, [%[r], #28]\n\t"
  14284. "lsr r5, r4, #1\n\t"
  14285. "lsl r4, r4, %[n]\n\t"
  14286. "lsr r5, r5, r6\n\t"
  14287. "orr r2, r2, r5\n\t"
  14288. "ldr r3, [%[a], #16]\n\t"
  14289. "str r2, [%[r], #24]\n\t"
  14290. "lsr r5, r3, #1\n\t"
  14291. "lsl r3, r3, %[n]\n\t"
  14292. "lsr r5, r5, r6\n\t"
  14293. "orr r4, r4, r5\n\t"
  14294. "ldr r2, [%[a], #12]\n\t"
  14295. "str r4, [%[r], #20]\n\t"
  14296. "lsr r5, r2, #1\n\t"
  14297. "lsl r2, r2, %[n]\n\t"
  14298. "lsr r5, r5, r6\n\t"
  14299. "orr r3, r3, r5\n\t"
  14300. "ldr r4, [%[a], #8]\n\t"
  14301. "str r3, [%[r], #16]\n\t"
  14302. "lsr r5, r4, #1\n\t"
  14303. "lsl r4, r4, %[n]\n\t"
  14304. "lsr r5, r5, r6\n\t"
  14305. "orr r2, r2, r5\n\t"
  14306. "ldr r3, [%[a], #4]\n\t"
  14307. "str r2, [%[r], #12]\n\t"
  14308. "lsr r5, r3, #1\n\t"
  14309. "lsl r3, r3, %[n]\n\t"
  14310. "lsr r5, r5, r6\n\t"
  14311. "orr r4, r4, r5\n\t"
  14312. "ldr r2, [%[a], #0]\n\t"
  14313. "str r4, [%[r], #8]\n\t"
  14314. "lsr r5, r2, #1\n\t"
  14315. "lsl r2, r2, %[n]\n\t"
  14316. "lsr r5, r5, r6\n\t"
  14317. "orr r3, r3, r5\n\t"
  14318. "sub %[a], %[a], #64\n\t"
  14319. "sub %[r], %[r], #64\n\t"
  14320. "ldr r4, [%[a], #60]\n\t"
  14321. "str r3, [%[r], #68]\n\t"
  14322. "lsr r5, r4, #1\n\t"
  14323. "lsl r4, r4, %[n]\n\t"
  14324. "lsr r5, r5, r6\n\t"
  14325. "orr r2, r2, r5\n\t"
  14326. "ldr r3, [%[a], #56]\n\t"
  14327. "str r2, [%[r], #64]\n\t"
  14328. "lsr r5, r3, #1\n\t"
  14329. "lsl r3, r3, %[n]\n\t"
  14330. "lsr r5, r5, r6\n\t"
  14331. "orr r4, r4, r5\n\t"
  14332. "ldr r2, [%[a], #52]\n\t"
  14333. "str r4, [%[r], #60]\n\t"
  14334. "lsr r5, r2, #1\n\t"
  14335. "lsl r2, r2, %[n]\n\t"
  14336. "lsr r5, r5, r6\n\t"
  14337. "orr r3, r3, r5\n\t"
  14338. "ldr r4, [%[a], #48]\n\t"
  14339. "str r3, [%[r], #56]\n\t"
  14340. "lsr r5, r4, #1\n\t"
  14341. "lsl r4, r4, %[n]\n\t"
  14342. "lsr r5, r5, r6\n\t"
  14343. "orr r2, r2, r5\n\t"
  14344. "ldr r3, [%[a], #44]\n\t"
  14345. "str r2, [%[r], #52]\n\t"
  14346. "lsr r5, r3, #1\n\t"
  14347. "lsl r3, r3, %[n]\n\t"
  14348. "lsr r5, r5, r6\n\t"
  14349. "orr r4, r4, r5\n\t"
  14350. "ldr r2, [%[a], #40]\n\t"
  14351. "str r4, [%[r], #48]\n\t"
  14352. "lsr r5, r2, #1\n\t"
  14353. "lsl r2, r2, %[n]\n\t"
  14354. "lsr r5, r5, r6\n\t"
  14355. "orr r3, r3, r5\n\t"
  14356. "ldr r4, [%[a], #36]\n\t"
  14357. "str r3, [%[r], #44]\n\t"
  14358. "lsr r5, r4, #1\n\t"
  14359. "lsl r4, r4, %[n]\n\t"
  14360. "lsr r5, r5, r6\n\t"
  14361. "orr r2, r2, r5\n\t"
  14362. "ldr r3, [%[a], #32]\n\t"
  14363. "str r2, [%[r], #40]\n\t"
  14364. "lsr r5, r3, #1\n\t"
  14365. "lsl r3, r3, %[n]\n\t"
  14366. "lsr r5, r5, r6\n\t"
  14367. "orr r4, r4, r5\n\t"
  14368. "ldr r2, [%[a], #28]\n\t"
  14369. "str r4, [%[r], #36]\n\t"
  14370. "lsr r5, r2, #1\n\t"
  14371. "lsl r2, r2, %[n]\n\t"
  14372. "lsr r5, r5, r6\n\t"
  14373. "orr r3, r3, r5\n\t"
  14374. "ldr r4, [%[a], #24]\n\t"
  14375. "str r3, [%[r], #32]\n\t"
  14376. "lsr r5, r4, #1\n\t"
  14377. "lsl r4, r4, %[n]\n\t"
  14378. "lsr r5, r5, r6\n\t"
  14379. "orr r2, r2, r5\n\t"
  14380. "ldr r3, [%[a], #20]\n\t"
  14381. "str r2, [%[r], #28]\n\t"
  14382. "lsr r5, r3, #1\n\t"
  14383. "lsl r3, r3, %[n]\n\t"
  14384. "lsr r5, r5, r6\n\t"
  14385. "orr r4, r4, r5\n\t"
  14386. "ldr r2, [%[a], #16]\n\t"
  14387. "str r4, [%[r], #24]\n\t"
  14388. "lsr r5, r2, #1\n\t"
  14389. "lsl r2, r2, %[n]\n\t"
  14390. "lsr r5, r5, r6\n\t"
  14391. "orr r3, r3, r5\n\t"
  14392. "ldr r4, [%[a], #12]\n\t"
  14393. "str r3, [%[r], #20]\n\t"
  14394. "lsr r5, r4, #1\n\t"
  14395. "lsl r4, r4, %[n]\n\t"
  14396. "lsr r5, r5, r6\n\t"
  14397. "orr r2, r2, r5\n\t"
  14398. "ldr r3, [%[a], #8]\n\t"
  14399. "str r2, [%[r], #16]\n\t"
  14400. "lsr r5, r3, #1\n\t"
  14401. "lsl r3, r3, %[n]\n\t"
  14402. "lsr r5, r5, r6\n\t"
  14403. "orr r4, r4, r5\n\t"
  14404. "ldr r2, [%[a], #4]\n\t"
  14405. "str r4, [%[r], #12]\n\t"
  14406. "lsr r5, r2, #1\n\t"
  14407. "lsl r2, r2, %[n]\n\t"
  14408. "lsr r5, r5, r6\n\t"
  14409. "orr r3, r3, r5\n\t"
  14410. "ldr r4, [%[a], #0]\n\t"
  14411. "str r3, [%[r], #8]\n\t"
  14412. "lsr r5, r4, #1\n\t"
  14413. "lsl r4, r4, %[n]\n\t"
  14414. "lsr r5, r5, r6\n\t"
  14415. "orr r2, r2, r5\n\t"
  14416. "sub %[a], %[a], #64\n\t"
  14417. "sub %[r], %[r], #64\n\t"
  14418. "ldr r3, [%[a], #60]\n\t"
  14419. "str r2, [%[r], #68]\n\t"
  14420. "lsr r5, r3, #1\n\t"
  14421. "lsl r3, r3, %[n]\n\t"
  14422. "lsr r5, r5, r6\n\t"
  14423. "orr r4, r4, r5\n\t"
  14424. "ldr r2, [%[a], #56]\n\t"
  14425. "str r4, [%[r], #64]\n\t"
  14426. "lsr r5, r2, #1\n\t"
  14427. "lsl r2, r2, %[n]\n\t"
  14428. "lsr r5, r5, r6\n\t"
  14429. "orr r3, r3, r5\n\t"
  14430. "ldr r4, [%[a], #52]\n\t"
  14431. "str r3, [%[r], #60]\n\t"
  14432. "lsr r5, r4, #1\n\t"
  14433. "lsl r4, r4, %[n]\n\t"
  14434. "lsr r5, r5, r6\n\t"
  14435. "orr r2, r2, r5\n\t"
  14436. "ldr r3, [%[a], #48]\n\t"
  14437. "str r2, [%[r], #56]\n\t"
  14438. "lsr r5, r3, #1\n\t"
  14439. "lsl r3, r3, %[n]\n\t"
  14440. "lsr r5, r5, r6\n\t"
  14441. "orr r4, r4, r5\n\t"
  14442. "ldr r2, [%[a], #44]\n\t"
  14443. "str r4, [%[r], #52]\n\t"
  14444. "lsr r5, r2, #1\n\t"
  14445. "lsl r2, r2, %[n]\n\t"
  14446. "lsr r5, r5, r6\n\t"
  14447. "orr r3, r3, r5\n\t"
  14448. "ldr r4, [%[a], #40]\n\t"
  14449. "str r3, [%[r], #48]\n\t"
  14450. "lsr r5, r4, #1\n\t"
  14451. "lsl r4, r4, %[n]\n\t"
  14452. "lsr r5, r5, r6\n\t"
  14453. "orr r2, r2, r5\n\t"
  14454. "ldr r3, [%[a], #36]\n\t"
  14455. "str r2, [%[r], #44]\n\t"
  14456. "lsr r5, r3, #1\n\t"
  14457. "lsl r3, r3, %[n]\n\t"
  14458. "lsr r5, r5, r6\n\t"
  14459. "orr r4, r4, r5\n\t"
  14460. "ldr r2, [%[a], #32]\n\t"
  14461. "str r4, [%[r], #40]\n\t"
  14462. "lsr r5, r2, #1\n\t"
  14463. "lsl r2, r2, %[n]\n\t"
  14464. "lsr r5, r5, r6\n\t"
  14465. "orr r3, r3, r5\n\t"
  14466. "ldr r4, [%[a], #28]\n\t"
  14467. "str r3, [%[r], #36]\n\t"
  14468. "lsr r5, r4, #1\n\t"
  14469. "lsl r4, r4, %[n]\n\t"
  14470. "lsr r5, r5, r6\n\t"
  14471. "orr r2, r2, r5\n\t"
  14472. "ldr r3, [%[a], #24]\n\t"
  14473. "str r2, [%[r], #32]\n\t"
  14474. "lsr r5, r3, #1\n\t"
  14475. "lsl r3, r3, %[n]\n\t"
  14476. "lsr r5, r5, r6\n\t"
  14477. "orr r4, r4, r5\n\t"
  14478. "ldr r2, [%[a], #20]\n\t"
  14479. "str r4, [%[r], #28]\n\t"
  14480. "lsr r5, r2, #1\n\t"
  14481. "lsl r2, r2, %[n]\n\t"
  14482. "lsr r5, r5, r6\n\t"
  14483. "orr r3, r3, r5\n\t"
  14484. "ldr r4, [%[a], #16]\n\t"
  14485. "str r3, [%[r], #24]\n\t"
  14486. "lsr r5, r4, #1\n\t"
  14487. "lsl r4, r4, %[n]\n\t"
  14488. "lsr r5, r5, r6\n\t"
  14489. "orr r2, r2, r5\n\t"
  14490. "ldr r3, [%[a], #12]\n\t"
  14491. "str r2, [%[r], #20]\n\t"
  14492. "lsr r5, r3, #1\n\t"
  14493. "lsl r3, r3, %[n]\n\t"
  14494. "lsr r5, r5, r6\n\t"
  14495. "orr r4, r4, r5\n\t"
  14496. "ldr r2, [%[a], #8]\n\t"
  14497. "str r4, [%[r], #16]\n\t"
  14498. "lsr r5, r2, #1\n\t"
  14499. "lsl r2, r2, %[n]\n\t"
  14500. "lsr r5, r5, r6\n\t"
  14501. "orr r3, r3, r5\n\t"
  14502. "ldr r4, [%[a], #4]\n\t"
  14503. "str r3, [%[r], #12]\n\t"
  14504. "lsr r5, r4, #1\n\t"
  14505. "lsl r4, r4, %[n]\n\t"
  14506. "lsr r5, r5, r6\n\t"
  14507. "orr r2, r2, r5\n\t"
  14508. "ldr r3, [%[a], #0]\n\t"
  14509. "str r2, [%[r], #8]\n\t"
  14510. "lsr r5, r3, #1\n\t"
  14511. "lsl r3, r3, %[n]\n\t"
  14512. "lsr r5, r5, r6\n\t"
  14513. "orr r4, r4, r5\n\t"
  14514. "sub %[a], %[a], #64\n\t"
  14515. "sub %[r], %[r], #64\n\t"
  14516. "ldr r2, [%[a], #60]\n\t"
  14517. "str r4, [%[r], #68]\n\t"
  14518. "lsr r5, r2, #1\n\t"
  14519. "lsl r2, r2, %[n]\n\t"
  14520. "lsr r5, r5, r6\n\t"
  14521. "orr r3, r3, r5\n\t"
  14522. "ldr r4, [%[a], #56]\n\t"
  14523. "str r3, [%[r], #64]\n\t"
  14524. "lsr r5, r4, #1\n\t"
  14525. "lsl r4, r4, %[n]\n\t"
  14526. "lsr r5, r5, r6\n\t"
  14527. "orr r2, r2, r5\n\t"
  14528. "ldr r3, [%[a], #52]\n\t"
  14529. "str r2, [%[r], #60]\n\t"
  14530. "lsr r5, r3, #1\n\t"
  14531. "lsl r3, r3, %[n]\n\t"
  14532. "lsr r5, r5, r6\n\t"
  14533. "orr r4, r4, r5\n\t"
  14534. "ldr r2, [%[a], #48]\n\t"
  14535. "str r4, [%[r], #56]\n\t"
  14536. "lsr r5, r2, #1\n\t"
  14537. "lsl r2, r2, %[n]\n\t"
  14538. "lsr r5, r5, r6\n\t"
  14539. "orr r3, r3, r5\n\t"
  14540. "ldr r4, [%[a], #44]\n\t"
  14541. "str r3, [%[r], #52]\n\t"
  14542. "lsr r5, r4, #1\n\t"
  14543. "lsl r4, r4, %[n]\n\t"
  14544. "lsr r5, r5, r6\n\t"
  14545. "orr r2, r2, r5\n\t"
  14546. "ldr r3, [%[a], #40]\n\t"
  14547. "str r2, [%[r], #48]\n\t"
  14548. "lsr r5, r3, #1\n\t"
  14549. "lsl r3, r3, %[n]\n\t"
  14550. "lsr r5, r5, r6\n\t"
  14551. "orr r4, r4, r5\n\t"
  14552. "ldr r2, [%[a], #36]\n\t"
  14553. "str r4, [%[r], #44]\n\t"
  14554. "lsr r5, r2, #1\n\t"
  14555. "lsl r2, r2, %[n]\n\t"
  14556. "lsr r5, r5, r6\n\t"
  14557. "orr r3, r3, r5\n\t"
  14558. "ldr r4, [%[a], #32]\n\t"
  14559. "str r3, [%[r], #40]\n\t"
  14560. "lsr r5, r4, #1\n\t"
  14561. "lsl r4, r4, %[n]\n\t"
  14562. "lsr r5, r5, r6\n\t"
  14563. "orr r2, r2, r5\n\t"
  14564. "ldr r3, [%[a], #28]\n\t"
  14565. "str r2, [%[r], #36]\n\t"
  14566. "lsr r5, r3, #1\n\t"
  14567. "lsl r3, r3, %[n]\n\t"
  14568. "lsr r5, r5, r6\n\t"
  14569. "orr r4, r4, r5\n\t"
  14570. "ldr r2, [%[a], #24]\n\t"
  14571. "str r4, [%[r], #32]\n\t"
  14572. "lsr r5, r2, #1\n\t"
  14573. "lsl r2, r2, %[n]\n\t"
  14574. "lsr r5, r5, r6\n\t"
  14575. "orr r3, r3, r5\n\t"
  14576. "ldr r4, [%[a], #20]\n\t"
  14577. "str r3, [%[r], #28]\n\t"
  14578. "lsr r5, r4, #1\n\t"
  14579. "lsl r4, r4, %[n]\n\t"
  14580. "lsr r5, r5, r6\n\t"
  14581. "orr r2, r2, r5\n\t"
  14582. "ldr r3, [%[a], #16]\n\t"
  14583. "str r2, [%[r], #24]\n\t"
  14584. "lsr r5, r3, #1\n\t"
  14585. "lsl r3, r3, %[n]\n\t"
  14586. "lsr r5, r5, r6\n\t"
  14587. "orr r4, r4, r5\n\t"
  14588. "ldr r2, [%[a], #12]\n\t"
  14589. "str r4, [%[r], #20]\n\t"
  14590. "lsr r5, r2, #1\n\t"
  14591. "lsl r2, r2, %[n]\n\t"
  14592. "lsr r5, r5, r6\n\t"
  14593. "orr r3, r3, r5\n\t"
  14594. "ldr r4, [%[a], #8]\n\t"
  14595. "str r3, [%[r], #16]\n\t"
  14596. "lsr r5, r4, #1\n\t"
  14597. "lsl r4, r4, %[n]\n\t"
  14598. "lsr r5, r5, r6\n\t"
  14599. "orr r2, r2, r5\n\t"
  14600. "ldr r3, [%[a], #4]\n\t"
  14601. "str r2, [%[r], #12]\n\t"
  14602. "lsr r5, r3, #1\n\t"
  14603. "lsl r3, r3, %[n]\n\t"
  14604. "lsr r5, r5, r6\n\t"
  14605. "orr r4, r4, r5\n\t"
  14606. "ldr r2, [%[a], #0]\n\t"
  14607. "str r4, [%[r], #8]\n\t"
  14608. "lsr r5, r2, #1\n\t"
  14609. "lsl r2, r2, %[n]\n\t"
  14610. "lsr r5, r5, r6\n\t"
  14611. "orr r3, r3, r5\n\t"
  14612. "str r2, [%[r]]\n\t"
  14613. "str r3, [%[r], #4]\n\t"
  14614. :
  14615. : [r] "r" (r), [a] "r" (a), [n] "r" (n)
  14616. : "memory", "r2", "r3", "r4", "r5", "r6"
  14617. );
  14618. }
  14619. /* Modular exponentiate 2 to the e mod m. (r = 2^e mod m)
  14620. *
  14621. * r A single precision number that is the result of the operation.
  14622. * e A single precision number that is the exponent.
  14623. * bits The number of bits in the exponent.
  14624. * m A single precision number that is the modulus.
  14625. * returns 0 on success.
  14626. * returns MEMORY_E on dynamic memory allocation failure.
  14627. * returns MP_VAL when base is even.
  14628. */
  14629. static int sp_4096_mod_exp_2_128(sp_digit* r, const sp_digit* e, int bits,
  14630. const sp_digit* m)
  14631. {
  14632. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  14633. sp_digit* td = NULL;
  14634. #else
  14635. sp_digit td[385];
  14636. #endif
  14637. sp_digit* norm = NULL;
  14638. sp_digit* tmp = NULL;
  14639. sp_digit mp = 1;
  14640. sp_digit n;
  14641. sp_digit o;
  14642. sp_digit mask;
  14643. int i;
  14644. int c;
  14645. byte y;
  14646. int err = MP_OKAY;
  14647. if (bits == 0) {
  14648. err = MP_VAL;
  14649. }
  14650. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  14651. if (err == MP_OKAY) {
  14652. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * 385, NULL,
  14653. DYNAMIC_TYPE_TMP_BUFFER);
  14654. if (td == NULL)
  14655. err = MEMORY_E;
  14656. }
  14657. #endif
  14658. if (err == MP_OKAY) {
  14659. norm = td;
  14660. tmp = td + 256;
  14661. sp_4096_mont_setup(m, &mp);
  14662. sp_4096_mont_norm_128(norm, m);
  14663. i = (bits - 1) / 32;
  14664. n = e[i--];
  14665. c = bits & 31;
  14666. if (c == 0) {
  14667. c = 32;
  14668. }
  14669. c -= bits % 5;
  14670. if (c == 32) {
  14671. c = 27;
  14672. }
  14673. if (c < 0) {
  14674. /* Number of bits in top word is less than number needed. */
  14675. c = -c;
  14676. y = (byte)(n << c);
  14677. n = e[i--];
  14678. y |= (byte)(n >> (64 - c));
  14679. n <<= c;
  14680. c = 64 - c;
  14681. }
  14682. else if (c == 0) {
  14683. /* All bits in top word used. */
  14684. y = (byte)n;
  14685. }
  14686. else {
  14687. y = (byte)(n >> c);
  14688. n <<= 32 - c;
  14689. }
  14690. sp_4096_lshift_128(r, norm, y);
  14691. for (; i>=0 || c>=5; ) {
  14692. if (c == 0) {
  14693. n = e[i--];
  14694. y = (byte)(n >> 27);
  14695. n <<= 5;
  14696. c = 27;
  14697. }
  14698. else if (c < 5) {
  14699. y = (byte)(n >> 27);
  14700. n = e[i--];
  14701. c = 5 - c;
  14702. y |= (byte)(n >> (32 - c));
  14703. n <<= c;
  14704. c = 32 - c;
  14705. }
  14706. else {
  14707. y = (byte)((n >> 27) & 0x1f);
  14708. n <<= 5;
  14709. c -= 5;
  14710. }
  14711. sp_4096_mont_sqr_128(r, r, m, mp);
  14712. sp_4096_mont_sqr_128(r, r, m, mp);
  14713. sp_4096_mont_sqr_128(r, r, m, mp);
  14714. sp_4096_mont_sqr_128(r, r, m, mp);
  14715. sp_4096_mont_sqr_128(r, r, m, mp);
  14716. sp_4096_lshift_128(r, r, y);
  14717. sp_4096_mul_d_128(tmp, norm, r[128]);
  14718. r[128] = 0;
  14719. o = sp_4096_add_128(r, r, tmp);
  14720. sp_4096_cond_sub_128(r, r, m, (sp_digit)0 - o);
  14721. }
  14722. XMEMSET(&r[128], 0, sizeof(sp_digit) * 128U);
  14723. sp_4096_mont_reduce_128(r, m, mp);
  14724. mask = 0 - (sp_4096_cmp_128(r, m) >= 0);
  14725. sp_4096_cond_sub_128(r, r, m, mask);
  14726. }
  14727. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  14728. if (td != NULL)
  14729. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  14730. #endif
  14731. return err;
  14732. }
  14733. #endif /* HAVE_FFDHE_4096 */
  14734. /* Perform the modular exponentiation for Diffie-Hellman.
  14735. *
  14736. * base Base.
  14737. * exp Array of bytes that is the exponent.
  14738. * expLen Length of data, in bytes, in exponent.
  14739. * mod Modulus.
  14740. * out Buffer to hold big-endian bytes of exponentiation result.
  14741. * Must be at least 512 bytes long.
  14742. * outLen Length, in bytes, of exponentiation result.
  14743. * returns 0 on success, MP_READ_E if there are too many bytes in an array
  14744. * and MEMORY_E if memory allocation fails.
  14745. */
  14746. int sp_DhExp_4096(const mp_int* base, const byte* exp, word32 expLen,
  14747. const mp_int* mod, byte* out, word32* outLen)
  14748. {
  14749. int err = MP_OKAY;
  14750. sp_digit b[256];
  14751. sp_digit e[128];
  14752. sp_digit m[128];
  14753. sp_digit* r = b;
  14754. word32 i;
  14755. if (mp_count_bits(base) > 4096) {
  14756. err = MP_READ_E;
  14757. }
  14758. else if (expLen > 512) {
  14759. err = MP_READ_E;
  14760. }
  14761. else if (mp_count_bits(mod) != 4096) {
  14762. err = MP_READ_E;
  14763. }
  14764. else if (mp_iseven(mod)) {
  14765. err = MP_VAL;
  14766. }
  14767. if (err == MP_OKAY) {
  14768. sp_4096_from_mp(b, 128, base);
  14769. sp_4096_from_bin(e, 128, exp, expLen);
  14770. sp_4096_from_mp(m, 128, mod);
  14771. #ifdef HAVE_FFDHE_4096
  14772. if (base->used == 1 && base->dp[0] == 2 && m[127] == (sp_digit)-1)
  14773. err = sp_4096_mod_exp_2_128(r, e, expLen * 8, m);
  14774. else
  14775. #endif
  14776. err = sp_4096_mod_exp_128(r, b, e, expLen * 8, m, 0);
  14777. }
  14778. if (err == MP_OKAY) {
  14779. sp_4096_to_bin_128(r, out);
  14780. *outLen = 512;
  14781. for (i=0; i<512 && out[i] == 0; i++) {
  14782. /* Search for first non-zero. */
  14783. }
  14784. *outLen -= i;
  14785. XMEMMOVE(out, out + i, *outLen);
  14786. }
  14787. XMEMSET(e, 0, sizeof(e));
  14788. return err;
  14789. }
  14790. #endif /* WOLFSSL_HAVE_SP_DH */
  14791. #endif /* WOLFSSL_HAVE_SP_DH | (WOLFSSL_HAVE_SP_RSA & !WOLFSSL_RSA_PUBLIC_ONLY) */
  14792. #endif /* WOLFSSL_SP_4096 */
  14793. #endif /* WOLFSSL_HAVE_SP_RSA | WOLFSSL_HAVE_SP_DH */
  14794. #ifdef WOLFSSL_HAVE_SP_ECC
  14795. #ifndef WOLFSSL_SP_NO_256
  14796. /* Point structure to use. */
  14797. typedef struct sp_point_256 {
  14798. /* X ordinate of point. */
  14799. sp_digit x[2 * 8];
  14800. /* Y ordinate of point. */
  14801. sp_digit y[2 * 8];
  14802. /* Z ordinate of point. */
  14803. sp_digit z[2 * 8];
  14804. /* Indicates point is at infinity. */
  14805. int infinity;
  14806. } sp_point_256;
  14807. /* The modulus (prime) of the curve P256: p = 2^256 - 2^224 + 2^192 + 2^96 - 1, stored least significant word first. */
  14808. static const sp_digit p256_mod[8] = {
  14809. 0xffffffff,0xffffffff,0xffffffff,0x00000000,0x00000000,0x00000000,
  14810. 0x00000001,0xffffffff
  14811. };
  14812. /* The Montgomery normalizer for modulus of the curve P256. The words equal 2^256 - p, stored least significant word first. */
  14813. static const sp_digit p256_norm_mod[8] = {
  14814. 0x00000001,0x00000000,0x00000000,0xffffffff,0xffffffff,0xffffffff,
  14815. 0xfffffffe,0x00000000
  14816. };
  14817. /* The Montgomery multiplier for modulus of the curve P256. NOTE(review): presumably -1/p mod 2^32, which is 1 because the low word of p is 0xffffffff - confirm at the reduction routine. */
  14818. static const sp_digit p256_mp_mod = 0x00000001;
  14819. #if defined(WOLFSSL_VALIDATE_ECC_KEYGEN) || defined(HAVE_ECC_SIGN) || \
  14820. defined(HAVE_ECC_VERIFY)
  14821. /* The order of the curve P256, stored least significant word first. Only compiled when WOLFSSL_VALIDATE_ECC_KEYGEN, HAVE_ECC_SIGN or HAVE_ECC_VERIFY is defined. */
  14822. static const sp_digit p256_order[8] = {
  14823. 0xfc632551,0xf3b9cac2,0xa7179e84,0xbce6faad,0xffffffff,0xffffffff,
  14824. 0x00000000,0xffffffff
  14825. };
  14826. #endif
  14827. /* The order of the curve P256 minus 2 (only the lowest word differs: 0xfc632551 - 2 = 0xfc63254f). NOTE(review): presumably the exponent for inversion modulo the order - confirm at the use site. */
  14828. static const sp_digit p256_order2[8] = {
  14829. 0xfc63254f,0xf3b9cac2,0xa7179e84,0xbce6faad,0xffffffff,0xffffffff,
  14830. 0x00000000,0xffffffff
  14831. };
  14832. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  14833. /* The Montgomery normalizer for order of the curve P256. The words equal 2^256 - order, stored least significant word first. */
  14834. static const sp_digit p256_norm_order[8] = {
  14835. 0x039cdaaf,0x0c46353d,0x58e8617b,0x43190552,0x00000000,0x00000000,
  14836. 0xffffffff,0x00000000
  14837. };
  14838. #endif
  14839. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  14840. /* The Montgomery multiplier for order of the curve P256; only compiled for signing or verification. NOTE(review): presumably -1/order mod 2^32 - confirm at the reduction routine. */
  14841. static const sp_digit p256_mp_order = 0xee00bc4f;
  14842. #endif
  14843. /* The base point of curve P256. Each ordinate is 8 value words (least significant first) followed by 8 zero words filling the 16-digit array; Z is 1 and the infinity flag is clear. */
  14844. static const sp_point_256 p256_base = {
  14845. /* X ordinate: 8 value words, then 8 words of zero padding */
  14846. {
  14847. 0xd898c296,0xf4a13945,0x2deb33a0,0x77037d81,0x63a440f2,0xf8bce6e5,
  14848. 0xe12c4247,0x6b17d1f2,
  14849. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  14850. (sp_digit)0, (sp_digit)0, (sp_digit)0
  14851. },
  14852. /* Y ordinate: 8 value words, then 8 words of zero padding */
  14853. {
  14854. 0x37bf51f5,0xcbb64068,0x6b315ece,0x2bce3357,0x7c0f9e16,0x8ee7eb4a,
  14855. 0xfe1a7f9b,0x4fe342e2,
  14856. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  14857. (sp_digit)0, (sp_digit)0, (sp_digit)0
  14858. },
  14859. /* Z ordinate: the value 1, then 8 words of zero padding */
  14860. {
  14861. 0x00000001,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  14862. 0x00000000,0x00000000,
  14863. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  14864. (sp_digit)0, (sp_digit)0, (sp_digit)0
  14865. },
  14866. /* infinity: 0, the base point is not the point at infinity */
  14867. 0
  14868. };
  14869. #if defined(HAVE_ECC_CHECK_KEY) || defined(HAVE_COMP_KEY)
  14870. static const sp_digit p256_b[8] = { /* The b coefficient of the curve P256, stored least significant word first. */
  14871. 0x27d2604b,0x3bce3c3e,0xcc53b0f6,0x651d06b0,0x769886bc,0xb3ebbd55,
  14872. 0xaa3a93e7,0x5ac635d8
  14873. };
  14874. #endif
  14875. /* Multiply a and b into r. (r = a * b)
  14876. *
  14877. * r A single precision integer.
  14878. * a A single precision integer.
  14879. * b A single precision integer.
  14880. */
  14881. SP_NOINLINE static void sp_256_mul_8(sp_digit* r, const sp_digit* a,
  14882. const sp_digit* b)
  14883. {
  14884. sp_digit tmp_arr[8];
  14885. sp_digit* tmp = tmp_arr;
  14886. __asm__ __volatile__ (
  14887. /* A[0] * B[0] */
  14888. "ldr r6, [%[a], #0]\n\t"
  14889. "ldr r8, [%[b], #0]\n\t"
  14890. "umull r3, r4, r6, r8\n\t"
  14891. "mov r5, #0\n\t"
  14892. "str r3, [%[tmp], #0]\n\t"
  14893. "mov r3, #0\n\t"
  14894. /* A[0] * B[1] */
  14895. "ldr r8, [%[b], #4]\n\t"
  14896. "umull r6, r8, r6, r8\n\t"
  14897. "adds r4, r4, r6\n\t"
  14898. "adc r5, r5, r8\n\t"
  14899. /* A[1] * B[0] */
  14900. "ldr r6, [%[a], #4]\n\t"
  14901. "ldr r8, [%[b], #0]\n\t"
  14902. "umull r6, r8, r6, r8\n\t"
  14903. "adds r4, r4, r6\n\t"
  14904. "adcs r5, r5, r8\n\t"
  14905. "adc r3, r3, #0\n\t"
  14906. "str r4, [%[tmp], #4]\n\t"
  14907. "mov r4, #0\n\t"
  14908. /* A[0] * B[2] */
  14909. "ldr r6, [%[a], #0]\n\t"
  14910. "ldr r8, [%[b], #8]\n\t"
  14911. "umull r6, r8, r6, r8\n\t"
  14912. "adds r5, r5, r6\n\t"
  14913. "adcs r3, r3, r8\n\t"
  14914. "adc r4, r4, #0\n\t"
  14915. /* A[1] * B[1] */
  14916. "ldr r6, [%[a], #4]\n\t"
  14917. "ldr r8, [%[b], #4]\n\t"
  14918. "umull r6, r8, r6, r8\n\t"
  14919. "adds r5, r5, r6\n\t"
  14920. "adcs r3, r3, r8\n\t"
  14921. "adc r4, r4, #0\n\t"
  14922. /* A[2] * B[0] */
  14923. "ldr r6, [%[a], #8]\n\t"
  14924. "ldr r8, [%[b], #0]\n\t"
  14925. "umull r6, r8, r6, r8\n\t"
  14926. "adds r5, r5, r6\n\t"
  14927. "adcs r3, r3, r8\n\t"
  14928. "adc r4, r4, #0\n\t"
  14929. "str r5, [%[tmp], #8]\n\t"
  14930. "mov r5, #0\n\t"
  14931. /* A[0] * B[3] */
  14932. "ldr r6, [%[a], #0]\n\t"
  14933. "ldr r8, [%[b], #12]\n\t"
  14934. "umull r6, r8, r6, r8\n\t"
  14935. "adds r3, r3, r6\n\t"
  14936. "adcs r4, r4, r8\n\t"
  14937. "adc r5, r5, #0\n\t"
  14938. /* A[1] * B[2] */
  14939. "ldr r6, [%[a], #4]\n\t"
  14940. "ldr r8, [%[b], #8]\n\t"
  14941. "umull r6, r8, r6, r8\n\t"
  14942. "adds r3, r3, r6\n\t"
  14943. "adcs r4, r4, r8\n\t"
  14944. "adc r5, r5, #0\n\t"
  14945. /* A[2] * B[1] */
  14946. "ldr r6, [%[a], #8]\n\t"
  14947. "ldr r8, [%[b], #4]\n\t"
  14948. "umull r6, r8, r6, r8\n\t"
  14949. "adds r3, r3, r6\n\t"
  14950. "adcs r4, r4, r8\n\t"
  14951. "adc r5, r5, #0\n\t"
  14952. /* A[3] * B[0] */
  14953. "ldr r6, [%[a], #12]\n\t"
  14954. "ldr r8, [%[b], #0]\n\t"
  14955. "umull r6, r8, r6, r8\n\t"
  14956. "adds r3, r3, r6\n\t"
  14957. "adcs r4, r4, r8\n\t"
  14958. "adc r5, r5, #0\n\t"
  14959. "str r3, [%[tmp], #12]\n\t"
  14960. "mov r3, #0\n\t"
  14961. /* A[0] * B[4] */
  14962. "ldr r6, [%[a], #0]\n\t"
  14963. "ldr r8, [%[b], #16]\n\t"
  14964. "umull r6, r8, r6, r8\n\t"
  14965. "adds r4, r4, r6\n\t"
  14966. "adcs r5, r5, r8\n\t"
  14967. "adc r3, r3, #0\n\t"
  14968. /* A[1] * B[3] */
  14969. "ldr r6, [%[a], #4]\n\t"
  14970. "ldr r8, [%[b], #12]\n\t"
  14971. "umull r6, r8, r6, r8\n\t"
  14972. "adds r4, r4, r6\n\t"
  14973. "adcs r5, r5, r8\n\t"
  14974. "adc r3, r3, #0\n\t"
  14975. /* A[2] * B[2] */
  14976. "ldr r6, [%[a], #8]\n\t"
  14977. "ldr r8, [%[b], #8]\n\t"
  14978. "umull r6, r8, r6, r8\n\t"
  14979. "adds r4, r4, r6\n\t"
  14980. "adcs r5, r5, r8\n\t"
  14981. "adc r3, r3, #0\n\t"
  14982. /* A[3] * B[1] */
  14983. "ldr r6, [%[a], #12]\n\t"
  14984. "ldr r8, [%[b], #4]\n\t"
  14985. "umull r6, r8, r6, r8\n\t"
  14986. "adds r4, r4, r6\n\t"
  14987. "adcs r5, r5, r8\n\t"
  14988. "adc r3, r3, #0\n\t"
  14989. /* A[4] * B[0] */
  14990. "ldr r6, [%[a], #16]\n\t"
  14991. "ldr r8, [%[b], #0]\n\t"
  14992. "umull r6, r8, r6, r8\n\t"
  14993. "adds r4, r4, r6\n\t"
  14994. "adcs r5, r5, r8\n\t"
  14995. "adc r3, r3, #0\n\t"
  14996. "str r4, [%[tmp], #16]\n\t"
  14997. "mov r4, #0\n\t"
  14998. /* A[0] * B[5] */
  14999. "ldr r6, [%[a], #0]\n\t"
  15000. "ldr r8, [%[b], #20]\n\t"
  15001. "umull r6, r8, r6, r8\n\t"
  15002. "adds r5, r5, r6\n\t"
  15003. "adcs r3, r3, r8\n\t"
  15004. "adc r4, r4, #0\n\t"
  15005. /* A[1] * B[4] */
  15006. "ldr r6, [%[a], #4]\n\t"
  15007. "ldr r8, [%[b], #16]\n\t"
  15008. "umull r6, r8, r6, r8\n\t"
  15009. "adds r5, r5, r6\n\t"
  15010. "adcs r3, r3, r8\n\t"
  15011. "adc r4, r4, #0\n\t"
  15012. /* A[2] * B[3] */
  15013. "ldr r6, [%[a], #8]\n\t"
  15014. "ldr r8, [%[b], #12]\n\t"
  15015. "umull r6, r8, r6, r8\n\t"
  15016. "adds r5, r5, r6\n\t"
  15017. "adcs r3, r3, r8\n\t"
  15018. "adc r4, r4, #0\n\t"
  15019. /* A[3] * B[2] */
  15020. "ldr r6, [%[a], #12]\n\t"
  15021. "ldr r8, [%[b], #8]\n\t"
  15022. "umull r6, r8, r6, r8\n\t"
  15023. "adds r5, r5, r6\n\t"
  15024. "adcs r3, r3, r8\n\t"
  15025. "adc r4, r4, #0\n\t"
  15026. /* A[4] * B[1] */
  15027. "ldr r6, [%[a], #16]\n\t"
  15028. "ldr r8, [%[b], #4]\n\t"
  15029. "umull r6, r8, r6, r8\n\t"
  15030. "adds r5, r5, r6\n\t"
  15031. "adcs r3, r3, r8\n\t"
  15032. "adc r4, r4, #0\n\t"
  15033. /* A[5] * B[0] */
  15034. "ldr r6, [%[a], #20]\n\t"
  15035. "ldr r8, [%[b], #0]\n\t"
  15036. "umull r6, r8, r6, r8\n\t"
  15037. "adds r5, r5, r6\n\t"
  15038. "adcs r3, r3, r8\n\t"
  15039. "adc r4, r4, #0\n\t"
  15040. "str r5, [%[tmp], #20]\n\t"
  15041. "mov r5, #0\n\t"
  15042. /* A[0] * B[6] */
  15043. "ldr r6, [%[a], #0]\n\t"
  15044. "ldr r8, [%[b], #24]\n\t"
  15045. "umull r6, r8, r6, r8\n\t"
  15046. "adds r3, r3, r6\n\t"
  15047. "adcs r4, r4, r8\n\t"
  15048. "adc r5, r5, #0\n\t"
  15049. /* A[1] * B[5] */
  15050. "ldr r6, [%[a], #4]\n\t"
  15051. "ldr r8, [%[b], #20]\n\t"
  15052. "umull r6, r8, r6, r8\n\t"
  15053. "adds r3, r3, r6\n\t"
  15054. "adcs r4, r4, r8\n\t"
  15055. "adc r5, r5, #0\n\t"
  15056. /* A[2] * B[4] */
  15057. "ldr r6, [%[a], #8]\n\t"
  15058. "ldr r8, [%[b], #16]\n\t"
  15059. "umull r6, r8, r6, r8\n\t"
  15060. "adds r3, r3, r6\n\t"
  15061. "adcs r4, r4, r8\n\t"
  15062. "adc r5, r5, #0\n\t"
  15063. /* A[3] * B[3] */
  15064. "ldr r6, [%[a], #12]\n\t"
  15065. "ldr r8, [%[b], #12]\n\t"
  15066. "umull r6, r8, r6, r8\n\t"
  15067. "adds r3, r3, r6\n\t"
  15068. "adcs r4, r4, r8\n\t"
  15069. "adc r5, r5, #0\n\t"
  15070. /* A[4] * B[2] */
  15071. "ldr r6, [%[a], #16]\n\t"
  15072. "ldr r8, [%[b], #8]\n\t"
  15073. "umull r6, r8, r6, r8\n\t"
  15074. "adds r3, r3, r6\n\t"
  15075. "adcs r4, r4, r8\n\t"
  15076. "adc r5, r5, #0\n\t"
  15077. /* A[5] * B[1] */
  15078. "ldr r6, [%[a], #20]\n\t"
  15079. "ldr r8, [%[b], #4]\n\t"
  15080. "umull r6, r8, r6, r8\n\t"
  15081. "adds r3, r3, r6\n\t"
  15082. "adcs r4, r4, r8\n\t"
  15083. "adc r5, r5, #0\n\t"
  15084. /* A[6] * B[0] */
  15085. "ldr r6, [%[a], #24]\n\t"
  15086. "ldr r8, [%[b], #0]\n\t"
  15087. "umull r6, r8, r6, r8\n\t"
  15088. "adds r3, r3, r6\n\t"
  15089. "adcs r4, r4, r8\n\t"
  15090. "adc r5, r5, #0\n\t"
  15091. "str r3, [%[tmp], #24]\n\t"
  15092. "mov r3, #0\n\t"
  15093. /* A[0] * B[7] */
  15094. "ldr r6, [%[a], #0]\n\t"
  15095. "ldr r8, [%[b], #28]\n\t"
  15096. "umull r6, r8, r6, r8\n\t"
  15097. "adds r4, r4, r6\n\t"
  15098. "adcs r5, r5, r8\n\t"
  15099. "adc r3, r3, #0\n\t"
  15100. /* A[1] * B[6] */
  15101. "ldr r6, [%[a], #4]\n\t"
  15102. "ldr r8, [%[b], #24]\n\t"
  15103. "umull r6, r8, r6, r8\n\t"
  15104. "adds r4, r4, r6\n\t"
  15105. "adcs r5, r5, r8\n\t"
  15106. "adc r3, r3, #0\n\t"
  15107. /* A[2] * B[5] */
  15108. "ldr r6, [%[a], #8]\n\t"
  15109. "ldr r8, [%[b], #20]\n\t"
  15110. "umull r6, r8, r6, r8\n\t"
  15111. "adds r4, r4, r6\n\t"
  15112. "adcs r5, r5, r8\n\t"
  15113. "adc r3, r3, #0\n\t"
  15114. /* A[3] * B[4] */
  15115. "ldr r6, [%[a], #12]\n\t"
  15116. "ldr r8, [%[b], #16]\n\t"
  15117. "umull r6, r8, r6, r8\n\t"
  15118. "adds r4, r4, r6\n\t"
  15119. "adcs r5, r5, r8\n\t"
  15120. "adc r3, r3, #0\n\t"
  15121. /* A[4] * B[3] */
  15122. "ldr r6, [%[a], #16]\n\t"
  15123. "ldr r8, [%[b], #12]\n\t"
  15124. "umull r6, r8, r6, r8\n\t"
  15125. "adds r4, r4, r6\n\t"
  15126. "adcs r5, r5, r8\n\t"
  15127. "adc r3, r3, #0\n\t"
  15128. /* A[5] * B[2] */
  15129. "ldr r6, [%[a], #20]\n\t"
  15130. "ldr r8, [%[b], #8]\n\t"
  15131. "umull r6, r8, r6, r8\n\t"
  15132. "adds r4, r4, r6\n\t"
  15133. "adcs r5, r5, r8\n\t"
  15134. "adc r3, r3, #0\n\t"
  15135. /* A[6] * B[1] */
  15136. "ldr r6, [%[a], #24]\n\t"
  15137. "ldr r8, [%[b], #4]\n\t"
  15138. "umull r6, r8, r6, r8\n\t"
  15139. "adds r4, r4, r6\n\t"
  15140. "adcs r5, r5, r8\n\t"
  15141. "adc r3, r3, #0\n\t"
  15142. /* A[7] * B[0] */
  15143. "ldr r6, [%[a], #28]\n\t"
  15144. "ldr r8, [%[b], #0]\n\t"
  15145. "umull r6, r8, r6, r8\n\t"
  15146. "adds r4, r4, r6\n\t"
  15147. "adcs r5, r5, r8\n\t"
  15148. "adc r3, r3, #0\n\t"
  15149. "str r4, [%[tmp], #28]\n\t"
  15150. "mov r4, #0\n\t"
  15151. /* A[1] * B[7] */
  15152. "ldr r6, [%[a], #4]\n\t"
  15153. "ldr r8, [%[b], #28]\n\t"
  15154. "umull r6, r8, r6, r8\n\t"
  15155. "adds r5, r5, r6\n\t"
  15156. "adcs r3, r3, r8\n\t"
  15157. "adc r4, r4, #0\n\t"
  15158. /* A[2] * B[6] */
  15159. "ldr r6, [%[a], #8]\n\t"
  15160. "ldr r8, [%[b], #24]\n\t"
  15161. "umull r6, r8, r6, r8\n\t"
  15162. "adds r5, r5, r6\n\t"
  15163. "adcs r3, r3, r8\n\t"
  15164. "adc r4, r4, #0\n\t"
  15165. /* A[3] * B[5] */
  15166. "ldr r6, [%[a], #12]\n\t"
  15167. "ldr r8, [%[b], #20]\n\t"
  15168. "umull r6, r8, r6, r8\n\t"
  15169. "adds r5, r5, r6\n\t"
  15170. "adcs r3, r3, r8\n\t"
  15171. "adc r4, r4, #0\n\t"
  15172. /* A[4] * B[4] */
  15173. "ldr r6, [%[a], #16]\n\t"
  15174. "ldr r8, [%[b], #16]\n\t"
  15175. "umull r6, r8, r6, r8\n\t"
  15176. "adds r5, r5, r6\n\t"
  15177. "adcs r3, r3, r8\n\t"
  15178. "adc r4, r4, #0\n\t"
  15179. /* A[5] * B[3] */
  15180. "ldr r6, [%[a], #20]\n\t"
  15181. "ldr r8, [%[b], #12]\n\t"
  15182. "umull r6, r8, r6, r8\n\t"
  15183. "adds r5, r5, r6\n\t"
  15184. "adcs r3, r3, r8\n\t"
  15185. "adc r4, r4, #0\n\t"
  15186. /* A[6] * B[2] */
  15187. "ldr r6, [%[a], #24]\n\t"
  15188. "ldr r8, [%[b], #8]\n\t"
  15189. "umull r6, r8, r6, r8\n\t"
  15190. "adds r5, r5, r6\n\t"
  15191. "adcs r3, r3, r8\n\t"
  15192. "adc r4, r4, #0\n\t"
  15193. /* A[7] * B[1] */
  15194. "ldr r6, [%[a], #28]\n\t"
  15195. "ldr r8, [%[b], #4]\n\t"
  15196. "umull r6, r8, r6, r8\n\t"
  15197. "adds r5, r5, r6\n\t"
  15198. "adcs r3, r3, r8\n\t"
  15199. "adc r4, r4, #0\n\t"
  15200. "str r5, [%[r], #32]\n\t"
  15201. "mov r5, #0\n\t"
  15202. /* A[2] * B[7] */
  15203. "ldr r6, [%[a], #8]\n\t"
  15204. "ldr r8, [%[b], #28]\n\t"
  15205. "umull r6, r8, r6, r8\n\t"
  15206. "adds r3, r3, r6\n\t"
  15207. "adcs r4, r4, r8\n\t"
  15208. "adc r5, r5, #0\n\t"
  15209. /* A[3] * B[6] */
  15210. "ldr r6, [%[a], #12]\n\t"
  15211. "ldr r8, [%[b], #24]\n\t"
  15212. "umull r6, r8, r6, r8\n\t"
  15213. "adds r3, r3, r6\n\t"
  15214. "adcs r4, r4, r8\n\t"
  15215. "adc r5, r5, #0\n\t"
  15216. /* A[4] * B[5] */
  15217. "ldr r6, [%[a], #16]\n\t"
  15218. "ldr r8, [%[b], #20]\n\t"
  15219. "umull r6, r8, r6, r8\n\t"
  15220. "adds r3, r3, r6\n\t"
  15221. "adcs r4, r4, r8\n\t"
  15222. "adc r5, r5, #0\n\t"
  15223. /* A[5] * B[4] */
  15224. "ldr r6, [%[a], #20]\n\t"
  15225. "ldr r8, [%[b], #16]\n\t"
  15226. "umull r6, r8, r6, r8\n\t"
  15227. "adds r3, r3, r6\n\t"
  15228. "adcs r4, r4, r8\n\t"
  15229. "adc r5, r5, #0\n\t"
  15230. /* A[6] * B[3] */
  15231. "ldr r6, [%[a], #24]\n\t"
  15232. "ldr r8, [%[b], #12]\n\t"
  15233. "umull r6, r8, r6, r8\n\t"
  15234. "adds r3, r3, r6\n\t"
  15235. "adcs r4, r4, r8\n\t"
  15236. "adc r5, r5, #0\n\t"
  15237. /* A[7] * B[2] */
  15238. "ldr r6, [%[a], #28]\n\t"
  15239. "ldr r8, [%[b], #8]\n\t"
  15240. "umull r6, r8, r6, r8\n\t"
  15241. "adds r3, r3, r6\n\t"
  15242. "adcs r4, r4, r8\n\t"
  15243. "adc r5, r5, #0\n\t"
  15244. "str r3, [%[r], #36]\n\t"
  15245. "mov r3, #0\n\t"
  15246. /* A[3] * B[7] */
  15247. "ldr r6, [%[a], #12]\n\t"
  15248. "ldr r8, [%[b], #28]\n\t"
  15249. "umull r6, r8, r6, r8\n\t"
  15250. "adds r4, r4, r6\n\t"
  15251. "adcs r5, r5, r8\n\t"
  15252. "adc r3, r3, #0\n\t"
  15253. /* A[4] * B[6] */
  15254. "ldr r6, [%[a], #16]\n\t"
  15255. "ldr r8, [%[b], #24]\n\t"
  15256. "umull r6, r8, r6, r8\n\t"
  15257. "adds r4, r4, r6\n\t"
  15258. "adcs r5, r5, r8\n\t"
  15259. "adc r3, r3, #0\n\t"
  15260. /* A[5] * B[5] */
  15261. "ldr r6, [%[a], #20]\n\t"
  15262. "ldr r8, [%[b], #20]\n\t"
  15263. "umull r6, r8, r6, r8\n\t"
  15264. "adds r4, r4, r6\n\t"
  15265. "adcs r5, r5, r8\n\t"
  15266. "adc r3, r3, #0\n\t"
  15267. /* A[6] * B[4] */
  15268. "ldr r6, [%[a], #24]\n\t"
  15269. "ldr r8, [%[b], #16]\n\t"
  15270. "umull r6, r8, r6, r8\n\t"
  15271. "adds r4, r4, r6\n\t"
  15272. "adcs r5, r5, r8\n\t"
  15273. "adc r3, r3, #0\n\t"
  15274. /* A[7] * B[3] */
  15275. "ldr r6, [%[a], #28]\n\t"
  15276. "ldr r8, [%[b], #12]\n\t"
  15277. "umull r6, r8, r6, r8\n\t"
  15278. "adds r4, r4, r6\n\t"
  15279. "adcs r5, r5, r8\n\t"
  15280. "adc r3, r3, #0\n\t"
  15281. "str r4, [%[r], #40]\n\t"
  15282. "mov r4, #0\n\t"
  15283. /* A[4] * B[7] */
  15284. "ldr r6, [%[a], #16]\n\t"
  15285. "ldr r8, [%[b], #28]\n\t"
  15286. "umull r6, r8, r6, r8\n\t"
  15287. "adds r5, r5, r6\n\t"
  15288. "adcs r3, r3, r8\n\t"
  15289. "adc r4, r4, #0\n\t"
  15290. /* A[5] * B[6] */
  15291. "ldr r6, [%[a], #20]\n\t"
  15292. "ldr r8, [%[b], #24]\n\t"
  15293. "umull r6, r8, r6, r8\n\t"
  15294. "adds r5, r5, r6\n\t"
  15295. "adcs r3, r3, r8\n\t"
  15296. "adc r4, r4, #0\n\t"
  15297. /* A[6] * B[5] */
  15298. "ldr r6, [%[a], #24]\n\t"
  15299. "ldr r8, [%[b], #20]\n\t"
  15300. "umull r6, r8, r6, r8\n\t"
  15301. "adds r5, r5, r6\n\t"
  15302. "adcs r3, r3, r8\n\t"
  15303. "adc r4, r4, #0\n\t"
  15304. /* A[7] * B[4] */
  15305. "ldr r6, [%[a], #28]\n\t"
  15306. "ldr r8, [%[b], #16]\n\t"
  15307. "umull r6, r8, r6, r8\n\t"
  15308. "adds r5, r5, r6\n\t"
  15309. "adcs r3, r3, r8\n\t"
  15310. "adc r4, r4, #0\n\t"
  15311. "str r5, [%[r], #44]\n\t"
  15312. "mov r5, #0\n\t"
  15313. /* A[5] * B[7] */
  15314. "ldr r6, [%[a], #20]\n\t"
  15315. "ldr r8, [%[b], #28]\n\t"
  15316. "umull r6, r8, r6, r8\n\t"
  15317. "adds r3, r3, r6\n\t"
  15318. "adcs r4, r4, r8\n\t"
  15319. "adc r5, r5, #0\n\t"
  15320. /* A[6] * B[6] */
  15321. "ldr r6, [%[a], #24]\n\t"
  15322. "ldr r8, [%[b], #24]\n\t"
  15323. "umull r6, r8, r6, r8\n\t"
  15324. "adds r3, r3, r6\n\t"
  15325. "adcs r4, r4, r8\n\t"
  15326. "adc r5, r5, #0\n\t"
  15327. /* A[7] * B[5] */
  15328. "ldr r6, [%[a], #28]\n\t"
  15329. "ldr r8, [%[b], #20]\n\t"
  15330. "umull r6, r8, r6, r8\n\t"
  15331. "adds r3, r3, r6\n\t"
  15332. "adcs r4, r4, r8\n\t"
  15333. "adc r5, r5, #0\n\t"
  15334. "str r3, [%[r], #48]\n\t"
  15335. "mov r3, #0\n\t"
  15336. /* A[6] * B[7] */
  15337. "ldr r6, [%[a], #24]\n\t"
  15338. "ldr r8, [%[b], #28]\n\t"
  15339. "umull r6, r8, r6, r8\n\t"
  15340. "adds r4, r4, r6\n\t"
  15341. "adcs r5, r5, r8\n\t"
  15342. "adc r3, r3, #0\n\t"
  15343. /* A[7] * B[6] */
  15344. "ldr r6, [%[a], #28]\n\t"
  15345. "ldr r8, [%[b], #24]\n\t"
  15346. "umull r6, r8, r6, r8\n\t"
  15347. "adds r4, r4, r6\n\t"
  15348. "adcs r5, r5, r8\n\t"
  15349. "adc r3, r3, #0\n\t"
  15350. "str r4, [%[r], #52]\n\t"
  15351. "mov r4, #0\n\t"
  15352. /* A[7] * B[7] */
  15353. "ldr r6, [%[a], #28]\n\t"
  15354. "ldr r8, [%[b], #28]\n\t"
  15355. "umull r6, r8, r6, r8\n\t"
  15356. "adds r5, r5, r6\n\t"
  15357. "adc r3, r3, r8\n\t"
  15358. "str r5, [%[r], #56]\n\t"
  15359. "str r3, [%[r], #60]\n\t"
  15360. /* Transfer tmp to r */
  15361. "ldr r3, [%[tmp], #0]\n\t"
  15362. "ldr r4, [%[tmp], #4]\n\t"
  15363. "ldr r5, [%[tmp], #8]\n\t"
  15364. "ldr r6, [%[tmp], #12]\n\t"
  15365. "str r3, [%[r], #0]\n\t"
  15366. "str r4, [%[r], #4]\n\t"
  15367. "str r5, [%[r], #8]\n\t"
  15368. "str r6, [%[r], #12]\n\t"
  15369. "ldr r3, [%[tmp], #16]\n\t"
  15370. "ldr r4, [%[tmp], #20]\n\t"
  15371. "ldr r5, [%[tmp], #24]\n\t"
  15372. "ldr r6, [%[tmp], #28]\n\t"
  15373. "str r3, [%[r], #16]\n\t"
  15374. "str r4, [%[r], #20]\n\t"
  15375. "str r5, [%[r], #24]\n\t"
  15376. "str r6, [%[r], #28]\n\t"
  15377. :
  15378. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [tmp] "r" (tmp)
  15379. : "memory", "r3", "r4", "r5", "r6", "r8"
  15380. );
  15381. }
  15382. /* Square a and put result in r. (r = a * a)
  15383. *
  15384. * r A single precision integer.
  15385. * a A single precision integer.
  15386. */
  15387. SP_NOINLINE static void sp_256_sqr_8(sp_digit* r, const sp_digit* a)
  15388. {
  15389. sp_digit tmp_arr[8];
  15390. sp_digit* tmp = tmp_arr;
  15391. __asm__ __volatile__ (
  15392. /* A[0] * A[0] */
  15393. "ldr r6, [%[a], #0]\n\t"
  15394. "umull r3, r4, r6, r6\n\t"
  15395. "mov r5, #0\n\t"
  15396. "str r3, [%[tmp], #0]\n\t"
  15397. "mov r3, #0\n\t"
  15398. /* A[0] * A[1] */
  15399. "ldr r8, [%[a], #4]\n\t"
  15400. "umull r6, r8, r6, r8\n\t"
  15401. "adds r4, r4, r6\n\t"
  15402. "adc r5, r5, r8\n\t"
  15403. "adds r4, r4, r6\n\t"
  15404. "adcs r5, r5, r8\n\t"
  15405. "adc r3, r3, #0\n\t"
  15406. "str r4, [%[tmp], #4]\n\t"
  15407. "mov r4, #0\n\t"
  15408. /* A[0] * A[2] */
  15409. "ldr r6, [%[a], #0]\n\t"
  15410. "ldr r8, [%[a], #8]\n\t"
  15411. "umull r6, r8, r6, r8\n\t"
  15412. "adds r5, r5, r6\n\t"
  15413. "adc r3, r3, r8\n\t"
  15414. "adds r5, r5, r6\n\t"
  15415. "adcs r3, r3, r8\n\t"
  15416. "adc r4, r4, #0\n\t"
  15417. /* A[1] * A[1] */
  15418. "ldr r6, [%[a], #4]\n\t"
  15419. "umull r6, r8, r6, r6\n\t"
  15420. "adds r5, r5, r6\n\t"
  15421. "adcs r3, r3, r8\n\t"
  15422. "adc r4, r4, #0\n\t"
  15423. "str r5, [%[tmp], #8]\n\t"
  15424. "mov r5, #0\n\t"
  15425. /* A[0] * A[3] */
  15426. "ldr r6, [%[a], #0]\n\t"
  15427. "ldr r8, [%[a], #12]\n\t"
  15428. "umull r9, r10, r6, r8\n\t"
  15429. "mov r11, #0\n\t"
  15430. /* A[1] * A[2] */
  15431. "ldr r6, [%[a], #4]\n\t"
  15432. "ldr r8, [%[a], #8]\n\t"
  15433. "umull r6, r8, r6, r8\n\t"
  15434. "adds r9, r9, r6\n\t"
  15435. "adcs r10, r10, r8\n\t"
  15436. "adc r11, r11, #0\n\t"
  15437. "adds r9, r9, r9\n\t"
  15438. "adcs r10, r10, r10\n\t"
  15439. "adc r11, r11, r11\n\t"
  15440. "adds r3, r3, r9\n\t"
  15441. "adcs r4, r4, r10\n\t"
  15442. "adc r5, r5, r11\n\t"
  15443. "str r3, [%[tmp], #12]\n\t"
  15444. "mov r3, #0\n\t"
  15445. /* A[0] * A[4] */
  15446. "ldr r6, [%[a], #0]\n\t"
  15447. "ldr r8, [%[a], #16]\n\t"
  15448. "umull r9, r10, r6, r8\n\t"
  15449. "mov r11, #0\n\t"
  15450. /* A[1] * A[3] */
  15451. "ldr r6, [%[a], #4]\n\t"
  15452. "ldr r8, [%[a], #12]\n\t"
  15453. "umull r6, r8, r6, r8\n\t"
  15454. "adds r9, r9, r6\n\t"
  15455. "adcs r10, r10, r8\n\t"
  15456. "adc r11, r11, #0\n\t"
  15457. /* A[2] * A[2] */
  15458. "ldr r6, [%[a], #8]\n\t"
  15459. "umull r6, r8, r6, r6\n\t"
  15460. "adds r4, r4, r6\n\t"
  15461. "adcs r5, r5, r8\n\t"
  15462. "adc r3, r3, #0\n\t"
  15463. "adds r9, r9, r9\n\t"
  15464. "adcs r10, r10, r10\n\t"
  15465. "adc r11, r11, r11\n\t"
  15466. "adds r4, r4, r9\n\t"
  15467. "adcs r5, r5, r10\n\t"
  15468. "adc r3, r3, r11\n\t"
  15469. "str r4, [%[tmp], #16]\n\t"
  15470. "mov r4, #0\n\t"
  15471. /* A[0] * A[5] */
  15472. "ldr r6, [%[a], #0]\n\t"
  15473. "ldr r8, [%[a], #20]\n\t"
  15474. "umull r9, r10, r6, r8\n\t"
  15475. "mov r11, #0\n\t"
  15476. /* A[1] * A[4] */
  15477. "ldr r6, [%[a], #4]\n\t"
  15478. "ldr r8, [%[a], #16]\n\t"
  15479. "umull r6, r8, r6, r8\n\t"
  15480. "adds r9, r9, r6\n\t"
  15481. "adcs r10, r10, r8\n\t"
  15482. "adc r11, r11, #0\n\t"
  15483. /* A[2] * A[3] */
  15484. "ldr r6, [%[a], #8]\n\t"
  15485. "ldr r8, [%[a], #12]\n\t"
  15486. "umull r6, r8, r6, r8\n\t"
  15487. "adds r9, r9, r6\n\t"
  15488. "adcs r10, r10, r8\n\t"
  15489. "adc r11, r11, #0\n\t"
  15490. "adds r9, r9, r9\n\t"
  15491. "adcs r10, r10, r10\n\t"
  15492. "adc r11, r11, r11\n\t"
  15493. "adds r5, r5, r9\n\t"
  15494. "adcs r3, r3, r10\n\t"
  15495. "adc r4, r4, r11\n\t"
  15496. "str r5, [%[tmp], #20]\n\t"
  15497. "mov r5, #0\n\t"
  15498. /* A[0] * A[6] */
  15499. "ldr r6, [%[a], #0]\n\t"
  15500. "ldr r8, [%[a], #24]\n\t"
  15501. "umull r9, r10, r6, r8\n\t"
  15502. "mov r11, #0\n\t"
  15503. /* A[1] * A[5] */
  15504. "ldr r6, [%[a], #4]\n\t"
  15505. "ldr r8, [%[a], #20]\n\t"
  15506. "umull r6, r8, r6, r8\n\t"
  15507. "adds r9, r9, r6\n\t"
  15508. "adcs r10, r10, r8\n\t"
  15509. "adc r11, r11, #0\n\t"
  15510. /* A[2] * A[4] */
  15511. "ldr r6, [%[a], #8]\n\t"
  15512. "ldr r8, [%[a], #16]\n\t"
  15513. "umull r6, r8, r6, r8\n\t"
  15514. "adds r9, r9, r6\n\t"
  15515. "adcs r10, r10, r8\n\t"
  15516. "adc r11, r11, #0\n\t"
  15517. /* A[3] * A[3] */
  15518. "ldr r6, [%[a], #12]\n\t"
  15519. "umull r6, r8, r6, r6\n\t"
  15520. "adds r3, r3, r6\n\t"
  15521. "adcs r4, r4, r8\n\t"
  15522. "adc r5, r5, #0\n\t"
  15523. "adds r9, r9, r9\n\t"
  15524. "adcs r10, r10, r10\n\t"
  15525. "adc r11, r11, r11\n\t"
  15526. "adds r3, r3, r9\n\t"
  15527. "adcs r4, r4, r10\n\t"
  15528. "adc r5, r5, r11\n\t"
  15529. "str r3, [%[tmp], #24]\n\t"
  15530. "mov r3, #0\n\t"
  15531. /* A[0] * A[7] */
  15532. "ldr r6, [%[a], #0]\n\t"
  15533. "ldr r8, [%[a], #28]\n\t"
  15534. "umull r9, r10, r6, r8\n\t"
  15535. "mov r11, #0\n\t"
  15536. /* A[1] * A[6] */
  15537. "ldr r6, [%[a], #4]\n\t"
  15538. "ldr r8, [%[a], #24]\n\t"
  15539. "umull r6, r8, r6, r8\n\t"
  15540. "adds r9, r9, r6\n\t"
  15541. "adcs r10, r10, r8\n\t"
  15542. "adc r11, r11, #0\n\t"
  15543. /* A[2] * A[5] */
  15544. "ldr r6, [%[a], #8]\n\t"
  15545. "ldr r8, [%[a], #20]\n\t"
  15546. "umull r6, r8, r6, r8\n\t"
  15547. "adds r9, r9, r6\n\t"
  15548. "adcs r10, r10, r8\n\t"
  15549. "adc r11, r11, #0\n\t"
  15550. /* A[3] * A[4] */
  15551. "ldr r6, [%[a], #12]\n\t"
  15552. "ldr r8, [%[a], #16]\n\t"
  15553. "umull r6, r8, r6, r8\n\t"
  15554. "adds r9, r9, r6\n\t"
  15555. "adcs r10, r10, r8\n\t"
  15556. "adc r11, r11, #0\n\t"
  15557. "adds r9, r9, r9\n\t"
  15558. "adcs r10, r10, r10\n\t"
  15559. "adc r11, r11, r11\n\t"
  15560. "adds r4, r4, r9\n\t"
  15561. "adcs r5, r5, r10\n\t"
  15562. "adc r3, r3, r11\n\t"
  15563. "str r4, [%[tmp], #28]\n\t"
  15564. "mov r4, #0\n\t"
  15565. /* A[1] * A[7] */
  15566. "ldr r6, [%[a], #4]\n\t"
  15567. "ldr r8, [%[a], #28]\n\t"
  15568. "umull r9, r10, r6, r8\n\t"
  15569. "mov r11, #0\n\t"
  15570. /* A[2] * A[6] */
  15571. "ldr r6, [%[a], #8]\n\t"
  15572. "ldr r8, [%[a], #24]\n\t"
  15573. "umull r6, r8, r6, r8\n\t"
  15574. "adds r9, r9, r6\n\t"
  15575. "adcs r10, r10, r8\n\t"
  15576. "adc r11, r11, #0\n\t"
  15577. /* A[3] * A[5] */
  15578. "ldr r6, [%[a], #12]\n\t"
  15579. "ldr r8, [%[a], #20]\n\t"
  15580. "umull r6, r8, r6, r8\n\t"
  15581. "adds r9, r9, r6\n\t"
  15582. "adcs r10, r10, r8\n\t"
  15583. "adc r11, r11, #0\n\t"
  15584. /* A[4] * A[4] */
  15585. "ldr r6, [%[a], #16]\n\t"
  15586. "umull r6, r8, r6, r6\n\t"
  15587. "adds r5, r5, r6\n\t"
  15588. "adcs r3, r3, r8\n\t"
  15589. "adc r4, r4, #0\n\t"
  15590. "adds r9, r9, r9\n\t"
  15591. "adcs r10, r10, r10\n\t"
  15592. "adc r11, r11, r11\n\t"
  15593. "adds r5, r5, r9\n\t"
  15594. "adcs r3, r3, r10\n\t"
  15595. "adc r4, r4, r11\n\t"
  15596. "str r5, [%[r], #32]\n\t"
  15597. "mov r5, #0\n\t"
  15598. /* A[2] * A[7] */
  15599. "ldr r6, [%[a], #8]\n\t"
  15600. "ldr r8, [%[a], #28]\n\t"
  15601. "umull r9, r10, r6, r8\n\t"
  15602. "mov r11, #0\n\t"
  15603. /* A[3] * A[6] */
  15604. "ldr r6, [%[a], #12]\n\t"
  15605. "ldr r8, [%[a], #24]\n\t"
  15606. "umull r6, r8, r6, r8\n\t"
  15607. "adds r9, r9, r6\n\t"
  15608. "adcs r10, r10, r8\n\t"
  15609. "adc r11, r11, #0\n\t"
  15610. /* A[4] * A[5] */
  15611. "ldr r6, [%[a], #16]\n\t"
  15612. "ldr r8, [%[a], #20]\n\t"
  15613. "umull r6, r8, r6, r8\n\t"
  15614. "adds r9, r9, r6\n\t"
  15615. "adcs r10, r10, r8\n\t"
  15616. "adc r11, r11, #0\n\t"
  15617. "adds r9, r9, r9\n\t"
  15618. "adcs r10, r10, r10\n\t"
  15619. "adc r11, r11, r11\n\t"
  15620. "adds r3, r3, r9\n\t"
  15621. "adcs r4, r4, r10\n\t"
  15622. "adc r5, r5, r11\n\t"
  15623. "str r3, [%[r], #36]\n\t"
  15624. "mov r3, #0\n\t"
  15625. /* A[3] * A[7] */
  15626. "ldr r6, [%[a], #12]\n\t"
  15627. "ldr r8, [%[a], #28]\n\t"
  15628. "umull r9, r10, r6, r8\n\t"
  15629. "mov r11, #0\n\t"
  15630. /* A[4] * A[6] */
  15631. "ldr r6, [%[a], #16]\n\t"
  15632. "ldr r8, [%[a], #24]\n\t"
  15633. "umull r6, r8, r6, r8\n\t"
  15634. "adds r9, r9, r6\n\t"
  15635. "adcs r10, r10, r8\n\t"
  15636. "adc r11, r11, #0\n\t"
  15637. /* A[5] * A[5] */
  15638. "ldr r6, [%[a], #20]\n\t"
  15639. "umull r6, r8, r6, r6\n\t"
  15640. "adds r4, r4, r6\n\t"
  15641. "adcs r5, r5, r8\n\t"
  15642. "adc r3, r3, #0\n\t"
  15643. "adds r9, r9, r9\n\t"
  15644. "adcs r10, r10, r10\n\t"
  15645. "adc r11, r11, r11\n\t"
  15646. "adds r4, r4, r9\n\t"
  15647. "adcs r5, r5, r10\n\t"
  15648. "adc r3, r3, r11\n\t"
  15649. "str r4, [%[r], #40]\n\t"
  15650. "mov r4, #0\n\t"
  15651. /* A[4] * A[7] */
  15652. "ldr r6, [%[a], #16]\n\t"
  15653. "ldr r8, [%[a], #28]\n\t"
  15654. "umull r6, r8, r6, r8\n\t"
  15655. "adds r5, r5, r6\n\t"
  15656. "adcs r3, r3, r8\n\t"
  15657. "adc r4, r4, #0\n\t"
  15658. "adds r5, r5, r6\n\t"
  15659. "adcs r3, r3, r8\n\t"
  15660. "adc r4, r4, #0\n\t"
  15661. /* A[5] * A[6] */
  15662. "ldr r6, [%[a], #20]\n\t"
  15663. "ldr r8, [%[a], #24]\n\t"
  15664. "umull r6, r8, r6, r8\n\t"
  15665. "adds r5, r5, r6\n\t"
  15666. "adcs r3, r3, r8\n\t"
  15667. "adc r4, r4, #0\n\t"
  15668. "adds r5, r5, r6\n\t"
  15669. "adcs r3, r3, r8\n\t"
  15670. "adc r4, r4, #0\n\t"
  15671. "str r5, [%[r], #44]\n\t"
  15672. "mov r5, #0\n\t"
  15673. /* A[5] * A[7] */
  15674. "ldr r6, [%[a], #20]\n\t"
  15675. "ldr r8, [%[a], #28]\n\t"
  15676. "umull r6, r8, r6, r8\n\t"
  15677. "adds r3, r3, r6\n\t"
  15678. "adcs r4, r4, r8\n\t"
  15679. "adc r5, r5, #0\n\t"
  15680. "adds r3, r3, r6\n\t"
  15681. "adcs r4, r4, r8\n\t"
  15682. "adc r5, r5, #0\n\t"
  15683. /* A[6] * A[6] */
  15684. "ldr r6, [%[a], #24]\n\t"
  15685. "umull r6, r8, r6, r6\n\t"
  15686. "adds r3, r3, r6\n\t"
  15687. "adcs r4, r4, r8\n\t"
  15688. "adc r5, r5, #0\n\t"
  15689. "str r3, [%[r], #48]\n\t"
  15690. "mov r3, #0\n\t"
  15691. /* A[6] * A[7] */
  15692. "ldr r6, [%[a], #24]\n\t"
  15693. "ldr r8, [%[a], #28]\n\t"
  15694. "umull r6, r8, r6, r8\n\t"
  15695. "adds r4, r4, r6\n\t"
  15696. "adcs r5, r5, r8\n\t"
  15697. "adc r3, r3, #0\n\t"
  15698. "adds r4, r4, r6\n\t"
  15699. "adcs r5, r5, r8\n\t"
  15700. "adc r3, r3, #0\n\t"
  15701. "str r4, [%[r], #52]\n\t"
  15702. "mov r4, #0\n\t"
  15703. /* A[7] * A[7] */
  15704. "ldr r6, [%[a], #28]\n\t"
  15705. "umull r6, r8, r6, r6\n\t"
  15706. "adds r5, r5, r6\n\t"
  15707. "adc r3, r3, r8\n\t"
  15708. "str r5, [%[r], #56]\n\t"
  15709. "str r3, [%[r], #60]\n\t"
  15710. /* Transfer tmp to r */
  15711. "ldr r3, [%[tmp], #0]\n\t"
  15712. "ldr r4, [%[tmp], #4]\n\t"
  15713. "ldr r5, [%[tmp], #8]\n\t"
  15714. "ldr r6, [%[tmp], #12]\n\t"
  15715. "str r3, [%[r], #0]\n\t"
  15716. "str r4, [%[r], #4]\n\t"
  15717. "str r5, [%[r], #8]\n\t"
  15718. "str r6, [%[r], #12]\n\t"
  15719. "ldr r3, [%[tmp], #16]\n\t"
  15720. "ldr r4, [%[tmp], #20]\n\t"
  15721. "ldr r5, [%[tmp], #24]\n\t"
  15722. "ldr r6, [%[tmp], #28]\n\t"
  15723. "str r3, [%[r], #16]\n\t"
  15724. "str r4, [%[r], #20]\n\t"
  15725. "str r5, [%[r], #24]\n\t"
  15726. "str r6, [%[r], #28]\n\t"
  15727. :
  15728. : [r] "r" (r), [a] "r" (a), [tmp] "r" (tmp)
  15729. : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11"
  15730. );
  15731. }
  15732. #ifdef WOLFSSL_SP_SMALL
  15733. /* Add b to a into r. (r = a + b)
  15734. *
  15735. * r A single precision integer.
  15736. * a A single precision integer.
  15737. * b A single precision integer.
  15738. */
  15739. SP_NOINLINE static sp_digit sp_256_add_8(sp_digit* r, const sp_digit* a,
  15740. const sp_digit* b)
  15741. {
  15742. sp_digit c = 0;
  15743. __asm__ __volatile__ (
  15744. "mov r6, %[a]\n\t"
  15745. "mov r8, #0\n\t"
  15746. "add r6, r6, #32\n\t"
  15747. "sub r8, r8, #1\n\t"
  15748. "\n1:\n\t"
  15749. "adds %[c], %[c], r8\n\t"
  15750. "ldr r4, [%[a]]\n\t"
  15751. "ldr r5, [%[b]]\n\t"
  15752. "adcs r4, r4, r5\n\t"
  15753. "str r4, [%[r]]\n\t"
  15754. "mov %[c], #0\n\t"
  15755. "adc %[c], %[c], %[c]\n\t"
  15756. "add %[a], %[a], #4\n\t"
  15757. "add %[b], %[b], #4\n\t"
  15758. "add %[r], %[r], #4\n\t"
  15759. "cmp %[a], r6\n\t"
  15760. #ifdef __GNUC__
  15761. "bne 1b\n\t"
  15762. #else
  15763. "bne.n 1b\n\t"
  15764. #endif /* __GNUC__ */
  15765. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  15766. :
  15767. : "memory", "r4", "r5", "r6", "r8"
  15768. );
  15769. return c;
  15770. }
  15771. #else
  15772. /* Add b to a into r. (r = a + b)
  15773. *
  15774. * r A single precision integer.
  15775. * a A single precision integer.
  15776. * b A single precision integer.
  15777. */
  15778. SP_NOINLINE static sp_digit sp_256_add_8(sp_digit* r, const sp_digit* a,
  15779. const sp_digit* b)
  15780. {
  15781. sp_digit c = 0;
  15782. __asm__ __volatile__ (
  15783. "ldm %[a]!, {r4, r5}\n\t"
  15784. "ldm %[b]!, {r6, r8}\n\t"
  15785. "adds r4, r4, r6\n\t"
  15786. "adcs r5, r5, r8\n\t"
  15787. "stm %[r]!, {r4, r5}\n\t"
  15788. "ldm %[a]!, {r4, r5}\n\t"
  15789. "ldm %[b]!, {r6, r8}\n\t"
  15790. "adcs r4, r4, r6\n\t"
  15791. "adcs r5, r5, r8\n\t"
  15792. "stm %[r]!, {r4, r5}\n\t"
  15793. "ldm %[a]!, {r4, r5}\n\t"
  15794. "ldm %[b]!, {r6, r8}\n\t"
  15795. "adcs r4, r4, r6\n\t"
  15796. "adcs r5, r5, r8\n\t"
  15797. "stm %[r]!, {r4, r5}\n\t"
  15798. "ldm %[a]!, {r4, r5}\n\t"
  15799. "ldm %[b]!, {r6, r8}\n\t"
  15800. "adcs r4, r4, r6\n\t"
  15801. "adcs r5, r5, r8\n\t"
  15802. "stm %[r]!, {r4, r5}\n\t"
  15803. "mov %[c], #0\n\t"
  15804. "adc %[c], %[c], %[c]\n\t"
  15805. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  15806. :
  15807. : "memory", "r4", "r5", "r6", "r8"
  15808. );
  15809. return c;
  15810. }
  15811. #endif /* WOLFSSL_SP_SMALL */
  15812. #ifdef WOLFSSL_SP_SMALL
  15813. /* Sub b from a into r. (r = a - b)
  15814. *
  15815. * r A single precision integer.
  15816. * a A single precision integer.
  15817. * b A single precision integer.
  15818. */
  15819. SP_NOINLINE static sp_digit sp_256_sub_8(sp_digit* r, const sp_digit* a,
  15820. const sp_digit* b)
  15821. {
  15822. sp_digit c = 0;
  15823. __asm__ __volatile__ (
  15824. "mov r6, %[a]\n\t"
  15825. "add r6, r6, #32\n\t"
  15826. "\n1:\n\t"
  15827. "mov r5, #0\n\t"
  15828. "subs r5, r5, %[c]\n\t"
  15829. "ldr r4, [%[a]]\n\t"
  15830. "ldr r5, [%[b]]\n\t"
  15831. "sbcs r4, r4, r5\n\t"
  15832. "str r4, [%[r]]\n\t"
  15833. "sbc %[c], %[c], %[c]\n\t"
  15834. "add %[a], %[a], #4\n\t"
  15835. "add %[b], %[b], #4\n\t"
  15836. "add %[r], %[r], #4\n\t"
  15837. "cmp %[a], r6\n\t"
  15838. #ifdef __GNUC__
  15839. "bne 1b\n\t"
  15840. #else
  15841. "bne.n 1b\n\t"
  15842. #endif /* __GNUC__ */
  15843. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  15844. :
  15845. : "memory", "r4", "r5", "r6"
  15846. );
  15847. return c;
  15848. }
  15849. #else
  15850. /* Sub b from a into r. (r = a - b)
  15851. *
  15852. * r A single precision integer.
  15853. * a A single precision integer.
  15854. * b A single precision integer.
  15855. */
  15856. SP_NOINLINE static sp_digit sp_256_sub_8(sp_digit* r, const sp_digit* a,
  15857. const sp_digit* b)
  15858. {
  15859. sp_digit c = 0;
  15860. __asm__ __volatile__ (
  15861. "ldm %[a]!, {r4, r5}\n\t"
  15862. "ldm %[b]!, {r6, r8}\n\t"
  15863. "subs r4, r4, r6\n\t"
  15864. "sbcs r5, r5, r8\n\t"
  15865. "stm %[r]!, {r4, r5}\n\t"
  15866. "ldm %[a]!, {r4, r5}\n\t"
  15867. "ldm %[b]!, {r6, r8}\n\t"
  15868. "sbcs r4, r4, r6\n\t"
  15869. "sbcs r5, r5, r8\n\t"
  15870. "stm %[r]!, {r4, r5}\n\t"
  15871. "ldm %[a]!, {r4, r5}\n\t"
  15872. "ldm %[b]!, {r6, r8}\n\t"
  15873. "sbcs r4, r4, r6\n\t"
  15874. "sbcs r5, r5, r8\n\t"
  15875. "stm %[r]!, {r4, r5}\n\t"
  15876. "ldm %[a]!, {r4, r5}\n\t"
  15877. "ldm %[b]!, {r6, r8}\n\t"
  15878. "sbcs r4, r4, r6\n\t"
  15879. "sbcs r5, r5, r8\n\t"
  15880. "stm %[r]!, {r4, r5}\n\t"
  15881. "sbc %[c], %[c], %[c]\n\t"
  15882. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  15883. :
  15884. : "memory", "r4", "r5", "r6", "r8"
  15885. );
  15886. return c;
  15887. }
  15888. #endif /* WOLFSSL_SP_SMALL */
  15889. /* Multiply a number by Montgomery normalizer mod modulus (prime).
  15890. *
  15891. * r The resulting Montgomery form number.
  15892. * a The number to convert.
  15893. * m The modulus (prime).
  15894. */
  15895. static int sp_256_mod_mul_norm_8(sp_digit* r, const sp_digit* a, const sp_digit* m)
  15896. {
  15897. (void)m;
  15898. __asm__ __volatile__ (
  15899. "sub sp, sp, #24\n\t"
  15900. "ldr r2, [%[a], #0]\n\t"
  15901. "ldr r3, [%[a], #4]\n\t"
  15902. "ldr r4, [%[a], #8]\n\t"
  15903. "ldr r5, [%[a], #12]\n\t"
  15904. "ldr r6, [%[a], #16]\n\t"
  15905. "ldr r8, [%[a], #20]\n\t"
  15906. "ldr r9, [%[a], #24]\n\t"
  15907. "ldr r10, [%[a], #28]\n\t"
  15908. /* Clear overflow and underflow */
  15909. "mov r14, #0\n\t"
  15910. "mov r12, #0\n\t"
  15911. /* t[0] = 1 1 0 -1 -1 -1 -1 0 */
  15912. "adds r11, r2, r3\n\t"
  15913. "adc r14, r14, #0\n\t"
  15914. "subs r11, r11, r5\n\t"
  15915. "sbc r12, r12, #0\n\t"
  15916. "subs r11, r11, r6\n\t"
  15917. "sbc r12, r12, #0\n\t"
  15918. "subs r11, r11, r8\n\t"
  15919. "sbc r12, r12, #0\n\t"
  15920. "subs r11, r11, r9\n\t"
  15921. "sbc r12, r12, #0\n\t"
  15922. /* Store t[0] */
  15923. "str r11, [sp, #0]\n\t"
  15924. "neg r12, r12\n\t"
  15925. "mov r11, #0\n\t"
  15926. /* t[1] = 0 1 1 0 -1 -1 -1 -1 */
  15927. "adds r14, r14, r3\n\t"
  15928. "adc r11, r11, #0\n\t"
  15929. "adds r14, r14, r4\n\t"
  15930. "adc r11, r11, #0\n\t"
  15931. "subs r14, r14, r12\n\t"
  15932. "mov r12, #0\n\t"
  15933. "sbc r12, r12, #0\n\t"
  15934. "subs r14, r14, r6\n\t"
  15935. "sbc r12, r12, #0\n\t"
  15936. "subs r14, r14, r8\n\t"
  15937. "sbc r12, r12, #0\n\t"
  15938. "subs r14, r14, r9\n\t"
  15939. "sbc r12, r12, #0\n\t"
  15940. "subs r14, r14, r10\n\t"
  15941. "sbc r12, r12, #0\n\t"
  15942. /* Store t[1] */
  15943. "str r14, [sp, #4]\n\t"
  15944. "neg r12, r12\n\t"
  15945. "mov r14, #0\n\t"
  15946. /* t[2] = 0 0 1 1 0 -1 -1 -1 */
  15947. "adds r11, r11, r4\n\t"
  15948. "adc r14, r14, #0\n\t"
  15949. "adds r11, r11, r5\n\t"
  15950. "adc r14, r14, #0\n\t"
  15951. "subs r11, r11, r12\n\t"
  15952. "mov r12, #0\n\t"
  15953. "sbc r12, r12, #0\n\t"
  15954. "subs r11, r11, r8\n\t"
  15955. "sbc r12, r12, #0\n\t"
  15956. "subs r11, r11, r9\n\t"
  15957. "sbc r12, r12, #0\n\t"
  15958. "subs r11, r11, r10\n\t"
  15959. "sbc r12, r12, #0\n\t"
  15960. /* Store t[2] */
  15961. "str r11, [sp, #8]\n\t"
  15962. "neg r12, r12\n\t"
  15963. "mov r11, #0\n\t"
  15964. /* t[3] = -1 -1 0 2 2 1 0 -1 */
  15965. "adds r14, r14, r5\n\t"
  15966. "adc r11, r11, #0\n\t"
  15967. "adds r14, r14, r5\n\t"
  15968. "adc r11, r11, #0\n\t"
  15969. "adds r14, r14, r6\n\t"
  15970. "adc r11, r11, #0\n\t"
  15971. "adds r14, r14, r6\n\t"
  15972. "adc r11, r11, #0\n\t"
  15973. "adds r14, r14, r8\n\t"
  15974. "adc r11, r11, #0\n\t"
  15975. "subs r14, r14, r12\n\t"
  15976. "mov r12, #0\n\t"
  15977. "sbc r12, r12, #0\n\t"
  15978. "subs r14, r14, r2\n\t"
  15979. "sbc r12, r12, #0\n\t"
  15980. "subs r14, r14, r3\n\t"
  15981. "sbc r12, r12, #0\n\t"
  15982. "subs r14, r14, r10\n\t"
  15983. "sbc r12, r12, #0\n\t"
  15984. /* Store t[3] */
  15985. "str r14, [sp, #12]\n\t"
  15986. "neg r12, r12\n\t"
  15987. "mov r14, #0\n\t"
  15988. /* t[4] = 0 -1 -1 0 2 2 1 0 */
  15989. "adds r11, r11, r6\n\t"
  15990. "adc r14, r14, #0\n\t"
  15991. "adds r11, r11, r6\n\t"
  15992. "adc r14, r14, #0\n\t"
  15993. "adds r11, r11, r8\n\t"
  15994. "adc r14, r14, #0\n\t"
  15995. "adds r11, r11, r8\n\t"
  15996. "adc r14, r14, #0\n\t"
  15997. "adds r11, r11, r9\n\t"
  15998. "adc r14, r14, #0\n\t"
  15999. "subs r11, r11, r12\n\t"
  16000. "mov r12, #0\n\t"
  16001. "sbc r12, r12, #0\n\t"
  16002. "subs r11, r11, r3\n\t"
  16003. "sbc r12, r12, #0\n\t"
  16004. "subs r11, r11, r4\n\t"
  16005. "sbc r12, r12, #0\n\t"
  16006. /* Store t[4] */
  16007. "str r11, [sp, #16]\n\t"
  16008. "neg r12, r12\n\t"
  16009. "mov r11, #0\n\t"
  16010. /* t[5] = 0 0 -1 -1 0 2 2 1 */
  16011. "adds r14, r14, r8\n\t"
  16012. "adc r11, r11, #0\n\t"
  16013. "adds r14, r14, r8\n\t"
  16014. "adc r11, r11, #0\n\t"
  16015. "adds r14, r14, r9\n\t"
  16016. "adc r11, r11, #0\n\t"
  16017. "adds r14, r14, r9\n\t"
  16018. "adc r11, r11, #0\n\t"
  16019. "adds r14, r14, r10\n\t"
  16020. "adc r11, r11, #0\n\t"
  16021. "subs r14, r14, r12\n\t"
  16022. "mov r12, #0\n\t"
  16023. "sbc r12, r12, #0\n\t"
  16024. "subs r14, r14, r4\n\t"
  16025. "sbc r12, r12, #0\n\t"
  16026. "subs r14, r14, r5\n\t"
  16027. "sbc r12, r12, #0\n\t"
  16028. /* Store t[5] */
  16029. "str r14, [sp, #20]\n\t"
  16030. "neg r12, r12\n\t"
  16031. "mov r14, #0\n\t"
  16032. /* t[6] = -1 -1 0 0 0 1 3 2 */
  16033. "adds r11, r11, r8\n\t"
  16034. "adc r14, r14, #0\n\t"
  16035. "adds r11, r11, r9\n\t"
  16036. "adc r14, r14, #0\n\t"
  16037. "adds r11, r11, r9\n\t"
  16038. "adc r14, r14, #0\n\t"
  16039. "adds r11, r11, r9\n\t"
  16040. "adc r14, r14, #0\n\t"
  16041. "adds r11, r11, r10\n\t"
  16042. "adc r14, r14, #0\n\t"
  16043. "adds r11, r11, r10\n\t"
  16044. "adc r14, r14, #0\n\t"
  16045. "subs r11, r11, r12\n\t"
  16046. "mov r12, #0\n\t"
  16047. "sbc r12, r12, #0\n\t"
  16048. "subs r11, r11, r2\n\t"
  16049. "sbc r12, r12, #0\n\t"
  16050. "subs r11, r11, r3\n\t"
  16051. "sbc r12, r12, #0\n\t"
  16052. /* Store t[6] */
  16053. "mov r9, r11\n\t"
  16054. "neg r12, r12\n\t"
  16055. "mov r11, #0\n\t"
  16056. /* t[7] = 1 0 -1 -1 -1 -1 0 3 */
  16057. "adds r14, r14, r2\n\t"
  16058. "adc r11, r11, #0\n\t"
  16059. "adds r14, r14, r10\n\t"
  16060. "adc r11, r11, #0\n\t"
  16061. "adds r14, r14, r10\n\t"
  16062. "adc r11, r11, #0\n\t"
  16063. "adds r14, r14, r10\n\t"
  16064. "adc r11, r11, #0\n\t"
  16065. "subs r14, r14, r12\n\t"
  16066. "mov r12, #0\n\t"
  16067. "sbc r12, r12, #0\n\t"
  16068. "subs r14, r14, r4\n\t"
  16069. "sbc r12, r12, #0\n\t"
  16070. "subs r14, r14, r5\n\t"
  16071. "sbc r12, r12, #0\n\t"
  16072. "subs r14, r14, r6\n\t"
  16073. "sbc r12, r12, #0\n\t"
  16074. "subs r14, r14, r8\n\t"
  16075. "sbc r12, r12, #0\n\t"
  16076. /* Store t[7] */
  16077. /* Load intermediate */
  16078. "ldr r2, [sp, #0]\n\t"
  16079. "ldr r3, [sp, #4]\n\t"
  16080. "ldr r4, [sp, #8]\n\t"
  16081. "ldr r5, [sp, #12]\n\t"
  16082. "ldr r6, [sp, #16]\n\t"
  16083. "ldr r8, [sp, #20]\n\t"
  16084. "neg r12, r12\n\t"
  16085. /* Add overflow */
  16086. /* Subtract underflow - add neg underflow */
  16087. "adds r2, r2, r11\n\t"
  16088. "adcs r3, r3, #0\n\t"
  16089. "adcs r4, r4, #0\n\t"
  16090. "adds r5, r5, r12\n\t"
  16091. "adcs r6, r6, #0\n\t"
  16092. "adcs r8, r8, #0\n\t"
  16093. "adcs r9, r9, r12\n\t"
  16094. "adc r14, r14, r11\n\t"
  16095. /* Subtract overflow */
  16096. /* Add underflow - subtract neg underflow */
  16097. "subs r2, r2, r12\n\t"
  16098. "sbcs r3, r3, #0\n\t"
  16099. "sbcs r4, r4, #0\n\t"
  16100. "subs r5, r5, r11\n\t"
  16101. "sbcs r6, r6, #0\n\t"
  16102. "sbcs r8, r8, #0\n\t"
  16103. "sbcs r9, r9, r11\n\t"
  16104. "sbc r14, r14, r12\n\t"
  16105. /* Store result */
  16106. "str r2, [%[r], #0]\n\t"
  16107. "str r3, [%[r], #4]\n\t"
  16108. "str r4, [%[r], #8]\n\t"
  16109. "str r5, [%[r], #12]\n\t"
  16110. "str r6, [%[r], #16]\n\t"
  16111. "str r8, [%[r], #20]\n\t"
  16112. "str r9, [%[r], #24]\n\t"
  16113. "str r14, [%[r], #28]\n\t"
  16114. "add sp, sp, #24\n\t"
  16115. :
  16116. : [r] "r" (r), [a] "r" (a)
  16117. : "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r14", "r12"
  16118. );
  16119. return MP_OKAY;
  16120. }
  16121. /* Convert an mp_int to an array of sp_digit.
  16122. *
  16123. * r A single precision integer.
  16124. * size Maximum number of bytes to convert
  16125. * a A multi-precision integer.
  16126. */
  16127. static void sp_256_from_mp(sp_digit* r, int size, const mp_int* a)
  16128. {
  16129. #if DIGIT_BIT == 32
  16130. int j;
  16131. XMEMCPY(r, a->dp, sizeof(sp_digit) * a->used);
  16132. for (j = a->used; j < size; j++) {
  16133. r[j] = 0;
  16134. }
  16135. #elif DIGIT_BIT > 32
  16136. int i;
  16137. int j = 0;
  16138. word32 s = 0;
  16139. r[0] = 0;
  16140. for (i = 0; i < a->used && j < size; i++) {
  16141. r[j] |= ((sp_digit)a->dp[i] << s);
  16142. r[j] &= 0xffffffff;
  16143. s = 32U - s;
  16144. if (j + 1 >= size) {
  16145. break;
  16146. }
  16147. /* lint allow cast of mismatch word32 and mp_digit */
  16148. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  16149. while ((s + 32U) <= (word32)DIGIT_BIT) {
  16150. s += 32U;
  16151. r[j] &= 0xffffffff;
  16152. if (j + 1 >= size) {
  16153. break;
  16154. }
  16155. if (s < (word32)DIGIT_BIT) {
  16156. /* lint allow cast of mismatch word32 and mp_digit */
  16157. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  16158. }
  16159. else {
  16160. r[++j] = (sp_digit)0;
  16161. }
  16162. }
  16163. s = (word32)DIGIT_BIT - s;
  16164. }
  16165. for (j++; j < size; j++) {
  16166. r[j] = 0;
  16167. }
  16168. #else
  16169. int i;
  16170. int j = 0;
  16171. int s = 0;
  16172. r[0] = 0;
  16173. for (i = 0; i < a->used && j < size; i++) {
  16174. r[j] |= ((sp_digit)a->dp[i]) << s;
  16175. if (s + DIGIT_BIT >= 32) {
  16176. r[j] &= 0xffffffff;
  16177. if (j + 1 >= size) {
  16178. break;
  16179. }
  16180. s = 32 - s;
  16181. if (s == DIGIT_BIT) {
  16182. r[++j] = 0;
  16183. s = 0;
  16184. }
  16185. else {
  16186. r[++j] = a->dp[i] >> s;
  16187. s = DIGIT_BIT - s;
  16188. }
  16189. }
  16190. else {
  16191. s += DIGIT_BIT;
  16192. }
  16193. }
  16194. for (j++; j < size; j++) {
  16195. r[j] = 0;
  16196. }
  16197. #endif
  16198. }
  16199. /* Convert a point of type ecc_point to type sp_point_256.
  16200. *
  16201. * p Point of type sp_point_256 (result).
  16202. * pm Point of type ecc_point.
  16203. */
  16204. static void sp_256_point_from_ecc_point_8(sp_point_256* p,
  16205. const ecc_point* pm)
  16206. {
  16207. XMEMSET(p->x, 0, sizeof(p->x));
  16208. XMEMSET(p->y, 0, sizeof(p->y));
  16209. XMEMSET(p->z, 0, sizeof(p->z));
  16210. sp_256_from_mp(p->x, 8, pm->x);
  16211. sp_256_from_mp(p->y, 8, pm->y);
  16212. sp_256_from_mp(p->z, 8, pm->z);
  16213. p->infinity = 0;
  16214. }
  16215. /* Convert an array of sp_digit to an mp_int.
  16216. *
  16217. * a A single precision integer.
  16218. * r A multi-precision integer.
  16219. */
  16220. static int sp_256_to_mp(const sp_digit* a, mp_int* r)
  16221. {
  16222. int err;
  16223. err = mp_grow(r, (256 + DIGIT_BIT - 1) / DIGIT_BIT);
  16224. if (err == MP_OKAY) { /*lint !e774 case where err is always MP_OKAY*/
  16225. #if DIGIT_BIT == 32
  16226. XMEMCPY(r->dp, a, sizeof(sp_digit) * 8);
  16227. r->used = 8;
  16228. mp_clamp(r);
  16229. #elif DIGIT_BIT < 32
  16230. int i;
  16231. int j = 0;
  16232. int s = 0;
  16233. r->dp[0] = 0;
  16234. for (i = 0; i < 8; i++) {
  16235. r->dp[j] |= (mp_digit)(a[i] << s);
  16236. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  16237. s = DIGIT_BIT - s;
  16238. r->dp[++j] = (mp_digit)(a[i] >> s);
  16239. while (s + DIGIT_BIT <= 32) {
  16240. s += DIGIT_BIT;
  16241. r->dp[j++] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  16242. if (s == SP_WORD_SIZE) {
  16243. r->dp[j] = 0;
  16244. }
  16245. else {
  16246. r->dp[j] = (mp_digit)(a[i] >> s);
  16247. }
  16248. }
  16249. s = 32 - s;
  16250. }
  16251. r->used = (256 + DIGIT_BIT - 1) / DIGIT_BIT;
  16252. mp_clamp(r);
  16253. #else
  16254. int i;
  16255. int j = 0;
  16256. int s = 0;
  16257. r->dp[0] = 0;
  16258. for (i = 0; i < 8; i++) {
  16259. r->dp[j] |= ((mp_digit)a[i]) << s;
  16260. if (s + 32 >= DIGIT_BIT) {
  16261. #if DIGIT_BIT != 32 && DIGIT_BIT != 64
  16262. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  16263. #endif
  16264. s = DIGIT_BIT - s;
  16265. r->dp[++j] = a[i] >> s;
  16266. s = 32 - s;
  16267. }
  16268. else {
  16269. s += 32;
  16270. }
  16271. }
  16272. r->used = (256 + DIGIT_BIT - 1) / DIGIT_BIT;
  16273. mp_clamp(r);
  16274. #endif
  16275. }
  16276. return err;
  16277. }
  16278. /* Convert a point of type sp_point_256 to type ecc_point.
  16279. *
  16280. * p Point of type sp_point_256.
  16281. * pm Point of type ecc_point (result).
  16282. * returns MEMORY_E when allocation of memory in ecc_point fails otherwise
  16283. * MP_OKAY.
  16284. */
  16285. static int sp_256_point_to_ecc_point_8(const sp_point_256* p, ecc_point* pm)
  16286. {
  16287. int err;
  16288. err = sp_256_to_mp(p->x, pm->x);
  16289. if (err == MP_OKAY) {
  16290. err = sp_256_to_mp(p->y, pm->y);
  16291. }
  16292. if (err == MP_OKAY) {
  16293. err = sp_256_to_mp(p->z, pm->z);
  16294. }
  16295. return err;
  16296. }
  16297. /* Multiply two Montgomery form numbers mod the modulus (prime).
  16298. * (r = a * b mod m)
  16299. * The 8x8-word product is built column by column on the stack and then reduced in place; see the step comments below.
  16300. * r Result of multiplication.
  16301. * a First number to multiply in Montgomery form.
  16302. * b Second number to multiply in Montgomery form.
  16303. * m Modulus (prime). Not read by this implementation (cast to void).
  16304. * mp Montgomery multiplier. Not read by this implementation (cast to void).
  16305. */
  16306. SP_NOINLINE static void sp_256_mont_mul_8(sp_digit* r, const sp_digit* a, const sp_digit* b,
  16307. const sp_digit* m, sp_digit mp)
  16308. {
  16309. (void)mp;
  16310. (void)m;
  16311. __asm__ __volatile__ (
  16312. "sub sp, sp, #68\n\t" /* 68 bytes of scratch: product words at [sp,#0..#60], one temporary at [sp,#64] */
  16313. "mov r5, #0\n\t" /* r5 stays 0 through the multiply; used to fold carries with adc */
  16314. /* A[0] * B[0] */
  16315. "ldr r6, [%[a], #0]\n\t"
  16316. "ldr r8, [%[b], #0]\n\t"
  16317. "umull r9, r10, r6, r8\n\t"
  16318. "str r9, [sp, #0]\n\t" /* product word 0 */
  16319. /* A[0] * B[1] */
  16320. "ldr r6, [%[a], #0]\n\t"
  16321. "ldr r8, [%[b], #4]\n\t"
  16322. "umull r3, r4, r6, r8\n\t"
  16323. "adds r10, r3, r10\n\t"
  16324. "adc r11, r4, #0\n\t"
  16325. /* A[1] * B[0] */
  16326. "ldr r6, [%[a], #4]\n\t"
  16327. "ldr r8, [%[b], #0]\n\t"
  16328. "umull r3, r4, r6, r8\n\t"
  16329. "adds r10, r3, r10\n\t"
  16330. "adcs r11, r4, r11\n\t"
  16331. "adc r14, r5, #0\n\t"
  16332. "str r10, [sp, #4]\n\t" /* product word 1 */
  16333. /* A[0] * B[2] */
  16334. "ldr r6, [%[a], #0]\n\t"
  16335. "ldr r8, [%[b], #8]\n\t"
  16336. "umull r3, r4, r6, r8\n\t"
  16337. "adds r11, r3, r11\n\t"
  16338. "adc r14, r4, r14\n\t"
  16339. /* A[1] * B[1] */
  16340. "ldr r6, [%[a], #4]\n\t"
  16341. "ldr r8, [%[b], #4]\n\t"
  16342. "umull r3, r4, r6, r8\n\t"
  16343. "adds r11, r3, r11\n\t"
  16344. "adcs r14, r4, r14\n\t"
  16345. "adc r9, r5, #0\n\t"
  16346. /* A[2] * B[0] */
  16347. "ldr r6, [%[a], #8]\n\t"
  16348. "ldr r8, [%[b], #0]\n\t"
  16349. "umull r3, r4, r6, r8\n\t"
  16350. "adds r11, r3, r11\n\t"
  16351. "adcs r14, r4, r14\n\t"
  16352. "adc r9, r5, r9\n\t"
  16353. "str r11, [sp, #8]\n\t" /* product word 2 */
  16354. /* A[0] * B[3] */
  16355. "ldr r6, [%[a], #0]\n\t"
  16356. "ldr r8, [%[b], #12]\n\t"
  16357. "umull r3, r4, r6, r8\n\t"
  16358. "adds r14, r3, r14\n\t"
  16359. "adcs r9, r4, r9\n\t"
  16360. "adc r10, r5, #0\n\t"
  16361. /* A[1] * B[2] */
  16362. "ldr r6, [%[a], #4]\n\t"
  16363. "ldr r8, [%[b], #8]\n\t"
  16364. "umull r3, r4, r6, r8\n\t"
  16365. "adds r14, r3, r14\n\t"
  16366. "adcs r9, r4, r9\n\t"
  16367. "adc r10, r5, r10\n\t"
  16368. /* A[2] * B[1] */
  16369. "ldr r6, [%[a], #8]\n\t"
  16370. "ldr r8, [%[b], #4]\n\t"
  16371. "umull r3, r4, r6, r8\n\t"
  16372. "adds r14, r3, r14\n\t"
  16373. "adcs r9, r4, r9\n\t"
  16374. "adc r10, r5, r10\n\t"
  16375. /* A[3] * B[0] */
  16376. "ldr r6, [%[a], #12]\n\t"
  16377. "ldr r8, [%[b], #0]\n\t"
  16378. "umull r3, r4, r6, r8\n\t"
  16379. "adds r14, r3, r14\n\t"
  16380. "adcs r9, r4, r9\n\t"
  16381. "adc r10, r5, r10\n\t"
  16382. "str r14, [sp, #12]\n\t" /* product word 3 */
  16383. /* A[0] * B[4] */
  16384. "ldr r6, [%[a], #0]\n\t"
  16385. "ldr r8, [%[b], #16]\n\t"
  16386. "umull r3, r4, r6, r8\n\t"
  16387. "adds r9, r3, r9\n\t"
  16388. "adcs r10, r4, r10\n\t"
  16389. "adc r11, r5, #0\n\t"
  16390. /* A[1] * B[3] */
  16391. "ldr r6, [%[a], #4]\n\t"
  16392. "ldr r8, [%[b], #12]\n\t"
  16393. "umull r3, r4, r6, r8\n\t"
  16394. "adds r9, r3, r9\n\t"
  16395. "adcs r10, r4, r10\n\t"
  16396. "adc r11, r5, r11\n\t"
  16397. /* A[2] * B[2] */
  16398. "ldr r6, [%[a], #8]\n\t"
  16399. "ldr r8, [%[b], #8]\n\t"
  16400. "umull r3, r4, r6, r8\n\t"
  16401. "adds r9, r3, r9\n\t"
  16402. "adcs r10, r4, r10\n\t"
  16403. "adc r11, r5, r11\n\t"
  16404. /* A[3] * B[1] */
  16405. "ldr r6, [%[a], #12]\n\t"
  16406. "ldr r8, [%[b], #4]\n\t"
  16407. "umull r3, r4, r6, r8\n\t"
  16408. "adds r9, r3, r9\n\t"
  16409. "adcs r10, r4, r10\n\t"
  16410. "adc r11, r5, r11\n\t"
  16411. /* A[4] * B[0] */
  16412. "ldr r6, [%[a], #16]\n\t"
  16413. "ldr r8, [%[b], #0]\n\t"
  16414. "umull r3, r4, r6, r8\n\t"
  16415. "adds r9, r3, r9\n\t"
  16416. "adcs r10, r4, r10\n\t"
  16417. "adc r11, r5, r11\n\t"
  16418. "str r9, [sp, #16]\n\t" /* product word 4 */
  16419. /* A[0] * B[5] */
  16420. "ldr r6, [%[a], #0]\n\t"
  16421. "ldr r8, [%[b], #20]\n\t"
  16422. "umull r3, r4, r6, r8\n\t"
  16423. "adds r10, r3, r10\n\t"
  16424. "adcs r11, r4, r11\n\t"
  16425. "adc r14, r5, #0\n\t"
  16426. /* A[1] * B[4] */
  16427. "ldr r6, [%[a], #4]\n\t"
  16428. "ldr r8, [%[b], #16]\n\t"
  16429. "umull r3, r4, r6, r8\n\t"
  16430. "adds r10, r3, r10\n\t"
  16431. "adcs r11, r4, r11\n\t"
  16432. "adc r14, r5, r14\n\t"
  16433. /* A[2] * B[3] */
  16434. "ldr r6, [%[a], #8]\n\t"
  16435. "ldr r8, [%[b], #12]\n\t"
  16436. "umull r3, r4, r6, r8\n\t"
  16437. "adds r10, r3, r10\n\t"
  16438. "adcs r11, r4, r11\n\t"
  16439. "adc r14, r5, r14\n\t"
  16440. /* A[3] * B[2] */
  16441. "ldr r6, [%[a], #12]\n\t"
  16442. "ldr r8, [%[b], #8]\n\t"
  16443. "umull r3, r4, r6, r8\n\t"
  16444. "adds r10, r3, r10\n\t"
  16445. "adcs r11, r4, r11\n\t"
  16446. "adc r14, r5, r14\n\t"
  16447. /* A[4] * B[1] */
  16448. "ldr r6, [%[a], #16]\n\t"
  16449. "ldr r8, [%[b], #4]\n\t"
  16450. "umull r3, r4, r6, r8\n\t"
  16451. "adds r10, r3, r10\n\t"
  16452. "adcs r11, r4, r11\n\t"
  16453. "adc r14, r5, r14\n\t"
  16454. /* A[5] * B[0] */
  16455. "ldr r6, [%[a], #20]\n\t"
  16456. "ldr r8, [%[b], #0]\n\t"
  16457. "umull r3, r4, r6, r8\n\t"
  16458. "adds r10, r3, r10\n\t"
  16459. "adcs r11, r4, r11\n\t"
  16460. "adc r14, r5, r14\n\t"
  16461. "str r10, [sp, #20]\n\t" /* product word 5 */
  16462. /* A[0] * B[6] */
  16463. "ldr r6, [%[a], #0]\n\t"
  16464. "ldr r8, [%[b], #24]\n\t"
  16465. "umull r3, r4, r6, r8\n\t"
  16466. "adds r11, r3, r11\n\t"
  16467. "adcs r14, r4, r14\n\t"
  16468. "adc r9, r5, #0\n\t"
  16469. /* A[1] * B[5] */
  16470. "ldr r6, [%[a], #4]\n\t"
  16471. "ldr r8, [%[b], #20]\n\t"
  16472. "umull r3, r4, r6, r8\n\t"
  16473. "adds r11, r3, r11\n\t"
  16474. "adcs r14, r4, r14\n\t"
  16475. "adc r9, r5, r9\n\t"
  16476. /* A[2] * B[4] */
  16477. "ldr r6, [%[a], #8]\n\t"
  16478. "ldr r8, [%[b], #16]\n\t"
  16479. "umull r3, r4, r6, r8\n\t"
  16480. "adds r11, r3, r11\n\t"
  16481. "adcs r14, r4, r14\n\t"
  16482. "adc r9, r5, r9\n\t"
  16483. /* A[3] * B[3] */
  16484. "ldr r6, [%[a], #12]\n\t"
  16485. "ldr r8, [%[b], #12]\n\t"
  16486. "umull r3, r4, r6, r8\n\t"
  16487. "adds r11, r3, r11\n\t"
  16488. "adcs r14, r4, r14\n\t"
  16489. "adc r9, r5, r9\n\t"
  16490. /* A[4] * B[2] */
  16491. "ldr r6, [%[a], #16]\n\t"
  16492. "ldr r8, [%[b], #8]\n\t"
  16493. "umull r3, r4, r6, r8\n\t"
  16494. "adds r11, r3, r11\n\t"
  16495. "adcs r14, r4, r14\n\t"
  16496. "adc r9, r5, r9\n\t"
  16497. /* A[5] * B[1] */
  16498. "ldr r6, [%[a], #20]\n\t"
  16499. "ldr r8, [%[b], #4]\n\t"
  16500. "umull r3, r4, r6, r8\n\t"
  16501. "adds r11, r3, r11\n\t"
  16502. "adcs r14, r4, r14\n\t"
  16503. "adc r9, r5, r9\n\t"
  16504. /* A[6] * B[0] */
  16505. "ldr r6, [%[a], #24]\n\t"
  16506. "ldr r8, [%[b], #0]\n\t"
  16507. "umull r3, r4, r6, r8\n\t"
  16508. "adds r11, r3, r11\n\t"
  16509. "adcs r14, r4, r14\n\t"
  16510. "adc r9, r5, r9\n\t"
  16511. "str r11, [sp, #24]\n\t" /* product word 6 */
  16512. /* A[0] * B[7] */
  16513. "ldr r6, [%[a], #0]\n\t"
  16514. "ldr r8, [%[b], #28]\n\t"
  16515. "umull r3, r4, r6, r8\n\t"
  16516. "adds r14, r3, r14\n\t"
  16517. "adcs r9, r4, r9\n\t"
  16518. "adc r10, r5, #0\n\t"
  16519. /* A[1] * B[6] */
  16520. "ldr r6, [%[a], #4]\n\t"
  16521. "ldr r8, [%[b], #24]\n\t"
  16522. "umull r3, r4, r6, r8\n\t"
  16523. "adds r14, r3, r14\n\t"
  16524. "adcs r9, r4, r9\n\t"
  16525. "adc r10, r5, r10\n\t"
  16526. /* A[2] * B[5] */
  16527. "ldr r6, [%[a], #8]\n\t"
  16528. "ldr r8, [%[b], #20]\n\t"
  16529. "umull r3, r4, r6, r8\n\t"
  16530. "adds r14, r3, r14\n\t"
  16531. "adcs r9, r4, r9\n\t"
  16532. "adc r10, r5, r10\n\t"
  16533. /* A[3] * B[4] */
  16534. "ldr r6, [%[a], #12]\n\t"
  16535. "ldr r8, [%[b], #16]\n\t"
  16536. "umull r3, r4, r6, r8\n\t"
  16537. "adds r14, r3, r14\n\t"
  16538. "adcs r9, r4, r9\n\t"
  16539. "adc r10, r5, r10\n\t"
  16540. /* A[4] * B[3] */
  16541. "ldr r6, [%[a], #16]\n\t"
  16542. "ldr r8, [%[b], #12]\n\t"
  16543. "umull r3, r4, r6, r8\n\t"
  16544. "adds r14, r3, r14\n\t"
  16545. "adcs r9, r4, r9\n\t"
  16546. "adc r10, r5, r10\n\t"
  16547. /* A[5] * B[2] */
  16548. "ldr r6, [%[a], #20]\n\t"
  16549. "ldr r8, [%[b], #8]\n\t"
  16550. "umull r3, r4, r6, r8\n\t"
  16551. "adds r14, r3, r14\n\t"
  16552. "adcs r9, r4, r9\n\t"
  16553. "adc r10, r5, r10\n\t"
  16554. /* A[6] * B[1] */
  16555. "ldr r6, [%[a], #24]\n\t"
  16556. "ldr r8, [%[b], #4]\n\t"
  16557. "umull r3, r4, r6, r8\n\t"
  16558. "adds r14, r3, r14\n\t"
  16559. "adcs r9, r4, r9\n\t"
  16560. "adc r10, r5, r10\n\t"
  16561. /* A[7] * B[0] */
  16562. "ldr r6, [%[a], #28]\n\t"
  16563. "ldr r8, [%[b], #0]\n\t"
  16564. "umull r3, r4, r6, r8\n\t"
  16565. "adds r14, r3, r14\n\t"
  16566. "adcs r9, r4, r9\n\t"
  16567. "adc r10, r5, r10\n\t"
  16568. "str r14, [sp, #28]\n\t" /* product word 7 */
  16569. /* A[1] * B[7] */
  16570. "ldr r6, [%[a], #4]\n\t"
  16571. "ldr r8, [%[b], #28]\n\t"
  16572. "umull r3, r4, r6, r8\n\t"
  16573. "adds r9, r3, r9\n\t"
  16574. "adcs r10, r4, r10\n\t"
  16575. "adc r11, r5, #0\n\t"
  16576. /* A[2] * B[6] */
  16577. "ldr r6, [%[a], #8]\n\t"
  16578. "ldr r8, [%[b], #24]\n\t"
  16579. "umull r3, r4, r6, r8\n\t"
  16580. "adds r9, r3, r9\n\t"
  16581. "adcs r10, r4, r10\n\t"
  16582. "adc r11, r5, r11\n\t"
  16583. /* A[3] * B[5] */
  16584. "ldr r6, [%[a], #12]\n\t"
  16585. "ldr r8, [%[b], #20]\n\t"
  16586. "umull r3, r4, r6, r8\n\t"
  16587. "adds r9, r3, r9\n\t"
  16588. "adcs r10, r4, r10\n\t"
  16589. "adc r11, r5, r11\n\t"
  16590. /* A[4] * B[4] */
  16591. "ldr r6, [%[a], #16]\n\t"
  16592. "ldr r8, [%[b], #16]\n\t"
  16593. "umull r3, r4, r6, r8\n\t"
  16594. "adds r9, r3, r9\n\t"
  16595. "adcs r10, r4, r10\n\t"
  16596. "adc r11, r5, r11\n\t"
  16597. /* A[5] * B[3] */
  16598. "ldr r6, [%[a], #20]\n\t"
  16599. "ldr r8, [%[b], #12]\n\t"
  16600. "umull r3, r4, r6, r8\n\t"
  16601. "adds r9, r3, r9\n\t"
  16602. "adcs r10, r4, r10\n\t"
  16603. "adc r11, r5, r11\n\t"
  16604. /* A[6] * B[2] */
  16605. "ldr r6, [%[a], #24]\n\t"
  16606. "ldr r8, [%[b], #8]\n\t"
  16607. "umull r3, r4, r6, r8\n\t"
  16608. "adds r9, r3, r9\n\t"
  16609. "adcs r10, r4, r10\n\t"
  16610. "adc r11, r5, r11\n\t"
  16611. /* A[7] * B[1] */
  16612. "ldr r6, [%[a], #28]\n\t"
  16613. "ldr r8, [%[b], #4]\n\t"
  16614. "umull r3, r4, r6, r8\n\t"
  16615. "adds r9, r3, r9\n\t"
  16616. "adcs r10, r4, r10\n\t"
  16617. "adc r11, r5, r11\n\t"
  16618. "str r9, [sp, #32]\n\t" /* product word 8 */
  16619. /* A[2] * B[7] */
  16620. "ldr r6, [%[a], #8]\n\t"
  16621. "ldr r8, [%[b], #28]\n\t"
  16622. "umull r3, r4, r6, r8\n\t"
  16623. "adds r10, r3, r10\n\t"
  16624. "adcs r11, r4, r11\n\t"
  16625. "adc r14, r5, #0\n\t"
  16626. /* A[3] * B[6] */
  16627. "ldr r6, [%[a], #12]\n\t"
  16628. "ldr r8, [%[b], #24]\n\t"
  16629. "umull r3, r4, r6, r8\n\t"
  16630. "adds r10, r3, r10\n\t"
  16631. "adcs r11, r4, r11\n\t"
  16632. "adc r14, r5, r14\n\t"
  16633. /* A[4] * B[5] */
  16634. "ldr r6, [%[a], #16]\n\t"
  16635. "ldr r8, [%[b], #20]\n\t"
  16636. "umull r3, r4, r6, r8\n\t"
  16637. "adds r10, r3, r10\n\t"
  16638. "adcs r11, r4, r11\n\t"
  16639. "adc r14, r5, r14\n\t"
  16640. /* A[5] * B[4] */
  16641. "ldr r6, [%[a], #20]\n\t"
  16642. "ldr r8, [%[b], #16]\n\t"
  16643. "umull r3, r4, r6, r8\n\t"
  16644. "adds r10, r3, r10\n\t"
  16645. "adcs r11, r4, r11\n\t"
  16646. "adc r14, r5, r14\n\t"
  16647. /* A[6] * B[3] */
  16648. "ldr r6, [%[a], #24]\n\t"
  16649. "ldr r8, [%[b], #12]\n\t"
  16650. "umull r3, r4, r6, r8\n\t"
  16651. "adds r10, r3, r10\n\t"
  16652. "adcs r11, r4, r11\n\t"
  16653. "adc r14, r5, r14\n\t"
  16654. /* A[7] * B[2] */
  16655. "ldr r6, [%[a], #28]\n\t"
  16656. "ldr r8, [%[b], #8]\n\t"
  16657. "umull r3, r4, r6, r8\n\t"
  16658. "adds r10, r3, r10\n\t"
  16659. "adcs r11, r4, r11\n\t"
  16660. "adc r14, r5, r14\n\t"
  16661. "str r10, [sp, #36]\n\t" /* product word 9 */
  16662. /* A[3] * B[7] */
  16663. "ldr r6, [%[a], #12]\n\t"
  16664. "ldr r8, [%[b], #28]\n\t"
  16665. "umull r3, r4, r6, r8\n\t"
  16666. "adds r11, r3, r11\n\t"
  16667. "adcs r14, r4, r14\n\t"
  16668. "adc r9, r5, #0\n\t"
  16669. /* A[4] * B[6] */
  16670. "ldr r6, [%[a], #16]\n\t"
  16671. "ldr r8, [%[b], #24]\n\t"
  16672. "umull r3, r4, r6, r8\n\t"
  16673. "adds r11, r3, r11\n\t"
  16674. "adcs r14, r4, r14\n\t"
  16675. "adc r9, r5, r9\n\t"
  16676. /* A[5] * B[5] */
  16677. "ldr r6, [%[a], #20]\n\t"
  16678. "ldr r8, [%[b], #20]\n\t"
  16679. "umull r3, r4, r6, r8\n\t"
  16680. "adds r11, r3, r11\n\t"
  16681. "adcs r14, r4, r14\n\t"
  16682. "adc r9, r5, r9\n\t"
  16683. /* A[6] * B[4] */
  16684. "ldr r6, [%[a], #24]\n\t"
  16685. "ldr r8, [%[b], #16]\n\t"
  16686. "umull r3, r4, r6, r8\n\t"
  16687. "adds r11, r3, r11\n\t"
  16688. "adcs r14, r4, r14\n\t"
  16689. "adc r9, r5, r9\n\t"
  16690. /* A[7] * B[3] */
  16691. "ldr r6, [%[a], #28]\n\t"
  16692. "ldr r8, [%[b], #12]\n\t"
  16693. "umull r3, r4, r6, r8\n\t"
  16694. "adds r11, r3, r11\n\t"
  16695. "adcs r14, r4, r14\n\t"
  16696. "adc r9, r5, r9\n\t"
  16697. "str r11, [sp, #40]\n\t" /* product word 10 */
  16698. /* A[4] * B[7] */
  16699. "ldr r6, [%[a], #16]\n\t"
  16700. "ldr r8, [%[b], #28]\n\t"
  16701. "umull r3, r4, r6, r8\n\t"
  16702. "adds r14, r3, r14\n\t"
  16703. "adcs r9, r4, r9\n\t"
  16704. "adc r10, r5, #0\n\t"
  16705. /* A[5] * B[6] */
  16706. "ldr r6, [%[a], #20]\n\t"
  16707. "ldr r8, [%[b], #24]\n\t"
  16708. "umull r3, r4, r6, r8\n\t"
  16709. "adds r14, r3, r14\n\t"
  16710. "adcs r9, r4, r9\n\t"
  16711. "adc r10, r5, r10\n\t"
  16712. /* A[6] * B[5] */
  16713. "ldr r6, [%[a], #24]\n\t"
  16714. "ldr r8, [%[b], #20]\n\t"
  16715. "umull r3, r4, r6, r8\n\t"
  16716. "adds r14, r3, r14\n\t"
  16717. "adcs r9, r4, r9\n\t"
  16718. "adc r10, r5, r10\n\t"
  16719. /* A[7] * B[4] */
  16720. "ldr r6, [%[a], #28]\n\t"
  16721. "ldr r8, [%[b], #16]\n\t"
  16722. "umull r3, r4, r6, r8\n\t"
  16723. "adds r14, r3, r14\n\t"
  16724. "adcs r9, r4, r9\n\t"
  16725. "adc r10, r5, r10\n\t"
  16726. "str r14, [sp, #44]\n\t" /* product word 11 */
  16727. /* A[5] * B[7] */
  16728. "ldr r6, [%[a], #20]\n\t"
  16729. "ldr r8, [%[b], #28]\n\t"
  16730. "umull r3, r4, r6, r8\n\t"
  16731. "adds r9, r3, r9\n\t"
  16732. "adcs r10, r4, r10\n\t"
  16733. "adc r11, r5, #0\n\t"
  16734. /* A[6] * B[6] */
  16735. "ldr r6, [%[a], #24]\n\t"
  16736. "ldr r8, [%[b], #24]\n\t"
  16737. "umull r3, r4, r6, r8\n\t"
  16738. "adds r9, r3, r9\n\t"
  16739. "adcs r10, r4, r10\n\t"
  16740. "adc r11, r5, r11\n\t"
  16741. /* A[7] * B[5] */
  16742. "ldr r6, [%[a], #28]\n\t"
  16743. "ldr r8, [%[b], #20]\n\t"
  16744. "umull r3, r4, r6, r8\n\t"
  16745. "adds r9, r3, r9\n\t"
  16746. "adcs r10, r4, r10\n\t"
  16747. "adc r11, r5, r11\n\t"
  16748. /* A[6] * B[7] */
  16749. "ldr r6, [%[a], #24]\n\t"
  16750. "ldr r8, [%[b], #28]\n\t"
  16751. "umull r3, r4, r6, r8\n\t"
  16752. "adds r10, r3, r10\n\t"
  16753. "adcs r11, r4, r11\n\t"
  16754. "adc r14, r5, #0\n\t"
  16755. /* A[7] * B[6] */
  16756. "ldr r6, [%[a], #28]\n\t"
  16757. "ldr r8, [%[b], #24]\n\t"
  16758. "umull r3, r4, r6, r8\n\t"
  16759. "adds r10, r3, r10\n\t"
  16760. "adcs r11, r4, r11\n\t"
  16761. "adc r14, r5, r14\n\t"
  16762. /* A[7] * B[7] */
  16763. "ldr r6, [%[a], #28]\n\t"
  16764. "ldr r8, [%[b], #28]\n\t"
  16765. "umull r3, r4, r6, r8\n\t"
  16766. "adds r11, r3, r11\n\t"
  16767. "adc r14, r4, r14\n\t"
  16768. "str r9, [sp, #48]\n\t" /* product word 12 */
  16769. "str r10, [sp, #52]\n\t" /* product word 13 */
  16770. "str r11, [sp, #56]\n\t" /* product word 14 */
  16771. "str r14, [sp, #60]\n\t" /* product word 15 */
  16772. /* Start Reduction */
  16773. "ldr r4, [sp, #0]\n\t" /* reload product words 0..7 into r4,r5,r6,r8,r9,r10,r11,r14 */
  16774. "ldr r5, [sp, #4]\n\t"
  16775. "ldr r6, [sp, #8]\n\t"
  16776. "ldr r8, [sp, #12]\n\t"
  16777. "ldr r9, [sp, #16]\n\t"
  16778. "ldr r10, [sp, #20]\n\t"
  16779. "ldr r11, [sp, #24]\n\t"
  16780. "ldr r14, [sp, #28]\n\t"
  16781. /* mu = a[0]-a[7] + a[0]-a[4] << 96 + (a[0]-a[1] * 2) << 192 */
  16782. /* - a[0] << 224 */
  16783. /* + (a[0]-a[1] * 2) << (6 * 32) */
  16784. "adds r11, r11, r4\n\t"
  16785. "adc r14, r14, r5\n\t"
  16786. "adds r11, r11, r4\n\t"
  16787. "adc r14, r14, r5\n\t"
  16788. /* - a[0] << (7 * 32) */
  16789. "sub r14, r14, r4\n\t"
  16790. /* + a[0]-a[4] << (3 * 32) */
  16791. "mov %[a], r8\n\t" /* %[a] and %[b] are scratch registers from here on; all later loads use sp */
  16792. "mov %[b], r9\n\t"
  16793. "adds r8, r8, r4\n\t"
  16794. "adcs r9, r9, r5\n\t"
  16795. "adcs r10, r10, r6\n\t"
  16796. "adcs r11, r11, %[a]\n\t"
  16797. "adc r14, r14, %[b]\n\t"
  16798. "str r4, [sp, #0]\n\t" /* write mu words 0..5 (called t[0]..t[5] below) over product words 0..5 */
  16799. "str r5, [sp, #4]\n\t"
  16800. "str r6, [sp, #8]\n\t"
  16801. "str r8, [sp, #12]\n\t"
  16802. "str r9, [sp, #16]\n\t"
  16803. "str r10, [sp, #20]\n\t"
  16804. /* a += mu * m */
  16805. /* += mu * ((1 << 256) - (1 << 224) + (1 << 192) + (1 << 96) - 1) */
  16806. "mov %[a], #0\n\t" /* %[a] = 0: zero operand for carry folding; %[b] holds the running carry */
  16807. /* a[6] += t[0] + t[3] */
  16808. "ldr r3, [sp, #24]\n\t"
  16809. "adds r3, r3, r4\n\t"
  16810. "adc %[b], %[a], #0\n\t"
  16811. "adds r3, r3, r8\n\t"
  16812. "adc %[b], %[b], #0\n\t"
  16813. "str r11, [sp, #24]\n\t" /* the sum in r3 is not stored, only its carry in %[b] is kept; slot 6 now holds mu word 6 (t[6]) */
  16814. /* a[7] += t[1] + t[4] */
  16815. "ldr r3, [sp, #28]\n\t"
  16816. "adds r3, r3, %[b]\n\t"
  16817. "adc %[b], %[a], #0\n\t"
  16818. "adds r3, r3, r5\n\t"
  16819. "adc %[b], %[b], #0\n\t"
  16820. "adds r3, r3, r9\n\t"
  16821. "adc %[b], %[b], #0\n\t"
  16822. "str r14, [sp, #28]\n\t" /* slot 7 now holds mu word 7 (t[7]) */
  16823. "str r3, [sp, #64]\n\t" /* the updated word 7 is parked in the extra scratch word */
  16824. /* a[8] += t[0] + t[2] + t[5] */
  16825. "ldr r3, [sp, #32]\n\t"
  16826. "adds r3, r3, %[b]\n\t"
  16827. "adc %[b], %[a], #0\n\t"
  16828. "adds r3, r3, r4\n\t"
  16829. "adc %[b], %[b], #0\n\t"
  16830. "adds r3, r3, r6\n\t"
  16831. "adc %[b], %[b], #0\n\t"
  16832. "adds r3, r3, r10\n\t"
  16833. "adc %[b], %[b], #0\n\t"
  16834. "str r3, [sp, #32]\n\t"
  16835. /* a[9] += t[1] + t[3] + t[6] */
  16836. /* a[10] += t[2] + t[4] + t[7] */
  16837. "ldr r3, [sp, #36]\n\t"
  16838. "ldr r4, [sp, #40]\n\t"
  16839. "adds r3, r3, %[b]\n\t"
  16840. "adcs r4, r4, #0\n\t"
  16841. "adc %[b], %[a], #0\n\t"
  16842. "adds r3, r3, r5\n\t"
  16843. "adcs r4, r4, r6\n\t"
  16844. "adc %[b], %[b], #0\n\t"
  16845. "adds r3, r3, r8\n\t"
  16846. "adcs r4, r4, r9\n\t"
  16847. "adc %[b], %[b], #0\n\t"
  16848. "adds r3, r3, r11\n\t"
  16849. "adcs r4, r4, r14\n\t"
  16850. "adc %[b], %[b], #0\n\t"
  16851. "str r3, [sp, #36]\n\t"
  16852. "str r4, [sp, #40]\n\t"
  16853. /* a[11] += t[3] + t[5] */
  16854. /* a[12] += t[4] + t[6] */
  16855. /* a[13] += t[5] + t[7] */
  16856. /* a[14] += t[6] */
  16857. "ldr r3, [sp, #44]\n\t"
  16858. "ldr r4, [sp, #48]\n\t"
  16859. "ldr r5, [sp, #52]\n\t"
  16860. "ldr r6, [sp, #56]\n\t"
  16861. "adds r3, r3, %[b]\n\t"
  16862. "adcs r4, r4, #0\n\t"
  16863. "adcs r5, r5, #0\n\t"
  16864. "adcs r6, r6, #0\n\t"
  16865. "adc %[b], %[a], #0\n\t"
  16866. "adds r3, r3, r8\n\t"
  16867. "adcs r4, r4, r9\n\t"
  16868. "adcs r5, r5, r10\n\t"
  16869. "adcs r6, r6, r11\n\t"
  16870. "adc %[b], %[b], #0\n\t"
  16871. "adds r3, r3, r10\n\t"
  16872. "adcs r4, r4, r11\n\t"
  16873. "adcs r5, r5, r14\n\t"
  16874. "adcs r6, r6, #0\n\t"
  16875. "adc %[b], %[b], #0\n\t"
  16876. "str r3, [sp, #44]\n\t"
  16877. "str r4, [sp, #48]\n\t"
  16878. "str r5, [sp, #52]\n\t"
  16879. "str r6, [sp, #56]\n\t"
  16880. /* a[15] += t[7] */
  16881. "ldr r3, [sp, #60]\n\t"
  16882. "adds r3, r3, %[b]\n\t"
  16883. "adc %[b], %[a], #0\n\t"
  16884. "adds r3, r3, r14\n\t"
  16885. "adc %[b], %[b], #0\n\t"
  16886. "str r3, [sp, #60]\n\t"
  16887. "ldr r3, [sp, #64]\n\t" /* subtract t[0..3] from words 7..10; word 7 comes from the scratch slot */
  16888. "ldr r4, [sp, #32]\n\t"
  16889. "ldr r5, [sp, #36]\n\t"
  16890. "ldr r6, [sp, #40]\n\t"
  16891. "ldr r9, [sp, #0]\n\t"
  16892. "ldr r10, [sp, #4]\n\t"
  16893. "ldr r11, [sp, #8]\n\t"
  16894. "ldr r14, [sp, #12]\n\t"
  16895. "subs r3, r3, r9\n\t" /* this difference is not stored (r3 is reloaded below); only the borrow continues */
  16896. "sbcs r4, r4, r10\n\t"
  16897. "sbcs r5, r5, r11\n\t"
  16898. "sbcs r6, r6, r14\n\t"
  16899. "str r4, [sp, #32]\n\t"
  16900. "str r5, [sp, #36]\n\t"
  16901. "str r6, [sp, #40]\n\t"
  16902. "ldr r3, [sp, #44]\n\t"
  16903. "ldr r4, [sp, #48]\n\t"
  16904. "ldr r5, [sp, #52]\n\t"
  16905. "ldr r6, [sp, #56]\n\t"
  16906. "ldr r8, [sp, #60]\n\t"
  16907. "ldr r9, [sp, #16]\n\t"
  16908. "ldr r10, [sp, #20]\n\t"
  16909. "ldr r11, [sp, #24]\n\t"
  16910. "ldr r14, [sp, #28]\n\t"
  16911. "sbcs r3, r3, r9\n\t" /* same borrow chain: subtract t[4..7] from words 11..14 */
  16912. "sbcs r4, r4, r10\n\t"
  16913. "sbcs r5, r5, r11\n\t"
  16914. "sbcs r6, r6, r14\n\t"
  16915. "sbc r8, r8, #0\n\t" /* propagate the final borrow into word 15 */
  16916. "str r3, [sp, #44]\n\t"
  16917. "str r4, [sp, #48]\n\t"
  16918. "str r5, [sp, #52]\n\t"
  16919. "str r6, [sp, #56]\n\t"
  16920. "str r8, [sp, #60]\n\t"
  16921. /* mask m and sub from result if overflow */
  16922. "sub %[b], %[a], %[b]\n\t" /* %[a] is still 0 here, so %[b] = -(accumulated carry) */
  16923. "and %[a], %[b], #1\n\t" /* %[a] = low bit of that mask */
  16924. "ldr r3, [sp, #32]\n\t"
  16925. "ldr r4, [sp, #36]\n\t"
  16926. "ldr r5, [sp, #40]\n\t"
  16927. "ldr r6, [sp, #44]\n\t"
  16928. "ldr r8, [sp, #48]\n\t"
  16929. "ldr r9, [sp, #52]\n\t"
  16930. "ldr r10, [sp, #56]\n\t"
  16931. "ldr r11, [sp, #60]\n\t"
  16932. "subs r3, r3, %[b]\n\t" /* subtract the word pattern {b,b,b,0,0,0,a,b}; when %[b] is all ones this is the modulus written out in the "a += mu * m" comment */
  16933. "sbcs r4, r4, %[b]\n\t"
  16934. "sbcs r5, r5, %[b]\n\t"
  16935. "sbcs r6, r6, #0\n\t"
  16936. "sbcs r8, r8, #0\n\t"
  16937. "sbcs r9, r9, #0\n\t"
  16938. "sbcs r10, r10, %[a]\n\t"
  16939. "sbc r11, r11, %[b]\n\t"
  16940. "str r3, [%[r], #0]\n\t" /* store the 8 result words to r */
  16941. "str r4, [%[r], #4]\n\t"
  16942. "str r5, [%[r], #8]\n\t"
  16943. "str r6, [%[r], #12]\n\t"
  16944. "str r8, [%[r], #16]\n\t"
  16945. "str r9, [%[r], #20]\n\t"
  16946. "str r10, [%[r], #24]\n\t"
  16947. "str r11, [%[r], #28]\n\t"
  16948. "add sp, sp, #68\n\t" /* release the scratch area */
  16949. : [a] "+r" (a), [b] "+r" (b) /* read-write operands: both registers are overwritten as scratch above */
  16950. : [r] "r" (r)
  16951. : "memory", "r9", "r10", "r11", "r14", "r3", "r4", "r5", "r6", "r8"
  16952. );
  16953. }
  16954. /* Square the Montgomery form number mod the modulus (prime). (r = a * a mod m)
  16955. *
  16956. * r Result of squaring.
  16957. * a Number to square in Montgomery form.
  16958. * m Modulus (prime).
  16959. * mp Montgomery multiplier.
  16960. */
  16961. SP_NOINLINE static void sp_256_mont_sqr_8(sp_digit* r, const sp_digit* a, const sp_digit* m,
  16962. sp_digit mp)
  16963. {
  16964. (void)mp;
  16965. (void)m;
  16966. __asm__ __volatile__ (
  16967. "sub sp, sp, #68\n\t"
  16968. "mov r5, #0\n\t"
  16969. /* A[0] * A[1] */
  16970. "ldr r6, [%[a], #0]\n\t"
  16971. "ldr r8, [%[a], #4]\n\t"
  16972. "umull r10, r11, r6, r8\n\t"
  16973. "str r10, [sp, #4]\n\t"
  16974. /* A[0] * A[2] */
  16975. "ldr r6, [%[a], #0]\n\t"
  16976. "ldr r8, [%[a], #8]\n\t"
  16977. "umull r3, r4, r6, r8\n\t"
  16978. "adds r11, r3, r11\n\t"
  16979. "adc r14, r4, #0\n\t"
  16980. "str r11, [sp, #8]\n\t"
  16981. /* A[0] * A[3] */
  16982. "ldr r6, [%[a], #0]\n\t"
  16983. "ldr r8, [%[a], #12]\n\t"
  16984. "umull r3, r4, r6, r8\n\t"
  16985. "adds r14, r3, r14\n\t"
  16986. "adc r9, r4, #0\n\t"
  16987. /* A[1] * A[2] */
  16988. "ldr r6, [%[a], #4]\n\t"
  16989. "ldr r8, [%[a], #8]\n\t"
  16990. "umull r3, r4, r6, r8\n\t"
  16991. "adds r14, r3, r14\n\t"
  16992. "adcs r9, r4, r9\n\t"
  16993. "adc r10, r5, #0\n\t"
  16994. "str r14, [sp, #12]\n\t"
  16995. /* A[0] * A[4] */
  16996. "ldr r6, [%[a], #0]\n\t"
  16997. "ldr r8, [%[a], #16]\n\t"
  16998. "umull r3, r4, r6, r8\n\t"
  16999. "adds r9, r3, r9\n\t"
  17000. "adc r10, r4, r10\n\t"
  17001. /* A[1] * A[3] */
  17002. "ldr r6, [%[a], #4]\n\t"
  17003. "ldr r8, [%[a], #12]\n\t"
  17004. "umull r3, r4, r6, r8\n\t"
  17005. "adds r9, r3, r9\n\t"
  17006. "adcs r10, r4, r10\n\t"
  17007. "adc r11, r5, #0\n\t"
  17008. "str r9, [sp, #16]\n\t"
  17009. /* A[0] * A[5] */
  17010. "ldr r6, [%[a], #0]\n\t"
  17011. "ldr r8, [%[a], #20]\n\t"
  17012. "umull r3, r4, r6, r8\n\t"
  17013. "adds r10, r3, r10\n\t"
  17014. "adc r11, r4, r11\n\t"
  17015. /* A[1] * A[4] */
  17016. "ldr r6, [%[a], #4]\n\t"
  17017. "ldr r8, [%[a], #16]\n\t"
  17018. "umull r3, r4, r6, r8\n\t"
  17019. "adds r10, r3, r10\n\t"
  17020. "adcs r11, r4, r11\n\t"
  17021. "adc r14, r5, #0\n\t"
  17022. /* A[2] * A[3] */
  17023. "ldr r6, [%[a], #8]\n\t"
  17024. "ldr r8, [%[a], #12]\n\t"
  17025. "umull r3, r4, r6, r8\n\t"
  17026. "adds r10, r3, r10\n\t"
  17027. "adcs r11, r4, r11\n\t"
  17028. "adc r14, r5, r14\n\t"
  17029. "str r10, [sp, #20]\n\t"
  17030. /* A[0] * A[6] */
  17031. "ldr r6, [%[a], #0]\n\t"
  17032. "ldr r8, [%[a], #24]\n\t"
  17033. "umull r3, r4, r6, r8\n\t"
  17034. "adds r11, r3, r11\n\t"
  17035. "adcs r14, r4, r14\n\t"
  17036. "adc r9, r5, #0\n\t"
  17037. /* A[1] * A[5] */
  17038. "ldr r6, [%[a], #4]\n\t"
  17039. "ldr r8, [%[a], #20]\n\t"
  17040. "umull r3, r4, r6, r8\n\t"
  17041. "adds r11, r3, r11\n\t"
  17042. "adcs r14, r4, r14\n\t"
  17043. "adc r9, r5, r9\n\t"
  17044. /* A[2] * A[4] */
  17045. "ldr r6, [%[a], #8]\n\t"
  17046. "ldr r8, [%[a], #16]\n\t"
  17047. "umull r3, r4, r6, r8\n\t"
  17048. "adds r11, r3, r11\n\t"
  17049. "adcs r14, r4, r14\n\t"
  17050. "adc r9, r5, r9\n\t"
  17051. "str r11, [sp, #24]\n\t"
  17052. /* A[0] * A[7] */
  17053. "ldr r6, [%[a], #0]\n\t"
  17054. "ldr r8, [%[a], #28]\n\t"
  17055. "umull r3, r4, r6, r8\n\t"
  17056. "adds r14, r3, r14\n\t"
  17057. "adcs r9, r4, r9\n\t"
  17058. "adc r10, r5, #0\n\t"
  17059. /* A[1] * A[6] */
  17060. "ldr r6, [%[a], #4]\n\t"
  17061. "ldr r8, [%[a], #24]\n\t"
  17062. "umull r3, r4, r6, r8\n\t"
  17063. "adds r14, r3, r14\n\t"
  17064. "adcs r9, r4, r9\n\t"
  17065. "adc r10, r5, r10\n\t"
  17066. /* A[2] * A[5] */
  17067. "ldr r6, [%[a], #8]\n\t"
  17068. "ldr r8, [%[a], #20]\n\t"
  17069. "umull r3, r4, r6, r8\n\t"
  17070. "adds r14, r3, r14\n\t"
  17071. "adcs r9, r4, r9\n\t"
  17072. "adc r10, r5, r10\n\t"
  17073. /* A[3] * A[4] */
  17074. "ldr r6, [%[a], #12]\n\t"
  17075. "ldr r8, [%[a], #16]\n\t"
  17076. "umull r3, r4, r6, r8\n\t"
  17077. "adds r14, r3, r14\n\t"
  17078. "adcs r9, r4, r9\n\t"
  17079. "adc r10, r5, r10\n\t"
  17080. "str r14, [sp, #28]\n\t"
  17081. /* A[1] * A[7] */
  17082. "ldr r6, [%[a], #4]\n\t"
  17083. "ldr r8, [%[a], #28]\n\t"
  17084. "umull r3, r4, r6, r8\n\t"
  17085. "adds r9, r3, r9\n\t"
  17086. "adcs r10, r4, r10\n\t"
  17087. "adc r11, r5, #0\n\t"
  17088. /* A[2] * A[6] */
  17089. "ldr r6, [%[a], #8]\n\t"
  17090. "ldr r8, [%[a], #24]\n\t"
  17091. "umull r3, r4, r6, r8\n\t"
  17092. "adds r9, r3, r9\n\t"
  17093. "adcs r10, r4, r10\n\t"
  17094. "adc r11, r5, r11\n\t"
  17095. /* A[3] * A[5] */
  17096. "ldr r6, [%[a], #12]\n\t"
  17097. "ldr r8, [%[a], #20]\n\t"
  17098. "umull r3, r4, r6, r8\n\t"
  17099. "adds r9, r3, r9\n\t"
  17100. "adcs r10, r4, r10\n\t"
  17101. "adc r11, r5, r11\n\t"
  17102. "str r9, [sp, #32]\n\t"
  17103. /* A[2] * A[7] */
  17104. "ldr r6, [%[a], #8]\n\t"
  17105. "ldr r8, [%[a], #28]\n\t"
  17106. "umull r3, r4, r6, r8\n\t"
  17107. "adds r10, r3, r10\n\t"
  17108. "adcs r11, r4, r11\n\t"
  17109. "adc r14, r5, #0\n\t"
  17110. /* A[3] * A[6] */
  17111. "ldr r6, [%[a], #12]\n\t"
  17112. "ldr r8, [%[a], #24]\n\t"
  17113. "umull r3, r4, r6, r8\n\t"
  17114. "adds r10, r3, r10\n\t"
  17115. "adcs r11, r4, r11\n\t"
  17116. "adc r14, r5, r14\n\t"
  17117. /* A[4] * A[5] */
  17118. "ldr r6, [%[a], #16]\n\t"
  17119. "ldr r8, [%[a], #20]\n\t"
  17120. "umull r3, r4, r6, r8\n\t"
  17121. "adds r10, r3, r10\n\t"
  17122. "adcs r11, r4, r11\n\t"
  17123. "adc r14, r5, r14\n\t"
  17124. "str r10, [sp, #36]\n\t"
  17125. /* A[3] * A[7] */
  17126. "ldr r6, [%[a], #12]\n\t"
  17127. "ldr r8, [%[a], #28]\n\t"
  17128. "umull r3, r4, r6, r8\n\t"
  17129. "adds r11, r3, r11\n\t"
  17130. "adcs r14, r4, r14\n\t"
  17131. "adc r9, r5, #0\n\t"
  17132. /* A[4] * A[6] */
  17133. "ldr r6, [%[a], #16]\n\t"
  17134. "ldr r8, [%[a], #24]\n\t"
  17135. "umull r3, r4, r6, r8\n\t"
  17136. "adds r11, r3, r11\n\t"
  17137. "adcs r14, r4, r14\n\t"
  17138. "adc r9, r5, r9\n\t"
  17139. "str r11, [sp, #40]\n\t"
  17140. /* A[4] * A[7] */
  17141. "ldr r6, [%[a], #16]\n\t"
  17142. "ldr r8, [%[a], #28]\n\t"
  17143. "umull r3, r4, r6, r8\n\t"
  17144. "adds r14, r3, r14\n\t"
  17145. "adcs r9, r4, r9\n\t"
  17146. "adc r10, r5, #0\n\t"
  17147. /* A[5] * A[6] */
  17148. "ldr r6, [%[a], #20]\n\t"
  17149. "ldr r8, [%[a], #24]\n\t"
  17150. "umull r3, r4, r6, r8\n\t"
  17151. "adds r14, r3, r14\n\t"
  17152. "adcs r9, r4, r9\n\t"
  17153. "adc r10, r5, r10\n\t"
  17154. "str r14, [sp, #44]\n\t"
  17155. /* A[5] * A[7] */
  17156. "ldr r6, [%[a], #20]\n\t"
  17157. "ldr r8, [%[a], #28]\n\t"
  17158. "umull r3, r4, r6, r8\n\t"
  17159. "adds r9, r3, r9\n\t"
  17160. "adcs r10, r4, r10\n\t"
  17161. "adc r11, r5, #0\n\t"
  17162. "str r9, [sp, #48]\n\t"
  17163. /* A[6] * A[7] */
  17164. "ldr r6, [%[a], #24]\n\t"
  17165. "ldr r8, [%[a], #28]\n\t"
  17166. "umull r3, r4, r6, r8\n\t"
  17167. "adds r10, r3, r10\n\t"
  17168. "adc r11, r4, r11\n\t"
  17169. "str r10, [sp, #52]\n\t"
  17170. "str r11, [sp, #56]\n\t"
  17171. /* Double */
  17172. "ldr r4, [sp, #4]\n\t"
  17173. "ldr r6, [sp, #8]\n\t"
  17174. "ldr r8, [sp, #12]\n\t"
  17175. "ldr r9, [sp, #16]\n\t"
  17176. "ldr r10, [sp, #20]\n\t"
  17177. "ldr r11, [sp, #24]\n\t"
  17178. "ldr r14, [sp, #28]\n\t"
  17179. "ldr r12, [sp, #32]\n\t"
  17180. "ldr r3, [sp, #36]\n\t"
  17181. "adds r4, r4, r4\n\t"
  17182. "adcs r6, r6, r6\n\t"
  17183. "adcs r8, r8, r8\n\t"
  17184. "adcs r9, r9, r9\n\t"
  17185. "adcs r10, r10, r10\n\t"
  17186. "adcs r11, r11, r11\n\t"
  17187. "adcs r14, r14, r14\n\t"
  17188. "adcs r12, r12, r12\n\t"
  17189. "adcs r3, r3, r3\n\t"
  17190. "str r4, [sp, #4]\n\t"
  17191. "str r6, [sp, #8]\n\t"
  17192. "str r8, [sp, #12]\n\t"
  17193. "str r9, [sp, #16]\n\t"
  17194. "str r10, [sp, #20]\n\t"
  17195. "str r11, [sp, #24]\n\t"
  17196. "str r14, [sp, #28]\n\t"
  17197. "str r12, [sp, #32]\n\t"
  17198. "str r3, [sp, #36]\n\t"
  17199. "ldr r4, [sp, #40]\n\t"
  17200. "ldr r6, [sp, #44]\n\t"
  17201. "ldr r8, [sp, #48]\n\t"
  17202. "ldr r9, [sp, #52]\n\t"
  17203. "ldr r10, [sp, #56]\n\t"
  17204. "adcs r4, r4, r4\n\t"
  17205. "adcs r6, r6, r6\n\t"
  17206. "adcs r8, r8, r8\n\t"
  17207. "adcs r9, r9, r9\n\t"
  17208. "adcs r10, r10, r10\n\t"
  17209. "str r4, [sp, #40]\n\t"
  17210. "str r6, [sp, #44]\n\t"
  17211. "str r8, [sp, #48]\n\t"
  17212. "str r9, [sp, #52]\n\t"
  17213. "str r10, [sp, #56]\n\t"
  17214. "adc r11, r5, #0\n\t"
  17215. "str r11, [sp, #60]\n\t"
  17216. "ldr r4, [sp, #4]\n\t"
  17217. "ldr r5, [sp, #8]\n\t"
  17218. "ldr r12, [sp, #12]\n\t"
  17219. /* A[0] * A[0] */
  17220. "ldr r6, [%[a], #0]\n\t"
  17221. "umull r9, r10, r6, r6\n\t"
  17222. /* A[1] * A[1] */
  17223. "ldr r6, [%[a], #4]\n\t"
  17224. "umull r11, r14, r6, r6\n\t"
  17225. "adds r10, r10, r4\n\t"
  17226. "adcs r11, r11, r5\n\t"
  17227. "adcs r14, r14, r12\n\t"
  17228. "str r9, [sp, #0]\n\t"
  17229. "str r10, [sp, #4]\n\t"
  17230. "str r11, [sp, #8]\n\t"
  17231. "str r14, [sp, #12]\n\t"
  17232. "ldr r3, [sp, #16]\n\t"
  17233. "ldr r4, [sp, #20]\n\t"
  17234. "ldr r5, [sp, #24]\n\t"
  17235. "ldr r12, [sp, #28]\n\t"
  17236. /* A[2] * A[2] */
  17237. "ldr r6, [%[a], #8]\n\t"
  17238. "umull r9, r10, r6, r6\n\t"
  17239. /* A[3] * A[3] */
  17240. "ldr r6, [%[a], #12]\n\t"
  17241. "umull r11, r14, r6, r6\n\t"
  17242. "adcs r9, r9, r3\n\t"
  17243. "adcs r10, r10, r4\n\t"
  17244. "adcs r11, r11, r5\n\t"
  17245. "adcs r14, r14, r12\n\t"
  17246. "str r9, [sp, #16]\n\t"
  17247. "str r10, [sp, #20]\n\t"
  17248. "str r11, [sp, #24]\n\t"
  17249. "str r14, [sp, #28]\n\t"
  17250. "ldr r3, [sp, #32]\n\t"
  17251. "ldr r4, [sp, #36]\n\t"
  17252. "ldr r5, [sp, #40]\n\t"
  17253. "ldr r12, [sp, #44]\n\t"
  17254. /* A[4] * A[4] */
  17255. "ldr r6, [%[a], #16]\n\t"
  17256. "umull r9, r10, r6, r6\n\t"
  17257. /* A[5] * A[5] */
  17258. "ldr r6, [%[a], #20]\n\t"
  17259. "umull r11, r14, r6, r6\n\t"
  17260. "adcs r9, r9, r3\n\t"
  17261. "adcs r10, r10, r4\n\t"
  17262. "adcs r11, r11, r5\n\t"
  17263. "adcs r14, r14, r12\n\t"
  17264. "str r9, [sp, #32]\n\t"
  17265. "str r10, [sp, #36]\n\t"
  17266. "str r11, [sp, #40]\n\t"
  17267. "str r14, [sp, #44]\n\t"
  17268. "ldr r3, [sp, #48]\n\t"
  17269. "ldr r4, [sp, #52]\n\t"
  17270. "ldr r5, [sp, #56]\n\t"
  17271. "ldr r12, [sp, #60]\n\t"
  17272. /* A[6] * A[6] */
  17273. "ldr r6, [%[a], #24]\n\t"
  17274. "umull r9, r10, r6, r6\n\t"
  17275. /* A[7] * A[7] */
  17276. "ldr r6, [%[a], #28]\n\t"
  17277. "umull r11, r14, r6, r6\n\t"
  17278. "adcs r9, r9, r3\n\t"
  17279. "adcs r10, r10, r4\n\t"
  17280. "adcs r11, r11, r5\n\t"
  17281. "adc r14, r14, r12\n\t"
  17282. "str r9, [sp, #48]\n\t"
  17283. "str r10, [sp, #52]\n\t"
  17284. "str r11, [sp, #56]\n\t"
  17285. "str r14, [sp, #60]\n\t"
  17286. /* Start Reduction */
  17287. "ldr r4, [sp, #0]\n\t"
  17288. "ldr r5, [sp, #4]\n\t"
  17289. "ldr r6, [sp, #8]\n\t"
  17290. "ldr r8, [sp, #12]\n\t"
  17291. "ldr r9, [sp, #16]\n\t"
  17292. "ldr r10, [sp, #20]\n\t"
  17293. "ldr r11, [sp, #24]\n\t"
  17294. "ldr r14, [sp, #28]\n\t"
  17295. /* mu = a[0]-a[7] + a[0]-a[4] << 96 + (a[0]-a[1] * 2) << 192 */
  17296. /* - a[0] << 224 */
  17297. /* + (a[0]-a[1] * 2) << (6 * 32) */
  17298. "adds r11, r11, r4\n\t"
  17299. "adc r14, r14, r5\n\t"
  17300. "adds r11, r11, r4\n\t"
  17301. "adc r14, r14, r5\n\t"
  17302. /* - a[0] << (7 * 32) */
  17303. "sub r14, r14, r4\n\t"
  17304. /* + a[0]-a[4] << (3 * 32) */
  17305. "mov %[a], r8\n\t"
  17306. "mov r12, r9\n\t"
  17307. "adds r8, r8, r4\n\t"
  17308. "adcs r9, r9, r5\n\t"
  17309. "adcs r10, r10, r6\n\t"
  17310. "adcs r11, r11, %[a]\n\t"
  17311. "adc r14, r14, r12\n\t"
  17312. "str r4, [sp, #0]\n\t"
  17313. "str r5, [sp, #4]\n\t"
  17314. "str r6, [sp, #8]\n\t"
  17315. "str r8, [sp, #12]\n\t"
  17316. "str r9, [sp, #16]\n\t"
  17317. "str r10, [sp, #20]\n\t"
  17318. /* a += mu * m */
  17319. /* += mu * ((1 << 256) - (1 << 224) + (1 << 192) + (1 << 96) - 1) */
  17320. "mov %[a], #0\n\t"
  17321. /* a[6] += t[0] + t[3] */
  17322. "ldr r3, [sp, #24]\n\t"
  17323. "adds r3, r3, r4\n\t"
  17324. "adc r12, %[a], #0\n\t"
  17325. "adds r3, r3, r8\n\t"
  17326. "adc r12, r12, #0\n\t"
  17327. "str r11, [sp, #24]\n\t"
  17328. /* a[7] += t[1] + t[4] */
  17329. "ldr r3, [sp, #28]\n\t"
  17330. "adds r3, r3, r12\n\t"
  17331. "adc r12, %[a], #0\n\t"
  17332. "adds r3, r3, r5\n\t"
  17333. "adc r12, r12, #0\n\t"
  17334. "adds r3, r3, r9\n\t"
  17335. "adc r12, r12, #0\n\t"
  17336. "str r14, [sp, #28]\n\t"
  17337. "str r3, [sp, #64]\n\t"
  17338. /* a[8] += t[0] + t[2] + t[5] */
  17339. "ldr r3, [sp, #32]\n\t"
  17340. "adds r3, r3, r12\n\t"
  17341. "adc r12, %[a], #0\n\t"
  17342. "adds r3, r3, r4\n\t"
  17343. "adc r12, r12, #0\n\t"
  17344. "adds r3, r3, r6\n\t"
  17345. "adc r12, r12, #0\n\t"
  17346. "adds r3, r3, r10\n\t"
  17347. "adc r12, r12, #0\n\t"
  17348. "str r3, [sp, #32]\n\t"
  17349. /* a[9] += t[1] + t[3] + t[6] */
  17350. /* a[10] += t[2] + t[4] + t[7] */
  17351. "ldr r3, [sp, #36]\n\t"
  17352. "ldr r4, [sp, #40]\n\t"
  17353. "adds r3, r3, r12\n\t"
  17354. "adcs r4, r4, #0\n\t"
  17355. "adc r12, %[a], #0\n\t"
  17356. "adds r3, r3, r5\n\t"
  17357. "adcs r4, r4, r6\n\t"
  17358. "adc r12, r12, #0\n\t"
  17359. "adds r3, r3, r8\n\t"
  17360. "adcs r4, r4, r9\n\t"
  17361. "adc r12, r12, #0\n\t"
  17362. "adds r3, r3, r11\n\t"
  17363. "adcs r4, r4, r14\n\t"
  17364. "adc r12, r12, #0\n\t"
  17365. "str r3, [sp, #36]\n\t"
  17366. "str r4, [sp, #40]\n\t"
  17367. /* a[11] += t[3] + t[5] */
  17368. /* a[12] += t[4] + t[6] */
  17369. /* a[13] += t[5] + t[7] */
  17370. /* a[14] += t[6] */
  17371. "ldr r3, [sp, #44]\n\t"
  17372. "ldr r4, [sp, #48]\n\t"
  17373. "ldr r5, [sp, #52]\n\t"
  17374. "ldr r6, [sp, #56]\n\t"
  17375. "adds r3, r3, r12\n\t"
  17376. "adcs r4, r4, #0\n\t"
  17377. "adcs r5, r5, #0\n\t"
  17378. "adcs r6, r6, #0\n\t"
  17379. "adc r12, %[a], #0\n\t"
  17380. "adds r3, r3, r8\n\t"
  17381. "adcs r4, r4, r9\n\t"
  17382. "adcs r5, r5, r10\n\t"
  17383. "adcs r6, r6, r11\n\t"
  17384. "adc r12, r12, #0\n\t"
  17385. "adds r3, r3, r10\n\t"
  17386. "adcs r4, r4, r11\n\t"
  17387. "adcs r5, r5, r14\n\t"
  17388. "adcs r6, r6, #0\n\t"
  17389. "adc r12, r12, #0\n\t"
  17390. "str r3, [sp, #44]\n\t"
  17391. "str r4, [sp, #48]\n\t"
  17392. "str r5, [sp, #52]\n\t"
  17393. "str r6, [sp, #56]\n\t"
  17394. /* a[15] += t[7] */
  17395. "ldr r3, [sp, #60]\n\t"
  17396. "adds r3, r3, r12\n\t"
  17397. "adc r12, %[a], #0\n\t"
  17398. "adds r3, r3, r14\n\t"
  17399. "adc r12, r12, #0\n\t"
  17400. "str r3, [sp, #60]\n\t"
  17401. "ldr r3, [sp, #64]\n\t"
  17402. "ldr r4, [sp, #32]\n\t"
  17403. "ldr r5, [sp, #36]\n\t"
  17404. "ldr r6, [sp, #40]\n\t"
  17405. "ldr r9, [sp, #0]\n\t"
  17406. "ldr r10, [sp, #4]\n\t"
  17407. "ldr r11, [sp, #8]\n\t"
  17408. "ldr r14, [sp, #12]\n\t"
  17409. "subs r3, r3, r9\n\t"
  17410. "sbcs r4, r4, r10\n\t"
  17411. "sbcs r5, r5, r11\n\t"
  17412. "sbcs r6, r6, r14\n\t"
  17413. "str r4, [sp, #32]\n\t"
  17414. "str r5, [sp, #36]\n\t"
  17415. "str r6, [sp, #40]\n\t"
  17416. "ldr r3, [sp, #44]\n\t"
  17417. "ldr r4, [sp, #48]\n\t"
  17418. "ldr r5, [sp, #52]\n\t"
  17419. "ldr r6, [sp, #56]\n\t"
  17420. "ldr r8, [sp, #60]\n\t"
  17421. "ldr r9, [sp, #16]\n\t"
  17422. "ldr r10, [sp, #20]\n\t"
  17423. "ldr r11, [sp, #24]\n\t"
  17424. "ldr r14, [sp, #28]\n\t"
  17425. "sbcs r3, r3, r9\n\t"
  17426. "sbcs r4, r4, r10\n\t"
  17427. "sbcs r5, r5, r11\n\t"
  17428. "sbcs r6, r6, r14\n\t"
  17429. "sbc r8, r8, #0\n\t"
  17430. "str r3, [sp, #44]\n\t"
  17431. "str r4, [sp, #48]\n\t"
  17432. "str r5, [sp, #52]\n\t"
  17433. "str r6, [sp, #56]\n\t"
  17434. "str r8, [sp, #60]\n\t"
  17435. /* mask m and sub from result if overflow */
  17436. "sub r12, %[a], r12\n\t"
  17437. "and %[a], r12, #1\n\t"
  17438. "ldr r3, [sp, #32]\n\t"
  17439. "ldr r4, [sp, #36]\n\t"
  17440. "ldr r5, [sp, #40]\n\t"
  17441. "ldr r6, [sp, #44]\n\t"
  17442. "ldr r8, [sp, #48]\n\t"
  17443. "ldr r9, [sp, #52]\n\t"
  17444. "ldr r10, [sp, #56]\n\t"
  17445. "ldr r11, [sp, #60]\n\t"
  17446. "subs r3, r3, r12\n\t"
  17447. "sbcs r4, r4, r12\n\t"
  17448. "sbcs r5, r5, r12\n\t"
  17449. "sbcs r6, r6, #0\n\t"
  17450. "sbcs r8, r8, #0\n\t"
  17451. "sbcs r9, r9, #0\n\t"
  17452. "sbcs r10, r10, %[a]\n\t"
  17453. "sbc r11, r11, r12\n\t"
  17454. "str r3, [%[r], #0]\n\t"
  17455. "str r4, [%[r], #4]\n\t"
  17456. "str r5, [%[r], #8]\n\t"
  17457. "str r6, [%[r], #12]\n\t"
  17458. "str r8, [%[r], #16]\n\t"
  17459. "str r9, [%[r], #20]\n\t"
  17460. "str r10, [%[r], #24]\n\t"
  17461. "str r11, [%[r], #28]\n\t"
  17462. "add sp, sp, #68\n\t"
  17463. : [a] "+r" (a)
  17464. : [r] "r" (r)
  17465. : "memory", "r9", "r10", "r11", "r14", "r3", "r4", "r5", "r6", "r8", "r12"
  17466. );
  17467. }
  17468. #if !defined(WOLFSSL_SP_SMALL) || defined(HAVE_COMP_KEY)
  17469. /* Square the Montgomery form number a number of times. (r = a ^ n mod m)
  17470. *
  17471. * r Result of squaring.
  17472. * a Number to square in Montgomery form.
  17473. * n Number of times to square.
  17474. * m Modulus (prime).
  17475. * mp Montgomery mulitplier.
  17476. */
  17477. static void sp_256_mont_sqr_n_8(sp_digit* r, const sp_digit* a, int n,
  17478. const sp_digit* m, sp_digit mp)
  17479. {
  17480. sp_256_mont_sqr_8(r, a, m, mp);
  17481. for (; n > 1; n--) {
  17482. sp_256_mont_sqr_8(r, r, m, mp);
  17483. }
  17484. }
  17485. #endif /* !WOLFSSL_SP_SMALL | HAVE_COMP_KEY */
  17486. #ifdef WOLFSSL_SP_SMALL
  17487. /* Mod-2 for the P256 curve. */
  17488. static const uint32_t p256_mod_minus_2[8] = {
  17489. 0xfffffffdU,0xffffffffU,0xffffffffU,0x00000000U,0x00000000U,0x00000000U,
  17490. 0x00000001U,0xffffffffU
  17491. };
  17492. #endif /* !WOLFSSL_SP_SMALL */
  17493. /* Invert the number, in Montgomery form, modulo the modulus (prime) of the
  17494. * P256 curve. (r = 1 / a mod m)
  17495. *
  17496. * r Inverse result.
  17497. * a Number to invert.
  17498. * td Temporary data.
  17499. */
  17500. static void sp_256_mont_inv_8(sp_digit* r, const sp_digit* a, sp_digit* td)
  17501. {
  17502. #ifdef WOLFSSL_SP_SMALL
  17503. sp_digit* t = td;
  17504. int i;
  17505. XMEMCPY(t, a, sizeof(sp_digit) * 8);
  17506. for (i=254; i>=0; i--) {
  17507. sp_256_mont_sqr_8(t, t, p256_mod, p256_mp_mod);
  17508. if (p256_mod_minus_2[i / 32] & ((sp_digit)1 << (i % 32)))
  17509. sp_256_mont_mul_8(t, t, a, p256_mod, p256_mp_mod);
  17510. }
  17511. XMEMCPY(r, t, sizeof(sp_digit) * 8);
  17512. #else
  17513. sp_digit* t1 = td;
  17514. sp_digit* t2 = td + 2 * 8;
  17515. sp_digit* t3 = td + 4 * 8;
  17516. /* 0x2 */
  17517. sp_256_mont_sqr_8(t1, a, p256_mod, p256_mp_mod);
  17518. /* 0x3 */
  17519. sp_256_mont_mul_8(t2, t1, a, p256_mod, p256_mp_mod);
  17520. /* 0xc */
  17521. sp_256_mont_sqr_n_8(t1, t2, 2, p256_mod, p256_mp_mod);
  17522. /* 0xd */
  17523. sp_256_mont_mul_8(t3, t1, a, p256_mod, p256_mp_mod);
  17524. /* 0xf */
  17525. sp_256_mont_mul_8(t2, t2, t1, p256_mod, p256_mp_mod);
  17526. /* 0xf0 */
  17527. sp_256_mont_sqr_n_8(t1, t2, 4, p256_mod, p256_mp_mod);
  17528. /* 0xfd */
  17529. sp_256_mont_mul_8(t3, t3, t1, p256_mod, p256_mp_mod);
  17530. /* 0xff */
  17531. sp_256_mont_mul_8(t2, t2, t1, p256_mod, p256_mp_mod);
  17532. /* 0xff00 */
  17533. sp_256_mont_sqr_n_8(t1, t2, 8, p256_mod, p256_mp_mod);
  17534. /* 0xfffd */
  17535. sp_256_mont_mul_8(t3, t3, t1, p256_mod, p256_mp_mod);
  17536. /* 0xffff */
  17537. sp_256_mont_mul_8(t2, t2, t1, p256_mod, p256_mp_mod);
  17538. /* 0xffff0000 */
  17539. sp_256_mont_sqr_n_8(t1, t2, 16, p256_mod, p256_mp_mod);
  17540. /* 0xfffffffd */
  17541. sp_256_mont_mul_8(t3, t3, t1, p256_mod, p256_mp_mod);
  17542. /* 0xffffffff */
  17543. sp_256_mont_mul_8(t2, t2, t1, p256_mod, p256_mp_mod);
  17544. /* 0xffffffff00000000 */
  17545. sp_256_mont_sqr_n_8(t1, t2, 32, p256_mod, p256_mp_mod);
  17546. /* 0xffffffffffffffff */
  17547. sp_256_mont_mul_8(t2, t2, t1, p256_mod, p256_mp_mod);
  17548. /* 0xffffffff00000001 */
  17549. sp_256_mont_mul_8(r, t1, a, p256_mod, p256_mp_mod);
  17550. /* 0xffffffff000000010000000000000000000000000000000000000000 */
  17551. sp_256_mont_sqr_n_8(r, r, 160, p256_mod, p256_mp_mod);
  17552. /* 0xffffffff00000001000000000000000000000000ffffffffffffffff */
  17553. sp_256_mont_mul_8(r, r, t2, p256_mod, p256_mp_mod);
  17554. /* 0xffffffff00000001000000000000000000000000ffffffffffffffff00000000 */
  17555. sp_256_mont_sqr_n_8(r, r, 32, p256_mod, p256_mp_mod);
  17556. /* 0xffffffff00000001000000000000000000000000fffffffffffffffffffffffd */
  17557. sp_256_mont_mul_8(r, r, t3, p256_mod, p256_mp_mod);
  17558. #endif /* WOLFSSL_SP_SMALL */
  17559. }
  17560. /* Compare a with b in constant time.
  17561. *
  17562. * a A single precision integer.
  17563. * b A single precision integer.
  17564. * return -ve, 0 or +ve if a is less than, equal to or greater than b
  17565. * respectively.
  17566. */
  17567. SP_NOINLINE static sp_int32 sp_256_cmp_8(const sp_digit* a, const sp_digit* b)
  17568. {
  17569. sp_digit r = 0;
  17570. __asm__ __volatile__ (
  17571. "mov r3, #0\n\t"
  17572. "mvn r3, r3\n\t"
  17573. "mov r6, #28\n\t"
  17574. "\n1:\n\t"
  17575. "ldr r8, [%[a], r6]\n\t"
  17576. "ldr r5, [%[b], r6]\n\t"
  17577. "and r8, r8, r3\n\t"
  17578. "and r5, r5, r3\n\t"
  17579. "mov r4, r8\n\t"
  17580. "subs r8, r8, r5\n\t"
  17581. "sbc r8, r8, r8\n\t"
  17582. "add %[r], %[r], r8\n\t"
  17583. "mvn r8, r8\n\t"
  17584. "and r3, r3, r8\n\t"
  17585. "subs r5, r5, r4\n\t"
  17586. "sbc r8, r8, r8\n\t"
  17587. "sub %[r], %[r], r8\n\t"
  17588. "mvn r8, r8\n\t"
  17589. "and r3, r3, r8\n\t"
  17590. "sub r6, r6, #4\n\t"
  17591. "cmp r6, #0\n\t"
  17592. #ifdef __GNUC__
  17593. "bge 1b\n\t"
  17594. #else
  17595. "bge.n 1b\n\t"
  17596. #endif /* __GNUC__ */
  17597. : [r] "+r" (r)
  17598. : [a] "r" (a), [b] "r" (b)
  17599. : "r3", "r4", "r5", "r6", "r8"
  17600. );
  17601. return r;
  17602. }
  17603. /* Normalize the values in each word to 32 bits.
  17604. * This macro expands to nothing, so every use of it is a no-op.
  17605. * a Array of sp_digit to normalize (not evaluated).
  17606. */
  17607. #define sp_256_norm_8(a)
  17608. /* Conditionally subtract b from a using the mask m.
  17609. * m is -1 to subtract and 0 when not copying.
  17610. *
  17611. * r A single precision number representing condition subtract result.
  17612. * a A single precision number to subtract from.
  17613. * b A single precision number to subtract.
  17614. * m Mask value to apply.
  17615. */
  17616. SP_NOINLINE static sp_digit sp_256_cond_sub_8(sp_digit* r, const sp_digit* a,
  17617. const sp_digit* b, sp_digit m)
  17618. {
  17619. sp_digit c = 0;
  17620. __asm__ __volatile__ (
  17621. "mov r5, #32\n\t"
  17622. "mov r9, r5\n\t"
  17623. "mov r8, #0\n\t"
  17624. "\n1:\n\t"
  17625. "ldr r6, [%[b], r8]\n\t"
  17626. "and r6, r6, %[m]\n\t"
  17627. "mov r5, #0\n\t"
  17628. "subs r5, r5, %[c]\n\t"
  17629. "ldr r5, [%[a], r8]\n\t"
  17630. "sbcs r5, r5, r6\n\t"
  17631. "sbcs %[c], %[c], %[c]\n\t"
  17632. "str r5, [%[r], r8]\n\t"
  17633. "add r8, r8, #4\n\t"
  17634. "cmp r8, r9\n\t"
  17635. #ifdef __GNUC__
  17636. "blt 1b\n\t"
  17637. #else
  17638. "blt.n 1b\n\t"
  17639. #endif /* __GNUC__ */
  17640. : [c] "+r" (c)
  17641. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  17642. : "memory", "r5", "r6", "r8", "r9"
  17643. );
  17644. return c;
  17645. }
  17646. /* Reduce the number back to 256 bits using Montgomery reduction.
  17647. *
  17648. * a A single precision number to reduce in place.
  17649. * m The single precision number representing the modulus.
  17650. * mp The digit representing the negative inverse of m mod 2^n.
  17651. */
  17652. SP_NOINLINE static void sp_256_mont_reduce_8(sp_digit* a, const sp_digit* m,
  17653. sp_digit mp)
  17654. {
  17655. (void)mp;
  17656. (void)m;
  17657. __asm__ __volatile__ (
  17658. "mov r2, #0\n\t"
  17659. "mov r1, #0\n\t"
  17660. /* i = 0 */
  17661. "mov r9, r2\n\t"
  17662. "\n1:\n\t"
  17663. "mov r4, #0\n\t"
  17664. /* mu = a[i] * 1 (mp) = a[i] */
  17665. "ldr r3, [%[a]]\n\t"
  17666. /* a[i] += -1 * mu = -1 * a[i] => a[i] = 0 no carry */
  17667. /* a[i+1] += -1 * mu */
  17668. "ldr r6, [%[a], #4]\n\t"
  17669. "mov r5, #0\n\t"
  17670. "adds r4, r4, r6\n\t"
  17671. "adc r5, r5, r2\n\t"
  17672. "str r4, [%[a], #4]\n\t"
  17673. /* a[i+2] += -1 * mu */
  17674. "ldr r6, [%[a], #8]\n\t"
  17675. "mov r4, #0\n\t"
  17676. "adds r5, r5, r6\n\t"
  17677. "adc r4, r4, r2\n\t"
  17678. "str r5, [%[a], #8]\n\t"
  17679. /* a[i+3] += 0 * mu */
  17680. "ldr r6, [%[a], #12]\n\t"
  17681. "mov r5, #0\n\t"
  17682. "adds r4, r4, r3\n\t"
  17683. "adc r5, r5, r2\n\t"
  17684. "adds r4, r4, r6\n\t"
  17685. "adc r5, r5, r2\n\t"
  17686. "str r4, [%[a], #12]\n\t"
  17687. /* a[i+4] += 0 * mu */
  17688. "ldr r6, [%[a], #16]\n\t"
  17689. "mov r4, #0\n\t"
  17690. "adds r5, r5, r6\n\t"
  17691. "adc r4, r4, r2\n\t"
  17692. "str r5, [%[a], #16]\n\t"
  17693. /* a[i+5] += 0 * mu */
  17694. "ldr r6, [%[a], #20]\n\t"
  17695. "mov r5, #0\n\t"
  17696. "adds r4, r4, r6\n\t"
  17697. "adc r5, r5, r2\n\t"
  17698. "str r4, [%[a], #20]\n\t"
  17699. /* a[i+6] += 1 * mu */
  17700. "ldr r6, [%[a], #24]\n\t"
  17701. "mov r4, #0\n\t"
  17702. "adds r5, r5, r3\n\t"
  17703. "adc r4, r4, r2\n\t"
  17704. "adds r5, r5, r6\n\t"
  17705. "adc r4, r4, r2\n\t"
  17706. "str r5, [%[a], #24]\n\t"
  17707. /* a[i+7] += -1 * mu */
  17708. "ldr r6, [%[a], #28]\n\t"
  17709. "ldr r8, [%[a], #32]\n\t"
  17710. "adds r5, r1, r3\n\t"
  17711. "mov r1, #0\n\t"
  17712. "adc r1, r1, r2\n\t"
  17713. "subs r4, r4, r3\n\t"
  17714. "sbcs r5, r5, r2\n\t"
  17715. "sbc r1, r1, r2\n\t"
  17716. "adds r4, r4, r6\n\t"
  17717. "adcs r5, r5, r8\n\t"
  17718. "adc r1, r1, r2\n\t"
  17719. "str r4, [%[a], #28]\n\t"
  17720. "str r5, [%[a], #32]\n\t"
  17721. /* i += 1 */
  17722. "add r9, r9, #1\n\t"
  17723. "add %[a], %[a], #4\n\t"
  17724. "mov r6, #8\n\t"
  17725. "cmp r9, r6\n\t"
  17726. #ifdef __GNUC__
  17727. "blt 1b\n\t"
  17728. #else
  17729. "blt.n 1b\n\t"
  17730. #endif /* __GNUC__ */
  17731. "sub %[a], %[a], #32\n\t"
  17732. "mov r3, r1\n\t"
  17733. "sub r1, r1, #1\n\t"
  17734. "mvn r1, r1\n\t"
  17735. "ldr r4, [%[a],#32]\n\t"
  17736. "ldr r5, [%[a],#36]\n\t"
  17737. "ldr r6, [%[a],#40]\n\t"
  17738. "ldr r8, [%[a],#44]\n\t"
  17739. "ldr r9, [%[a],#48]\n\t"
  17740. "ldr r10, [%[a],#52]\n\t"
  17741. "ldr r11, [%[a],#56]\n\t"
  17742. "ldr r14, [%[a],#60]\n\t"
  17743. "subs r4, r4, r1\n\t"
  17744. "sbcs r5, r5, r1\n\t"
  17745. "sbcs r6, r6, r1\n\t"
  17746. "sbcs r8, r8, r2\n\t"
  17747. "sbcs r9, r9, r2\n\t"
  17748. "sbcs r10, r10, r2\n\t"
  17749. "sbcs r11, r11, r3\n\t"
  17750. "sbc r14, r14, r1\n\t"
  17751. "str r4, [%[a],#0]\n\t"
  17752. "str r5, [%[a],#4]\n\t"
  17753. "str r6, [%[a],#8]\n\t"
  17754. "str r8, [%[a],#12]\n\t"
  17755. "str r9, [%[a],#16]\n\t"
  17756. "str r10, [%[a],#20]\n\t"
  17757. "str r11, [%[a],#24]\n\t"
  17758. "str r14, [%[a],#28]\n\t"
  17759. : [a] "+r" (a)
  17760. :
  17761. : "memory", "r1", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r14"
  17762. );
  17763. (void)m;
  17764. (void)mp;
  17765. }
  17766. /* Reduce the number back to 256 bits using Montgomery reduction.
  17767. *
  17768. * a A single precision number to reduce in place.
  17769. * m The single precision number representing the modulus.
  17770. * mp The digit representing the negative inverse of m mod 2^n.
  17771. */
  17772. SP_NOINLINE static void sp_256_mont_reduce_order_8(sp_digit* a, const sp_digit* m,
  17773. sp_digit mp)
  17774. {
  17775. sp_digit ca = 0;
  17776. __asm__ __volatile__ (
  17777. "mov r9, %[mp]\n\t"
  17778. "mov r12, %[m]\n\t"
  17779. "mov r10, %[a]\n\t"
  17780. "mov r4, #0\n\t"
  17781. "add r11, r10, #32\n\t"
  17782. "\n1:\n\t"
  17783. /* mu = a[i] * mp */
  17784. "mov %[mp], r9\n\t"
  17785. "ldr %[a], [r10]\n\t"
  17786. "mul %[mp], %[mp], %[a]\n\t"
  17787. "mov %[m], r12\n\t"
  17788. "add r14, r10, #24\n\t"
  17789. "\n2:\n\t"
  17790. /* a[i+j] += m[j] * mu */
  17791. "ldr %[a], [r10]\n\t"
  17792. "mov r5, #0\n\t"
  17793. /* Multiply m[j] and mu - Start */
  17794. "ldr r8, [%[m]], #4\n\t"
  17795. "umull r6, r8, %[mp], r8\n\t"
  17796. "adds %[a], %[a], r6\n\t"
  17797. "adc r5, r5, r8\n\t"
  17798. /* Multiply m[j] and mu - Done */
  17799. "adds r4, r4, %[a]\n\t"
  17800. "adc r5, r5, #0\n\t"
  17801. "str r4, [r10], #4\n\t"
  17802. /* a[i+j+1] += m[j+1] * mu */
  17803. "ldr %[a], [r10]\n\t"
  17804. "mov r4, #0\n\t"
  17805. /* Multiply m[j] and mu - Start */
  17806. "ldr r8, [%[m]], #4\n\t"
  17807. "umull r6, r8, %[mp], r8\n\t"
  17808. "adds %[a], %[a], r6\n\t"
  17809. "adc r4, r4, r8\n\t"
  17810. /* Multiply m[j] and mu - Done */
  17811. "adds r5, r5, %[a]\n\t"
  17812. "adc r4, r4, #0\n\t"
  17813. "str r5, [r10], #4\n\t"
  17814. "cmp r10, r14\n\t"
  17815. #ifdef __GNUC__
  17816. "blt 2b\n\t"
  17817. #else
  17818. "blt.n 2b\n\t"
  17819. #endif /* __GNUC__ */
  17820. /* a[i+6] += m[6] * mu */
  17821. "ldr %[a], [r10]\n\t"
  17822. "mov r5, #0\n\t"
  17823. /* Multiply m[j] and mu - Start */
  17824. "ldr r8, [%[m]], #4\n\t"
  17825. "umull r6, r8, %[mp], r8\n\t"
  17826. "adds %[a], %[a], r6\n\t"
  17827. "adc r5, r5, r8\n\t"
  17828. /* Multiply m[j] and mu - Done */
  17829. "adds r4, r4, %[a]\n\t"
  17830. "adc r5, r5, #0\n\t"
  17831. "str r4, [r10], #4\n\t"
  17832. /* a[i+7] += m[7] * mu */
  17833. "mov r4, %[ca]\n\t"
  17834. "mov %[ca], #0\n\t"
  17835. /* Multiply m[7] and mu - Start */
  17836. "ldr r8, [%[m]]\n\t"
  17837. "umull r6, r8, %[mp], r8\n\t"
  17838. "adds r5, r5, r6\n\t"
  17839. "adcs r4, r4, r8\n\t"
  17840. "adc %[ca], %[ca], #0\n\t"
  17841. /* Multiply m[7] and mu - Done */
  17842. "ldr r6, [r10]\n\t"
  17843. "ldr r8, [r10, #4]\n\t"
  17844. "adds r6, r6, r5\n\t"
  17845. "adcs r8, r8, r4\n\t"
  17846. "adc %[ca], %[ca], #0\n\t"
  17847. "str r6, [r10]\n\t"
  17848. "str r8, [r10, #4]\n\t"
  17849. /* Next word in a */
  17850. "sub r10, r10, #24\n\t"
  17851. "cmp r10, r11\n\t"
  17852. #ifdef __GNUC__
  17853. "blt 1b\n\t"
  17854. #else
  17855. "blt.n 1b\n\t"
  17856. #endif /* __GNUC__ */
  17857. "mov %[a], r10\n\t"
  17858. "mov %[m], r12\n\t"
  17859. : [ca] "+r" (ca), [a] "+r" (a)
  17860. : [m] "r" (m), [mp] "r" (mp)
  17861. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  17862. );
  17863. sp_256_cond_sub_8(a - 8, a, m, (sp_digit)0 - ca);
  17864. }
  17865. /* Map the Montgomery form projective coordinate point to an affine point.
  17866. *
  17867. * r Resulting affine coordinate point.
  17868. * p Montgomery form projective coordinate point.
  17869. * t Temporary ordinate data.
  17870. */
  17871. static void sp_256_map_8(sp_point_256* r, const sp_point_256* p,
  17872. sp_digit* t)
  17873. {
  17874. sp_digit* t1 = t;
  17875. sp_digit* t2 = t + 2*8;
  17876. sp_int32 n;
  17877. sp_256_mont_inv_8(t1, p->z, t + 2*8);
  17878. sp_256_mont_sqr_8(t2, t1, p256_mod, p256_mp_mod);
  17879. sp_256_mont_mul_8(t1, t2, t1, p256_mod, p256_mp_mod);
  17880. /* x /= z^2 */
  17881. sp_256_mont_mul_8(r->x, p->x, t2, p256_mod, p256_mp_mod);
  17882. XMEMSET(r->x + 8, 0, sizeof(r->x) / 2U);
  17883. sp_256_mont_reduce_8(r->x, p256_mod, p256_mp_mod);
  17884. /* Reduce x to less than modulus */
  17885. n = sp_256_cmp_8(r->x, p256_mod);
  17886. sp_256_cond_sub_8(r->x, r->x, p256_mod, ~(n >> 31));
  17887. sp_256_norm_8(r->x);
  17888. /* y /= z^3 */
  17889. sp_256_mont_mul_8(r->y, p->y, t1, p256_mod, p256_mp_mod);
  17890. XMEMSET(r->y + 8, 0, sizeof(r->y) / 2U);
  17891. sp_256_mont_reduce_8(r->y, p256_mod, p256_mp_mod);
  17892. /* Reduce y to less than modulus */
  17893. n = sp_256_cmp_8(r->y, p256_mod);
  17894. sp_256_cond_sub_8(r->y, r->y, p256_mod, ~(n >> 31));
  17895. sp_256_norm_8(r->y);
  17896. XMEMSET(r->z, 0, sizeof(r->z) / 2);
  17897. r->z[0] = 1;
  17898. }
  17899. /* Add two Montgomery form numbers (r = a + b % m).
  17900. *
  17901. * r Result of addition.
  17902. * a First number to add in Montgomery form.
  17903. * b Second number to add in Montgomery form.
  17904. * m Modulus (prime).
  17905. */
  17906. SP_NOINLINE static void sp_256_mont_add_8(sp_digit* r, const sp_digit* a, const sp_digit* b,
  17907. const sp_digit* m)
  17908. {
  17909. (void)m;
  17910. __asm__ __volatile__ (
  17911. "mov r12, #0\n\t"
  17912. "ldr r4, [%[a],#0]\n\t"
  17913. "ldr r5, [%[a],#4]\n\t"
  17914. "ldr r6, [%[a],#8]\n\t"
  17915. "ldr r8, [%[a],#12]\n\t"
  17916. "ldr r9, [%[b],#0]\n\t"
  17917. "ldr r10, [%[b],#4]\n\t"
  17918. "ldr r11, [%[b],#8]\n\t"
  17919. "ldr r14, [%[b],#12]\n\t"
  17920. "adds r4, r4, r9\n\t"
  17921. "adcs r5, r5, r10\n\t"
  17922. "adcs r6, r6, r11\n\t"
  17923. "adcs r8, r8, r14\n\t"
  17924. "str r4, [%[r],#0]\n\t"
  17925. "str r5, [%[r],#4]\n\t"
  17926. "str r6, [%[r],#8]\n\t"
  17927. "str r8, [%[r],#12]\n\t"
  17928. "ldr r4, [%[a],#16]\n\t"
  17929. "ldr r5, [%[a],#20]\n\t"
  17930. "ldr r6, [%[a],#24]\n\t"
  17931. "ldr r8, [%[a],#28]\n\t"
  17932. "ldr r9, [%[b],#16]\n\t"
  17933. "ldr r10, [%[b],#20]\n\t"
  17934. "ldr r11, [%[b],#24]\n\t"
  17935. "ldr r14, [%[b],#28]\n\t"
  17936. "adcs r4, r4, r9\n\t"
  17937. "adcs r5, r5, r10\n\t"
  17938. "adcs r6, r6, r11\n\t"
  17939. "adcs r8, r8, r14\n\t"
  17940. "adc r3, r12, #0\n\t"
  17941. "sub r3, r12, r3\n\t"
  17942. "and r12, r3, #1\n\t"
  17943. "ldr r9, [%[r],#0]\n\t"
  17944. "ldr r10, [%[r],#4]\n\t"
  17945. "ldr r11, [%[r],#8]\n\t"
  17946. "ldr r14, [%[r],#12]\n\t"
  17947. "subs r9, r9, r3\n\t"
  17948. "sbcs r10, r10, r3\n\t"
  17949. "sbcs r11, r11, r3\n\t"
  17950. "sbcs r14, r14, #0\n\t"
  17951. "sbcs r4, r4, #0\n\t"
  17952. "sbcs r5, r5, #0\n\t"
  17953. "sbcs r6, r6, r12\n\t"
  17954. "sbc r8, r8, r3\n\t"
  17955. "str r9, [%[r],#0]\n\t"
  17956. "str r10, [%[r],#4]\n\t"
  17957. "str r11, [%[r],#8]\n\t"
  17958. "str r14, [%[r],#12]\n\t"
  17959. "str r4, [%[r],#16]\n\t"
  17960. "str r5, [%[r],#20]\n\t"
  17961. "str r6, [%[r],#24]\n\t"
  17962. "str r8, [%[r],#28]\n\t"
  17963. :
  17964. : [r] "r" (r), [a] "r" (a), [b] "r" (b)
  17965. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r14", "r3", "r12"
  17966. );
  17967. }
  17968. /* Double a Montgomery form number (r = a + a % m).
  17969. *
  17970. * r Result of doubling.
  17971. * a Number to double in Montgomery form.
  17972. * m Modulus (prime).
  17973. */
  17974. SP_NOINLINE static void sp_256_mont_dbl_8(sp_digit* r, const sp_digit* a, const sp_digit* m)
  17975. {
  17976. (void)m;
  17977. __asm__ __volatile__ (
  17978. "mov r12, #0\n\t"
  17979. "ldr r4, [%[a],#0]\n\t"
  17980. "ldr r5, [%[a],#4]\n\t"
  17981. "ldr r6, [%[a],#8]\n\t"
  17982. "ldr r8, [%[a],#12]\n\t"
  17983. "ldr r9, [%[a],#16]\n\t"
  17984. "ldr r10, [%[a],#20]\n\t"
  17985. "ldr r11, [%[a],#24]\n\t"
  17986. "ldr r14, [%[a],#28]\n\t"
  17987. "adds r4, r4, r4\n\t"
  17988. "adcs r5, r5, r5\n\t"
  17989. "adcs r6, r6, r6\n\t"
  17990. "adcs r8, r8, r8\n\t"
  17991. "adcs r9, r9, r9\n\t"
  17992. "adcs r10, r10, r10\n\t"
  17993. "adcs r11, r11, r11\n\t"
  17994. "adcs r14, r14, r14\n\t"
  17995. "adc r3, r12, #0\n\t"
  17996. "sub r3, r12, r3\n\t"
  17997. "and r12, r3, #1\n\t"
  17998. "subs r4, r4, r3\n\t"
  17999. "sbcs r5, r5, r3\n\t"
  18000. "sbcs r6, r6, r3\n\t"
  18001. "sbcs r8, r8, #0\n\t"
  18002. "sbcs r9, r9, #0\n\t"
  18003. "sbcs r10, r10, #0\n\t"
  18004. "sbcs r11, r11, r12\n\t"
  18005. "sbc r14, r14, r3\n\t"
  18006. "str r4, [%[r],#0]\n\t"
  18007. "str r5, [%[r],#4]\n\t"
  18008. "str r6, [%[r],#8]\n\t"
  18009. "str r8, [%[r],#12]\n\t"
  18010. "str r9, [%[r],#16]\n\t"
  18011. "str r10, [%[r],#20]\n\t"
  18012. "str r11, [%[r],#24]\n\t"
  18013. "str r14, [%[r],#28]\n\t"
  18014. :
  18015. : [r] "r" (r), [a] "r" (a)
  18016. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r14", "r3", "r12"
  18017. );
  18018. }
  18019. /* Triple a Montgomery form number (r = a + a + a % m).
  18020. *
  18021. * r Result of Tripling.
  18022. * a Number to triple in Montgomery form.
  18023. * m Modulus (prime).
  18024. */
  18025. SP_NOINLINE static void sp_256_mont_tpl_8(sp_digit* r, const sp_digit* a, const sp_digit* m)
  18026. {
  18027. (void)m;
  18028. __asm__ __volatile__ (
  18029. "ldr r2, [%[a],#0]\n\t"
  18030. "ldr r3, [%[a],#4]\n\t"
  18031. "ldr r4, [%[a],#8]\n\t"
  18032. "ldr r5, [%[a],#12]\n\t"
  18033. "ldr r6, [%[a],#16]\n\t"
  18034. "ldr r8, [%[a],#20]\n\t"
  18035. "ldr r9, [%[a],#24]\n\t"
  18036. "ldr r10, [%[a],#28]\n\t"
  18037. "adds r2, r2, r2\n\t"
  18038. "adcs r3, r3, r3\n\t"
  18039. "adcs r4, r4, r4\n\t"
  18040. "adcs r5, r5, r5\n\t"
  18041. "adcs r6, r6, r6\n\t"
  18042. "adcs r8, r8, r8\n\t"
  18043. "adcs r9, r9, r9\n\t"
  18044. "adcs r10, r10, r10\n\t"
  18045. "mov r11, #0\n\t"
  18046. "mov r14, #0\n\t"
  18047. "adc r11, r11, r11\n\t"
  18048. "mov r12, r11\n\t"
  18049. "sub r11, r11, #1\n\t"
  18050. "mvn r11, r11\n\t"
  18051. "subs r2, r2, r11\n\t"
  18052. "sbcs r3, r3, r11\n\t"
  18053. "sbcs r4, r4, r11\n\t"
  18054. "sbcs r5, r5, r14\n\t"
  18055. "sbcs r6, r6, r14\n\t"
  18056. "sbcs r8, r8, r14\n\t"
  18057. "sbcs r9, r9, r12\n\t"
  18058. "sbc r10, r10, r11\n\t"
  18059. "ldr r12, [%[a],#0]\n\t"
  18060. "ldr r14, [%[a],#4]\n\t"
  18061. "adds r2, r2, r12\n\t"
  18062. "adcs r3, r3, r14\n\t"
  18063. "ldr r12, [%[a],#8]\n\t"
  18064. "ldr r14, [%[a],#12]\n\t"
  18065. "adcs r4, r4, r12\n\t"
  18066. "adcs r5, r5, r14\n\t"
  18067. "ldr r12, [%[a],#16]\n\t"
  18068. "ldr r14, [%[a],#20]\n\t"
  18069. "adcs r6, r6, r12\n\t"
  18070. "adcs r8, r8, r14\n\t"
  18071. "ldr r12, [%[a],#24]\n\t"
  18072. "ldr r14, [%[a],#28]\n\t"
  18073. "adcs r9, r9, r12\n\t"
  18074. "adcs r10, r10, r14\n\t"
  18075. "mov r11, #0\n\t"
  18076. "mov r14, #0\n\t"
  18077. "adc r11, r11, r11\n\t"
  18078. "mov r12, r11\n\t"
  18079. "sub r11, r11, #1\n\t"
  18080. "mvn r11, r11\n\t"
  18081. "subs r2, r2, r11\n\t"
  18082. "str r2, [%[r],#0]\n\t"
  18083. "sbcs r3, r3, r11\n\t"
  18084. "str r3, [%[r],#4]\n\t"
  18085. "sbcs r4, r4, r11\n\t"
  18086. "str r4, [%[r],#8]\n\t"
  18087. "sbcs r5, r5, r14\n\t"
  18088. "str r5, [%[r],#12]\n\t"
  18089. "sbcs r6, r6, r14\n\t"
  18090. "str r6, [%[r],#16]\n\t"
  18091. "sbcs r8, r8, r14\n\t"
  18092. "str r8, [%[r],#20]\n\t"
  18093. "sbcs r9, r9, r12\n\t"
  18094. "str r9, [%[r],#24]\n\t"
  18095. "sbc r10, r10, r11\n\t"
  18096. "str r10, [%[r],#28]\n\t"
  18097. :
  18098. : [r] "r" (r), [a] "r" (a)
  18099. : "memory", "r11", "r12", "r14", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10"
  18100. );
  18101. }
  18102. /* Subtract two Montgomery form numbers (r = a - b % m).
  18103. *
  18104. * r Result of subtration.
  18105. * a Number to subtract from in Montgomery form.
  18106. * b Number to subtract with in Montgomery form.
  18107. * m Modulus (prime).
  18108. */
  18109. SP_NOINLINE static void sp_256_mont_sub_8(sp_digit* r, const sp_digit* a, const sp_digit* b,
  18110. const sp_digit* m)
  18111. {
  18112. (void)m;
  18113. __asm__ __volatile__ (
  18114. "mov r12, #0\n\t"
  18115. "ldr r4, [%[a],#0]\n\t"
  18116. "ldr r5, [%[a],#4]\n\t"
  18117. "ldr r6, [%[a],#8]\n\t"
  18118. "ldr r8, [%[a],#12]\n\t"
  18119. "ldr r9, [%[b],#0]\n\t"
  18120. "ldr r10, [%[b],#4]\n\t"
  18121. "ldr r11, [%[b],#8]\n\t"
  18122. "ldr r14, [%[b],#12]\n\t"
  18123. "subs r4, r4, r9\n\t"
  18124. "sbcs r5, r5, r10\n\t"
  18125. "sbcs r6, r6, r11\n\t"
  18126. "sbcs r8, r8, r14\n\t"
  18127. "str r4, [%[r],#0]\n\t"
  18128. "str r5, [%[r],#4]\n\t"
  18129. "str r6, [%[r],#8]\n\t"
  18130. "str r8, [%[r],#12]\n\t"
  18131. "ldr r4, [%[a],#16]\n\t"
  18132. "ldr r5, [%[a],#20]\n\t"
  18133. "ldr r6, [%[a],#24]\n\t"
  18134. "ldr r8, [%[a],#28]\n\t"
  18135. "ldr r9, [%[b],#16]\n\t"
  18136. "ldr r10, [%[b],#20]\n\t"
  18137. "ldr r11, [%[b],#24]\n\t"
  18138. "ldr r14, [%[b],#28]\n\t"
  18139. "sbcs r4, r4, r9\n\t"
  18140. "sbcs r5, r5, r10\n\t"
  18141. "sbcs r6, r6, r11\n\t"
  18142. "sbcs r8, r8, r14\n\t"
  18143. "sbc r3, r12, #0\n\t"
  18144. "and r12, r3, #1\n\t"
  18145. "ldr r9, [%[r],#0]\n\t"
  18146. "ldr r10, [%[r],#4]\n\t"
  18147. "ldr r11, [%[r],#8]\n\t"
  18148. "ldr r14, [%[r],#12]\n\t"
  18149. "adds r9, r9, r3\n\t"
  18150. "adcs r10, r10, r3\n\t"
  18151. "adcs r11, r11, r3\n\t"
  18152. "adcs r14, r14, #0\n\t"
  18153. "adcs r4, r4, #0\n\t"
  18154. "adcs r5, r5, #0\n\t"
  18155. "adcs r6, r6, r12\n\t"
  18156. "adc r8, r8, r3\n\t"
  18157. "str r9, [%[r],#0]\n\t"
  18158. "str r10, [%[r],#4]\n\t"
  18159. "str r11, [%[r],#8]\n\t"
  18160. "str r14, [%[r],#12]\n\t"
  18161. "str r4, [%[r],#16]\n\t"
  18162. "str r5, [%[r],#20]\n\t"
  18163. "str r6, [%[r],#24]\n\t"
  18164. "str r8, [%[r],#28]\n\t"
  18165. :
  18166. : [r] "r" (r), [a] "r" (a), [b] "r" (b)
  18167. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r14", "r3", "r12"
  18168. );
  18169. }
  18170. #define sp_256_mont_sub_lower_8 sp_256_mont_sub_8
  18171. /* Divide the number by 2 mod the modulus (prime). (r = a / 2 % m)
  18172. *
  18173. * r Result of division by 2.
  18174. * a Number to divide.
  18175. * m Modulus (prime).
  18176. */
  18177. SP_NOINLINE static void sp_256_div2_8(sp_digit* r, const sp_digit* a, const sp_digit* m)
  18178. {
  18179. __asm__ __volatile__ (
  18180. "ldr r8, [%[a], #0]\n\t"
  18181. "lsl r8, r8, #31\n\t"
  18182. "lsr r8, r8, #31\n\t"
  18183. "mov r5, #0\n\t"
  18184. "sub r5, r5, r8\n\t"
  18185. "mov r8, #0\n\t"
  18186. "lsl r6, r5, #31\n\t"
  18187. "lsr r6, r6, #31\n\t"
  18188. "ldr r3, [%[a], #0]\n\t"
  18189. "ldr r4, [%[a], #4]\n\t"
  18190. "adds r3, r3, r5\n\t"
  18191. "adcs r4, r4, r5\n\t"
  18192. "str r3, [%[r], #0]\n\t"
  18193. "str r4, [%[r], #4]\n\t"
  18194. "ldr r3, [%[a], #8]\n\t"
  18195. "ldr r4, [%[a], #12]\n\t"
  18196. "adcs r3, r3, r5\n\t"
  18197. "adcs r4, r4, r8\n\t"
  18198. "str r3, [%[r], #8]\n\t"
  18199. "str r4, [%[r], #12]\n\t"
  18200. "ldr r3, [%[a], #16]\n\t"
  18201. "ldr r4, [%[a], #20]\n\t"
  18202. "adcs r3, r3, r8\n\t"
  18203. "adcs r4, r4, r8\n\t"
  18204. "str r3, [%[r], #16]\n\t"
  18205. "str r4, [%[r], #20]\n\t"
  18206. "ldr r3, [%[a], #24]\n\t"
  18207. "ldr r4, [%[a], #28]\n\t"
  18208. "adcs r3, r3, r6\n\t"
  18209. "adcs r4, r4, r5\n\t"
  18210. "adc r8, r8, r8\n\t"
  18211. "lsl r8, r8, #31\n\t"
  18212. "lsr r5, r3, #1\n\t"
  18213. "lsl r3, r3, #31\n\t"
  18214. "lsr r6, r4, #1\n\t"
  18215. "lsl r4, r4, #31\n\t"
  18216. "orr r5, r5, r4\n\t"
  18217. "orr r6, r6, r8\n\t"
  18218. "mov r8, r3\n\t"
  18219. "str r5, [%[r], #24]\n\t"
  18220. "str r6, [%[r], #28]\n\t"
  18221. "ldr r3, [%[a], #16]\n\t"
  18222. "ldr r4, [%[a], #20]\n\t"
  18223. "lsr r5, r3, #1\n\t"
  18224. "lsl r3, r3, #31\n\t"
  18225. "lsr r6, r4, #1\n\t"
  18226. "lsl r4, r4, #31\n\t"
  18227. "orr r5, r5, r4\n\t"
  18228. "orr r6, r6, r8\n\t"
  18229. "mov r8, r3\n\t"
  18230. "str r5, [%[r], #16]\n\t"
  18231. "str r6, [%[r], #20]\n\t"
  18232. "ldr r3, [%[a], #8]\n\t"
  18233. "ldr r4, [%[a], #12]\n\t"
  18234. "lsr r5, r3, #1\n\t"
  18235. "lsl r3, r3, #31\n\t"
  18236. "lsr r6, r4, #1\n\t"
  18237. "lsl r4, r4, #31\n\t"
  18238. "orr r5, r5, r4\n\t"
  18239. "orr r6, r6, r8\n\t"
  18240. "mov r8, r3\n\t"
  18241. "str r5, [%[r], #8]\n\t"
  18242. "str r6, [%[r], #12]\n\t"
  18243. "ldr r3, [%[r], #0]\n\t"
  18244. "ldr r4, [%[r], #4]\n\t"
  18245. "lsr r5, r3, #1\n\t"
  18246. "lsr r6, r4, #1\n\t"
  18247. "lsl r4, r4, #31\n\t"
  18248. "orr r5, r5, r4\n\t"
  18249. "orr r6, r6, r8\n\t"
  18250. "str r5, [%[r], #0]\n\t"
  18251. "str r6, [%[r], #4]\n\t"
  18252. :
  18253. : [r] "r" (r), [a] "r" (a), [m] "r" (m)
  18254. : "memory", "r3", "r4", "r5", "r6", "r8"
  18255. );
  18256. }
  18257. /* Double the Montgomery form projective point p.
  18258. *
  18259. * r Result of doubling point.
  18260. * p Point to double.
  18261. * t Temporary ordinate data.
  18262. */
  18263. #ifdef WOLFSSL_SP_NONBLOCK
  18264. typedef struct sp_256_proj_point_dbl_8_ctx {
  18265. int state;
  18266. sp_digit* t1;
  18267. sp_digit* t2;
  18268. sp_digit* x;
  18269. sp_digit* y;
  18270. sp_digit* z;
  18271. } sp_256_proj_point_dbl_8_ctx;
  18272. static int sp_256_proj_point_dbl_8_nb(sp_ecc_ctx_t* sp_ctx, sp_point_256* r, const sp_point_256* p, sp_digit* t)
  18273. {
  18274. int err = FP_WOULDBLOCK;
  18275. sp_256_proj_point_dbl_8_ctx* ctx = (sp_256_proj_point_dbl_8_ctx*)sp_ctx->data;
  18276. typedef char ctx_size_test[sizeof(sp_256_proj_point_dbl_8_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  18277. (void)sizeof(ctx_size_test);
  18278. switch (ctx->state) {
  18279. case 0:
  18280. ctx->t1 = t;
  18281. ctx->t2 = t + 2*8;
  18282. ctx->x = r->x;
  18283. ctx->y = r->y;
  18284. ctx->z = r->z;
  18285. /* Put infinity into result. */
  18286. if (r != p) {
  18287. r->infinity = p->infinity;
  18288. }
  18289. ctx->state = 1;
  18290. break;
  18291. case 1:
  18292. /* T1 = Z * Z */
  18293. sp_256_mont_sqr_8(ctx->t1, p->z, p256_mod, p256_mp_mod);
  18294. ctx->state = 2;
  18295. break;
  18296. case 2:
  18297. /* Z = Y * Z */
  18298. sp_256_mont_mul_8(ctx->z, p->y, p->z, p256_mod, p256_mp_mod);
  18299. ctx->state = 3;
  18300. break;
  18301. case 3:
  18302. /* Z = 2Z */
  18303. sp_256_mont_dbl_8(ctx->z, ctx->z, p256_mod);
  18304. ctx->state = 4;
  18305. break;
  18306. case 4:
  18307. /* T2 = X - T1 */
  18308. sp_256_mont_sub_8(ctx->t2, p->x, ctx->t1, p256_mod);
  18309. ctx->state = 5;
  18310. break;
  18311. case 5:
  18312. /* T1 = X + T1 */
  18313. sp_256_mont_add_8(ctx->t1, p->x, ctx->t1, p256_mod);
  18314. ctx->state = 6;
  18315. break;
  18316. case 6:
  18317. /* T2 = T1 * T2 */
  18318. sp_256_mont_mul_8(ctx->t2, ctx->t1, ctx->t2, p256_mod, p256_mp_mod);
  18319. ctx->state = 7;
  18320. break;
  18321. case 7:
  18322. /* T1 = 3T2 */
  18323. sp_256_mont_tpl_8(ctx->t1, ctx->t2, p256_mod);
  18324. ctx->state = 8;
  18325. break;
  18326. case 8:
  18327. /* Y = 2Y */
  18328. sp_256_mont_dbl_8(ctx->y, p->y, p256_mod);
  18329. ctx->state = 9;
  18330. break;
  18331. case 9:
  18332. /* Y = Y * Y */
  18333. sp_256_mont_sqr_8(ctx->y, ctx->y, p256_mod, p256_mp_mod);
  18334. ctx->state = 10;
  18335. break;
  18336. case 10:
  18337. /* T2 = Y * Y */
  18338. sp_256_mont_sqr_8(ctx->t2, ctx->y, p256_mod, p256_mp_mod);
  18339. ctx->state = 11;
  18340. break;
  18341. case 11:
  18342. /* T2 = T2/2 */
  18343. sp_256_div2_8(ctx->t2, ctx->t2, p256_mod);
  18344. ctx->state = 12;
  18345. break;
  18346. case 12:
  18347. /* Y = Y * X */
  18348. sp_256_mont_mul_8(ctx->y, ctx->y, p->x, p256_mod, p256_mp_mod);
  18349. ctx->state = 13;
  18350. break;
  18351. case 13:
  18352. /* X = T1 * T1 */
  18353. sp_256_mont_sqr_8(ctx->x, ctx->t1, p256_mod, p256_mp_mod);
  18354. ctx->state = 14;
  18355. break;
  18356. case 14:
  18357. /* X = X - Y */
  18358. sp_256_mont_sub_8(ctx->x, ctx->x, ctx->y, p256_mod);
  18359. ctx->state = 15;
  18360. break;
  18361. case 15:
  18362. /* X = X - Y */
  18363. sp_256_mont_sub_8(ctx->x, ctx->x, ctx->y, p256_mod);
  18364. ctx->state = 16;
  18365. break;
  18366. case 16:
  18367. /* Y = Y - X */
  18368. sp_256_mont_sub_lower_8(ctx->y, ctx->y, ctx->x, p256_mod);
  18369. ctx->state = 17;
  18370. break;
  18371. case 17:
  18372. /* Y = Y * T1 */
  18373. sp_256_mont_mul_8(ctx->y, ctx->y, ctx->t1, p256_mod, p256_mp_mod);
  18374. ctx->state = 18;
  18375. break;
  18376. case 18:
  18377. /* Y = Y - T2 */
  18378. sp_256_mont_sub_8(ctx->y, ctx->y, ctx->t2, p256_mod);
  18379. ctx->state = 19;
  18380. /* fall-through */
  18381. case 19:
  18382. err = MP_OKAY;
  18383. break;
  18384. }
  18385. if (err == MP_OKAY && ctx->state != 19) {
  18386. err = FP_WOULDBLOCK;
  18387. }
  18388. return err;
  18389. }
  18390. #endif /* WOLFSSL_SP_NONBLOCK */
  18391. static void sp_256_proj_point_dbl_8(sp_point_256* r, const sp_point_256* p,
  18392. sp_digit* t)
  18393. {
  18394. sp_digit* t1 = t;
  18395. sp_digit* t2 = t + 2*8;
  18396. sp_digit* x;
  18397. sp_digit* y;
  18398. sp_digit* z;
  18399. x = r->x;
  18400. y = r->y;
  18401. z = r->z;
  18402. /* Put infinity into result. */
  18403. if (r != p) {
  18404. r->infinity = p->infinity;
  18405. }
  18406. /* T1 = Z * Z */
  18407. sp_256_mont_sqr_8(t1, p->z, p256_mod, p256_mp_mod);
  18408. /* Z = Y * Z */
  18409. sp_256_mont_mul_8(z, p->y, p->z, p256_mod, p256_mp_mod);
  18410. /* Z = 2Z */
  18411. sp_256_mont_dbl_8(z, z, p256_mod);
  18412. /* T2 = X - T1 */
  18413. sp_256_mont_sub_8(t2, p->x, t1, p256_mod);
  18414. /* T1 = X + T1 */
  18415. sp_256_mont_add_8(t1, p->x, t1, p256_mod);
  18416. /* T2 = T1 * T2 */
  18417. sp_256_mont_mul_8(t2, t1, t2, p256_mod, p256_mp_mod);
  18418. /* T1 = 3T2 */
  18419. sp_256_mont_tpl_8(t1, t2, p256_mod);
  18420. /* Y = 2Y */
  18421. sp_256_mont_dbl_8(y, p->y, p256_mod);
  18422. /* Y = Y * Y */
  18423. sp_256_mont_sqr_8(y, y, p256_mod, p256_mp_mod);
  18424. /* T2 = Y * Y */
  18425. sp_256_mont_sqr_8(t2, y, p256_mod, p256_mp_mod);
  18426. /* T2 = T2/2 */
  18427. sp_256_div2_8(t2, t2, p256_mod);
  18428. /* Y = Y * X */
  18429. sp_256_mont_mul_8(y, y, p->x, p256_mod, p256_mp_mod);
  18430. /* X = T1 * T1 */
  18431. sp_256_mont_sqr_8(x, t1, p256_mod, p256_mp_mod);
  18432. /* X = X - Y */
  18433. sp_256_mont_sub_8(x, x, y, p256_mod);
  18434. /* X = X - Y */
  18435. sp_256_mont_sub_8(x, x, y, p256_mod);
  18436. /* Y = Y - X */
  18437. sp_256_mont_sub_lower_8(y, y, x, p256_mod);
  18438. /* Y = Y * T1 */
  18439. sp_256_mont_mul_8(y, y, t1, p256_mod, p256_mp_mod);
  18440. /* Y = Y - T2 */
  18441. sp_256_mont_sub_8(y, y, t2, p256_mod);
  18442. }
  18443. /* Compare two numbers to determine if they are equal.
  18444. * Constant time implementation.
  18445. *
  18446. * a First number to compare.
  18447. * b Second number to compare.
  18448. * returns 1 when equal and 0 otherwise.
  18449. */
  18450. static int sp_256_cmp_equal_8(const sp_digit* a, const sp_digit* b)
  18451. {
  18452. return ((a[0] ^ b[0]) | (a[1] ^ b[1]) | (a[2] ^ b[2]) |
  18453. (a[3] ^ b[3]) | (a[4] ^ b[4]) | (a[5] ^ b[5]) |
  18454. (a[6] ^ b[6]) | (a[7] ^ b[7])) == 0;
  18455. }
  18456. /* Returns 1 if the number of zero.
  18457. * Implementation is constant time.
  18458. *
  18459. * a Number to check.
  18460. * returns 1 if the number is zero and 0 otherwise.
  18461. */
  18462. static int sp_256_iszero_8(const sp_digit* a)
  18463. {
  18464. return (a[0] | a[1] | a[2] | a[3] | a[4] | a[5] | a[6] | a[7]) == 0;
  18465. }
  18466. /* Add two Montgomery form projective points.
  18467. *
  18468. * r Result of addition.
  18469. * p First point to add.
  18470. * q Second point to add.
  18471. * t Temporary ordinate data.
  18472. */
  18473. #ifdef WOLFSSL_SP_NONBLOCK
  18474. typedef struct sp_256_proj_point_add_8_ctx {
  18475. int state;
  18476. sp_256_proj_point_dbl_8_ctx dbl_ctx;
  18477. const sp_point_256* ap[2];
  18478. sp_point_256* rp[2];
  18479. sp_digit* t1;
  18480. sp_digit* t2;
  18481. sp_digit* t3;
  18482. sp_digit* t4;
  18483. sp_digit* t5;
  18484. sp_digit* t6;
  18485. sp_digit* x;
  18486. sp_digit* y;
  18487. sp_digit* z;
  18488. } sp_256_proj_point_add_8_ctx;
  18489. static int sp_256_proj_point_add_8_nb(sp_ecc_ctx_t* sp_ctx, sp_point_256* r,
  18490. const sp_point_256* p, const sp_point_256* q, sp_digit* t)
  18491. {
  18492. int err = FP_WOULDBLOCK;
  18493. sp_256_proj_point_add_8_ctx* ctx = (sp_256_proj_point_add_8_ctx*)sp_ctx->data;
  18494. /* Ensure only the first point is the same as the result. */
  18495. if (q == r) {
  18496. const sp_point_256* a = p;
  18497. p = q;
  18498. q = a;
  18499. }
  18500. typedef char ctx_size_test[sizeof(sp_256_proj_point_add_8_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  18501. (void)sizeof(ctx_size_test);
  18502. switch (ctx->state) {
  18503. case 0: /* INIT */
  18504. ctx->t1 = t;
  18505. ctx->t2 = t + 2*8;
  18506. ctx->t3 = t + 4*8;
  18507. ctx->t4 = t + 6*8;
  18508. ctx->t5 = t + 8*8;
  18509. ctx->t6 = t + 10*8;
  18510. ctx->x = ctx->t6;
  18511. ctx->y = ctx->t1;
  18512. ctx->z = ctx->t2;
  18513. ctx->state = 1;
  18514. break;
  18515. case 1:
  18516. /* Check double */
  18517. (void)sp_256_sub_8(ctx->t1, p256_mod, q->y);
  18518. sp_256_norm_8(ctx->t1);
  18519. if ((~p->infinity & ~q->infinity &
  18520. sp_256_cmp_equal_8(p->x, q->x) & sp_256_cmp_equal_8(p->z, q->z) &
  18521. (sp_256_cmp_equal_8(p->y, q->y) | sp_256_cmp_equal_8(p->y, ctx->t1))) != 0)
  18522. {
  18523. XMEMSET(&ctx->dbl_ctx, 0, sizeof(ctx->dbl_ctx));
  18524. ctx->state = 2;
  18525. }
  18526. else {
  18527. ctx->state = 3;
  18528. }
  18529. break;
  18530. case 2:
  18531. err = sp_256_proj_point_dbl_8_nb((sp_ecc_ctx_t*)&ctx->dbl_ctx, r, p, t);
  18532. if (err == MP_OKAY)
  18533. ctx->state = 27; /* done */
  18534. break;
  18535. case 3:
  18536. {
  18537. ctx->state = 4;
  18538. break;
  18539. }
  18540. case 4:
  18541. /* U1 = X1*Z2^2 */
  18542. sp_256_mont_sqr_8(ctx->t1, q->z, p256_mod, p256_mp_mod);
  18543. ctx->state = 5;
  18544. break;
  18545. case 5:
  18546. sp_256_mont_mul_8(ctx->t3, ctx->t1, q->z, p256_mod, p256_mp_mod);
  18547. ctx->state = 6;
  18548. break;
  18549. case 6:
  18550. sp_256_mont_mul_8(ctx->t1, ctx->t1, p->x, p256_mod, p256_mp_mod);
  18551. ctx->state = 7;
  18552. break;
  18553. case 7:
  18554. /* U2 = X2*Z1^2 */
  18555. sp_256_mont_sqr_8(ctx->t2, p->z, p256_mod, p256_mp_mod);
  18556. ctx->state = 8;
  18557. break;
  18558. case 8:
  18559. sp_256_mont_mul_8(ctx->t4, ctx->t2, p->z, p256_mod, p256_mp_mod);
  18560. ctx->state = 9;
  18561. break;
  18562. case 9:
  18563. sp_256_mont_mul_8(ctx->t2, ctx->t2, q->x, p256_mod, p256_mp_mod);
  18564. ctx->state = 10;
  18565. break;
  18566. case 10:
  18567. /* S1 = Y1*Z2^3 */
  18568. sp_256_mont_mul_8(ctx->t3, ctx->t3, p->y, p256_mod, p256_mp_mod);
  18569. ctx->state = 11;
  18570. break;
  18571. case 11:
  18572. /* S2 = Y2*Z1^3 */
  18573. sp_256_mont_mul_8(ctx->t4, ctx->t4, q->y, p256_mod, p256_mp_mod);
  18574. ctx->state = 12;
  18575. break;
  18576. case 12:
  18577. /* H = U2 - U1 */
  18578. sp_256_mont_sub_8(ctx->t2, ctx->t2, ctx->t1, p256_mod);
  18579. ctx->state = 13;
  18580. break;
  18581. case 13:
  18582. /* R = S2 - S1 */
  18583. sp_256_mont_sub_8(ctx->t4, ctx->t4, ctx->t3, p256_mod);
  18584. ctx->state = 14;
  18585. break;
  18586. case 14:
  18587. /* X3 = R^2 - H^3 - 2*U1*H^2 */
  18588. sp_256_mont_sqr_8(ctx->t5, ctx->t2, p256_mod, p256_mp_mod);
  18589. ctx->state = 15;
  18590. break;
  18591. case 15:
  18592. sp_256_mont_mul_8(ctx->y, ctx->t1, ctx->t5, p256_mod, p256_mp_mod);
  18593. ctx->state = 16;
  18594. break;
  18595. case 16:
  18596. sp_256_mont_mul_8(ctx->t5, ctx->t5, ctx->t2, p256_mod, p256_mp_mod);
  18597. ctx->state = 17;
  18598. break;
  18599. case 17:
  18600. /* Z3 = H*Z1*Z2 */
  18601. sp_256_mont_mul_8(ctx->z, p->z, ctx->t2, p256_mod, p256_mp_mod);
  18602. ctx->state = 18;
  18603. break;
  18604. case 18:
  18605. sp_256_mont_mul_8(ctx->z, ctx->z, q->z, p256_mod, p256_mp_mod);
  18606. ctx->state = 19;
  18607. break;
  18608. case 19:
  18609. sp_256_mont_sqr_8(ctx->x, ctx->t4, p256_mod, p256_mp_mod);
  18610. ctx->state = 20;
  18611. break;
  18612. case 20:
  18613. sp_256_mont_sub_8(ctx->x, ctx->x, ctx->t5, p256_mod);
  18614. ctx->state = 21;
  18615. break;
  18616. case 21:
  18617. sp_256_mont_mul_8(ctx->t5, ctx->t5, ctx->t3, p256_mod, p256_mp_mod);
  18618. ctx->state = 22;
  18619. break;
  18620. case 22:
  18621. sp_256_mont_dbl_8(ctx->t3, ctx->y, p256_mod);
  18622. ctx->state = 23;
  18623. break;
  18624. case 23:
  18625. sp_256_mont_sub_8(ctx->x, ctx->x, ctx->t3, p256_mod);
  18626. ctx->state = 24;
  18627. break;
  18628. case 24:
  18629. /* Y3 = R*(U1*H^2 - X3) - S1*H^3 */
  18630. sp_256_mont_sub_lower_8(ctx->y, ctx->y, ctx->x, p256_mod);
  18631. ctx->state = 25;
  18632. break;
  18633. case 25:
  18634. sp_256_mont_mul_8(ctx->y, ctx->y, ctx->t4, p256_mod, p256_mp_mod);
  18635. ctx->state = 26;
  18636. break;
  18637. case 26:
  18638. sp_256_mont_sub_8(ctx->y, ctx->y, ctx->t5, p256_mod);
  18639. ctx->state = 27;
  18640. /* fall-through */
  18641. case 27:
  18642. {
  18643. int i;
  18644. sp_digit maskp = 0 - (q->infinity & (!p->infinity));
  18645. sp_digit maskq = 0 - (p->infinity & (!q->infinity));
  18646. sp_digit maskt = ~(maskp | maskq);
  18647. for (i = 0; i < 8; i++) {
  18648. r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) |
  18649. (ctx->x[i] & maskt);
  18650. }
  18651. for (i = 0; i < 8; i++) {
  18652. r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) |
  18653. (ctx->y[i] & maskt);
  18654. }
  18655. for (i = 0; i < 8; i++) {
  18656. r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) |
  18657. (ctx->z[i] & maskt);
  18658. }
  18659. r->z[0] |= p->infinity & q->infinity;
  18660. r->infinity = p->infinity & q->infinity;
  18661. err = MP_OKAY;
  18662. break;
  18663. }
  18664. }
  18665. if (err == MP_OKAY && ctx->state != 27) {
  18666. err = FP_WOULDBLOCK;
  18667. }
  18668. return err;
  18669. }
  18670. #endif /* WOLFSSL_SP_NONBLOCK */
  18671. static void sp_256_proj_point_add_8(sp_point_256* r,
  18672. const sp_point_256* p, const sp_point_256* q, sp_digit* t)
  18673. {
  18674. sp_digit* t1 = t;
  18675. sp_digit* t2 = t + 2*8;
  18676. sp_digit* t3 = t + 4*8;
  18677. sp_digit* t4 = t + 6*8;
  18678. sp_digit* t5 = t + 8*8;
  18679. sp_digit* t6 = t + 10*8;
  18680. /* Check double */
  18681. (void)sp_256_sub_8(t1, p256_mod, q->y);
  18682. sp_256_norm_8(t1);
  18683. if ((~p->infinity & ~q->infinity &
  18684. sp_256_cmp_equal_8(p->x, q->x) & sp_256_cmp_equal_8(p->z, q->z) &
  18685. (sp_256_cmp_equal_8(p->y, q->y) | sp_256_cmp_equal_8(p->y, t1))) != 0) {
  18686. sp_256_proj_point_dbl_8(r, p, t);
  18687. }
  18688. else {
  18689. sp_digit maskp;
  18690. sp_digit maskq;
  18691. sp_digit maskt;
  18692. sp_digit* x = t6;
  18693. sp_digit* y = t1;
  18694. sp_digit* z = t2;
  18695. int i;
  18696. maskp = 0 - (q->infinity & (!p->infinity));
  18697. maskq = 0 - (p->infinity & (!q->infinity));
  18698. maskt = ~(maskp | maskq);
  18699. /* U1 = X1*Z2^2 */
  18700. sp_256_mont_sqr_8(t1, q->z, p256_mod, p256_mp_mod);
  18701. sp_256_mont_mul_8(t3, t1, q->z, p256_mod, p256_mp_mod);
  18702. sp_256_mont_mul_8(t1, t1, p->x, p256_mod, p256_mp_mod);
  18703. /* U2 = X2*Z1^2 */
  18704. sp_256_mont_sqr_8(t2, p->z, p256_mod, p256_mp_mod);
  18705. sp_256_mont_mul_8(t4, t2, p->z, p256_mod, p256_mp_mod);
  18706. sp_256_mont_mul_8(t2, t2, q->x, p256_mod, p256_mp_mod);
  18707. /* S1 = Y1*Z2^3 */
  18708. sp_256_mont_mul_8(t3, t3, p->y, p256_mod, p256_mp_mod);
  18709. /* S2 = Y2*Z1^3 */
  18710. sp_256_mont_mul_8(t4, t4, q->y, p256_mod, p256_mp_mod);
  18711. /* H = U2 - U1 */
  18712. sp_256_mont_sub_8(t2, t2, t1, p256_mod);
  18713. /* R = S2 - S1 */
  18714. sp_256_mont_sub_8(t4, t4, t3, p256_mod);
  18715. if (~p->infinity & ~q->infinity &
  18716. sp_256_iszero_8(t2) & sp_256_iszero_8(t4) & maskt) {
  18717. sp_256_proj_point_dbl_8(r, p, t);
  18718. }
  18719. else {
  18720. /* X3 = R^2 - H^3 - 2*U1*H^2 */
  18721. sp_256_mont_sqr_8(t5, t2, p256_mod, p256_mp_mod);
  18722. sp_256_mont_mul_8(y, t1, t5, p256_mod, p256_mp_mod);
  18723. sp_256_mont_mul_8(t5, t5, t2, p256_mod, p256_mp_mod);
  18724. /* Z3 = H*Z1*Z2 */
  18725. sp_256_mont_mul_8(z, p->z, t2, p256_mod, p256_mp_mod);
  18726. sp_256_mont_mul_8(z, z, q->z, p256_mod, p256_mp_mod);
  18727. sp_256_mont_sqr_8(x, t4, p256_mod, p256_mp_mod);
  18728. sp_256_mont_sub_8(x, x, t5, p256_mod);
  18729. sp_256_mont_mul_8(t5, t5, t3, p256_mod, p256_mp_mod);
  18730. sp_256_mont_dbl_8(t3, y, p256_mod);
  18731. sp_256_mont_sub_8(x, x, t3, p256_mod);
  18732. /* Y3 = R*(U1*H^2 - X3) - S1*H^3 */
  18733. sp_256_mont_sub_lower_8(y, y, x, p256_mod);
  18734. sp_256_mont_mul_8(y, y, t4, p256_mod, p256_mp_mod);
  18735. sp_256_mont_sub_8(y, y, t5, p256_mod);
  18736. for (i = 0; i < 8; i++) {
  18737. r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) |
  18738. (x[i] & maskt);
  18739. }
  18740. for (i = 0; i < 8; i++) {
  18741. r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) |
  18742. (y[i] & maskt);
  18743. }
  18744. for (i = 0; i < 8; i++) {
  18745. r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) |
  18746. (z[i] & maskt);
  18747. }
  18748. r->z[0] |= p->infinity & q->infinity;
  18749. r->infinity = p->infinity & q->infinity;
  18750. }
  18751. }
  18752. }
  18753. #ifndef WC_NO_CACHE_RESISTANT
  18754. /* Touch each possible point that could be being copied.
  18755. *
  18756. * r Point to copy into.
  18757. * table Table - start of the entires to access
  18758. * idx Index of entry to retrieve.
  18759. */
  18760. static void sp_256_get_point_16_8(sp_point_256* r, const sp_point_256* table,
  18761. int idx)
  18762. {
  18763. int i;
  18764. sp_digit mask;
  18765. r->x[0] = 0;
  18766. r->x[1] = 0;
  18767. r->x[2] = 0;
  18768. r->x[3] = 0;
  18769. r->x[4] = 0;
  18770. r->x[5] = 0;
  18771. r->x[6] = 0;
  18772. r->x[7] = 0;
  18773. r->y[0] = 0;
  18774. r->y[1] = 0;
  18775. r->y[2] = 0;
  18776. r->y[3] = 0;
  18777. r->y[4] = 0;
  18778. r->y[5] = 0;
  18779. r->y[6] = 0;
  18780. r->y[7] = 0;
  18781. r->z[0] = 0;
  18782. r->z[1] = 0;
  18783. r->z[2] = 0;
  18784. r->z[3] = 0;
  18785. r->z[4] = 0;
  18786. r->z[5] = 0;
  18787. r->z[6] = 0;
  18788. r->z[7] = 0;
  18789. for (i = 1; i < 16; i++) {
  18790. mask = 0 - (i == idx);
  18791. r->x[0] |= mask & table[i].x[0];
  18792. r->x[1] |= mask & table[i].x[1];
  18793. r->x[2] |= mask & table[i].x[2];
  18794. r->x[3] |= mask & table[i].x[3];
  18795. r->x[4] |= mask & table[i].x[4];
  18796. r->x[5] |= mask & table[i].x[5];
  18797. r->x[6] |= mask & table[i].x[6];
  18798. r->x[7] |= mask & table[i].x[7];
  18799. r->y[0] |= mask & table[i].y[0];
  18800. r->y[1] |= mask & table[i].y[1];
  18801. r->y[2] |= mask & table[i].y[2];
  18802. r->y[3] |= mask & table[i].y[3];
  18803. r->y[4] |= mask & table[i].y[4];
  18804. r->y[5] |= mask & table[i].y[5];
  18805. r->y[6] |= mask & table[i].y[6];
  18806. r->y[7] |= mask & table[i].y[7];
  18807. r->z[0] |= mask & table[i].z[0];
  18808. r->z[1] |= mask & table[i].z[1];
  18809. r->z[2] |= mask & table[i].z[2];
  18810. r->z[3] |= mask & table[i].z[3];
  18811. r->z[4] |= mask & table[i].z[4];
  18812. r->z[5] |= mask & table[i].z[5];
  18813. r->z[6] |= mask & table[i].z[6];
  18814. r->z[7] |= mask & table[i].z[7];
  18815. }
  18816. }
  18817. #endif /* !WC_NO_CACHE_RESISTANT */
  18818. /* Multiply the point by the scalar and return the result.
  18819. * If map is true then convert result to affine coordinates.
  18820. *
  18821. * Fast implementation that generates a pre-computation table.
  18822. * 4 bits of window (no sliding!).
  18823. * Uses add and double for calculating table.
  18824. * 256 doubles.
  18825. * 76 adds.
  18826. *
  18827. * r Resulting point.
  18828. * g Point to multiply.
  18829. * k Scalar to multiply by.
  18830. * map Indicates whether to convert result to affine.
  18831. * ct Constant time required.
  18832. * heap Heap to use for allocation.
  18833. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  18834. */
  18835. static int sp_256_ecc_mulmod_fast_8(sp_point_256* r, const sp_point_256* g, const sp_digit* k,
  18836. int map, int ct, void* heap)
  18837. {
  18838. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  18839. sp_point_256* t = NULL;
  18840. sp_digit* tmp = NULL;
  18841. #else
  18842. sp_point_256 t[16 + 1];
  18843. sp_digit tmp[2 * 8 * 6];
  18844. #endif
  18845. sp_point_256* rt = NULL;
  18846. #ifndef WC_NO_CACHE_RESISTANT
  18847. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  18848. sp_point_256* p = NULL;
  18849. #else
  18850. sp_point_256 p[1];
  18851. #endif
  18852. #endif /* !WC_NO_CACHE_RESISTANT */
  18853. sp_digit n;
  18854. int i;
  18855. int c;
  18856. int y;
  18857. int err = MP_OKAY;
  18858. /* Constant time used for cache attack resistance implementation. */
  18859. (void)ct;
  18860. (void)heap;
  18861. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  18862. t = (sp_point_256*)XMALLOC(sizeof(sp_point_256) * (16 + 1),
  18863. heap, DYNAMIC_TYPE_ECC);
  18864. if (t == NULL)
  18865. err = MEMORY_E;
  18866. #ifndef WC_NO_CACHE_RESISTANT
  18867. if (err == MP_OKAY) {
  18868. p = (sp_point_256*)XMALLOC(sizeof(sp_point_256),
  18869. heap, DYNAMIC_TYPE_ECC);
  18870. if (p == NULL)
  18871. err = MEMORY_E;
  18872. }
  18873. #endif
  18874. if (err == MP_OKAY) {
  18875. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 8 * 6, heap,
  18876. DYNAMIC_TYPE_ECC);
  18877. if (tmp == NULL)
  18878. err = MEMORY_E;
  18879. }
  18880. #endif
  18881. if (err == MP_OKAY) {
  18882. rt = t + 16;
  18883. /* t[0] = {0, 0, 1} * norm */
  18884. XMEMSET(&t[0], 0, sizeof(t[0]));
  18885. t[0].infinity = 1;
  18886. /* t[1] = {g->x, g->y, g->z} * norm */
  18887. (void)sp_256_mod_mul_norm_8(t[1].x, g->x, p256_mod);
  18888. (void)sp_256_mod_mul_norm_8(t[1].y, g->y, p256_mod);
  18889. (void)sp_256_mod_mul_norm_8(t[1].z, g->z, p256_mod);
  18890. t[1].infinity = 0;
  18891. sp_256_proj_point_dbl_8(&t[ 2], &t[ 1], tmp);
  18892. t[ 2].infinity = 0;
  18893. sp_256_proj_point_add_8(&t[ 3], &t[ 2], &t[ 1], tmp);
  18894. t[ 3].infinity = 0;
  18895. sp_256_proj_point_dbl_8(&t[ 4], &t[ 2], tmp);
  18896. t[ 4].infinity = 0;
  18897. sp_256_proj_point_add_8(&t[ 5], &t[ 3], &t[ 2], tmp);
  18898. t[ 5].infinity = 0;
  18899. sp_256_proj_point_dbl_8(&t[ 6], &t[ 3], tmp);
  18900. t[ 6].infinity = 0;
  18901. sp_256_proj_point_add_8(&t[ 7], &t[ 4], &t[ 3], tmp);
  18902. t[ 7].infinity = 0;
  18903. sp_256_proj_point_dbl_8(&t[ 8], &t[ 4], tmp);
  18904. t[ 8].infinity = 0;
  18905. sp_256_proj_point_add_8(&t[ 9], &t[ 5], &t[ 4], tmp);
  18906. t[ 9].infinity = 0;
  18907. sp_256_proj_point_dbl_8(&t[10], &t[ 5], tmp);
  18908. t[10].infinity = 0;
  18909. sp_256_proj_point_add_8(&t[11], &t[ 6], &t[ 5], tmp);
  18910. t[11].infinity = 0;
  18911. sp_256_proj_point_dbl_8(&t[12], &t[ 6], tmp);
  18912. t[12].infinity = 0;
  18913. sp_256_proj_point_add_8(&t[13], &t[ 7], &t[ 6], tmp);
  18914. t[13].infinity = 0;
  18915. sp_256_proj_point_dbl_8(&t[14], &t[ 7], tmp);
  18916. t[14].infinity = 0;
  18917. sp_256_proj_point_add_8(&t[15], &t[ 8], &t[ 7], tmp);
  18918. t[15].infinity = 0;
  18919. i = 6;
  18920. n = k[i+1] << 0;
  18921. c = 28;
  18922. y = (int)(n >> 28);
  18923. #ifndef WC_NO_CACHE_RESISTANT
  18924. if (ct) {
  18925. sp_256_get_point_16_8(rt, t, y);
  18926. rt->infinity = !y;
  18927. }
  18928. else
  18929. #endif
  18930. {
  18931. XMEMCPY(rt, &t[y], sizeof(sp_point_256));
  18932. }
  18933. n <<= 4;
  18934. for (; i>=0 || c>=4; ) {
  18935. if (c < 4) {
  18936. n |= k[i--];
  18937. c += 32;
  18938. }
  18939. y = (n >> 28) & 0xf;
  18940. n <<= 4;
  18941. c -= 4;
  18942. sp_256_proj_point_dbl_8(rt, rt, tmp);
  18943. sp_256_proj_point_dbl_8(rt, rt, tmp);
  18944. sp_256_proj_point_dbl_8(rt, rt, tmp);
  18945. sp_256_proj_point_dbl_8(rt, rt, tmp);
  18946. #ifndef WC_NO_CACHE_RESISTANT
  18947. if (ct) {
  18948. sp_256_get_point_16_8(p, t, y);
  18949. p->infinity = !y;
  18950. sp_256_proj_point_add_8(rt, rt, p, tmp);
  18951. }
  18952. else
  18953. #endif
  18954. {
  18955. sp_256_proj_point_add_8(rt, rt, &t[y], tmp);
  18956. }
  18957. }
  18958. if (map != 0) {
  18959. sp_256_map_8(r, rt, tmp);
  18960. }
  18961. else {
  18962. XMEMCPY(r, rt, sizeof(sp_point_256));
  18963. }
  18964. }
  18965. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  18966. if (tmp != NULL)
  18967. #endif
  18968. {
  18969. ForceZero(tmp, sizeof(sp_digit) * 2 * 8 * 6);
  18970. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  18971. XFREE(tmp, heap, DYNAMIC_TYPE_ECC);
  18972. #endif
  18973. }
  18974. #ifndef WC_NO_CACHE_RESISTANT
  18975. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  18976. if (p != NULL)
  18977. #endif
  18978. {
  18979. ForceZero(p, sizeof(sp_point_256));
  18980. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  18981. XFREE(p, heap, DYNAMIC_TYPE_ECC);
  18982. #endif
  18983. }
  18984. #endif /* !WC_NO_CACHE_RESISTANT */
  18985. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  18986. if (t != NULL)
  18987. #endif
  18988. {
  18989. ForceZero(t, sizeof(sp_point_256) * 17);
  18990. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  18991. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  18992. #endif
  18993. }
  18994. return err;
  18995. }
  18996. #ifdef FP_ECC
  18997. #define sp_256_mont_dbl_lower_8 sp_256_mont_dbl_8
  18998. #define sp_256_mont_tpl_lower_8 sp_256_mont_tpl_8
/* Double the Montgomery form projective point p a number of times.
 *
 * p  Point to double; its ordinates are updated in place with the result.
 * i  Number of times to double.
 * t  Temporary ordinate data.
 */
  19006. static void sp_256_proj_point_dbl_n_8(sp_point_256* p, int i,
  19007. sp_digit* t)
  19008. {
  19009. sp_digit* w = t;
  19010. sp_digit* a = t + 2*8;
  19011. sp_digit* b = t + 4*8;
  19012. sp_digit* t1 = t + 6*8;
  19013. sp_digit* t2 = t + 8*8;
  19014. sp_digit* x;
  19015. sp_digit* y;
  19016. sp_digit* z;
  19017. volatile int n = i;
  19018. x = p->x;
  19019. y = p->y;
  19020. z = p->z;
  19021. /* Y = 2*Y */
  19022. sp_256_mont_dbl_8(y, y, p256_mod);
  19023. /* W = Z^4 */
  19024. sp_256_mont_sqr_8(w, z, p256_mod, p256_mp_mod);
  19025. sp_256_mont_sqr_8(w, w, p256_mod, p256_mp_mod);
  19026. #ifndef WOLFSSL_SP_SMALL
  19027. while (--n > 0)
  19028. #else
  19029. while (--n >= 0)
  19030. #endif
  19031. {
  19032. /* A = 3*(X^2 - W) */
  19033. sp_256_mont_sqr_8(t1, x, p256_mod, p256_mp_mod);
  19034. sp_256_mont_sub_8(t1, t1, w, p256_mod);
  19035. sp_256_mont_tpl_lower_8(a, t1, p256_mod);
  19036. /* B = X*Y^2 */
  19037. sp_256_mont_sqr_8(t1, y, p256_mod, p256_mp_mod);
  19038. sp_256_mont_mul_8(b, t1, x, p256_mod, p256_mp_mod);
  19039. /* X = A^2 - 2B */
  19040. sp_256_mont_sqr_8(x, a, p256_mod, p256_mp_mod);
  19041. sp_256_mont_dbl_8(t2, b, p256_mod);
  19042. sp_256_mont_sub_8(x, x, t2, p256_mod);
  19043. /* b = 2.(B - X) */
  19044. sp_256_mont_sub_lower_8(t2, b, x, p256_mod);
  19045. sp_256_mont_dbl_lower_8(b, t2, p256_mod);
  19046. /* Z = Z*Y */
  19047. sp_256_mont_mul_8(z, z, y, p256_mod, p256_mp_mod);
  19048. /* t1 = Y^4 */
  19049. sp_256_mont_sqr_8(t1, t1, p256_mod, p256_mp_mod);
  19050. #ifdef WOLFSSL_SP_SMALL
  19051. if (n != 0)
  19052. #endif
  19053. {
  19054. /* W = W*Y^4 */
  19055. sp_256_mont_mul_8(w, w, t1, p256_mod, p256_mp_mod);
  19056. }
  19057. /* y = 2*A*(B - X) - Y^4 */
  19058. sp_256_mont_mul_8(y, b, a, p256_mod, p256_mp_mod);
  19059. sp_256_mont_sub_8(y, y, t1, p256_mod);
  19060. }
  19061. #ifndef WOLFSSL_SP_SMALL
  19062. /* A = 3*(X^2 - W) */
  19063. sp_256_mont_sqr_8(t1, x, p256_mod, p256_mp_mod);
  19064. sp_256_mont_sub_8(t1, t1, w, p256_mod);
  19065. sp_256_mont_tpl_lower_8(a, t1, p256_mod);
  19066. /* B = X*Y^2 */
  19067. sp_256_mont_sqr_8(t1, y, p256_mod, p256_mp_mod);
  19068. sp_256_mont_mul_8(b, t1, x, p256_mod, p256_mp_mod);
  19069. /* X = A^2 - 2B */
  19070. sp_256_mont_sqr_8(x, a, p256_mod, p256_mp_mod);
  19071. sp_256_mont_dbl_8(t2, b, p256_mod);
  19072. sp_256_mont_sub_8(x, x, t2, p256_mod);
  19073. /* b = 2.(B - X) */
  19074. sp_256_mont_sub_lower_8(t2, b, x, p256_mod);
  19075. sp_256_mont_dbl_lower_8(b, t2, p256_mod);
  19076. /* Z = Z*Y */
  19077. sp_256_mont_mul_8(z, z, y, p256_mod, p256_mp_mod);
  19078. /* t1 = Y^4 */
  19079. sp_256_mont_sqr_8(t1, t1, p256_mod, p256_mp_mod);
  19080. /* y = 2*A*(B - X) - Y^4 */
  19081. sp_256_mont_mul_8(y, b, a, p256_mod, p256_mp_mod);
  19082. sp_256_mont_sub_8(y, y, t1, p256_mod);
  19083. #endif
  19084. /* Y = Y/2 */
  19085. sp_256_div2_8(y, y, p256_mod);
  19086. }
  19087. /* Convert the projective point to affine.
  19088. * Ordinates are in Montgomery form.
  19089. *
  19090. * a Point to convert.
  19091. * t Temporary data.
  19092. */
  19093. static void sp_256_proj_to_affine_8(sp_point_256* a, sp_digit* t)
  19094. {
  19095. sp_digit* t1 = t;
  19096. sp_digit* t2 = t + 2 * 8;
  19097. sp_digit* tmp = t + 4 * 8;
  19098. sp_256_mont_inv_8(t1, a->z, tmp);
  19099. sp_256_mont_sqr_8(t2, t1, p256_mod, p256_mp_mod);
  19100. sp_256_mont_mul_8(t1, t2, t1, p256_mod, p256_mp_mod);
  19101. sp_256_mont_mul_8(a->x, a->x, t2, p256_mod, p256_mp_mod);
  19102. sp_256_mont_mul_8(a->y, a->y, t1, p256_mod, p256_mp_mod);
  19103. XMEMCPY(a->z, p256_norm_mod, sizeof(p256_norm_mod));
  19104. }
  19105. #endif /* FP_ECC */
  19106. /* A table entry for pre-computed points. */
  19107. typedef struct sp_table_entry_256 {
  19108. sp_digit x[8];
  19109. sp_digit y[8];
  19110. } sp_table_entry_256;
  19111. #ifdef FP_ECC
  19112. #endif /* FP_ECC */
  19113. /* Add two Montgomery form projective points. The second point has a q value of
  19114. * one.
  19115. * Only the first point can be the same pointer as the result point.
  19116. *
  19117. * r Result of addition.
  19118. * p First point to add.
  19119. * q Second point to add.
  19120. * t Temporary ordinate data.
  19121. */
  19122. static void sp_256_proj_point_add_qz1_8(sp_point_256* r, const sp_point_256* p,
  19123. const sp_point_256* q, sp_digit* t)
  19124. {
  19125. sp_digit* t1 = t;
  19126. sp_digit* t2 = t + 2*8;
  19127. sp_digit* t3 = t + 4*8;
  19128. sp_digit* t4 = t + 6*8;
  19129. sp_digit* t5 = t + 8*8;
  19130. sp_digit* t6 = t + 10*8;
  19131. /* Check double */
  19132. (void)sp_256_sub_8(t1, p256_mod, q->y);
  19133. sp_256_norm_8(t1);
  19134. if ((~p->infinity & ~q->infinity &
  19135. sp_256_cmp_equal_8(p->x, q->x) & sp_256_cmp_equal_8(p->z, q->z) &
  19136. (sp_256_cmp_equal_8(p->y, q->y) | sp_256_cmp_equal_8(p->y, t1))) != 0) {
  19137. sp_256_proj_point_dbl_8(r, p, t);
  19138. }
  19139. else {
  19140. sp_digit maskp;
  19141. sp_digit maskq;
  19142. sp_digit maskt;
  19143. sp_digit* x = t2;
  19144. sp_digit* y = t5;
  19145. sp_digit* z = t6;
  19146. int i;
  19147. /* U2 = X2*Z1^2 */
  19148. sp_256_mont_sqr_8(t2, p->z, p256_mod, p256_mp_mod);
  19149. sp_256_mont_mul_8(t4, t2, p->z, p256_mod, p256_mp_mod);
  19150. sp_256_mont_mul_8(t2, t2, q->x, p256_mod, p256_mp_mod);
  19151. /* S2 = Y2*Z1^3 */
  19152. sp_256_mont_mul_8(t4, t4, q->y, p256_mod, p256_mp_mod);
  19153. /* H = U2 - X1 */
  19154. sp_256_mont_sub_8(t2, t2, p->x, p256_mod);
  19155. /* R = S2 - Y1 */
  19156. sp_256_mont_sub_8(t4, t4, p->y, p256_mod);
  19157. /* Z3 = H*Z1 */
  19158. sp_256_mont_mul_8(z, p->z, t2, p256_mod, p256_mp_mod);
  19159. /* X3 = R^2 - H^3 - 2*X1*H^2 */
  19160. sp_256_mont_sqr_8(t1, t4, p256_mod, p256_mp_mod);
  19161. sp_256_mont_sqr_8(t5, t2, p256_mod, p256_mp_mod);
  19162. sp_256_mont_mul_8(t3, p->x, t5, p256_mod, p256_mp_mod);
  19163. sp_256_mont_mul_8(t5, t5, t2, p256_mod, p256_mp_mod);
  19164. sp_256_mont_sub_8(x, t1, t5, p256_mod);
  19165. sp_256_mont_dbl_8(t1, t3, p256_mod);
  19166. sp_256_mont_sub_8(x, x, t1, p256_mod);
  19167. /* Y3 = R*(X1*H^2 - X3) - Y1*H^3 */
  19168. sp_256_mont_sub_lower_8(t3, t3, x, p256_mod);
  19169. sp_256_mont_mul_8(t3, t3, t4, p256_mod, p256_mp_mod);
  19170. sp_256_mont_mul_8(t5, t5, p->y, p256_mod, p256_mp_mod);
  19171. sp_256_mont_sub_8(y, t3, t5, p256_mod);
  19172. maskp = 0 - (q->infinity & (!p->infinity));
  19173. maskq = 0 - (p->infinity & (!q->infinity));
  19174. maskt = ~(maskp | maskq);
  19175. for (i = 0; i < 8; i++) {
  19176. r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) | (x[i] & maskt);
  19177. }
  19178. for (i = 0; i < 8; i++) {
  19179. r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) | (y[i] & maskt);
  19180. }
  19181. for (i = 0; i < 8; i++) {
  19182. r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) | (z[i] & maskt);
  19183. }
  19184. r->z[0] |= p->infinity & q->infinity;
  19185. r->infinity = p->infinity & q->infinity;
  19186. }
  19187. }
  19188. #ifdef WOLFSSL_SP_SMALL
  19189. #ifdef FP_ECC
  19190. /* Generate the pre-computed table of points for the base point.
  19191. *
  19192. * width = 4
  19193. * 16 entries
  19194. * 64 bits between
  19195. *
  19196. * a The base point.
  19197. * table Place to store generated point data.
  19198. * tmp Temporary data.
  19199. * heap Heap to use for allocation.
  19200. */
  19201. static int sp_256_gen_stripe_table_8(const sp_point_256* a,
  19202. sp_table_entry_256* table, sp_digit* tmp, void* heap)
  19203. {
  19204. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19205. sp_point_256* t = NULL;
  19206. #else
  19207. sp_point_256 t[3];
  19208. #endif
  19209. sp_point_256* s1 = NULL;
  19210. sp_point_256* s2 = NULL;
  19211. int i;
  19212. int j;
  19213. int err = MP_OKAY;
  19214. (void)heap;
  19215. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19216. t = (sp_point_256*)XMALLOC(sizeof(sp_point_256) * 3, heap,
  19217. DYNAMIC_TYPE_ECC);
  19218. if (t == NULL)
  19219. err = MEMORY_E;
  19220. #endif
  19221. if (err == MP_OKAY) {
  19222. s1 = t + 1;
  19223. s2 = t + 2;
  19224. err = sp_256_mod_mul_norm_8(t->x, a->x, p256_mod);
  19225. }
  19226. if (err == MP_OKAY) {
  19227. err = sp_256_mod_mul_norm_8(t->y, a->y, p256_mod);
  19228. }
  19229. if (err == MP_OKAY) {
  19230. err = sp_256_mod_mul_norm_8(t->z, a->z, p256_mod);
  19231. }
  19232. if (err == MP_OKAY) {
  19233. t->infinity = 0;
  19234. sp_256_proj_to_affine_8(t, tmp);
  19235. XMEMCPY(s1->z, p256_norm_mod, sizeof(p256_norm_mod));
  19236. s1->infinity = 0;
  19237. XMEMCPY(s2->z, p256_norm_mod, sizeof(p256_norm_mod));
  19238. s2->infinity = 0;
  19239. /* table[0] = {0, 0, infinity} */
  19240. XMEMSET(&table[0], 0, sizeof(sp_table_entry_256));
  19241. /* table[1] = Affine version of 'a' in Montgomery form */
  19242. XMEMCPY(table[1].x, t->x, sizeof(table->x));
  19243. XMEMCPY(table[1].y, t->y, sizeof(table->y));
  19244. for (i=1; i<4; i++) {
  19245. sp_256_proj_point_dbl_n_8(t, 64, tmp);
  19246. sp_256_proj_to_affine_8(t, tmp);
  19247. XMEMCPY(table[1<<i].x, t->x, sizeof(table->x));
  19248. XMEMCPY(table[1<<i].y, t->y, sizeof(table->y));
  19249. }
  19250. for (i=1; i<4; i++) {
  19251. XMEMCPY(s1->x, table[1<<i].x, sizeof(table->x));
  19252. XMEMCPY(s1->y, table[1<<i].y, sizeof(table->y));
  19253. for (j=(1<<i)+1; j<(1<<(i+1)); j++) {
  19254. XMEMCPY(s2->x, table[j-(1<<i)].x, sizeof(table->x));
  19255. XMEMCPY(s2->y, table[j-(1<<i)].y, sizeof(table->y));
  19256. sp_256_proj_point_add_qz1_8(t, s1, s2, tmp);
  19257. sp_256_proj_to_affine_8(t, tmp);
  19258. XMEMCPY(table[j].x, t->x, sizeof(table->x));
  19259. XMEMCPY(table[j].y, t->y, sizeof(table->y));
  19260. }
  19261. }
  19262. }
  19263. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19264. if (t != NULL)
  19265. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  19266. #endif
  19267. return err;
  19268. }
  19269. #endif /* FP_ECC */
  19270. #ifndef WC_NO_CACHE_RESISTANT
  19271. /* Touch each possible entry that could be being copied.
  19272. *
  19273. * r Point to copy into.
  19274. * table Table - start of the entires to access
  19275. * idx Index of entry to retrieve.
  19276. */
  19277. static void sp_256_get_entry_16_8(sp_point_256* r,
  19278. const sp_table_entry_256* table, int idx)
  19279. {
  19280. int i;
  19281. sp_digit mask;
  19282. r->x[0] = 0;
  19283. r->x[1] = 0;
  19284. r->x[2] = 0;
  19285. r->x[3] = 0;
  19286. r->x[4] = 0;
  19287. r->x[5] = 0;
  19288. r->x[6] = 0;
  19289. r->x[7] = 0;
  19290. r->y[0] = 0;
  19291. r->y[1] = 0;
  19292. r->y[2] = 0;
  19293. r->y[3] = 0;
  19294. r->y[4] = 0;
  19295. r->y[5] = 0;
  19296. r->y[6] = 0;
  19297. r->y[7] = 0;
  19298. for (i = 1; i < 16; i++) {
  19299. mask = 0 - (i == idx);
  19300. r->x[0] |= mask & table[i].x[0];
  19301. r->x[1] |= mask & table[i].x[1];
  19302. r->x[2] |= mask & table[i].x[2];
  19303. r->x[3] |= mask & table[i].x[3];
  19304. r->x[4] |= mask & table[i].x[4];
  19305. r->x[5] |= mask & table[i].x[5];
  19306. r->x[6] |= mask & table[i].x[6];
  19307. r->x[7] |= mask & table[i].x[7];
  19308. r->y[0] |= mask & table[i].y[0];
  19309. r->y[1] |= mask & table[i].y[1];
  19310. r->y[2] |= mask & table[i].y[2];
  19311. r->y[3] |= mask & table[i].y[3];
  19312. r->y[4] |= mask & table[i].y[4];
  19313. r->y[5] |= mask & table[i].y[5];
  19314. r->y[6] |= mask & table[i].y[6];
  19315. r->y[7] |= mask & table[i].y[7];
  19316. }
  19317. }
  19318. #endif /* !WC_NO_CACHE_RESISTANT */
  19319. /* Multiply the point by the scalar and return the result.
  19320. * If map is true then convert result to affine coordinates.
  19321. *
  19322. * Stripe implementation.
  19323. * Pre-generated: 2^0, 2^64, ...
  19324. * Pre-generated: products of all combinations of above.
  19325. * 4 doubles and adds (with qz=1)
  19326. *
  19327. * r Resulting point.
  19328. * k Scalar to multiply by.
  19329. * table Pre-computed table.
  19330. * map Indicates whether to convert result to affine.
  19331. * ct Constant time required.
  19332. * heap Heap to use for allocation.
  19333. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  19334. */
  19335. static int sp_256_ecc_mulmod_stripe_8(sp_point_256* r, const sp_point_256* g,
  19336. const sp_table_entry_256* table, const sp_digit* k, int map,
  19337. int ct, void* heap)
  19338. {
  19339. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19340. sp_point_256* rt = NULL;
  19341. sp_digit* t = NULL;
  19342. #else
  19343. sp_point_256 rt[2];
  19344. sp_digit t[2 * 8 * 6];
  19345. #endif
  19346. sp_point_256* p = NULL;
  19347. int i;
  19348. int j;
  19349. int y;
  19350. int x;
  19351. int err = MP_OKAY;
  19352. (void)g;
  19353. /* Constant time used for cache attack resistance implementation. */
  19354. (void)ct;
  19355. (void)heap;
  19356. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19357. rt = (sp_point_256*)XMALLOC(sizeof(sp_point_256) * 2, heap,
  19358. DYNAMIC_TYPE_ECC);
  19359. if (rt == NULL)
  19360. err = MEMORY_E;
  19361. if (err == MP_OKAY) {
  19362. t = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 8 * 6, heap,
  19363. DYNAMIC_TYPE_ECC);
  19364. if (t == NULL)
  19365. err = MEMORY_E;
  19366. }
  19367. #endif
  19368. if (err == MP_OKAY) {
  19369. p = rt + 1;
  19370. XMEMCPY(p->z, p256_norm_mod, sizeof(p256_norm_mod));
  19371. XMEMCPY(rt->z, p256_norm_mod, sizeof(p256_norm_mod));
  19372. y = 0;
  19373. x = 63;
  19374. for (j=0; j<4; j++) {
  19375. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  19376. x += 64;
  19377. }
  19378. #ifndef WC_NO_CACHE_RESISTANT
  19379. if (ct) {
  19380. sp_256_get_entry_16_8(rt, table, y);
  19381. } else
  19382. #endif
  19383. {
  19384. XMEMCPY(rt->x, table[y].x, sizeof(table[y].x));
  19385. XMEMCPY(rt->y, table[y].y, sizeof(table[y].y));
  19386. }
  19387. rt->infinity = !y;
  19388. for (i=62; i>=0; i--) {
  19389. y = 0;
  19390. x = i;
  19391. for (j=0; j<4; j++) {
  19392. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  19393. x += 64;
  19394. }
  19395. sp_256_proj_point_dbl_8(rt, rt, t);
  19396. #ifndef WC_NO_CACHE_RESISTANT
  19397. if (ct) {
  19398. sp_256_get_entry_16_8(p, table, y);
  19399. }
  19400. else
  19401. #endif
  19402. {
  19403. XMEMCPY(p->x, table[y].x, sizeof(table[y].x));
  19404. XMEMCPY(p->y, table[y].y, sizeof(table[y].y));
  19405. }
  19406. p->infinity = !y;
  19407. sp_256_proj_point_add_qz1_8(rt, rt, p, t);
  19408. }
  19409. if (map != 0) {
  19410. sp_256_map_8(r, rt, t);
  19411. }
  19412. else {
  19413. XMEMCPY(r, rt, sizeof(sp_point_256));
  19414. }
  19415. }
  19416. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19417. if (t != NULL)
  19418. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  19419. if (rt != NULL)
  19420. XFREE(rt, heap, DYNAMIC_TYPE_ECC);
  19421. #endif
  19422. return err;
  19423. }
  19424. #ifdef FP_ECC
  19425. #ifndef FP_ENTRIES
  19426. #define FP_ENTRIES 16
  19427. #endif
  19428. /* Cache entry - holds precomputation tables for a point. */
  19429. typedef struct sp_cache_256_t {
  19430. /* X ordinate of point that table was generated from. */
  19431. sp_digit x[8];
  19432. /* Y ordinate of point that table was generated from. */
  19433. sp_digit y[8];
  19434. /* Precomputation table for point. */
  19435. sp_table_entry_256 table[16];
  19436. /* Count of entries in table. */
  19437. uint32_t cnt;
  19438. /* Point and table set in entry. */
  19439. int set;
  19440. } sp_cache_256_t;
  19441. /* Cache of tables. */
  19442. static THREAD_LS_T sp_cache_256_t sp_cache_256[FP_ENTRIES];
  19443. /* Index of last entry in cache. */
  19444. static THREAD_LS_T int sp_cache_256_last = -1;
  19445. /* Cache has been initialized. */
  19446. static THREAD_LS_T int sp_cache_256_inited = 0;
  19447. #ifndef HAVE_THREAD_LS
  19448. static volatile int initCacheMutex_256 = 0;
  19449. static wolfSSL_Mutex sp_cache_256_lock;
  19450. #endif
  19451. /* Get the cache entry for the point.
  19452. *
  19453. * g [in] Point scalar multipling.
  19454. * cache [out] Cache table to use.
  19455. */
  19456. static void sp_ecc_get_cache_256(const sp_point_256* g, sp_cache_256_t** cache)
  19457. {
  19458. int i;
  19459. int j;
  19460. uint32_t least;
  19461. if (sp_cache_256_inited == 0) {
  19462. for (i=0; i<FP_ENTRIES; i++) {
  19463. sp_cache_256[i].set = 0;
  19464. }
  19465. sp_cache_256_inited = 1;
  19466. }
  19467. /* Compare point with those in cache. */
  19468. for (i=0; i<FP_ENTRIES; i++) {
  19469. if (!sp_cache_256[i].set)
  19470. continue;
  19471. if (sp_256_cmp_equal_8(g->x, sp_cache_256[i].x) &
  19472. sp_256_cmp_equal_8(g->y, sp_cache_256[i].y)) {
  19473. sp_cache_256[i].cnt++;
  19474. break;
  19475. }
  19476. }
  19477. /* No match. */
  19478. if (i == FP_ENTRIES) {
  19479. /* Find empty entry. */
  19480. i = (sp_cache_256_last + 1) % FP_ENTRIES;
  19481. for (; i != sp_cache_256_last; i=(i+1)%FP_ENTRIES) {
  19482. if (!sp_cache_256[i].set) {
  19483. break;
  19484. }
  19485. }
  19486. /* Evict least used. */
  19487. if (i == sp_cache_256_last) {
  19488. least = sp_cache_256[0].cnt;
  19489. for (j=1; j<FP_ENTRIES; j++) {
  19490. if (sp_cache_256[j].cnt < least) {
  19491. i = j;
  19492. least = sp_cache_256[i].cnt;
  19493. }
  19494. }
  19495. }
  19496. XMEMCPY(sp_cache_256[i].x, g->x, sizeof(sp_cache_256[i].x));
  19497. XMEMCPY(sp_cache_256[i].y, g->y, sizeof(sp_cache_256[i].y));
  19498. sp_cache_256[i].set = 1;
  19499. sp_cache_256[i].cnt = 1;
  19500. }
  19501. *cache = &sp_cache_256[i];
  19502. sp_cache_256_last = i;
  19503. }
  19504. #endif /* FP_ECC */
  19505. /* Multiply the base point of P256 by the scalar and return the result.
  19506. * If map is true then convert result to affine coordinates.
  19507. *
  19508. * r Resulting point.
  19509. * g Point to multiply.
  19510. * k Scalar to multiply by.
  19511. * map Indicates whether to convert result to affine.
  19512. * ct Constant time required.
  19513. * heap Heap to use for allocation.
  19514. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  19515. */
  19516. static int sp_256_ecc_mulmod_8(sp_point_256* r, const sp_point_256* g, const sp_digit* k,
  19517. int map, int ct, void* heap)
  19518. {
  19519. #ifndef FP_ECC
  19520. return sp_256_ecc_mulmod_fast_8(r, g, k, map, ct, heap);
  19521. #else
  19522. sp_digit tmp[2 * 8 * 6];
  19523. sp_cache_256_t* cache;
  19524. int err = MP_OKAY;
  19525. #ifndef HAVE_THREAD_LS
  19526. if (initCacheMutex_256 == 0) {
  19527. wc_InitMutex(&sp_cache_256_lock);
  19528. initCacheMutex_256 = 1;
  19529. }
  19530. if (wc_LockMutex(&sp_cache_256_lock) != 0)
  19531. err = BAD_MUTEX_E;
  19532. #endif /* HAVE_THREAD_LS */
  19533. if (err == MP_OKAY) {
  19534. sp_ecc_get_cache_256(g, &cache);
  19535. if (cache->cnt == 2)
  19536. sp_256_gen_stripe_table_8(g, cache->table, tmp, heap);
  19537. #ifndef HAVE_THREAD_LS
  19538. wc_UnLockMutex(&sp_cache_256_lock);
  19539. #endif /* HAVE_THREAD_LS */
  19540. if (cache->cnt < 2) {
  19541. err = sp_256_ecc_mulmod_fast_8(r, g, k, map, ct, heap);
  19542. }
  19543. else {
  19544. err = sp_256_ecc_mulmod_stripe_8(r, g, cache->table, k,
  19545. map, ct, heap);
  19546. }
  19547. }
  19548. return err;
  19549. #endif
  19550. }
  19551. #else
  19552. #ifdef FP_ECC
  19553. /* Generate the pre-computed table of points for the base point.
  19554. *
  19555. * width = 8
  19556. * 256 entries
  19557. * 32 bits between
  19558. *
  19559. * a The base point.
  19560. * table Place to store generated point data.
  19561. * tmp Temporary data.
  19562. * heap Heap to use for allocation.
  19563. */
  19564. static int sp_256_gen_stripe_table_8(const sp_point_256* a,
  19565. sp_table_entry_256* table, sp_digit* tmp, void* heap)
  19566. {
  19567. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19568. sp_point_256* t = NULL;
  19569. #else
  19570. sp_point_256 t[3];
  19571. #endif
  19572. sp_point_256* s1 = NULL;
  19573. sp_point_256* s2 = NULL;
  19574. int i;
  19575. int j;
  19576. int err = MP_OKAY;
  19577. (void)heap;
  19578. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19579. t = (sp_point_256*)XMALLOC(sizeof(sp_point_256) * 3, heap,
  19580. DYNAMIC_TYPE_ECC);
  19581. if (t == NULL)
  19582. err = MEMORY_E;
  19583. #endif
  19584. if (err == MP_OKAY) {
  19585. s1 = t + 1;
  19586. s2 = t + 2;
  19587. err = sp_256_mod_mul_norm_8(t->x, a->x, p256_mod);
  19588. }
  19589. if (err == MP_OKAY) {
  19590. err = sp_256_mod_mul_norm_8(t->y, a->y, p256_mod);
  19591. }
  19592. if (err == MP_OKAY) {
  19593. err = sp_256_mod_mul_norm_8(t->z, a->z, p256_mod);
  19594. }
  19595. if (err == MP_OKAY) {
  19596. t->infinity = 0;
  19597. sp_256_proj_to_affine_8(t, tmp);
  19598. XMEMCPY(s1->z, p256_norm_mod, sizeof(p256_norm_mod));
  19599. s1->infinity = 0;
  19600. XMEMCPY(s2->z, p256_norm_mod, sizeof(p256_norm_mod));
  19601. s2->infinity = 0;
  19602. /* table[0] = {0, 0, infinity} */
  19603. XMEMSET(&table[0], 0, sizeof(sp_table_entry_256));
  19604. /* table[1] = Affine version of 'a' in Montgomery form */
  19605. XMEMCPY(table[1].x, t->x, sizeof(table->x));
  19606. XMEMCPY(table[1].y, t->y, sizeof(table->y));
  19607. for (i=1; i<8; i++) {
  19608. sp_256_proj_point_dbl_n_8(t, 32, tmp);
  19609. sp_256_proj_to_affine_8(t, tmp);
  19610. XMEMCPY(table[1<<i].x, t->x, sizeof(table->x));
  19611. XMEMCPY(table[1<<i].y, t->y, sizeof(table->y));
  19612. }
  19613. for (i=1; i<8; i++) {
  19614. XMEMCPY(s1->x, table[1<<i].x, sizeof(table->x));
  19615. XMEMCPY(s1->y, table[1<<i].y, sizeof(table->y));
  19616. for (j=(1<<i)+1; j<(1<<(i+1)); j++) {
  19617. XMEMCPY(s2->x, table[j-(1<<i)].x, sizeof(table->x));
  19618. XMEMCPY(s2->y, table[j-(1<<i)].y, sizeof(table->y));
  19619. sp_256_proj_point_add_qz1_8(t, s1, s2, tmp);
  19620. sp_256_proj_to_affine_8(t, tmp);
  19621. XMEMCPY(table[j].x, t->x, sizeof(table->x));
  19622. XMEMCPY(table[j].y, t->y, sizeof(table->y));
  19623. }
  19624. }
  19625. }
  19626. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19627. if (t != NULL)
  19628. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  19629. #endif
  19630. return err;
  19631. }
  19632. #endif /* FP_ECC */
  19633. #ifndef WC_NO_CACHE_RESISTANT
  19634. /* Touch each possible entry that could be being copied.
  19635. *
  19636. * r Point to copy into.
  19637. * table Table - start of the entires to access
  19638. * idx Index of entry to retrieve.
  19639. */
  19640. static void sp_256_get_entry_256_8(sp_point_256* r,
  19641. const sp_table_entry_256* table, int idx)
  19642. {
  19643. int i;
  19644. sp_digit mask;
  19645. r->x[0] = 0;
  19646. r->x[1] = 0;
  19647. r->x[2] = 0;
  19648. r->x[3] = 0;
  19649. r->x[4] = 0;
  19650. r->x[5] = 0;
  19651. r->x[6] = 0;
  19652. r->x[7] = 0;
  19653. r->y[0] = 0;
  19654. r->y[1] = 0;
  19655. r->y[2] = 0;
  19656. r->y[3] = 0;
  19657. r->y[4] = 0;
  19658. r->y[5] = 0;
  19659. r->y[6] = 0;
  19660. r->y[7] = 0;
  19661. for (i = 1; i < 256; i++) {
  19662. mask = 0 - (i == idx);
  19663. r->x[0] |= mask & table[i].x[0];
  19664. r->x[1] |= mask & table[i].x[1];
  19665. r->x[2] |= mask & table[i].x[2];
  19666. r->x[3] |= mask & table[i].x[3];
  19667. r->x[4] |= mask & table[i].x[4];
  19668. r->x[5] |= mask & table[i].x[5];
  19669. r->x[6] |= mask & table[i].x[6];
  19670. r->x[7] |= mask & table[i].x[7];
  19671. r->y[0] |= mask & table[i].y[0];
  19672. r->y[1] |= mask & table[i].y[1];
  19673. r->y[2] |= mask & table[i].y[2];
  19674. r->y[3] |= mask & table[i].y[3];
  19675. r->y[4] |= mask & table[i].y[4];
  19676. r->y[5] |= mask & table[i].y[5];
  19677. r->y[6] |= mask & table[i].y[6];
  19678. r->y[7] |= mask & table[i].y[7];
  19679. }
  19680. }
  19681. #endif /* !WC_NO_CACHE_RESISTANT */
  19682. /* Multiply the point by the scalar and return the result.
  19683. * If map is true then convert result to affine coordinates.
  19684. *
  19685. * Stripe implementation.
  19686. * Pre-generated: 2^0, 2^32, ...
  19687. * Pre-generated: products of all combinations of above.
  19688. * 8 doubles and adds (with qz=1)
  19689. *
  19690. * r Resulting point.
  19691. * k Scalar to multiply by.
  19692. * table Pre-computed table.
  19693. * map Indicates whether to convert result to affine.
  19694. * ct Constant time required.
  19695. * heap Heap to use for allocation.
  19696. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  19697. */
  19698. static int sp_256_ecc_mulmod_stripe_8(sp_point_256* r, const sp_point_256* g,
  19699. const sp_table_entry_256* table, const sp_digit* k, int map,
  19700. int ct, void* heap)
  19701. {
  19702. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19703. sp_point_256* rt = NULL;
  19704. sp_digit* t = NULL;
  19705. #else
  19706. sp_point_256 rt[2];
  19707. sp_digit t[2 * 8 * 6];
  19708. #endif
  19709. sp_point_256* p = NULL;
  19710. int i;
  19711. int j;
  19712. int y;
  19713. int x;
  19714. int err = MP_OKAY;
  19715. (void)g;
  19716. /* Constant time used for cache attack resistance implementation. */
  19717. (void)ct;
  19718. (void)heap;
  19719. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19720. rt = (sp_point_256*)XMALLOC(sizeof(sp_point_256) * 2, heap,
  19721. DYNAMIC_TYPE_ECC);
  19722. if (rt == NULL)
  19723. err = MEMORY_E;
  19724. if (err == MP_OKAY) {
  19725. t = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 8 * 6, heap,
  19726. DYNAMIC_TYPE_ECC);
  19727. if (t == NULL)
  19728. err = MEMORY_E;
  19729. }
  19730. #endif
  19731. if (err == MP_OKAY) {
  19732. p = rt + 1;
  19733. XMEMCPY(p->z, p256_norm_mod, sizeof(p256_norm_mod));
  19734. XMEMCPY(rt->z, p256_norm_mod, sizeof(p256_norm_mod));
  19735. y = 0;
  19736. x = 31;
  19737. for (j=0; j<8; j++) {
  19738. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  19739. x += 32;
  19740. }
  19741. #ifndef WC_NO_CACHE_RESISTANT
  19742. if (ct) {
  19743. sp_256_get_entry_256_8(rt, table, y);
  19744. } else
  19745. #endif
  19746. {
  19747. XMEMCPY(rt->x, table[y].x, sizeof(table[y].x));
  19748. XMEMCPY(rt->y, table[y].y, sizeof(table[y].y));
  19749. }
  19750. rt->infinity = !y;
  19751. for (i=30; i>=0; i--) {
  19752. y = 0;
  19753. x = i;
  19754. for (j=0; j<8; j++) {
  19755. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  19756. x += 32;
  19757. }
  19758. sp_256_proj_point_dbl_8(rt, rt, t);
  19759. #ifndef WC_NO_CACHE_RESISTANT
  19760. if (ct) {
  19761. sp_256_get_entry_256_8(p, table, y);
  19762. }
  19763. else
  19764. #endif
  19765. {
  19766. XMEMCPY(p->x, table[y].x, sizeof(table[y].x));
  19767. XMEMCPY(p->y, table[y].y, sizeof(table[y].y));
  19768. }
  19769. p->infinity = !y;
  19770. sp_256_proj_point_add_qz1_8(rt, rt, p, t);
  19771. }
  19772. if (map != 0) {
  19773. sp_256_map_8(r, rt, t);
  19774. }
  19775. else {
  19776. XMEMCPY(r, rt, sizeof(sp_point_256));
  19777. }
  19778. }
  19779. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19780. if (t != NULL)
  19781. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  19782. if (rt != NULL)
  19783. XFREE(rt, heap, DYNAMIC_TYPE_ECC);
  19784. #endif
  19785. return err;
  19786. }
  19787. #ifdef FP_ECC
  19788. #ifndef FP_ENTRIES
  19789. #define FP_ENTRIES 16
  19790. #endif
  19791. /* Cache entry - holds precomputation tables for a point. */
  19792. typedef struct sp_cache_256_t {
  19793. /* X ordinate of point that table was generated from. */
  19794. sp_digit x[8];
  19795. /* Y ordinate of point that table was generated from. */
  19796. sp_digit y[8];
  19797. /* Precomputation table for point. */
  19798. sp_table_entry_256 table[256];
  19799. /* Count of entries in table. */
  19800. uint32_t cnt;
  19801. /* Point and table set in entry. */
  19802. int set;
  19803. } sp_cache_256_t;
  19804. /* Cache of tables. */
  19805. static THREAD_LS_T sp_cache_256_t sp_cache_256[FP_ENTRIES];
  19806. /* Index of last entry in cache. */
  19807. static THREAD_LS_T int sp_cache_256_last = -1;
  19808. /* Cache has been initialized. */
  19809. static THREAD_LS_T int sp_cache_256_inited = 0;
  19810. #ifndef HAVE_THREAD_LS
  19811. static volatile int initCacheMutex_256 = 0;
  19812. static wolfSSL_Mutex sp_cache_256_lock;
  19813. #endif
  19814. /* Get the cache entry for the point.
  19815. *
  19816. * g [in] Point scalar multipling.
  19817. * cache [out] Cache table to use.
  19818. */
  19819. static void sp_ecc_get_cache_256(const sp_point_256* g, sp_cache_256_t** cache)
  19820. {
  19821. int i;
  19822. int j;
  19823. uint32_t least;
  19824. if (sp_cache_256_inited == 0) {
  19825. for (i=0; i<FP_ENTRIES; i++) {
  19826. sp_cache_256[i].set = 0;
  19827. }
  19828. sp_cache_256_inited = 1;
  19829. }
  19830. /* Compare point with those in cache. */
  19831. for (i=0; i<FP_ENTRIES; i++) {
  19832. if (!sp_cache_256[i].set)
  19833. continue;
  19834. if (sp_256_cmp_equal_8(g->x, sp_cache_256[i].x) &
  19835. sp_256_cmp_equal_8(g->y, sp_cache_256[i].y)) {
  19836. sp_cache_256[i].cnt++;
  19837. break;
  19838. }
  19839. }
  19840. /* No match. */
  19841. if (i == FP_ENTRIES) {
  19842. /* Find empty entry. */
  19843. i = (sp_cache_256_last + 1) % FP_ENTRIES;
  19844. for (; i != sp_cache_256_last; i=(i+1)%FP_ENTRIES) {
  19845. if (!sp_cache_256[i].set) {
  19846. break;
  19847. }
  19848. }
  19849. /* Evict least used. */
  19850. if (i == sp_cache_256_last) {
  19851. least = sp_cache_256[0].cnt;
  19852. for (j=1; j<FP_ENTRIES; j++) {
  19853. if (sp_cache_256[j].cnt < least) {
  19854. i = j;
  19855. least = sp_cache_256[i].cnt;
  19856. }
  19857. }
  19858. }
  19859. XMEMCPY(sp_cache_256[i].x, g->x, sizeof(sp_cache_256[i].x));
  19860. XMEMCPY(sp_cache_256[i].y, g->y, sizeof(sp_cache_256[i].y));
  19861. sp_cache_256[i].set = 1;
  19862. sp_cache_256[i].cnt = 1;
  19863. }
  19864. *cache = &sp_cache_256[i];
  19865. sp_cache_256_last = i;
  19866. }
  19867. #endif /* FP_ECC */
  19868. /* Multiply the base point of P256 by the scalar and return the result.
  19869. * If map is true then convert result to affine coordinates.
  19870. *
  19871. * r Resulting point.
  19872. * g Point to multiply.
  19873. * k Scalar to multiply by.
  19874. * map Indicates whether to convert result to affine.
  19875. * ct Constant time required.
  19876. * heap Heap to use for allocation.
  19877. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  19878. */
  19879. static int sp_256_ecc_mulmod_8(sp_point_256* r, const sp_point_256* g, const sp_digit* k,
  19880. int map, int ct, void* heap)
  19881. {
  19882. #ifndef FP_ECC
  19883. return sp_256_ecc_mulmod_fast_8(r, g, k, map, ct, heap);
  19884. #else
  19885. sp_digit tmp[2 * 8 * 6];
  19886. sp_cache_256_t* cache;
  19887. int err = MP_OKAY;
  19888. #ifndef HAVE_THREAD_LS
  19889. if (initCacheMutex_256 == 0) {
  19890. wc_InitMutex(&sp_cache_256_lock);
  19891. initCacheMutex_256 = 1;
  19892. }
  19893. if (wc_LockMutex(&sp_cache_256_lock) != 0)
  19894. err = BAD_MUTEX_E;
  19895. #endif /* HAVE_THREAD_LS */
  19896. if (err == MP_OKAY) {
  19897. sp_ecc_get_cache_256(g, &cache);
  19898. if (cache->cnt == 2)
  19899. sp_256_gen_stripe_table_8(g, cache->table, tmp, heap);
  19900. #ifndef HAVE_THREAD_LS
  19901. wc_UnLockMutex(&sp_cache_256_lock);
  19902. #endif /* HAVE_THREAD_LS */
  19903. if (cache->cnt < 2) {
  19904. err = sp_256_ecc_mulmod_fast_8(r, g, k, map, ct, heap);
  19905. }
  19906. else {
  19907. err = sp_256_ecc_mulmod_stripe_8(r, g, cache->table, k,
  19908. map, ct, heap);
  19909. }
  19910. }
  19911. return err;
  19912. #endif
  19913. }
  19914. #endif /* WOLFSSL_SP_SMALL */
  19915. /* Multiply the point by the scalar and return the result.
  19916. * If map is true then convert result to affine coordinates.
  19917. *
  19918. * km Scalar to multiply by.
  19919. * p Point to multiply.
  19920. * r Resulting point.
  19921. * map Indicates whether to convert result to affine.
  19922. * heap Heap to use for allocation.
  19923. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  19924. */
  19925. int sp_ecc_mulmod_256(const mp_int* km, const ecc_point* gm, ecc_point* r,
  19926. int map, void* heap)
  19927. {
  19928. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19929. sp_point_256* point = NULL;
  19930. sp_digit* k = NULL;
  19931. #else
  19932. sp_point_256 point[1];
  19933. sp_digit k[8];
  19934. #endif
  19935. int err = MP_OKAY;
  19936. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19937. point = (sp_point_256*)XMALLOC(sizeof(sp_point_256), heap,
  19938. DYNAMIC_TYPE_ECC);
  19939. if (point == NULL)
  19940. err = MEMORY_E;
  19941. if (err == MP_OKAY) {
  19942. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 8, heap,
  19943. DYNAMIC_TYPE_ECC);
  19944. if (k == NULL)
  19945. err = MEMORY_E;
  19946. }
  19947. #endif
  19948. if (err == MP_OKAY) {
  19949. sp_256_from_mp(k, 8, km);
  19950. sp_256_point_from_ecc_point_8(point, gm);
  19951. err = sp_256_ecc_mulmod_8(point, point, k, map, 1, heap);
  19952. }
  19953. if (err == MP_OKAY) {
  19954. err = sp_256_point_to_ecc_point_8(point, r);
  19955. }
  19956. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19957. if (k != NULL)
  19958. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  19959. if (point != NULL)
  19960. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  19961. #endif
  19962. return err;
  19963. }
  19964. /* Multiply the point by the scalar, add point a and return the result.
  19965. * If map is true then convert result to affine coordinates.
  19966. *
  19967. * km Scalar to multiply by.
  19968. * p Point to multiply.
  19969. * am Point to add to scalar mulitply result.
  19970. * inMont Point to add is in montgomery form.
  19971. * r Resulting point.
  19972. * map Indicates whether to convert result to affine.
  19973. * heap Heap to use for allocation.
  19974. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  19975. */
  19976. int sp_ecc_mulmod_add_256(const mp_int* km, const ecc_point* gm,
  19977. const ecc_point* am, int inMont, ecc_point* r, int map, void* heap)
  19978. {
  19979. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19980. sp_point_256* point = NULL;
  19981. sp_digit* k = NULL;
  19982. #else
  19983. sp_point_256 point[2];
  19984. sp_digit k[8 + 8 * 2 * 6];
  19985. #endif
  19986. sp_point_256* addP = NULL;
  19987. sp_digit* tmp = NULL;
  19988. int err = MP_OKAY;
  19989. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  19990. point = (sp_point_256*)XMALLOC(sizeof(sp_point_256) * 2, heap,
  19991. DYNAMIC_TYPE_ECC);
  19992. if (point == NULL)
  19993. err = MEMORY_E;
  19994. if (err == MP_OKAY) {
  19995. k = (sp_digit*)XMALLOC(
  19996. sizeof(sp_digit) * (8 + 8 * 2 * 6), heap,
  19997. DYNAMIC_TYPE_ECC);
  19998. if (k == NULL)
  19999. err = MEMORY_E;
  20000. }
  20001. #endif
  20002. if (err == MP_OKAY) {
  20003. addP = point + 1;
  20004. tmp = k + 8;
  20005. sp_256_from_mp(k, 8, km);
  20006. sp_256_point_from_ecc_point_8(point, gm);
  20007. sp_256_point_from_ecc_point_8(addP, am);
  20008. }
  20009. if ((err == MP_OKAY) && (!inMont)) {
  20010. err = sp_256_mod_mul_norm_8(addP->x, addP->x, p256_mod);
  20011. }
  20012. if ((err == MP_OKAY) && (!inMont)) {
  20013. err = sp_256_mod_mul_norm_8(addP->y, addP->y, p256_mod);
  20014. }
  20015. if ((err == MP_OKAY) && (!inMont)) {
  20016. err = sp_256_mod_mul_norm_8(addP->z, addP->z, p256_mod);
  20017. }
  20018. if (err == MP_OKAY) {
  20019. err = sp_256_ecc_mulmod_8(point, point, k, 0, 0, heap);
  20020. }
  20021. if (err == MP_OKAY) {
  20022. sp_256_proj_point_add_8(point, point, addP, tmp);
  20023. if (map) {
  20024. sp_256_map_8(point, point, tmp);
  20025. }
  20026. err = sp_256_point_to_ecc_point_8(point, r);
  20027. }
  20028. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  20029. if (k != NULL)
  20030. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  20031. if (point != NULL)
  20032. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  20033. #endif
  20034. return err;
  20035. }
  20036. #ifdef WOLFSSL_SP_SMALL
  20037. /* Striping precomputation table.
  20038. * 4 points combined into a table of 16 points.
  20039. * Distance of 64 between points.
         *
         * This 16-entry variant is the one compiled when WOLFSSL_SP_SMALL is
         * defined. Each entry holds two arrays of 8 words; entry 0 is all zero.
         * NOTE(review): the two arrays are presumably the x and y ordinates of an
         * affine point - confirm against the sp_table_entry_256 definition.
         * sp_256_ecc_mulmod_base_8 passes this table, together with p256_base, to
         * sp_256_ecc_mulmod_stripe_8.
  20040. */
  20041. static const sp_table_entry_256 p256_table[16] = {
  20042. /* 0 */
  20043. { { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 },
  20044. { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 } },
  20045. /* 1 */
  20046. { { 0x18a9143c,0x79e730d4,0x5fedb601,0x75ba95fc,0x77622510,0x79fb732b,
  20047. 0xa53755c6,0x18905f76 },
  20048. { 0xce95560a,0xddf25357,0xba19e45c,0x8b4ab8e4,0xdd21f325,0xd2e88688,
  20049. 0x25885d85,0x8571ff18 } },
  20050. /* 2 */
  20051. { { 0x16a0d2bb,0x4f922fc5,0x1a623499,0x0d5cc16c,0x57c62c8b,0x9241cf3a,
  20052. 0xfd1b667f,0x2f5e6961 },
  20053. { 0xf5a01797,0x5c15c70b,0x60956192,0x3d20b44d,0x071fdb52,0x04911b37,
  20054. 0x8d6f0f7b,0xf648f916 } },
  20055. /* 3 */
  20056. { { 0xe137bbbc,0x9e566847,0x8a6a0bec,0xe434469e,0x79d73463,0xb1c42761,
  20057. 0x133d0015,0x5abe0285 },
  20058. { 0xc04c7dab,0x92aa837c,0x43260c07,0x573d9f4c,0x78e6cc37,0x0c931562,
  20059. 0x6b6f7383,0x94bb725b } },
  20060. /* 4 */
  20061. { { 0xbfe20925,0x62a8c244,0x8fdce867,0x91c19ac3,0xdd387063,0x5a96a5d5,
  20062. 0x21d324f6,0x61d587d4 },
  20063. { 0xa37173ea,0xe87673a2,0x53778b65,0x23848008,0x05bab43e,0x10f8441e,
  20064. 0x4621efbe,0xfa11fe12 } },
  20065. /* 5 */
  20066. { { 0x2cb19ffd,0x1c891f2b,0xb1923c23,0x01ba8d5b,0x8ac5ca8e,0xb6d03d67,
  20067. 0x1f13bedc,0x586eb04c },
  20068. { 0x27e8ed09,0x0c35c6e5,0x1819ede2,0x1e81a33c,0x56c652fa,0x278fd6c0,
  20069. 0x70864f11,0x19d5ac08 } },
  20070. /* 6 */
  20071. { { 0xd2b533d5,0x62577734,0xa1bdddc0,0x673b8af6,0xa79ec293,0x577e7c9a,
  20072. 0xc3b266b1,0xbb6de651 },
  20073. { 0xb65259b3,0xe7e9303a,0xd03a7480,0xd6a0afd3,0x9b3cfc27,0xc5ac83d1,
  20074. 0x5d18b99b,0x60b4619a } },
  20075. /* 7 */
  20076. { { 0x1ae5aa1c,0xbd6a38e1,0x49e73658,0xb8b7652b,0xee5f87ed,0x0b130014,
  20077. 0xaeebffcd,0x9d0f27b2 },
  20078. { 0x7a730a55,0xca924631,0xddbbc83a,0x9c955b2f,0xac019a71,0x07c1dfe0,
  20079. 0x356ec48d,0x244a566d } },
  20080. /* 8 */
  20081. { { 0xf4f8b16a,0x56f8410e,0xc47b266a,0x97241afe,0x6d9c87c1,0x0a406b8e,
  20082. 0xcd42ab1b,0x803f3e02 },
  20083. { 0x04dbec69,0x7f0309a8,0x3bbad05f,0xa83b85f7,0xad8e197f,0xc6097273,
  20084. 0x5067adc1,0xc097440e } },
  20085. /* 9 */
  20086. { { 0xc379ab34,0x846a56f2,0x841df8d1,0xa8ee068b,0x176c68ef,0x20314459,
  20087. 0x915f1f30,0xf1af32d5 },
  20088. { 0x5d75bd50,0x99c37531,0xf72f67bc,0x837cffba,0x48d7723f,0x0613a418,
  20089. 0xe2d41c8b,0x23d0f130 } },
  20090. /* 10 */
  20091. { { 0xd5be5a2b,0xed93e225,0x5934f3c6,0x6fe79983,0x22626ffc,0x43140926,
  20092. 0x7990216a,0x50bbb4d9 },
  20093. { 0xe57ec63e,0x378191c6,0x181dcdb2,0x65422c40,0x0236e0f6,0x41a8099b,
  20094. 0x01fe49c3,0x2b100118 } },
  20095. /* 11 */
  20096. { { 0x9b391593,0xfc68b5c5,0x598270fc,0xc385f5a2,0xd19adcbb,0x7144f3aa,
  20097. 0x83fbae0c,0xdd558999 },
  20098. { 0x74b82ff4,0x93b88b8e,0x71e734c9,0xd2e03c40,0x43c0322a,0x9a7a9eaf,
  20099. 0x149d6041,0xe6e4c551 } },
  20100. /* 12 */
  20101. { { 0x80ec21fe,0x5fe14bfe,0xc255be82,0xf6ce116a,0x2f4a5d67,0x98bc5a07,
  20102. 0xdb7e63af,0xfad27148 },
  20103. { 0x29ab05b3,0x90c0b6ac,0x4e251ae6,0x37a9a83c,0xc2aade7d,0x0a7dc875,
  20104. 0x9f0e1a84,0x77387de3 } },
  20105. /* 13 */
  20106. { { 0xa56c0dd7,0x1e9ecc49,0x46086c74,0xa5cffcd8,0xf505aece,0x8f7a1408,
  20107. 0xbef0c47e,0xb37b85c0 },
  20108. { 0xcc0e6a8f,0x3596b6e4,0x6b388f23,0xfd6d4bbf,0xc39cef4e,0xaba453fa,
  20109. 0xf9f628d5,0x9c135ac8 } },
  20110. /* 14 */
  20111. { { 0x95c8f8be,0x0a1c7294,0x3bf362bf,0x2961c480,0xdf63d4ac,0x9e418403,
  20112. 0x91ece900,0xc109f9cb },
  20113. { 0x58945705,0xc2d095d0,0xddeb85c0,0xb9083d96,0x7a40449b,0x84692b8d,
  20114. 0x2eee1ee1,0x9bc3344f } },
  20115. /* 15 */
  20116. { { 0x42913074,0x0d5ae356,0x48a542b1,0x55491b27,0xb310732a,0x469ca665,
  20117. 0x5f1a4cc1,0x29591d52 },
  20118. { 0xb84f983f,0xe76f5b6b,0x9f5f84e1,0xbe7eef41,0x80baa189,0x1200d496,
  20119. 0x18ef332c,0x6376551f } },
  20120. };
  20121. /* Multiply the base point of P256 by the scalar and return the result.
  20122. * If map is true then convert result to affine coordinates.
  20123. *
  20124. * Stripe implementation.
  20125. * Pre-generated: 2^0, 2^64, ...
  20126. * Pre-generated: products of all combinations of above.
  20127. * 4 doubles and adds (with qz=1)
  20128. *
  20129. * r Resulting point.
  20130. * k Scalar to multiply by.
  20131. * map Indicates whether to convert result to affine.
  20132. * ct Constant time required.
  20133. * heap Heap to use for allocation.
  20134. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  20135. */
  20136. static int sp_256_ecc_mulmod_base_8(sp_point_256* r, const sp_digit* k,
  20137. int map, int ct, void* heap)
  20138. {
  20139. return sp_256_ecc_mulmod_stripe_8(r, &p256_base, p256_table,
  20140. k, map, ct, heap);
  20141. }
  20142. #else
  20143. /* Striping precomputation table.
  20144. * 8 points combined into a table of 256 points.
  20145. * Distance of 32 between points.
  20146. */
  20147. static const sp_table_entry_256 p256_table[256] = {
  20148. /* 0 */
  20149. { { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 },
  20150. { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 } },
  20151. /* 1 */
  20152. { { 0x18a9143c,0x79e730d4,0x5fedb601,0x75ba95fc,0x77622510,0x79fb732b,
  20153. 0xa53755c6,0x18905f76 },
  20154. { 0xce95560a,0xddf25357,0xba19e45c,0x8b4ab8e4,0xdd21f325,0xd2e88688,
  20155. 0x25885d85,0x8571ff18 } },
  20156. /* 2 */
  20157. { { 0x4147519a,0x20288602,0x26b372f0,0xd0981eac,0xa785ebc8,0xa9d4a7ca,
  20158. 0xdbdf58e9,0xd953c50d },
  20159. { 0xfd590f8f,0x9d6361cc,0x44e6c917,0x72e9626b,0x22eb64cf,0x7fd96110,
  20160. 0x9eb288f3,0x863ebb7e } },
  20161. /* 3 */
  20162. { { 0x5cdb6485,0x7856b623,0x2f0a2f97,0x808f0ea2,0x4f7e300b,0x3e68d954,
  20163. 0xb5ff80a0,0x00076055 },
  20164. { 0x838d2010,0x7634eb9b,0x3243708a,0x54014fbb,0x842a6606,0xe0e47d39,
  20165. 0x34373ee0,0x83087761 } },
  20166. /* 4 */
  20167. { { 0x16a0d2bb,0x4f922fc5,0x1a623499,0x0d5cc16c,0x57c62c8b,0x9241cf3a,
  20168. 0xfd1b667f,0x2f5e6961 },
  20169. { 0xf5a01797,0x5c15c70b,0x60956192,0x3d20b44d,0x071fdb52,0x04911b37,
  20170. 0x8d6f0f7b,0xf648f916 } },
  20171. /* 5 */
  20172. { { 0xe137bbbc,0x9e566847,0x8a6a0bec,0xe434469e,0x79d73463,0xb1c42761,
  20173. 0x133d0015,0x5abe0285 },
  20174. { 0xc04c7dab,0x92aa837c,0x43260c07,0x573d9f4c,0x78e6cc37,0x0c931562,
  20175. 0x6b6f7383,0x94bb725b } },
  20176. /* 6 */
  20177. { { 0x720f141c,0xbbf9b48f,0x2df5bc74,0x6199b3cd,0x411045c4,0xdc3f6129,
  20178. 0x2f7dc4ef,0xcdd6bbcb },
  20179. { 0xeaf436fd,0xcca6700b,0xb99326be,0x6f647f6d,0x014f2522,0x0c0fa792,
  20180. 0x4bdae5f6,0xa361bebd } },
  20181. /* 7 */
  20182. { { 0x597c13c7,0x28aa2558,0x50b7c3e1,0xc38d635f,0xf3c09d1d,0x07039aec,
  20183. 0xc4b5292c,0xba12ca09 },
  20184. { 0x59f91dfd,0x9e408fa4,0xceea07fb,0x3af43b66,0x9d780b29,0x1eceb089,
  20185. 0x701fef4b,0x53ebb99d } },
  20186. /* 8 */
  20187. { { 0xb0e63d34,0x4fe7ee31,0xa9e54fab,0xf4600572,0xd5e7b5a4,0xc0493334,
  20188. 0x06d54831,0x8589fb92 },
  20189. { 0x6583553a,0xaa70f5cc,0xe25649e5,0x0879094a,0x10044652,0xcc904507,
  20190. 0x02541c4f,0xebb0696d } },
  20191. /* 9 */
  20192. { { 0xac1647c5,0x4616ca15,0xc4cf5799,0xb8127d47,0x764dfbac,0xdc666aa3,
  20193. 0xd1b27da3,0xeb2820cb },
  20194. { 0x6a87e008,0x9406f8d8,0x922378f3,0xd87dfa9d,0x80ccecb2,0x56ed2e42,
  20195. 0x55a7da1d,0x1f28289b } },
  20196. /* 10 */
  20197. { { 0x3b89da99,0xabbaa0c0,0xb8284022,0xa6f2d79e,0xb81c05e8,0x27847862,
  20198. 0x05e54d63,0x337a4b59 },
  20199. { 0x21f7794a,0x3c67500d,0x7d6d7f61,0x207005b7,0x04cfd6e8,0x0a5a3781,
  20200. 0xf4c2fbd6,0x0d65e0d5 } },
  20201. /* 11 */
  20202. { { 0xb5275d38,0xd9d09bbe,0x0be0a358,0x4268a745,0x973eb265,0xf0762ff4,
  20203. 0x52f4a232,0xc23da242 },
  20204. { 0x0b94520c,0x5da1b84f,0xb05bd78e,0x09666763,0x94d29ea1,0x3a4dcb86,
  20205. 0xc790cff1,0x19de3b8c } },
  20206. /* 12 */
  20207. { { 0x26c5fe04,0x183a716c,0x3bba1bdb,0x3b28de0b,0xa4cb712c,0x7432c586,
  20208. 0x91fccbfd,0xe34dcbd4 },
  20209. { 0xaaa58403,0xb408d46b,0x82e97a53,0x9a697486,0x36aaa8af,0x9e390127,
  20210. 0x7b4e0f7f,0xe7641f44 } },
  20211. /* 13 */
  20212. { { 0xdf64ba59,0x7d753941,0x0b0242fc,0xd33f10ec,0xa1581859,0x4f06dfc6,
  20213. 0x052a57bf,0x4a12df57 },
  20214. { 0x9439dbd0,0xbfa6338f,0xbde53e1f,0xd3c24bd4,0x21f1b314,0xfd5e4ffa,
  20215. 0xbb5bea46,0x6af5aa93 } },
  20216. /* 14 */
  20217. { { 0x10c91999,0xda10b699,0x2a580491,0x0a24b440,0xb8cc2090,0x3e0094b4,
  20218. 0x66a44013,0x5fe3475a },
  20219. { 0xf93e7b4b,0xb0f8cabd,0x7c23f91a,0x292b501a,0xcd1e6263,0x42e889ae,
  20220. 0xecfea916,0xb544e308 } },
  20221. /* 15 */
  20222. { { 0x16ddfdce,0x6478c6e9,0xf89179e6,0x2c329166,0x4d4e67e1,0x4e8d6e76,
  20223. 0xa6b0c20b,0xe0b6b2bd },
  20224. { 0xbb7efb57,0x0d312df2,0x790c4007,0x1aac0dde,0x679bc944,0xf90336ad,
  20225. 0x25a63774,0x71c023de } },
  20226. /* 16 */
  20227. { { 0xbfe20925,0x62a8c244,0x8fdce867,0x91c19ac3,0xdd387063,0x5a96a5d5,
  20228. 0x21d324f6,0x61d587d4 },
  20229. { 0xa37173ea,0xe87673a2,0x53778b65,0x23848008,0x05bab43e,0x10f8441e,
  20230. 0x4621efbe,0xfa11fe12 } },
  20231. /* 17 */
  20232. { { 0x2cb19ffd,0x1c891f2b,0xb1923c23,0x01ba8d5b,0x8ac5ca8e,0xb6d03d67,
  20233. 0x1f13bedc,0x586eb04c },
  20234. { 0x27e8ed09,0x0c35c6e5,0x1819ede2,0x1e81a33c,0x56c652fa,0x278fd6c0,
  20235. 0x70864f11,0x19d5ac08 } },
  20236. /* 18 */
  20237. { { 0x309a4e1f,0x1e99f581,0xe9270074,0xab7de71b,0xefd28d20,0x26a5ef0b,
  20238. 0x7f9c563f,0xe7c0073f },
  20239. { 0x0ef59f76,0x1f6d663a,0x20fcb050,0x669b3b54,0x7a6602d4,0xc08c1f7a,
  20240. 0xc65b3c0a,0xe08504fe } },
  20241. /* 19 */
  20242. { { 0xa031b3ca,0xf098f68d,0xe6da6d66,0x6d1cab9e,0x94f246e8,0x5bfd81fa,
  20243. 0x5b0996b4,0x78f01882 },
  20244. { 0x3a25787f,0xb7eefde4,0x1dccac9b,0x8016f80d,0xb35bfc36,0x0cea4877,
  20245. 0x7e94747a,0x43a773b8 } },
  20246. /* 20 */
  20247. { { 0xd2b533d5,0x62577734,0xa1bdddc0,0x673b8af6,0xa79ec293,0x577e7c9a,
  20248. 0xc3b266b1,0xbb6de651 },
  20249. { 0xb65259b3,0xe7e9303a,0xd03a7480,0xd6a0afd3,0x9b3cfc27,0xc5ac83d1,
  20250. 0x5d18b99b,0x60b4619a } },
  20251. /* 21 */
  20252. { { 0x1ae5aa1c,0xbd6a38e1,0x49e73658,0xb8b7652b,0xee5f87ed,0x0b130014,
  20253. 0xaeebffcd,0x9d0f27b2 },
  20254. { 0x7a730a55,0xca924631,0xddbbc83a,0x9c955b2f,0xac019a71,0x07c1dfe0,
  20255. 0x356ec48d,0x244a566d } },
  20256. /* 22 */
  20257. { { 0xeacf1f96,0x6db0394a,0x024c271c,0x9f2122a9,0x82cbd3b9,0x2626ac1b,
  20258. 0x3581ef69,0x45e58c87 },
  20259. { 0xa38f9dbc,0xd3ff479d,0xe888a040,0xa8aaf146,0x46e0bed7,0x945adfb2,
  20260. 0xc1e4b7a4,0xc040e21c } },
  20261. /* 23 */
  20262. { { 0x6f8117b6,0x847af000,0x73a35433,0x651969ff,0x1d9475eb,0x482b3576,
  20263. 0x682c6ec7,0x1cdf5c97 },
  20264. { 0x11f04839,0x7db775b4,0x48de1698,0x7dbeacf4,0xb70b3219,0xb2921dd1,
  20265. 0xa92dff3d,0x046755f8 } },
  20266. /* 24 */
  20267. { { 0xbce8ffcd,0xcc8ac5d2,0x2fe61a82,0x0d53c48b,0x7202d6c7,0xf6f16172,
  20268. 0x3b83a5f3,0x046e5e11 },
  20269. { 0xd8007f01,0xe7b8ff64,0x5af43183,0x7fb1ef12,0x35e1a03c,0x045c5ea6,
  20270. 0x303d005b,0x6e0106c3 } },
  20271. /* 25 */
  20272. { { 0x88dd73b1,0x48c73584,0x995ed0d9,0x7670708f,0xc56a2ab7,0x38385ea8,
  20273. 0xe901cf1f,0x442594ed },
  20274. { 0x12d4b65b,0xf8faa2c9,0x96c90c37,0x94c2343b,0x5e978d1f,0xd326e4a1,
  20275. 0x4c2ee68e,0xa796fa51 } },
  20276. /* 26 */
  20277. { { 0x823addd7,0x359fb604,0xe56693b3,0x9e2a6183,0x3cbf3c80,0xf885b78e,
  20278. 0xc69766e9,0xe4ad2da9 },
  20279. { 0x8e048a61,0x357f7f42,0xc092d9a0,0x082d198c,0xc03ed8ef,0xfc3a1af4,
  20280. 0xc37b5143,0xc5e94046 } },
  20281. /* 27 */
  20282. { { 0x2be75f9e,0x476a538c,0xcb123a78,0x6fd1a9e8,0xb109c04b,0xd85e4df0,
  20283. 0xdb464747,0x63283daf },
  20284. { 0xbaf2df15,0xce728cf7,0x0ad9a7f4,0xe592c455,0xe834bcc3,0xfab226ad,
  20285. 0x1981a938,0x68bd19ab } },
  20286. /* 28 */
  20287. { { 0x1887d659,0xc08ead51,0xb359305a,0x3374d5f4,0xcfe74fe3,0x96986981,
  20288. 0x3c6fdfd6,0x495292f5 },
  20289. { 0x1acec896,0x4a878c9e,0xec5b4484,0xd964b210,0x664d60a7,0x6696f7e2,
  20290. 0x26036837,0x0ec7530d } },
  20291. /* 29 */
  20292. { { 0xad2687bb,0x2da13a05,0xf32e21fa,0xa1f83b6a,0x1dd4607b,0x390f5ef5,
  20293. 0x64863f0b,0x0f6207a6 },
  20294. { 0x0f138233,0xbd67e3bb,0x272aa718,0xdd66b96c,0x26ec88ae,0x8ed00407,
  20295. 0x08ed6dcf,0xff0db072 } },
  20296. /* 30 */
  20297. { { 0x4c95d553,0x749fa101,0x5d680a8a,0xa44052fd,0xff3b566f,0x183b4317,
  20298. 0x88740ea3,0x313b513c },
  20299. { 0x08d11549,0xb402e2ac,0xb4dee21c,0x071ee10b,0x47f2320e,0x26b987dd,
  20300. 0x86f19f81,0x2d3abcf9 } },
  20301. /* 31 */
  20302. { { 0x815581a2,0x4c288501,0x632211af,0x9a0a6d56,0x0cab2e99,0x19ba7a0f,
  20303. 0xded98cdf,0xc036fa10 },
  20304. { 0xc1fbd009,0x29ae08ba,0x06d15816,0x0b68b190,0x9b9e0d8f,0xc2eb3277,
  20305. 0xb6d40194,0xa6b2a2c4 } },
  20306. /* 32 */
  20307. { { 0x6d3549cf,0xd433e50f,0xfacd665e,0x6f33696f,0xce11fcb4,0x695bfdac,
  20308. 0xaf7c9860,0x810ee252 },
  20309. { 0x7159bb2c,0x65450fe1,0x758b357b,0xf7dfbebe,0xd69fea72,0x2b057e74,
  20310. 0x92731745,0xd485717a } },
  20311. /* 33 */
  20312. { { 0xf0cb5a98,0x11741a8a,0x1f3110bf,0xd3da8f93,0xab382adf,0x1994e2cb,
  20313. 0x2f9a604e,0x6a6045a7 },
  20314. { 0xa2b2411d,0x170c0d3f,0x510e96e0,0xbe0eb83e,0x8865b3cc,0x3bcc9f73,
  20315. 0xf9e15790,0xd3e45cfa } },
  20316. /* 34 */
  20317. { { 0xe83f7669,0xce1f69bb,0x72877d6b,0x09f8ae82,0x3244278d,0x9548ae54,
  20318. 0xe3c2c19c,0x207755de },
  20319. { 0x6fef1945,0x87bd61d9,0xb12d28c3,0x18813cef,0x72df64aa,0x9fbcd1d6,
  20320. 0x7154b00d,0x48dc5ee5 } },
  20321. /* 35 */
  20322. { { 0xf7e5a199,0x123790bf,0x989ccbb7,0xe0efb8cf,0x0a519c79,0xc27a2bfe,
  20323. 0xdff6f445,0xf2fb0aed },
  20324. { 0xf0b5025f,0x41c09575,0x40fa9f22,0x550543d7,0x380bfbd0,0x8fa3c8ad,
  20325. 0xdb28d525,0xa13e9015 } },
  20326. /* 36 */
  20327. { { 0xa2b65cbc,0xf9f7a350,0x2a464226,0x0b04b972,0xe23f07a1,0x265ce241,
  20328. 0x1497526f,0x2bf0d6b0 },
  20329. { 0x4b216fb7,0xd3d4dd3f,0xfbdda26a,0xf7d7b867,0x6708505c,0xaeb7b83f,
  20330. 0x162fe89f,0x42a94a5a } },
  20331. /* 37 */
  20332. { { 0xeaadf191,0x5846ad0b,0x25a268d7,0x0f8a4890,0x494dc1f6,0xe8603050,
  20333. 0xc65ede3d,0x2c2dd969 },
  20334. { 0x93849c17,0x6d02171d,0x1da250dd,0x460488ba,0x3c3a5485,0x4810c706,
  20335. 0x42c56dbc,0xf437fa1f } },
  20336. /* 38 */
  20337. { { 0x4a0f7dab,0x6aa0d714,0x1776e9ac,0x0f049793,0xf5f39786,0x52c0a050,
  20338. 0x54707aa8,0xaaf45b33 },
  20339. { 0xc18d364a,0x85e37c33,0x3e497165,0xd40b9b06,0x15ec5444,0xf4171681,
  20340. 0xf4f272bc,0xcdf6310d } },
  20341. /* 39 */
  20342. { { 0x8ea8b7ef,0x7473c623,0x85bc2287,0x08e93518,0x2bda8e34,0x41956772,
  20343. 0xda9e2ff2,0xf0d008ba },
  20344. { 0x2414d3b1,0x2912671d,0xb019ea76,0xb3754985,0x453bcbdb,0x5c61b96d,
  20345. 0xca887b8b,0x5bd5c2f5 } },
  20346. /* 40 */
  20347. { { 0xf49a3154,0xef0f469e,0x6e2b2e9a,0x3e85a595,0xaa924a9c,0x45aaec1e,
  20348. 0xa09e4719,0xaa12dfc8 },
  20349. { 0x4df69f1d,0x26f27227,0xa2ff5e73,0xe0e4c82c,0xb7a9dd44,0xb9d8ce73,
  20350. 0xe48ca901,0x6c036e73 } },
  20351. /* 41 */
  20352. { { 0x0f6e3138,0x5cfae12a,0x25ad345a,0x6966ef00,0x45672bc5,0x8993c64b,
  20353. 0x96afbe24,0x292ff658 },
  20354. { 0x5e213402,0xd5250d44,0x4392c9fe,0xf6580e27,0xda1c72e8,0x097b397f,
  20355. 0x311b7276,0x644e0c90 } },
  20356. /* 42 */
  20357. { { 0xa47153f0,0xe1e421e1,0x920418c9,0xb86c3b79,0x705d7672,0x93bdce87,
  20358. 0xcab79a77,0xf25ae793 },
  20359. { 0x6d869d0c,0x1f3194a3,0x4986c264,0x9d55c882,0x096e945e,0x49fb5ea3,
  20360. 0x13db0a3e,0x39b8e653 } },
  20361. /* 43 */
  20362. { { 0xb6fd2e59,0x37754200,0x9255c98f,0x35e2c066,0x0e2a5739,0xd9dab21a,
  20363. 0x0f19db06,0x39122f2f },
  20364. { 0x03cad53c,0xcfbce1e0,0xe65c17e3,0x225b2c0f,0x9aa13877,0x72baf1d2,
  20365. 0xce80ff8d,0x8de80af8 } },
  20366. /* 44 */
  20367. { { 0x207bbb76,0xafbea8d9,0x21782758,0x921c7e7c,0x1c0436b1,0xdfa2b74b,
  20368. 0x2e368c04,0x87194906 },
  20369. { 0xa3993df5,0xb5f928bb,0xf3b3d26a,0x639d75b5,0x85b55050,0x011aa78a,
  20370. 0x5b74fde1,0xfc315e6a } },
  20371. /* 45 */
  20372. { { 0xe8d6ecfa,0x561fd41a,0x1aec7f86,0x5f8c44f6,0x4924741d,0x98452a7b,
  20373. 0xee389088,0xe6d4a7ad },
  20374. { 0x4593c75d,0x60552ed1,0xdd271162,0x70a70da4,0x7ba2c7db,0xd2aede93,
  20375. 0x9be2ae57,0x35dfaf9a } },
  20376. /* 46 */
  20377. { { 0xaa736636,0x6b956fcd,0xae2cab7e,0x09f51d97,0x0f349966,0xfb10bf41,
  20378. 0x1c830d2b,0x1da5c7d7 },
  20379. { 0x3cce6825,0x5c41e483,0xf9573c3b,0x15ad118f,0xf23036b8,0xa28552c7,
  20380. 0xdbf4b9d6,0x7077c0fd } },
  20381. /* 47 */
  20382. { { 0x46b9661c,0xbf63ff8d,0x0d2cfd71,0xa1dfd36b,0xa847f8f7,0x0373e140,
  20383. 0xe50efe44,0x53a8632e },
  20384. { 0x696d8051,0x0976ff68,0xc74f468a,0xdaec0c95,0x5e4e26bd,0x62994dc3,
  20385. 0x34e1fcc1,0x028ca76d } },
  20386. /* 48 */
  20387. { { 0xfc9877ee,0xd11d47dc,0x801d0002,0xc8b36210,0x54c260b6,0xd002c117,
  20388. 0x6962f046,0x04c17cd8 },
  20389. { 0xb0daddf5,0x6d9bd094,0x24ce55c0,0xbea23575,0x72da03b5,0x663356e6,
  20390. 0xfed97474,0xf7ba4de9 } },
  20391. /* 49 */
  20392. { { 0xebe1263f,0xd0dbfa34,0x71ae7ce6,0x55763735,0x82a6f523,0xd2440553,
  20393. 0x52131c41,0xe31f9600 },
  20394. { 0xea6b6ec6,0xd1bb9216,0x73c2fc44,0x37a1d12e,0x89d0a294,0xc10e7eac,
  20395. 0xce34d47b,0xaa3a6259 } },
  20396. /* 50 */
  20397. { { 0x36f3dcd3,0xfbcf9df5,0xd2bf7360,0x6ceded50,0xdf504f5b,0x491710fa,
  20398. 0x7e79daee,0x2398dd62 },
  20399. { 0x6d09569e,0xcf4705a3,0x5149f769,0xea0619bb,0x35f6034c,0xff9c0377,
  20400. 0x1c046210,0x5717f5b2 } },
  20401. /* 51 */
  20402. { { 0x21dd895e,0x9fe229c9,0x40c28451,0x8e518500,0x1d637ecd,0xfa13d239,
  20403. 0x0e3c28de,0x660a2c56 },
  20404. { 0xd67fcbd0,0x9cca88ae,0x0ea9f096,0xc8472478,0x72e92b4d,0x32b2f481,
  20405. 0x4f522453,0x624ee54c } },
  20406. /* 52 */
  20407. { { 0xd897eccc,0x09549ce4,0x3f9880aa,0x4d49d1d9,0x043a7c20,0x723c2423,
  20408. 0x92bdfbc0,0x4f392afb },
  20409. { 0x7de44fd9,0x6969f8fa,0x57b32156,0xb66cfbe4,0x368ebc3c,0xdb2fa803,
  20410. 0xccdb399c,0x8a3e7977 } },
  20411. /* 53 */
  20412. { { 0x06c4b125,0xdde1881f,0xf6e3ca8c,0xae34e300,0x5c7a13e9,0xef6999de,
  20413. 0x70c24404,0x3888d023 },
  20414. { 0x44f91081,0x76280356,0x5f015504,0x3d9fcf61,0x632cd36e,0x1827edc8,
  20415. 0x18102336,0xa5e62e47 } },
  20416. /* 54 */
  20417. { { 0x2facd6c8,0x1a825ee3,0x54bcbc66,0x699c6354,0x98df9931,0x0ce3edf7,
  20418. 0x466a5adc,0x2c4768e6 },
  20419. { 0x90a64bc9,0xb346ff8c,0xe4779f5c,0x630a6020,0xbc05e884,0xd949d064,
  20420. 0xf9e652a0,0x7b5e6441 } },
  20421. /* 55 */
  20422. { { 0x1d28444a,0x2169422c,0xbe136a39,0xe996c5d8,0xfb0c7fce,0x2387afe5,
  20423. 0x0c8d744a,0xb8af73cb },
  20424. { 0x338b86fd,0x5fde83aa,0xa58a5cff,0xfee3f158,0x20ac9433,0xc9ee8f6f,
  20425. 0x7f3f0895,0xa036395f } },
  20426. /* 56 */
  20427. { { 0xa10f7770,0x8c73c6bb,0xa12a0e24,0xa6f16d81,0x51bc2b9f,0x100df682,
  20428. 0x875fb533,0x4be36b01 },
  20429. { 0x9fb56dbb,0x9226086e,0x07e7a4f8,0x306fef8b,0x66d52f20,0xeeaccc05,
  20430. 0x1bdc00c0,0x8cbc9a87 } },
  20431. /* 57 */
  20432. { { 0xc0dac4ab,0xe131895c,0x712ff112,0xa874a440,0x6a1cee57,0x6332ae7c,
  20433. 0x0c0835f8,0x44e7553e },
  20434. { 0x7734002d,0x6d503fff,0x0b34425c,0x9d35cb8b,0x0e8738b5,0x95f70276,
  20435. 0x5eb8fc18,0x470a683a } },
  20436. /* 58 */
  20437. { { 0x90513482,0x81b761dc,0x01e9276a,0x0287202a,0x0ce73083,0xcda441ee,
  20438. 0xc63dc6ef,0x16410690 },
  20439. { 0x6d06a2ed,0xf5034a06,0x189b100b,0xdd4d7745,0xab8218c9,0xd914ae72,
  20440. 0x7abcbb4f,0xd73479fd } },
  20441. /* 59 */
  20442. { { 0x5ad4c6e5,0x7edefb16,0x5b06d04d,0x262cf08f,0x8575cb14,0x12ed5bb1,
  20443. 0x0771666b,0x816469e3 },
  20444. { 0x561e291e,0xd7ab9d79,0xc1de1661,0xeb9daf22,0x135e0513,0xf49827eb,
  20445. 0xf0dd3f9c,0x0a36dd23 } },
  20446. /* 60 */
  20447. { { 0x41d5533c,0x098d32c7,0x8684628f,0x7c5f5a9e,0xe349bd11,0x39a228ad,
  20448. 0xfdbab118,0xe331dfd6 },
  20449. { 0x6bcc6ed8,0x5100ab68,0xef7a260e,0x7160c3bd,0xbce850d7,0x9063d9a7,
  20450. 0x492e3389,0xd3b4782a } },
  20451. /* 61 */
  20452. { { 0xf3821f90,0xa149b6e8,0x66eb7aad,0x92edd9ed,0x1a013116,0x0bb66953,
  20453. 0x4c86a5bd,0x7281275a },
  20454. { 0xd3ff47e5,0x503858f7,0x61016441,0x5e1616bc,0x7dfd9bb1,0x62b0f11a,
  20455. 0xce145059,0x2c062e7e } },
  20456. /* 62 */
  20457. { { 0x0159ac2e,0xa76f996f,0xcbdb2713,0x281e7736,0x08e46047,0x2ad6d288,
  20458. 0x2c4e7ef1,0x282a35f9 },
  20459. { 0xc0ce5cd2,0x9c354b1e,0x1379c229,0xcf99efc9,0x3e82c11e,0x992caf38,
  20460. 0x554d2abd,0xc71cd513 } },
  20461. /* 63 */
  20462. { { 0x09b578f4,0x4885de9c,0xe3affa7a,0x1884e258,0x59182f1f,0x8f76b1b7,
  20463. 0xcf47f3a3,0xc50f6740 },
  20464. { 0x374b68ea,0xa9c4adf3,0x69965fe2,0xa406f323,0x85a53050,0x2f86a222,
  20465. 0x212958dc,0xb9ecb3a7 } },
  20466. /* 64 */
  20467. { { 0xf4f8b16a,0x56f8410e,0xc47b266a,0x97241afe,0x6d9c87c1,0x0a406b8e,
  20468. 0xcd42ab1b,0x803f3e02 },
  20469. { 0x04dbec69,0x7f0309a8,0x3bbad05f,0xa83b85f7,0xad8e197f,0xc6097273,
  20470. 0x5067adc1,0xc097440e } },
  20471. /* 65 */
  20472. { { 0xc379ab34,0x846a56f2,0x841df8d1,0xa8ee068b,0x176c68ef,0x20314459,
  20473. 0x915f1f30,0xf1af32d5 },
  20474. { 0x5d75bd50,0x99c37531,0xf72f67bc,0x837cffba,0x48d7723f,0x0613a418,
  20475. 0xe2d41c8b,0x23d0f130 } },
  20476. /* 66 */
  20477. { { 0xf41500d9,0x857ab6ed,0xfcbeada8,0x0d890ae5,0x89725951,0x52fe8648,
  20478. 0xc0a3fadd,0xb0288dd6 },
  20479. { 0x650bcb08,0x85320f30,0x695d6e16,0x71af6313,0xb989aa76,0x31f520a7,
  20480. 0xf408c8d2,0xffd3724f } },
  20481. /* 67 */
  20482. { { 0xb458e6cb,0x53968e64,0x317a5d28,0x992dad20,0x7aa75f56,0x3814ae0b,
  20483. 0xd78c26df,0xf5590f4a },
  20484. { 0xcf0ba55a,0x0fc24bd3,0x0c778bae,0x0fc4724a,0x683b674a,0x1ce9864f,
  20485. 0xf6f74a20,0x18d6da54 } },
  20486. /* 68 */
  20487. { { 0xd5be5a2b,0xed93e225,0x5934f3c6,0x6fe79983,0x22626ffc,0x43140926,
  20488. 0x7990216a,0x50bbb4d9 },
  20489. { 0xe57ec63e,0x378191c6,0x181dcdb2,0x65422c40,0x0236e0f6,0x41a8099b,
  20490. 0x01fe49c3,0x2b100118 } },
  20491. /* 69 */
  20492. { { 0x9b391593,0xfc68b5c5,0x598270fc,0xc385f5a2,0xd19adcbb,0x7144f3aa,
  20493. 0x83fbae0c,0xdd558999 },
  20494. { 0x74b82ff4,0x93b88b8e,0x71e734c9,0xd2e03c40,0x43c0322a,0x9a7a9eaf,
  20495. 0x149d6041,0xe6e4c551 } },
  20496. /* 70 */
  20497. { { 0x1e9af288,0x55f655bb,0xf7ada931,0x647e1a64,0xcb2820e5,0x43697e4b,
  20498. 0x07ed56ff,0x51e00db1 },
  20499. { 0x771c327e,0x43d169b8,0x4a96c2ad,0x29cdb20b,0x3deb4779,0xc07d51f5,
  20500. 0x49829177,0xe22f4241 } },
  20501. /* 71 */
  20502. { { 0x635f1abb,0xcd45e8f4,0x68538874,0x7edc0cb5,0xb5a8034d,0xc9472c1f,
  20503. 0x52dc48c9,0xf709373d },
  20504. { 0xa8af30d6,0x401966bb,0xf137b69c,0x95bf5f4a,0x9361c47e,0x3966162a,
  20505. 0xe7275b11,0xbd52d288 } },
  20506. /* 72 */
  20507. { { 0x9c5fa877,0xab155c7a,0x7d3a3d48,0x17dad672,0x73d189d8,0x43f43f9e,
  20508. 0xc8aa77a6,0xa0d0f8e4 },
  20509. { 0xcc94f92d,0x0bbeafd8,0x0c4ddb3a,0xd818c8be,0xb82eba14,0x22cc65f8,
  20510. 0x946d6a00,0xa56c78c7 } },
  20511. /* 73 */
  20512. { { 0x0dd09529,0x2962391b,0x3daddfcf,0x803e0ea6,0x5b5bf481,0x2c77351f,
  20513. 0x731a367a,0xd8befdf8 },
  20514. { 0xfc0157f4,0xab919d42,0xfec8e650,0xf51caed7,0x02d48b0a,0xcdf9cb40,
  20515. 0xce9f6478,0x854a68a5 } },
  20516. /* 74 */
  20517. { { 0x63506ea5,0xdc35f67b,0xa4fe0d66,0x9286c489,0xfe95cd4d,0x3f101d3b,
  20518. 0x98846a95,0x5cacea0b },
  20519. { 0x9ceac44d,0xa90df60c,0x354d1c3a,0x3db29af4,0xad5dbabe,0x08dd3de8,
  20520. 0x35e4efa9,0xe4982d12 } },
  20521. /* 75 */
  20522. { { 0xc34cd55e,0x23104a22,0x2680d132,0x58695bb3,0x1fa1d943,0xfb345afa,
  20523. 0x16b20499,0x8046b7f6 },
  20524. { 0x38e7d098,0xb533581e,0xf46f0b70,0xd7f61e8d,0x44cb78c4,0x30dea9ea,
  20525. 0x9082af55,0xeb17ca7b } },
  20526. /* 76 */
  20527. { { 0x76a145b9,0x1751b598,0xc1bc71ec,0xa5cf6b0f,0x392715bb,0xd3e03565,
  20528. 0xfab5e131,0x097b00ba },
  20529. { 0x565f69e1,0xaa66c8e9,0xb5be5199,0x77e8f75a,0xda4fd984,0x6033ba11,
  20530. 0xafdbcc9e,0xf95c747b } },
  20531. /* 77 */
  20532. { { 0xbebae45e,0x558f01d3,0xc4bc6955,0xa8ebe9f0,0xdbc64fc6,0xaeb705b1,
  20533. 0x566ed837,0x3512601e },
  20534. { 0xfa1161cd,0x9336f1e1,0x4c65ef87,0x328ab8d5,0x724f21e5,0x4757eee2,
  20535. 0x6068ab6b,0x0ef97123 } },
  20536. /* 78 */
  20537. { { 0x54ca4226,0x02598cf7,0xf8642c8e,0x5eede138,0x468e1790,0x48963f74,
  20538. 0x3b4fbc95,0xfc16d933 },
  20539. { 0xe7c800ca,0xbe96fb31,0x2678adaa,0x13806331,0x6ff3e8b5,0x3d624497,
  20540. 0xb95d7a17,0x14ca4af1 } },
  20541. /* 79 */
  20542. { { 0xbd2f81d5,0x7a4771ba,0x01f7d196,0x1a5f9d69,0xcad9c907,0xd898bef7,
  20543. 0xf59c231d,0x4057b063 },
  20544. { 0x89c05c0a,0xbffd82fe,0x1dc0df85,0xe4911c6f,0xa35a16db,0x3befccae,
  20545. 0xf1330b13,0x1c3b5d64 } },
  20546. /* 80 */
  20547. { { 0x80ec21fe,0x5fe14bfe,0xc255be82,0xf6ce116a,0x2f4a5d67,0x98bc5a07,
  20548. 0xdb7e63af,0xfad27148 },
  20549. { 0x29ab05b3,0x90c0b6ac,0x4e251ae6,0x37a9a83c,0xc2aade7d,0x0a7dc875,
  20550. 0x9f0e1a84,0x77387de3 } },
  20551. /* 81 */
  20552. { { 0xa56c0dd7,0x1e9ecc49,0x46086c74,0xa5cffcd8,0xf505aece,0x8f7a1408,
  20553. 0xbef0c47e,0xb37b85c0 },
  20554. { 0xcc0e6a8f,0x3596b6e4,0x6b388f23,0xfd6d4bbf,0xc39cef4e,0xaba453fa,
  20555. 0xf9f628d5,0x9c135ac8 } },
  20556. /* 82 */
  20557. { { 0x84e35743,0x32aa3202,0x85a3cdef,0x320d6ab1,0x1df19819,0xb821b176,
  20558. 0xc433851f,0x5721361f },
  20559. { 0x71fc9168,0x1f0db36a,0x5e5c403c,0x5f98ba73,0x37bcd8f5,0xf64ca87e,
  20560. 0xe6bb11bd,0xdcbac3c9 } },
  20561. /* 83 */
  20562. { { 0x4518cbe2,0xf01d9968,0x9c9eb04e,0xd242fc18,0xe47feebf,0x727663c7,
  20563. 0x2d626862,0xb8c1c89e },
  20564. { 0xc8e1d569,0x51a58bdd,0xb7d88cd0,0x563809c8,0xf11f31eb,0x26c27fd9,
  20565. 0x2f9422d4,0x5d23bbda } },
  20566. /* 84 */
  20567. { { 0x95c8f8be,0x0a1c7294,0x3bf362bf,0x2961c480,0xdf63d4ac,0x9e418403,
  20568. 0x91ece900,0xc109f9cb },
  20569. { 0x58945705,0xc2d095d0,0xddeb85c0,0xb9083d96,0x7a40449b,0x84692b8d,
  20570. 0x2eee1ee1,0x9bc3344f } },
  20571. /* 85 */
  20572. { { 0x42913074,0x0d5ae356,0x48a542b1,0x55491b27,0xb310732a,0x469ca665,
  20573. 0x5f1a4cc1,0x29591d52 },
  20574. { 0xb84f983f,0xe76f5b6b,0x9f5f84e1,0xbe7eef41,0x80baa189,0x1200d496,
  20575. 0x18ef332c,0x6376551f } },
  20576. /* 86 */
  20577. { { 0x562976cc,0xbda5f14e,0x0ef12c38,0x22bca3e6,0x6cca9852,0xbbfa3064,
  20578. 0x08e2987a,0xbdb79dc8 },
  20579. { 0xcb06a772,0xfd2cb5c9,0xfe536dce,0x38f475aa,0x7c2b5db8,0xc2a3e022,
  20580. 0xadd3c14a,0x8ee86001 } },
  20581. /* 87 */
  20582. { { 0xa4ade873,0xcbe96981,0xc4fba48c,0x7ee9aa4d,0x5a054ba5,0x2cee2899,
  20583. 0x6f77aa4b,0x92e51d7a },
  20584. { 0x7190a34d,0x948bafa8,0xf6bd1ed1,0xd698f75b,0x0caf1144,0xd00ee6e3,
  20585. 0x0a56aaaa,0x5182f86f } },
  20586. /* 88 */
  20587. { { 0x7a4cc99c,0xfba6212c,0x3e6d9ca1,0xff609b68,0x5ac98c5a,0x5dbb27cb,
  20588. 0x4073a6f2,0x91dcab5d },
  20589. { 0x5f575a70,0x01b6cc3d,0x6f8d87fa,0x0cb36139,0x89981736,0x165d4e8c,
  20590. 0x97974f2b,0x17a0cedb } },
  20591. /* 89 */
  20592. { { 0x076c8d3a,0x38861e2a,0x210f924b,0x701aad39,0x13a835d9,0x94d0eae4,
  20593. 0x7f4cdf41,0x2e8ce36c },
  20594. { 0x037a862b,0x91273dab,0x60e4c8fa,0x01ba9bb7,0x33baf2dd,0xf9645388,
  20595. 0x34f668f3,0xf4ccc6cb } },
  20596. /* 90 */
  20597. { { 0xf1f79687,0x44ef525c,0x92efa815,0x7c595495,0xa5c78d29,0xe1231741,
  20598. 0x9a0df3c9,0xac0db488 },
  20599. { 0xdf01747f,0x86bfc711,0xef17df13,0x592b9358,0x5ccb6bb5,0xe5880e4f,
  20600. 0x94c974a2,0x95a64a61 } },
  20601. /* 91 */
  20602. { { 0xc15a4c93,0x72c1efda,0x82585141,0x40269b73,0x16cb0bad,0x6a8dfb1c,
  20603. 0x29210677,0x231e54ba },
  20604. { 0x8ae6d2dc,0xa70df917,0x39112918,0x4d6aa63f,0x5e5b7223,0xf627726b,
  20605. 0xd8a731e1,0xab0be032 } },
  20606. /* 92 */
  20607. { { 0x8d131f2d,0x097ad0e9,0x3b04f101,0x637f09e3,0xd5e9a748,0x1ac86196,
  20608. 0x2cf6a679,0xf1bcc880 },
  20609. { 0xe8daacb4,0x25c69140,0x60f65009,0x3c4e4055,0x477937a6,0x591cc8fc,
  20610. 0x5aebb271,0x85169469 } },
  20611. /* 93 */
  20612. { { 0xf1dcf593,0xde35c143,0xb018be3b,0x78202b29,0x9bdd9d3d,0xe9cdadc2,
  20613. 0xdaad55d8,0x8f67d9d2 },
  20614. { 0x7481ea5f,0x84111656,0xe34c590c,0xe7d2dde9,0x05053fa8,0xffdd43f4,
  20615. 0xc0728b5d,0xf84572b9 } },
  20616. /* 94 */
  20617. { { 0x97af71c9,0x5e1a7a71,0x7a736565,0xa1449444,0x0e1d5063,0xa1b4ae07,
  20618. 0x616b2c19,0xedee2710 },
  20619. { 0x11734121,0xb2f034f5,0x4a25e9f0,0x1cac6e55,0xa40c2ecf,0x8dc148f3,
  20620. 0x44ebd7f4,0x9fd27e9b } },
  20621. /* 95 */
  20622. { { 0xf6e2cb16,0x3cc7658a,0xfe5919b6,0xe3eb7d2c,0x168d5583,0x5a8c5816,
  20623. 0x958ff387,0xa40c2fb6 },
  20624. { 0xfedcc158,0x8c9ec560,0x55f23056,0x7ad804c6,0x9a307e12,0xd9396704,
  20625. 0x7dc6decf,0x99bc9bb8 } },
  20626. /* 96 */
  20627. { { 0x927dafc6,0x84a9521d,0x5c09cd19,0x52c1fb69,0xf9366dde,0x9d9581a0,
  20628. 0xa16d7e64,0x9abe210b },
  20629. { 0x48915220,0x480af84a,0x4dd816c6,0xfa73176a,0x1681ca5a,0xc7d53987,
  20630. 0x87f344b0,0x7881c257 } },
  20631. /* 97 */
  20632. { { 0xe0bcf3ff,0x93399b51,0x127f74f6,0x0d02cbc5,0xdd01d968,0x8fb465a2,
  20633. 0xa30e8940,0x15e6e319 },
  20634. { 0x3e0e05f4,0x646d6e0d,0x43588404,0xfad7bddc,0xc4f850d3,0xbe61c7d1,
  20635. 0x191172ce,0x0e55facf } },
  20636. /* 98 */
  20637. { { 0xf8787564,0x7e9d9806,0x31e85ce6,0x1a331721,0xb819e8d6,0x6b0158ca,
  20638. 0x6fe96577,0xd73d0976 },
  20639. { 0x1eb7206e,0x42483425,0xc618bb42,0xa519290f,0x5e30a520,0x5dcbb859,
  20640. 0x8f15a50b,0x9250a374 } },
  20641. /* 99 */
  20642. { { 0xbe577410,0xcaff08f8,0x5077a8c6,0xfd408a03,0xec0a63a4,0xf1f63289,
  20643. 0xc1cc8c0b,0x77414082 },
  20644. { 0xeb0991cd,0x05a40fa6,0x49fdc296,0xc1ca0866,0xb324fd40,0x3a68a3c7,
  20645. 0x12eb20b9,0x8cb04f4d } },
  20646. /* 100 */
  20647. { { 0x6906171c,0xb1c2d055,0xb0240c3f,0x9073e9cd,0xd8906841,0xdb8e6b4f,
  20648. 0x47123b51,0xe4e429ef },
  20649. { 0x38ec36f4,0x0b8dd53c,0xff4b6a27,0xf9d2dc01,0x879a9a48,0x5d066e07,
  20650. 0x3c6e6552,0x37bca2ff } },
  20651. /* 101 */
  20652. { { 0xdf562470,0x4cd2e3c7,0xc0964ac9,0x44f272a2,0x80c793be,0x7c6d5df9,
  20653. 0x3002b22a,0x59913edc },
  20654. { 0x5750592a,0x7a139a83,0xe783de02,0x99e01d80,0xea05d64f,0xcf8c0375,
  20655. 0xb013e226,0x43786e4a } },
  20656. /* 102 */
  20657. { { 0x9e56b5a6,0xff32b0ed,0xd9fc68f9,0x0750d9a6,0x597846a7,0xec15e845,
  20658. 0xb7e79e7a,0x8638ca98 },
  20659. { 0x0afc24b2,0x2f5ae096,0x4dace8f2,0x05398eaf,0xaecba78f,0x3b765dd0,
  20660. 0x7b3aa6f0,0x1ecdd36a } },
  20661. /* 103 */
  20662. { { 0x6c5ff2f3,0x5d3acd62,0x2873a978,0xa2d516c0,0xd2110d54,0xad94c9fa,
  20663. 0xd459f32d,0xd85d0f85 },
  20664. { 0x10b11da3,0x9f700b8d,0xa78318c4,0xd2c22c30,0x9208decd,0x556988f4,
  20665. 0xb4ed3c62,0xa04f19c3 } },
  20666. /* 104 */
  20667. { { 0xed7f93bd,0x087924c8,0x392f51f6,0xcb64ac5d,0x821b71af,0x7cae330a,
  20668. 0x5c0950b0,0x92b2eeea },
  20669. { 0x85b6e235,0x85ac4c94,0x2936c0f0,0xab2ca4a9,0xe0508891,0x80faa6b3,
  20670. 0x5834276c,0x1ee78221 } },
  20671. /* 105 */
  20672. { { 0xe63e79f7,0xa60a2e00,0xf399d906,0xf590e7b2,0x6607c09d,0x9021054a,
  20673. 0x57a6e150,0xf3f2ced8 },
  20674. { 0xf10d9b55,0x200510f3,0xd8642648,0x9d2fcfac,0xe8bd0e7c,0xe5631aa7,
  20675. 0x3da3e210,0x0f56a454 } },
  20676. /* 106 */
  20677. { { 0x1043e0df,0x5b21bffa,0x9c007e6d,0x6c74b6cc,0xd4a8517a,0x1a656ec0,
  20678. 0x1969e263,0xbd8f1741 },
  20679. { 0xbeb7494a,0x8a9bbb86,0x45f3b838,0x1567d46f,0xa4e5a79a,0xdf7a12a7,
  20680. 0x30ccfa09,0x2d1a1c35 } },
  20681. /* 107 */
  20682. { { 0x506508da,0x192e3813,0xa1d795a7,0x336180c4,0x7a9944b3,0xcddb5949,
  20683. 0xb91fba46,0xa107a65e },
  20684. { 0x0f94d639,0xe6d1d1c5,0x8a58b7d7,0x8b4af375,0xbd37ca1c,0x1a7c5584,
  20685. 0xf87a9af2,0x183d760a } },
  20686. /* 108 */
  20687. { { 0x0dde59a4,0x29d69711,0x0e8bef87,0xf1ad8d07,0x4f2ebe78,0x229b4963,
  20688. 0xc269d754,0x1d44179d },
  20689. { 0x8390d30e,0xb32dc0cf,0x0de8110c,0x0a3b2753,0x2bc0339a,0x31af1dc5,
  20690. 0x9606d262,0x771f9cc2 } },
  20691. /* 109 */
  20692. { { 0x85040739,0x99993e77,0x8026a939,0x44539db9,0xf5f8fc26,0xcf40f6f2,
  20693. 0x0362718e,0x64427a31 },
  20694. { 0x85428aa8,0x4f4f2d87,0xebfb49a8,0x7b7adc3f,0xf23d01ac,0x201b2c6d,
  20695. 0x6ae90d6d,0x49d9b749 } },
  20696. /* 110 */
  20697. { { 0x435d1099,0xcc78d8bc,0x8e8d1a08,0x2adbcd4e,0x2cb68a41,0x02c2e2a0,
  20698. 0x3f605445,0x9037d81b },
  20699. { 0x074c7b61,0x7cdbac27,0x57bfd72e,0xfe2031ab,0x596d5352,0x61ccec96,
  20700. 0x7cc0639c,0x08c3de6a } },
  20701. /* 111 */
  20702. { { 0xf6d552ab,0x20fdd020,0x05cd81f1,0x56baff98,0x91351291,0x06fb7c3e,
  20703. 0x45796b2f,0xc6909442 },
  20704. { 0x41231bd1,0x17b3ae9c,0x5cc58205,0x1eac6e87,0xf9d6a122,0x208837ab,
  20705. 0xcafe3ac0,0x3fa3db02 } },
  20706. /* 112 */
  20707. { { 0x05058880,0xd75a3e65,0x643943f2,0x7da365ef,0xfab24925,0x4147861c,
  20708. 0xfdb808ff,0xc5c4bdb0 },
  20709. { 0xb272b56b,0x73513e34,0x11b9043a,0xc8327e95,0xf8844969,0xfd8ce37d,
  20710. 0x46c2b6b5,0x2d56db94 } },
  20711. /* 113 */
  20712. { { 0xff46ac6b,0x2461782f,0x07a2e425,0xd19f7926,0x09a48de1,0xfafea3c4,
  20713. 0xe503ba42,0x0f56bd9d },
  20714. { 0x345cda49,0x137d4ed1,0x816f299d,0x821158fc,0xaeb43402,0xe7c6a54a,
  20715. 0x1173b5f1,0x4003bb9d } },
  20716. /* 114 */
  20717. { { 0xa0803387,0x3b8e8189,0x39cbd404,0xece115f5,0xd2877f21,0x4297208d,
  20718. 0xa07f2f9e,0x53765522 },
  20719. { 0xa8a4182d,0xa4980a21,0x3219df79,0xa2bbd07a,0x1a19a2d4,0x674d0a2e,
  20720. 0x6c5d4549,0x7a056f58 } },
  20721. /* 115 */
  20722. { { 0x9d8a2a47,0x646b2558,0xc3df2773,0x5b582948,0xabf0d539,0x51ec000e,
  20723. 0x7a1a2675,0x77d482f1 },
  20724. { 0x87853948,0xb8a1bd95,0x6cfbffee,0xa6f817bd,0x80681e47,0xab6ec057,
  20725. 0x2b38b0e4,0x4115012b } },
  20726. /* 116 */
  20727. { { 0x6de28ced,0x3c73f0f4,0x9b13ec47,0x1d5da760,0x6e5c6392,0x61b8ce9e,
  20728. 0xfbea0946,0xcdf04572 },
  20729. { 0x6c53c3b0,0x1cb3c58b,0x447b843c,0x97fe3c10,0x2cb9780e,0xfb2b8ae1,
  20730. 0x97383109,0xee703dda } },
  20731. /* 117 */
  20732. { { 0xff57e43a,0x34515140,0xb1b811b8,0xd44660d3,0x8f42b986,0x2b3b5dff,
  20733. 0xa162ce21,0x2a0ad89d },
  20734. { 0x6bc277ba,0x64e4a694,0xc141c276,0xc788c954,0xcabf6274,0x141aa64c,
  20735. 0xac2b4659,0xd62d0b67 } },
  20736. /* 118 */
  20737. { { 0x2c054ac4,0x39c5d87b,0xf27df788,0x57005859,0xb18128d6,0xedf7cbf3,
  20738. 0x991c2426,0xb39a23f2 },
  20739. { 0xf0b16ae5,0x95284a15,0xa136f51b,0x0c6a05b1,0xf2700783,0x1d63c137,
  20740. 0xc0674cc5,0x04ed0092 } },
  20741. /* 119 */
  20742. { { 0x9ae90393,0x1f4185d1,0x4a3d64e6,0x3047b429,0x9854fc14,0xae0001a6,
  20743. 0x0177c387,0xa0a91fc1 },
  20744. { 0xae2c831e,0xff0a3f01,0x2b727e16,0xbb76ae82,0x5a3075b4,0x8f12c8a1,
  20745. 0x9ed20c41,0x084cf988 } },
  20746. /* 120 */
  20747. { { 0xfca6becf,0xd98509de,0x7dffb328,0x2fceae80,0x4778e8b9,0x5d8a15c4,
  20748. 0x73abf77e,0xd57955b2 },
  20749. { 0x31b5d4f1,0x210da79e,0x3cfa7a1c,0xaa52f04b,0xdc27c20b,0xd4d12089,
  20750. 0x02d141f1,0x8e14ea42 } },
  20751. /* 121 */
  20752. { { 0xf2897042,0xeed50345,0x43402c4a,0x8d05331f,0xc8bdfb21,0xc8d9c194,
  20753. 0x2aa4d158,0x597e1a37 },
  20754. { 0xcf0bd68c,0x0327ec1a,0xab024945,0x6d4be0dc,0xc9fe3e84,0x5b9c8d7a,
  20755. 0x199b4dea,0xca3f0236 } },
  20756. /* 122 */
  20757. { { 0x6170bd20,0x592a10b5,0x6d3f5de7,0x0ea897f1,0x44b2ade2,0xa3363ff1,
  20758. 0x309c07e4,0xbde7fd7e },
  20759. { 0xb8f5432c,0x516bb6d2,0xe043444b,0x210dc1cb,0xf8f95b5a,0x3db01e6f,
  20760. 0x0a7dd198,0xb623ad0e } },
  20761. /* 123 */
  20762. { { 0x60c7b65b,0xa75bd675,0x23a4a289,0xab8c5590,0xd7b26795,0xf8220fd0,
  20763. 0x58ec137b,0xd6aa2e46 },
  20764. { 0x5138bb85,0x10abc00b,0xd833a95c,0x8c31d121,0x1702a32e,0xb24ff00b,
  20765. 0x2dcc513a,0x111662e0 } },
  20766. /* 124 */
  20767. { { 0xefb42b87,0x78114015,0x1b6c4dff,0xbd9f5d70,0xa7d7c129,0x66ecccd7,
  20768. 0x94b750f8,0xdb3ee1cb },
  20769. { 0xf34837cf,0xb26f3db0,0xb9578d4f,0xe7eed18b,0x7c56657d,0x5d2cdf93,
  20770. 0x52206a59,0x886a6442 } },
  20771. /* 125 */
  20772. { { 0x65b569ea,0x3c234cfb,0xf72119c1,0x20011141,0xa15a619e,0x8badc85d,
  20773. 0x018a17bc,0xa70cf4eb },
  20774. { 0x8c4a6a65,0x224f97ae,0x0134378f,0x36e5cf27,0x4f7e0960,0xbe3a609e,
  20775. 0xd1747b77,0xaa4772ab } },
  20776. /* 126 */
  20777. { { 0x7aa60cc0,0x67676131,0x0368115f,0xc7916361,0xbbc1bb5a,0xded98bb4,
  20778. 0x30faf974,0x611a6ddc },
  20779. { 0xc15ee47a,0x30e78cbc,0x4e0d96a5,0x2e896282,0x3dd9ed88,0x36f35adf,
  20780. 0x16429c88,0x5cfffaf8 } },
  20781. /* 127 */
  20782. { { 0x9b7a99cd,0xc0d54cff,0x843c45a1,0x7bf3b99d,0x62c739e1,0x038a908f,
  20783. 0x7dc1994c,0x6e5a6b23 },
  20784. { 0x0ba5db77,0xef8b454e,0xacf60d63,0xb7b8807f,0x76608378,0xe591c0c6,
  20785. 0x242dabcc,0x481a238d } },
  20786. /* 128 */
  20787. { { 0x35d0b34a,0xe3417bc0,0x8327c0a7,0x440b386b,0xac0362d1,0x8fb7262d,
  20788. 0xe0cdf943,0x2c41114c },
  20789. { 0xad95a0b1,0x2ba5cef1,0x67d54362,0xc09b37a8,0x01e486c9,0x26d6cdd2,
  20790. 0x42ff9297,0x20477abf } },
  20791. /* 129 */
  20792. { { 0x18d65dbf,0x2f75173c,0x339edad8,0x77bf940e,0xdcf1001c,0x7022d26b,
  20793. 0xc77396b6,0xac66409a },
  20794. { 0xc6261cc3,0x8b0bb36f,0x190e7e90,0x213f7bc9,0xa45e6c10,0x6541ceba,
  20795. 0xcc122f85,0xce8e6975 } },
  20796. /* 130 */
  20797. { { 0xbc0a67d2,0x0f121b41,0x444d248a,0x62d4760a,0x659b4737,0x0e044f1d,
  20798. 0x250bb4a8,0x08fde365 },
  20799. { 0x848bf287,0xaceec3da,0xd3369d6e,0xc2a62182,0x92449482,0x3582dfdc,
  20800. 0x565d6cd7,0x2f7e2fd2 } },
  20801. /* 131 */
  20802. { { 0xc3770fa7,0xae4b92db,0x379043f9,0x095e8d5c,0x17761171,0x54f34e9d,
  20803. 0x907702ae,0xc65be92e },
  20804. { 0xf6fd0a40,0x2758a303,0xbcce784b,0xe7d822e3,0x4f9767bf,0x7ae4f585,
  20805. 0xd1193b3a,0x4bff8e47 } },
  20806. /* 132 */
  20807. { { 0x00ff1480,0xcd41d21f,0x0754db16,0x2ab8fb7d,0xbbe0f3ea,0xac81d2ef,
  20808. 0x5772967d,0x3e4e4ae6 },
  20809. { 0x3c5303e6,0x7e18f36d,0x92262397,0x3bd9994b,0x1324c3c0,0x9ed70e26,
  20810. 0x58ec6028,0x5388aefd } },
  20811. /* 133 */
  20812. { { 0x5e5d7713,0xad1317eb,0x75de49da,0x09b985ee,0xc74fb261,0x32f5bc4f,
  20813. 0x4f75be0e,0x5cf908d1 },
  20814. { 0x8e657b12,0x76043510,0xb96ed9e6,0xbfd421a5,0x8970ccc2,0x0e29f51f,
  20815. 0x60f00ce2,0xa698ba40 } },
  20816. /* 134 */
  20817. { { 0xef748fec,0x73db1686,0x7e9d2cf9,0xe6e755a2,0xce265eff,0x630b6544,
  20818. 0x7aebad8d,0xb142ef8a },
  20819. { 0x17d5770a,0xad31af9f,0x2cb3412f,0x66af3b67,0xdf3359de,0x6bd60d1b,
  20820. 0x58515075,0xd1896a96 } },
  20821. /* 135 */
  20822. { { 0x33c41c08,0xec5957ab,0x5468e2e1,0x87de94ac,0xac472f6c,0x18816b73,
  20823. 0x7981da39,0x267b0e0b },
  20824. { 0x8e62b988,0x6e554e5d,0x116d21e7,0xd8ddc755,0x3d2a6f99,0x4610faf0,
  20825. 0xa1119393,0xb54e287a } },
  20826. /* 136 */
  20827. { { 0x178a876b,0x0a0122b5,0x085104b4,0x51ff96ff,0x14f29f76,0x050b31ab,
  20828. 0x5f87d4e6,0x84abb28b },
  20829. { 0x8270790a,0xd5ed439f,0x85e3f46b,0x2d6cb59d,0x6c1e2212,0x75f55c1b,
  20830. 0x17655640,0xe5436f67 } },
  20831. /* 137 */
  20832. { { 0x2286e8d5,0x53f9025e,0x864453be,0x353c95b4,0xe408e3a0,0xd832f5bd,
  20833. 0x5b9ce99e,0x0404f68b },
  20834. { 0xa781e8e5,0xcad33bde,0x163c2f5b,0x3cdf5018,0x0119caa3,0x57576960,
  20835. 0x0ac1c701,0x3a4263df } },
  20836. /* 138 */
  20837. { { 0x9aeb596d,0xc2965ecc,0x023c92b4,0x01ea03e7,0x2e013961,0x4704b4b6,
  20838. 0x905ea367,0x0ca8fd3f },
  20839. { 0x551b2b61,0x92523a42,0x390fcd06,0x1eb7a89c,0x0392a63e,0xe7f1d2be,
  20840. 0x4ddb0c33,0x96dca264 } },
  20841. /* 139 */
  20842. { { 0x387510af,0x203bb43a,0xa9a36a01,0x846feaa8,0x2f950378,0xd23a5770,
  20843. 0x3aad59dc,0x4363e212 },
  20844. { 0x40246a47,0xca43a1c7,0xe55dd24d,0xb362b8d2,0x5d8faf96,0xf9b08604,
  20845. 0xd8bb98c4,0x840e115c } },
  20846. /* 140 */
  20847. { { 0x1023e8a7,0xf12205e2,0xd8dc7a0b,0xc808a8cd,0x163a5ddf,0xe292a272,
  20848. 0x30ded6d4,0x5e0d6abd },
  20849. { 0x7cfc0f64,0x07a721c2,0x0e55ed88,0x42eec01d,0x1d1f9db2,0x26a7bef9,
  20850. 0x2945a25a,0x7dea48f4 } },
  20851. /* 141 */
  20852. { { 0xe5060a81,0xabdf6f1c,0xf8f95615,0xe79f9c72,0x06ac268b,0xcfd36c54,
  20853. 0xebfd16d1,0xabc2a2be },
  20854. { 0xd3e2eac7,0x8ac66f91,0xd2dd0466,0x6f10ba63,0x0282d31b,0x6790e377,
  20855. 0x6c7eefc1,0x4ea35394 } },
  20856. /* 142 */
  20857. { { 0x5266309d,0xed8a2f8d,0x81945a3e,0x0a51c6c0,0x578c5dc1,0xcecaf45a,
  20858. 0x1c94ffc3,0x3a76e689 },
  20859. { 0x7d7b0d0f,0x9aace8a4,0x8f584a5f,0x963ace96,0x4e697fbe,0x51a30c72,
  20860. 0x465e6464,0x8212a10a } },
  20861. /* 143 */
  20862. { { 0xcfab8caa,0xef7c61c3,0x0e142390,0x18eb8e84,0x7e9733ca,0xcd1dff67,
  20863. 0x599cb164,0xaa7cab71 },
  20864. { 0xbc837bd1,0x02fc9273,0xc36af5d7,0xc06407d0,0xf423da49,0x17621292,
  20865. 0xfe0617c3,0x40e38073 } },
  20866. /* 144 */
  20867. { { 0xa7bf9b7c,0xf4f80824,0x3fbe30d0,0x365d2320,0x97cf9ce3,0xbfbe5320,
  20868. 0xb3055526,0xe3604700 },
  20869. { 0x6cc6c2c7,0x4dcb9911,0xba4cbee6,0x72683708,0x637ad9ec,0xdcded434,
  20870. 0xa3dee15f,0x6542d677 } },
  20871. /* 145 */
  20872. { { 0x7b6c377a,0x3f32b6d0,0x903448be,0x6cb03847,0x20da8af7,0xd6fdd3a8,
  20873. 0x09bb6f21,0xa6534aee },
  20874. { 0x1035facf,0x30a1780d,0x9dcb47e6,0x35e55a33,0xc447f393,0x6ea50fe1,
  20875. 0xdc9aef22,0xf3cb672f } },
  20876. /* 146 */
  20877. { { 0x3b55fd83,0xeb3719fe,0x875ddd10,0xe0d7a46c,0x05cea784,0x33ac9fa9,
  20878. 0xaae870e7,0x7cafaa2e },
  20879. { 0x1d53b338,0x9b814d04,0xef87e6c6,0xe0acc0a0,0x11672b0f,0xfb93d108,
  20880. 0xb9bd522e,0x0aab13c1 } },
  20881. /* 147 */
  20882. { { 0xd2681297,0xddcce278,0xb509546a,0xcb350eb1,0x7661aaf2,0x2dc43173,
  20883. 0x847012e9,0x4b91a602 },
  20884. { 0x72f8ddcf,0xdcff1095,0x9a911af4,0x08ebf61e,0xc372430e,0x48f4360a,
  20885. 0x72321cab,0x49534c53 } },
  20886. /* 148 */
  20887. { { 0xf07b7e9d,0x83df7d71,0x13cd516f,0xa478efa3,0x6c047ee3,0x78ef264b,
  20888. 0xd65ac5ee,0xcaf46c4f },
  20889. { 0x92aa8266,0xa04d0c77,0x913684bb,0xedf45466,0xae4b16b0,0x56e65168,
  20890. 0x04c6770f,0x14ce9e57 } },
  20891. /* 149 */
  20892. { { 0x965e8f91,0x99445e3e,0xcb0f2492,0xd3aca1ba,0x90c8a0a0,0xd31cc70f,
  20893. 0x3e4c9a71,0x1bb708a5 },
  20894. { 0x558bdd7a,0xd5ca9e69,0x018a26b1,0x734a0508,0x4c9cf1ec,0xb093aa71,
  20895. 0xda300102,0xf9d126f2 } },
  20896. /* 150 */
  20897. { { 0xaff9563e,0x749bca7a,0xb49914a0,0xdd077afe,0xbf5f1671,0xe27a0311,
  20898. 0x729ecc69,0x807afcb9 },
  20899. { 0xc9b08b77,0x7f8a9337,0x443c7e38,0x86c3a785,0x476fd8ba,0x85fafa59,
  20900. 0x6568cd8c,0x751adcd1 } },
  20901. /* 151 */
  20902. { { 0x10715c0d,0x8aea38b4,0x8f7697f7,0xd113ea71,0x93fbf06d,0x665eab14,
  20903. 0x2537743f,0x29ec4468 },
  20904. { 0xb50bebbc,0x3d94719c,0xe4505422,0x399ee5bf,0x8d2dedb1,0x90cd5b3a,
  20905. 0x92a4077d,0xff9370e3 } },
  20906. /* 152 */
  20907. { { 0xc6b75b65,0x59a2d69b,0x266651c5,0x4188f8d5,0x3de9d7d2,0x28a9f33e,
  20908. 0xa2a9d01a,0x9776478b },
  20909. { 0x929af2c7,0x8852622d,0x4e690923,0x334f5d6d,0xa89a51e9,0xce6cc7e5,
  20910. 0xac2f82fa,0x74a6313f } },
  20911. /* 153 */
  20912. { { 0xb75f079c,0xb2f4dfdd,0x18e36fbb,0x85b07c95,0xe7cd36dd,0x1b6cfcf0,
  20913. 0x0ff4863d,0xab75be15 },
  20914. { 0x173fc9b7,0x81b367c0,0xd2594fd0,0xb90a7420,0xc4091236,0x15fdbf03,
  20915. 0x0b4459f6,0x4ebeac2e } },
  20916. /* 154 */
  20917. { { 0x5c9f2c53,0xeb6c5fe7,0x8eae9411,0xd2522011,0xf95ac5d8,0xc8887633,
  20918. 0x2c1baffc,0xdf99887b },
  20919. { 0x850aaecb,0xbb78eed2,0x01d6a272,0x9d49181b,0xb1cdbcac,0x978dd511,
  20920. 0x779f4058,0x27b040a7 } },
  20921. /* 155 */
  20922. { { 0xf73b2eb2,0x90405db7,0x8e1b2118,0xe0df8508,0x5962327e,0x501b7152,
  20923. 0xe4cfa3f5,0xb393dd37 },
  20924. { 0x3fd75165,0xa1230e7b,0xbcd33554,0xd66344c2,0x0f7b5022,0x6c36f1be,
  20925. 0xd0463419,0x09588c12 } },
  20926. /* 156 */
  20927. { { 0x02601c3b,0xe086093f,0xcf5c335f,0xfb0252f8,0x894aff28,0x955cf280,
  20928. 0xdb9f648b,0x81c879a9 },
  20929. { 0xc6f56c51,0x040e687c,0x3f17618c,0xfed47169,0x9059353b,0x44f88a41,
  20930. 0x5fc11bc4,0xfa0d48f5 } },
  20931. /* 157 */
  20932. { { 0xe1608e4d,0xbc6e1c9d,0x3582822c,0x010dda11,0x157ec2d7,0xf6b7ddc1,
  20933. 0xb6a367d6,0x8ea0e156 },
  20934. { 0x2383b3b4,0xa354e02f,0x3f01f53c,0x69966b94,0x2de03ca5,0x4ff6632b,
  20935. 0xfa00b5ac,0x3f5ab924 } },
  20936. /* 158 */
  20937. { { 0x59739efb,0x337bb0d9,0xe7ebec0d,0xc751b0f4,0x411a67d1,0x2da52dd6,
  20938. 0x2b74256e,0x8bc76887 },
  20939. { 0x82d3d253,0xa5be3b72,0xf58d779f,0xa9f679a1,0xe16767bb,0xa1cac168,
  20940. 0x60fcf34f,0xb386f190 } },
  20941. /* 159 */
  20942. { { 0x2fedcfc2,0x31f3c135,0x62f8af0d,0x5396bf62,0xe57288c2,0x9a02b4ea,
  20943. 0x1b069c4d,0x4cb460f7 },
  20944. { 0x5b8095ea,0xae67b4d3,0x6fc07603,0x92bbf859,0xb614a165,0xe1475f66,
  20945. 0x95ef5223,0x52c0d508 } },
  20946. /* 160 */
  20947. { { 0x15339848,0x231c210e,0x70778c8d,0xe87a28e8,0x6956e170,0x9d1de661,
  20948. 0x2bb09c0b,0x4ac3c938 },
  20949. { 0x6998987d,0x19be0551,0xae09f4d6,0x8b2376c4,0x1a3f933d,0x1de0b765,
  20950. 0xe39705f4,0x380d94c7 } },
  20951. /* 161 */
  20952. { { 0x81542e75,0x01a355aa,0xee01b9b7,0x96c724a1,0x624d7087,0x6b3a2977,
  20953. 0xde2637af,0x2ce3e171 },
  20954. { 0xf5d5bc1a,0xcfefeb49,0x2777e2b5,0xa655607e,0x9513756c,0x4feaac2f,
  20955. 0x0b624e4d,0x2e6cd852 } },
  20956. /* 162 */
  20957. { { 0x8c31c31d,0x3685954b,0x5bf21a0c,0x68533d00,0x75c79ec9,0x0bd7626e,
  20958. 0x42c69d54,0xca177547 },
  20959. { 0xf6d2dbb2,0xcc6edaff,0x174a9d18,0xfd0d8cbd,0xaa4578e8,0x875e8793,
  20960. 0x9cab2ce6,0xa976a713 } },
  20961. /* 163 */
  20962. { { 0x93fb353d,0x0a651f1b,0x57fcfa72,0xd75cab8b,0x31b15281,0xaa88cfa7,
  20963. 0x0a1f4999,0x8720a717 },
  20964. { 0x693e1b90,0x8c3e8d37,0x16f6dfc3,0xd345dc0b,0xb52a8742,0x8ea8d00a,
  20965. 0xc769893c,0x9719ef29 } },
  20966. /* 164 */
  20967. { { 0x58e35909,0x820eed8d,0x33ddc116,0x9366d8dc,0x6e205026,0xd7f999d0,
  20968. 0xe15704c1,0xa5072976 },
  20969. { 0xc4e70b2e,0x002a37ea,0x6890aa8a,0x84dcf657,0x645b2a5c,0xcd71bf18,
  20970. 0xf7b77725,0x99389c9d } },
  20971. /* 165 */
  20972. { { 0x7ada7a4b,0x238c08f2,0xfd389366,0x3abe9d03,0x766f512c,0x6b672e89,
  20973. 0x202c82e4,0xa88806aa },
  20974. { 0xd380184e,0x6602044a,0x126a8b85,0xa8cb78c4,0xad844f17,0x79d670c0,
  20975. 0x4738dcfe,0x0043bffb } },
  20976. /* 166 */
  20977. { { 0x36d5192e,0x8d59b5dc,0x4590b2af,0xacf885d3,0x11601781,0x83566d0a,
  20978. 0xba6c4866,0x52f3ef01 },
  20979. { 0x0edcb64d,0x3986732a,0x8068379f,0x0a482c23,0x7040f309,0x16cbe5fa,
  20980. 0x9ef27e75,0x3296bd89 } },
  20981. /* 167 */
  20982. { { 0x454d81d7,0x476aba89,0x51eb9b3c,0x9eade7ef,0x81c57986,0x619a21cd,
  20983. 0xaee571e9,0x3b90febf },
  20984. { 0x5496f7cb,0x9393023e,0x7fb51bc4,0x55be41d8,0x99beb5ce,0x03f1dd48,
  20985. 0x9f810b18,0x6e88069d } },
  20986. /* 168 */
  20987. { { 0xb43ea1db,0xce37ab11,0x5259d292,0x0a7ff1a9,0x8f84f186,0x851b0221,
  20988. 0xdefaad13,0xa7222bea },
  20989. { 0x2b0a9144,0xa2ac78ec,0xf2fa59c5,0x5a024051,0x6147ce38,0x91d1eca5,
  20990. 0xbc2ac690,0xbe94d523 } },
  20991. /* 169 */
  20992. { { 0x0b226ce7,0x72f4945e,0x967e8b70,0xb8afd747,0x85a6c63e,0xedea46f1,
  20993. 0x9be8c766,0x7782defe },
  20994. { 0x3db38626,0x760d2aa4,0x76f67ad1,0x460ae787,0x54499cdb,0x341b86fc,
  20995. 0xa2892e4b,0x03838567 } },
  20996. /* 170 */
  20997. { { 0x79ec1a0f,0x2d8daefd,0xceb39c97,0x3bbcd6fd,0x58f61a95,0xf5575ffc,
  20998. 0xadf7b420,0xdbd986c4 },
  20999. { 0x15f39eb7,0x81aa8814,0xb98d976c,0x6ee2fcf5,0xcf2f717d,0x5465475d,
  21000. 0x6860bbd0,0x8e24d3c4 } },
  21001. /* 171 */
  21002. { { 0x9a587390,0x749d8e54,0x0cbec588,0x12bb194f,0xb25983c6,0x46e07da4,
  21003. 0x407bafc8,0x541a99c4 },
  21004. { 0x624c8842,0xdb241692,0xd86c05ff,0x6044c12a,0x4f7fcf62,0xc59d14b4,
  21005. 0xf57d35d1,0xc0092c49 } },
  21006. /* 172 */
  21007. { { 0xdf2e61ef,0xd3cc75c3,0x2e1b35ca,0x7e8841c8,0x909f29f4,0xc62d30d1,
  21008. 0x7286944d,0x75e40634 },
  21009. { 0xbbc237d0,0xe7d41fc5,0xec4f01c9,0xc9537bf0,0x282bd534,0x91c51a16,
  21010. 0xc7848586,0x5b7cb658 } },
  21011. /* 173 */
  21012. { { 0x8a28ead1,0x964a7084,0xfd3b47f6,0x802dc508,0x767e5b39,0x9ae4bfd1,
  21013. 0x8df097a1,0x7ae13eba },
  21014. { 0xeadd384e,0xfd216ef8,0xb6b2ff06,0x0361a2d9,0x4bcdb5f3,0x204b9878,
  21015. 0xe2a8e3fd,0x787d8074 } },
  21016. /* 174 */
  21017. { { 0x757fbb1c,0xc5e25d6b,0xca201deb,0xe47bddb2,0x6d2233ff,0x4a55e9a3,
  21018. 0x9ef28484,0x5c222819 },
  21019. { 0x88315250,0x773d4a85,0x827097c1,0x21b21a2b,0xdef5d33f,0xab7c4ea1,
  21020. 0xbaf0f2b0,0xe45d37ab } },
  21021. /* 175 */
  21022. { { 0x28511c8a,0xd2df1e34,0xbdca6cd3,0xebb229c8,0x627c39a7,0x578a71a7,
  21023. 0x84dfb9d3,0xed7bc122 },
  21024. { 0x93dea561,0xcf22a6df,0xd48f0ed1,0x5443f18d,0x5bad23e8,0xd8b86140,
  21025. 0x45ca6d27,0xaac97cc9 } },
  21026. /* 176 */
  21027. { { 0xa16bd00a,0xeb54ea74,0xf5c0bcc1,0xd839e9ad,0x1f9bfc06,0x092bb7f1,
  21028. 0x1163dc4e,0x318f97b3 },
  21029. { 0xc30d7138,0xecc0c5be,0xabc30220,0x44e8df23,0xb0223606,0x2bb7972f,
  21030. 0x9a84ff4d,0xfa41faa1 } },
  21031. /* 177 */
  21032. { { 0xa6642269,0x4402d974,0x9bb783bd,0xc81814ce,0x7941e60b,0x398d38e4,
  21033. 0x1d26e9e2,0x38bb6b2c },
  21034. { 0x6a577f87,0xc64e4a25,0xdc11fe1c,0x8b52d253,0x62280728,0xff336abf,
  21035. 0xce7601a5,0x94dd0905 } },
  21036. /* 178 */
  21037. { { 0xde93f92a,0x156cf7dc,0x89b5f315,0xa01333cb,0xc995e750,0x02404df9,
  21038. 0xd25c2ae9,0x92077867 },
  21039. { 0x0bf39d44,0xe2471e01,0x96bb53d7,0x5f2c9020,0x5c9c3d8f,0x4c44b7b3,
  21040. 0xd29beb51,0x81e8428b } },
  21041. /* 179 */
  21042. { { 0xc477199f,0x6dd9c2ba,0x6b5ecdd9,0x8cb8eeee,0xee40fd0e,0x8af7db3f,
  21043. 0xdbbfa4b1,0x1b94ab62 },
  21044. { 0xce47f143,0x44f0d8b3,0x63f46163,0x51e623fc,0xcc599383,0xf18f270f,
  21045. 0x055590ee,0x06a38e28 } },
  21046. /* 180 */
  21047. { { 0xb3355b49,0x2e5b0139,0xb4ebf99b,0x20e26560,0xd269f3dc,0xc08ffa6b,
  21048. 0x83d9d4f8,0xa7b36c20 },
  21049. { 0x1b3e8830,0x64d15c3a,0xa89f9c0b,0xd5fceae1,0xe2d16930,0xcfeee4a2,
  21050. 0xa2822a20,0xbe54c6b4 } },
  21051. /* 181 */
  21052. { { 0x8d91167c,0xd6cdb3df,0xe7a6625e,0x517c3f79,0x346ac7f4,0x7105648f,
  21053. 0xeae022bb,0xbf30a5ab },
  21054. { 0x93828a68,0x8e7785be,0x7f3ef036,0x5161c332,0x592146b2,0xe11b5feb,
  21055. 0x2732d13a,0xd1c820de } },
  21056. /* 182 */
  21057. { { 0x9038b363,0x043e1347,0x6b05e519,0x58c11f54,0x6026cad1,0x4fe57abe,
  21058. 0x68a18da3,0xb7d17bed },
  21059. { 0xe29c2559,0x44ca5891,0x5bfffd84,0x4f7a0376,0x74e46948,0x498de4af,
  21060. 0x6412cc64,0x3997fd5e } },
  21061. /* 183 */
  21062. { { 0x8bd61507,0xf2074682,0x34a64d2a,0x29e132d5,0x8a8a15e3,0xffeddfb0,
  21063. 0x3c6c13e8,0x0eeb8929 },
  21064. { 0xa7e259f8,0xe9b69a3e,0xd13e7e67,0xce1db7e6,0xad1fa685,0x277318f6,
  21065. 0xc922b6ef,0x228916f8 } },
  21066. /* 184 */
  21067. { { 0x0a12ab5b,0x959ae25b,0x957bc136,0xcc11171f,0xd16e2b0c,0x8058429e,
  21068. 0x6e93097e,0xec05ad1d },
  21069. { 0xac3f3708,0x157ba5be,0x30b59d77,0x31baf935,0x118234e5,0x47b55237,
  21070. 0x7ff11b37,0x7d314156 } },
  21071. /* 185 */
  21072. { { 0xf6dfefab,0x7bd9c05c,0xdcb37707,0xbe2f2268,0x3a38bb95,0xe53ead97,
  21073. 0x9bc1d7a3,0xe9ce66fc },
  21074. { 0x6f6a02a1,0x75aa1576,0x60e600ed,0x38c087df,0x68cdc1b9,0xf8947f34,
  21075. 0x72280651,0xd9650b01 } },
  21076. /* 186 */
  21077. { { 0x5a057e60,0x504b4c4a,0x8def25e4,0xcbccc3be,0x17c1ccbd,0xa6353208,
  21078. 0x804eb7a2,0x14d6699a },
  21079. { 0xdb1f411a,0x2c8a8415,0xf80d769c,0x09fbaf0b,0x1c2f77ad,0xb4deef90,
  21080. 0x0d43598a,0x6f4c6841 } },
  21081. /* 187 */
  21082. { { 0x96c24a96,0x8726df4e,0xfcbd99a3,0x534dbc85,0x8b2ae30a,0x3c466ef2,
  21083. 0x61189abb,0x4c4350fd },
  21084. { 0xf855b8da,0x2967f716,0x463c38a1,0x41a42394,0xeae93343,0xc37e1413,
  21085. 0x5a3118b5,0xa726d242 } },
  21086. /* 188 */
  21087. { { 0x948c1086,0xdae6b3ee,0xcbd3a2e1,0xf1de503d,0x03d022f3,0x3f35ed3f,
  21088. 0xcc6cf392,0x13639e82 },
  21089. { 0xcdafaa86,0x9ac938fb,0x2654a258,0xf45bc5fb,0x45051329,0x1963b26e,
  21090. 0xc1a335a3,0xca9365e1 } },
  21091. /* 189 */
  21092. { { 0x4c3b2d20,0x3615ac75,0x904e241b,0x742a5417,0xcc9d071d,0xb08521c4,
  21093. 0x970b72a5,0x9ce29c34 },
  21094. { 0x6d3e0ad6,0x8cc81f73,0xf2f8434c,0x8060da9e,0x6ce862d9,0x35ed1d1a,
  21095. 0xab42af98,0x48c4abd7 } },
  21096. /* 190 */
  21097. { { 0x40c7485a,0xd221b0cc,0xe5274dbf,0xead455bb,0x9263d2e8,0x493c7698,
  21098. 0xf67b33cb,0x78017c32 },
  21099. { 0x930cb5ee,0xb9d35769,0x0c408ed2,0xc0d14e94,0x272f1a4d,0xf8b7bf55,
  21100. 0xde5c1c04,0x53cd0454 } },
  21101. /* 191 */
  21102. { { 0x5d28ccac,0xbcd585fa,0x005b746e,0x5f823e56,0xcd0123aa,0x7c79f0a1,
  21103. 0xd3d7fa8f,0xeea465c1 },
  21104. { 0x0551803b,0x7810659f,0x7ce6af70,0x6c0b599f,0x29288e70,0x4195a770,
  21105. 0x7ae69193,0x1b6e42a4 } },
  21106. /* 192 */
  21107. { { 0xf67d04c3,0x2e80937c,0x89eeb811,0x1e312be2,0x92594d60,0x56b5d887,
  21108. 0x187fbd3d,0x0224da14 },
  21109. { 0x0c5fe36f,0x87abb863,0x4ef51f5f,0x580f3c60,0xb3b429ec,0x964fb1bf,
  21110. 0x42bfff33,0x60838ef0 } },
  21111. /* 193 */
  21112. { { 0x7e0bbe99,0x432cb2f2,0x04aa39ee,0x7bda44f3,0x9fa93903,0x5f497c7a,
  21113. 0x2d331643,0x636eb202 },
  21114. { 0x93ae00aa,0xfcfd0e61,0x31ae6d2f,0x875a00fe,0x9f93901c,0xf43658a2,
  21115. 0x39218bac,0x8844eeb6 } },
  21116. /* 194 */
  21117. { { 0x6b3bae58,0x114171d2,0x17e39f3e,0x7db3df71,0x81a8eada,0xcd37bc7f,
  21118. 0x51fb789e,0x27ba83dc },
  21119. { 0xfbf54de5,0xa7df439f,0xb5fe1a71,0x7277030b,0xdb297a48,0x42ee8e35,
  21120. 0x87f3a4ab,0xadb62d34 } },
  21121. /* 195 */
  21122. { { 0xa175df2a,0x9b1168a2,0x618c32e9,0x082aa04f,0x146b0916,0xc9e4f2e7,
  21123. 0x75e7c8b2,0xb990fd76 },
  21124. { 0x4df37313,0x0829d96b,0xd0b40789,0x1c205579,0x78087711,0x66c9ae4a,
  21125. 0x4d10d18d,0x81707ef9 } },
  21126. /* 196 */
  21127. { { 0x03d6ff96,0x97d7cab2,0x0d843360,0x5b851bfc,0xd042db4b,0x268823c4,
  21128. 0xd5a8aa5c,0x3792daea },
  21129. { 0x941afa0b,0x52818865,0x42d83671,0xf3e9e741,0x5be4e0a7,0x17c82527,
  21130. 0x94b001ba,0x5abd635e } },
  21131. /* 197 */
  21132. { { 0x0ac4927c,0x727fa84e,0xa7c8cf23,0xe3886035,0x4adca0df,0xa4bcd5ea,
  21133. 0x846ab610,0x5995bf21 },
  21134. { 0x829dfa33,0xe90f860b,0x958fc18b,0xcaafe2ae,0x78630366,0x9b3baf44,
  21135. 0xd483411e,0x44c32ca2 } },
  21136. /* 198 */
  21137. { { 0xe40ed80c,0xa74a97f1,0x31d2ca82,0x5f938cb1,0x7c2d6ad9,0x53f2124b,
  21138. 0x8082a54c,0x1f2162fb },
  21139. { 0x720b173e,0x7e467cc5,0x085f12f9,0x40e8a666,0x4c9d65dc,0x8cebc20e,
  21140. 0xc3e907c9,0x8f1d402b } },
  21141. /* 199 */
  21142. { { 0xfbc4058a,0x4f592f9c,0x292f5670,0xb15e14b6,0xbc1d8c57,0xc55cfe37,
  21143. 0x926edbf9,0xb1980f43 },
  21144. { 0x32c76b09,0x98c33e09,0x33b07f78,0x1df5279d,0x863bb461,0x6f08ead4,
  21145. 0x37448e45,0x2828ad9b } },
  21146. /* 200 */
  21147. { { 0xc4cf4ac5,0x696722c4,0xdde64afb,0xf5ac1a3f,0xe0890832,0x0551baa2,
  21148. 0x5a14b390,0x4973f127 },
  21149. { 0x322eac5d,0xe59d8335,0x0bd9b568,0x5e07eef5,0xa2588393,0xab36720f,
  21150. 0xdb168ac7,0x6dac8ed0 } },
  21151. /* 201 */
  21152. { { 0xeda835ef,0xf7b545ae,0x1d10ed51,0x4aa113d2,0x13741b09,0x035a65e0,
  21153. 0x20b9de4c,0x4b23ef59 },
  21154. { 0x3c4c7341,0xe82bb680,0x3f58bc37,0xd457706d,0xa51e3ee8,0x73527863,
  21155. 0xddf49a4e,0x4dd71534 } },
  21156. /* 202 */
  21157. { { 0x95476cd9,0xbf944672,0xe31a725b,0x648d072f,0xfc4b67e0,0x1441c8b8,
  21158. 0x2f4a4dbb,0xfd317000 },
  21159. { 0x8995d0e1,0x1cb43ff4,0x0ef729aa,0x76e695d1,0x41798982,0xe0d5f976,
  21160. 0x9569f365,0x14fac58c } },
  21161. /* 203 */
  21162. { { 0xf312ae18,0xad9a0065,0xfcc93fc9,0x51958dc0,0x8a7d2846,0xd9a14240,
  21163. 0x36abda50,0xed7c7651 },
  21164. { 0x25d4abbc,0x46270f1a,0xf1a113ea,0x9b5dd8f3,0x5b51952f,0xc609b075,
  21165. 0x4d2e9f53,0xfefcb7f7 } },
  21166. /* 204 */
  21167. { { 0xba119185,0xbd09497a,0xaac45ba4,0xd54e8c30,0xaa521179,0x492479de,
  21168. 0x87e0d80b,0x1801a57e },
  21169. { 0xfcafffb0,0x073d3f8d,0xae255240,0x6cf33c0b,0x5b5fdfbc,0x781d763b,
  21170. 0x1ead1064,0x9f8fc11e } },
  21171. /* 205 */
  21172. { { 0x5e69544c,0x1583a171,0xf04b7813,0x0eaf8567,0x278a4c32,0x1e22a8fd,
  21173. 0x3d3a69a9,0xa9d3809d },
  21174. { 0x59a2da3b,0x936c2c2c,0x1895c847,0x38ccbcf6,0x63d50869,0x5e65244e,
  21175. 0xe1178ef7,0x3006b9ae } },
  21176. /* 206 */
  21177. { { 0xc9eead28,0x0bb1f2b0,0x89f4dfbc,0x7eef635d,0xb2ce8939,0x074757fd,
  21178. 0x45f8f761,0x0ab85fd7 },
  21179. { 0x3e5b4549,0xecda7c93,0x97922f21,0x4be2bb5c,0xb43b8040,0x261a1274,
  21180. 0x11e942c2,0xb122d675 } },
  21181. /* 207 */
  21182. { { 0x66a5ae7a,0x3be607be,0x76adcbe3,0x01e703fa,0x4eb6e5c5,0xaf904301,
  21183. 0x097dbaec,0x9f599dc1 },
  21184. { 0x0ff250ed,0x6d75b718,0x349a20dc,0x8eb91574,0x10b227a3,0x425605a4,
  21185. 0x8a294b78,0x7d5528e0 } },
  21186. /* 208 */
  21187. { { 0x20c26def,0xf0f58f66,0x582b2d1e,0x025585ea,0x01ce3881,0xfbe7d79b,
  21188. 0x303f1730,0x28ccea01 },
  21189. { 0x79644ba5,0xd1dabcd1,0x06fff0b8,0x1fc643e8,0x66b3e17b,0xa60a76fc,
  21190. 0xa1d013bf,0xc18baf48 } },
  21191. /* 209 */
  21192. { { 0x5dc4216d,0x34e638c8,0x206142ac,0x00c01067,0x95f5064a,0xd453a171,
  21193. 0xb7a9596b,0x9def809d },
  21194. { 0x67ab8d2c,0x41e8642e,0x6237a2b6,0xb4240433,0x64c4218b,0x7d506a6d,
  21195. 0x68808ce5,0x0357f8b0 } },
  21196. /* 210 */
  21197. { { 0x4cd2cc88,0x8e9dbe64,0xf0b8f39d,0xcc61c28d,0xcd30a0c8,0x4a309874,
  21198. 0x1b489887,0xe4a01add },
  21199. { 0xf57cd8f9,0x2ed1eeac,0xbd594c48,0x1b767d3e,0x7bd2f787,0xa7295c71,
  21200. 0xce10cc30,0x466d7d79 } },
  21201. /* 211 */
  21202. { { 0x9dada2c7,0x47d31892,0x8f9aa27d,0x4fa0a6c3,0x820a59e1,0x90e4fd28,
  21203. 0x451ead1a,0xc672a522 },
  21204. { 0x5d86b655,0x30607cc8,0xf9ad4af1,0xf0235d3b,0x571172a6,0x99a08680,
  21205. 0xf2a67513,0x5e3d64fa } },
  21206. /* 212 */
  21207. { { 0x9b3b4416,0xaa6410c7,0xeab26d99,0xcd8fcf85,0xdb656a74,0x5ebff74a,
  21208. 0xeb8e42fc,0x6c8a7a95 },
  21209. { 0xb02a63bd,0x10c60ba7,0x8b8f0047,0x6b2f2303,0x312d90b0,0x8c6c3738,
  21210. 0xad82ca91,0x348ae422 } },
  21211. /* 213 */
  21212. { { 0x5ccda2fb,0x7f474663,0x8e0726d2,0x22accaa1,0x492b1f20,0x85adf782,
  21213. 0xd9ef2d2e,0xc1074de0 },
  21214. { 0xae9a65b3,0xfcf3ce44,0x05d7151b,0xfd71e4ac,0xce6a9788,0xd4711f50,
  21215. 0xc9e54ffc,0xfbadfbdb } },
  21216. /* 214 */
  21217. { { 0x20a99363,0x1713f1cd,0x6cf22775,0xb915658f,0x24d359b2,0x968175cd,
  21218. 0x83716fcd,0xb7f976b4 },
  21219. { 0x5d6dbf74,0x5758e24d,0x71c3af36,0x8d23bafd,0x0243dfe3,0x48f47760,
  21220. 0xcafcc805,0xf4d41b2e } },
  21221. /* 215 */
  21222. { { 0xfdabd48d,0x51f1cf28,0x32c078a4,0xce81be36,0x117146e9,0x6ace2974,
  21223. 0xe0160f10,0x180824ea },
  21224. { 0x66e58358,0x0387698b,0xce6ca358,0x63568752,0x5e41e6c5,0x82380e34,
  21225. 0x83cf6d25,0x67e5f639 } },
  21226. /* 216 */
  21227. { { 0xcf4899ef,0xf89ccb8d,0x9ebb44c0,0x949015f0,0xb2598ec9,0x546f9276,
  21228. 0x04c11fc6,0x9fef789a },
  21229. { 0x53d2a071,0x6d367ecf,0xa4519b09,0xb10e1a7f,0x611e2eef,0xca6b3fb0,
  21230. 0xa99c4e20,0xbc80c181 } },
  21231. /* 217 */
  21232. { { 0xe5eb82e6,0x972536f8,0xf56cb920,0x1a484fc7,0x50b5da5e,0xc78e2171,
  21233. 0x9f8cdf10,0x49270e62 },
  21234. { 0xea6b50ad,0x1a39b7bb,0xa2388ffc,0x9a0284c1,0x8107197b,0x5403eb17,
  21235. 0x61372f7f,0xd2ee52f9 } },
  21236. /* 218 */
  21237. { { 0x88e0362a,0xd37cd285,0x8fa5d94d,0x442fa8a7,0xa434a526,0xaff836e5,
  21238. 0xe5abb733,0xdfb478be },
  21239. { 0x673eede6,0xa91f1ce7,0x2b5b2f04,0xa5390ad4,0x5530da2f,0x5e66f7bf,
  21240. 0x08df473a,0xd9a140b4 } },
  21241. /* 219 */
  21242. { { 0x6e8ea498,0x0e0221b5,0x3563ee09,0x62347829,0x335d2ade,0xe06b8391,
  21243. 0x623f4b1a,0x760c058d },
  21244. { 0xc198aa79,0x0b89b58c,0xf07aba7f,0xf74890d2,0xfde2556a,0x4e204110,
  21245. 0x8f190409,0x7141982d } },
  21246. /* 220 */
  21247. { { 0x4d4b0f45,0x6f0a0e33,0x392a94e1,0xd9280b38,0xb3c61d5e,0x3af324c6,
  21248. 0x89d54e47,0x3af9d1ce },
  21249. { 0x20930371,0xfd8f7981,0x21c17097,0xeda2664c,0xdc42309b,0x0e9545dc,
  21250. 0x73957dd6,0xb1f815c3 } },
  21251. /* 221 */
  21252. { { 0x89fec44a,0x84faa78e,0x3caa4caf,0xc8c2ae47,0xc1b6a624,0x691c807d,
  21253. 0x1543f052,0xa41aed14 },
  21254. { 0x7d5ffe04,0x42435399,0x625b6e20,0x8bacb2df,0x87817775,0x85d660be,
  21255. 0x86fb60ef,0xd6e9c1dd } },
  21256. /* 222 */
  21257. { { 0xc6853264,0x3aa2e97e,0xe2304a0b,0x771533b7,0xb8eae9be,0x1b912bb7,
  21258. 0xae9bf8c2,0x9c9c6e10 },
  21259. { 0xe030b74c,0xa2309a59,0x6a631e90,0x4ed7494d,0xa49b79f2,0x89f44b23,
  21260. 0x40fa61b6,0x566bd596 } },
  21261. /* 223 */
  21262. { { 0xc18061f3,0x066c0118,0x7c83fc70,0x190b25d3,0x27273245,0xf05fc8e0,
  21263. 0xf525345e,0xcf2c7390 },
  21264. { 0x10eb30cf,0xa09bceb4,0x0d77703a,0xcfd2ebba,0x150ff255,0xe842c43a,
  21265. 0x8aa20979,0x02f51755 } },
  21266. /* 224 */
  21267. { { 0xaddb7d07,0x396ef794,0x24455500,0x0b4fc742,0xc78aa3ce,0xfaff8eac,
  21268. 0xe8d4d97d,0x14e9ada5 },
  21269. { 0x2f7079e2,0xdaa480a1,0xe4b0800e,0x45baa3cd,0x7838157d,0x01765e2d,
  21270. 0x8e9d9ae8,0xa0ad4fab } },
  21271. /* 225 */
  21272. { { 0x4a653618,0x0bfb7621,0x31eaaa5f,0x1872813c,0x44949d5e,0x1553e737,
  21273. 0x6e56ed1e,0xbcd530b8 },
  21274. { 0x32e9c47b,0x169be853,0xb50059ab,0xdc2776fe,0x192bfbb4,0xcdba9761,
  21275. 0x6979341d,0x909283cf } },
  21276. /* 226 */
  21277. { { 0x76e81a13,0x67b00324,0x62171239,0x9bee1a99,0xd32e19d6,0x08ed361b,
  21278. 0xace1549a,0x35eeb7c9 },
  21279. { 0x7e4e5bdc,0x1280ae5a,0xb6ceec6e,0x2dcd2cd3,0x6e266bc1,0x52e4224c,
  21280. 0x448ae864,0x9a8b2cf4 } },
  21281. /* 227 */
  21282. { { 0x09d03b59,0xf6471bf2,0xb65af2ab,0xc90e62a3,0xebd5eec9,0xff7ff168,
  21283. 0xd4491379,0x6bdb60f4 },
  21284. { 0x8a55bc30,0xdadafebc,0x10097fe0,0xc79ead16,0x4c1e3bdd,0x42e19741,
  21285. 0x94ba08a9,0x01ec3cfd } },
  21286. /* 228 */
  21287. { { 0xdc9485c2,0xba6277eb,0x22fb10c7,0x48cc9a79,0x70a28d8a,0x4f61d60f,
  21288. 0x475464f6,0xd1acb1c0 },
  21289. { 0x26f36612,0xd26902b1,0xe0618d8b,0x59c3a44e,0x308357ee,0x4df8a813,
  21290. 0x405626c2,0x7dcd079d } },
  21291. /* 229 */
  21292. { { 0xf05a4b48,0x5ce7d4d3,0x37230772,0xadcd2952,0x812a915a,0xd18f7971,
  21293. 0x377d19b8,0x0bf53589 },
  21294. { 0x6c68ea73,0x35ecd95a,0x823a584d,0xc7f3bbca,0xf473a723,0x9fb674c6,
  21295. 0xe16686fc,0xd28be4d9 } },
  21296. /* 230 */
  21297. { { 0x38fa8e4b,0x5d2b9906,0x893fd8fc,0x559f186e,0x436fb6fc,0x3a6de2aa,
  21298. 0x510f88ce,0xd76007aa },
  21299. { 0x523a4988,0x2d10aab6,0x74dd0273,0xb455cf44,0xa3407278,0x7f467082,
  21300. 0xb303bb01,0xf2b52f68 } },
  21301. /* 231 */
  21302. { { 0x9835b4ca,0x0d57eafa,0xbb669cbc,0x2d2232fc,0xc6643198,0x8eeeb680,
  21303. 0xcc5aed3a,0xd8dbe98e },
  21304. { 0xc5a02709,0xcba9be3f,0xf5ba1fa8,0x30be68e5,0xf10ea852,0xfebd43cd,
  21305. 0xee559705,0xe01593a3 } },
  21306. /* 232 */
  21307. { { 0xea75a0a6,0xd3e5af50,0x57858033,0x512226ac,0xd0176406,0x6fe6d50f,
  21308. 0xaeb8ef06,0xafec07b1 },
  21309. { 0x80bb0a31,0x7fb99567,0x37309aae,0x6f1af3cc,0x01abf389,0x9153a15a,
  21310. 0x6e2dbfdd,0xa71b9354 } },
  21311. /* 233 */
  21312. { { 0x18f593d2,0xbf8e12e0,0xa078122b,0xd1a90428,0x0ba4f2ad,0x150505db,
  21313. 0x628523d9,0x53a2005c },
  21314. { 0xe7f2b935,0x07c8b639,0xc182961a,0x2bff975a,0x7518ca2c,0x86bceea7,
  21315. 0x3d588e3d,0xbf47d19b } },
  21316. /* 234 */
  21317. { { 0xdd7665d5,0x672967a7,0x2f2f4de5,0x4e303057,0x80d4903f,0x144005ae,
  21318. 0x39c9a1b6,0x001c2c7f },
  21319. { 0x69efc6d6,0x143a8014,0x7bc7a724,0xc810bdaa,0xa78150a4,0x5f65670b,
  21320. 0x86ffb99b,0xfdadf8e7 } },
  21321. /* 235 */
  21322. { { 0xffc00785,0xfd38cb88,0x3b48eb67,0x77fa7591,0xbf368fbc,0x0454d055,
  21323. 0x5aa43c94,0x3a838e4d },
  21324. { 0x3e97bb9a,0x56166329,0x441d94d9,0x9eb93363,0x0adb2a83,0x515591a6,
  21325. 0x873e1da3,0x3cdb8257 } },
  21326. /* 236 */
  21327. { { 0x7de77eab,0x137140a9,0x41648109,0xf7e1c50d,0xceb1d0df,0x762dcad2,
  21328. 0xf1f57fba,0x5a60cc89 },
  21329. { 0x40d45673,0x80b36382,0x5913c655,0x1b82be19,0xdd64b741,0x057284b8,
  21330. 0xdbfd8fc0,0x922ff56f } },
  21331. /* 237 */
  21332. { { 0xc9a129a1,0x1b265dee,0xcc284e04,0xa5b1ce57,0xcebfbe3c,0x04380c46,
  21333. 0xf6c5cd62,0x72919a7d },
  21334. { 0x8fb90f9a,0x298f453a,0x88e4031b,0xd719c00b,0x796f1856,0xe32c0e77,
  21335. 0x3624089a,0x5e791780 } },
  21336. /* 238 */
  21337. { { 0x7f63cdfb,0x5c16ec55,0xf1cae4fd,0x8e6a3571,0x560597ca,0xfce26bea,
  21338. 0xe24c2fab,0x4e0a5371 },
  21339. { 0xa5765357,0x276a40d3,0x0d73a2b4,0x3c89af44,0x41d11a32,0xb8f370ae,
  21340. 0xd56604ee,0xf5ff7818 } },
  21341. /* 239 */
  21342. { { 0x1a09df21,0xfbf3e3fe,0xe66e8e47,0x26d5d28e,0x29c89015,0x2096bd0a,
  21343. 0x533f5e64,0xe41df0e9 },
  21344. { 0xb3ba9e3f,0x305fda40,0x2604d895,0xf2340ceb,0x7f0367c7,0x0866e192,
  21345. 0xac4f155f,0x8edd7d6e } },
  21346. /* 240 */
  21347. { { 0x0bfc8ff3,0xc9a1dc0e,0xe936f42f,0x14efd82b,0xcca381ef,0x67016f7c,
  21348. 0xed8aee96,0x1432c1ca },
  21349. { 0x70b23c26,0xec684829,0x0735b273,0xa64fe873,0xeaef0f5a,0xe389f6e5,
  21350. 0x5ac8d2c6,0xcaef480b } },
  21351. /* 241 */
  21352. { { 0x75315922,0x5245c978,0x3063cca5,0xd8295171,0xb64ef2cb,0xf3ce60d0,
  21353. 0x8efae236,0xd0ba177e },
  21354. { 0xb1b3af60,0x53a9ae8f,0x3d2da20e,0x1a796ae5,0xdf9eef28,0x01d63605,
  21355. 0x1c54ae16,0xf31c957c } },
  21356. /* 242 */
  21357. { { 0x49cc4597,0xc0f58d52,0xbae0a028,0xdc5015b0,0x734a814a,0xefc5fc55,
  21358. 0x96e17c3a,0x013404cb },
  21359. { 0xc9a824bf,0xb29e2585,0x001eaed7,0xd593185e,0x61ef68ac,0x8d6ee682,
  21360. 0x91933e6c,0x6f377c4b } },
  21361. /* 243 */
  21362. { { 0xa8333fd2,0x9f93bad1,0x5a2a95b8,0xa8930202,0xeaf75ace,0x211e5037,
  21363. 0xd2d09506,0x6dba3e4e },
  21364. { 0xd04399cd,0xa48ef98c,0xe6b73ade,0x1811c66e,0xc17ecaf3,0x72f60752,
  21365. 0x3becf4a7,0xf13cf342 } },
  21366. /* 244 */
  21367. { { 0xa919e2eb,0xceeb9ec0,0xf62c0f68,0x83a9a195,0x7aba2299,0xcfba3bb6,
  21368. 0x274bbad3,0xc83fa9a9 },
  21369. { 0x62fa1ce0,0x0d7d1b0b,0x3418efbf,0xe58b60f5,0x52706f04,0xbfa8ef9e,
  21370. 0x5d702683,0xb49d70f4 } },
  21371. /* 245 */
  21372. { { 0xfad5513b,0x914c7510,0xb1751e2d,0x05f32eec,0xd9fb9d59,0x6d850418,
  21373. 0x0c30f1cf,0x59cfadbb },
  21374. { 0x55cb7fd6,0xe167ac23,0x820426a3,0x249367b8,0x90a78864,0xeaeec58c,
  21375. 0x354a4b67,0x5babf362 } },
  21376. /* 246 */
  21377. { { 0xee424865,0x37c981d1,0xf2e5577f,0x8b002878,0xb9e0c058,0x702970f1,
  21378. 0x9026c8f0,0x6188c6a7 },
  21379. { 0xd0f244da,0x06f9a19b,0xfb080873,0x1ecced5c,0x9f213637,0x35470f9b,
  21380. 0xdf50b9d9,0x993fe475 } },
  21381. /* 247 */
  21382. { { 0x9b2c3609,0x68e31cdf,0x2c46d4ea,0x84eb19c0,0x9a775101,0x7ac9ec1a,
  21383. 0x4c80616b,0x81f76466 },
  21384. { 0x75fbe978,0x1d7c2a5a,0xf183b356,0x6743fed3,0x501dd2bf,0x838d1f04,
  21385. 0x5fe9060d,0x564a812a } },
  21386. /* 248 */
  21387. { { 0xfa817d1d,0x7a5a64f4,0xbea82e0f,0x55f96844,0xcd57f9aa,0xb5ff5a0f,
  21388. 0x00e51d6c,0x226bf3cf },
  21389. { 0x2f2833cf,0xd6d1a9f9,0x4f4f89a8,0x20a0a35a,0x8f3f7f77,0x11536c49,
  21390. 0xff257836,0x68779f47 } },
  21391. /* 249 */
  21392. { { 0x73043d08,0x79b0c1c1,0x1fc020fa,0xa5446774,0x9a6d26d0,0xd3767e28,
  21393. 0xeb092e0b,0x97bcb0d1 },
  21394. { 0xf32ed3c3,0x2ab6eaa8,0xb281bc48,0xc8a4f151,0xbfa178f3,0x4d1bf4f3,
  21395. 0x0a784655,0xa872ffe8 } },
  21396. /* 250 */
  21397. { { 0xa32b2086,0xb1ab7935,0x8160f486,0xe1eb710e,0x3b6ae6be,0x9bd0cd91,
  21398. 0xb732a36a,0x02812bfc },
  21399. { 0xcf605318,0xa63fd7ca,0xfdfd6d1d,0x646e5d50,0x2102d619,0xa1d68398,
  21400. 0xfe5396af,0x07391cc9 } },
  21401. /* 251 */
  21402. { { 0x8b80d02b,0xc50157f0,0x62877f7f,0x6b8333d1,0x78d542ae,0x7aca1af8,
  21403. 0x7e6d2a08,0x355d2adc },
  21404. { 0x287386e1,0xb41f335a,0xf8e43275,0xfd272a94,0xe79989ea,0x286ca2cd,
  21405. 0x7c2a3a79,0x3dc2b1e3 } },
  21406. /* 252 */
  21407. { { 0x04581352,0xd689d21c,0x376782be,0x0a00c825,0x9fed701f,0x203bd590,
  21408. 0x3ccd846b,0xc4786910 },
  21409. { 0x24c768ed,0x5dba7708,0x6841f657,0x72feea02,0x6accce0e,0x73313ed5,
  21410. 0xd5bb4d32,0xccc42968 } },
  21411. /* 253 */
  21412. { { 0x3d7620b9,0x94e50de1,0x5992a56a,0xd89a5c8a,0x675487c9,0xdc007640,
  21413. 0xaa4871cf,0xe147eb42 },
  21414. { 0xacf3ae46,0x274ab4ee,0x50350fbe,0xfd4936fb,0x48c840ea,0xdf2afe47,
  21415. 0x080e96e3,0x239ac047 } },
  21416. /* 254 */
  21417. { { 0x2bfee8d4,0x481d1f35,0xfa7b0fec,0xce80b5cf,0x2ce9af3c,0x105c4c9e,
  21418. 0xf5f7e59d,0xc55fa1a3 },
  21419. { 0x8257c227,0x3186f14e,0x342be00b,0xc5b1653f,0xaa904fb2,0x09afc998,
  21420. 0xd4f4b699,0x094cd99c } },
  21421. /* 255 */
  21422. { { 0xd703beba,0x8a981c84,0x32ceb291,0x8631d150,0xe3bd49ec,0xa445f2c9,
  21423. 0x42abad33,0xb90a30b6 },
  21424. { 0xb4a5abf9,0xb465404f,0x75db7603,0x004750c3,0xca35d89f,0x6f9a42cc,
  21425. 0x1b7924f7,0x019f8b9a } },
  21426. };
  21427. /* Multiply the base point of P256 by the scalar and return the result.
  21428. * If map is true then convert result to affine coordinates.
  21429. *
  21430. * Stripe implementation.
  21431. * Pre-generated: 2^0, 2^32, ...
  21432. * Pre-generated: products of all combinations of above.
  21433. * 8 doubles and adds (with qz=1)
  21434. *
  21435. * r Resulting point.
  21436. * k Scalar to multiply by.
  21437. * map Indicates whether to convert result to affine.
  21438. * ct Constant time required.
  21439. * heap Heap to use for allocation.
  21440. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  21441. */
  21442. static int sp_256_ecc_mulmod_base_8(sp_point_256* r, const sp_digit* k,
  21443. int map, int ct, void* heap)
  21444. {
  21445. return sp_256_ecc_mulmod_stripe_8(r, &p256_base, p256_table,
  21446. k, map, ct, heap);
  21447. }
  21448. #endif
  21449. /* Multiply the base point of P256 by the scalar and return the result.
  21450. * If map is true then convert result to affine coordinates.
  21451. *
  21452. * km Scalar to multiply by.
  21453. * r Resulting point.
  21454. * map Indicates whether to convert result to affine.
  21455. * heap Heap to use for allocation.
  21456. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  21457. */
  21458. int sp_ecc_mulmod_base_256(const mp_int* km, ecc_point* r, int map, void* heap)
  21459. {
  21460. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21461. sp_point_256* point = NULL;
  21462. sp_digit* k = NULL;
  21463. #else
  21464. sp_point_256 point[1];
  21465. sp_digit k[8];
  21466. #endif
  21467. int err = MP_OKAY;
  21468. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21469. point = (sp_point_256*)XMALLOC(sizeof(sp_point_256), heap,
  21470. DYNAMIC_TYPE_ECC);
  21471. if (point == NULL)
  21472. err = MEMORY_E;
  21473. if (err == MP_OKAY) {
  21474. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 8, heap,
  21475. DYNAMIC_TYPE_ECC);
  21476. if (k == NULL)
  21477. err = MEMORY_E;
  21478. }
  21479. #endif
  21480. if (err == MP_OKAY) {
  21481. sp_256_from_mp(k, 8, km);
  21482. err = sp_256_ecc_mulmod_base_8(point, k, map, 1, heap);
  21483. }
  21484. if (err == MP_OKAY) {
  21485. err = sp_256_point_to_ecc_point_8(point, r);
  21486. }
  21487. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21488. if (k != NULL)
  21489. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  21490. if (point != NULL)
  21491. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  21492. #endif
  21493. return err;
  21494. }
  21495. /* Multiply the base point of P256 by the scalar, add point a and return
  21496. * the result. If map is true then convert result to affine coordinates.
  21497. *
  21498. * km Scalar to multiply by.
  21499. * am Point to add to scalar mulitply result.
  21500. * inMont Point to add is in montgomery form.
  21501. * r Resulting point.
  21502. * map Indicates whether to convert result to affine.
  21503. * heap Heap to use for allocation.
  21504. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  21505. */
  21506. int sp_ecc_mulmod_base_add_256(const mp_int* km, const ecc_point* am,
  21507. int inMont, ecc_point* r, int map, void* heap)
  21508. {
  21509. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21510. sp_point_256* point = NULL;
  21511. sp_digit* k = NULL;
  21512. #else
  21513. sp_point_256 point[2];
  21514. sp_digit k[8 + 8 * 2 * 6];
  21515. #endif
  21516. sp_point_256* addP = NULL;
  21517. sp_digit* tmp = NULL;
  21518. int err = MP_OKAY;
  21519. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21520. point = (sp_point_256*)XMALLOC(sizeof(sp_point_256) * 2, heap,
  21521. DYNAMIC_TYPE_ECC);
  21522. if (point == NULL)
  21523. err = MEMORY_E;
  21524. if (err == MP_OKAY) {
  21525. k = (sp_digit*)XMALLOC(
  21526. sizeof(sp_digit) * (8 + 8 * 2 * 6),
  21527. heap, DYNAMIC_TYPE_ECC);
  21528. if (k == NULL)
  21529. err = MEMORY_E;
  21530. }
  21531. #endif
  21532. if (err == MP_OKAY) {
  21533. addP = point + 1;
  21534. tmp = k + 8;
  21535. sp_256_from_mp(k, 8, km);
  21536. sp_256_point_from_ecc_point_8(addP, am);
  21537. }
  21538. if ((err == MP_OKAY) && (!inMont)) {
  21539. err = sp_256_mod_mul_norm_8(addP->x, addP->x, p256_mod);
  21540. }
  21541. if ((err == MP_OKAY) && (!inMont)) {
  21542. err = sp_256_mod_mul_norm_8(addP->y, addP->y, p256_mod);
  21543. }
  21544. if ((err == MP_OKAY) && (!inMont)) {
  21545. err = sp_256_mod_mul_norm_8(addP->z, addP->z, p256_mod);
  21546. }
  21547. if (err == MP_OKAY) {
  21548. err = sp_256_ecc_mulmod_base_8(point, k, 0, 0, heap);
  21549. }
  21550. if (err == MP_OKAY) {
  21551. sp_256_proj_point_add_8(point, point, addP, tmp);
  21552. if (map) {
  21553. sp_256_map_8(point, point, tmp);
  21554. }
  21555. err = sp_256_point_to_ecc_point_8(point, r);
  21556. }
  21557. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21558. if (k != NULL)
  21559. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  21560. if (point)
  21561. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  21562. #endif
  21563. return err;
  21564. }
  21565. #if defined(WOLFSSL_VALIDATE_ECC_KEYGEN) || defined(HAVE_ECC_SIGN) || \
  21566. defined(HAVE_ECC_VERIFY)
  21567. #endif /* WOLFSSL_VALIDATE_ECC_KEYGEN | HAVE_ECC_SIGN | HAVE_ECC_VERIFY */
  21568. /* Add 1 to a. (a = a + 1)
  21569. *
  21570. * a A single precision integer.
  21571. */
  21572. SP_NOINLINE static void sp_256_add_one_8(sp_digit* a)
  21573. {
  21574. __asm__ __volatile__ (
  21575. "mov r2, #1\n\t"
  21576. "ldr r1, [%[a], #0]\n\t"
  21577. "adds r1, r1, r2\n\t"
  21578. "mov r2, #0\n\t"
  21579. "str r1, [%[a], #0]\n\t"
  21580. "ldr r1, [%[a], #4]\n\t"
  21581. "adcs r1, r1, r2\n\t"
  21582. "str r1, [%[a], #4]\n\t"
  21583. "ldr r1, [%[a], #8]\n\t"
  21584. "adcs r1, r1, r2\n\t"
  21585. "str r1, [%[a], #8]\n\t"
  21586. "ldr r1, [%[a], #12]\n\t"
  21587. "adcs r1, r1, r2\n\t"
  21588. "str r1, [%[a], #12]\n\t"
  21589. "ldr r1, [%[a], #16]\n\t"
  21590. "adcs r1, r1, r2\n\t"
  21591. "str r1, [%[a], #16]\n\t"
  21592. "ldr r1, [%[a], #20]\n\t"
  21593. "adcs r1, r1, r2\n\t"
  21594. "str r1, [%[a], #20]\n\t"
  21595. "ldr r1, [%[a], #24]\n\t"
  21596. "adcs r1, r1, r2\n\t"
  21597. "str r1, [%[a], #24]\n\t"
  21598. "ldr r1, [%[a], #28]\n\t"
  21599. "adcs r1, r1, r2\n\t"
  21600. "str r1, [%[a], #28]\n\t"
  21601. :
  21602. : [a] "r" (a)
  21603. : "memory", "r1", "r2"
  21604. );
  21605. }
  21606. /* Read big endian unsigned byte array into r.
  21607. *
  21608. * r A single precision integer.
  21609. * size Maximum number of bytes to convert
  21610. * a Byte array.
  21611. * n Number of bytes in array to read.
  21612. */
  21613. static void sp_256_from_bin(sp_digit* r, int size, const byte* a, int n)
  21614. {
  21615. int i;
  21616. int j;
  21617. byte* d;
  21618. for (i = n - 1,j = 0; i >= 3; i -= 4) {
  21619. r[j] = ((sp_digit)a[i - 0] << 0) |
  21620. ((sp_digit)a[i - 1] << 8) |
  21621. ((sp_digit)a[i - 2] << 16) |
  21622. ((sp_digit)a[i - 3] << 24);
  21623. j++;
  21624. }
  21625. if (i >= 0) {
  21626. r[j] = 0;
  21627. d = (byte*)r;
  21628. switch (i) {
  21629. case 2: d[n - 1 - 2] = a[2]; //fallthrough
  21630. case 1: d[n - 1 - 1] = a[1]; //fallthrough
  21631. case 0: d[n - 1 - 0] = a[0]; //fallthrough
  21632. }
  21633. j++;
  21634. }
  21635. for (; j < size; j++) {
  21636. r[j] = 0;
  21637. }
  21638. }
  21639. /* Generates a scalar that is in the range 1..order-1.
  21640. *
  21641. * rng Random number generator.
  21642. * k Scalar value.
  21643. * returns RNG failures, MEMORY_E when memory allocation fails and
  21644. * MP_OKAY on success.
  21645. */
  21646. static int sp_256_ecc_gen_k_8(WC_RNG* rng, sp_digit* k)
  21647. {
  21648. int err;
  21649. byte buf[32];
  21650. do {
  21651. err = wc_RNG_GenerateBlock(rng, buf, sizeof(buf));
  21652. if (err == 0) {
  21653. sp_256_from_bin(k, 8, buf, (int)sizeof(buf));
  21654. if (sp_256_cmp_8(k, p256_order2) <= 0) {
  21655. sp_256_add_one_8(k);
  21656. break;
  21657. }
  21658. }
  21659. }
  21660. while (err == 0);
  21661. return err;
  21662. }
  21663. /* Makes a random EC key pair.
  21664. *
  21665. * rng Random number generator.
  21666. * priv Generated private value.
  21667. * pub Generated public point.
  21668. * heap Heap to use for allocation.
  21669. * returns ECC_INF_E when the point does not have the correct order, RNG
  21670. * failures, MEMORY_E when memory allocation fails and MP_OKAY on success.
  21671. */
  21672. int sp_ecc_make_key_256(WC_RNG* rng, mp_int* priv, ecc_point* pub, void* heap)
  21673. {
  21674. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21675. sp_point_256* point = NULL;
  21676. sp_digit* k = NULL;
  21677. #else
  21678. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  21679. sp_point_256 point[2];
  21680. #else
  21681. sp_point_256 point[1];
  21682. #endif
  21683. sp_digit k[8];
  21684. #endif
  21685. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  21686. sp_point_256* infinity = NULL;
  21687. #endif
  21688. int err = MP_OKAY;
  21689. (void)heap;
  21690. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21691. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  21692. point = (sp_point_256*)XMALLOC(sizeof(sp_point_256) * 2, heap, DYNAMIC_TYPE_ECC);
  21693. #else
  21694. point = (sp_point_256*)XMALLOC(sizeof(sp_point_256), heap, DYNAMIC_TYPE_ECC);
  21695. #endif
  21696. if (point == NULL)
  21697. err = MEMORY_E;
  21698. if (err == MP_OKAY) {
  21699. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 8, heap,
  21700. DYNAMIC_TYPE_ECC);
  21701. if (k == NULL)
  21702. err = MEMORY_E;
  21703. }
  21704. #endif
  21705. if (err == MP_OKAY) {
  21706. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  21707. infinity = point + 1;
  21708. #endif
  21709. err = sp_256_ecc_gen_k_8(rng, k);
  21710. }
  21711. if (err == MP_OKAY) {
  21712. err = sp_256_ecc_mulmod_base_8(point, k, 1, 1, NULL);
  21713. }
  21714. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  21715. if (err == MP_OKAY) {
  21716. err = sp_256_ecc_mulmod_8(infinity, point, p256_order, 1, 1, NULL);
  21717. }
  21718. if (err == MP_OKAY) {
  21719. if (sp_256_iszero_8(point->x) || sp_256_iszero_8(point->y)) {
  21720. err = ECC_INF_E;
  21721. }
  21722. }
  21723. #endif
  21724. if (err == MP_OKAY) {
  21725. err = sp_256_to_mp(k, priv);
  21726. }
  21727. if (err == MP_OKAY) {
  21728. err = sp_256_point_to_ecc_point_8(point, pub);
  21729. }
  21730. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21731. if (k != NULL)
  21732. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  21733. if (point != NULL) {
  21734. /* point is not sensitive, so no need to zeroize */
  21735. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  21736. }
  21737. #endif
  21738. return err;
  21739. }
  21740. #ifdef HAVE_ECC_DHE
  21741. /* Write r as big endian to byte array.
  21742. * Fixed length number of bytes written: 32
  21743. *
  21744. * r A single precision integer.
  21745. * a Byte array.
  21746. */
  21747. static void sp_256_to_bin_8(sp_digit* r, byte* a)
  21748. {
  21749. int i;
  21750. int j = 0;
  21751. for (i = 7; i >= 0; i--) {
  21752. a[j++] = r[i] >> 24;
  21753. a[j++] = r[i] >> 16;
  21754. a[j++] = r[i] >> 8;
  21755. a[j++] = r[i] >> 0;
  21756. }
  21757. }
  21758. /* Multiply the point by the scalar and serialize the X ordinate.
  21759. * The number is 0 padded to maximum size on output.
  21760. *
  21761. * priv Scalar to multiply the point by.
  21762. * pub Point to multiply.
  21763. * out Buffer to hold X ordinate.
  21764. * outLen On entry, size of the buffer in bytes.
  21765. * On exit, length of data in buffer in bytes.
  21766. * heap Heap to use for allocation.
  21767. * returns BUFFER_E if the buffer is to small for output size,
  21768. * MEMORY_E when memory allocation fails and MP_OKAY on success.
  21769. */
  21770. int sp_ecc_secret_gen_256(const mp_int* priv, const ecc_point* pub, byte* out,
  21771. word32* outLen, void* heap)
  21772. {
  21773. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21774. sp_point_256* point = NULL;
  21775. sp_digit* k = NULL;
  21776. #else
  21777. sp_point_256 point[1];
  21778. sp_digit k[8];
  21779. #endif
  21780. int err = MP_OKAY;
  21781. if (*outLen < 32U) {
  21782. err = BUFFER_E;
  21783. }
  21784. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21785. if (err == MP_OKAY) {
  21786. point = (sp_point_256*)XMALLOC(sizeof(sp_point_256), heap,
  21787. DYNAMIC_TYPE_ECC);
  21788. if (point == NULL)
  21789. err = MEMORY_E;
  21790. }
  21791. if (err == MP_OKAY) {
  21792. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 8, heap,
  21793. DYNAMIC_TYPE_ECC);
  21794. if (k == NULL)
  21795. err = MEMORY_E;
  21796. }
  21797. #endif
  21798. if (err == MP_OKAY) {
  21799. sp_256_from_mp(k, 8, priv);
  21800. sp_256_point_from_ecc_point_8(point, pub);
  21801. err = sp_256_ecc_mulmod_8(point, point, k, 1, 1, heap);
  21802. }
  21803. if (err == MP_OKAY) {
  21804. sp_256_to_bin_8(point->x, out);
  21805. *outLen = 32;
  21806. }
  21807. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  21808. if (k != NULL)
  21809. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  21810. if (point != NULL)
  21811. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  21812. #endif
  21813. return err;
  21814. }
  21815. #endif /* HAVE_ECC_DHE */
  21816. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  21817. #endif
  21818. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  21819. #endif
  21820. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  21821. #ifdef WOLFSSL_SP_SMALL
  21822. /* Sub b from a into a. (a -= b)
  21823. *
  21824. * a A single precision integer.
  21825. * b A single precision integer.
  21826. */
  21827. SP_NOINLINE static sp_digit sp_256_sub_in_place_8(sp_digit* a,
  21828. const sp_digit* b)
  21829. {
  21830. sp_digit c = 0;
  21831. __asm__ __volatile__ (
  21832. "mov r8, %[a]\n\t"
  21833. "add r8, r8, #32\n\t"
  21834. "\n1:\n\t"
  21835. "mov r5, #0\n\t"
  21836. "subs r5, r5, %[c]\n\t"
  21837. "ldr r3, [%[a]]\n\t"
  21838. "ldr r4, [%[a], #4]\n\t"
  21839. "ldr r5, [%[b]]\n\t"
  21840. "ldr r6, [%[b], #4]\n\t"
  21841. "sbcs r3, r3, r5\n\t"
  21842. "sbcs r4, r4, r6\n\t"
  21843. "str r3, [%[a]]\n\t"
  21844. "str r4, [%[a], #4]\n\t"
  21845. "sbc %[c], %[c], %[c]\n\t"
  21846. "add %[a], %[a], #8\n\t"
  21847. "add %[b], %[b], #8\n\t"
  21848. "cmp %[a], r8\n\t"
  21849. #ifdef __GNUC__
  21850. "bne 1b\n\t"
  21851. #else
  21852. "bne.n 1b\n\t"
  21853. #endif /* __GNUC__ */
  21854. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  21855. :
  21856. : "memory", "r3", "r4", "r5", "r6", "r8"
  21857. );
  21858. return c;
  21859. }
  21860. #else
  21861. /* Sub b from a into r. (r = a - b)
  21862. *
  21863. * r A single precision integer.
  21864. * a A single precision integer.
  21865. * b A single precision integer.
  21866. */
  21867. SP_NOINLINE static sp_digit sp_256_sub_in_place_8(sp_digit* a,
  21868. const sp_digit* b)
  21869. {
  21870. sp_digit c = 0;
  21871. __asm__ __volatile__ (
  21872. "ldm %[a], {r3, r4}\n\t"
  21873. "ldm %[b]!, {r5, r6}\n\t"
  21874. "subs r3, r3, r5\n\t"
  21875. "sbcs r4, r4, r6\n\t"
  21876. "stm %[a]!, {r3, r4}\n\t"
  21877. "ldm %[a], {r3, r4}\n\t"
  21878. "ldm %[b]!, {r5, r6}\n\t"
  21879. "sbcs r3, r3, r5\n\t"
  21880. "sbcs r4, r4, r6\n\t"
  21881. "stm %[a]!, {r3, r4}\n\t"
  21882. "ldm %[a], {r3, r4}\n\t"
  21883. "ldm %[b]!, {r5, r6}\n\t"
  21884. "sbcs r3, r3, r5\n\t"
  21885. "sbcs r4, r4, r6\n\t"
  21886. "stm %[a]!, {r3, r4}\n\t"
  21887. "ldm %[a], {r3, r4}\n\t"
  21888. "ldm %[b]!, {r5, r6}\n\t"
  21889. "sbcs r3, r3, r5\n\t"
  21890. "sbcs r4, r4, r6\n\t"
  21891. "stm %[a]!, {r3, r4}\n\t"
  21892. "sbc %[c], %[c], %[c]\n\t"
  21893. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  21894. :
  21895. : "memory", "r3", "r4", "r5", "r6"
  21896. );
  21897. return c;
  21898. }
  21899. #endif /* WOLFSSL_SP_SMALL */
  21900. /* Mul a by digit b into r. (r = a * b)
  21901. *
  21902. * r A single precision integer.
  21903. * a A single precision integer.
  21904. * b A single precision digit.
  21905. */
  21906. SP_NOINLINE static void sp_256_mul_d_8(sp_digit* r, const sp_digit* a,
  21907. sp_digit b)
  21908. {
  21909. __asm__ __volatile__ (
  21910. "add r9, %[a], #32\n\t"
  21911. /* A[0] * B */
  21912. "ldr r6, [%[a]], #4\n\t"
  21913. "umull r5, r3, r6, %[b]\n\t"
  21914. "mov r4, #0\n\t"
  21915. "str r5, [%[r]], #4\n\t"
  21916. /* A[0] * B - Done */
  21917. "\n1:\n\t"
  21918. "mov r5, #0\n\t"
  21919. /* A[] * B */
  21920. "ldr r6, [%[a]], #4\n\t"
  21921. "umull r6, r8, r6, %[b]\n\t"
  21922. "adds r3, r3, r6\n\t"
  21923. "adcs r4, r4, r8\n\t"
  21924. "adc r5, r5, #0\n\t"
  21925. /* A[] * B - Done */
  21926. "str r3, [%[r]], #4\n\t"
  21927. "mov r3, r4\n\t"
  21928. "mov r4, r5\n\t"
  21929. "cmp %[a], r9\n\t"
  21930. #ifdef __GNUC__
  21931. "blt 1b\n\t"
  21932. #else
  21933. "blt.n 1b\n\t"
  21934. #endif /* __GNUC__ */
  21935. "str r3, [%[r]]\n\t"
  21936. : [r] "+r" (r), [a] "+r" (a)
  21937. : [b] "r" (b)
  21938. : "memory", "r3", "r4", "r5", "r6", "r8", "r9"
  21939. );
  21940. }
  21941. /* Divide the double width number (d1|d0) by the divisor. (d1|d0 / div)
  21942. *
  21943. * d1 The high order half of the number to divide.
  21944. * d0 The low order half of the number to divide.
  21945. * div The divisor.
  21946. * returns the result of the division.
  21947. *
  21948. * Note that this is an approximate div. It may give an answer 1 larger.
  21949. */
  21950. SP_NOINLINE static sp_digit div_256_word_8(sp_digit d1, sp_digit d0,
  21951. sp_digit div)
  21952. {
  21953. sp_digit r = 0;
  21954. __asm__ __volatile__ (
  21955. "lsr r6, %[div], #16\n\t"
  21956. "add r6, r6, #1\n\t"
  21957. "udiv r4, %[d1], r6\n\t"
  21958. "lsl r8, r4, #16\n\t"
  21959. "umull r4, r5, %[div], r8\n\t"
  21960. "subs %[d0], %[d0], r4\n\t"
  21961. "sbc %[d1], %[d1], r5\n\t"
  21962. "udiv r5, %[d1], r6\n\t"
  21963. "lsl r4, r5, #16\n\t"
  21964. "add r8, r8, r4\n\t"
  21965. "umull r4, r5, %[div], r4\n\t"
  21966. "subs %[d0], %[d0], r4\n\t"
  21967. "sbc %[d1], %[d1], r5\n\t"
  21968. "lsl r4, %[d1], #16\n\t"
  21969. "orr r4, r4, %[d0], lsr #16\n\t"
  21970. "udiv r4, r4, r6\n\t"
  21971. "add r8, r8, r4\n\t"
  21972. "umull r4, r5, %[div], r4\n\t"
  21973. "subs %[d0], %[d0], r4\n\t"
  21974. "sbc %[d1], %[d1], r5\n\t"
  21975. "lsl r4, %[d1], #16\n\t"
  21976. "orr r4, r4, %[d0], lsr #16\n\t"
  21977. "udiv r4, r4, r6\n\t"
  21978. "add r8, r8, r4\n\t"
  21979. "umull r4, r5, %[div], r4\n\t"
  21980. "subs %[d0], %[d0], r4\n\t"
  21981. "sbc %[d1], %[d1], r5\n\t"
  21982. "udiv r4, %[d0], %[div]\n\t"
  21983. "add r8, r8, r4\n\t"
  21984. "mov %[r], r8\n\t"
  21985. : [r] "+r" (r)
  21986. : [d1] "r" (d1), [d0] "r" (d0), [div] "r" (div)
  21987. : "r4", "r5", "r6", "r8"
  21988. );
  21989. return r;
  21990. }
  21991. /* AND m into each word of a and store in r.
  21992. *
  21993. * r A single precision integer.
  21994. * a A single precision integer.
  21995. * m Mask to AND against each digit.
  21996. */
  21997. static void sp_256_mask_8(sp_digit* r, const sp_digit* a, sp_digit m)
  21998. {
  21999. #ifdef WOLFSSL_SP_SMALL
  22000. int i;
  22001. for (i=0; i<8; i++) {
  22002. r[i] = a[i] & m;
  22003. }
  22004. #else
  22005. r[0] = a[0] & m;
  22006. r[1] = a[1] & m;
  22007. r[2] = a[2] & m;
  22008. r[3] = a[3] & m;
  22009. r[4] = a[4] & m;
  22010. r[5] = a[5] & m;
  22011. r[6] = a[6] & m;
  22012. r[7] = a[7] & m;
  22013. #endif
  22014. }
  22015. /* Divide d in a and put remainder into r (m*d + r = a)
  22016. * m is not calculated as it is not needed at this time.
  22017. *
  22018. * a Number to be divided.
  22019. * d Number to divide with.
  22020. * m Multiplier result.
  22021. * r Remainder from the division.
  22022. * returns MP_OKAY indicating success.
  22023. */
  22024. static WC_INLINE int sp_256_div_8(const sp_digit* a, const sp_digit* d, sp_digit* m,
  22025. sp_digit* r)
  22026. {
  22027. sp_digit t1[16], t2[9];
  22028. sp_digit div, r1;
  22029. int i;
  22030. (void)m;
  22031. div = d[7];
  22032. XMEMCPY(t1, a, sizeof(*t1) * 2 * 8);
  22033. r1 = sp_256_cmp_8(&t1[8], d) >= 0;
  22034. sp_256_cond_sub_8(&t1[8], &t1[8], d, (sp_digit)0 - r1);
  22035. for (i = 7; i >= 0; i--) {
  22036. sp_digit mask = 0 - (t1[8 + i] == div);
  22037. sp_digit hi = t1[8 + i] + mask;
  22038. r1 = div_256_word_8(hi, t1[8 + i - 1], div);
  22039. r1 |= mask;
  22040. sp_256_mul_d_8(t2, d, r1);
  22041. t1[8 + i] += sp_256_sub_in_place_8(&t1[i], t2);
  22042. t1[8 + i] -= t2[8];
  22043. sp_256_mask_8(t2, d, t1[8 + i]);
  22044. t1[8 + i] += sp_256_add_8(&t1[i], &t1[i], t2);
  22045. sp_256_mask_8(t2, d, t1[8 + i]);
  22046. t1[8 + i] += sp_256_add_8(&t1[i], &t1[i], t2);
  22047. }
  22048. r1 = sp_256_cmp_8(t1, d) >= 0;
  22049. sp_256_cond_sub_8(r, t1, d, (sp_digit)0 - r1);
  22050. return MP_OKAY;
  22051. }
  22052. /* Reduce a modulo m into r. (r = a mod m)
  22053. *
  22054. * r A single precision number that is the reduced result.
  22055. * a A single precision number that is to be reduced.
  22056. * m A single precision number that is the modulus to reduce with.
  22057. * returns MP_OKAY indicating success.
  22058. */
  22059. static WC_INLINE int sp_256_mod_8(sp_digit* r, const sp_digit* a, const sp_digit* m)
  22060. {
  22061. return sp_256_div_8(a, m, NULL, r);
  22062. }
  22063. #endif
  22064. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  22065. /* Multiply two number mod the order of P256 curve. (r = a * b mod order)
  22066. *
  22067. * r Result of the multiplication.
  22068. * a First operand of the multiplication.
  22069. * b Second operand of the multiplication.
  22070. */
  22071. static void sp_256_mont_mul_order_8(sp_digit* r, const sp_digit* a, const sp_digit* b)
  22072. {
  22073. sp_256_mul_8(r, a, b);
  22074. sp_256_mont_reduce_order_8(r, p256_order, p256_mp_order);
  22075. }
  22076. #if defined(HAVE_ECC_SIGN) || (defined(HAVE_ECC_VERIFY) && defined(WOLFSSL_SP_SMALL))
  22077. #ifdef WOLFSSL_SP_SMALL
  22078. /* Order-2 for the P256 curve. */
  22079. static const uint32_t p256_order_minus_2[8] = {
  22080. 0xfc63254fU,0xf3b9cac2U,0xa7179e84U,0xbce6faadU,0xffffffffU,0xffffffffU,
  22081. 0x00000000U,0xffffffffU
  22082. };
  22083. #else
  22084. /* The low half of the order-2 of the P256 curve. */
  22085. static const sp_int_digit p256_order_low[4] = {
  22086. 0xfc63254fU,0xf3b9cac2U,0xa7179e84U,0xbce6faadU
  22087. };
  22088. #endif /* WOLFSSL_SP_SMALL */
  22089. /* Square number mod the order of P256 curve. (r = a * a mod order)
  22090. *
  22091. * r Result of the squaring.
  22092. * a Number to square.
  22093. */
  22094. static void sp_256_mont_sqr_order_8(sp_digit* r, const sp_digit* a)
  22095. {
  22096. sp_256_sqr_8(r, a);
  22097. sp_256_mont_reduce_order_8(r, p256_order, p256_mp_order);
  22098. }
  22099. #ifndef WOLFSSL_SP_SMALL
  22100. /* Square number mod the order of P256 curve a number of times.
  22101. * (r = a ^ n mod order)
  22102. *
  22103. * r Result of the squaring.
  22104. * a Number to square.
  22105. */
  22106. static void sp_256_mont_sqr_n_order_8(sp_digit* r, const sp_digit* a, int n)
  22107. {
  22108. int i;
  22109. sp_256_mont_sqr_order_8(r, a);
  22110. for (i=1; i<n; i++) {
  22111. sp_256_mont_sqr_order_8(r, r);
  22112. }
  22113. }
  22114. #endif /* !WOLFSSL_SP_SMALL */
  /* Invert the number, in Montgomery form, modulo the order of the P256 curve.
   * (r = 1 / a mod order)
   *
   * r   Inverse result.
   * a   Number to invert.
   * td  Temporary data.
   */
  #ifdef WOLFSSL_SP_NONBLOCK
  /* Progress of a non-blocking inversion, kept between calls. */
  typedef struct sp_256_mont_inv_order_8_ctx {
      int state;  /* Step to run on the next call. */
      int i;      /* Index of the exponent bit currently being processed. */
  } sp_256_mont_inv_order_8_ctx;

  /* Non-blocking inversion modulo the order of the P256 curve.
   *
   * Raises a to the power (order - 2) by square-and-multiply, performing at
   * most one Montgomery squaring or multiplication per call. The context must
   * be zeroed before the first call.
   *
   * sp_ctx  Context holding the state between calls.
   * r       Inverse result; only written by the final call.
   * a       Number to invert, in Montgomery form.
   * t       Temporary data holding the running value.
   * returns FP_WOULDBLOCK while more calls are needed and MP_OKAY when r has
   * been written.
   */
  static int sp_256_mont_inv_order_8_nb(sp_ecc_ctx_t* sp_ctx, sp_digit* r, const sp_digit* a,
          sp_digit* t)
  {
      int err = FP_WOULDBLOCK;
      sp_256_mont_inv_order_8_ctx* ctx = (sp_256_mont_inv_order_8_ctx*)sp_ctx;

      /* Compile-time check: the array size is negative (an error) when this
       * context is not smaller than the generic context. */
      typedef char ctx_size_test[sizeof(sp_256_mont_inv_order_8_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
      (void)sizeof(ctx_size_test);

      switch (ctx->state) {
      case 0:
          /* Starting with t = a accounts for the top exponent bit (255). */
          XMEMCPY(t, a, sizeof(sp_digit) * 8);
          ctx->i = 254;
          ctx->state = 1;
          break;
      case 1:
          sp_256_mont_sqr_order_8(t, t);
          ctx->state = 2;
          break;
      case 2:
          if ((p256_order_minus_2[ctx->i / 32] & ((sp_int_digit)1 << (ctx->i % 32))) != 0) {
              sp_256_mont_mul_order_8(t, t, a);
          }
          ctx->i--;
          /* Bit 0 has to be processed as well, exactly as the blocking loop
           * (i = 254 .. 0) does. Stopping when i reached 0 skipped it and
           * produced a^((order-3)/2), which is only +/- the inverse. */
          ctx->state = (ctx->i < 0) ? 3 : 1;
          break;
      case 3:
          XMEMCPY(r, t, sizeof(sp_digit) * 8U);
          err = MP_OKAY;
          break;
      }

      return err;
  }
  #endif /* WOLFSSL_SP_NONBLOCK */
  22159. static void sp_256_mont_inv_order_8(sp_digit* r, const sp_digit* a,
  22160. sp_digit* td)
  22161. {
  22162. #ifdef WOLFSSL_SP_SMALL
  22163. sp_digit* t = td;
  22164. int i;
  22165. XMEMCPY(t, a, sizeof(sp_digit) * 8);
  22166. for (i=254; i>=0; i--) {
  22167. sp_256_mont_sqr_order_8(t, t);
  22168. if ((p256_order_minus_2[i / 32] & ((sp_int_digit)1 << (i % 32))) != 0) {
  22169. sp_256_mont_mul_order_8(t, t, a);
  22170. }
  22171. }
  22172. XMEMCPY(r, t, sizeof(sp_digit) * 8U);
  22173. #else
  22174. sp_digit* t = td;
  22175. sp_digit* t2 = td + 2 * 8;
  22176. sp_digit* t3 = td + 4 * 8;
  22177. int i;
  22178. /* t = a^2 */
  22179. sp_256_mont_sqr_order_8(t, a);
  22180. /* t = a^3 = t * a */
  22181. sp_256_mont_mul_order_8(t, t, a);
  22182. /* t2= a^c = t ^ 2 ^ 2 */
  22183. sp_256_mont_sqr_n_order_8(t2, t, 2);
  22184. /* t3= a^f = t2 * t */
  22185. sp_256_mont_mul_order_8(t3, t2, t);
  22186. /* t2= a^f0 = t3 ^ 2 ^ 4 */
  22187. sp_256_mont_sqr_n_order_8(t2, t3, 4);
  22188. /* t = a^ff = t2 * t3 */
  22189. sp_256_mont_mul_order_8(t, t2, t3);
  22190. /* t3= a^ff00 = t ^ 2 ^ 8 */
  22191. sp_256_mont_sqr_n_order_8(t2, t, 8);
  22192. /* t = a^ffff = t2 * t */
  22193. sp_256_mont_mul_order_8(t, t2, t);
  22194. /* t2= a^ffff0000 = t ^ 2 ^ 16 */
  22195. sp_256_mont_sqr_n_order_8(t2, t, 16);
  22196. /* t = a^ffffffff = t2 * t */
  22197. sp_256_mont_mul_order_8(t, t2, t);
  22198. /* t2= a^ffffffff0000000000000000 = t ^ 2 ^ 64 */
  22199. sp_256_mont_sqr_n_order_8(t2, t, 64);
  22200. /* t2= a^ffffffff00000000ffffffff = t2 * t */
  22201. sp_256_mont_mul_order_8(t2, t2, t);
  22202. /* t2= a^ffffffff00000000ffffffff00000000 = t2 ^ 2 ^ 32 */
  22203. sp_256_mont_sqr_n_order_8(t2, t2, 32);
  22204. /* t2= a^ffffffff00000000ffffffffffffffff = t2 * t */
  22205. sp_256_mont_mul_order_8(t2, t2, t);
  22206. /* t2= a^ffffffff00000000ffffffffffffffffbce6 */
  22207. for (i=127; i>=112; i--) {
  22208. sp_256_mont_sqr_order_8(t2, t2);
  22209. if ((p256_order_low[i / 32] & ((sp_int_digit)1 << (i % 32))) != 0) {
  22210. sp_256_mont_mul_order_8(t2, t2, a);
  22211. }
  22212. }
  22213. /* t2= a^ffffffff00000000ffffffffffffffffbce6f */
  22214. sp_256_mont_sqr_n_order_8(t2, t2, 4);
  22215. sp_256_mont_mul_order_8(t2, t2, t3);
  22216. /* t2= a^ffffffff00000000ffffffffffffffffbce6faada7179e84 */
  22217. for (i=107; i>=64; i--) {
  22218. sp_256_mont_sqr_order_8(t2, t2);
  22219. if ((p256_order_low[i / 32] & ((sp_int_digit)1 << (i % 32))) != 0) {
  22220. sp_256_mont_mul_order_8(t2, t2, a);
  22221. }
  22222. }
  22223. /* t2= a^ffffffff00000000ffffffffffffffffbce6faada7179e84f */
  22224. sp_256_mont_sqr_n_order_8(t2, t2, 4);
  22225. sp_256_mont_mul_order_8(t2, t2, t3);
  22226. /* t2= a^ffffffff00000000ffffffffffffffffbce6faada7179e84f3b9cac2 */
  22227. for (i=59; i>=32; i--) {
  22228. sp_256_mont_sqr_order_8(t2, t2);
  22229. if ((p256_order_low[i / 32] & ((sp_int_digit)1 << (i % 32))) != 0) {
  22230. sp_256_mont_mul_order_8(t2, t2, a);
  22231. }
  22232. }
  22233. /* t2= a^ffffffff00000000ffffffffffffffffbce6faada7179e84f3b9cac2f */
  22234. sp_256_mont_sqr_n_order_8(t2, t2, 4);
  22235. sp_256_mont_mul_order_8(t2, t2, t3);
  22236. /* t2= a^ffffffff00000000ffffffffffffffffbce6faada7179e84f3b9cac2fc63254 */
  22237. for (i=27; i>=0; i--) {
  22238. sp_256_mont_sqr_order_8(t2, t2);
  22239. if ((p256_order_low[i / 32] & ((sp_int_digit)1 << (i % 32))) != 0) {
  22240. sp_256_mont_mul_order_8(t2, t2, a);
  22241. }
  22242. }
  22243. /* t2= a^ffffffff00000000ffffffffffffffffbce6faada7179e84f3b9cac2fc632540 */
  22244. sp_256_mont_sqr_n_order_8(t2, t2, 4);
  22245. /* r = a^ffffffff00000000ffffffffffffffffbce6faada7179e84f3b9cac2fc63254f */
  22246. sp_256_mont_mul_order_8(r, t2, t3);
  22247. #endif /* WOLFSSL_SP_SMALL */
  22248. }
  22249. #endif /* HAVE_ECC_SIGN || (HAVE_ECC_VERIFY && WOLFSSL_SP_SMALL) */
  22250. #endif /* HAVE_ECC_SIGN | HAVE_ECC_VERIFY */
  22251. #ifdef HAVE_ECC_SIGN
  22252. #ifndef SP_ECC_MAX_SIG_GEN
  22253. #define SP_ECC_MAX_SIG_GEN 64
  22254. #endif
  22255. /* Calculate second signature value S from R, k and private value.
  22256. *
  22257. * s = (r * x + e) / k
  22258. *
  22259. * s Signature value.
  22260. * r First signature value.
  22261. * k Ephemeral private key.
  22262. * x Private key as a number.
  22263. * e Hash of message as a number.
  22264. * tmp Temporary storage for intermediate numbers.
  22265. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  22266. */
  22267. static int sp_256_calc_s_8(sp_digit* s, const sp_digit* r, sp_digit* k,
  22268. sp_digit* x, const sp_digit* e, sp_digit* tmp)
  22269. {
  22270. int err;
  22271. sp_digit carry;
  22272. sp_int32 c;
  22273. sp_digit* kInv = k;
  22274. /* Conv k to Montgomery form (mod order) */
  22275. sp_256_mul_8(k, k, p256_norm_order);
  22276. err = sp_256_mod_8(k, k, p256_order);
  22277. if (err == MP_OKAY) {
  22278. sp_256_norm_8(k);
  22279. /* kInv = 1/k mod order */
  22280. sp_256_mont_inv_order_8(kInv, k, tmp);
  22281. sp_256_norm_8(kInv);
  22282. /* s = r * x + e */
  22283. sp_256_mul_8(x, x, r);
  22284. err = sp_256_mod_8(x, x, p256_order);
  22285. }
  22286. if (err == MP_OKAY) {
  22287. sp_256_norm_8(x);
  22288. carry = sp_256_add_8(s, e, x);
  22289. sp_256_cond_sub_8(s, s, p256_order, 0 - carry);
  22290. sp_256_norm_8(s);
  22291. c = sp_256_cmp_8(s, p256_order);
  22292. sp_256_cond_sub_8(s, s, p256_order,
  22293. (sp_digit)0 - (sp_digit)(c >= 0));
  22294. sp_256_norm_8(s);
  22295. /* s = s * k^-1 mod order */
  22296. sp_256_mont_mul_order_8(s, s, kInv);
  22297. sp_256_norm_8(s);
  22298. }
  22299. return err;
  22300. }
  /* Sign the hash using the private key.
   *   e = [hash, 256 bits] from binary
   *   r = (k.G)->x mod order
   *   s = (r * x + e) / k mod order
   * The hash is truncated to the first 256 bits.
   *
   * hash     Hash to sign.
   * hashLen  Length of the hash data.
   * rng      Random number generator.
   * priv     Private part of key - scalar.
   * rm       First part of result as an mp_int.
   * sm       Second part of result as an mp_int.
   * km       Optional ephemeral key. When not NULL and not zero it is used
   *          instead of a random one and is zeroed once it has been read.
   * heap     Heap to use for allocation.
   * returns RNG failures, MEMORY_E when memory allocation fails and
   * MP_OKAY on success.
   */
  #ifdef WOLFSSL_SP_NONBLOCK
  /* State of a non-blocking P256 signing operation, kept between calls. */
  typedef struct sp_ecc_sign_256_ctx {
      int state;              /* Step to run on the next call. */
      union {                 /* Sub-operation contexts; one in use at a time. */
          sp_256_ecc_mulmod_8_ctx mulmod_ctx;
          sp_256_mont_inv_order_8_ctx mont_inv_order_ctx;
      };
      sp_digit e[2*8];        /* Hash as a number; reused for s. */
      sp_digit x[2*8];        /* Private key; becomes r * x mod order. */
      sp_digit k[2*8];        /* Ephemeral key; reused for its inverse. */
      sp_digit r[2*8];        /* First signature value. */
      sp_digit tmp[3 * 2*8];  /* Scratch for the inversion. */
      sp_point_256 point;     /* k.G */
      sp_digit* s;            /* Points at e. */
      sp_digit* kInv;         /* Points at k. */
      int i;                  /* Remaining signature generation attempts. */
  } sp_ecc_sign_256_ctx;

  /* Non-blocking variant of the signing operation described above.
   *
   * Each call performs one step of the state machine held in sp_ctx. The
   * context data must be zeroed before the first call.
   *
   * returns FP_WOULDBLOCK while more calls are needed, MP_OKAY once rm and sm
   * have been written, and an error code otherwise. Secret intermediate data
   * in the context is wiped whenever the result is not FP_WOULDBLOCK.
   */
  int sp_ecc_sign_256_nb(sp_ecc_ctx_t* sp_ctx, const byte* hash, word32 hashLen, WC_RNG* rng,
      mp_int* priv, mp_int* rm, mp_int* sm, mp_int* km, void* heap)
  {
      int err = FP_WOULDBLOCK;
      sp_ecc_sign_256_ctx* ctx = (sp_ecc_sign_256_ctx*)sp_ctx->data;

      /* Compile-time check: the array size is negative (an error) when this
       * context is not smaller than the generic context. */
      typedef char ctx_size_test[sizeof(sp_ecc_sign_256_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
      (void)sizeof(ctx_size_test);

      (void)heap;

      switch (ctx->state) {
      case 0: /* INIT */
          ctx->s = ctx->e;
          ctx->kInv = ctx->k;
          ctx->i = SP_ECC_MAX_SIG_GEN;
          ctx->state = 1;
          break;
      case 1: /* GEN */
          /* New random point. */
          if (km == NULL || mp_iszero(km)) {
              err = sp_256_ecc_gen_k_8(rng, ctx->k);
          }
          else {
              sp_256_from_mp(ctx->k, 8, km);
              mp_zero(km);
          }
          XMEMSET(&ctx->mulmod_ctx, 0, sizeof(ctx->mulmod_ctx));
          ctx->state = 2;
          break;
      case 2: /* MULMOD */
          err = sp_256_ecc_mulmod_8_nb((sp_ecc_ctx_t*)&ctx->mulmod_ctx,
              &ctx->point, &p256_base, ctx->k, 1, 1, heap);
          if (err == MP_OKAY) {
              ctx->state = 3;
          }
          break;
      case 3: /* MODORDER */
      {
          sp_int32 c;
          /* r = point->x mod order */
          XMEMCPY(ctx->r, ctx->point.x, sizeof(sp_digit) * 8U);
          sp_256_norm_8(ctx->r);
          c = sp_256_cmp_8(ctx->r, p256_order);
          sp_256_cond_sub_8(ctx->r, ctx->r, p256_order,
              (sp_digit)0 - (sp_digit)(c >= 0));
          sp_256_norm_8(ctx->r);

          if (hashLen > 32U) {
              hashLen = 32U;
          }
          /* x and e are (re)loaded on every attempt: a previous attempt
           * overwrote x with r * x and e with s. */
          sp_256_from_mp(ctx->x, 8, priv);
          sp_256_from_bin(ctx->e, 8, hash, (int)hashLen);
          ctx->state = 4;
          break;
      }
      case 4: /* KMODORDER */
          /* Conv k to Montgomery form (mod order) */
          sp_256_mul_8(ctx->k, ctx->k, p256_norm_order);
          err = sp_256_mod_8(ctx->k, ctx->k, p256_order);
          if (err == MP_OKAY) {
              sp_256_norm_8(ctx->k);
              XMEMSET(&ctx->mont_inv_order_ctx, 0, sizeof(ctx->mont_inv_order_ctx));
              ctx->state = 5;
          }
          break;
      case 5: /* KINV */
          /* kInv = 1/k mod order */
          err = sp_256_mont_inv_order_8_nb((sp_ecc_ctx_t*)&ctx->mont_inv_order_ctx, ctx->kInv, ctx->k, ctx->tmp);
          if (err == MP_OKAY) {
              XMEMSET(&ctx->mont_inv_order_ctx, 0, sizeof(ctx->mont_inv_order_ctx));
              ctx->state = 6;
          }
          break;
      case 6: /* KINVNORM */
          sp_256_norm_8(ctx->kInv);
          ctx->state = 7;
          break;
      case 7: /* R */
          /* s = r * x + e */
          sp_256_mul_8(ctx->x, ctx->x, ctx->r);
          ctx->state = 8;
          break;
      case 8: /* S1 */
          err = sp_256_mod_8(ctx->x, ctx->x, p256_order);
          if (err == MP_OKAY)
              ctx->state = 9;
          break;
      case 9: /* S2 */
      {
          sp_digit carry;
          sp_int32 c;
          sp_256_norm_8(ctx->x);
          carry = sp_256_add_8(ctx->s, ctx->e, ctx->x);
          sp_256_cond_sub_8(ctx->s, ctx->s,
              p256_order, 0 - carry);
          sp_256_norm_8(ctx->s);
          c = sp_256_cmp_8(ctx->s, p256_order);
          sp_256_cond_sub_8(ctx->s, ctx->s, p256_order,
              (sp_digit)0 - (sp_digit)(c >= 0));
          sp_256_norm_8(ctx->s);

          /* s = s * k^-1 mod order */
          sp_256_mont_mul_order_8(ctx->s, ctx->s, ctx->kInv);
          sp_256_norm_8(ctx->s);

          /* Check that signature is usable. */
          if (sp_256_iszero_8(ctx->s) == 0) {
              ctx->state = 10;
              break;
          }
      #ifdef WOLFSSL_ECDSA_SET_K_ONE_LOOP
          /* Only one attempt is allowed: force the counter to run out. */
          ctx->i = 1;
      #endif

          /* not usable gen, try again */
          ctx->i--;
          if (ctx->i == 0) {
              err = RNG_FAILURE_E;
          }
          ctx->state = 1;
          break;
      }
      case 10: /* RES */
          err = sp_256_to_mp(ctx->r, rm);
          if (err == MP_OKAY) {
              err = sp_256_to_mp(ctx->s, sm);
          }
          break;
      }

      /* Any step other than the last that succeeded still needs more calls. */
      if (err == MP_OKAY && ctx->state != 10) {
          err = FP_WOULDBLOCK;
      }
      if (err != FP_WOULDBLOCK) {
          /* Finished or failed: wipe the secret material the same way the
           * blocking implementation does (ForceZero, including the point). */
          ForceZero(ctx->e, sizeof(ctx->e));
          ForceZero(ctx->x, sizeof(ctx->x));
          ForceZero(ctx->k, sizeof(ctx->k));
          ForceZero(ctx->r, sizeof(ctx->r));
          ForceZero(ctx->tmp, sizeof(ctx->tmp));
          ForceZero(&ctx->point, sizeof(ctx->point));
      }

      return err;
  }
  #endif /* WOLFSSL_SP_NONBLOCK */
  22470. int sp_ecc_sign_256(const byte* hash, word32 hashLen, WC_RNG* rng,
  22471. const mp_int* priv, mp_int* rm, mp_int* sm, mp_int* km, void* heap)
  22472. {
  22473. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  22474. sp_digit* e = NULL;
  22475. sp_point_256* point = NULL;
  22476. #else
  22477. sp_digit e[7 * 2 * 8];
  22478. sp_point_256 point[1];
  22479. #endif
  22480. sp_digit* x = NULL;
  22481. sp_digit* k = NULL;
  22482. sp_digit* r = NULL;
  22483. sp_digit* tmp = NULL;
  22484. sp_digit* s = NULL;
  22485. sp_int32 c;
  22486. int err = MP_OKAY;
  22487. int i;
  22488. (void)heap;
  22489. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  22490. if (err == MP_OKAY) {
  22491. point = (sp_point_256*)XMALLOC(sizeof(sp_point_256), heap,
  22492. DYNAMIC_TYPE_ECC);
  22493. if (point == NULL)
  22494. err = MEMORY_E;
  22495. }
  22496. if (err == MP_OKAY) {
  22497. e = (sp_digit*)XMALLOC(sizeof(sp_digit) * 7 * 2 * 8, heap,
  22498. DYNAMIC_TYPE_ECC);
  22499. if (e == NULL)
  22500. err = MEMORY_E;
  22501. }
  22502. #endif
  22503. if (err == MP_OKAY) {
  22504. x = e + 2 * 8;
  22505. k = e + 4 * 8;
  22506. r = e + 6 * 8;
  22507. tmp = e + 8 * 8;
  22508. s = e;
  22509. if (hashLen > 32U) {
  22510. hashLen = 32U;
  22511. }
  22512. }
  22513. for (i = SP_ECC_MAX_SIG_GEN; err == MP_OKAY && i > 0; i--) {
  22514. /* New random point. */
  22515. if (km == NULL || mp_iszero(km)) {
  22516. err = sp_256_ecc_gen_k_8(rng, k);
  22517. }
  22518. else {
  22519. sp_256_from_mp(k, 8, km);
  22520. mp_zero(km);
  22521. }
  22522. if (err == MP_OKAY) {
  22523. err = sp_256_ecc_mulmod_base_8(point, k, 1, 1, heap);
  22524. }
  22525. if (err == MP_OKAY) {
  22526. /* r = point->x mod order */
  22527. XMEMCPY(r, point->x, sizeof(sp_digit) * 8U);
  22528. sp_256_norm_8(r);
  22529. c = sp_256_cmp_8(r, p256_order);
  22530. sp_256_cond_sub_8(r, r, p256_order,
  22531. (sp_digit)0 - (sp_digit)(c >= 0));
  22532. sp_256_norm_8(r);
  22533. sp_256_from_mp(x, 8, priv);
  22534. sp_256_from_bin(e, 8, hash, (int)hashLen);
  22535. err = sp_256_calc_s_8(s, r, k, x, e, tmp);
  22536. }
  22537. /* Check that signature is usable. */
  22538. if ((err == MP_OKAY) && (sp_256_iszero_8(s) == 0)) {
  22539. break;
  22540. }
  22541. #ifdef WOLFSSL_ECDSA_SET_K_ONE_LOOP
  22542. i = 1;
  22543. #endif
  22544. }
  22545. if (i == 0) {
  22546. err = RNG_FAILURE_E;
  22547. }
  22548. if (err == MP_OKAY) {
  22549. err = sp_256_to_mp(r, rm);
  22550. }
  22551. if (err == MP_OKAY) {
  22552. err = sp_256_to_mp(s, sm);
  22553. }
  22554. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  22555. if (e != NULL)
  22556. #endif
  22557. {
  22558. ForceZero(e, sizeof(sp_digit) * 7 * 2 * 8);
  22559. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  22560. XFREE(e, heap, DYNAMIC_TYPE_ECC);
  22561. #endif
  22562. }
  22563. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  22564. if (point != NULL)
  22565. #endif
  22566. {
  22567. ForceZero(point, sizeof(sp_point_256));
  22568. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  22569. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  22570. #endif
  22571. }
  22572. return err;
  22573. }
  22574. #endif /* HAVE_ECC_SIGN */
  22575. #ifndef WOLFSSL_SP_SMALL
  22576. static void sp_256_rshift1_8(sp_digit* r, const sp_digit* a)
  22577. {
  22578. __asm__ __volatile__ (
  22579. "mov r10, #0\n\t"
  22580. "mov r9, #0\n\t"
  22581. "ldr r3, [%[a], #16]\n\t"
  22582. "ldr r4, [%[a], #20]\n\t"
  22583. "ldr r5, [%[a], #24]\n\t"
  22584. "ldr r6, [%[a], #28]\n\t"
  22585. "lsr r7, r3, #1\n\t"
  22586. "and r3, r3, #1\n\t"
  22587. "lsr r8, r4, #1\n\t"
  22588. "lsr r10, r5, #1\n\t"
  22589. "lsr r14, r6, #1\n\t"
  22590. "orr r7, r7, r4, lsl #31\n\t"
  22591. "orr r8, r8, r5, lsl #31\n\t"
  22592. "orr r10, r10, r6, lsl #31\n\t"
  22593. "orr r14, r14, r9, lsl #31\n\t"
  22594. "mov r9, r3\n\t"
  22595. "str r7, [%[r], #16]\n\t"
  22596. "str r8, [%[r], #20]\n\t"
  22597. "str r10, [%[r], #24]\n\t"
  22598. "str r14, [%[r], #28]\n\t"
  22599. "ldr r3, [%[r], #0]\n\t"
  22600. "ldr r4, [%[r], #4]\n\t"
  22601. "ldr r5, [%[r], #8]\n\t"
  22602. "ldr r6, [%[r], #12]\n\t"
  22603. "lsr r7, r3, #1\n\t"
  22604. "lsr r8, r4, #1\n\t"
  22605. "lsr r10, r5, #1\n\t"
  22606. "lsr r14, r6, #1\n\t"
  22607. "orr r7, r7, r4, lsl #31\n\t"
  22608. "orr r8, r8, r5, lsl #31\n\t"
  22609. "orr r10, r10, r6, lsl #31\n\t"
  22610. "orr r14, r14, r9, lsl #31\n\t"
  22611. "str r7, [%[r], #0]\n\t"
  22612. "str r8, [%[r], #4]\n\t"
  22613. "str r10, [%[r], #8]\n\t"
  22614. "str r14, [%[r], #12]\n\t"
  22615. :
  22616. : [r] "r" (r), [a] "r" (a)
  22617. : "memory", "r3", "r4", "r5", "r6", "r7", "r8", "r10", "r14", "r9"
  22618. );
  22619. }
  22620. /* Divide the number by 2 mod the modulus. (r = a / 2 % m)
  22621. *
  22622. * r Result of division by 2.
  22623. * a Number to divide.
  22624. * m Modulus.
  22625. */
  22626. static void sp_256_div2_mod_8(sp_digit* r, const sp_digit* a, const sp_digit* m)
  22627. {
  22628. __asm__ __volatile__ (
  22629. "mov r10, #0\n\t"
  22630. "ldr r3, [%[a], #0]\n\t"
  22631. "ands r9, r3, #1\n\t"
  22632. "beq 1f\n\t"
  22633. "ldr r4, [%[a], #4]\n\t"
  22634. "ldr r5, [%[a], #8]\n\t"
  22635. "ldr r6, [%[a], #12]\n\t"
  22636. "ldr r7, [%[m], #0]\n\t"
  22637. "ldr r8, [%[m], #4]\n\t"
  22638. "ldr r10, [%[m], #8]\n\t"
  22639. "ldr r14, [%[m], #12]\n\t"
  22640. "adds r3, r3, r7\n\t"
  22641. "adcs r4, r4, r8\n\t"
  22642. "adcs r5, r5, r10\n\t"
  22643. "adcs r6, r6, r14\n\t"
  22644. "str r3, [%[r], #0]\n\t"
  22645. "str r4, [%[r], #4]\n\t"
  22646. "str r5, [%[r], #8]\n\t"
  22647. "str r6, [%[r], #12]\n\t"
  22648. "ldr r3, [%[a], #16]\n\t"
  22649. "ldr r4, [%[a], #20]\n\t"
  22650. "ldr r5, [%[a], #24]\n\t"
  22651. "ldr r6, [%[a], #28]\n\t"
  22652. "ldr r7, [%[m], #16]\n\t"
  22653. "ldr r8, [%[m], #20]\n\t"
  22654. "ldr r10, [%[m], #24]\n\t"
  22655. "ldr r14, [%[m], #28]\n\t"
  22656. "adcs r3, r3, r7\n\t"
  22657. "adcs r4, r4, r8\n\t"
  22658. "adcs r5, r5, r10\n\t"
  22659. "adcs r6, r6, r14\n\t"
  22660. "adc r9, r10, r10\n\t"
  22661. "b 2f\n\t"
  22662. "\n1:\n\t"
  22663. "ldr r3, [%[a], #16]\n\t"
  22664. "ldr r4, [%[a], #20]\n\t"
  22665. "ldr r5, [%[a], #24]\n\t"
  22666. "ldr r6, [%[a], #28]\n\t"
  22667. "\n2:\n\t"
  22668. "lsr r7, r3, #1\n\t"
  22669. "and r3, r3, #1\n\t"
  22670. "lsr r8, r4, #1\n\t"
  22671. "lsr r10, r5, #1\n\t"
  22672. "lsr r14, r6, #1\n\t"
  22673. "orr r7, r7, r4, lsl #31\n\t"
  22674. "orr r8, r8, r5, lsl #31\n\t"
  22675. "orr r10, r10, r6, lsl #31\n\t"
  22676. "orr r14, r14, r9, lsl #31\n\t"
  22677. "mov r9, r3\n\t"
  22678. "str r7, [%[r], #16]\n\t"
  22679. "str r8, [%[r], #20]\n\t"
  22680. "str r10, [%[r], #24]\n\t"
  22681. "str r14, [%[r], #28]\n\t"
  22682. "ldr r3, [%[r], #0]\n\t"
  22683. "ldr r4, [%[r], #4]\n\t"
  22684. "ldr r5, [%[r], #8]\n\t"
  22685. "ldr r6, [%[r], #12]\n\t"
  22686. "lsr r7, r3, #1\n\t"
  22687. "lsr r8, r4, #1\n\t"
  22688. "lsr r10, r5, #1\n\t"
  22689. "lsr r14, r6, #1\n\t"
  22690. "orr r7, r7, r4, lsl #31\n\t"
  22691. "orr r8, r8, r5, lsl #31\n\t"
  22692. "orr r10, r10, r6, lsl #31\n\t"
  22693. "orr r14, r14, r9, lsl #31\n\t"
  22694. "str r7, [%[r], #0]\n\t"
  22695. "str r8, [%[r], #4]\n\t"
  22696. "str r10, [%[r], #8]\n\t"
  22697. "str r14, [%[r], #12]\n\t"
  22698. :
  22699. : [r] "r" (r), [a] "r" (a), [m] "r" (m)
  22700. : "memory", "r3", "r4", "r5", "r6", "r7", "r8", "r10", "r14", "r9"
  22701. );
  22702. }
  22703. static int sp_256_num_bits_8(sp_digit* a)
  22704. {
  22705. int r = 0;
  22706. __asm__ __volatile__ (
  22707. "ldr r2, [%[a], #28]\n\t"
  22708. "cmp r2, #0\n\t"
  22709. "beq 7f\n\t"
  22710. "mov r3, #256\n\t"
  22711. "clz %[r], r2\n\t"
  22712. "sub %[r], r3, %[r]\n\t"
  22713. "b 9f\n\t"
  22714. "\n7:\n\t"
  22715. "ldr r2, [%[a], #24]\n\t"
  22716. "cmp r2, #0\n\t"
  22717. "beq 6f\n\t"
  22718. "mov r3, #224\n\t"
  22719. "clz %[r], r2\n\t"
  22720. "sub %[r], r3, %[r]\n\t"
  22721. "b 9f\n\t"
  22722. "\n6:\n\t"
  22723. "ldr r2, [%[a], #20]\n\t"
  22724. "cmp r2, #0\n\t"
  22725. "beq 5f\n\t"
  22726. "mov r3, #192\n\t"
  22727. "clz %[r], r2\n\t"
  22728. "sub %[r], r3, %[r]\n\t"
  22729. "b 9f\n\t"
  22730. "\n5:\n\t"
  22731. "ldr r2, [%[a], #16]\n\t"
  22732. "cmp r2, #0\n\t"
  22733. "beq 4f\n\t"
  22734. "mov r3, #160\n\t"
  22735. "clz %[r], r2\n\t"
  22736. "sub %[r], r3, %[r]\n\t"
  22737. "b 9f\n\t"
  22738. "\n4:\n\t"
  22739. "ldr r2, [%[a], #12]\n\t"
  22740. "cmp r2, #0\n\t"
  22741. "beq 3f\n\t"
  22742. "mov r3, #128\n\t"
  22743. "clz %[r], r2\n\t"
  22744. "sub %[r], r3, %[r]\n\t"
  22745. "b 9f\n\t"
  22746. "\n3:\n\t"
  22747. "ldr r2, [%[a], #8]\n\t"
  22748. "cmp r2, #0\n\t"
  22749. "beq 2f\n\t"
  22750. "mov r3, #96\n\t"
  22751. "clz %[r], r2\n\t"
  22752. "sub %[r], r3, %[r]\n\t"
  22753. "b 9f\n\t"
  22754. "\n2:\n\t"
  22755. "ldr r2, [%[a], #4]\n\t"
  22756. "cmp r2, #0\n\t"
  22757. "beq 1f\n\t"
  22758. "mov r3, #64\n\t"
  22759. "clz %[r], r2\n\t"
  22760. "sub %[r], r3, %[r]\n\t"
  22761. "b 9f\n\t"
  22762. "\n1:\n\t"
  22763. "ldr r2, [%[a], #0]\n\t"
  22764. "mov r3, #32\n\t"
  22765. "clz %[r], r2\n\t"
  22766. "sub %[r], r3, %[r]\n\t"
  22767. "\n9:\n\t"
  22768. : [r] "+r" (r)
  22769. : [a] "r" (a)
  22770. : "r2", "r3"
  22771. );
  22772. return r;
  22773. }
  22774. /* Non-constant time modular inversion.
  22775. *
  22776. * @param [out] r Resulting number.
  22777. * @param [in] a Number to invert.
  22778. * @param [in] m Modulus.
  22779. * @return MP_OKAY on success.
  22780. */
  22781. static int sp_256_mod_inv_8(sp_digit* r, const sp_digit* a, const sp_digit* m)
  22782. {
  22783. sp_digit u[8];
  22784. sp_digit v[8];
  22785. sp_digit b[8];
  22786. sp_digit d[8];
  22787. int ut, vt;
  22788. sp_digit o;
  22789. XMEMCPY(u, m, sizeof(u));
  22790. XMEMCPY(v, a, sizeof(v));
  22791. ut = sp_256_num_bits_8(u);
  22792. vt = sp_256_num_bits_8(v);
  22793. XMEMSET(b, 0, sizeof(b));
  22794. if ((v[0] & 1) == 0) {
  22795. sp_256_rshift1_8(v, v);
  22796. XMEMCPY(d, m, sizeof(u));
  22797. d[0] += 1;
  22798. sp_256_rshift1_8(d, d);
  22799. vt--;
  22800. while ((v[0] & 1) == 0) {
  22801. sp_256_rshift1_8(v, v);
  22802. sp_256_div2_mod_8(d, d, m);
  22803. vt--;
  22804. }
  22805. }
  22806. else {
  22807. XMEMSET(d+1, 0, sizeof(d)-sizeof(sp_digit));
  22808. d[0] = 1;
  22809. }
  22810. while (ut > 1 && vt > 1) {
  22811. if (ut > vt || (ut == vt && sp_256_cmp_8(u, v) >= 0)) {
  22812. sp_256_sub_8(u, u, v);
  22813. o = sp_256_sub_8(b, b, d);
  22814. if (o != 0)
  22815. sp_256_add_8(b, b, m);
  22816. ut = sp_256_num_bits_8(u);
  22817. do {
  22818. sp_256_rshift1_8(u, u);
  22819. sp_256_div2_mod_8(b, b, m);
  22820. ut--;
  22821. }
  22822. while (ut > 0 && (u[0] & 1) == 0);
  22823. }
  22824. else {
  22825. sp_256_sub_8(v, v, u);
  22826. o = sp_256_sub_8(d, d, b);
  22827. if (o != 0)
  22828. sp_256_add_8(d, d, m);
  22829. vt = sp_256_num_bits_8(v);
  22830. do {
  22831. sp_256_rshift1_8(v, v);
  22832. sp_256_div2_mod_8(d, d, m);
  22833. vt--;
  22834. }
  22835. while (vt > 0 && (v[0] & 1) == 0);
  22836. }
  22837. }
  22838. if (ut == 1)
  22839. XMEMCPY(r, b, sizeof(b));
  22840. else
  22841. XMEMCPY(r, d, sizeof(d));
  22842. return MP_OKAY;
  22843. }
  22844. #endif /* WOLFSSL_SP_SMALL */
  22845. /* Add point p1 into point p2. Handles p1 == p2 and result at infinity.
  22846. *
  22847. * p1 First point to add and holds result.
  22848. * p2 Second point to add.
  22849. * tmp Temporary storage for intermediate numbers.
  22850. */
  22851. static void sp_256_add_points_8(sp_point_256* p1, const sp_point_256* p2,
  22852. sp_digit* tmp)
  22853. {
  22854. sp_256_proj_point_add_8(p1, p1, p2, tmp);
  22855. if (sp_256_iszero_8(p1->z)) {
  22856. if (sp_256_iszero_8(p1->x) && sp_256_iszero_8(p1->y)) {
  22857. sp_256_proj_point_dbl_8(p1, p2, tmp);
  22858. }
  22859. else {
  22860. /* Y ordinate is not used from here - don't set. */
  22861. p1->x[0] = 0;
  22862. p1->x[1] = 0;
  22863. p1->x[2] = 0;
  22864. p1->x[3] = 0;
  22865. p1->x[4] = 0;
  22866. p1->x[5] = 0;
  22867. p1->x[6] = 0;
  22868. p1->x[7] = 0;
  22869. XMEMCPY(p1->z, p256_norm_mod, sizeof(p256_norm_mod));
  22870. }
  22871. }
  22872. }
  22873. /* Calculate the verification point: [e/s]G + [r/s]Q
  22874. *
  22875. * p1 Calculated point.
  22876. * p2 Public point and temporary.
  22877. * s Second part of signature as a number.
  22878. * u1 Temporary number.
  22879. * u2 Temproray number.
  22880. * heap Heap to use for allocation.
  22881. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  22882. */
  22883. static int sp_256_calc_vfy_point_8(sp_point_256* p1, sp_point_256* p2,
  22884. sp_digit* s, sp_digit* u1, sp_digit* u2, sp_digit* tmp, void* heap)
  22885. {
  22886. int err;
  22887. #ifndef WOLFSSL_SP_SMALL
  22888. err = sp_256_mod_inv_8(s, s, p256_order);
  22889. if (err == MP_OKAY)
  22890. #endif /* !WOLFSSL_SP_SMALL */
  22891. {
  22892. sp_256_mul_8(s, s, p256_norm_order);
  22893. err = sp_256_mod_8(s, s, p256_order);
  22894. }
  22895. if (err == MP_OKAY) {
  22896. sp_256_norm_8(s);
  22897. #ifdef WOLFSSL_SP_SMALL
  22898. {
  22899. sp_256_mont_inv_order_8(s, s, tmp);
  22900. sp_256_mont_mul_order_8(u1, u1, s);
  22901. sp_256_mont_mul_order_8(u2, u2, s);
  22902. }
  22903. #else
  22904. {
  22905. sp_256_mont_mul_order_8(u1, u1, s);
  22906. sp_256_mont_mul_order_8(u2, u2, s);
  22907. }
  22908. #endif /* WOLFSSL_SP_SMALL */
  22909. {
  22910. err = sp_256_ecc_mulmod_base_8(p1, u1, 0, 0, heap);
  22911. }
  22912. }
  22913. if ((err == MP_OKAY) && sp_256_iszero_8(p1->z)) {
  22914. p1->infinity = 1;
  22915. }
  22916. if (err == MP_OKAY) {
  22917. err = sp_256_ecc_mulmod_8(p2, p2, u2, 0, 0, heap);
  22918. }
  22919. if ((err == MP_OKAY) && sp_256_iszero_8(p2->z)) {
  22920. p2->infinity = 1;
  22921. }
  22922. if (err == MP_OKAY) {
  22923. sp_256_add_points_8(p1, p2, tmp);
  22924. }
  22925. return err;
  22926. }
  22927. #ifdef HAVE_ECC_VERIFY
  22928. /* Verify the signature values with the hash and public key.
  22929. * e = Truncate(hash, 256)
  22930. * u1 = e/s mod order
  22931. * u2 = r/s mod order
  22932. * r == (u1.G + u2.Q)->x mod order
  22933. * Optimization: Leave point in projective form.
  22934. * (x, y, 1) == (x' / z'*z', y' / z'*z'*z', z' / z')
  22935. * (r + n*order).z'.z' mod prime == (u1.G + u2.Q)->x'
  22936. * The hash is truncated to the first 256 bits.
  22937. *
  22938. * hash Hash to sign.
  22939. * hashLen Length of the hash data.
  22940. * rng Random number generator.
  22941. * priv Private part of key - scalar.
  22942. * rm First part of result as an mp_int.
  22943. * sm Sirst part of result as an mp_int.
  22944. * heap Heap to use for allocation.
  22945. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  22946. */
  22947. #ifdef WOLFSSL_SP_NONBLOCK
  22948. typedef struct sp_ecc_verify_256_ctx {
  22949. int state;
  22950. union {
  22951. sp_256_ecc_mulmod_8_ctx mulmod_ctx;
  22952. sp_256_mont_inv_order_8_ctx mont_inv_order_ctx;
  22953. sp_256_proj_point_dbl_8_ctx dbl_ctx;
  22954. sp_256_proj_point_add_8_ctx add_ctx;
  22955. };
  22956. sp_digit u1[2*8];
  22957. sp_digit u2[2*8];
  22958. sp_digit s[2*8];
  22959. sp_digit tmp[2*8 * 6];
  22960. sp_point_256 p1;
  22961. sp_point_256 p2;
  22962. } sp_ecc_verify_256_ctx;
  22963. int sp_ecc_verify_256_nb(sp_ecc_ctx_t* sp_ctx, const byte* hash,
  22964. word32 hashLen, const mp_int* pX, const mp_int* pY, const mp_int* pZ,
  22965. const mp_int* rm, const mp_int* sm, int* res, void* heap)
  22966. {
  22967. int err = FP_WOULDBLOCK;
  22968. sp_ecc_verify_256_ctx* ctx = (sp_ecc_verify_256_ctx*)sp_ctx->data;
  22969. typedef char ctx_size_test[sizeof(sp_ecc_verify_256_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  22970. (void)sizeof(ctx_size_test);
  22971. switch (ctx->state) {
  22972. case 0: /* INIT */
  22973. if (hashLen > 32U) {
  22974. hashLen = 32U;
  22975. }
  22976. sp_256_from_bin(ctx->u1, 8, hash, (int)hashLen);
  22977. sp_256_from_mp(ctx->u2, 8, rm);
  22978. sp_256_from_mp(ctx->s, 8, sm);
  22979. sp_256_from_mp(ctx->p2.x, 8, pX);
  22980. sp_256_from_mp(ctx->p2.y, 8, pY);
  22981. sp_256_from_mp(ctx->p2.z, 8, pZ);
  22982. ctx->state = 1;
  22983. break;
  22984. case 1: /* NORMS0 */
  22985. sp_256_mul_8(ctx->s, ctx->s, p256_norm_order);
  22986. err = sp_256_mod_8(ctx->s, ctx->s, p256_order);
  22987. if (err == MP_OKAY)
  22988. ctx->state = 2;
  22989. break;
  22990. case 2: /* NORMS1 */
  22991. sp_256_norm_8(ctx->s);
  22992. XMEMSET(&ctx->mont_inv_order_ctx, 0, sizeof(ctx->mont_inv_order_ctx));
  22993. ctx->state = 3;
  22994. break;
  22995. case 3: /* NORMS2 */
  22996. err = sp_256_mont_inv_order_8_nb((sp_ecc_ctx_t*)&ctx->mont_inv_order_ctx, ctx->s, ctx->s, ctx->tmp);
  22997. if (err == MP_OKAY) {
  22998. ctx->state = 4;
  22999. }
  23000. break;
  23001. case 4: /* NORMS3 */
  23002. sp_256_mont_mul_order_8(ctx->u1, ctx->u1, ctx->s);
  23003. ctx->state = 5;
  23004. break;
  23005. case 5: /* NORMS4 */
  23006. sp_256_mont_mul_order_8(ctx->u2, ctx->u2, ctx->s);
  23007. XMEMSET(&ctx->mulmod_ctx, 0, sizeof(ctx->mulmod_ctx));
  23008. ctx->state = 6;
  23009. break;
  23010. case 6: /* MULBASE */
  23011. err = sp_256_ecc_mulmod_8_nb((sp_ecc_ctx_t*)&ctx->mulmod_ctx, &ctx->p1, &p256_base, ctx->u1, 0, 0, heap);
  23012. if (err == MP_OKAY) {
  23013. if (sp_256_iszero_8(ctx->p1.z)) {
  23014. ctx->p1.infinity = 1;
  23015. }
  23016. XMEMSET(&ctx->mulmod_ctx, 0, sizeof(ctx->mulmod_ctx));
  23017. ctx->state = 7;
  23018. }
  23019. break;
  23020. case 7: /* MULMOD */
  23021. err = sp_256_ecc_mulmod_8_nb((sp_ecc_ctx_t*)&ctx->mulmod_ctx, &ctx->p2, &ctx->p2, ctx->u2, 0, 0, heap);
  23022. if (err == MP_OKAY) {
  23023. if (sp_256_iszero_8(ctx->p2.z)) {
  23024. ctx->p2.infinity = 1;
  23025. }
  23026. XMEMSET(&ctx->add_ctx, 0, sizeof(ctx->add_ctx));
  23027. ctx->state = 8;
  23028. }
  23029. break;
  23030. case 8: /* ADD */
  23031. err = sp_256_proj_point_add_8_nb((sp_ecc_ctx_t*)&ctx->add_ctx, &ctx->p1, &ctx->p1, &ctx->p2, ctx->tmp);
  23032. if (err == MP_OKAY)
  23033. ctx->state = 9;
  23034. break;
  23035. case 9: /* MONT */
  23036. /* (r + n*order).z'.z' mod prime == (u1.G + u2.Q)->x' */
  23037. /* Reload r and convert to Montgomery form. */
  23038. sp_256_from_mp(ctx->u2, 8, rm);
  23039. err = sp_256_mod_mul_norm_8(ctx->u2, ctx->u2, p256_mod);
  23040. if (err == MP_OKAY)
  23041. ctx->state = 10;
  23042. break;
  23043. case 10: /* SQR */
  23044. /* u1 = r.z'.z' mod prime */
  23045. sp_256_mont_sqr_8(ctx->p1.z, ctx->p1.z, p256_mod, p256_mp_mod);
  23046. ctx->state = 11;
  23047. break;
  23048. case 11: /* MUL */
  23049. sp_256_mont_mul_8(ctx->u1, ctx->u2, ctx->p1.z, p256_mod, p256_mp_mod);
  23050. ctx->state = 12;
  23051. break;
  23052. case 12: /* RES */
  23053. {
  23054. sp_int32 c = 0;
  23055. err = MP_OKAY; /* math okay, now check result */
  23056. *res = (int)(sp_256_cmp_8(ctx->p1.x, ctx->u1) == 0);
  23057. if (*res == 0) {
  23058. sp_digit carry;
  23059. /* Reload r and add order. */
  23060. sp_256_from_mp(ctx->u2, 8, rm);
  23061. carry = sp_256_add_8(ctx->u2, ctx->u2, p256_order);
  23062. /* Carry means result is greater than mod and is not valid. */
  23063. if (carry == 0) {
  23064. sp_256_norm_8(ctx->u2);
  23065. /* Compare with mod and if greater or equal then not valid. */
  23066. c = sp_256_cmp_8(ctx->u2, p256_mod);
  23067. }
  23068. }
  23069. if ((*res == 0) && (c < 0)) {
  23070. /* Convert to Montgomery form */
  23071. err = sp_256_mod_mul_norm_8(ctx->u2, ctx->u2, p256_mod);
  23072. if (err == MP_OKAY) {
  23073. /* u1 = (r + 1*order).z'.z' mod prime */
  23074. sp_256_mont_mul_8(ctx->u1, ctx->u2, ctx->p1.z, p256_mod,
  23075. p256_mp_mod);
  23076. *res = (int)(sp_256_cmp_8(ctx->p1.x, ctx->u1) == 0);
  23077. }
  23078. }
  23079. break;
  23080. }
  23081. } /* switch */
  23082. if (err == MP_OKAY && ctx->state != 12) {
  23083. err = FP_WOULDBLOCK;
  23084. }
  23085. return err;
  23086. }
  23087. #endif /* WOLFSSL_SP_NONBLOCK */
  23088. int sp_ecc_verify_256(const byte* hash, word32 hashLen, const mp_int* pX,
  23089. const mp_int* pY, const mp_int* pZ, const mp_int* rm, const mp_int* sm,
  23090. int* res, void* heap)
  23091. {
  23092. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23093. sp_digit* u1 = NULL;
  23094. sp_point_256* p1 = NULL;
  23095. #else
  23096. sp_digit u1[18 * 8];
  23097. sp_point_256 p1[2];
  23098. #endif
  23099. sp_digit* u2 = NULL;
  23100. sp_digit* s = NULL;
  23101. sp_digit* tmp = NULL;
  23102. sp_point_256* p2 = NULL;
  23103. sp_digit carry;
  23104. sp_int32 c = 0;
  23105. int err = MP_OKAY;
  23106. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23107. if (err == MP_OKAY) {
  23108. p1 = (sp_point_256*)XMALLOC(sizeof(sp_point_256) * 2, heap,
  23109. DYNAMIC_TYPE_ECC);
  23110. if (p1 == NULL)
  23111. err = MEMORY_E;
  23112. }
  23113. if (err == MP_OKAY) {
  23114. u1 = (sp_digit*)XMALLOC(sizeof(sp_digit) * 18 * 8, heap,
  23115. DYNAMIC_TYPE_ECC);
  23116. if (u1 == NULL)
  23117. err = MEMORY_E;
  23118. }
  23119. #endif
  23120. if (err == MP_OKAY) {
  23121. u2 = u1 + 2 * 8;
  23122. s = u1 + 4 * 8;
  23123. tmp = u1 + 6 * 8;
  23124. p2 = p1 + 1;
  23125. if (hashLen > 32U) {
  23126. hashLen = 32U;
  23127. }
  23128. sp_256_from_bin(u1, 8, hash, (int)hashLen);
  23129. sp_256_from_mp(u2, 8, rm);
  23130. sp_256_from_mp(s, 8, sm);
  23131. sp_256_from_mp(p2->x, 8, pX);
  23132. sp_256_from_mp(p2->y, 8, pY);
  23133. sp_256_from_mp(p2->z, 8, pZ);
  23134. err = sp_256_calc_vfy_point_8(p1, p2, s, u1, u2, tmp, heap);
  23135. }
  23136. if (err == MP_OKAY) {
  23137. /* (r + n*order).z'.z' mod prime == (u1.G + u2.Q)->x' */
  23138. /* Reload r and convert to Montgomery form. */
  23139. sp_256_from_mp(u2, 8, rm);
  23140. err = sp_256_mod_mul_norm_8(u2, u2, p256_mod);
  23141. }
  23142. if (err == MP_OKAY) {
  23143. /* u1 = r.z'.z' mod prime */
  23144. sp_256_mont_sqr_8(p1->z, p1->z, p256_mod, p256_mp_mod);
  23145. sp_256_mont_mul_8(u1, u2, p1->z, p256_mod, p256_mp_mod);
  23146. *res = (int)(sp_256_cmp_8(p1->x, u1) == 0);
  23147. if (*res == 0) {
  23148. /* Reload r and add order. */
  23149. sp_256_from_mp(u2, 8, rm);
  23150. carry = sp_256_add_8(u2, u2, p256_order);
  23151. /* Carry means result is greater than mod and is not valid. */
  23152. if (carry == 0) {
  23153. sp_256_norm_8(u2);
  23154. /* Compare with mod and if greater or equal then not valid. */
  23155. c = sp_256_cmp_8(u2, p256_mod);
  23156. }
  23157. }
  23158. if ((*res == 0) && (c < 0)) {
  23159. /* Convert to Montogomery form */
  23160. err = sp_256_mod_mul_norm_8(u2, u2, p256_mod);
  23161. if (err == MP_OKAY) {
  23162. /* u1 = (r + 1*order).z'.z' mod prime */
  23163. {
  23164. sp_256_mont_mul_8(u1, u2, p1->z, p256_mod, p256_mp_mod);
  23165. }
  23166. *res = (sp_256_cmp_8(p1->x, u1) == 0);
  23167. }
  23168. }
  23169. }
  23170. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23171. if (u1 != NULL)
  23172. XFREE(u1, heap, DYNAMIC_TYPE_ECC);
  23173. if (p1 != NULL)
  23174. XFREE(p1, heap, DYNAMIC_TYPE_ECC);
  23175. #endif
  23176. return err;
  23177. }
  23178. #endif /* HAVE_ECC_VERIFY */
  23179. #ifdef HAVE_ECC_CHECK_KEY
  23180. /* Check that the x and y oridinates are a valid point on the curve.
  23181. *
  23182. * point EC point.
  23183. * heap Heap to use if dynamically allocating.
  23184. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  23185. * not on the curve and MP_OKAY otherwise.
  23186. */
  23187. static int sp_256_ecc_is_point_8(const sp_point_256* point,
  23188. void* heap)
  23189. {
  23190. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23191. sp_digit* t1 = NULL;
  23192. #else
  23193. sp_digit t1[8 * 4];
  23194. #endif
  23195. sp_digit* t2 = NULL;
  23196. int err = MP_OKAY;
  23197. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23198. t1 = (sp_digit*)XMALLOC(sizeof(sp_digit) * 8 * 4, heap, DYNAMIC_TYPE_ECC);
  23199. if (t1 == NULL)
  23200. err = MEMORY_E;
  23201. #endif
  23202. (void)heap;
  23203. if (err == MP_OKAY) {
  23204. t2 = t1 + 2 * 8;
  23205. sp_256_sqr_8(t1, point->y);
  23206. (void)sp_256_mod_8(t1, t1, p256_mod);
  23207. sp_256_sqr_8(t2, point->x);
  23208. (void)sp_256_mod_8(t2, t2, p256_mod);
  23209. sp_256_mul_8(t2, t2, point->x);
  23210. (void)sp_256_mod_8(t2, t2, p256_mod);
  23211. (void)sp_256_sub_8(t2, p256_mod, t2);
  23212. sp_256_mont_add_8(t1, t1, t2, p256_mod);
  23213. sp_256_mont_add_8(t1, t1, point->x, p256_mod);
  23214. sp_256_mont_add_8(t1, t1, point->x, p256_mod);
  23215. sp_256_mont_add_8(t1, t1, point->x, p256_mod);
  23216. if (sp_256_cmp_8(t1, p256_b) != 0) {
  23217. err = MP_VAL;
  23218. }
  23219. }
  23220. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23221. if (t1 != NULL)
  23222. XFREE(t1, heap, DYNAMIC_TYPE_ECC);
  23223. #endif
  23224. return err;
  23225. }
  23226. /* Check that the x and y oridinates are a valid point on the curve.
  23227. *
  23228. * pX X ordinate of EC point.
  23229. * pY Y ordinate of EC point.
  23230. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  23231. * not on the curve and MP_OKAY otherwise.
  23232. */
  23233. int sp_ecc_is_point_256(const mp_int* pX, const mp_int* pY)
  23234. {
  23235. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23236. sp_point_256* pub = NULL;
  23237. #else
  23238. sp_point_256 pub[1];
  23239. #endif
  23240. const byte one[1] = { 1 };
  23241. int err = MP_OKAY;
  23242. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23243. pub = (sp_point_256*)XMALLOC(sizeof(sp_point_256), NULL,
  23244. DYNAMIC_TYPE_ECC);
  23245. if (pub == NULL)
  23246. err = MEMORY_E;
  23247. #endif
  23248. if (err == MP_OKAY) {
  23249. sp_256_from_mp(pub->x, 8, pX);
  23250. sp_256_from_mp(pub->y, 8, pY);
  23251. sp_256_from_bin(pub->z, 8, one, (int)sizeof(one));
  23252. err = sp_256_ecc_is_point_8(pub, NULL);
  23253. }
  23254. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23255. if (pub != NULL)
  23256. XFREE(pub, NULL, DYNAMIC_TYPE_ECC);
  23257. #endif
  23258. return err;
  23259. }
  23260. /* Check that the private scalar generates the EC point (px, py), the point is
  23261. * on the curve and the point has the correct order.
  23262. *
  23263. * pX X ordinate of EC point.
  23264. * pY Y ordinate of EC point.
  23265. * privm Private scalar that generates EC point.
  23266. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  23267. * not on the curve, ECC_INF_E if the point does not have the correct order,
  23268. * ECC_PRIV_KEY_E when the private scalar doesn't generate the EC point and
  23269. * MP_OKAY otherwise.
  23270. */
  23271. int sp_ecc_check_key_256(const mp_int* pX, const mp_int* pY,
  23272. const mp_int* privm, void* heap)
  23273. {
  23274. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23275. sp_digit* priv = NULL;
  23276. sp_point_256* pub = NULL;
  23277. #else
  23278. sp_digit priv[8];
  23279. sp_point_256 pub[2];
  23280. #endif
  23281. sp_point_256* p = NULL;
  23282. const byte one[1] = { 1 };
  23283. int err = MP_OKAY;
  23284. /* Quick check the lengs of public key ordinates and private key are in
  23285. * range. Proper check later.
  23286. */
  23287. if (((mp_count_bits(pX) > 256) ||
  23288. (mp_count_bits(pY) > 256) ||
  23289. ((privm != NULL) && (mp_count_bits(privm) > 256)))) {
  23290. err = ECC_OUT_OF_RANGE_E;
  23291. }
  23292. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23293. if (err == MP_OKAY) {
  23294. pub = (sp_point_256*)XMALLOC(sizeof(sp_point_256) * 2, heap,
  23295. DYNAMIC_TYPE_ECC);
  23296. if (pub == NULL)
  23297. err = MEMORY_E;
  23298. }
  23299. if (err == MP_OKAY && privm) {
  23300. priv = (sp_digit*)XMALLOC(sizeof(sp_digit) * 8, heap,
  23301. DYNAMIC_TYPE_ECC);
  23302. if (priv == NULL)
  23303. err = MEMORY_E;
  23304. }
  23305. #endif
  23306. if (err == MP_OKAY) {
  23307. p = pub + 1;
  23308. sp_256_from_mp(pub->x, 8, pX);
  23309. sp_256_from_mp(pub->y, 8, pY);
  23310. sp_256_from_bin(pub->z, 8, one, (int)sizeof(one));
  23311. if (privm)
  23312. sp_256_from_mp(priv, 8, privm);
  23313. /* Check point at infinitiy. */
  23314. if ((sp_256_iszero_8(pub->x) != 0) &&
  23315. (sp_256_iszero_8(pub->y) != 0)) {
  23316. err = ECC_INF_E;
  23317. }
  23318. }
  23319. /* Check range of X and Y */
  23320. if ((err == MP_OKAY) &&
  23321. ((sp_256_cmp_8(pub->x, p256_mod) >= 0) ||
  23322. (sp_256_cmp_8(pub->y, p256_mod) >= 0))) {
  23323. err = ECC_OUT_OF_RANGE_E;
  23324. }
  23325. if (err == MP_OKAY) {
  23326. /* Check point is on curve */
  23327. err = sp_256_ecc_is_point_8(pub, heap);
  23328. }
  23329. if (err == MP_OKAY) {
  23330. /* Point * order = infinity */
  23331. err = sp_256_ecc_mulmod_8(p, pub, p256_order, 1, 1, heap);
  23332. }
  23333. /* Check result is infinity */
  23334. if ((err == MP_OKAY) && ((sp_256_iszero_8(p->x) == 0) ||
  23335. (sp_256_iszero_8(p->y) == 0))) {
  23336. err = ECC_INF_E;
  23337. }
  23338. if (privm) {
  23339. if (err == MP_OKAY) {
  23340. /* Base * private = point */
  23341. err = sp_256_ecc_mulmod_base_8(p, priv, 1, 1, heap);
  23342. }
  23343. /* Check result is public key */
  23344. if ((err == MP_OKAY) &&
  23345. ((sp_256_cmp_8(p->x, pub->x) != 0) ||
  23346. (sp_256_cmp_8(p->y, pub->y) != 0))) {
  23347. err = ECC_PRIV_KEY_E;
  23348. }
  23349. }
  23350. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23351. if (pub != NULL)
  23352. XFREE(pub, heap, DYNAMIC_TYPE_ECC);
  23353. if (priv != NULL)
  23354. XFREE(priv, heap, DYNAMIC_TYPE_ECC);
  23355. #endif
  23356. return err;
  23357. }
  23358. #endif
  23359. #ifdef WOLFSSL_PUBLIC_ECC_ADD_DBL
  23360. /* Add two projective EC points together.
  23361. * (pX, pY, pZ) + (qX, qY, qZ) = (rX, rY, rZ)
  23362. *
  23363. * pX First EC point's X ordinate.
  23364. * pY First EC point's Y ordinate.
  23365. * pZ First EC point's Z ordinate.
  23366. * qX Second EC point's X ordinate.
  23367. * qY Second EC point's Y ordinate.
  23368. * qZ Second EC point's Z ordinate.
  23369. * rX Resultant EC point's X ordinate.
  23370. * rY Resultant EC point's Y ordinate.
  23371. * rZ Resultant EC point's Z ordinate.
  23372. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  23373. */
  23374. int sp_ecc_proj_add_point_256(mp_int* pX, mp_int* pY, mp_int* pZ,
  23375. mp_int* qX, mp_int* qY, mp_int* qZ,
  23376. mp_int* rX, mp_int* rY, mp_int* rZ)
  23377. {
  23378. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23379. sp_digit* tmp = NULL;
  23380. sp_point_256* p = NULL;
  23381. #else
  23382. sp_digit tmp[2 * 8 * 6];
  23383. sp_point_256 p[2];
  23384. #endif
  23385. sp_point_256* q = NULL;
  23386. int err = MP_OKAY;
  23387. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23388. if (err == MP_OKAY) {
  23389. p = (sp_point_256*)XMALLOC(sizeof(sp_point_256) * 2, NULL,
  23390. DYNAMIC_TYPE_ECC);
  23391. if (p == NULL)
  23392. err = MEMORY_E;
  23393. }
  23394. if (err == MP_OKAY) {
  23395. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 8 * 6, NULL,
  23396. DYNAMIC_TYPE_ECC);
  23397. if (tmp == NULL) {
  23398. err = MEMORY_E;
  23399. }
  23400. }
  23401. #endif
  23402. if (err == MP_OKAY) {
  23403. q = p + 1;
  23404. sp_256_from_mp(p->x, 8, pX);
  23405. sp_256_from_mp(p->y, 8, pY);
  23406. sp_256_from_mp(p->z, 8, pZ);
  23407. sp_256_from_mp(q->x, 8, qX);
  23408. sp_256_from_mp(q->y, 8, qY);
  23409. sp_256_from_mp(q->z, 8, qZ);
  23410. p->infinity = sp_256_iszero_8(p->x) &
  23411. sp_256_iszero_8(p->y);
  23412. q->infinity = sp_256_iszero_8(q->x) &
  23413. sp_256_iszero_8(q->y);
  23414. sp_256_proj_point_add_8(p, p, q, tmp);
  23415. }
  23416. if (err == MP_OKAY) {
  23417. err = sp_256_to_mp(p->x, rX);
  23418. }
  23419. if (err == MP_OKAY) {
  23420. err = sp_256_to_mp(p->y, rY);
  23421. }
  23422. if (err == MP_OKAY) {
  23423. err = sp_256_to_mp(p->z, rZ);
  23424. }
  23425. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23426. if (tmp != NULL)
  23427. XFREE(tmp, NULL, DYNAMIC_TYPE_ECC);
  23428. if (p != NULL)
  23429. XFREE(p, NULL, DYNAMIC_TYPE_ECC);
  23430. #endif
  23431. return err;
  23432. }
  23433. /* Double a projective EC point.
  23434. * (pX, pY, pZ) + (pX, pY, pZ) = (rX, rY, rZ)
  23435. *
  23436. * pX EC point's X ordinate.
  23437. * pY EC point's Y ordinate.
  23438. * pZ EC point's Z ordinate.
  23439. * rX Resultant EC point's X ordinate.
  23440. * rY Resultant EC point's Y ordinate.
  23441. * rZ Resultant EC point's Z ordinate.
  23442. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  23443. */
  23444. int sp_ecc_proj_dbl_point_256(mp_int* pX, mp_int* pY, mp_int* pZ,
  23445. mp_int* rX, mp_int* rY, mp_int* rZ)
  23446. {
  23447. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23448. sp_digit* tmp = NULL;
  23449. sp_point_256* p = NULL;
  23450. #else
  23451. sp_digit tmp[2 * 8 * 2];
  23452. sp_point_256 p[1];
  23453. #endif
  23454. int err = MP_OKAY;
  23455. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23456. if (err == MP_OKAY) {
  23457. p = (sp_point_256*)XMALLOC(sizeof(sp_point_256), NULL,
  23458. DYNAMIC_TYPE_ECC);
  23459. if (p == NULL)
  23460. err = MEMORY_E;
  23461. }
  23462. if (err == MP_OKAY) {
  23463. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 8 * 2, NULL,
  23464. DYNAMIC_TYPE_ECC);
  23465. if (tmp == NULL)
  23466. err = MEMORY_E;
  23467. }
  23468. #endif
  23469. if (err == MP_OKAY) {
  23470. sp_256_from_mp(p->x, 8, pX);
  23471. sp_256_from_mp(p->y, 8, pY);
  23472. sp_256_from_mp(p->z, 8, pZ);
  23473. p->infinity = sp_256_iszero_8(p->x) &
  23474. sp_256_iszero_8(p->y);
  23475. sp_256_proj_point_dbl_8(p, p, tmp);
  23476. }
  23477. if (err == MP_OKAY) {
  23478. err = sp_256_to_mp(p->x, rX);
  23479. }
  23480. if (err == MP_OKAY) {
  23481. err = sp_256_to_mp(p->y, rY);
  23482. }
  23483. if (err == MP_OKAY) {
  23484. err = sp_256_to_mp(p->z, rZ);
  23485. }
  23486. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23487. if (tmp != NULL)
  23488. XFREE(tmp, NULL, DYNAMIC_TYPE_ECC);
  23489. if (p != NULL)
  23490. XFREE(p, NULL, DYNAMIC_TYPE_ECC);
  23491. #endif
  23492. return err;
  23493. }
  23494. /* Map a projective EC point to affine in place.
  23495. * pZ will be one.
  23496. *
  23497. * pX EC point's X ordinate.
  23498. * pY EC point's Y ordinate.
  23499. * pZ EC point's Z ordinate.
  23500. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  23501. */
  23502. int sp_ecc_map_256(mp_int* pX, mp_int* pY, mp_int* pZ)
  23503. {
  23504. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23505. sp_digit* tmp = NULL;
  23506. sp_point_256* p = NULL;
  23507. #else
  23508. sp_digit tmp[2 * 8 * 4];
  23509. sp_point_256 p[1];
  23510. #endif
  23511. int err = MP_OKAY;
  23512. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23513. if (err == MP_OKAY) {
  23514. p = (sp_point_256*)XMALLOC(sizeof(sp_point_256), NULL,
  23515. DYNAMIC_TYPE_ECC);
  23516. if (p == NULL)
  23517. err = MEMORY_E;
  23518. }
  23519. if (err == MP_OKAY) {
  23520. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 8 * 4, NULL,
  23521. DYNAMIC_TYPE_ECC);
  23522. if (tmp == NULL)
  23523. err = MEMORY_E;
  23524. }
  23525. #endif
  23526. if (err == MP_OKAY) {
  23527. sp_256_from_mp(p->x, 8, pX);
  23528. sp_256_from_mp(p->y, 8, pY);
  23529. sp_256_from_mp(p->z, 8, pZ);
  23530. p->infinity = sp_256_iszero_8(p->x) &
  23531. sp_256_iszero_8(p->y);
  23532. sp_256_map_8(p, p, tmp);
  23533. }
  23534. if (err == MP_OKAY) {
  23535. err = sp_256_to_mp(p->x, pX);
  23536. }
  23537. if (err == MP_OKAY) {
  23538. err = sp_256_to_mp(p->y, pY);
  23539. }
  23540. if (err == MP_OKAY) {
  23541. err = sp_256_to_mp(p->z, pZ);
  23542. }
  23543. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23544. if (tmp != NULL)
  23545. XFREE(tmp, NULL, DYNAMIC_TYPE_ECC);
  23546. if (p != NULL)
  23547. XFREE(p, NULL, DYNAMIC_TYPE_ECC);
  23548. #endif
  23549. return err;
  23550. }
  23551. #endif /* WOLFSSL_PUBLIC_ECC_ADD_DBL */
  23552. #ifdef HAVE_COMP_KEY
  23553. /* Find the square root of a number mod the prime of the curve.
  23554. *
  23555. * y The number to operate on and the result.
  23556. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  23557. */
  23558. static int sp_256_mont_sqrt_8(sp_digit* y)
  23559. {
  23560. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23561. sp_digit* t1 = NULL;
  23562. #else
  23563. sp_digit t1[4 * 8];
  23564. #endif
  23565. sp_digit* t2 = NULL;
  23566. int err = MP_OKAY;
  23567. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23568. t1 = (sp_digit*)XMALLOC(sizeof(sp_digit) * 4 * 8, NULL, DYNAMIC_TYPE_ECC);
  23569. if (t1 == NULL) {
  23570. err = MEMORY_E;
  23571. }
  23572. #endif
  23573. if (err == MP_OKAY) {
  23574. t2 = t1 + 2 * 8;
  23575. {
  23576. /* t2 = y ^ 0x2 */
  23577. sp_256_mont_sqr_8(t2, y, p256_mod, p256_mp_mod);
  23578. /* t1 = y ^ 0x3 */
  23579. sp_256_mont_mul_8(t1, t2, y, p256_mod, p256_mp_mod);
  23580. /* t2 = y ^ 0xc */
  23581. sp_256_mont_sqr_n_8(t2, t1, 2, p256_mod, p256_mp_mod);
  23582. /* t1 = y ^ 0xf */
  23583. sp_256_mont_mul_8(t1, t1, t2, p256_mod, p256_mp_mod);
  23584. /* t2 = y ^ 0xf0 */
  23585. sp_256_mont_sqr_n_8(t2, t1, 4, p256_mod, p256_mp_mod);
  23586. /* t1 = y ^ 0xff */
  23587. sp_256_mont_mul_8(t1, t1, t2, p256_mod, p256_mp_mod);
  23588. /* t2 = y ^ 0xff00 */
  23589. sp_256_mont_sqr_n_8(t2, t1, 8, p256_mod, p256_mp_mod);
  23590. /* t1 = y ^ 0xffff */
  23591. sp_256_mont_mul_8(t1, t1, t2, p256_mod, p256_mp_mod);
  23592. /* t2 = y ^ 0xffff0000 */
  23593. sp_256_mont_sqr_n_8(t2, t1, 16, p256_mod, p256_mp_mod);
  23594. /* t1 = y ^ 0xffffffff */
  23595. sp_256_mont_mul_8(t1, t1, t2, p256_mod, p256_mp_mod);
  23596. /* t1 = y ^ 0xffffffff00000000 */
  23597. sp_256_mont_sqr_n_8(t1, t1, 32, p256_mod, p256_mp_mod);
  23598. /* t1 = y ^ 0xffffffff00000001 */
  23599. sp_256_mont_mul_8(t1, t1, y, p256_mod, p256_mp_mod);
  23600. /* t1 = y ^ 0xffffffff00000001000000000000000000000000 */
  23601. sp_256_mont_sqr_n_8(t1, t1, 96, p256_mod, p256_mp_mod);
  23602. /* t1 = y ^ 0xffffffff00000001000000000000000000000001 */
  23603. sp_256_mont_mul_8(t1, t1, y, p256_mod, p256_mp_mod);
  23604. sp_256_mont_sqr_n_8(y, t1, 94, p256_mod, p256_mp_mod);
  23605. }
  23606. }
  23607. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23608. if (t1 != NULL)
  23609. XFREE(t1, NULL, DYNAMIC_TYPE_ECC);
  23610. #endif
  23611. return err;
  23612. }
  23613. /* Uncompress the point given the X ordinate.
  23614. *
  23615. * xm X ordinate.
  23616. * odd Whether the Y ordinate is odd.
  23617. * ym Calculated Y ordinate.
  23618. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  23619. */
  23620. int sp_ecc_uncompress_256(mp_int* xm, int odd, mp_int* ym)
  23621. {
  23622. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23623. sp_digit* x = NULL;
  23624. #else
  23625. sp_digit x[4 * 8];
  23626. #endif
  23627. sp_digit* y = NULL;
  23628. int err = MP_OKAY;
  23629. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23630. x = (sp_digit*)XMALLOC(sizeof(sp_digit) * 4 * 8, NULL, DYNAMIC_TYPE_ECC);
  23631. if (x == NULL)
  23632. err = MEMORY_E;
  23633. #endif
  23634. if (err == MP_OKAY) {
  23635. y = x + 2 * 8;
  23636. sp_256_from_mp(x, 8, xm);
  23637. err = sp_256_mod_mul_norm_8(x, x, p256_mod);
  23638. }
  23639. if (err == MP_OKAY) {
  23640. /* y = x^3 */
  23641. {
  23642. sp_256_mont_sqr_8(y, x, p256_mod, p256_mp_mod);
  23643. sp_256_mont_mul_8(y, y, x, p256_mod, p256_mp_mod);
  23644. }
  23645. /* y = x^3 - 3x */
  23646. sp_256_mont_sub_8(y, y, x, p256_mod);
  23647. sp_256_mont_sub_8(y, y, x, p256_mod);
  23648. sp_256_mont_sub_8(y, y, x, p256_mod);
  23649. /* y = x^3 - 3x + b */
  23650. err = sp_256_mod_mul_norm_8(x, p256_b, p256_mod);
  23651. }
  23652. if (err == MP_OKAY) {
  23653. sp_256_mont_add_8(y, y, x, p256_mod);
  23654. /* y = sqrt(x^3 - 3x + b) */
  23655. err = sp_256_mont_sqrt_8(y);
  23656. }
  23657. if (err == MP_OKAY) {
  23658. XMEMSET(y + 8, 0, 8U * sizeof(sp_digit));
  23659. sp_256_mont_reduce_8(y, p256_mod, p256_mp_mod);
  23660. if ((((word32)y[0] ^ (word32)odd) & 1U) != 0U) {
  23661. sp_256_mont_sub_8(y, p256_mod, y, p256_mod);
  23662. }
  23663. err = sp_256_to_mp(y, ym);
  23664. }
  23665. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  23666. if (x != NULL)
  23667. XFREE(x, NULL, DYNAMIC_TYPE_ECC);
  23668. #endif
  23669. return err;
  23670. }
  23671. #endif
  23672. #endif /* !WOLFSSL_SP_NO_256 */
  23673. #ifdef WOLFSSL_SP_384
  23674. /* Point structure to use. */
  23675. typedef struct sp_point_384 {
  23676. /* X ordinate of point. */
  23677. sp_digit x[2 * 12];
  23678. /* Y ordinate of point. */
  23679. sp_digit y[2 * 12];
  23680. /* Z ordinate of point. */
  23681. sp_digit z[2 * 12];
  23682. /* Indicates point is at infinity. */
  23683. int infinity;
  23684. } sp_point_384;
  23685. /* The modulus (prime) of the curve P384. */
  23686. static const sp_digit p384_mod[12] = {
  23687. 0xffffffff,0x00000000,0x00000000,0xffffffff,0xfffffffe,0xffffffff,
  23688. 0xffffffff,0xffffffff,0xffffffff,0xffffffff,0xffffffff,0xffffffff
  23689. };
  23690. /* The Montgomery normalizer for modulus of the curve P384. */
  23691. static const sp_digit p384_norm_mod[12] = {
  23692. 0x00000001,0xffffffff,0xffffffff,0x00000000,0x00000001,0x00000000,
  23693. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000
  23694. };
  23695. /* The Montgomery multiplier for modulus of the curve P384. */
  23696. static sp_digit p384_mp_mod = 0x00000001;
  23697. #if defined(WOLFSSL_VALIDATE_ECC_KEYGEN) || defined(HAVE_ECC_SIGN) || \
  23698. defined(HAVE_ECC_VERIFY)
  23699. /* The order of the curve P384. */
  23700. static const sp_digit p384_order[12] = {
  23701. 0xccc52973,0xecec196a,0x48b0a77a,0x581a0db2,0xf4372ddf,0xc7634d81,
  23702. 0xffffffff,0xffffffff,0xffffffff,0xffffffff,0xffffffff,0xffffffff
  23703. };
  23704. #endif
  23705. /* The order of the curve P384 minus 2. */
  23706. static const sp_digit p384_order2[12] = {
  23707. 0xccc52971,0xecec196a,0x48b0a77a,0x581a0db2,0xf4372ddf,0xc7634d81,
  23708. 0xffffffff,0xffffffff,0xffffffff,0xffffffff,0xffffffff,0xffffffff
  23709. };
  23710. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  23711. /* The Montgomery normalizer for order of the curve P384. */
  23712. static const sp_digit p384_norm_order[12] = {
  23713. 0x333ad68d,0x1313e695,0xb74f5885,0xa7e5f24d,0x0bc8d220,0x389cb27e,
  23714. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000
  23715. };
  23716. #endif
  23717. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  23718. /* The Montgomery multiplier for order of the curve P384. */
  23719. static sp_digit p384_mp_order = 0xe88fdc45;
  23720. #endif
  23721. /* The base point of curve P384. */
  23722. static const sp_point_384 p384_base = {
  23723. /* X ordinate */
  23724. {
  23725. 0x72760ab7,0x3a545e38,0xbf55296c,0x5502f25d,0x82542a38,0x59f741e0,
  23726. 0x8ba79b98,0x6e1d3b62,0xf320ad74,0x8eb1c71e,0xbe8b0537,0xaa87ca22,
  23727. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  23728. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  23729. (sp_digit)0, (sp_digit)0
  23730. },
  23731. /* Y ordinate */
  23732. {
  23733. 0x90ea0e5f,0x7a431d7c,0x1d7e819d,0x0a60b1ce,0xb5f0b8c0,0xe9da3113,
  23734. 0x289a147c,0xf8f41dbd,0x9292dc29,0x5d9e98bf,0x96262c6f,0x3617de4a,
  23735. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  23736. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  23737. (sp_digit)0, (sp_digit)0
  23738. },
  23739. /* Z ordinate */
  23740. {
  23741. 0x00000001,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  23742. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  23743. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  23744. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  23745. (sp_digit)0, (sp_digit)0
  23746. },
  23747. /* infinity */
  23748. 0
  23749. };
  23750. #if defined(HAVE_ECC_CHECK_KEY) || defined(HAVE_COMP_KEY)
  23751. static const sp_digit p384_b[12] = {
  23752. 0xd3ec2aef,0x2a85c8ed,0x8a2ed19d,0xc656398d,0x5013875a,0x0314088f,
  23753. 0xfe814112,0x181d9c6e,0xe3f82d19,0x988e056b,0xe23ee7e4,0xb3312fa7
  23754. };
  23755. #endif
  23756. /* Multiply a and b into r. (r = a * b)
  23757. *
   * The product is produced one result word at a time. For the result word
   * at byte offset k the products a[i] * b[k - i] are summed into a
   * three-register accumulator (r3 low, r4 middle, r5 high); the low
   * register is then stored and the accumulator moved down one word.
   * The product is built in a local buffer and copied to r at the end.
   *
  23758. * r A single precision integer. Receives 2 * 12 words.
  23759. * a A single precision integer. 12 words are read.
  23760. * b A single precision integer. 12 words are read.
  23761. */
  23762. SP_NOINLINE static void sp_384_mul_12(sp_digit* r, const sp_digit* a,
  23763. const sp_digit* b)
  23764. {
  23765. sp_digit tmp_arr[12 * 2];
  23766. sp_digit* tmp = tmp_arr;
  23767. __asm__ __volatile__ (
  23768. "mov r3, #0\n\t" /* r3 = low word of the accumulator */
  23769. "mov r4, #0\n\t" /* r4 = middle word of the accumulator */
  23770. "mov r9, r3\n\t" /* r9 = byte offset of the current result word (0) */
  23771. "mov r12, %[r]\n\t" /* keep the output pointer; %[r] doubles as zero below */
  23772. "mov r10, %[a]\n\t" /* keep the base of a */
  23773. "mov r11, %[b]\n\t" /* keep the base of b */
  23774. "mov r6, #48\n\t"
  23775. "add r6, r6, r10\n\t"
  23776. "mov r14, r6\n\t" /* r14 = a + 48 bytes, one past the last word of a */
  23777. "\n1:\n\t" /* outer loop: one pass per result word */
  23778. "mov %[r], #0\n\t" /* constant zero for the carry-only add */
  23779. "mov r5, #0\n\t" /* clear the high word of the accumulator */
  23780. "mov r6, #44\n\t"
  23781. "mov %[a], r9\n\t"
  23782. "subs %[a], %[a], r6\n\t" /* offset - 44; borrows when offset < 44 */
  23783. "sbc r6, r6, r6\n\t" /* r6 = 0 without borrow, all ones with borrow */
  23784. "mvn r6, r6\n\t"
  23785. "and %[a], %[a], r6\n\t" /* %[a] = offset - 44 when that is >= 0, else 0 */
  23786. "mov %[b], r9\n\t"
  23787. "sub %[b], %[b], %[a]\n\t" /* %[b] = offset minus the starting offset into a */
  23788. "add %[a], %[a], r10\n\t"
  23789. "add %[b], %[b], r11\n\t" /* both offsets are now pointers */
  23790. "\n2:\n\t" /* inner loop: one partial product per pass */
  23791. /* Multiply Start */
  23792. "ldr r6, [%[a]]\n\t"
  23793. "ldr r8, [%[b]]\n\t"
  23794. "umull r6, r8, r6, r8\n\t"
  23795. "adds r3, r3, r6\n\t"
  23796. "adcs r4, r4, r8\n\t"
  23797. "adc r5, r5, %[r]\n\t"
  23798. /* Multiply Done */
  23799. "add %[a], %[a], #4\n\t" /* next word of a */
  23800. "sub %[b], %[b], #4\n\t" /* previous word of b */
  23801. "cmp %[a], r14\n\t" /* leave the inner loop at the end of a */
  23802. #ifdef __GNUC__
  23803. "beq 3f\n\t"
  23804. #else
  23805. "beq.n 3f\n\t"
  23806. #endif /* __GNUC__ */
  23807. "mov r6, r9\n\t"
  23808. "add r6, r6, r10\n\t"
  23809. "cmp %[a], r6\n\t" /* continue while the a pointer is <= a + offset */
  23810. #ifdef __GNUC__
  23811. "ble 2b\n\t"
  23812. #else
  23813. "ble.n 2b\n\t"
  23814. #endif /* __GNUC__ */
  23815. "\n3:\n\t" /* result word complete */
  23816. "mov %[r], r12\n\t" /* output pointer back into %[r] */
  23817. "mov r8, r9\n\t"
  23818. "str r3, [%[r], r8]\n\t" /* store the finished result word */
  23819. "mov r3, r4\n\t"
  23820. "mov r4, r5\n\t" /* move the accumulator down one word */
  23821. "add r8, r8, #4\n\t"
  23822. "mov r9, r8\n\t"
  23823. "mov r6, #88\n\t"
  23824. "cmp r8, r6\n\t" /* repeat for byte offsets up to and including 88 */
  23825. #ifdef __GNUC__
  23826. "ble 1b\n\t"
  23827. #else
  23828. "ble.n 1b\n\t"
  23829. #endif /* __GNUC__ */
  23830. "str r3, [%[r], r8]\n\t" /* top result word, at byte offset 92 */
  23831. "mov %[a], r10\n\t"
  23832. "mov %[b], r11\n\t" /* put the original values back in the input operands */
  23833. :
  23834. : [r] "r" (tmp), [a] "r" (a), [b] "r" (b)
  23835. : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  23836. );
  23837. XMEMCPY(r, tmp_arr, sizeof(tmp_arr)); /* copy the whole product out to r */
  23838. }
  23839. /* Square a and put result in r. (r = a * a)
  23840. *
  23841. * r A single precision integer.
  23842. * a A single precision integer.
  23843. */
  23844. SP_NOINLINE static void sp_384_sqr_12(sp_digit* r, const sp_digit* a)
  23845. {
  23846. __asm__ __volatile__ (
  23847. "mov r3, #0\n\t"
  23848. "mov r4, #0\n\t"
  23849. "mov r5, #0\n\t"
  23850. "mov r9, r3\n\t"
  23851. "mov r12, %[r]\n\t"
  23852. "mov r6, #96\n\t"
  23853. "neg r6, r6\n\t"
  23854. "add sp, sp, r6\n\t"
  23855. "mov r11, sp\n\t"
  23856. "mov r10, %[a]\n\t"
  23857. "\n1:\n\t"
  23858. "mov %[r], #0\n\t"
  23859. "mov r6, #44\n\t"
  23860. "mov %[a], r9\n\t"
  23861. "subs %[a], %[a], r6\n\t"
  23862. "sbc r6, r6, r6\n\t"
  23863. "mvn r6, r6\n\t"
  23864. "and %[a], %[a], r6\n\t"
  23865. "mov r2, r9\n\t"
  23866. "sub r2, r2, %[a]\n\t"
  23867. "add %[a], %[a], r10\n\t"
  23868. "add r2, r2, r10\n\t"
  23869. "\n2:\n\t"
  23870. "cmp r2, %[a]\n\t"
  23871. #ifdef __GNUC__
  23872. "beq 4f\n\t"
  23873. #else
  23874. "beq.n 4f\n\t"
  23875. #endif /* __GNUC__ */
  23876. /* Multiply * 2: Start */
  23877. "ldr r6, [%[a]]\n\t"
  23878. "ldr r8, [r2]\n\t"
  23879. "umull r6, r8, r6, r8\n\t"
  23880. "adds r3, r3, r6\n\t"
  23881. "adcs r4, r4, r8\n\t"
  23882. "adc r5, r5, %[r]\n\t"
  23883. "adds r3, r3, r6\n\t"
  23884. "adcs r4, r4, r8\n\t"
  23885. "adc r5, r5, %[r]\n\t"
  23886. /* Multiply * 2: Done */
  23887. #ifdef __GNUC__
  23888. "bal 5f\n\t"
  23889. #else
  23890. "bal.n 5f\n\t"
  23891. #endif /* __GNUC__ */
  23892. "\n4:\n\t"
  23893. /* Square: Start */
  23894. "ldr r6, [%[a]]\n\t"
  23895. "umull r6, r8, r6, r6\n\t"
  23896. "adds r3, r3, r6\n\t"
  23897. "adcs r4, r4, r8\n\t"
  23898. "adc r5, r5, %[r]\n\t"
  23899. /* Square: Done */
  23900. "\n5:\n\t"
  23901. "add %[a], %[a], #4\n\t"
  23902. "sub r2, r2, #4\n\t"
  23903. "mov r6, #48\n\t"
  23904. "add r6, r6, r10\n\t"
  23905. "cmp %[a], r6\n\t"
  23906. #ifdef __GNUC__
  23907. "beq 3f\n\t"
  23908. #else
  23909. "beq.n 3f\n\t"
  23910. #endif /* __GNUC__ */
  23911. "cmp %[a], r2\n\t"
  23912. #ifdef __GNUC__
  23913. "bgt 3f\n\t"
  23914. #else
  23915. "bgt.n 3f\n\t"
  23916. #endif /* __GNUC__ */
  23917. "mov r8, r9\n\t"
  23918. "add r8, r8, r10\n\t"
  23919. "cmp %[a], r8\n\t"
  23920. #ifdef __GNUC__
  23921. "ble 2b\n\t"
  23922. #else
  23923. "ble.n 2b\n\t"
  23924. #endif /* __GNUC__ */
  23925. "\n3:\n\t"
  23926. "mov %[r], r11\n\t"
  23927. "mov r8, r9\n\t"
  23928. "str r3, [%[r], r8]\n\t"
  23929. "mov r3, r4\n\t"
  23930. "mov r4, r5\n\t"
  23931. "mov r5, #0\n\t"
  23932. "add r8, r8, #4\n\t"
  23933. "mov r9, r8\n\t"
  23934. "mov r6, #88\n\t"
  23935. "cmp r8, r6\n\t"
  23936. #ifdef __GNUC__
  23937. "ble 1b\n\t"
  23938. #else
  23939. "ble.n 1b\n\t"
  23940. #endif /* __GNUC__ */
  23941. "mov %[a], r10\n\t"
  23942. "str r3, [%[r], r8]\n\t"
  23943. "mov %[r], r12\n\t"
  23944. "mov %[a], r11\n\t"
  23945. "mov r3, #92\n\t"
  23946. "\n4:\n\t"
  23947. "ldr r6, [%[a], r3]\n\t"
  23948. "str r6, [%[r], r3]\n\t"
  23949. "subs r3, r3, #4\n\t"
  23950. #ifdef __GNUC__
  23951. "bge 4b\n\t"
  23952. #else
  23953. "bge.n 4b\n\t"
  23954. #endif /* __GNUC__ */
  23955. "mov r6, #96\n\t"
  23956. "add sp, sp, r6\n\t"
  23957. :
  23958. : [r] "r" (r), [a] "r" (a)
  23959. : "memory", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12"
  23960. );
  23961. }
  23962. #ifdef WOLFSSL_SP_SMALL
  23963. /* Add b to a into r. (r = a + b)
  23964. *
  23965. * r A single precision integer.
  23966. * a A single precision integer.
  23967. * b A single precision integer.
  23968. */
  23969. SP_NOINLINE static sp_digit sp_384_add_12(sp_digit* r, const sp_digit* a,
  23970. const sp_digit* b)
  23971. {
  23972. sp_digit c = 0;
  23973. __asm__ __volatile__ (
  23974. "mov r6, %[a]\n\t"
  23975. "mov r8, #0\n\t"
  23976. "add r6, r6, #48\n\t"
  23977. "sub r8, r8, #1\n\t"
  23978. "\n1:\n\t"
  23979. "adds %[c], %[c], r8\n\t"
  23980. "ldr r4, [%[a]]\n\t"
  23981. "ldr r5, [%[b]]\n\t"
  23982. "adcs r4, r4, r5\n\t"
  23983. "str r4, [%[r]]\n\t"
  23984. "mov %[c], #0\n\t"
  23985. "adc %[c], %[c], %[c]\n\t"
  23986. "add %[a], %[a], #4\n\t"
  23987. "add %[b], %[b], #4\n\t"
  23988. "add %[r], %[r], #4\n\t"
  23989. "cmp %[a], r6\n\t"
  23990. #ifdef __GNUC__
  23991. "bne 1b\n\t"
  23992. #else
  23993. "bne.n 1b\n\t"
  23994. #endif /* __GNUC__ */
  23995. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  23996. :
  23997. : "memory", "r4", "r5", "r6", "r8"
  23998. );
  23999. return c;
  24000. }
  24001. #else
  24002. /* Add b to a into r. (r = a + b)
  24003. *
  24004. * r A single precision integer.
  24005. * a A single precision integer.
  24006. * b A single precision integer.
  24007. */
  24008. SP_NOINLINE static sp_digit sp_384_add_12(sp_digit* r, const sp_digit* a,
  24009. const sp_digit* b)
  24010. {
  24011. sp_digit c = 0;
  24012. __asm__ __volatile__ (
  24013. "ldm %[a]!, {r4, r5}\n\t"
  24014. "ldm %[b]!, {r6, r8}\n\t"
  24015. "adds r4, r4, r6\n\t"
  24016. "adcs r5, r5, r8\n\t"
  24017. "stm %[r]!, {r4, r5}\n\t"
  24018. "ldm %[a]!, {r4, r5}\n\t"
  24019. "ldm %[b]!, {r6, r8}\n\t"
  24020. "adcs r4, r4, r6\n\t"
  24021. "adcs r5, r5, r8\n\t"
  24022. "stm %[r]!, {r4, r5}\n\t"
  24023. "ldm %[a]!, {r4, r5}\n\t"
  24024. "ldm %[b]!, {r6, r8}\n\t"
  24025. "adcs r4, r4, r6\n\t"
  24026. "adcs r5, r5, r8\n\t"
  24027. "stm %[r]!, {r4, r5}\n\t"
  24028. "ldm %[a]!, {r4, r5}\n\t"
  24029. "ldm %[b]!, {r6, r8}\n\t"
  24030. "adcs r4, r4, r6\n\t"
  24031. "adcs r5, r5, r8\n\t"
  24032. "stm %[r]!, {r4, r5}\n\t"
  24033. "ldm %[a]!, {r4, r5}\n\t"
  24034. "ldm %[b]!, {r6, r8}\n\t"
  24035. "adcs r4, r4, r6\n\t"
  24036. "adcs r5, r5, r8\n\t"
  24037. "stm %[r]!, {r4, r5}\n\t"
  24038. "ldm %[a]!, {r4, r5}\n\t"
  24039. "ldm %[b]!, {r6, r8}\n\t"
  24040. "adcs r4, r4, r6\n\t"
  24041. "adcs r5, r5, r8\n\t"
  24042. "stm %[r]!, {r4, r5}\n\t"
  24043. "mov %[c], #0\n\t"
  24044. "adc %[c], %[c], %[c]\n\t"
  24045. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  24046. :
  24047. : "memory", "r4", "r5", "r6", "r8"
  24048. );
  24049. return c;
  24050. }
  24051. #endif /* WOLFSSL_SP_SMALL */
  24052. #ifdef WOLFSSL_SP_SMALL
  24053. /* Sub b from a into r. (r = a - b)
  24054. *
  24055. * r A single precision integer.
  24056. * a A single precision integer.
  24057. * b A single precision integer.
  24058. */
  24059. SP_NOINLINE static sp_digit sp_384_sub_12(sp_digit* r, const sp_digit* a,
  24060. const sp_digit* b)
  24061. {
  24062. sp_digit c = 0;
  24063. __asm__ __volatile__ (
  24064. "mov r6, %[a]\n\t"
  24065. "add r6, r6, #48\n\t"
  24066. "\n1:\n\t"
  24067. "mov r5, #0\n\t"
  24068. "subs r5, r5, %[c]\n\t"
  24069. "ldr r4, [%[a]]\n\t"
  24070. "ldr r5, [%[b]]\n\t"
  24071. "sbcs r4, r4, r5\n\t"
  24072. "str r4, [%[r]]\n\t"
  24073. "sbc %[c], %[c], %[c]\n\t"
  24074. "add %[a], %[a], #4\n\t"
  24075. "add %[b], %[b], #4\n\t"
  24076. "add %[r], %[r], #4\n\t"
  24077. "cmp %[a], r6\n\t"
  24078. #ifdef __GNUC__
  24079. "bne 1b\n\t"
  24080. #else
  24081. "bne.n 1b\n\t"
  24082. #endif /* __GNUC__ */
  24083. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  24084. :
  24085. : "memory", "r4", "r5", "r6"
  24086. );
  24087. return c;
  24088. }
  24089. #else
  24090. /* Sub b from a into r. (r = a - b)
  24091. *
  24092. * r A single precision integer.
  24093. * a A single precision integer.
  24094. * b A single precision integer.
  24095. */
  24096. SP_NOINLINE static sp_digit sp_384_sub_12(sp_digit* r, const sp_digit* a,
  24097. const sp_digit* b)
  24098. {
  24099. sp_digit c = 0;
  24100. __asm__ __volatile__ (
  24101. "ldm %[a]!, {r4, r5}\n\t"
  24102. "ldm %[b]!, {r6, r8}\n\t"
  24103. "subs r4, r4, r6\n\t"
  24104. "sbcs r5, r5, r8\n\t"
  24105. "stm %[r]!, {r4, r5}\n\t"
  24106. "ldm %[a]!, {r4, r5}\n\t"
  24107. "ldm %[b]!, {r6, r8}\n\t"
  24108. "sbcs r4, r4, r6\n\t"
  24109. "sbcs r5, r5, r8\n\t"
  24110. "stm %[r]!, {r4, r5}\n\t"
  24111. "ldm %[a]!, {r4, r5}\n\t"
  24112. "ldm %[b]!, {r6, r8}\n\t"
  24113. "sbcs r4, r4, r6\n\t"
  24114. "sbcs r5, r5, r8\n\t"
  24115. "stm %[r]!, {r4, r5}\n\t"
  24116. "ldm %[a]!, {r4, r5}\n\t"
  24117. "ldm %[b]!, {r6, r8}\n\t"
  24118. "sbcs r4, r4, r6\n\t"
  24119. "sbcs r5, r5, r8\n\t"
  24120. "stm %[r]!, {r4, r5}\n\t"
  24121. "ldm %[a]!, {r4, r5}\n\t"
  24122. "ldm %[b]!, {r6, r8}\n\t"
  24123. "sbcs r4, r4, r6\n\t"
  24124. "sbcs r5, r5, r8\n\t"
  24125. "stm %[r]!, {r4, r5}\n\t"
  24126. "ldm %[a]!, {r4, r5}\n\t"
  24127. "ldm %[b]!, {r6, r8}\n\t"
  24128. "sbcs r4, r4, r6\n\t"
  24129. "sbcs r5, r5, r8\n\t"
  24130. "stm %[r]!, {r4, r5}\n\t"
  24131. "sbc %[c], %[c], %[c]\n\t"
  24132. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  24133. :
  24134. : "memory", "r4", "r5", "r6", "r8"
  24135. );
  24136. return c;
  24137. }
  24138. #endif /* WOLFSSL_SP_SMALL */
  24139. /* Multiply a number by Montgomery normalizer mod modulus (prime).
  24140. *
  24141. * r The resulting Montgomery form number.
  24142. * a The number to convert.
  24143. * m The modulus (prime).
  24144. * returns MEMORY_E when memory allocation fails and MP_OKAY otherwise.
  24145. */
  24146. static int sp_384_mod_mul_norm_12(sp_digit* r, const sp_digit* a, const sp_digit* m)
  24147. {
  24148. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  24149. int64_t* t = NULL;
  24150. #else
  24151. int64_t t[12];
  24152. #endif
  24153. int64_t o;
  24154. int err = MP_OKAY;
  24155. (void)m;
  24156. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  24157. t = (int64_t*)XMALLOC(sizeof(int64_t) * 12, NULL, DYNAMIC_TYPE_ECC);
  24158. if (t == NULL) {
  24159. err = MEMORY_E;
  24160. }
  24161. #endif
  24162. if (err == MP_OKAY) {
  24163. /* 1 0 0 0 0 0 0 0 1 1 0 -1 */
  24164. t[0] = 0 + (int64_t)a[0] + (int64_t)a[8] + (int64_t)a[9] - (int64_t)a[11];
  24165. /* -1 1 0 0 0 0 0 0 -1 0 1 1 */
  24166. t[1] = 0 - (int64_t)a[0] + (int64_t)a[1] - (int64_t)a[8] + (int64_t)a[10] + (int64_t)a[11];
  24167. /* 0 -1 1 0 0 0 0 0 0 -1 0 1 */
  24168. t[2] = 0 - (int64_t)a[1] + (int64_t)a[2] - (int64_t)a[9] + (int64_t)a[11];
  24169. /* 1 0 -1 1 0 0 0 0 1 1 -1 -1 */
  24170. t[3] = 0 + (int64_t)a[0] - (int64_t)a[2] + (int64_t)a[3] + (int64_t)a[8] + (int64_t)a[9] - (int64_t)a[10] - (int64_t)a[11];
  24171. /* 1 1 0 -1 1 0 0 0 1 2 1 -2 */
  24172. t[4] = 0 + (int64_t)a[0] + (int64_t)a[1] - (int64_t)a[3] + (int64_t)a[4] + (int64_t)a[8] + 2 * (int64_t)a[9] + (int64_t)a[10] - 2 * (int64_t)a[11];
  24173. /* 0 1 1 0 -1 1 0 0 0 1 2 1 */
  24174. t[5] = 0 + (int64_t)a[1] + (int64_t)a[2] - (int64_t)a[4] + (int64_t)a[5] + (int64_t)a[9] + 2 * (int64_t)a[10] + (int64_t)a[11];
  24175. /* 0 0 1 1 0 -1 1 0 0 0 1 2 */
  24176. t[6] = 0 + (int64_t)a[2] + (int64_t)a[3] - (int64_t)a[5] + (int64_t)a[6] + (int64_t)a[10] + 2 * (int64_t)a[11];
  24177. /* 0 0 0 1 1 0 -1 1 0 0 0 1 */
  24178. t[7] = 0 + (int64_t)a[3] + (int64_t)a[4] - (int64_t)a[6] + (int64_t)a[7] + (int64_t)a[11];
  24179. /* 0 0 0 0 1 1 0 -1 1 0 0 0 */
  24180. t[8] = 0 + (int64_t)a[4] + (int64_t)a[5] - (int64_t)a[7] + (int64_t)a[8];
  24181. /* 0 0 0 0 0 1 1 0 -1 1 0 0 */
  24182. t[9] = 0 + (int64_t)a[5] + (int64_t)a[6] - (int64_t)a[8] + (int64_t)a[9];
  24183. /* 0 0 0 0 0 0 1 1 0 -1 1 0 */
  24184. t[10] = 0 + (int64_t)a[6] + (int64_t)a[7] - (int64_t)a[9] + (int64_t)a[10];
  24185. /* 0 0 0 0 0 0 0 1 1 0 -1 1 */
  24186. t[11] = 0 + (int64_t)a[7] + (int64_t)a[8] - (int64_t)a[10] + (int64_t)a[11];
  24187. t[1] += t[0] >> 32; t[0] &= 0xffffffff;
  24188. t[2] += t[1] >> 32; t[1] &= 0xffffffff;
  24189. t[3] += t[2] >> 32; t[2] &= 0xffffffff;
  24190. t[4] += t[3] >> 32; t[3] &= 0xffffffff;
  24191. t[5] += t[4] >> 32; t[4] &= 0xffffffff;
  24192. t[6] += t[5] >> 32; t[5] &= 0xffffffff;
  24193. t[7] += t[6] >> 32; t[6] &= 0xffffffff;
  24194. t[8] += t[7] >> 32; t[7] &= 0xffffffff;
  24195. t[9] += t[8] >> 32; t[8] &= 0xffffffff;
  24196. t[10] += t[9] >> 32; t[9] &= 0xffffffff;
  24197. t[11] += t[10] >> 32; t[10] &= 0xffffffff;
  24198. o = t[11] >> 32; t[11] &= 0xffffffff;
  24199. t[0] += o;
  24200. t[1] -= o;
  24201. t[3] += o;
  24202. t[4] += o;
  24203. t[1] += t[0] >> 32; t[0] &= 0xffffffff;
  24204. t[2] += t[1] >> 32; t[1] &= 0xffffffff;
  24205. t[3] += t[2] >> 32; t[2] &= 0xffffffff;
  24206. t[4] += t[3] >> 32; t[3] &= 0xffffffff;
  24207. t[5] += t[4] >> 32; t[4] &= 0xffffffff;
  24208. t[6] += t[5] >> 32; t[5] &= 0xffffffff;
  24209. t[7] += t[6] >> 32; t[6] &= 0xffffffff;
  24210. t[8] += t[7] >> 32; t[7] &= 0xffffffff;
  24211. t[9] += t[8] >> 32; t[8] &= 0xffffffff;
  24212. t[10] += t[9] >> 32; t[9] &= 0xffffffff;
  24213. t[11] += t[10] >> 32; t[10] &= 0xffffffff;
  24214. r[0] = t[0];
  24215. r[1] = t[1];
  24216. r[2] = t[2];
  24217. r[3] = t[3];
  24218. r[4] = t[4];
  24219. r[5] = t[5];
  24220. r[6] = t[6];
  24221. r[7] = t[7];
  24222. r[8] = t[8];
  24223. r[9] = t[9];
  24224. r[10] = t[10];
  24225. r[11] = t[11];
  24226. }
  24227. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  24228. if (t != NULL)
  24229. XFREE(t, NULL, DYNAMIC_TYPE_ECC);
  24230. #endif
  24231. return err;
  24232. }
  24233. /* Convert an mp_int to an array of sp_digit.
  24234. *
  24235. * r A single precision integer.
  24236. * size Maximum number of bytes to convert
  24237. * a A multi-precision integer.
  24238. */
  24239. static void sp_384_from_mp(sp_digit* r, int size, const mp_int* a)
  24240. {
  24241. #if DIGIT_BIT == 32
  24242. int j;
  24243. XMEMCPY(r, a->dp, sizeof(sp_digit) * a->used);
  24244. for (j = a->used; j < size; j++) {
  24245. r[j] = 0;
  24246. }
  24247. #elif DIGIT_BIT > 32
  24248. int i;
  24249. int j = 0;
  24250. word32 s = 0;
  24251. r[0] = 0;
  24252. for (i = 0; i < a->used && j < size; i++) {
  24253. r[j] |= ((sp_digit)a->dp[i] << s);
  24254. r[j] &= 0xffffffff;
  24255. s = 32U - s;
  24256. if (j + 1 >= size) {
  24257. break;
  24258. }
  24259. /* lint allow cast of mismatch word32 and mp_digit */
  24260. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  24261. while ((s + 32U) <= (word32)DIGIT_BIT) {
  24262. s += 32U;
  24263. r[j] &= 0xffffffff;
  24264. if (j + 1 >= size) {
  24265. break;
  24266. }
  24267. if (s < (word32)DIGIT_BIT) {
  24268. /* lint allow cast of mismatch word32 and mp_digit */
  24269. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  24270. }
  24271. else {
  24272. r[++j] = (sp_digit)0;
  24273. }
  24274. }
  24275. s = (word32)DIGIT_BIT - s;
  24276. }
  24277. for (j++; j < size; j++) {
  24278. r[j] = 0;
  24279. }
  24280. #else
  24281. int i;
  24282. int j = 0;
  24283. int s = 0;
  24284. r[0] = 0;
  24285. for (i = 0; i < a->used && j < size; i++) {
  24286. r[j] |= ((sp_digit)a->dp[i]) << s;
  24287. if (s + DIGIT_BIT >= 32) {
  24288. r[j] &= 0xffffffff;
  24289. if (j + 1 >= size) {
  24290. break;
  24291. }
  24292. s = 32 - s;
  24293. if (s == DIGIT_BIT) {
  24294. r[++j] = 0;
  24295. s = 0;
  24296. }
  24297. else {
  24298. r[++j] = a->dp[i] >> s;
  24299. s = DIGIT_BIT - s;
  24300. }
  24301. }
  24302. else {
  24303. s += DIGIT_BIT;
  24304. }
  24305. }
  24306. for (j++; j < size; j++) {
  24307. r[j] = 0;
  24308. }
  24309. #endif
  24310. }
  24311. /* Convert a point of type ecc_point to type sp_point_384.
  24312. *
  24313. * p Point of type sp_point_384 (result).
  24314. * pm Point of type ecc_point.
  24315. */
  24316. static void sp_384_point_from_ecc_point_12(sp_point_384* p,
  24317. const ecc_point* pm)
  24318. {
  24319. XMEMSET(p->x, 0, sizeof(p->x));
  24320. XMEMSET(p->y, 0, sizeof(p->y));
  24321. XMEMSET(p->z, 0, sizeof(p->z));
  24322. sp_384_from_mp(p->x, 12, pm->x);
  24323. sp_384_from_mp(p->y, 12, pm->y);
  24324. sp_384_from_mp(p->z, 12, pm->z);
  24325. p->infinity = 0;
  24326. }
  24327. /* Convert an array of sp_digit to an mp_int.
  24328. *
  24329. * a A single precision integer.
  24330. * r A multi-precision integer.
  24331. */
  24332. static int sp_384_to_mp(const sp_digit* a, mp_int* r)
  24333. {
  24334. int err;
  24335. err = mp_grow(r, (384 + DIGIT_BIT - 1) / DIGIT_BIT);
  24336. if (err == MP_OKAY) { /*lint !e774 case where err is always MP_OKAY*/
  24337. #if DIGIT_BIT == 32
  24338. XMEMCPY(r->dp, a, sizeof(sp_digit) * 12);
  24339. r->used = 12;
  24340. mp_clamp(r);
  24341. #elif DIGIT_BIT < 32
  24342. int i;
  24343. int j = 0;
  24344. int s = 0;
  24345. r->dp[0] = 0;
  24346. for (i = 0; i < 12; i++) {
  24347. r->dp[j] |= (mp_digit)(a[i] << s);
  24348. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  24349. s = DIGIT_BIT - s;
  24350. r->dp[++j] = (mp_digit)(a[i] >> s);
  24351. while (s + DIGIT_BIT <= 32) {
  24352. s += DIGIT_BIT;
  24353. r->dp[j++] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  24354. if (s == SP_WORD_SIZE) {
  24355. r->dp[j] = 0;
  24356. }
  24357. else {
  24358. r->dp[j] = (mp_digit)(a[i] >> s);
  24359. }
  24360. }
  24361. s = 32 - s;
  24362. }
  24363. r->used = (384 + DIGIT_BIT - 1) / DIGIT_BIT;
  24364. mp_clamp(r);
  24365. #else
  24366. int i;
  24367. int j = 0;
  24368. int s = 0;
  24369. r->dp[0] = 0;
  24370. for (i = 0; i < 12; i++) {
  24371. r->dp[j] |= ((mp_digit)a[i]) << s;
  24372. if (s + 32 >= DIGIT_BIT) {
  24373. #if DIGIT_BIT != 32 && DIGIT_BIT != 64
  24374. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  24375. #endif
  24376. s = DIGIT_BIT - s;
  24377. r->dp[++j] = a[i] >> s;
  24378. s = 32 - s;
  24379. }
  24380. else {
  24381. s += 32;
  24382. }
  24383. }
  24384. r->used = (384 + DIGIT_BIT - 1) / DIGIT_BIT;
  24385. mp_clamp(r);
  24386. #endif
  24387. }
  24388. return err;
  24389. }
  24390. /* Convert a point of type sp_point_384 to type ecc_point.
  24391. *
  24392. * p Point of type sp_point_384.
  24393. * pm Point of type ecc_point (result).
  24394. * returns MEMORY_E when allocation of memory in ecc_point fails otherwise
  24395. * MP_OKAY.
  24396. */
  24397. static int sp_384_point_to_ecc_point_12(const sp_point_384* p, ecc_point* pm)
  24398. {
  24399. int err;
  24400. err = sp_384_to_mp(p->x, pm->x);
  24401. if (err == MP_OKAY) {
  24402. err = sp_384_to_mp(p->y, pm->y);
  24403. }
  24404. if (err == MP_OKAY) {
  24405. err = sp_384_to_mp(p->z, pm->z);
  24406. }
  24407. return err;
  24408. }
  24409. /* Conditionally subtract b from a using the mask m.
  24410. * m is -1 to subtract and 0 when not copying.
  24411. *
  24412. * r A single precision number representing condition subtract result.
  24413. * a A single precision number to subtract from.
  24414. * b A single precision number to subtract.
  24415. * m Mask value to apply.
  24416. */
  24417. SP_NOINLINE static sp_digit sp_384_cond_sub_12(sp_digit* r, const sp_digit* a,
  24418. const sp_digit* b, sp_digit m)
  24419. {
  24420. sp_digit c = 0;
  24421. __asm__ __volatile__ (
  24422. "mov r5, #48\n\t"
  24423. "mov r9, r5\n\t"
  24424. "mov r8, #0\n\t"
  24425. "\n1:\n\t"
  24426. "ldr r6, [%[b], r8]\n\t"
  24427. "and r6, r6, %[m]\n\t"
  24428. "mov r5, #0\n\t"
  24429. "subs r5, r5, %[c]\n\t"
  24430. "ldr r5, [%[a], r8]\n\t"
  24431. "sbcs r5, r5, r6\n\t"
  24432. "sbcs %[c], %[c], %[c]\n\t"
  24433. "str r5, [%[r], r8]\n\t"
  24434. "add r8, r8, #4\n\t"
  24435. "cmp r8, r9\n\t"
  24436. #ifdef __GNUC__
  24437. "blt 1b\n\t"
  24438. #else
  24439. "blt.n 1b\n\t"
  24440. #endif /* __GNUC__ */
  24441. : [c] "+r" (c)
  24442. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  24443. : "memory", "r5", "r6", "r8", "r9"
  24444. );
  24445. return c;
  24446. }
  24447. #define sp_384_mont_reduce_order_12 sp_384_mont_reduce_12
  24448. /* Reduce the number back to 384 bits using Montgomery reduction.
  24449. *
  24450. * a A single precision number to reduce in place.
  24451. * m The single precision number representing the modulus.
  24452. * mp The digit representing the negative inverse of m mod 2^n.
  24453. */
  24454. SP_NOINLINE static void sp_384_mont_reduce_12(sp_digit* a, const sp_digit* m,
  24455. sp_digit mp)
  24456. {
  24457. sp_digit ca = 0;
  24458. __asm__ __volatile__ (
  24459. "mov r9, %[mp]\n\t"
  24460. "mov r12, %[m]\n\t"
  24461. "mov r10, %[a]\n\t"
  24462. "mov r4, #0\n\t"
  24463. "add r11, r10, #48\n\t"
  24464. "\n1:\n\t"
  24465. /* mu = a[i] * mp */
  24466. "mov %[mp], r9\n\t"
  24467. "ldr %[a], [r10]\n\t"
  24468. "mul %[mp], %[mp], %[a]\n\t"
  24469. "mov %[m], r12\n\t"
  24470. "add r14, r10, #40\n\t"
  24471. "\n2:\n\t"
  24472. /* a[i+j] += m[j] * mu */
  24473. "ldr %[a], [r10]\n\t"
  24474. "mov r5, #0\n\t"
  24475. /* Multiply m[j] and mu - Start */
  24476. "ldr r8, [%[m]], #4\n\t"
  24477. "umull r6, r8, %[mp], r8\n\t"
  24478. "adds %[a], %[a], r6\n\t"
  24479. "adc r5, r5, r8\n\t"
  24480. /* Multiply m[j] and mu - Done */
  24481. "adds r4, r4, %[a]\n\t"
  24482. "adc r5, r5, #0\n\t"
  24483. "str r4, [r10], #4\n\t"
  24484. /* a[i+j+1] += m[j+1] * mu */
  24485. "ldr %[a], [r10]\n\t"
  24486. "mov r4, #0\n\t"
  24487. /* Multiply m[j] and mu - Start */
  24488. "ldr r8, [%[m]], #4\n\t"
  24489. "umull r6, r8, %[mp], r8\n\t"
  24490. "adds %[a], %[a], r6\n\t"
  24491. "adc r4, r4, r8\n\t"
  24492. /* Multiply m[j] and mu - Done */
  24493. "adds r5, r5, %[a]\n\t"
  24494. "adc r4, r4, #0\n\t"
  24495. "str r5, [r10], #4\n\t"
  24496. "cmp r10, r14\n\t"
  24497. #ifdef __GNUC__
  24498. "blt 2b\n\t"
  24499. #else
  24500. "blt.n 2b\n\t"
  24501. #endif /* __GNUC__ */
  24502. /* a[i+10] += m[10] * mu */
  24503. "ldr %[a], [r10]\n\t"
  24504. "mov r5, #0\n\t"
  24505. /* Multiply m[j] and mu - Start */
  24506. "ldr r8, [%[m]], #4\n\t"
  24507. "umull r6, r8, %[mp], r8\n\t"
  24508. "adds %[a], %[a], r6\n\t"
  24509. "adc r5, r5, r8\n\t"
  24510. /* Multiply m[j] and mu - Done */
  24511. "adds r4, r4, %[a]\n\t"
  24512. "adc r5, r5, #0\n\t"
  24513. "str r4, [r10], #4\n\t"
  24514. /* a[i+11] += m[11] * mu */
  24515. "mov r4, %[ca]\n\t"
  24516. "mov %[ca], #0\n\t"
  24517. /* Multiply m[11] and mu - Start */
  24518. "ldr r8, [%[m]]\n\t"
  24519. "umull r6, r8, %[mp], r8\n\t"
  24520. "adds r5, r5, r6\n\t"
  24521. "adcs r4, r4, r8\n\t"
  24522. "adc %[ca], %[ca], #0\n\t"
  24523. /* Multiply m[11] and mu - Done */
  24524. "ldr r6, [r10]\n\t"
  24525. "ldr r8, [r10, #4]\n\t"
  24526. "adds r6, r6, r5\n\t"
  24527. "adcs r8, r8, r4\n\t"
  24528. "adc %[ca], %[ca], #0\n\t"
  24529. "str r6, [r10]\n\t"
  24530. "str r8, [r10, #4]\n\t"
  24531. /* Next word in a */
  24532. "sub r10, r10, #40\n\t"
  24533. "cmp r10, r11\n\t"
  24534. #ifdef __GNUC__
  24535. "blt 1b\n\t"
  24536. #else
  24537. "blt.n 1b\n\t"
  24538. #endif /* __GNUC__ */
  24539. "mov %[a], r10\n\t"
  24540. "mov %[m], r12\n\t"
  24541. : [ca] "+r" (ca), [a] "+r" (a)
  24542. : [m] "r" (m), [mp] "r" (mp)
  24543. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  24544. );
  24545. sp_384_cond_sub_12(a - 12, a, m, (sp_digit)0 - ca);
  24546. }
  24547. /* Multiply two Montgomery form numbers mod the modulus (prime).
  24548. * (r = a * b mod m)
  24549. *
  24550. * r Result of multiplication.
  24551. * a First number to multiply in Montgomery form.
  24552. * b Second number to multiply in Montgomery form.
  24553. * m Modulus (prime).
  24554. * mp Montgomery mulitplier.
  24555. */
  24556. SP_NOINLINE static void sp_384_mont_mul_12(sp_digit* r, const sp_digit* a,
  24557. const sp_digit* b, const sp_digit* m, sp_digit mp)
  24558. {
  24559. sp_384_mul_12(r, a, b);
  24560. sp_384_mont_reduce_12(r, m, mp);
  24561. }
  24562. /* Square the Montgomery form number. (r = a * a mod m)
  24563. *
  24564. * r Result of squaring.
  24565. * a Number to square in Montgomery form.
  24566. * m Modulus (prime).
  24567. * mp Montgomery mulitplier.
  24568. */
  24569. SP_NOINLINE static void sp_384_mont_sqr_12(sp_digit* r, const sp_digit* a,
  24570. const sp_digit* m, sp_digit mp)
  24571. {
  24572. sp_384_sqr_12(r, a);
  24573. sp_384_mont_reduce_12(r, m, mp);
  24574. }
  24575. #if !defined(WOLFSSL_SP_SMALL) || defined(HAVE_COMP_KEY)
  24576. /* Square the Montgomery form number a number of times. (r = a ^ n mod m)
  24577. *
  24578. * r Result of squaring.
  24579. * a Number to square in Montgomery form.
  24580. * n Number of times to square.
  24581. * m Modulus (prime).
  24582. * mp Montgomery mulitplier.
  24583. */
  24584. static void sp_384_mont_sqr_n_12(sp_digit* r, const sp_digit* a, int n,
  24585. const sp_digit* m, sp_digit mp)
  24586. {
  24587. sp_384_mont_sqr_12(r, a, m, mp);
  24588. for (; n > 1; n--) {
  24589. sp_384_mont_sqr_12(r, r, m, mp);
  24590. }
  24591. }
  24592. #endif /* !WOLFSSL_SP_SMALL | HAVE_COMP_KEY */
  24593. #ifdef WOLFSSL_SP_SMALL
  /* The P384 modulus minus 2, least significant 32-bit word first. */
  static const uint32_t p384_mod_minus_2[12] = {
      0xfffffffdU, 0x00000000U, 0x00000000U, 0xffffffffU,
      0xfffffffeU, 0xffffffffU, 0xffffffffU, 0xffffffffU,
      0xffffffffU, 0xffffffffU, 0xffffffffU, 0xffffffffU
  };
  #endif /* WOLFSSL_SP_SMALL */
  24600. /* Invert the number, in Montgomery form, modulo the modulus (prime) of the
  24601. * P384 curve. (r = 1 / a mod m)
  24602. *
  24603. * r Inverse result.
  24604. * a Number to invert.
  24605. * td Temporary data.
  24606. */
  24607. static void sp_384_mont_inv_12(sp_digit* r, const sp_digit* a, sp_digit* td)
  24608. {
  24609. #ifdef WOLFSSL_SP_SMALL
  24610. sp_digit* t = td;
  24611. int i;
  24612. XMEMCPY(t, a, sizeof(sp_digit) * 12);
  24613. for (i=382; i>=0; i--) {
  24614. sp_384_mont_sqr_12(t, t, p384_mod, p384_mp_mod);
  24615. if (p384_mod_minus_2[i / 32] & ((sp_digit)1 << (i % 32)))
  24616. sp_384_mont_mul_12(t, t, a, p384_mod, p384_mp_mod);
  24617. }
  24618. XMEMCPY(r, t, sizeof(sp_digit) * 12);
  24619. #else
  24620. sp_digit* t1 = td;
  24621. sp_digit* t2 = td + 2 * 12;
  24622. sp_digit* t3 = td + 4 * 12;
  24623. sp_digit* t4 = td + 6 * 12;
  24624. sp_digit* t5 = td + 8 * 12;
  24625. /* 0x2 */
  24626. sp_384_mont_sqr_12(t1, a, p384_mod, p384_mp_mod);
  24627. /* 0x3 */
  24628. sp_384_mont_mul_12(t5, t1, a, p384_mod, p384_mp_mod);
  24629. /* 0xc */
  24630. sp_384_mont_sqr_n_12(t1, t5, 2, p384_mod, p384_mp_mod);
  24631. /* 0xf */
  24632. sp_384_mont_mul_12(t2, t5, t1, p384_mod, p384_mp_mod);
  24633. /* 0x1e */
  24634. sp_384_mont_sqr_12(t1, t2, p384_mod, p384_mp_mod);
  24635. /* 0x1f */
  24636. sp_384_mont_mul_12(t4, t1, a, p384_mod, p384_mp_mod);
  24637. /* 0x3e0 */
  24638. sp_384_mont_sqr_n_12(t1, t4, 5, p384_mod, p384_mp_mod);
  24639. /* 0x3ff */
  24640. sp_384_mont_mul_12(t2, t4, t1, p384_mod, p384_mp_mod);
  24641. /* 0x7fe0 */
  24642. sp_384_mont_sqr_n_12(t1, t2, 5, p384_mod, p384_mp_mod);
  24643. /* 0x7fff */
  24644. sp_384_mont_mul_12(t4, t4, t1, p384_mod, p384_mp_mod);
  24645. /* 0x3fff8000 */
  24646. sp_384_mont_sqr_n_12(t1, t4, 15, p384_mod, p384_mp_mod);
  24647. /* 0x3fffffff */
  24648. sp_384_mont_mul_12(t2, t4, t1, p384_mod, p384_mp_mod);
  24649. /* 0xfffffffc */
  24650. sp_384_mont_sqr_n_12(t3, t2, 2, p384_mod, p384_mp_mod);
  24651. /* 0xfffffffd */
  24652. sp_384_mont_mul_12(r, t3, a, p384_mod, p384_mp_mod);
  24653. /* 0xffffffff */
  24654. sp_384_mont_mul_12(t3, t5, t3, p384_mod, p384_mp_mod);
  24655. /* 0xfffffffc0000000 */
  24656. sp_384_mont_sqr_n_12(t1, t2, 30, p384_mod, p384_mp_mod);
  24657. /* 0xfffffffffffffff */
  24658. sp_384_mont_mul_12(t2, t2, t1, p384_mod, p384_mp_mod);
  24659. /* 0xfffffffffffffff000000000000000 */
  24660. sp_384_mont_sqr_n_12(t1, t2, 60, p384_mod, p384_mp_mod);
  24661. /* 0xffffffffffffffffffffffffffffff */
  24662. sp_384_mont_mul_12(t2, t2, t1, p384_mod, p384_mp_mod);
  24663. /* 0xffffffffffffffffffffffffffffff000000000000000000000000000000 */
  24664. sp_384_mont_sqr_n_12(t1, t2, 120, p384_mod, p384_mp_mod);
  24665. /* 0xffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff */
  24666. sp_384_mont_mul_12(t2, t2, t1, p384_mod, p384_mp_mod);
  24667. /* 0x7fffffffffffffffffffffffffffffffffffffffffffffffffffffffffff8000 */
  24668. sp_384_mont_sqr_n_12(t1, t2, 15, p384_mod, p384_mp_mod);
  24669. /* 0x7fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff */
  24670. sp_384_mont_mul_12(t2, t4, t1, p384_mod, p384_mp_mod);
  24671. /* 0xfffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffe00000000 */
  24672. sp_384_mont_sqr_n_12(t1, t2, 33, p384_mod, p384_mp_mod);
  24673. /* 0xfffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffeffffffff */
  24674. sp_384_mont_mul_12(t2, t3, t1, p384_mod, p384_mp_mod);
  24675. /* 0xfffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffeffffffff000000000000000000000000 */
  24676. sp_384_mont_sqr_n_12(t1, t2, 96, p384_mod, p384_mp_mod);
  24677. /* 0xfffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffeffffffff0000000000000000fffffffd */
  24678. sp_384_mont_mul_12(r, r, t1, p384_mod, p384_mp_mod);
  24679. #endif /* WOLFSSL_SP_SMALL */
  24680. }
  24681. /* Compare a with b in constant time.
  24682. *
  24683. * a A single precision integer.
  24684. * b A single precision integer.
  24685. * return -ve, 0 or +ve if a is less than, equal to or greater than b
  24686. * respectively.
  24687. */
  24688. SP_NOINLINE static sp_int32 sp_384_cmp_12(const sp_digit* a, const sp_digit* b)
  24689. {
  24690. sp_digit r = 0;
  24691. __asm__ __volatile__ (
  24692. "mov r3, #0\n\t"
  24693. "mvn r3, r3\n\t"
  24694. "mov r6, #44\n\t"
  24695. "\n1:\n\t"
  24696. "ldr r8, [%[a], r6]\n\t"
  24697. "ldr r5, [%[b], r6]\n\t"
  24698. "and r8, r8, r3\n\t"
  24699. "and r5, r5, r3\n\t"
  24700. "mov r4, r8\n\t"
  24701. "subs r8, r8, r5\n\t"
  24702. "sbc r8, r8, r8\n\t"
  24703. "add %[r], %[r], r8\n\t"
  24704. "mvn r8, r8\n\t"
  24705. "and r3, r3, r8\n\t"
  24706. "subs r5, r5, r4\n\t"
  24707. "sbc r8, r8, r8\n\t"
  24708. "sub %[r], %[r], r8\n\t"
  24709. "mvn r8, r8\n\t"
  24710. "and r3, r3, r8\n\t"
  24711. "sub r6, r6, #4\n\t"
  24712. "cmp r6, #0\n\t"
  24713. #ifdef __GNUC__
  24714. "bge 1b\n\t"
  24715. #else
  24716. "bge.n 1b\n\t"
  24717. #endif /* __GNUC__ */
  24718. : [r] "+r" (r)
  24719. : [a] "r" (a), [b] "r" (b)
  24720. : "r3", "r4", "r5", "r6", "r8"
  24721. );
  24722. return r;
  24723. }
  /* Normalize the value in each word to 32 bits.
   *
   * This macro expands to nothing, so the call is a no-op in this
   * implementation.
   *
   * a  Array of sp_digit to normalize.
   */
  24728. #define sp_384_norm_12(a)
  24729. /* Map the Montgomery form projective coordinate point to an affine point.
  24730. *
  24731. * r Resulting affine coordinate point.
  24732. * p Montgomery form projective coordinate point.
  24733. * t Temporary ordinate data.
  24734. */
  24735. static void sp_384_map_12(sp_point_384* r, const sp_point_384* p,
  24736. sp_digit* t)
  24737. {
  24738. sp_digit* t1 = t;
  24739. sp_digit* t2 = t + 2*12;
  24740. sp_int32 n;
  24741. sp_384_mont_inv_12(t1, p->z, t + 2*12);
  24742. sp_384_mont_sqr_12(t2, t1, p384_mod, p384_mp_mod);
  24743. sp_384_mont_mul_12(t1, t2, t1, p384_mod, p384_mp_mod);
  24744. /* x /= z^2 */
  24745. sp_384_mont_mul_12(r->x, p->x, t2, p384_mod, p384_mp_mod);
  24746. XMEMSET(r->x + 12, 0, sizeof(r->x) / 2U);
  24747. sp_384_mont_reduce_12(r->x, p384_mod, p384_mp_mod);
  24748. /* Reduce x to less than modulus */
  24749. n = sp_384_cmp_12(r->x, p384_mod);
  24750. sp_384_cond_sub_12(r->x, r->x, p384_mod, ~(n >> 31));
  24751. sp_384_norm_12(r->x);
  24752. /* y /= z^3 */
  24753. sp_384_mont_mul_12(r->y, p->y, t1, p384_mod, p384_mp_mod);
  24754. XMEMSET(r->y + 12, 0, sizeof(r->y) / 2U);
  24755. sp_384_mont_reduce_12(r->y, p384_mod, p384_mp_mod);
  24756. /* Reduce y to less than modulus */
  24757. n = sp_384_cmp_12(r->y, p384_mod);
  24758. sp_384_cond_sub_12(r->y, r->y, p384_mod, ~(n >> 31));
  24759. sp_384_norm_12(r->y);
  24760. XMEMSET(r->z, 0, sizeof(r->z) / 2);
  24761. r->z[0] = 1;
  24762. }
  24763. /* Add two Montgomery form numbers (r = a + b % m).
  24764. *
  24765. * r Result of addition.
  24766. * a First number to add in Montgomery form.
  24767. * b Second number to add in Montgomery form.
  24768. * m Modulus (prime).
  24769. */
  24770. SP_NOINLINE static void sp_384_mont_add_12(sp_digit* r, const sp_digit* a, const sp_digit* b,
  24771. const sp_digit* m)
  24772. {
  24773. sp_digit o;
  24774. o = sp_384_add_12(r, a, b);
  24775. sp_384_cond_sub_12(r, r, m, 0 - o);
  24776. }
  24777. /* Double a Montgomery form number (r = a + a % m).
  24778. *
  24779. * r Result of doubling.
  24780. * a Number to double in Montgomery form.
  24781. * m Modulus (prime).
  24782. */
  24783. SP_NOINLINE static void sp_384_mont_dbl_12(sp_digit* r, const sp_digit* a, const sp_digit* m)
  24784. {
  24785. sp_digit o;
  24786. o = sp_384_add_12(r, a, a);
  24787. sp_384_cond_sub_12(r, r, m, 0 - o);
  24788. }
  24789. /* Triple a Montgomery form number (r = a + a + a % m).
  24790. *
  24791. * r Result of Tripling.
  24792. * a Number to triple in Montgomery form.
  24793. * m Modulus (prime).
  24794. */
  24795. SP_NOINLINE static void sp_384_mont_tpl_12(sp_digit* r, const sp_digit* a, const sp_digit* m)
  24796. {
  24797. sp_digit o;
  24798. o = sp_384_add_12(r, a, a);
  24799. sp_384_cond_sub_12(r, r, m, 0 - o);
  24800. o = sp_384_add_12(r, r, a);
  24801. sp_384_cond_sub_12(r, r, m, 0 - o);
  24802. }
  24803. /* Conditionally add a and b using the mask m.
  24804. * m is -1 to add and 0 when not.
  24805. *
  24806. * r A single precision number representing conditional add result.
  24807. * a A single precision number to add with.
  24808. * b A single precision number to add.
  24809. * m Mask value to apply.
  24810. */
  24811. SP_NOINLINE static sp_digit sp_384_cond_add_12(sp_digit* r, const sp_digit* a, const sp_digit* b,
  24812. sp_digit m)
  24813. {
  24814. sp_digit c = 0;
  24815. __asm__ __volatile__ (
  24816. "mov r5, #48\n\t"
  24817. "mov r9, r5\n\t"
  24818. "mov r8, #0\n\t"
  24819. "\n1:\n\t"
  24820. "ldr r6, [%[b], r8]\n\t"
  24821. "and r6, r6, %[m]\n\t"
  24822. "adds r5, %[c], #-1\n\t"
  24823. "ldr r5, [%[a], r8]\n\t"
  24824. "adcs r5, r5, r6\n\t"
  24825. "mov %[c], #0\n\t"
  24826. "adcs %[c], %[c], %[c]\n\t"
  24827. "str r5, [%[r], r8]\n\t"
  24828. "add r8, r8, #4\n\t"
  24829. "cmp r8, r9\n\t"
  24830. #ifdef __GNUC__
  24831. "blt 1b\n\t"
  24832. #else
  24833. "blt.n 1b\n\t"
  24834. #endif /* __GNUC__ */
  24835. : [c] "+r" (c)
  24836. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  24837. : "memory", "r5", "r6", "r8", "r9"
  24838. );
  24839. return c;
  24840. }
  24841. /* Subtract two Montgomery form numbers (r = a - b % m).
  24842. *
  24843. * r Result of subtration.
  24844. * a Number to subtract from in Montgomery form.
  24845. * b Number to subtract with in Montgomery form.
  24846. * m Modulus (prime).
  24847. */
  24848. SP_NOINLINE static void sp_384_mont_sub_12(sp_digit* r, const sp_digit* a, const sp_digit* b,
  24849. const sp_digit* m)
  24850. {
  24851. sp_digit o;
  24852. o = sp_384_sub_12(r, a, b);
  24853. sp_384_cond_add_12(r, r, m, o);
  24854. }
  24855. #define sp_384_mont_sub_lower_12 sp_384_mont_sub_12
/* Shift a 12 word number right by one bit (r = a >> 1).
 *
 * Each result word is (a[i] >> 1) | (a[i+1] << 31); the top word is
 * a[11] >> 1. A word of a is always loaded before the result word at the
 * same or a lower index is stored, so r and a may be the same buffer.
 *
 * r  Result of the shift.
 * a  Number to shift.
 */
static void sp_384_rshift1_12(sp_digit* r, const sp_digit* a)
{
    __asm__ __volatile__ (
        /* r2, r3 and r4 rotate through the roles "current word",
         * "next word" and "word being stored".
         */
        "ldr	r2, [%[a]]\n\t"
        "ldr	r3, [%[a], #4]\n\t"
        "lsr	r2, r2, #1\n\t"
        /* Bring bit 0 of the next word into bit 31 of this one. */
        "orr	r2, r2, r3, lsl #31\n\t"
        "lsr	r3, r3, #1\n\t"
        "ldr	r4, [%[a], #8]\n\t"
        "str	r2, [%[r], #0]\n\t"
        "orr	r3, r3, r4, lsl #31\n\t"
        "lsr	r4, r4, #1\n\t"
        "ldr	r2, [%[a], #12]\n\t"
        "str	r3, [%[r], #4]\n\t"
        "orr	r4, r4, r2, lsl #31\n\t"
        "lsr	r2, r2, #1\n\t"
        "ldr	r3, [%[a], #16]\n\t"
        "str	r4, [%[r], #8]\n\t"
        "orr	r2, r2, r3, lsl #31\n\t"
        "lsr	r3, r3, #1\n\t"
        "ldr	r4, [%[a], #20]\n\t"
        "str	r2, [%[r], #12]\n\t"
        "orr	r3, r3, r4, lsl #31\n\t"
        "lsr	r4, r4, #1\n\t"
        "ldr	r2, [%[a], #24]\n\t"
        "str	r3, [%[r], #16]\n\t"
        "orr	r4, r4, r2, lsl #31\n\t"
        "lsr	r2, r2, #1\n\t"
        "ldr	r3, [%[a], #28]\n\t"
        "str	r4, [%[r], #20]\n\t"
        "orr	r2, r2, r3, lsl #31\n\t"
        "lsr	r3, r3, #1\n\t"
        "ldr	r4, [%[a], #32]\n\t"
        "str	r2, [%[r], #24]\n\t"
        "orr	r3, r3, r4, lsl #31\n\t"
        "lsr	r4, r4, #1\n\t"
        "ldr	r2, [%[a], #36]\n\t"
        "str	r3, [%[r], #28]\n\t"
        "orr	r4, r4, r2, lsl #31\n\t"
        "lsr	r2, r2, #1\n\t"
        "ldr	r3, [%[a], #40]\n\t"
        "str	r4, [%[r], #32]\n\t"
        "orr	r2, r2, r3, lsl #31\n\t"
        "lsr	r3, r3, #1\n\t"
        "ldr	r4, [%[a], #44]\n\t"
        "str	r2, [%[r], #36]\n\t"
        "orr	r3, r3, r4, lsl #31\n\t"
        /* Top word: nothing is shifted in from above. */
        "lsr	r4, r4, #1\n\t"
        "str	r3, [%[r], #40]\n\t"
        "str	r4, [%[r], #44]\n\t"
        :
        : [r] "r" (r), [a] "r" (a)
        : "memory", "r2", "r3", "r4"
    );
}
  24911. /* Divide the number by 2 mod the modulus (prime). (r = a / 2 % m)
  24912. *
  24913. * r Result of division by 2.
  24914. * a Number to divide.
  24915. * m Modulus (prime).
  24916. */
  24917. SP_NOINLINE static void sp_384_div2_12(sp_digit* r, const sp_digit* a, const sp_digit* m)
  24918. {
  24919. sp_digit o;
  24920. o = sp_384_cond_add_12(r, a, m, 0 - (a[0] & 1));
  24921. sp_384_rshift1_12(r, r);
  24922. r[11] |= o << 31;
  24923. }
/* Double the Montgomery form projective point p.
 *
 * r  Result of doubling point.
 * p  Point to double.
 * t  Temporary ordinate data.
 */
#ifdef WOLFSSL_SP_NONBLOCK
/* State kept between calls of the non-blocking point double. */
typedef struct sp_384_proj_point_dbl_12_ctx {
    int state;      /* Next step of the state machine to execute. */
    sp_digit* t1;   /* First temporary (start of t). */
    sp_digit* t2;   /* Second temporary (t + 2*12). */
    sp_digit* x;    /* Result x ordinate (r->x). */
    sp_digit* y;    /* Result y ordinate (r->y). */
    sp_digit* z;    /* Result z ordinate (r->z). */
} sp_384_proj_point_dbl_12_ctx;

/* Non-blocking version of the point double: each call executes one step of
 * the computation, selected by the state stored in the context.
 *
 * sp_ctx  Context whose data area holds a sp_384_proj_point_dbl_12_ctx.
 *         The state must be 0 on the first call.
 * r       Result of doubling point.
 * p       Point to double.
 * t       Temporary ordinate data.
 * returns FP_WOULDBLOCK while steps remain and MP_OKAY when state 19 (done)
 * has been reached.
 */
static int sp_384_proj_point_dbl_12_nb(sp_ecc_ctx_t* sp_ctx, sp_point_384* r, const sp_point_384* p, sp_digit* t)
{
    int err = FP_WOULDBLOCK;
    sp_384_proj_point_dbl_12_ctx* ctx = (sp_384_proj_point_dbl_12_ctx*)sp_ctx->data;

    /* Compile-time check: the array size is -1 (an error) when this context
     * structure is not smaller than *sp_ctx.
     */
    typedef char ctx_size_test[sizeof(sp_384_proj_point_dbl_12_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
    (void)sizeof(ctx_size_test);

    switch (ctx->state) {
    case 0:
        /* Set up temporaries and result pointers. */
        ctx->t1 = t;
        ctx->t2 = t + 2*12;
        ctx->x = r->x;
        ctx->y = r->y;
        ctx->z = r->z;

        /* Put infinity into result. */
        if (r != p) {
            r->infinity = p->infinity;
        }
        ctx->state = 1;
        break;
    case 1:
        /* T1 = Z * Z */
        sp_384_mont_sqr_12(ctx->t1, p->z, p384_mod, p384_mp_mod);
        ctx->state = 2;
        break;
    case 2:
        /* Z = Y * Z */
        sp_384_mont_mul_12(ctx->z, p->y, p->z, p384_mod, p384_mp_mod);
        ctx->state = 3;
        break;
    case 3:
        /* Z = 2Z */
        sp_384_mont_dbl_12(ctx->z, ctx->z, p384_mod);
        ctx->state = 4;
        break;
    case 4:
        /* T2 = X - T1 */
        sp_384_mont_sub_12(ctx->t2, p->x, ctx->t1, p384_mod);
        ctx->state = 5;
        break;
    case 5:
        /* T1 = X + T1 */
        sp_384_mont_add_12(ctx->t1, p->x, ctx->t1, p384_mod);
        ctx->state = 6;
        break;
    case 6:
        /* T2 = T1 * T2 */
        sp_384_mont_mul_12(ctx->t2, ctx->t1, ctx->t2, p384_mod, p384_mp_mod);
        ctx->state = 7;
        break;
    case 7:
        /* T1 = 3T2 */
        sp_384_mont_tpl_12(ctx->t1, ctx->t2, p384_mod);
        ctx->state = 8;
        break;
    case 8:
        /* Y = 2Y */
        sp_384_mont_dbl_12(ctx->y, p->y, p384_mod);
        ctx->state = 9;
        break;
    case 9:
        /* Y = Y * Y */
        sp_384_mont_sqr_12(ctx->y, ctx->y, p384_mod, p384_mp_mod);
        ctx->state = 10;
        break;
    case 10:
        /* T2 = Y * Y */
        sp_384_mont_sqr_12(ctx->t2, ctx->y, p384_mod, p384_mp_mod);
        ctx->state = 11;
        break;
    case 11:
        /* T2 = T2/2 */
        sp_384_div2_12(ctx->t2, ctx->t2, p384_mod);
        ctx->state = 12;
        break;
    case 12:
        /* Y = Y * X */
        sp_384_mont_mul_12(ctx->y, ctx->y, p->x, p384_mod, p384_mp_mod);
        ctx->state = 13;
        break;
    case 13:
        /* X = T1 * T1 */
        sp_384_mont_sqr_12(ctx->x, ctx->t1, p384_mod, p384_mp_mod);
        ctx->state = 14;
        break;
    case 14:
        /* X = X - Y */
        sp_384_mont_sub_12(ctx->x, ctx->x, ctx->y, p384_mod);
        ctx->state = 15;
        break;
    case 15:
        /* X = X - Y */
        sp_384_mont_sub_12(ctx->x, ctx->x, ctx->y, p384_mod);
        ctx->state = 16;
        break;
    case 16:
        /* Y = Y - X */
        sp_384_mont_sub_lower_12(ctx->y, ctx->y, ctx->x, p384_mod);
        ctx->state = 17;
        break;
    case 17:
        /* Y = Y * T1 */
        sp_384_mont_mul_12(ctx->y, ctx->y, ctx->t1, p384_mod, p384_mp_mod);
        ctx->state = 18;
        break;
    case 18:
        /* Y = Y - T2 */
        sp_384_mont_sub_12(ctx->y, ctx->y, ctx->t2, p384_mod);
        ctx->state = 19;
        /* fall-through */
    case 19:
        /* Done. */
        err = MP_OKAY;
        break;
    }

    /* Only report success once the final state has been reached. */
    if (err == MP_OKAY && ctx->state != 19) {
        err = FP_WOULDBLOCK;
    }
    return err;
}
#endif /* WOLFSSL_SP_NONBLOCK */
  25058. static void sp_384_proj_point_dbl_12(sp_point_384* r, const sp_point_384* p,
  25059. sp_digit* t)
  25060. {
  25061. sp_digit* t1 = t;
  25062. sp_digit* t2 = t + 2*12;
  25063. sp_digit* x;
  25064. sp_digit* y;
  25065. sp_digit* z;
  25066. x = r->x;
  25067. y = r->y;
  25068. z = r->z;
  25069. /* Put infinity into result. */
  25070. if (r != p) {
  25071. r->infinity = p->infinity;
  25072. }
  25073. /* T1 = Z * Z */
  25074. sp_384_mont_sqr_12(t1, p->z, p384_mod, p384_mp_mod);
  25075. /* Z = Y * Z */
  25076. sp_384_mont_mul_12(z, p->y, p->z, p384_mod, p384_mp_mod);
  25077. /* Z = 2Z */
  25078. sp_384_mont_dbl_12(z, z, p384_mod);
  25079. /* T2 = X - T1 */
  25080. sp_384_mont_sub_12(t2, p->x, t1, p384_mod);
  25081. /* T1 = X + T1 */
  25082. sp_384_mont_add_12(t1, p->x, t1, p384_mod);
  25083. /* T2 = T1 * T2 */
  25084. sp_384_mont_mul_12(t2, t1, t2, p384_mod, p384_mp_mod);
  25085. /* T1 = 3T2 */
  25086. sp_384_mont_tpl_12(t1, t2, p384_mod);
  25087. /* Y = 2Y */
  25088. sp_384_mont_dbl_12(y, p->y, p384_mod);
  25089. /* Y = Y * Y */
  25090. sp_384_mont_sqr_12(y, y, p384_mod, p384_mp_mod);
  25091. /* T2 = Y * Y */
  25092. sp_384_mont_sqr_12(t2, y, p384_mod, p384_mp_mod);
  25093. /* T2 = T2/2 */
  25094. sp_384_div2_12(t2, t2, p384_mod);
  25095. /* Y = Y * X */
  25096. sp_384_mont_mul_12(y, y, p->x, p384_mod, p384_mp_mod);
  25097. /* X = T1 * T1 */
  25098. sp_384_mont_sqr_12(x, t1, p384_mod, p384_mp_mod);
  25099. /* X = X - Y */
  25100. sp_384_mont_sub_12(x, x, y, p384_mod);
  25101. /* X = X - Y */
  25102. sp_384_mont_sub_12(x, x, y, p384_mod);
  25103. /* Y = Y - X */
  25104. sp_384_mont_sub_lower_12(y, y, x, p384_mod);
  25105. /* Y = Y * T1 */
  25106. sp_384_mont_mul_12(y, y, t1, p384_mod, p384_mp_mod);
  25107. /* Y = Y - T2 */
  25108. sp_384_mont_sub_12(y, y, t2, p384_mod);
  25109. }
  25110. /* Compare two numbers to determine if they are equal.
  25111. * Constant time implementation.
  25112. *
  25113. * a First number to compare.
  25114. * b Second number to compare.
  25115. * returns 1 when equal and 0 otherwise.
  25116. */
  25117. static int sp_384_cmp_equal_12(const sp_digit* a, const sp_digit* b)
  25118. {
  25119. return ((a[0] ^ b[0]) | (a[1] ^ b[1]) | (a[2] ^ b[2]) |
  25120. (a[3] ^ b[3]) | (a[4] ^ b[4]) | (a[5] ^ b[5]) |
  25121. (a[6] ^ b[6]) | (a[7] ^ b[7]) | (a[8] ^ b[8]) |
  25122. (a[9] ^ b[9]) | (a[10] ^ b[10]) | (a[11] ^ b[11])) == 0;
  25123. }
  25124. /* Returns 1 if the number of zero.
  25125. * Implementation is constant time.
  25126. *
  25127. * a Number to check.
  25128. * returns 1 if the number is zero and 0 otherwise.
  25129. */
  25130. static int sp_384_iszero_12(const sp_digit* a)
  25131. {
  25132. return (a[0] | a[1] | a[2] | a[3] | a[4] | a[5] | a[6] | a[7] |
  25133. a[8] | a[9] | a[10] | a[11]) == 0;
  25134. }
/* Add two Montgomery form projective points.
 *
 * r  Result of addition.
 * p  First point to add.
 * q  Second point to add.
 * t  Temporary ordinate data.
 */
#ifdef WOLFSSL_SP_NONBLOCK
/* State kept between calls of the non-blocking point add. */
typedef struct sp_384_proj_point_add_12_ctx {
    int state;                              /* Next step to execute. */
    sp_384_proj_point_dbl_12_ctx dbl_ctx;   /* Context for the nested double. */
    const sp_point_384* ap[2];              /* Not used by the code in this function. */
    sp_point_384* rp[2];                    /* Not used by the code in this function. */
    sp_digit* t1;                           /* Temporaries: t + 0, 2, 4, 6, 8, 10 (x12). */
    sp_digit* t2;
    sp_digit* t3;
    sp_digit* t4;
    sp_digit* t5;
    sp_digit* t6;
    sp_digit* x;                            /* Computed x ordinate (aliases t6). */
    sp_digit* y;                            /* Computed y ordinate (aliases t1). */
    sp_digit* z;                            /* Computed z ordinate (aliases t2). */
} sp_384_proj_point_add_12_ctx;

/* Non-blocking version of the point add: each call executes one step of the
 * computation, selected by the state stored in the context.
 *
 * sp_ctx  Context whose data area holds a sp_384_proj_point_add_12_ctx.
 *         The state must be 0 on the first call.
 * r       Result of addition.
 * p       First point to add.
 * q       Second point to add.
 * t       Temporary ordinate data; 12*12 words are used.
 * returns FP_WOULDBLOCK while steps remain and MP_OKAY when state 27 (done)
 * has been reached.
 */
static int sp_384_proj_point_add_12_nb(sp_ecc_ctx_t* sp_ctx, sp_point_384* r,
    const sp_point_384* p, const sp_point_384* q, sp_digit* t)
{
    int err = FP_WOULDBLOCK;
    sp_384_proj_point_add_12_ctx* ctx = (sp_384_proj_point_add_12_ctx*)sp_ctx->data;

    /* Ensure only the first point is the same as the result. */
    if (q == r) {
        const sp_point_384* a = p;
        p = q;
        q = a;
    }

    /* Compile-time check: the array size is -1 (an error) when this context
     * structure is not smaller than *sp_ctx.
     */
    typedef char ctx_size_test[sizeof(sp_384_proj_point_add_12_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
    (void)sizeof(ctx_size_test);

    switch (ctx->state) {
    case 0: /* INIT */
        ctx->t1 = t;
        ctx->t2 = t + 2*12;
        ctx->t3 = t + 4*12;
        ctx->t4 = t + 6*12;
        ctx->t5 = t + 8*12;
        ctx->t6 = t + 10*12;
        /* The computed ordinates live in temporaries until the final copy. */
        ctx->x = ctx->t6;
        ctx->y = ctx->t1;
        ctx->z = ctx->t2;

        ctx->state = 1;
        break;
    case 1:
        /* Check double */
        /* t1 = p384_mod - q->y */
        (void)sp_384_sub_12(ctx->t1, p384_mod, q->y);
        sp_384_norm_12(ctx->t1);
        /* NOTE(review): besides p == q this condition also matches
         * p->y == p384_mod - q->y and routes that case to the doubling
         * path as well - confirm this is intended.
         */
        if ((~p->infinity & ~q->infinity &
            sp_384_cmp_equal_12(p->x, q->x) & sp_384_cmp_equal_12(p->z, q->z) &
            (sp_384_cmp_equal_12(p->y, q->y) | sp_384_cmp_equal_12(p->y, ctx->t1))) != 0)
        {
            /* Start the nested doubling state machine from its state 0. */
            XMEMSET(&ctx->dbl_ctx, 0, sizeof(ctx->dbl_ctx));
            ctx->state = 2;
        }
        else {
            ctx->state = 3;
        }
        break;
    case 2:
        /* One step of the nested double; it writes directly into r. */
        err = sp_384_proj_point_dbl_12_nb((sp_ecc_ctx_t*)&ctx->dbl_ctx, r, p, t);
        if (err == MP_OKAY)
            ctx->state = 27; /* done */
        break;
    case 3:
    {
        /* No work in this state; move on to the addition proper. */
        ctx->state = 4;
        break;
    }
    case 4:
        /* U1 = X1*Z2^2 */
        sp_384_mont_sqr_12(ctx->t1, q->z, p384_mod, p384_mp_mod);
        ctx->state = 5;
        break;
    case 5:
        /* t3 = Z2^3 */
        sp_384_mont_mul_12(ctx->t3, ctx->t1, q->z, p384_mod, p384_mp_mod);
        ctx->state = 6;
        break;
    case 6:
        sp_384_mont_mul_12(ctx->t1, ctx->t1, p->x, p384_mod, p384_mp_mod);
        ctx->state = 7;
        break;
    case 7:
        /* U2 = X2*Z1^2 */
        sp_384_mont_sqr_12(ctx->t2, p->z, p384_mod, p384_mp_mod);
        ctx->state = 8;
        break;
    case 8:
        /* t4 = Z1^3 */
        sp_384_mont_mul_12(ctx->t4, ctx->t2, p->z, p384_mod, p384_mp_mod);
        ctx->state = 9;
        break;
    case 9:
        sp_384_mont_mul_12(ctx->t2, ctx->t2, q->x, p384_mod, p384_mp_mod);
        ctx->state = 10;
        break;
    case 10:
        /* S1 = Y1*Z2^3 */
        sp_384_mont_mul_12(ctx->t3, ctx->t3, p->y, p384_mod, p384_mp_mod);
        ctx->state = 11;
        break;
    case 11:
        /* S2 = Y2*Z1^3 */
        sp_384_mont_mul_12(ctx->t4, ctx->t4, q->y, p384_mod, p384_mp_mod);
        ctx->state = 12;
        break;
    case 12:
        /* H = U2 - U1 */
        sp_384_mont_sub_12(ctx->t2, ctx->t2, ctx->t1, p384_mod);
        ctx->state = 13;
        break;
    case 13:
        /* R = S2 - S1 */
        sp_384_mont_sub_12(ctx->t4, ctx->t4, ctx->t3, p384_mod);
        ctx->state = 14;
        break;
    case 14:
        /* X3 = R^2 - H^3 - 2*U1*H^2 */
        /* t5 = H^2 */
        sp_384_mont_sqr_12(ctx->t5, ctx->t2, p384_mod, p384_mp_mod);
        ctx->state = 15;
        break;
    case 15:
        /* y = U1*H^2 */
        sp_384_mont_mul_12(ctx->y, ctx->t1, ctx->t5, p384_mod, p384_mp_mod);
        ctx->state = 16;
        break;
    case 16:
        /* t5 = H^3 */
        sp_384_mont_mul_12(ctx->t5, ctx->t5, ctx->t2, p384_mod, p384_mp_mod);
        ctx->state = 17;
        break;
    case 17:
        /* Z3 = H*Z1*Z2 */
        sp_384_mont_mul_12(ctx->z, p->z, ctx->t2, p384_mod, p384_mp_mod);
        ctx->state = 18;
        break;
    case 18:
        sp_384_mont_mul_12(ctx->z, ctx->z, q->z, p384_mod, p384_mp_mod);
        ctx->state = 19;
        break;
    case 19:
        /* x = R^2 */
        sp_384_mont_sqr_12(ctx->x, ctx->t4, p384_mod, p384_mp_mod);
        ctx->state = 20;
        break;
    case 20:
        /* x = R^2 - H^3 */
        sp_384_mont_sub_12(ctx->x, ctx->x, ctx->t5, p384_mod);
        ctx->state = 21;
        break;
    case 21:
        /* t5 = S1*H^3 */
        sp_384_mont_mul_12(ctx->t5, ctx->t5, ctx->t3, p384_mod, p384_mp_mod);
        ctx->state = 22;
        break;
    case 22:
        /* t3 = 2*U1*H^2 */
        sp_384_mont_dbl_12(ctx->t3, ctx->y, p384_mod);
        ctx->state = 23;
        break;
    case 23:
        sp_384_mont_sub_12(ctx->x, ctx->x, ctx->t3, p384_mod);
        ctx->state = 24;
        break;
    case 24:
        /* Y3 = R*(U1*H^2 - X3) - S1*H^3 */
        sp_384_mont_sub_lower_12(ctx->y, ctx->y, ctx->x, p384_mod);
        ctx->state = 25;
        break;
    case 25:
        sp_384_mont_mul_12(ctx->y, ctx->y, ctx->t4, p384_mod, p384_mp_mod);
        ctx->state = 26;
        break;
    case 26:
        sp_384_mont_sub_12(ctx->y, ctx->y, ctx->t5, p384_mod);
        ctx->state = 27;
        /* fall-through */
    case 27:
    {
        /* Select the result with masks instead of branches:
         *   maskp is all ones when only q is infinity (result is p),
         *   maskq is all ones when only p is infinity (result is q),
         *   maskt is all ones otherwise (result is the computed point).
         */
        int i;
        sp_digit maskp = 0 - (q->infinity & (!p->infinity));
        sp_digit maskq = 0 - (p->infinity & (!q->infinity));
        sp_digit maskt = ~(maskp | maskq);
        for (i = 0; i < 12; i++) {
            r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) |
                      (ctx->x[i] & maskt);
        }
        for (i = 0; i < 12; i++) {
            r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) |
                      (ctx->y[i] & maskt);
        }
        for (i = 0; i < 12; i++) {
            r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) |
                      (ctx->z[i] & maskt);
        }
        /* When both inputs are infinity the result is flagged as infinity
         * and the low bit of z[0] is set.
         */
        r->z[0] |= p->infinity & q->infinity;
        r->infinity = p->infinity & q->infinity;

        err = MP_OKAY;
        break;
    }
    }

    /* Only report success once the final state has been reached. */
    if (err == MP_OKAY && ctx->state != 27) {
        err = FP_WOULDBLOCK;
    }
    return err;
}
#endif /* WOLFSSL_SP_NONBLOCK */
/* Add two Montgomery form projective points (blocking version).
 *
 * Equal inputs are handed to sp_384_proj_point_dbl_12. Otherwise the sum is
 * computed in temporaries and copied into r with masks, so that an input at
 * infinity yields the other input.
 *
 * r  Result of addition.
 * p  First point to add.
 * q  Second point to add.
 * t  Temporary ordinate data; 12*12 words are used.
 */
static void sp_384_proj_point_add_12(sp_point_384* r,
    const sp_point_384* p, const sp_point_384* q, sp_digit* t)
{
    sp_digit* t1 = t;
    sp_digit* t2 = t + 2*12;
    sp_digit* t3 = t + 4*12;
    sp_digit* t4 = t + 6*12;
    sp_digit* t5 = t + 8*12;
    sp_digit* t6 = t + 10*12;

    /* Check double */
    /* t1 = p384_mod - q->y */
    (void)sp_384_sub_12(t1, p384_mod, q->y);
    sp_384_norm_12(t1);
    /* NOTE(review): besides p == q this condition also matches
     * p->y == p384_mod - q->y and doubles in that case too - confirm this
     * is intended.
     */
    if ((~p->infinity & ~q->infinity &
        sp_384_cmp_equal_12(p->x, q->x) & sp_384_cmp_equal_12(p->z, q->z) &
        (sp_384_cmp_equal_12(p->y, q->y) | sp_384_cmp_equal_12(p->y, t1))) != 0) {
        sp_384_proj_point_dbl_12(r, p, t);
    }
    else {
        sp_digit maskp;
        sp_digit maskq;
        sp_digit maskt;
        /* The computed ordinates live in temporaries until the final copy. */
        sp_digit* x = t6;
        sp_digit* y = t1;
        sp_digit* z = t2;
        int i;

        /* maskp: all ones when only q is infinity (result is p).
         * maskq: all ones when only p is infinity (result is q).
         * maskt: all ones otherwise (result is the computed point).
         */
        maskp = 0 - (q->infinity & (!p->infinity));
        maskq = 0 - (p->infinity & (!q->infinity));
        maskt = ~(maskp | maskq);

        /* U1 = X1*Z2^2 */
        sp_384_mont_sqr_12(t1, q->z, p384_mod, p384_mp_mod);
        sp_384_mont_mul_12(t3, t1, q->z, p384_mod, p384_mp_mod);
        sp_384_mont_mul_12(t1, t1, p->x, p384_mod, p384_mp_mod);
        /* U2 = X2*Z1^2 */
        sp_384_mont_sqr_12(t2, p->z, p384_mod, p384_mp_mod);
        sp_384_mont_mul_12(t4, t2, p->z, p384_mod, p384_mp_mod);
        sp_384_mont_mul_12(t2, t2, q->x, p384_mod, p384_mp_mod);
        /* S1 = Y1*Z2^3 */
        sp_384_mont_mul_12(t3, t3, p->y, p384_mod, p384_mp_mod);
        /* S2 = Y2*Z1^3 */
        sp_384_mont_mul_12(t4, t4, q->y, p384_mod, p384_mp_mod);
        /* H = U2 - U1 */
        sp_384_mont_sub_12(t2, t2, t1, p384_mod);
        /* R = S2 - S1 */
        sp_384_mont_sub_12(t4, t4, t3, p384_mod);
        /* H == 0 and R == 0 with neither input at infinity: the inputs are
         * the same point in different projective representations, so double.
         */
        if (~p->infinity & ~q->infinity &
                sp_384_iszero_12(t2) & sp_384_iszero_12(t4) & maskt) {
            sp_384_proj_point_dbl_12(r, p, t);
        }
        else {
            /* X3 = R^2 - H^3 - 2*U1*H^2 */
            sp_384_mont_sqr_12(t5, t2, p384_mod, p384_mp_mod);
            sp_384_mont_mul_12(y, t1, t5, p384_mod, p384_mp_mod);
            sp_384_mont_mul_12(t5, t5, t2, p384_mod, p384_mp_mod);
            /* Z3 = H*Z1*Z2 */
            sp_384_mont_mul_12(z, p->z, t2, p384_mod, p384_mp_mod);
            sp_384_mont_mul_12(z, z, q->z, p384_mod, p384_mp_mod);
            sp_384_mont_sqr_12(x, t4, p384_mod, p384_mp_mod);
            sp_384_mont_sub_12(x, x, t5, p384_mod);
            sp_384_mont_mul_12(t5, t5, t3, p384_mod, p384_mp_mod);
            sp_384_mont_dbl_12(t3, y, p384_mod);
            sp_384_mont_sub_12(x, x, t3, p384_mod);
            /* Y3 = R*(U1*H^2 - X3) - S1*H^3 */
            sp_384_mont_sub_lower_12(y, y, x, p384_mod);
            sp_384_mont_mul_12(y, y, t4, p384_mod, p384_mp_mod);
            sp_384_mont_sub_12(y, y, t5, p384_mod);

            /* Masked copy of p, q or the computed point into r. */
            for (i = 0; i < 12; i++) {
                r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) |
                          (x[i] & maskt);
            }
            for (i = 0; i < 12; i++) {
                r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) |
                          (y[i] & maskt);
            }
            for (i = 0; i < 12; i++) {
                r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) |
                          (z[i] & maskt);
            }
            /* When both inputs are infinity the result is flagged as
             * infinity and the low bit of z[0] is set.
             */
            r->z[0] |= p->infinity & q->infinity;
            r->infinity = p->infinity & q->infinity;
        }
    }
}
  25422. #ifndef WC_NO_CACHE_RESISTANT
  25423. /* Touch each possible point that could be being copied.
  25424. *
  25425. * r Point to copy into.
  25426. * table Table - start of the entires to access
  25427. * idx Index of entry to retrieve.
  25428. */
  25429. static void sp_384_get_point_16_12(sp_point_384* r, const sp_point_384* table,
  25430. int idx)
  25431. {
  25432. int i;
  25433. sp_digit mask;
  25434. r->x[0] = 0;
  25435. r->x[1] = 0;
  25436. r->x[2] = 0;
  25437. r->x[3] = 0;
  25438. r->x[4] = 0;
  25439. r->x[5] = 0;
  25440. r->x[6] = 0;
  25441. r->x[7] = 0;
  25442. r->x[8] = 0;
  25443. r->x[9] = 0;
  25444. r->x[10] = 0;
  25445. r->x[11] = 0;
  25446. r->y[0] = 0;
  25447. r->y[1] = 0;
  25448. r->y[2] = 0;
  25449. r->y[3] = 0;
  25450. r->y[4] = 0;
  25451. r->y[5] = 0;
  25452. r->y[6] = 0;
  25453. r->y[7] = 0;
  25454. r->y[8] = 0;
  25455. r->y[9] = 0;
  25456. r->y[10] = 0;
  25457. r->y[11] = 0;
  25458. r->z[0] = 0;
  25459. r->z[1] = 0;
  25460. r->z[2] = 0;
  25461. r->z[3] = 0;
  25462. r->z[4] = 0;
  25463. r->z[5] = 0;
  25464. r->z[6] = 0;
  25465. r->z[7] = 0;
  25466. r->z[8] = 0;
  25467. r->z[9] = 0;
  25468. r->z[10] = 0;
  25469. r->z[11] = 0;
  25470. for (i = 1; i < 16; i++) {
  25471. mask = 0 - (i == idx);
  25472. r->x[0] |= mask & table[i].x[0];
  25473. r->x[1] |= mask & table[i].x[1];
  25474. r->x[2] |= mask & table[i].x[2];
  25475. r->x[3] |= mask & table[i].x[3];
  25476. r->x[4] |= mask & table[i].x[4];
  25477. r->x[5] |= mask & table[i].x[5];
  25478. r->x[6] |= mask & table[i].x[6];
  25479. r->x[7] |= mask & table[i].x[7];
  25480. r->x[8] |= mask & table[i].x[8];
  25481. r->x[9] |= mask & table[i].x[9];
  25482. r->x[10] |= mask & table[i].x[10];
  25483. r->x[11] |= mask & table[i].x[11];
  25484. r->y[0] |= mask & table[i].y[0];
  25485. r->y[1] |= mask & table[i].y[1];
  25486. r->y[2] |= mask & table[i].y[2];
  25487. r->y[3] |= mask & table[i].y[3];
  25488. r->y[4] |= mask & table[i].y[4];
  25489. r->y[5] |= mask & table[i].y[5];
  25490. r->y[6] |= mask & table[i].y[6];
  25491. r->y[7] |= mask & table[i].y[7];
  25492. r->y[8] |= mask & table[i].y[8];
  25493. r->y[9] |= mask & table[i].y[9];
  25494. r->y[10] |= mask & table[i].y[10];
  25495. r->y[11] |= mask & table[i].y[11];
  25496. r->z[0] |= mask & table[i].z[0];
  25497. r->z[1] |= mask & table[i].z[1];
  25498. r->z[2] |= mask & table[i].z[2];
  25499. r->z[3] |= mask & table[i].z[3];
  25500. r->z[4] |= mask & table[i].z[4];
  25501. r->z[5] |= mask & table[i].z[5];
  25502. r->z[6] |= mask & table[i].z[6];
  25503. r->z[7] |= mask & table[i].z[7];
  25504. r->z[8] |= mask & table[i].z[8];
  25505. r->z[9] |= mask & table[i].z[9];
  25506. r->z[10] |= mask & table[i].z[10];
  25507. r->z[11] |= mask & table[i].z[11];
  25508. }
  25509. }
  25510. #endif /* !WC_NO_CACHE_RESISTANT */
/* Multiply the point by the scalar and return the result.
 * If map is true then convert result to affine coordinates.
 *
 * Fast implementation that generates a pre-computation table.
 * 4 bits of window (no sliding!).
 * Uses add and double for calculating table.
 * 384 doubles.
 * 108 adds.
 *
 * The table holds the multiples 0..15 of g; one extra entry (t[16]) is the
 * working point. The scalar is consumed 4 bits at a time starting from the
 * top of k[11].
 *
 * r     Resulting point.
 * g     Point to multiply.
 * k     Scalar to multiply by.
 * map   Indicates whether to convert result to affine.
 * ct    Constant time required.
 * heap  Heap to use for allocation.
 * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
 */
static int sp_384_ecc_mulmod_fast_12(sp_point_384* r, const sp_point_384* g, const sp_digit* k,
        int map, int ct, void* heap)
{
#if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
    sp_point_384* t = NULL;
    sp_digit* tmp = NULL;
#else
    sp_point_384 t[16 + 1];
    sp_digit tmp[2 * 12 * 6];
#endif
    /* Working point; set to the last table slot (t + 16) below. */
    sp_point_384* rt = NULL;
#ifndef WC_NO_CACHE_RESISTANT
    /* Destination for table entries fetched with sp_384_get_point_16_12. */
#if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
    sp_point_384* p = NULL;
#else
    sp_point_384 p[1];
#endif
#endif /* !WC_NO_CACHE_RESISTANT */
    sp_digit n;     /* Scalar bits still to process, left aligned. */
    int i;          /* Index of the next word of k to load. */
    int c;          /* Number of unprocessed bits held in n. */
    int y;          /* Current 4-bit window value (table index). */
    int err = MP_OKAY;

    /* Constant time used for cache attack resistance implementation. */
    (void)ct;
    (void)heap;

#if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
    t = (sp_point_384*)XMALLOC(sizeof(sp_point_384) * (16 + 1),
                                     heap, DYNAMIC_TYPE_ECC);
    if (t == NULL)
        err = MEMORY_E;
#ifndef WC_NO_CACHE_RESISTANT
    if (err == MP_OKAY) {
        p = (sp_point_384*)XMALLOC(sizeof(sp_point_384),
                                         heap, DYNAMIC_TYPE_ECC);
        if (p == NULL)
            err = MEMORY_E;
    }
#endif
    if (err == MP_OKAY) {
        tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 12 * 6, heap,
                                 DYNAMIC_TYPE_ECC);
        if (tmp == NULL)
            err = MEMORY_E;
    }
#endif

    if (err == MP_OKAY) {
        rt = t + 16;

        /* t[0] = {0, 0, 1} * norm */
        XMEMSET(&t[0], 0, sizeof(t[0]));
        t[0].infinity = 1;
        /* t[1] = {g->x, g->y, g->z} * norm */
        (void)sp_384_mod_mul_norm_12(t[1].x, g->x, p384_mod);
        (void)sp_384_mod_mul_norm_12(t[1].y, g->y, p384_mod);
        (void)sp_384_mod_mul_norm_12(t[1].z, g->z, p384_mod);
        t[1].infinity = 0;
        /* Remaining entries: t[2j] = 2*t[j] and t[2j+1] = t[j+1] + t[j]. */
        sp_384_proj_point_dbl_12(&t[ 2], &t[ 1], tmp);
        t[ 2].infinity = 0;
        sp_384_proj_point_add_12(&t[ 3], &t[ 2], &t[ 1], tmp);
        t[ 3].infinity = 0;
        sp_384_proj_point_dbl_12(&t[ 4], &t[ 2], tmp);
        t[ 4].infinity = 0;
        sp_384_proj_point_add_12(&t[ 5], &t[ 3], &t[ 2], tmp);
        t[ 5].infinity = 0;
        sp_384_proj_point_dbl_12(&t[ 6], &t[ 3], tmp);
        t[ 6].infinity = 0;
        sp_384_proj_point_add_12(&t[ 7], &t[ 4], &t[ 3], tmp);
        t[ 7].infinity = 0;
        sp_384_proj_point_dbl_12(&t[ 8], &t[ 4], tmp);
        t[ 8].infinity = 0;
        sp_384_proj_point_add_12(&t[ 9], &t[ 5], &t[ 4], tmp);
        t[ 9].infinity = 0;
        sp_384_proj_point_dbl_12(&t[10], &t[ 5], tmp);
        t[10].infinity = 0;
        sp_384_proj_point_add_12(&t[11], &t[ 6], &t[ 5], tmp);
        t[11].infinity = 0;
        sp_384_proj_point_dbl_12(&t[12], &t[ 6], tmp);
        t[12].infinity = 0;
        sp_384_proj_point_add_12(&t[13], &t[ 7], &t[ 6], tmp);
        t[13].infinity = 0;
        sp_384_proj_point_dbl_12(&t[14], &t[ 7], tmp);
        t[14].infinity = 0;
        sp_384_proj_point_add_12(&t[15], &t[ 8], &t[ 7], tmp);
        t[15].infinity = 0;

        /* First window: the top 4 bits of k[11]; 28 bits of it remain. */
        i = 10;
        n = k[i+1] << 0;
        c = 28;
        y = (int)(n >> 28);
    #ifndef WC_NO_CACHE_RESISTANT
        if (ct) {
            /* Fetch by reading every entry; index 0 is the point at
             * infinity, which get_point leaves as zeros.
             */
            sp_384_get_point_16_12(rt, t, y);
            rt->infinity = !y;
        }
        else
    #endif
        {
            XMEMCPY(rt, &t[y], sizeof(sp_point_384));
        }
        n <<= 4;
        for (; i>=0 || c>=4; ) {
            /* Load the next word of the scalar when n has run out. */
            if (c < 4) {
                n |= k[i--];
                c += 32;
            }
            y = (n >> 28) & 0xf;
            n <<= 4;
            c -= 4;

            /* rt = 16 * rt */
            sp_384_proj_point_dbl_12(rt, rt, tmp);
            sp_384_proj_point_dbl_12(rt, rt, tmp);
            sp_384_proj_point_dbl_12(rt, rt, tmp);
            sp_384_proj_point_dbl_12(rt, rt, tmp);

            /* rt = rt + t[y] */
    #ifndef WC_NO_CACHE_RESISTANT
            if (ct) {
                sp_384_get_point_16_12(p, t, y);
                p->infinity = !y;
                sp_384_proj_point_add_12(rt, rt, p, tmp);
            }
            else
    #endif
            {
                sp_384_proj_point_add_12(rt, rt, &t[y], tmp);
            }
        }

        if (map != 0) {
            sp_384_map_12(r, rt, tmp);
        }
        else {
            XMEMCPY(r, rt, sizeof(sp_point_384));
        }
    }

    /* Zeroize every working buffer before it is released or goes out of
     * scope.
     */
#if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
    if (tmp != NULL)
#endif
    {
        ForceZero(tmp, sizeof(sp_digit) * 2 * 12 * 6);
    #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
        XFREE(tmp, heap, DYNAMIC_TYPE_ECC);
    #endif
    }
#ifndef WC_NO_CACHE_RESISTANT
#if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
    if (p != NULL)
#endif
    {
        ForceZero(p, sizeof(sp_point_384));
    #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
        XFREE(p, heap, DYNAMIC_TYPE_ECC);
    #endif
    }
#endif /* !WC_NO_CACHE_RESISTANT */
#if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
    if (t != NULL)
#endif
    {
        ForceZero(t, sizeof(sp_point_384) * 17);
    #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
        XFREE(t, heap, DYNAMIC_TYPE_ECC);
    #endif
    }

    return err;
}
#ifdef FP_ECC
/* The "lower" variants are the same routines in this implementation. */
#define sp_384_mont_dbl_lower_12 sp_384_mont_dbl_12
#define sp_384_mont_tpl_lower_12 sp_384_mont_tpl_12
/* Double the Montgomery form projective point p a number of times.
 * The point is updated in place.
 *
 * Y is doubled on entry and halved on exit, and W = Z^4 is carried from one
 * doubling to the next.
 *
 * p  Point to double; also receives the result.
 * i  Number of times to double
 * t  Temporary ordinate data; 10*12 words are used.
 */
static void sp_384_proj_point_dbl_n_12(sp_point_384* p, int i,
    sp_digit* t)
{
    sp_digit* w = t;
    sp_digit* a = t + 2*12;
    sp_digit* b = t + 4*12;
    sp_digit* t1 = t + 6*12;
    sp_digit* t2 = t + 8*12;
    sp_digit* x;
    sp_digit* y;
    sp_digit* z;
    /* Loop counter, initialised from i. */
    volatile int n = i;

    x = p->x;
    y = p->y;
    z = p->z;

    /* Y = 2*Y */
    sp_384_mont_dbl_12(y, y, p384_mod);
    /* W = Z^4 */
    sp_384_mont_sqr_12(w, z, p384_mod, p384_mp_mod);
    sp_384_mont_sqr_12(w, w, p384_mod, p384_mp_mod);
    /* Without WOLFSSL_SP_SMALL the loop runs i-1 times and the last doubling
     * is written out after it, without the update of W. With
     * WOLFSSL_SP_SMALL the loop runs i times and skips the update of W on
     * the last pass.
     */
#ifndef WOLFSSL_SP_SMALL
    while (--n > 0)
#else
    while (--n >= 0)
#endif
    {
        /* A = 3*(X^2 - W) */
        sp_384_mont_sqr_12(t1, x, p384_mod, p384_mp_mod);
        sp_384_mont_sub_12(t1, t1, w, p384_mod);
        sp_384_mont_tpl_lower_12(a, t1, p384_mod);
        /* B = X*Y^2 */
        sp_384_mont_sqr_12(t1, y, p384_mod, p384_mp_mod);
        sp_384_mont_mul_12(b, t1, x, p384_mod, p384_mp_mod);
        /* X = A^2 - 2B */
        sp_384_mont_sqr_12(x, a, p384_mod, p384_mp_mod);
        sp_384_mont_dbl_12(t2, b, p384_mod);
        sp_384_mont_sub_12(x, x, t2, p384_mod);
        /* b = 2.(B - X) */
        sp_384_mont_sub_lower_12(t2, b, x, p384_mod);
        sp_384_mont_dbl_lower_12(b, t2, p384_mod);
        /* Z = Z*Y */
        sp_384_mont_mul_12(z, z, y, p384_mod, p384_mp_mod);
        /* t1 = Y^4 */
        sp_384_mont_sqr_12(t1, t1, p384_mod, p384_mp_mod);
#ifdef WOLFSSL_SP_SMALL
        if (n != 0)
#endif
        {
            /* W = W*Y^4 */
            sp_384_mont_mul_12(w, w, t1, p384_mod, p384_mp_mod);
        }
        /* y = 2*A*(B - X) - Y^4 */
        sp_384_mont_mul_12(y, b, a, p384_mod, p384_mp_mod);
        sp_384_mont_sub_12(y, y, t1, p384_mod);
    }
#ifndef WOLFSSL_SP_SMALL
    /* Last doubling: same steps as the loop body minus the update of W. */
    /* A = 3*(X^2 - W) */
    sp_384_mont_sqr_12(t1, x, p384_mod, p384_mp_mod);
    sp_384_mont_sub_12(t1, t1, w, p384_mod);
    sp_384_mont_tpl_lower_12(a, t1, p384_mod);
    /* B = X*Y^2 */
    sp_384_mont_sqr_12(t1, y, p384_mod, p384_mp_mod);
    sp_384_mont_mul_12(b, t1, x, p384_mod, p384_mp_mod);
    /* X = A^2 - 2B */
    sp_384_mont_sqr_12(x, a, p384_mod, p384_mp_mod);
    sp_384_mont_dbl_12(t2, b, p384_mod);
    sp_384_mont_sub_12(x, x, t2, p384_mod);
    /* b = 2.(B - X) */
    sp_384_mont_sub_lower_12(t2, b, x, p384_mod);
    sp_384_mont_dbl_lower_12(b, t2, p384_mod);
    /* Z = Z*Y */
    sp_384_mont_mul_12(z, z, y, p384_mod, p384_mp_mod);
    /* t1 = Y^4 */
    sp_384_mont_sqr_12(t1, t1, p384_mod, p384_mp_mod);
    /* y = 2*A*(B - X) - Y^4 */
    sp_384_mont_mul_12(y, b, a, p384_mod, p384_mp_mod);
    sp_384_mont_sub_12(y, y, t1, p384_mod);
#endif
    /* Y = Y/2 */
    sp_384_div2_12(y, y, p384_mod);
}
  25780. /* Convert the projective point to affine.
  25781. * Ordinates are in Montgomery form.
  25782. *
  25783. * a Point to convert.
  25784. * t Temporary data.
  25785. */
  25786. static void sp_384_proj_to_affine_12(sp_point_384* a, sp_digit* t)
  25787. {
  25788. sp_digit* t1 = t;
  25789. sp_digit* t2 = t + 2 * 12;
  25790. sp_digit* tmp = t + 4 * 12;
  25791. sp_384_mont_inv_12(t1, a->z, tmp);
  25792. sp_384_mont_sqr_12(t2, t1, p384_mod, p384_mp_mod);
  25793. sp_384_mont_mul_12(t1, t2, t1, p384_mod, p384_mp_mod);
  25794. sp_384_mont_mul_12(a->x, a->x, t2, p384_mod, p384_mp_mod);
  25795. sp_384_mont_mul_12(a->y, a->y, t1, p384_mod, p384_mp_mod);
  25796. XMEMCPY(a->z, p384_norm_mod, sizeof(p384_norm_mod));
  25797. }
  25798. #endif /* FP_ECC */
  25799. /* A table entry for pre-computed points. */
  25800. typedef struct sp_table_entry_384 {
  25801. sp_digit x[12];
  25802. sp_digit y[12];
  25803. } sp_table_entry_384;
  25804. #ifdef FP_ECC
  25805. #endif /* FP_ECC */
  25806. /* Add two Montgomery form projective points. The second point has a q value of
  25807. * one.
  25808. * Only the first point can be the same pointer as the result point.
  25809. *
  25810. * r Result of addition.
  25811. * p First point to add.
  25812. * q Second point to add.
  25813. * t Temporary ordinate data.
  25814. */
  25815. static void sp_384_proj_point_add_qz1_12(sp_point_384* r, const sp_point_384* p,
  25816. const sp_point_384* q, sp_digit* t)
  25817. {
  25818. sp_digit* t1 = t;
  25819. sp_digit* t2 = t + 2*12;
  25820. sp_digit* t3 = t + 4*12;
  25821. sp_digit* t4 = t + 6*12;
  25822. sp_digit* t5 = t + 8*12;
  25823. sp_digit* t6 = t + 10*12;
  25824. /* Check double */
  25825. (void)sp_384_sub_12(t1, p384_mod, q->y);
  25826. sp_384_norm_12(t1);
  25827. if ((~p->infinity & ~q->infinity &
  25828. sp_384_cmp_equal_12(p->x, q->x) & sp_384_cmp_equal_12(p->z, q->z) &
  25829. (sp_384_cmp_equal_12(p->y, q->y) | sp_384_cmp_equal_12(p->y, t1))) != 0) {
  25830. sp_384_proj_point_dbl_12(r, p, t);
  25831. }
  25832. else {
  25833. sp_digit maskp;
  25834. sp_digit maskq;
  25835. sp_digit maskt;
  25836. sp_digit* x = t2;
  25837. sp_digit* y = t5;
  25838. sp_digit* z = t6;
  25839. int i;
  25840. /* U2 = X2*Z1^2 */
  25841. sp_384_mont_sqr_12(t2, p->z, p384_mod, p384_mp_mod);
  25842. sp_384_mont_mul_12(t4, t2, p->z, p384_mod, p384_mp_mod);
  25843. sp_384_mont_mul_12(t2, t2, q->x, p384_mod, p384_mp_mod);
  25844. /* S2 = Y2*Z1^3 */
  25845. sp_384_mont_mul_12(t4, t4, q->y, p384_mod, p384_mp_mod);
  25846. /* H = U2 - X1 */
  25847. sp_384_mont_sub_12(t2, t2, p->x, p384_mod);
  25848. /* R = S2 - Y1 */
  25849. sp_384_mont_sub_12(t4, t4, p->y, p384_mod);
  25850. /* Z3 = H*Z1 */
  25851. sp_384_mont_mul_12(z, p->z, t2, p384_mod, p384_mp_mod);
  25852. /* X3 = R^2 - H^3 - 2*X1*H^2 */
  25853. sp_384_mont_sqr_12(t1, t4, p384_mod, p384_mp_mod);
  25854. sp_384_mont_sqr_12(t5, t2, p384_mod, p384_mp_mod);
  25855. sp_384_mont_mul_12(t3, p->x, t5, p384_mod, p384_mp_mod);
  25856. sp_384_mont_mul_12(t5, t5, t2, p384_mod, p384_mp_mod);
  25857. sp_384_mont_sub_12(x, t1, t5, p384_mod);
  25858. sp_384_mont_dbl_12(t1, t3, p384_mod);
  25859. sp_384_mont_sub_12(x, x, t1, p384_mod);
  25860. /* Y3 = R*(X1*H^2 - X3) - Y1*H^3 */
  25861. sp_384_mont_sub_lower_12(t3, t3, x, p384_mod);
  25862. sp_384_mont_mul_12(t3, t3, t4, p384_mod, p384_mp_mod);
  25863. sp_384_mont_mul_12(t5, t5, p->y, p384_mod, p384_mp_mod);
  25864. sp_384_mont_sub_12(y, t3, t5, p384_mod);
  25865. maskp = 0 - (q->infinity & (!p->infinity));
  25866. maskq = 0 - (p->infinity & (!q->infinity));
  25867. maskt = ~(maskp | maskq);
  25868. for (i = 0; i < 12; i++) {
  25869. r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) | (x[i] & maskt);
  25870. }
  25871. for (i = 0; i < 12; i++) {
  25872. r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) | (y[i] & maskt);
  25873. }
  25874. for (i = 0; i < 12; i++) {
  25875. r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) | (z[i] & maskt);
  25876. }
  25877. r->z[0] |= p->infinity & q->infinity;
  25878. r->infinity = p->infinity & q->infinity;
  25879. }
  25880. }
  25881. #ifdef WOLFSSL_SP_SMALL
  25882. #ifdef FP_ECC
  25883. /* Generate the pre-computed table of points for the base point.
  25884. *
  25885. * width = 4
  25886. * 16 entries
  25887. * 96 bits between
  25888. *
  25889. * a The base point.
  25890. * table Place to store generated point data.
  25891. * tmp Temporary data.
  25892. * heap Heap to use for allocation.
  25893. */
  25894. static int sp_384_gen_stripe_table_12(const sp_point_384* a,
  25895. sp_table_entry_384* table, sp_digit* tmp, void* heap)
  25896. {
  25897. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  25898. sp_point_384* t = NULL;
  25899. #else
  25900. sp_point_384 t[3];
  25901. #endif
  25902. sp_point_384* s1 = NULL;
  25903. sp_point_384* s2 = NULL;
  25904. int i;
  25905. int j;
  25906. int err = MP_OKAY;
  25907. (void)heap;
  25908. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  25909. t = (sp_point_384*)XMALLOC(sizeof(sp_point_384) * 3, heap,
  25910. DYNAMIC_TYPE_ECC);
  25911. if (t == NULL)
  25912. err = MEMORY_E;
  25913. #endif
  25914. if (err == MP_OKAY) {
  25915. s1 = t + 1;
  25916. s2 = t + 2;
  25917. err = sp_384_mod_mul_norm_12(t->x, a->x, p384_mod);
  25918. }
  25919. if (err == MP_OKAY) {
  25920. err = sp_384_mod_mul_norm_12(t->y, a->y, p384_mod);
  25921. }
  25922. if (err == MP_OKAY) {
  25923. err = sp_384_mod_mul_norm_12(t->z, a->z, p384_mod);
  25924. }
  25925. if (err == MP_OKAY) {
  25926. t->infinity = 0;
  25927. sp_384_proj_to_affine_12(t, tmp);
  25928. XMEMCPY(s1->z, p384_norm_mod, sizeof(p384_norm_mod));
  25929. s1->infinity = 0;
  25930. XMEMCPY(s2->z, p384_norm_mod, sizeof(p384_norm_mod));
  25931. s2->infinity = 0;
  25932. /* table[0] = {0, 0, infinity} */
  25933. XMEMSET(&table[0], 0, sizeof(sp_table_entry_384));
  25934. /* table[1] = Affine version of 'a' in Montgomery form */
  25935. XMEMCPY(table[1].x, t->x, sizeof(table->x));
  25936. XMEMCPY(table[1].y, t->y, sizeof(table->y));
  25937. for (i=1; i<4; i++) {
  25938. sp_384_proj_point_dbl_n_12(t, 96, tmp);
  25939. sp_384_proj_to_affine_12(t, tmp);
  25940. XMEMCPY(table[1<<i].x, t->x, sizeof(table->x));
  25941. XMEMCPY(table[1<<i].y, t->y, sizeof(table->y));
  25942. }
  25943. for (i=1; i<4; i++) {
  25944. XMEMCPY(s1->x, table[1<<i].x, sizeof(table->x));
  25945. XMEMCPY(s1->y, table[1<<i].y, sizeof(table->y));
  25946. for (j=(1<<i)+1; j<(1<<(i+1)); j++) {
  25947. XMEMCPY(s2->x, table[j-(1<<i)].x, sizeof(table->x));
  25948. XMEMCPY(s2->y, table[j-(1<<i)].y, sizeof(table->y));
  25949. sp_384_proj_point_add_qz1_12(t, s1, s2, tmp);
  25950. sp_384_proj_to_affine_12(t, tmp);
  25951. XMEMCPY(table[j].x, t->x, sizeof(table->x));
  25952. XMEMCPY(table[j].y, t->y, sizeof(table->y));
  25953. }
  25954. }
  25955. }
  25956. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  25957. if (t != NULL)
  25958. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  25959. #endif
  25960. return err;
  25961. }
  25962. #endif /* FP_ECC */
  25963. #ifndef WC_NO_CACHE_RESISTANT
  25964. /* Touch each possible entry that could be being copied.
  25965. *
  25966. * r Point to copy into.
  25967. * table Table - start of the entires to access
  25968. * idx Index of entry to retrieve.
  25969. */
  25970. static void sp_384_get_entry_16_12(sp_point_384* r,
  25971. const sp_table_entry_384* table, int idx)
  25972. {
  25973. int i;
  25974. sp_digit mask;
  25975. r->x[0] = 0;
  25976. r->x[1] = 0;
  25977. r->x[2] = 0;
  25978. r->x[3] = 0;
  25979. r->x[4] = 0;
  25980. r->x[5] = 0;
  25981. r->x[6] = 0;
  25982. r->x[7] = 0;
  25983. r->x[8] = 0;
  25984. r->x[9] = 0;
  25985. r->x[10] = 0;
  25986. r->x[11] = 0;
  25987. r->y[0] = 0;
  25988. r->y[1] = 0;
  25989. r->y[2] = 0;
  25990. r->y[3] = 0;
  25991. r->y[4] = 0;
  25992. r->y[5] = 0;
  25993. r->y[6] = 0;
  25994. r->y[7] = 0;
  25995. r->y[8] = 0;
  25996. r->y[9] = 0;
  25997. r->y[10] = 0;
  25998. r->y[11] = 0;
  25999. for (i = 1; i < 16; i++) {
  26000. mask = 0 - (i == idx);
  26001. r->x[0] |= mask & table[i].x[0];
  26002. r->x[1] |= mask & table[i].x[1];
  26003. r->x[2] |= mask & table[i].x[2];
  26004. r->x[3] |= mask & table[i].x[3];
  26005. r->x[4] |= mask & table[i].x[4];
  26006. r->x[5] |= mask & table[i].x[5];
  26007. r->x[6] |= mask & table[i].x[6];
  26008. r->x[7] |= mask & table[i].x[7];
  26009. r->x[8] |= mask & table[i].x[8];
  26010. r->x[9] |= mask & table[i].x[9];
  26011. r->x[10] |= mask & table[i].x[10];
  26012. r->x[11] |= mask & table[i].x[11];
  26013. r->y[0] |= mask & table[i].y[0];
  26014. r->y[1] |= mask & table[i].y[1];
  26015. r->y[2] |= mask & table[i].y[2];
  26016. r->y[3] |= mask & table[i].y[3];
  26017. r->y[4] |= mask & table[i].y[4];
  26018. r->y[5] |= mask & table[i].y[5];
  26019. r->y[6] |= mask & table[i].y[6];
  26020. r->y[7] |= mask & table[i].y[7];
  26021. r->y[8] |= mask & table[i].y[8];
  26022. r->y[9] |= mask & table[i].y[9];
  26023. r->y[10] |= mask & table[i].y[10];
  26024. r->y[11] |= mask & table[i].y[11];
  26025. }
  26026. }
  26027. #endif /* !WC_NO_CACHE_RESISTANT */
  26028. /* Multiply the point by the scalar and return the result.
  26029. * If map is true then convert result to affine coordinates.
  26030. *
  26031. * Stripe implementation.
  26032. * Pre-generated: 2^0, 2^96, ...
  26033. * Pre-generated: products of all combinations of above.
  26034. * 4 doubles and adds (with qz=1)
  26035. *
  26036. * r Resulting point.
  26037. * k Scalar to multiply by.
  26038. * table Pre-computed table.
  26039. * map Indicates whether to convert result to affine.
  26040. * ct Constant time required.
  26041. * heap Heap to use for allocation.
  26042. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  26043. */
  26044. static int sp_384_ecc_mulmod_stripe_12(sp_point_384* r, const sp_point_384* g,
  26045. const sp_table_entry_384* table, const sp_digit* k, int map,
  26046. int ct, void* heap)
  26047. {
  26048. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26049. sp_point_384* rt = NULL;
  26050. sp_digit* t = NULL;
  26051. #else
  26052. sp_point_384 rt[2];
  26053. sp_digit t[2 * 12 * 6];
  26054. #endif
  26055. sp_point_384* p = NULL;
  26056. int i;
  26057. int j;
  26058. int y;
  26059. int x;
  26060. int err = MP_OKAY;
  26061. (void)g;
  26062. /* Constant time used for cache attack resistance implementation. */
  26063. (void)ct;
  26064. (void)heap;
  26065. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26066. rt = (sp_point_384*)XMALLOC(sizeof(sp_point_384) * 2, heap,
  26067. DYNAMIC_TYPE_ECC);
  26068. if (rt == NULL)
  26069. err = MEMORY_E;
  26070. if (err == MP_OKAY) {
  26071. t = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 12 * 6, heap,
  26072. DYNAMIC_TYPE_ECC);
  26073. if (t == NULL)
  26074. err = MEMORY_E;
  26075. }
  26076. #endif
  26077. if (err == MP_OKAY) {
  26078. p = rt + 1;
  26079. XMEMCPY(p->z, p384_norm_mod, sizeof(p384_norm_mod));
  26080. XMEMCPY(rt->z, p384_norm_mod, sizeof(p384_norm_mod));
  26081. y = 0;
  26082. x = 95;
  26083. for (j=0; j<4; j++) {
  26084. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  26085. x += 96;
  26086. }
  26087. #ifndef WC_NO_CACHE_RESISTANT
  26088. if (ct) {
  26089. sp_384_get_entry_16_12(rt, table, y);
  26090. } else
  26091. #endif
  26092. {
  26093. XMEMCPY(rt->x, table[y].x, sizeof(table[y].x));
  26094. XMEMCPY(rt->y, table[y].y, sizeof(table[y].y));
  26095. }
  26096. rt->infinity = !y;
  26097. for (i=94; i>=0; i--) {
  26098. y = 0;
  26099. x = i;
  26100. for (j=0; j<4; j++) {
  26101. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  26102. x += 96;
  26103. }
  26104. sp_384_proj_point_dbl_12(rt, rt, t);
  26105. #ifndef WC_NO_CACHE_RESISTANT
  26106. if (ct) {
  26107. sp_384_get_entry_16_12(p, table, y);
  26108. }
  26109. else
  26110. #endif
  26111. {
  26112. XMEMCPY(p->x, table[y].x, sizeof(table[y].x));
  26113. XMEMCPY(p->y, table[y].y, sizeof(table[y].y));
  26114. }
  26115. p->infinity = !y;
  26116. sp_384_proj_point_add_qz1_12(rt, rt, p, t);
  26117. }
  26118. if (map != 0) {
  26119. sp_384_map_12(r, rt, t);
  26120. }
  26121. else {
  26122. XMEMCPY(r, rt, sizeof(sp_point_384));
  26123. }
  26124. }
  26125. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26126. if (t != NULL)
  26127. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  26128. if (rt != NULL)
  26129. XFREE(rt, heap, DYNAMIC_TYPE_ECC);
  26130. #endif
  26131. return err;
  26132. }
  26133. #ifdef FP_ECC
  26134. #ifndef FP_ENTRIES
  26135. #define FP_ENTRIES 16
  26136. #endif
  26137. /* Cache entry - holds precomputation tables for a point. */
  26138. typedef struct sp_cache_384_t {
  26139. /* X ordinate of point that table was generated from. */
  26140. sp_digit x[12];
  26141. /* Y ordinate of point that table was generated from. */
  26142. sp_digit y[12];
  26143. /* Precomputation table for point. */
  26144. sp_table_entry_384 table[16];
  26145. /* Count of entries in table. */
  26146. uint32_t cnt;
  26147. /* Point and table set in entry. */
  26148. int set;
  26149. } sp_cache_384_t;
  26150. /* Cache of tables. */
  26151. static THREAD_LS_T sp_cache_384_t sp_cache_384[FP_ENTRIES];
  26152. /* Index of last entry in cache. */
  26153. static THREAD_LS_T int sp_cache_384_last = -1;
  26154. /* Cache has been initialized. */
  26155. static THREAD_LS_T int sp_cache_384_inited = 0;
  26156. #ifndef HAVE_THREAD_LS
  26157. static volatile int initCacheMutex_384 = 0;
  26158. static wolfSSL_Mutex sp_cache_384_lock;
  26159. #endif
  26160. /* Get the cache entry for the point.
  26161. *
  26162. * g [in] Point scalar multipling.
  26163. * cache [out] Cache table to use.
  26164. */
  26165. static void sp_ecc_get_cache_384(const sp_point_384* g, sp_cache_384_t** cache)
  26166. {
  26167. int i;
  26168. int j;
  26169. uint32_t least;
  26170. if (sp_cache_384_inited == 0) {
  26171. for (i=0; i<FP_ENTRIES; i++) {
  26172. sp_cache_384[i].set = 0;
  26173. }
  26174. sp_cache_384_inited = 1;
  26175. }
  26176. /* Compare point with those in cache. */
  26177. for (i=0; i<FP_ENTRIES; i++) {
  26178. if (!sp_cache_384[i].set)
  26179. continue;
  26180. if (sp_384_cmp_equal_12(g->x, sp_cache_384[i].x) &
  26181. sp_384_cmp_equal_12(g->y, sp_cache_384[i].y)) {
  26182. sp_cache_384[i].cnt++;
  26183. break;
  26184. }
  26185. }
  26186. /* No match. */
  26187. if (i == FP_ENTRIES) {
  26188. /* Find empty entry. */
  26189. i = (sp_cache_384_last + 1) % FP_ENTRIES;
  26190. for (; i != sp_cache_384_last; i=(i+1)%FP_ENTRIES) {
  26191. if (!sp_cache_384[i].set) {
  26192. break;
  26193. }
  26194. }
  26195. /* Evict least used. */
  26196. if (i == sp_cache_384_last) {
  26197. least = sp_cache_384[0].cnt;
  26198. for (j=1; j<FP_ENTRIES; j++) {
  26199. if (sp_cache_384[j].cnt < least) {
  26200. i = j;
  26201. least = sp_cache_384[i].cnt;
  26202. }
  26203. }
  26204. }
  26205. XMEMCPY(sp_cache_384[i].x, g->x, sizeof(sp_cache_384[i].x));
  26206. XMEMCPY(sp_cache_384[i].y, g->y, sizeof(sp_cache_384[i].y));
  26207. sp_cache_384[i].set = 1;
  26208. sp_cache_384[i].cnt = 1;
  26209. }
  26210. *cache = &sp_cache_384[i];
  26211. sp_cache_384_last = i;
  26212. }
  26213. #endif /* FP_ECC */
  26214. /* Multiply the base point of P384 by the scalar and return the result.
  26215. * If map is true then convert result to affine coordinates.
  26216. *
  26217. * r Resulting point.
  26218. * g Point to multiply.
  26219. * k Scalar to multiply by.
  26220. * map Indicates whether to convert result to affine.
  26221. * ct Constant time required.
  26222. * heap Heap to use for allocation.
  26223. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  26224. */
  26225. static int sp_384_ecc_mulmod_12(sp_point_384* r, const sp_point_384* g, const sp_digit* k,
  26226. int map, int ct, void* heap)
  26227. {
  26228. #ifndef FP_ECC
  26229. return sp_384_ecc_mulmod_fast_12(r, g, k, map, ct, heap);
  26230. #else
  26231. sp_digit tmp[2 * 12 * 7];
  26232. sp_cache_384_t* cache;
  26233. int err = MP_OKAY;
  26234. #ifndef HAVE_THREAD_LS
  26235. if (initCacheMutex_384 == 0) {
  26236. wc_InitMutex(&sp_cache_384_lock);
  26237. initCacheMutex_384 = 1;
  26238. }
  26239. if (wc_LockMutex(&sp_cache_384_lock) != 0)
  26240. err = BAD_MUTEX_E;
  26241. #endif /* HAVE_THREAD_LS */
  26242. if (err == MP_OKAY) {
  26243. sp_ecc_get_cache_384(g, &cache);
  26244. if (cache->cnt == 2)
  26245. sp_384_gen_stripe_table_12(g, cache->table, tmp, heap);
  26246. #ifndef HAVE_THREAD_LS
  26247. wc_UnLockMutex(&sp_cache_384_lock);
  26248. #endif /* HAVE_THREAD_LS */
  26249. if (cache->cnt < 2) {
  26250. err = sp_384_ecc_mulmod_fast_12(r, g, k, map, ct, heap);
  26251. }
  26252. else {
  26253. err = sp_384_ecc_mulmod_stripe_12(r, g, cache->table, k,
  26254. map, ct, heap);
  26255. }
  26256. }
  26257. return err;
  26258. #endif
  26259. }
  26260. #else
  26261. #ifdef FP_ECC
  26262. /* Generate the pre-computed table of points for the base point.
  26263. *
  26264. * width = 8
  26265. * 256 entries
  26266. * 48 bits between
  26267. *
  26268. * a The base point.
  26269. * table Place to store generated point data.
  26270. * tmp Temporary data.
  26271. * heap Heap to use for allocation.
  26272. */
  26273. static int sp_384_gen_stripe_table_12(const sp_point_384* a,
  26274. sp_table_entry_384* table, sp_digit* tmp, void* heap)
  26275. {
  26276. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26277. sp_point_384* t = NULL;
  26278. #else
  26279. sp_point_384 t[3];
  26280. #endif
  26281. sp_point_384* s1 = NULL;
  26282. sp_point_384* s2 = NULL;
  26283. int i;
  26284. int j;
  26285. int err = MP_OKAY;
  26286. (void)heap;
  26287. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26288. t = (sp_point_384*)XMALLOC(sizeof(sp_point_384) * 3, heap,
  26289. DYNAMIC_TYPE_ECC);
  26290. if (t == NULL)
  26291. err = MEMORY_E;
  26292. #endif
  26293. if (err == MP_OKAY) {
  26294. s1 = t + 1;
  26295. s2 = t + 2;
  26296. err = sp_384_mod_mul_norm_12(t->x, a->x, p384_mod);
  26297. }
  26298. if (err == MP_OKAY) {
  26299. err = sp_384_mod_mul_norm_12(t->y, a->y, p384_mod);
  26300. }
  26301. if (err == MP_OKAY) {
  26302. err = sp_384_mod_mul_norm_12(t->z, a->z, p384_mod);
  26303. }
  26304. if (err == MP_OKAY) {
  26305. t->infinity = 0;
  26306. sp_384_proj_to_affine_12(t, tmp);
  26307. XMEMCPY(s1->z, p384_norm_mod, sizeof(p384_norm_mod));
  26308. s1->infinity = 0;
  26309. XMEMCPY(s2->z, p384_norm_mod, sizeof(p384_norm_mod));
  26310. s2->infinity = 0;
  26311. /* table[0] = {0, 0, infinity} */
  26312. XMEMSET(&table[0], 0, sizeof(sp_table_entry_384));
  26313. /* table[1] = Affine version of 'a' in Montgomery form */
  26314. XMEMCPY(table[1].x, t->x, sizeof(table->x));
  26315. XMEMCPY(table[1].y, t->y, sizeof(table->y));
  26316. for (i=1; i<8; i++) {
  26317. sp_384_proj_point_dbl_n_12(t, 48, tmp);
  26318. sp_384_proj_to_affine_12(t, tmp);
  26319. XMEMCPY(table[1<<i].x, t->x, sizeof(table->x));
  26320. XMEMCPY(table[1<<i].y, t->y, sizeof(table->y));
  26321. }
  26322. for (i=1; i<8; i++) {
  26323. XMEMCPY(s1->x, table[1<<i].x, sizeof(table->x));
  26324. XMEMCPY(s1->y, table[1<<i].y, sizeof(table->y));
  26325. for (j=(1<<i)+1; j<(1<<(i+1)); j++) {
  26326. XMEMCPY(s2->x, table[j-(1<<i)].x, sizeof(table->x));
  26327. XMEMCPY(s2->y, table[j-(1<<i)].y, sizeof(table->y));
  26328. sp_384_proj_point_add_qz1_12(t, s1, s2, tmp);
  26329. sp_384_proj_to_affine_12(t, tmp);
  26330. XMEMCPY(table[j].x, t->x, sizeof(table->x));
  26331. XMEMCPY(table[j].y, t->y, sizeof(table->y));
  26332. }
  26333. }
  26334. }
  26335. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26336. if (t != NULL)
  26337. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  26338. #endif
  26339. return err;
  26340. }
  26341. #endif /* FP_ECC */
  26342. #ifndef WC_NO_CACHE_RESISTANT
  26343. /* Touch each possible entry that could be being copied.
  26344. *
  26345. * r Point to copy into.
  26346. * table Table - start of the entires to access
  26347. * idx Index of entry to retrieve.
  26348. */
  26349. static void sp_384_get_entry_256_12(sp_point_384* r,
  26350. const sp_table_entry_384* table, int idx)
  26351. {
  26352. int i;
  26353. sp_digit mask;
  26354. r->x[0] = 0;
  26355. r->x[1] = 0;
  26356. r->x[2] = 0;
  26357. r->x[3] = 0;
  26358. r->x[4] = 0;
  26359. r->x[5] = 0;
  26360. r->x[6] = 0;
  26361. r->x[7] = 0;
  26362. r->x[8] = 0;
  26363. r->x[9] = 0;
  26364. r->x[10] = 0;
  26365. r->x[11] = 0;
  26366. r->y[0] = 0;
  26367. r->y[1] = 0;
  26368. r->y[2] = 0;
  26369. r->y[3] = 0;
  26370. r->y[4] = 0;
  26371. r->y[5] = 0;
  26372. r->y[6] = 0;
  26373. r->y[7] = 0;
  26374. r->y[8] = 0;
  26375. r->y[9] = 0;
  26376. r->y[10] = 0;
  26377. r->y[11] = 0;
  26378. for (i = 1; i < 256; i++) {
  26379. mask = 0 - (i == idx);
  26380. r->x[0] |= mask & table[i].x[0];
  26381. r->x[1] |= mask & table[i].x[1];
  26382. r->x[2] |= mask & table[i].x[2];
  26383. r->x[3] |= mask & table[i].x[3];
  26384. r->x[4] |= mask & table[i].x[4];
  26385. r->x[5] |= mask & table[i].x[5];
  26386. r->x[6] |= mask & table[i].x[6];
  26387. r->x[7] |= mask & table[i].x[7];
  26388. r->x[8] |= mask & table[i].x[8];
  26389. r->x[9] |= mask & table[i].x[9];
  26390. r->x[10] |= mask & table[i].x[10];
  26391. r->x[11] |= mask & table[i].x[11];
  26392. r->y[0] |= mask & table[i].y[0];
  26393. r->y[1] |= mask & table[i].y[1];
  26394. r->y[2] |= mask & table[i].y[2];
  26395. r->y[3] |= mask & table[i].y[3];
  26396. r->y[4] |= mask & table[i].y[4];
  26397. r->y[5] |= mask & table[i].y[5];
  26398. r->y[6] |= mask & table[i].y[6];
  26399. r->y[7] |= mask & table[i].y[7];
  26400. r->y[8] |= mask & table[i].y[8];
  26401. r->y[9] |= mask & table[i].y[9];
  26402. r->y[10] |= mask & table[i].y[10];
  26403. r->y[11] |= mask & table[i].y[11];
  26404. }
  26405. }
  26406. #endif /* !WC_NO_CACHE_RESISTANT */
  26407. /* Multiply the point by the scalar and return the result.
  26408. * If map is true then convert result to affine coordinates.
  26409. *
  26410. * Stripe implementation.
  26411. * Pre-generated: 2^0, 2^48, ...
  26412. * Pre-generated: products of all combinations of above.
  26413. * 8 doubles and adds (with qz=1)
  26414. *
  26415. * r Resulting point.
  26416. * k Scalar to multiply by.
  26417. * table Pre-computed table.
  26418. * map Indicates whether to convert result to affine.
  26419. * ct Constant time required.
  26420. * heap Heap to use for allocation.
  26421. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  26422. */
  26423. static int sp_384_ecc_mulmod_stripe_12(sp_point_384* r, const sp_point_384* g,
  26424. const sp_table_entry_384* table, const sp_digit* k, int map,
  26425. int ct, void* heap)
  26426. {
  26427. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26428. sp_point_384* rt = NULL;
  26429. sp_digit* t = NULL;
  26430. #else
  26431. sp_point_384 rt[2];
  26432. sp_digit t[2 * 12 * 6];
  26433. #endif
  26434. sp_point_384* p = NULL;
  26435. int i;
  26436. int j;
  26437. int y;
  26438. int x;
  26439. int err = MP_OKAY;
  26440. (void)g;
  26441. /* Constant time used for cache attack resistance implementation. */
  26442. (void)ct;
  26443. (void)heap;
  26444. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26445. rt = (sp_point_384*)XMALLOC(sizeof(sp_point_384) * 2, heap,
  26446. DYNAMIC_TYPE_ECC);
  26447. if (rt == NULL)
  26448. err = MEMORY_E;
  26449. if (err == MP_OKAY) {
  26450. t = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 12 * 6, heap,
  26451. DYNAMIC_TYPE_ECC);
  26452. if (t == NULL)
  26453. err = MEMORY_E;
  26454. }
  26455. #endif
  26456. if (err == MP_OKAY) {
  26457. p = rt + 1;
  26458. XMEMCPY(p->z, p384_norm_mod, sizeof(p384_norm_mod));
  26459. XMEMCPY(rt->z, p384_norm_mod, sizeof(p384_norm_mod));
  26460. y = 0;
  26461. x = 47;
  26462. for (j=0; j<8; j++) {
  26463. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  26464. x += 48;
  26465. }
  26466. #ifndef WC_NO_CACHE_RESISTANT
  26467. if (ct) {
  26468. sp_384_get_entry_256_12(rt, table, y);
  26469. } else
  26470. #endif
  26471. {
  26472. XMEMCPY(rt->x, table[y].x, sizeof(table[y].x));
  26473. XMEMCPY(rt->y, table[y].y, sizeof(table[y].y));
  26474. }
  26475. rt->infinity = !y;
  26476. for (i=46; i>=0; i--) {
  26477. y = 0;
  26478. x = i;
  26479. for (j=0; j<8; j++) {
  26480. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  26481. x += 48;
  26482. }
  26483. sp_384_proj_point_dbl_12(rt, rt, t);
  26484. #ifndef WC_NO_CACHE_RESISTANT
  26485. if (ct) {
  26486. sp_384_get_entry_256_12(p, table, y);
  26487. }
  26488. else
  26489. #endif
  26490. {
  26491. XMEMCPY(p->x, table[y].x, sizeof(table[y].x));
  26492. XMEMCPY(p->y, table[y].y, sizeof(table[y].y));
  26493. }
  26494. p->infinity = !y;
  26495. sp_384_proj_point_add_qz1_12(rt, rt, p, t);
  26496. }
  26497. if (map != 0) {
  26498. sp_384_map_12(r, rt, t);
  26499. }
  26500. else {
  26501. XMEMCPY(r, rt, sizeof(sp_point_384));
  26502. }
  26503. }
  26504. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26505. if (t != NULL)
  26506. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  26507. if (rt != NULL)
  26508. XFREE(rt, heap, DYNAMIC_TYPE_ECC);
  26509. #endif
  26510. return err;
  26511. }
  26512. #ifdef FP_ECC
  26513. #ifndef FP_ENTRIES
  26514. #define FP_ENTRIES 16
  26515. #endif
  26516. /* Cache entry - holds precomputation tables for a point. */
  26517. typedef struct sp_cache_384_t {
  26518. /* X ordinate of point that table was generated from. */
  26519. sp_digit x[12];
  26520. /* Y ordinate of point that table was generated from. */
  26521. sp_digit y[12];
  26522. /* Precomputation table for point. */
  26523. sp_table_entry_384 table[256];
  26524. /* Count of entries in table. */
  26525. uint32_t cnt;
  26526. /* Point and table set in entry. */
  26527. int set;
  26528. } sp_cache_384_t;
  26529. /* Cache of tables. */
  26530. static THREAD_LS_T sp_cache_384_t sp_cache_384[FP_ENTRIES];
  26531. /* Index of last entry in cache. */
  26532. static THREAD_LS_T int sp_cache_384_last = -1;
  26533. /* Cache has been initialized. */
  26534. static THREAD_LS_T int sp_cache_384_inited = 0;
  26535. #ifndef HAVE_THREAD_LS
  26536. static volatile int initCacheMutex_384 = 0;
  26537. static wolfSSL_Mutex sp_cache_384_lock;
  26538. #endif
  26539. /* Get the cache entry for the point.
  26540. *
  26541. * g [in] Point scalar multipling.
  26542. * cache [out] Cache table to use.
  26543. */
  26544. static void sp_ecc_get_cache_384(const sp_point_384* g, sp_cache_384_t** cache)
  26545. {
  26546. int i;
  26547. int j;
  26548. uint32_t least;
  26549. if (sp_cache_384_inited == 0) {
  26550. for (i=0; i<FP_ENTRIES; i++) {
  26551. sp_cache_384[i].set = 0;
  26552. }
  26553. sp_cache_384_inited = 1;
  26554. }
  26555. /* Compare point with those in cache. */
  26556. for (i=0; i<FP_ENTRIES; i++) {
  26557. if (!sp_cache_384[i].set)
  26558. continue;
  26559. if (sp_384_cmp_equal_12(g->x, sp_cache_384[i].x) &
  26560. sp_384_cmp_equal_12(g->y, sp_cache_384[i].y)) {
  26561. sp_cache_384[i].cnt++;
  26562. break;
  26563. }
  26564. }
  26565. /* No match. */
  26566. if (i == FP_ENTRIES) {
  26567. /* Find empty entry. */
  26568. i = (sp_cache_384_last + 1) % FP_ENTRIES;
  26569. for (; i != sp_cache_384_last; i=(i+1)%FP_ENTRIES) {
  26570. if (!sp_cache_384[i].set) {
  26571. break;
  26572. }
  26573. }
  26574. /* Evict least used. */
  26575. if (i == sp_cache_384_last) {
  26576. least = sp_cache_384[0].cnt;
  26577. for (j=1; j<FP_ENTRIES; j++) {
  26578. if (sp_cache_384[j].cnt < least) {
  26579. i = j;
  26580. least = sp_cache_384[i].cnt;
  26581. }
  26582. }
  26583. }
  26584. XMEMCPY(sp_cache_384[i].x, g->x, sizeof(sp_cache_384[i].x));
  26585. XMEMCPY(sp_cache_384[i].y, g->y, sizeof(sp_cache_384[i].y));
  26586. sp_cache_384[i].set = 1;
  26587. sp_cache_384[i].cnt = 1;
  26588. }
  26589. *cache = &sp_cache_384[i];
  26590. sp_cache_384_last = i;
  26591. }
  26592. #endif /* FP_ECC */
  26593. /* Multiply the base point of P384 by the scalar and return the result.
  26594. * If map is true then convert result to affine coordinates.
  26595. *
  26596. * r Resulting point.
  26597. * g Point to multiply.
  26598. * k Scalar to multiply by.
  26599. * map Indicates whether to convert result to affine.
  26600. * ct Constant time required.
  26601. * heap Heap to use for allocation.
  26602. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  26603. */
  26604. static int sp_384_ecc_mulmod_12(sp_point_384* r, const sp_point_384* g, const sp_digit* k,
  26605. int map, int ct, void* heap)
  26606. {
  26607. #ifndef FP_ECC
  26608. return sp_384_ecc_mulmod_fast_12(r, g, k, map, ct, heap);
  26609. #else
  26610. sp_digit tmp[2 * 12 * 7];
  26611. sp_cache_384_t* cache;
  26612. int err = MP_OKAY;
  26613. #ifndef HAVE_THREAD_LS
  26614. if (initCacheMutex_384 == 0) {
  26615. wc_InitMutex(&sp_cache_384_lock);
  26616. initCacheMutex_384 = 1;
  26617. }
  26618. if (wc_LockMutex(&sp_cache_384_lock) != 0)
  26619. err = BAD_MUTEX_E;
  26620. #endif /* HAVE_THREAD_LS */
  26621. if (err == MP_OKAY) {
  26622. sp_ecc_get_cache_384(g, &cache);
  26623. if (cache->cnt == 2)
  26624. sp_384_gen_stripe_table_12(g, cache->table, tmp, heap);
  26625. #ifndef HAVE_THREAD_LS
  26626. wc_UnLockMutex(&sp_cache_384_lock);
  26627. #endif /* HAVE_THREAD_LS */
  26628. if (cache->cnt < 2) {
  26629. err = sp_384_ecc_mulmod_fast_12(r, g, k, map, ct, heap);
  26630. }
  26631. else {
  26632. err = sp_384_ecc_mulmod_stripe_12(r, g, cache->table, k,
  26633. map, ct, heap);
  26634. }
  26635. }
  26636. return err;
  26637. #endif
  26638. }
  26639. #endif /* WOLFSSL_SP_SMALL */
  26640. /* Multiply the point by the scalar and return the result.
  26641. * If map is true then convert result to affine coordinates.
  26642. *
  26643. * km Scalar to multiply by.
  26644. * p Point to multiply.
  26645. * r Resulting point.
  26646. * map Indicates whether to convert result to affine.
  26647. * heap Heap to use for allocation.
  26648. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  26649. */
  26650. int sp_ecc_mulmod_384(const mp_int* km, const ecc_point* gm, ecc_point* r,
  26651. int map, void* heap)
  26652. {
  26653. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26654. sp_point_384* point = NULL;
  26655. sp_digit* k = NULL;
  26656. #else
  26657. sp_point_384 point[1];
  26658. sp_digit k[12];
  26659. #endif
  26660. int err = MP_OKAY;
  26661. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26662. point = (sp_point_384*)XMALLOC(sizeof(sp_point_384), heap,
  26663. DYNAMIC_TYPE_ECC);
  26664. if (point == NULL)
  26665. err = MEMORY_E;
  26666. if (err == MP_OKAY) {
  26667. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 12, heap,
  26668. DYNAMIC_TYPE_ECC);
  26669. if (k == NULL)
  26670. err = MEMORY_E;
  26671. }
  26672. #endif
  26673. if (err == MP_OKAY) {
  26674. sp_384_from_mp(k, 12, km);
  26675. sp_384_point_from_ecc_point_12(point, gm);
  26676. err = sp_384_ecc_mulmod_12(point, point, k, map, 1, heap);
  26677. }
  26678. if (err == MP_OKAY) {
  26679. err = sp_384_point_to_ecc_point_12(point, r);
  26680. }
  26681. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26682. if (k != NULL)
  26683. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  26684. if (point != NULL)
  26685. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  26686. #endif
  26687. return err;
  26688. }
  26689. /* Multiply the point by the scalar, add point a and return the result.
  26690. * If map is true then convert result to affine coordinates.
  26691. *
  26692. * km Scalar to multiply by.
  26693. * p Point to multiply.
  26694. * am Point to add to scalar mulitply result.
  26695. * inMont Point to add is in montgomery form.
  26696. * r Resulting point.
  26697. * map Indicates whether to convert result to affine.
  26698. * heap Heap to use for allocation.
  26699. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  26700. */
  26701. int sp_ecc_mulmod_add_384(const mp_int* km, const ecc_point* gm,
  26702. const ecc_point* am, int inMont, ecc_point* r, int map, void* heap)
  26703. {
  26704. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26705. sp_point_384* point = NULL;
  26706. sp_digit* k = NULL;
  26707. #else
  26708. sp_point_384 point[2];
  26709. sp_digit k[12 + 12 * 2 * 6];
  26710. #endif
  26711. sp_point_384* addP = NULL;
  26712. sp_digit* tmp = NULL;
  26713. int err = MP_OKAY;
  26714. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26715. point = (sp_point_384*)XMALLOC(sizeof(sp_point_384) * 2, heap,
  26716. DYNAMIC_TYPE_ECC);
  26717. if (point == NULL)
  26718. err = MEMORY_E;
  26719. if (err == MP_OKAY) {
  26720. k = (sp_digit*)XMALLOC(
  26721. sizeof(sp_digit) * (12 + 12 * 2 * 6), heap,
  26722. DYNAMIC_TYPE_ECC);
  26723. if (k == NULL)
  26724. err = MEMORY_E;
  26725. }
  26726. #endif
  26727. if (err == MP_OKAY) {
  26728. addP = point + 1;
  26729. tmp = k + 12;
  26730. sp_384_from_mp(k, 12, km);
  26731. sp_384_point_from_ecc_point_12(point, gm);
  26732. sp_384_point_from_ecc_point_12(addP, am);
  26733. }
  26734. if ((err == MP_OKAY) && (!inMont)) {
  26735. err = sp_384_mod_mul_norm_12(addP->x, addP->x, p384_mod);
  26736. }
  26737. if ((err == MP_OKAY) && (!inMont)) {
  26738. err = sp_384_mod_mul_norm_12(addP->y, addP->y, p384_mod);
  26739. }
  26740. if ((err == MP_OKAY) && (!inMont)) {
  26741. err = sp_384_mod_mul_norm_12(addP->z, addP->z, p384_mod);
  26742. }
  26743. if (err == MP_OKAY) {
  26744. err = sp_384_ecc_mulmod_12(point, point, k, 0, 0, heap);
  26745. }
  26746. if (err == MP_OKAY) {
  26747. sp_384_proj_point_add_12(point, point, addP, tmp);
  26748. if (map) {
  26749. sp_384_map_12(point, point, tmp);
  26750. }
  26751. err = sp_384_point_to_ecc_point_12(point, r);
  26752. }
  26753. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  26754. if (k != NULL)
  26755. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  26756. if (point != NULL)
  26757. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  26758. #endif
  26759. return err;
  26760. }
  26761. #ifdef WOLFSSL_SP_SMALL
  26762. /* Striping precomputation table.
  26763. * 4 points combined into a table of 16 points.
  26764. * Distance of 96 between points.
         *
         * This 16-entry variant is the one compiled when WOLFSSL_SP_SMALL is
         * defined. sp_384_ecc_mulmod_base_12() passes it, together with
         * p384_base, to sp_384_ecc_mulmod_stripe_12().
         *
         * Every entry consists of two arrays of 12 words, each word written as a
         * 32-bit hex constant. Entry 0 is all zeros.
         *
         * NOTE(review): the two arrays are presumably the x and y ordinates of
         * the precomputed point, and the entry index presumably encodes which of
         * the 4 base multiples were combined - confirm against the definition of
         * sp_table_entry_384 and the stripe routine.
  26765. */
  26766. static const sp_table_entry_384 p384_table[16] = {
  26767. /* 0 */
  26768. { { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 },
  26769. { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 } },
  26770. /* 1 */
  26771. { { 0x49c0b528,0x3dd07566,0xa0d6ce38,0x20e378e2,0x541b4d6e,0x879c3afc,
  26772. 0x59a30eff,0x64548684,0x614ede2b,0x812ff723,0x299e1513,0x4d3aadc2 },
  26773. { 0x4b03a4fe,0x23043dad,0x7bb4a9ac,0xa1bfa8bf,0x2e83b050,0x8bade756,
  26774. 0x68f4ffd9,0xc6c35219,0x3969a840,0xdd800226,0x5a15c5e9,0x2b78abc2 } },
  26775. /* 2 */
  26776. { { 0xf26feef9,0x24480c57,0x3a0e1240,0xc31a2694,0x273e2bc7,0x735002c3,
  26777. 0x3ef1ed4c,0x8c42e9c5,0x7f4948e8,0x028babf6,0x8a978632,0x6a502f43 },
  26778. { 0xb74536fe,0xf5f13a46,0xd8a9f0eb,0x1d218bab,0x37232768,0x30f36bcc,
  26779. 0x576e8c18,0xc5317b31,0x9bbcb766,0xef1d57a6,0xb3e3d4dc,0x917c4930 } },
  26780. /* 3 */
  26781. { { 0xe349ddd0,0x11426e2e,0x9b2fc250,0x9f117ef9,0xec0174a6,0xff36b480,
  26782. 0x18458466,0x4f4bde76,0x05806049,0x2f2edb6d,0x19dfca92,0x8adc75d1 },
  26783. { 0xb7d5a7ce,0xa619d097,0xa34411e9,0x874275e5,0x0da4b4ef,0x5403e047,
  26784. 0x77901d8f,0x2ebaafd9,0xa747170f,0x5e63ebce,0x7f9d8036,0x12a36944 } },
  26785. /* 4 */
  26786. { { 0x2f9fbe67,0x378205de,0x7f728e44,0xc4afcb83,0x682e00f1,0xdbcec06c,
  26787. 0x114d5423,0xf2a145c3,0x7a52463e,0xa01d9874,0x7d717b0a,0xfc0935b1 },
  26788. { 0xd4d01f95,0x9653bc4f,0x9560ad34,0x9aa83ea8,0xaf8e3f3f,0xf77943dc,
  26789. 0xe86fe16e,0x70774a10,0xbf9ffdcf,0x6b62e6f1,0x588745c9,0x8a72f39e } },
  26790. /* 5 */
  26791. { { 0x2341c342,0x73ade4da,0xea704422,0xdd326e54,0x3741cef3,0x336c7d98,
  26792. 0x59e61549,0x1eafa00d,0xbd9a3efd,0xcd3ed892,0xc5c6c7e4,0x03faf26c },
  26793. { 0x3045f8ac,0x087e2fcf,0x174f1e73,0x14a65532,0xfe0af9a7,0x2cf84f28,
  26794. 0x2cdc935b,0xddfd7a84,0x6929c895,0x4c0f117b,0x4c8bcfcc,0x356572d6 } },
  26795. /* 6 */
  26796. { { 0x3f3b236f,0xfab08607,0x81e221da,0x19e9d41d,0x3927b428,0xf3f6571e,
  26797. 0x7550f1f6,0x4348a933,0xa85e62f0,0x7167b996,0x7f5452bf,0x62d43759 },
  26798. { 0xf2955926,0xd85feb9e,0x6df78353,0x440a561f,0x9ca36b59,0x389668ec,
  26799. 0xa22da016,0x052bf1a1,0xf6093254,0xbdfbff72,0xe22209f3,0x94e50f28 } },
  26800. /* 7 */
  26801. { { 0x3062e8af,0x90b2e5b3,0xe8a3d369,0xa8572375,0x201db7b1,0x3fe1b00b,
  26802. 0xee651aa2,0xe926def0,0xb9b10ad7,0x6542c9be,0xa2fcbe74,0x098e309b },
  26803. { 0xfff1d63f,0x779deeb3,0x20bfd374,0x23d0e80a,0x8768f797,0x8452bb3b,
  26804. 0x1f952856,0xcf75bb4d,0x29ea3faa,0x8fe6b400,0x81373a53,0x12bd3e40 } },
  26805. /* 8 */
  26806. { { 0x16973cf4,0x070d34e1,0x7e4f34f7,0x20aee08b,0x5eb8ad29,0x269af9b9,
  26807. 0xa6a45dda,0xdde0a036,0x63df41e0,0xa18b528e,0xa260df2a,0x03cc71b2 },
  26808. { 0xa06b1dd7,0x24a6770a,0x9d2675d3,0x5bfa9c11,0x96844432,0x73c1e2a1,
  26809. 0x131a6cf0,0x3660558d,0x2ee79454,0xb0289c83,0xc6d8ddcd,0xa6aefb01 } },
  26810. /* 9 */
  26811. { { 0x01ab5245,0xba1464b4,0xc48d93ff,0x9b8d0b6d,0x93ad272c,0x939867dc,
  26812. 0xae9fdc77,0xbebe085e,0x894ea8bd,0x73ae5103,0x39ac22e1,0x740fc89a },
  26813. { 0x28e23b23,0x5e28b0a3,0xe13104d0,0x2352722e,0xb0a2640d,0xf4667a18,
  26814. 0x49bb37c3,0xac74a72e,0xe81e183a,0x79f734f0,0x3fd9c0eb,0xbffe5b6c } },
  26815. /* 10 */
  26816. { { 0x00623f3b,0x03cf2922,0x5f29ebff,0x095c7111,0x80aa6823,0x42d72247,
  26817. 0x7458c0b0,0x044c7ba1,0x0959ec20,0xca62f7ef,0xf8ca929f,0x40ae2ab7 },
  26818. { 0xa927b102,0xb8c5377a,0xdc031771,0x398a86a0,0xc216a406,0x04908f9d,
  26819. 0x918d3300,0xb423a73a,0xe0b94739,0x634b0ff1,0x2d69f697,0xe29de725 } },
  26820. /* 11 */
  26821. { { 0x8435af04,0x744d1400,0xfec192da,0x5f255b1d,0x336dc542,0x1f17dc12,
  26822. 0x636a68a8,0x5c90c2a7,0x7704ca1e,0x960c9eb7,0x6fb3d65a,0x9de8cf1e },
  26823. { 0x511d3d06,0xc60fee0d,0xf9eb52c7,0x466e2313,0x206b0914,0x743c0f5f,
  26824. 0x2191aa4d,0x42f55bac,0xffebdbc2,0xcefc7c8f,0xe6e8ed1c,0xd4fa6081 } },
  26825. /* 12 */
  26826. { { 0x98683186,0x867db639,0xddcc4ea9,0xfb5cf424,0xd4f0e7bd,0xcc9a7ffe,
  26827. 0x7a779f7e,0x7c57f71c,0xd6b25ef2,0x90774079,0xb4081680,0x90eae903 },
  26828. { 0x0ee1fceb,0xdf2aae5e,0xe86c1a1f,0x3ff1da24,0xca193edf,0x80f587d6,
  26829. 0xdc9b9d6a,0xa5695523,0x85920303,0x7b840900,0xba6dbdef,0x1efa4dfc } },
  26830. /* 13 */
  26831. { { 0xe0540015,0xfbd838f9,0xc39077dc,0x2c323946,0xad619124,0x8b1fb9e6,
  26832. 0x0ca62ea8,0x9612440c,0x2dbe00ff,0x9ad9b52c,0xae197643,0xf52abaa1 },
  26833. { 0x2cac32ad,0xd0e89894,0x62a98f91,0xdfb79e42,0x276f55cb,0x65452ecf,
  26834. 0x7ad23e12,0xdb1ac0d2,0xde4986f0,0xf68c5f6a,0x82ce327d,0x389ac37b } },
  26835. /* 14 */
  26836. { { 0xb8a9e8c9,0xcd96866d,0x5bb8091e,0xa11963b8,0x045b3cd2,0xc7f90d53,
  26837. 0x80f36504,0x755a72b5,0x21d3751c,0x46f8b399,0x53c193de,0x4bffdc91 },
  26838. { 0xb89554e7,0xcd15c049,0xf7a26be6,0x353c6754,0xbd41d970,0x79602370,
  26839. 0x12b176c0,0xde16470b,0x40c8809d,0x56ba1175,0xe435fb1e,0xe2db35c3 } },
  26840. /* 15 */
  26841. { { 0x6328e33f,0xd71e4aab,0xaf8136d1,0x5486782b,0x86d57231,0x07a4995f,
  26842. 0x1651a968,0xf1f0a5bd,0x76803b6d,0xa5dc5b24,0x42dda935,0x5c587cbc },
  26843. { 0xbae8b4c0,0x2b6cdb32,0xb1331138,0x66d1598b,0x5d7e9614,0x4a23b2d2,
  26844. 0x74a8c05d,0x93e402a6,0xda7ce82e,0x45ac94e6,0xe463d465,0xeb9f8281 } },
  26845. };
  26846. /* Multiply the base point of P384 by the scalar and return the result.
  26847. * If map is true then convert result to affine coordinates.
  26848. *
  26849. * Stripe implementation.
  26850. * Pre-generated: 2^0, 2^96, ...
  26851. * Pre-generated: products of all combinations of above.
  26852. * 4 doubles and adds (with qz=1)
  26853. *
  26854. * r Resulting point.
  26855. * k Scalar to multiply by.
  26856. * map Indicates whether to convert result to affine.
  26857. * ct Constant time required.
  26858. * heap Heap to use for allocation.
  26859. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  26860. */
  26861. static int sp_384_ecc_mulmod_base_12(sp_point_384* r, const sp_digit* k,
  26862. int map, int ct, void* heap)
  26863. {
  26864. return sp_384_ecc_mulmod_stripe_12(r, &p384_base, p384_table,
  26865. k, map, ct, heap);
  26866. }
  26867. #else
  26868. /* Striping precomputation table.
  26869. * 8 points combined into a table of 256 points.
  26870. * Distance of 48 between points.
  26871. */
  26872. static const sp_table_entry_384 p384_table[256] = {
  26873. /* 0 */
  26874. { { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 },
  26875. { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 } },
  26876. /* 1 */
  26877. { { 0x49c0b528,0x3dd07566,0xa0d6ce38,0x20e378e2,0x541b4d6e,0x879c3afc,
  26878. 0x59a30eff,0x64548684,0x614ede2b,0x812ff723,0x299e1513,0x4d3aadc2 },
  26879. { 0x4b03a4fe,0x23043dad,0x7bb4a9ac,0xa1bfa8bf,0x2e83b050,0x8bade756,
  26880. 0x68f4ffd9,0xc6c35219,0x3969a840,0xdd800226,0x5a15c5e9,0x2b78abc2 } },
  26881. /* 2 */
  26882. { { 0x2b0c535b,0x29864753,0x70506296,0x90dd6953,0x216ab9ac,0x038cd6b4,
  26883. 0xbe12d76a,0x3df9b7b7,0x5f347bdb,0x13f4d978,0x13e94489,0x222c5c9c },
  26884. { 0x2680dc64,0x5f8e796f,0x58352417,0x120e7cb7,0xd10740b8,0x254b5d8a,
  26885. 0x5337dee6,0xc38b8efb,0x94f02247,0xf688c2e1,0x6c25bc4c,0x7b5c75f3 } },
  26886. /* 3 */
  26887. { { 0x9edffea5,0xe26a3cc3,0x37d7e9fc,0x35bbfd1c,0x9bde3ef6,0xf0e7700d,
  26888. 0x1a538f5a,0x0380eb47,0x05bf9eb3,0x2e9da8bb,0x1a460c3e,0xdbb93c73 },
  26889. { 0xf526b605,0x37dba260,0xfd785537,0x95d4978e,0xed72a04a,0x24ed793a,
  26890. 0x76005b1a,0x26948377,0x9e681f82,0x99f557b9,0xd64954ef,0xae5f9557 } },
  26891. /* 4 */
  26892. { { 0xf26feef9,0x24480c57,0x3a0e1240,0xc31a2694,0x273e2bc7,0x735002c3,
  26893. 0x3ef1ed4c,0x8c42e9c5,0x7f4948e8,0x028babf6,0x8a978632,0x6a502f43 },
  26894. { 0xb74536fe,0xf5f13a46,0xd8a9f0eb,0x1d218bab,0x37232768,0x30f36bcc,
  26895. 0x576e8c18,0xc5317b31,0x9bbcb766,0xef1d57a6,0xb3e3d4dc,0x917c4930 } },
  26896. /* 5 */
  26897. { { 0xe349ddd0,0x11426e2e,0x9b2fc250,0x9f117ef9,0xec0174a6,0xff36b480,
  26898. 0x18458466,0x4f4bde76,0x05806049,0x2f2edb6d,0x19dfca92,0x8adc75d1 },
  26899. { 0xb7d5a7ce,0xa619d097,0xa34411e9,0x874275e5,0x0da4b4ef,0x5403e047,
  26900. 0x77901d8f,0x2ebaafd9,0xa747170f,0x5e63ebce,0x7f9d8036,0x12a36944 } },
  26901. /* 6 */
  26902. { { 0x4fc52870,0x28f9c07a,0x1a53a961,0xce0b3748,0x0e1828d9,0xd550fa18,
  26903. 0x6adb225a,0xa24abaf7,0x6e58a348,0xd11ed0a5,0x948acb62,0xf3d811e6 },
  26904. { 0x4c61ed22,0x8618dd77,0x80b47c9d,0x0bb747f9,0xde6b8559,0x22bf796f,
  26905. 0x680a21e9,0xfdfd1c6d,0x2af2c9dd,0xc0db1577,0xc1e90f3d,0xa09379e6 } },
  26906. /* 7 */
  26907. { { 0xe085c629,0x386c66ef,0x095bc89a,0x5fc2a461,0x203f4b41,0x1353d631,
  26908. 0x7e4bd8f5,0x7ca1972b,0xa7df8ce9,0xb077380a,0xee7e4ea3,0xd8a90389 },
  26909. { 0xe7b14461,0x1bc74dc7,0x0c9c4f78,0xdc2cb014,0x84ef0a10,0x52b4b3a6,
  26910. 0x20327fe2,0xbde6ea5d,0x660f9615,0xb71ec435,0xb8ad8173,0xeede5a04 } },
  26911. /* 8 */
  26912. { { 0x893b9a2d,0x5584cbb3,0x00850c5d,0x820c660b,0x7df2d43d,0x4126d826,
  26913. 0x0109e801,0xdd5bbbf0,0x38172f1c,0x85b92ee3,0xf31430d9,0x609d4f93 },
  26914. { 0xeadaf9d6,0x1e059a07,0x0f125fb0,0x70e6536c,0x560f20e7,0xd6220751,
  26915. 0x7aaf3a9a,0xa59489ae,0x64bae14e,0x7b70e2f6,0x76d08249,0x0dd03701 } },
  26916. /* 9 */
  26917. { { 0x8510521f,0x4cc13be8,0xf724cc17,0x87315ba9,0x353dc263,0xb49d83bb,
  26918. 0x0c279257,0x8b677efe,0xc93c9537,0x510a1c1c,0xa4702c99,0x33e30cd8 },
  26919. { 0x2208353f,0xf0ffc89d,0xced42b2b,0x0170fa8d,0x26e2a5f5,0x090851ed,
  26920. 0xecb52c96,0x81276455,0x7fe1adf4,0x0646c4e1,0xb0868eab,0x513f047e } },
  26921. /* 10 */
  26922. { { 0xdf5bdf53,0xc07611f4,0x58b11a6d,0x45d331a7,0x1c4ee394,0x58965daf,
  26923. 0x5a5878d1,0xba8bebe7,0x82dd3025,0xaecc0a18,0xa923eb8b,0xcf2a3899 },
  26924. { 0xd24fd048,0xf98c9281,0x8bbb025d,0x841bfb59,0xc9ab9d53,0xb8ddf8ce,
  26925. 0x7fef044e,0x538a4cb6,0x23236662,0x092ac21f,0x0b66f065,0xa919d385 } },
  26926. /* 11 */
  26927. { { 0x85d480d8,0x3db03b40,0x1b287a7d,0x8cd9f479,0x4a8f3bae,0x8f24dc75,
  26928. 0x3db41892,0x482eb800,0x9c56e0f5,0x38bf9eb3,0x9a91dc6f,0x8b977320 },
  26929. { 0x7209cfc2,0xa31b05b2,0x05b2db70,0x4c49bf85,0xd619527b,0x56462498,
  26930. 0x1fac51ba,0x3fe51039,0xab4b8342,0xfb04f55e,0x04c6eabf,0xc07c10dc } },
  26931. /* 12 */
  26932. { { 0xdb32f048,0xad22fe4c,0x475ed6df,0x5f23bf91,0xaa66b6cb,0xa50ce0c0,
  26933. 0xf03405c0,0xdf627a89,0xf95e2d6a,0x3674837d,0xba42e64e,0x081c95b6 },
  26934. { 0xe71d6ceb,0xeba3e036,0x6c6b0271,0xb45bcccf,0x0684701d,0x67b47e63,
  26935. 0xe712523f,0x60f8f942,0x5cd47adc,0x82423472,0x87649cbb,0x83027d79 } },
  26936. /* 13 */
  26937. { { 0x3615b0b8,0xb3929ea6,0xa54dac41,0xb41441fd,0xb5b6a368,0x8995d556,
  26938. 0x167ef05e,0xa80d4529,0x6d25a27f,0xf6bcb4a1,0x7bd55b68,0x210d6a4c },
  26939. { 0x25351130,0xf3804abb,0x903e37eb,0x1d2df699,0x084c25c8,0x5f201efc,
  26940. 0xa1c68e91,0x31a28c87,0x563f62a5,0x81dad253,0xd6c415d4,0x5dd6de70 } },
  26941. /* 14 */
  26942. { { 0x846612ce,0x29f470fd,0xda18d997,0x986f3eec,0x2f34af86,0x6b84c161,
  26943. 0x46ddaf8b,0x5ef0a408,0xe49e795f,0x14405a00,0xaa2f7a37,0x5f491b16 },
  26944. { 0xdb41b38d,0xc7f07ae4,0x18fbfcaa,0xef7d119e,0x14443b19,0x3a18e076,
  26945. 0x79a19926,0x4356841a,0xe2226fbe,0x91f4a91c,0x3cc88721,0xdc77248c } },
  26946. /* 15 */
  26947. { { 0xe4b1ec9d,0xd570ff1a,0xe7eef706,0x21d23e0e,0xca19e086,0x3cde40f4,
  26948. 0xcd4bb270,0x7d6523c4,0xbf13aa6c,0x16c1f06c,0xd14c4b60,0x5aa7245a },
  26949. { 0x44b74de8,0x37f81467,0x620a934e,0x839e7a17,0xde8b1aa1,0xf74d14e8,
  26950. 0xf30d75e2,0x8789fa51,0xc81c261e,0x09b24052,0x33c565ee,0x654e2678 } },
  26951. /* 16 */
  26952. { { 0x2f9fbe67,0x378205de,0x7f728e44,0xc4afcb83,0x682e00f1,0xdbcec06c,
  26953. 0x114d5423,0xf2a145c3,0x7a52463e,0xa01d9874,0x7d717b0a,0xfc0935b1 },
  26954. { 0xd4d01f95,0x9653bc4f,0x9560ad34,0x9aa83ea8,0xaf8e3f3f,0xf77943dc,
  26955. 0xe86fe16e,0x70774a10,0xbf9ffdcf,0x6b62e6f1,0x588745c9,0x8a72f39e } },
  26956. /* 17 */
  26957. { { 0x2341c342,0x73ade4da,0xea704422,0xdd326e54,0x3741cef3,0x336c7d98,
  26958. 0x59e61549,0x1eafa00d,0xbd9a3efd,0xcd3ed892,0xc5c6c7e4,0x03faf26c },
  26959. { 0x3045f8ac,0x087e2fcf,0x174f1e73,0x14a65532,0xfe0af9a7,0x2cf84f28,
  26960. 0x2cdc935b,0xddfd7a84,0x6929c895,0x4c0f117b,0x4c8bcfcc,0x356572d6 } },
  26961. /* 18 */
  26962. { { 0x7d8c1bba,0x7ecbac01,0x90b0f3d5,0x6058f9c3,0xf6197d0f,0xaee116e3,
  26963. 0x4033b128,0xc4dd7068,0xc209b983,0xf084dba6,0x831dbc4a,0x97c7c2cf },
  26964. { 0xf96010e8,0x2f4e61dd,0x529faa17,0xd97e4e20,0x69d37f20,0x4ee66660,
  26965. 0x3d366d72,0xccc139ed,0x13488e0f,0x690b6ee2,0xf3a6d533,0x7cad1dc5 } },
  26966. /* 19 */
  26967. { { 0xda57a41f,0x660a9a81,0xec0039b6,0xe74a0412,0x5e1dad15,0x42343c6b,
  26968. 0x46681d4c,0x284f3ff5,0x63749e89,0xb51087f1,0x6f9f2f13,0x070f23cc },
  26969. { 0x5d186e14,0x542211da,0xfddb0dff,0x84748f37,0xdb1f4180,0x41a3aab4,
  26970. 0xa6402d0e,0x25ed667b,0x02f58355,0x2f2924a9,0xfa44a689,0x5844ee7c } },
  26971. /* 20 */
  26972. { { 0x3f3b236f,0xfab08607,0x81e221da,0x19e9d41d,0x3927b428,0xf3f6571e,
  26973. 0x7550f1f6,0x4348a933,0xa85e62f0,0x7167b996,0x7f5452bf,0x62d43759 },
  26974. { 0xf2955926,0xd85feb9e,0x6df78353,0x440a561f,0x9ca36b59,0x389668ec,
  26975. 0xa22da016,0x052bf1a1,0xf6093254,0xbdfbff72,0xe22209f3,0x94e50f28 } },
  26976. /* 21 */
  26977. { { 0x3062e8af,0x90b2e5b3,0xe8a3d369,0xa8572375,0x201db7b1,0x3fe1b00b,
  26978. 0xee651aa2,0xe926def0,0xb9b10ad7,0x6542c9be,0xa2fcbe74,0x098e309b },
  26979. { 0xfff1d63f,0x779deeb3,0x20bfd374,0x23d0e80a,0x8768f797,0x8452bb3b,
  26980. 0x1f952856,0xcf75bb4d,0x29ea3faa,0x8fe6b400,0x81373a53,0x12bd3e40 } },
  26981. /* 22 */
  26982. { { 0x104cbba5,0xc023780d,0xfa35dd4c,0x6207e747,0x1ca9b6a3,0x35c23928,
  26983. 0x97987b10,0x4ff19be8,0x8022eee8,0xb8476bbf,0xd3bbe74d,0xaa0a4a14 },
  26984. { 0x187d4543,0x20f94331,0x79f6e066,0x32153870,0xac7e82e1,0x83b0f74e,
  26985. 0x828f06ab,0xa7748ba2,0xc26ef35f,0xc5f0298a,0x8e9a7dbd,0x0f0c5070 } },
  26986. /* 23 */
  26987. { { 0xdef029dd,0x0c5c244c,0x850661b8,0x3dabc687,0xfe11d981,0x9992b865,
  26988. 0x6274dbad,0xe9801b8f,0x098da242,0xe54e6319,0x91a53d08,0x9929a91a },
  26989. { 0x35285887,0x37bffd72,0xf1418102,0xbc759425,0xfd2e6e20,0x9280cc35,
  26990. 0xfbc42ee5,0x735c600c,0x8837619a,0xb7ad2864,0xa778c57b,0xa3627231 } },
  26991. /* 24 */
  26992. { { 0x91361ed8,0xae799b5c,0x6c63366c,0x47d71b75,0x1b265a6a,0x54cdd521,
  26993. 0x98d77b74,0xe0215a59,0xbab29db0,0x4424d9b7,0x7fd9e536,0x8b0ffacc },
  26994. { 0x37b5d9ef,0x46d85d12,0xbfa91747,0x5b106d62,0x5f99ba2d,0xed0479f8,
  26995. 0x1d104de4,0x0e6f3923,0x25e8983f,0x83a84c84,0xf8105a70,0xa9507e0a } },
  26996. /* 25 */
  26997. { { 0x14cf381c,0xf6c68a6e,0xc22e31cc,0xaf9d27bd,0xaa8a5ccb,0x23568d4d,
  26998. 0xe338e4d2,0xe431eec0,0x8f52ad1f,0xf1a828fe,0xe86acd80,0xdb6a0579 },
  26999. { 0x4507832a,0x2885672e,0x887e5289,0x73fc275f,0x05610d08,0x65f80278,
  27000. 0x075ff5b0,0x8d9b4554,0x09f712b5,0x3a8e8fb1,0x2ebe9cf2,0x39f0ac86 } },
  27001. /* 26 */
  27002. { { 0x4c52edf5,0xd8fabf78,0xa589ae53,0xdcd737e5,0xd791ab17,0x94918bf0,
  27003. 0xbcff06c9,0xb5fbd956,0xdca46d45,0xf6d3032e,0x41a3e486,0x2cdff7e1 },
  27004. { 0x61f47ec8,0x6674b3ba,0xeef84608,0x8a882163,0x4c687f90,0xa257c705,
  27005. 0xf6cdf227,0xe30cb2ed,0x7f6ea846,0x2c4c64ca,0xcc6bcd3c,0x186fa17c } },
  27006. /* 27 */
  27007. { { 0x1dfcb91e,0x48a3f536,0x646d358a,0x83595e13,0x91128798,0xbd15827b,
  27008. 0x2187757a,0x3ce612b8,0x61bd7372,0x873150a1,0xb662f568,0xf4684530 },
  27009. { 0x401896f6,0x8833950b,0x77f3e090,0xe11cb89a,0x48e7f4a5,0xb2f12cac,
  27010. 0xf606677e,0x313dd769,0x16579f93,0xfdcf08b3,0x46b8f22b,0x6429cec9 } },
  27011. /* 28 */
  27012. { { 0xbb75f9a4,0x4984dd54,0x29d3b570,0x4aef06b9,0x3d6e4c1e,0xb5f84ca2,
  27013. 0xb083ef35,0x24c61c11,0x392ca9ff,0xce4a7392,0x6730a800,0x865d6517 },
  27014. { 0x722b4a2b,0xca3dfe76,0x7b083e0e,0x12c04bf9,0x1b86b8a5,0x803ce5b5,
  27015. 0x6a7e3e0c,0x3fc7632d,0xc81adbe4,0xc89970c2,0x120e16b1,0x3cbcd3ad } },
  27016. /* 29 */
  27017. { { 0xec30ce93,0xfbfb4cc7,0xb72720a2,0x10ed6c7d,0x47b55500,0xec675bf7,
  27018. 0x333ff7c3,0x90725903,0x5075bfc0,0xc7c3973e,0x07acf31b,0xb049ecb0 },
  27019. { 0x4f58839c,0xb4076eaf,0xa2b05e4f,0x101896da,0xab40c66e,0x3f6033b0,
  27020. 0xc8d864ba,0x19ee9eeb,0x47bf6d2a,0xeb6cf155,0xf826477d,0x8e5a9663 } },
  27021. /* 30 */
  27022. { { 0xf7fbd5e1,0x69e62fdd,0x76912b1d,0x38ecfe54,0xd1da3bfb,0x845a3d56,
  27023. 0x1c86f0d4,0x0494950e,0x3bc36ce8,0x83cadbf9,0x4fccc8d1,0x41fce572 },
  27024. { 0x8332c144,0x05f939c2,0x0871e46e,0xb17f248b,0x66e8aff6,0x3d8534e2,
  27025. 0x3b85c629,0x1d06f1dc,0xa3131b73,0xdb06a32e,0x8b3f64e5,0xf295184d } },
  27026. /* 31 */
  27027. { { 0x36ddc103,0xd9653ff7,0x95ef606f,0x25f43e37,0xfe06dce8,0x09e301fc,
  27028. 0x30b6eebf,0x85af2341,0x0ff56b20,0x79b12b53,0xfe9a3c6b,0x9b4fb499 },
  27029. { 0x51d27ac2,0x0154f892,0x56ca5389,0xd33167e3,0xafc065a6,0x7828ec1f,
  27030. 0x7f746c9b,0x0959a258,0x0c44f837,0xb18f1be3,0xc4132fdb,0xa7946117 } },
  27031. /* 32 */
  27032. { { 0x5e3c647b,0xc0426b77,0x8cf05348,0xbfcbd939,0x172c0d3d,0x31d312e3,
  27033. 0xee754737,0x5f49fde6,0x6da7ee61,0x895530f0,0xe8b3a5fb,0xcf281b0a },
  27034. { 0x41b8a543,0xfd149735,0x3080dd30,0x41a625a7,0x653908cf,0xe2baae07,
  27035. 0xba02a278,0xc3d01436,0x7b21b8f8,0xa0d0222e,0xd7ec1297,0xfdc270e9 } },
  27036. /* 33 */
  27037. { { 0xbc7f41d6,0x00873c0c,0x1b7ad641,0xd976113e,0x238443fb,0x2a536ff4,
  27038. 0x41e62e45,0x030d00e2,0x5f545fc6,0x532e9867,0x8e91208c,0xcd033108 },
  27039. { 0x9797612c,0xd1a04c99,0xeea674e2,0xd4393e02,0xe19742a1,0xd56fa69e,
  27040. 0x85f0590e,0xdd2ab480,0x48a2243d,0xa5cefc52,0x54383f41,0x48cc67b6 } },
  27041. /* 34 */
  27042. { { 0xfc14ab48,0x4e50430e,0x26706a74,0x195b7f4f,0xcc881ff6,0x2fe8a228,
  27043. 0xd945013d,0xb1b968e2,0x4b92162b,0x936aa579,0x364e754a,0x4fb766b7 },
  27044. { 0x31e1ff7f,0x13f93bca,0xce4f2691,0x696eb5ca,0xa2b09e02,0xff754bf8,
  27045. 0xe58e3ff8,0x58f13c9c,0x1678c0b0,0xb757346f,0xa86692b3,0xd54200db } },
  27046. /* 35 */
  27047. { { 0x6dda1265,0x9a030bbd,0xe89718dd,0xf7b4f3fc,0x936065b8,0xa6a4931f,
  27048. 0x5f72241c,0xbce72d87,0x65775857,0x6cbb51cb,0x4e993675,0xc7161815 },
  27049. { 0x2ee32189,0xe81a0f79,0x277dc0b2,0xef2fab26,0xb71f469f,0x9e64f6fe,
  27050. 0xdfdaf859,0xb448ce33,0xbe6b5df1,0x3f5c1c4c,0x1de45f7b,0xfb8dfb00 } },
  27051. /* 36 */
  27052. { { 0x4d5bb921,0xc7345fa7,0x4d2b667e,0x5c7e04be,0x282d7a3e,0x47ed3a80,
  27053. 0x7e47b2a4,0x5c2777f8,0x08488e2e,0x89b3b100,0xb2eb5b45,0x9aad77c2 },
  27054. { 0xdaac34ae,0xd681bca7,0x26afb326,0x2452e4e5,0x41a1ee14,0x0c887924,
  27055. 0xc2407ade,0x743b04d4,0xfc17a2ac,0xcb5e999b,0x4a701a06,0x4dca2f82 } },
  27056. /* 37 */
  27057. { { 0x1127bc1a,0x68e31ca6,0x17ead3be,0xa3edd59b,0xe25f5a15,0x67b6b645,
  27058. 0xa420e15e,0x76221794,0x4b1e872e,0x794fd83b,0xb2dece1b,0x7cab3f03 },
  27059. { 0xca9b3586,0x7119bf15,0x4d250bd7,0xa5545924,0xcc6bcf24,0x173633ea,
  27060. 0xb1b6f884,0x9bd308c2,0x447d38c3,0x3bae06f5,0xf341fe1c,0x54dcc135 } },
  27061. /* 38 */
  27062. { { 0x943caf0d,0x56d3598d,0x225ff133,0xce044ea9,0x563fadea,0x9edf6a7c,
  27063. 0x73e8dc27,0x632eb944,0x3190dcab,0x814b467e,0x6dbb1e31,0x2d4f4f31 },
  27064. { 0xa143b7ca,0x8d69811c,0xde7cf950,0x4ec1ac32,0x37b5fe82,0x223ab5fd,
  27065. 0x9390f1d9,0xe82616e4,0x75804610,0xabff4b20,0x875b08f0,0x11b9be15 } },
  27066. /* 39 */
  27067. { { 0x3bbe682c,0x4ae31a3d,0x74eef2dd,0xbc7c5d26,0x3c47dd40,0x92afd10a,
  27068. 0xc14ab9e1,0xec7e0a3b,0xb2e495e4,0x6a6c3dd1,0x309bcd85,0x085ee5e9 },
  27069. { 0x8c2e67fd,0xf381a908,0xe261eaf2,0x32083a80,0x96deee15,0x0fcd6a49,
  27070. 0x5e524c79,0xe3b8fb03,0x1d5b08b9,0x8dc360d9,0x7f26719f,0x3a06e2c8 } },
  27071. /* 40 */
  27072. { { 0x7237cac0,0x5cd9f5a8,0x43586794,0x93f0b59d,0xe94f6c4e,0x4384a764,
  27073. 0xb62782d3,0x8304ed2b,0xcde06015,0x0b8db8b3,0x5dbe190f,0x4336dd53 },
  27074. { 0x92ab473a,0x57443553,0xbe5ed046,0x031c7275,0x21909aa4,0x3e78678c,
  27075. 0x99202ddb,0x4ab7e04f,0x6977e635,0x2648d206,0x093198be,0xd427d184 } },
  27076. /* 41 */
  27077. { { 0x0f9b5a31,0x822848f5,0xbaadb62a,0xbb003468,0x3357559c,0x233a0472,
  27078. 0x79aee843,0x49ef6880,0xaeb9e1e3,0xa89867a0,0x1f6f9a55,0xc151931b },
  27079. { 0xad74251e,0xd264eb0b,0x4abf295e,0x37b9b263,0x04960d10,0xb600921b,
  27080. 0x4da77dc0,0x0de53dbc,0xd2b18697,0x01d9bab3,0xf7156ddf,0xad54ec7a } },
  27081. /* 42 */
  27082. { { 0x79efdc58,0x8e74dc35,0x4ff68ddb,0x456bd369,0xd32096a5,0x724e74cc,
  27083. 0x386783d0,0xe41cff42,0x7c70d8a4,0xa04c7f21,0xe61a19a2,0x41199d2f },
  27084. { 0x29c05dd2,0xd389a3e0,0xe7e3fda9,0x535f2a6b,0x7c2b4df8,0x26ecf72d,
  27085. 0xfe745294,0x678275f4,0x9d23f519,0x6319c9cc,0x88048fc4,0x1e05a02d } },
  27086. /* 43 */
  27087. { { 0xd4d5ffe8,0x75cc8e2e,0xdbea17f2,0xf8bb4896,0xcee3cb4a,0x35059790,
  27088. 0xa47c6165,0x4c06ee85,0x92935d2f,0xf98fff25,0x32ffd7c7,0x34c4a572 },
  27089. { 0xea0376a2,0xc4b14806,0x4f115e02,0x2ea5e750,0x1e55d7c0,0x532d76e2,
  27090. 0xf31044da,0x68dc9411,0x71b77993,0x9272e465,0x93a8cfd5,0xadaa38bb } },
  27091. /* 44 */
  27092. { { 0x7d4ed72a,0x4bf0c712,0xba1f79a3,0xda0e9264,0xf4c39ea4,0x48c0258b,
  27093. 0x2a715138,0xa5394ed8,0xbf06c660,0x4af511ce,0xec5c37cd,0xfcebceef },
  27094. { 0x779ae8c1,0xf23b75aa,0xad1e606e,0xdeff59cc,0x22755c82,0xf3f526fd,
  27095. 0xbb32cefd,0x64c5ab44,0x915bdefd,0xa96e11a2,0x1143813e,0xab19746a } },
  27096. /* 45 */
  27097. { { 0xec837d7d,0x43c78585,0xb8ee0ba4,0xca5b6fbc,0xd5dbb5ee,0x34e924d9,
  27098. 0xbb4f1ca5,0x3f4fa104,0x398640f7,0x15458b72,0xd7f407ea,0x4231faa9 },
  27099. { 0xf96e6896,0x53e0661e,0xd03b0f9d,0x554e4c69,0x9c7858d1,0xd4fcb07b,
  27100. 0x52cb04fa,0x7e952793,0x8974e7f7,0x5f5f1574,0x6b6d57c8,0x2e3fa558 } },
  27101. /* 46 */
  27102. { { 0x6a9951a8,0x42cd4803,0x42792ad0,0xa8b15b88,0xabb29a73,0x18e8bcf9,
  27103. 0x409933e8,0xbfd9a092,0xefb88dc4,0x760a3594,0x40724458,0x14418863 },
  27104. { 0x99caedc7,0x162a56ee,0x91d101c9,0x8fb12ecd,0x393202da,0xea671967,
  27105. 0xa4ccd796,0x1aac8c4a,0x1cf185a8,0x7db05036,0x8cfd095a,0x0c9f86cd } },
  27106. /* 47 */
  27107. { { 0x10b2a556,0x9a728147,0x327b70b2,0x767ca964,0x5e3799b7,0x04ed9e12,
  27108. 0x22a3eb2a,0x6781d2dc,0x0d9450ac,0x5bd116eb,0xa7ebe08a,0xeccac1fc },
  27109. { 0xdc2d6e94,0xde68444f,0x35ecf21b,0x3621f429,0x29e03a2c,0x14e2d543,
  27110. 0x7d3e7f0a,0x53e42cd5,0x73ed00b9,0xbba26c09,0xc57d2272,0x00297c39 } },
  27111. /* 48 */
  27112. { { 0xb8243a7d,0x3aaaab10,0x8fa58c5b,0x6eeef93e,0x9ae7f764,0xf866fca3,
  27113. 0x61ab04d3,0x64105a26,0x03945d66,0xa3578d8a,0x791b848c,0xb08cd3e4 },
  27114. { 0x756d2411,0x45edc5f8,0xa755128c,0xd4a790d9,0x49e5f6a0,0xc2cf0963,
  27115. 0xf649beaa,0xc66d267d,0x8467039e,0x3ce6d968,0x42f7816f,0x50046c6b } },
  27116. /* 49 */
  27117. { { 0x66425043,0x92ae1602,0xf08db890,0x1ff66afd,0x8f162ce5,0x386f5a7f,
  27118. 0xfcf5598f,0x18d2dea0,0x1a8ca18e,0x78372b3a,0x8cd0e6f7,0xdf0d20eb },
  27119. { 0x75bb4045,0x7edd5e1d,0xb96d94b7,0x252a47ce,0x2c626776,0xbdb29358,
  27120. 0x40dd1031,0x853c3943,0x7d5f47fd,0x9dc9becf,0xbae4044a,0x27c2302f } },
  27121. /* 50 */
  27122. { { 0x8f2d49ce,0x2d1d208a,0x162df0a2,0x0d91aa02,0x09a07f65,0x9c5cce87,
  27123. 0x84339012,0xdf07238b,0x419442cd,0x5028e2c8,0x72062aba,0x2dcbd358 },
  27124. { 0xe4680967,0xb5fbc3cb,0x9f92d72c,0x2a7bc645,0x116c369d,0x806c76e1,
  27125. 0x3177e8d8,0x5c50677a,0x4569df57,0x753739eb,0x36c3f40b,0x2d481ef6 } },
  27126. /* 51 */
  27127. { { 0xfea1103e,0x1a2d39fd,0x95f81b17,0xeaae5592,0xf59b264a,0xdbd0aa18,
  27128. 0xcb592ee0,0x90c39c1a,0x9750cca3,0xdf62f80d,0xdf97cc6c,0xda4d8283 },
  27129. { 0x1e201067,0x0a6dd346,0x69fb1f6b,0x1531f859,0x1d60121f,0x4895e552,
  27130. 0x4c041c91,0x0b21aab0,0xbcc1ccf8,0x9d896c46,0x3141bde7,0xd24da3b3 } },
  27131. /* 52 */
  27132. { { 0x53b0a354,0x575a0537,0x0c6ddcd8,0x392ff2f4,0x56157b94,0x0b8e8cff,
  27133. 0x3b1b80d1,0x073e57bd,0x3fedee15,0x2a75e0f0,0xaa8e6f19,0x752380e4 },
  27134. { 0x6558ffe9,0x1f4e227c,0x19ec5415,0x3a348618,0xf7997085,0xab382d5e,
  27135. 0xddc46ac2,0x5e6deaff,0xfc8d094c,0xe5144078,0xf60e37c6,0xf674fe51 } },
  27136. /* 53 */
  27137. { { 0xaf63408f,0x6fb87ae5,0xcd75a737,0xa39c36a9,0xcf4c618d,0x7833313f,
  27138. 0xf034c88d,0xfbcd4482,0x39b35288,0x4469a761,0x66b5d9c9,0x77a711c5 },
  27139. { 0x944f8d65,0x4a695dc7,0x161aaba8,0xe6da5f65,0x24601669,0x8654e9c3,
  27140. 0x28ae7491,0xbc8b93f5,0x8f5580d8,0x5f1d1e83,0xcea32cc8,0x8ccf9a1a } },
  27141. /* 54 */
  27142. { { 0x7196fee2,0x28ab110c,0x874c8945,0x75799d63,0x29aedadd,0xa2629348,
  27143. 0x2be88ff4,0x9714cc7b,0xd58d60d6,0xf71293cf,0x32a564e9,0xda6b6cb3 },
  27144. { 0x3dd821c2,0xf43fddb1,0x90dd323d,0xf2f2785f,0x048489f8,0x91246419,
  27145. 0xd24c6749,0x61660f26,0xc803c15c,0x961d9e8c,0xfaadc4c9,0x631c6158 } },
  27146. /* 55 */
  27147. { { 0xfd752366,0xacf2ebe0,0x139be88b,0xb93c340e,0x0f20179e,0x98f66485,
  27148. 0xff1da785,0x14820254,0x4f85c16e,0x5278e276,0x7aab1913,0xa246ee45 },
  27149. { 0x53763b33,0x43861eb4,0x45c0bc0d,0xc49f03fc,0xad6b1ea1,0xafff16bc,
  27150. 0x6fd49c99,0xce33908b,0xf7fde8c3,0x5c51e9bf,0xff142c5e,0x076a7a39 } },
  27151. /* 56 */
  27152. { { 0x9e338d10,0x04639dfe,0xf42b411b,0x8ee6996f,0xa875cef2,0x960461d1,
  27153. 0x95b4d0ba,0x1057b6d6,0xa906e0bc,0x27639252,0xe1c20f8a,0x2c19f09a },
  27154. { 0xeef4c43d,0x5b8fc3f0,0x07a84aa9,0xe2e1b1a8,0x835d2bdb,0x5f455528,
  27155. 0x207132dd,0x0f4aee4d,0x3907f675,0xe9f8338c,0x0e0531f0,0x7a874dc9 } },
  27156. /* 57 */
  27157. { { 0x97c27050,0x84b22d45,0x59e70bf8,0xbd0b8df7,0x79738b9b,0xb4d67405,
  27158. 0xcd917c4f,0x47f4d5f5,0x13ce6e33,0x9099c4ce,0x521d0f8b,0x942bfd39 },
  27159. { 0xa43b566d,0x5028f0f6,0x21bff7de,0xaf6e8669,0xc44232cd,0x83f6f856,
  27160. 0xf915069a,0x65680579,0xecfecb85,0xd12095a2,0xdb01ba16,0xcf7f06ae } },
  27161. /* 58 */
  27162. { { 0x8ef96c80,0x0f56e3c4,0x3ddb609c,0xd521f2b3,0x7dc1450d,0x2be94102,
  27163. 0x02a91fe2,0x2d21a071,0x1efa37de,0x2e6f74fa,0x156c28a1,0x9a9a90b8 },
  27164. { 0x9dc7dfcb,0xc54ea9ea,0x2c2c1d62,0xc74e66fc,0x49d3e067,0x9f23f967,
  27165. 0x54dd38ad,0x1c7c3a46,0x5946cee3,0xc7005884,0x45cc045d,0x89856368 } },
  27166. /* 59 */
  27167. { { 0xfce73946,0x29da7cd4,0x23168563,0x8f697db5,0xcba92ec6,0x8e235e9c,
  27168. 0x9f91d3ea,0x55d4655f,0xaa50a6cd,0xf3689f23,0x21e6a1a0,0xdcf21c26 },
  27169. { 0x61b818bf,0xcffbc82e,0xda47a243,0xc74a2f96,0x8bc1a0cf,0x234e980a,
  27170. 0x7929cb6d,0xf35fd6b5,0xefe17d6c,0x81468e12,0x58b2dafb,0xddea6ae5 } },
  27171. /* 60 */
  27172. { { 0x7e787b2e,0x294de887,0x39a9310d,0x258acc1f,0xac14265d,0x92d9714a,
  27173. 0x708b48a0,0x18b5591c,0xe1abbf71,0x27cc6bb0,0x568307b9,0xc0581fa3 },
  27174. { 0xf24d4d58,0x9e0f58a3,0xe0ce2327,0xfebe9bb8,0x9d1be702,0x91fd6a41,
  27175. 0xfacac993,0x9a7d8a45,0x9e50d66d,0xabc0a08c,0x06498201,0x02c342f7 } },
  27176. /* 61 */
  27177. { { 0x157bdbc2,0xccd71407,0xad0e1605,0x72fa89c6,0xb92a015f,0xb1d3da2b,
  27178. 0xa0a3fe56,0x8ad9e7cd,0x24f06737,0x160edcbd,0x61275be6,0x79d4db33 },
  27179. { 0x5f3497c4,0xd3d31fd9,0x04192fb0,0x8cafeaee,0x13a50af3,0xe13ca745,
  27180. 0x8c85aae5,0x18826167,0x9eb556ff,0xce06cea8,0xbdb549f3,0x2eef1995 } },
  27181. /* 62 */
  27182. { { 0x50596edc,0x8ed7d3eb,0x905243a2,0xaa359362,0xa4b6d02b,0xa212c2c2,
  27183. 0xc4fbec68,0x611fd727,0xb84f733d,0x8a0b8ff7,0x5f0daf0e,0xd85a6b90 },
  27184. { 0xd4091cf7,0x60e899f5,0x2eff2768,0x4fef2b67,0x10c33964,0xc1f195cb,
  27185. 0x93626a8f,0x8275d369,0x0d6c840a,0xc77904f4,0x7a868acd,0x88d8b7fd } },
  27186. /* 63 */
  27187. { { 0x7bd98425,0x85f23723,0xc70b154e,0xd4463992,0x96687a2e,0xcbb00ee2,
  27188. 0xc83214fd,0x905fdbf7,0x13593684,0x2019d293,0xef51218e,0x0428c393 },
  27189. { 0x981e909a,0x40c7623f,0x7be192da,0x92513385,0x4010907e,0x48fe480f,
  27190. 0x3120b459,0xdd7a187c,0xa1fd8f3c,0xc9d7702d,0xe358efc5,0x66e4753b } },
  27191. /* 64 */
  27192. { { 0x16973cf4,0x070d34e1,0x7e4f34f7,0x20aee08b,0x5eb8ad29,0x269af9b9,
  27193. 0xa6a45dda,0xdde0a036,0x63df41e0,0xa18b528e,0xa260df2a,0x03cc71b2 },
  27194. { 0xa06b1dd7,0x24a6770a,0x9d2675d3,0x5bfa9c11,0x96844432,0x73c1e2a1,
  27195. 0x131a6cf0,0x3660558d,0x2ee79454,0xb0289c83,0xc6d8ddcd,0xa6aefb01 } },
  27196. /* 65 */
  27197. { { 0x01ab5245,0xba1464b4,0xc48d93ff,0x9b8d0b6d,0x93ad272c,0x939867dc,
  27198. 0xae9fdc77,0xbebe085e,0x894ea8bd,0x73ae5103,0x39ac22e1,0x740fc89a },
  27199. { 0x28e23b23,0x5e28b0a3,0xe13104d0,0x2352722e,0xb0a2640d,0xf4667a18,
  27200. 0x49bb37c3,0xac74a72e,0xe81e183a,0x79f734f0,0x3fd9c0eb,0xbffe5b6c } },
  27201. /* 66 */
  27202. { { 0xc6a2123f,0xb1a358f5,0xfe28df6d,0x927b2d95,0xf199d2f9,0x89702753,
  27203. 0x1a3f82dc,0x0a73754c,0x777affe1,0x063d029d,0xdae6d34d,0x5439817e },
  27204. { 0x6b8b83c4,0xf7979eef,0x9d945682,0x615cb214,0xc5e57eae,0x8f0e4fac,
  27205. 0x113047dd,0x042b89b8,0x93f36508,0x888356dc,0x5fd1f32f,0xbf008d18 } },
  27206. /* 67 */
  27207. { { 0x4e8068db,0x8012aa24,0xa5729a47,0xc72cc641,0x43f0691d,0x3c33df2c,
  27208. 0x1d92145f,0xfa057347,0xb97f7946,0xaefc0f2f,0x2f8121bf,0x813d75cb },
  27209. { 0x4383bba6,0x05613c72,0xa4224b3f,0xa924ce70,0x5f2179a6,0xe59cecbe,
  27210. 0x79f62b61,0x78e2e8aa,0x53ad8079,0x3ac2cc3b,0xd8f4fa96,0x55518d71 } },
  27211. /* 68 */
  27212. { { 0x00623f3b,0x03cf2922,0x5f29ebff,0x095c7111,0x80aa6823,0x42d72247,
  27213. 0x7458c0b0,0x044c7ba1,0x0959ec20,0xca62f7ef,0xf8ca929f,0x40ae2ab7 },
  27214. { 0xa927b102,0xb8c5377a,0xdc031771,0x398a86a0,0xc216a406,0x04908f9d,
  27215. 0x918d3300,0xb423a73a,0xe0b94739,0x634b0ff1,0x2d69f697,0xe29de725 } },
  27216. /* 69 */
  27217. { { 0x8435af04,0x744d1400,0xfec192da,0x5f255b1d,0x336dc542,0x1f17dc12,
  27218. 0x636a68a8,0x5c90c2a7,0x7704ca1e,0x960c9eb7,0x6fb3d65a,0x9de8cf1e },
  27219. { 0x511d3d06,0xc60fee0d,0xf9eb52c7,0x466e2313,0x206b0914,0x743c0f5f,
  27220. 0x2191aa4d,0x42f55bac,0xffebdbc2,0xcefc7c8f,0xe6e8ed1c,0xd4fa6081 } },
  27221. /* 70 */
  27222. { { 0xb0ab9645,0xb5e405d3,0xd5f1f711,0xaeec7f98,0x585c2a6e,0x8ad42311,
  27223. 0x512c6944,0x045acb9e,0xa90db1c6,0xae106c4e,0x898e6563,0xb89f33d5 },
  27224. { 0x7fed2ce4,0x43b07cd9,0xdd815b20,0xf9934e17,0x0a81a349,0x6778d4d5,
  27225. 0x52918061,0x9e616ade,0xd7e67112,0xfa06db06,0x88488091,0x1da23cf1 } },
  27226. /* 71 */
  27227. { { 0x42f2c4b5,0x821c46b3,0x66059e47,0x931513ef,0x66f50cd1,0x7030ae43,
  27228. 0x43e7b127,0x43b536c9,0x5fca5360,0x006258cf,0x6b557abf,0xe4e3ee79 },
  27229. { 0x24c8b22f,0xbb6b3900,0xfcbf1054,0x2eb5e2c1,0x567492af,0x937b18c9,
  27230. 0xacf53957,0xf09432e4,0x1dbf3a56,0x585f5a9d,0xbe0887cf,0xf86751fd } },
  27231. /* 72 */
  27232. { { 0x9d10e0b2,0x157399cb,0x60dc51b7,0x1c0d5956,0x1f583090,0x1d496b8a,
  27233. 0x88590484,0x6658bc26,0x03213f28,0x88c08ab7,0x7ae58de4,0x8d2e0f73 },
  27234. { 0x486cfee6,0x9b79bc95,0xe9e5bc57,0x036a26c7,0xcd8ae97a,0x1ad03601,
  27235. 0xff3a0494,0x06907f87,0x2c7eb584,0x078f4bbf,0x7e8d0a5a,0xe3731bf5 } },
  27236. /* 73 */
  27237. { { 0xe1cd0abe,0x72f2282b,0x87efefa2,0xd4f9015e,0x6c3834bd,0x9d189806,
  27238. 0xb8a29ced,0x9c8cdcc1,0xfee82ebc,0x0601b9f4,0x7206a756,0x371052bc },
  27239. { 0x46f32562,0x76fa1092,0x17351bb4,0xdaad534c,0xb3636bb5,0xc3d64c37,
  27240. 0x45d54e00,0x038a8c51,0x32c09e7c,0x301e6180,0x95735151,0x9764eae7 } },
  27241. /* 74 */
  27242. { { 0xcbd5256a,0x8791b19f,0x6ca13a3b,0x4007e0f2,0x4cf06904,0x03b79460,
  27243. 0xb6c17589,0xb18a9c22,0x81d45908,0xa1cb7d7d,0x21bb68f1,0x6e13fa9d },
  27244. { 0xa71e6e16,0x47183c62,0xe18749ed,0x5cf0ef8e,0x2e5ed409,0x2c9c7f9b,
  27245. 0xe6e117e1,0x042eeacc,0x13fb5a7f,0xb86d4816,0xc9e5feb1,0xea1cf0ed } },
  27246. /* 75 */
  27247. { { 0xcea4cc9b,0x6e6573c9,0xafcec8f3,0x5417961d,0xa438b6f6,0x804bf02a,
  27248. 0xdcd4ea88,0xb894b03c,0x3799571f,0xd0f807e9,0x862156e8,0x3466a7f5 },
  27249. { 0x56515664,0x51e59acd,0xa3c5eb0b,0x55b0f93c,0x6a4279db,0x84a06b02,
  27250. 0xc5fae08e,0x5c850579,0xa663a1a2,0xcf07b8db,0xf46ffc8d,0x49a36bbc } },
  27251. /* 76 */
  27252. { { 0x46d93106,0xe47f5acc,0xaa897c9c,0x65b7ade0,0x12d7e4be,0x37cf4c94,
  27253. 0xd4b2caa9,0xa2ae9b80,0xe60357a3,0x5e7ce09c,0xc8ecd5f9,0x29f77667 },
  27254. { 0xa8a0b1c5,0xdf6868f5,0x62978ad8,0x240858cf,0xdc0002a1,0x0f7ac101,
  27255. 0xffe9aa05,0x1d28a9d7,0x5b962c97,0x744984d6,0x3d28c8b2,0xa8a7c00b } },
  27256. /* 77 */
  27257. { { 0xae11a338,0x7c58a852,0xd1af96e7,0xa78613f1,0x5355cc73,0x7e9767d2,
  27258. 0x792a2de6,0x6ba37009,0x124386b2,0x7d60f618,0x11157674,0xab09b531 },
  27259. { 0x98eb9dd0,0x95a04841,0x15070328,0xe6c17acc,0x489c6e49,0xafc6da45,
  27260. 0xbb211530,0xab45a60a,0x7d7ea933,0xc58d6592,0x095642c6,0xa3ef3c65 } },
  27261. /* 78 */
  27262. { { 0xdf010879,0x89d420e9,0x39576179,0x9d25255d,0xe39513b6,0x9cdefd50,
  27263. 0xd5d1c313,0xe4efe45b,0x3f7af771,0xc0149de7,0x340ab06b,0x55a6b4f4 },
  27264. { 0xebeaf771,0xf1325251,0x878d4288,0x2ab44128,0x18e05afe,0xfcd5832e,
  27265. 0xcc1fb62b,0xef52a348,0xc1c4792a,0x2bd08274,0x877c6dc7,0x345c5846 } },
  27266. /* 79 */
  27267. { { 0xbea65e90,0xde15ceb0,0x2416d99c,0x0987f72b,0xfd863dec,0x44db578d,
  27268. 0xac6a3578,0xf617b74b,0xdb48e999,0x9e62bd7a,0xeab1a1be,0x877cae61 },
  27269. { 0x3a358610,0x23adddaa,0x325e2b07,0x2fc4d6d1,0x1585754e,0x897198f5,
  27270. 0xb392b584,0xf741852c,0xb55f7de1,0x9927804c,0x1aa8efae,0xe9e6c4ed } },
  27271. /* 80 */
  27272. { { 0x98683186,0x867db639,0xddcc4ea9,0xfb5cf424,0xd4f0e7bd,0xcc9a7ffe,
  27273. 0x7a779f7e,0x7c57f71c,0xd6b25ef2,0x90774079,0xb4081680,0x90eae903 },
  27274. { 0x0ee1fceb,0xdf2aae5e,0xe86c1a1f,0x3ff1da24,0xca193edf,0x80f587d6,
  27275. 0xdc9b9d6a,0xa5695523,0x85920303,0x7b840900,0xba6dbdef,0x1efa4dfc } },
  27276. /* 81 */
  27277. { { 0xe0540015,0xfbd838f9,0xc39077dc,0x2c323946,0xad619124,0x8b1fb9e6,
  27278. 0x0ca62ea8,0x9612440c,0x2dbe00ff,0x9ad9b52c,0xae197643,0xf52abaa1 },
  27279. { 0x2cac32ad,0xd0e89894,0x62a98f91,0xdfb79e42,0x276f55cb,0x65452ecf,
  27280. 0x7ad23e12,0xdb1ac0d2,0xde4986f0,0xf68c5f6a,0x82ce327d,0x389ac37b } },
  27281. /* 82 */
  27282. { { 0xf8e60f5b,0x511188b4,0x48aa2ada,0x7fe67015,0x381abca2,0xdb333cb8,
  27283. 0xdaf3fc97,0xb15e6d9d,0x36aabc03,0x4b24f6eb,0x72a748b4,0xc59789df },
  27284. { 0x29cf5279,0x26fcb8a5,0x01ad9a6c,0x7a3c6bfc,0x4b8bac9b,0x866cf88d,
  27285. 0x9c80d041,0xf4c89989,0x70add148,0xf0a04241,0x45d81a41,0x5a02f479 } },
  27286. /* 83 */
  27287. { { 0xc1c90202,0xfa5c877c,0xf8ac7570,0xd099d440,0xd17881f7,0x428a5b1b,
  27288. 0x5b2501d7,0x61e267db,0xf2e4465b,0xf889bf04,0x76aa4cb8,0x4da3ae08 },
  27289. { 0xe3e66861,0x3ef0fe26,0x3318b86d,0x5e772953,0x747396df,0xc3c35fbc,
  27290. 0x439ffd37,0x5115a29c,0xb2d70374,0xbfc4bd97,0x56246b9d,0x088630ea } },
  27291. /* 84 */
  27292. { { 0xb8a9e8c9,0xcd96866d,0x5bb8091e,0xa11963b8,0x045b3cd2,0xc7f90d53,
  27293. 0x80f36504,0x755a72b5,0x21d3751c,0x46f8b399,0x53c193de,0x4bffdc91 },
  27294. { 0xb89554e7,0xcd15c049,0xf7a26be6,0x353c6754,0xbd41d970,0x79602370,
  27295. 0x12b176c0,0xde16470b,0x40c8809d,0x56ba1175,0xe435fb1e,0xe2db35c3 } },
  27296. /* 85 */
  27297. { { 0x6328e33f,0xd71e4aab,0xaf8136d1,0x5486782b,0x86d57231,0x07a4995f,
  27298. 0x1651a968,0xf1f0a5bd,0x76803b6d,0xa5dc5b24,0x42dda935,0x5c587cbc },
  27299. { 0xbae8b4c0,0x2b6cdb32,0xb1331138,0x66d1598b,0x5d7e9614,0x4a23b2d2,
  27300. 0x74a8c05d,0x93e402a6,0xda7ce82e,0x45ac94e6,0xe463d465,0xeb9f8281 } },
  27301. /* 86 */
  27302. { { 0xfecf5b9b,0x34e0f9d1,0xf206966a,0xa115b12b,0x1eaa0534,0x5591cf3b,
  27303. 0xfb1558f9,0x5f0293cb,0x1bc703a5,0x1c8507a4,0x862c1f81,0x92e6b81c },
  27304. { 0xcdaf24e3,0xcc9ebc66,0x72fcfc70,0x68917ecd,0x8157ba48,0x6dc9a930,
  27305. 0xb06ab2b2,0x5d425c08,0x36e929c4,0x362f8ce7,0x62e89324,0x09f6f57c } },
  27306. /* 87 */
  27307. { { 0xd29375fb,0x1c7d6b78,0xe35d1157,0xfabd851e,0x4243ea47,0xf6f62dcd,
  27308. 0x8fe30b0f,0x1dd92460,0xffc6e709,0x08166dfa,0x0881e6a7,0xc6c4c693 },
  27309. { 0xd6a53fb0,0x20368f87,0x9eb4d1f9,0x38718e9f,0xafd7e790,0x03f08acd,
  27310. 0x72fe2a1c,0x0835eb44,0x88076e5d,0x7e050903,0xa638e731,0x538f765e } },
  27311. /* 88 */
  27312. { { 0xc2663b4b,0x0e0249d9,0x47cd38dd,0xe700ab5b,0x2c46559f,0xb192559d,
  27313. 0x4bcde66d,0x8f9f74a8,0x3e2aced5,0xad161523,0x3dd03a5b,0xc155c047 },
  27314. { 0x3be454eb,0x346a8799,0x83b7dccd,0x66ee94db,0xab9d2abe,0x1f6d8378,
  27315. 0x7733f355,0x4a396dd2,0xf53553c2,0x419bd40a,0x731dd943,0xd0ead98d } },
  27316. /* 89 */
  27317. { { 0xec142408,0x908e0b0e,0x4114b310,0x98943cb9,0x1742b1d7,0x03dbf7d8,
  27318. 0x693412f4,0xd270df6b,0x8f69e20c,0xc5065494,0x697e43a1,0xa76a90c3 },
  27319. { 0x4624825a,0xe0fa3384,0x8acc34c2,0x82e48c0b,0xe9a14f2b,0x7b24bd14,
  27320. 0x4db30803,0x4f5dd5e2,0x932da0a3,0x0c77a9e7,0x74c653dc,0x20db90f2 } },
  27321. /* 90 */
  27322. { { 0x0e6c5fd9,0x261179b7,0x6c982eea,0xf8bec123,0xd4957b7e,0x47683338,
  27323. 0x0a72f66a,0xcc47e664,0x1bad9350,0xbd54bf6a,0xf454e95a,0xdfbf4c6a },
  27324. { 0x6907f4fa,0x3f7a7afa,0x865ca735,0x7311fae0,0x2a496ada,0x24737ab8,
  27325. 0x15feb79b,0x13e425f1,0xa1b93c21,0xe9e97c50,0x4ddd3eb5,0xb26b6eac } },
  27326. /* 91 */
  27327. { { 0x2a2e5f2b,0x81cab9f5,0xbf385ac4,0xf93caf29,0xc909963a,0xf4bf35c3,
  27328. 0x74c9143c,0x081e7300,0xc281b4c5,0x3ea57fa8,0x9b340741,0xe497905c },
  27329. { 0x55ab3cfb,0xf556dd8a,0x518db6ad,0xd444b96b,0x5ef4b955,0x34f5425a,
  27330. 0xecd26aa3,0xdda7a3ac,0xda655e97,0xb57da11b,0xc2024c70,0x02da3eff } },
  27331. /* 92 */
  27332. { { 0x6481d0d9,0xe24b0036,0x818fdfe2,0x3740dbe5,0x190fda00,0xc1fc1f45,
  27333. 0x3cf27fde,0x329c9280,0x6934f43e,0x7435cb53,0x7884e8fe,0x2b505a5d },
  27334. { 0x711adcc9,0x6cfcc6a6,0x531e21e1,0xf034325c,0x9b2a8a99,0xa2f4a967,
  27335. 0x3c21bdff,0x9d5f3842,0x31b57d66,0xb25c7811,0x0b8093b9,0xdb5344d8 } },
  27336. /* 93 */
  27337. { { 0xae50a2f5,0x0d72e667,0xe4a861d1,0x9b7f8d8a,0x330df1cb,0xa129f70f,
  27338. 0xe04fefc3,0xe90aa5d7,0xe72c3ae1,0xff561ecb,0xcdb955fa,0x0d8fb428 },
  27339. { 0xd7663784,0xd2235f73,0x7e2c456a,0xc05baec6,0x2adbfccc,0xe5c292e4,
  27340. 0xefb110d5,0x4fd17988,0xd19d49f3,0x27e57734,0x84f679fe,0x188ac4ce } },
  27341. /* 94 */
  27342. { { 0xa796c53e,0x7ee344cf,0x0868009b,0xbbf6074d,0x474a1295,0x1f1594f7,
  27343. 0xac11632d,0x66776edc,0x04e2fa5a,0x1862278b,0xc854a89a,0x52665cf2 },
  27344. { 0x8104ab58,0x7e376464,0x7204fd6d,0x16775913,0x44ea1199,0x86ca06a5,
  27345. 0x1c9240dd,0xaa3f765b,0x24746149,0x5f8501a9,0xdcd251d7,0x7b982e30 } },
  27346. /* 95 */
  27347. { { 0xc15f3060,0xe44e9efc,0xa87ebbe6,0x5ad62f2e,0xc79500d4,0x36499d41,
  27348. 0x336fa9d1,0xa66d6dc0,0x5afd3b1f,0xf8afc495,0xe5c9822b,0x1d8ccb24 },
  27349. { 0x79d7584b,0x4031422b,0xea3f20dd,0xc54a0580,0x958468c5,0x3f837c8f,
  27350. 0xfbea7735,0x3d82f110,0x7dffe2fc,0x679a8778,0x20704803,0x48eba63b } },
  27351. /* 96 */
  27352. { { 0xdf46e2f6,0x89b10d41,0x19514367,0x13ab57f8,0x1d469c87,0x067372b9,
  27353. 0x4f6c5798,0x0c195afa,0x272c9acf,0xea43a12a,0x678abdac,0x9dadd8cb },
  27354. { 0xe182579a,0xcce56c6b,0x2d26c2d8,0x86febadb,0x2a44745c,0x1c668ee1,
  27355. 0x98dc047a,0x580acd86,0x51b9ec2d,0x5a2b79cc,0x4054f6a0,0x007da608 } },
  27356. /* 97 */
  27357. { { 0x17b00dd0,0x9e3ca352,0x0e81a7a6,0x046779cb,0xd482d871,0xb999fef3,
  27358. 0xd9233fbc,0xe6f38134,0xf48cd0e0,0x112c3001,0x3c6c66ae,0x934e7576 },
  27359. { 0xd73234dc,0xb44d4fc3,0x864eafc1,0xfcae2062,0x26bef21a,0x843afe25,
  27360. 0xf3b75fdf,0x61355107,0x794c2e6b,0x8367a5aa,0x8548a372,0x3d2629b1 } },
  27361. /* 98 */
  27362. { { 0x437cfaf8,0x6230618f,0x2032c299,0x5b8742cb,0x2293643a,0x949f7247,
  27363. 0x09464f79,0xb8040f1a,0x4f254143,0x049462d2,0x366c7e76,0xabd6b522 },
  27364. { 0xd5338f55,0x119b392b,0x01495a0c,0x1a80a9ce,0xf8d7537e,0xf3118ca7,
  27365. 0x6bf4b762,0xb715adc2,0xa8482b6c,0x24506165,0x96a7c84d,0xd958d7c6 } },
  27366. /* 99 */
  27367. { { 0xbdc21f31,0x9ad8aa87,0x8063e58c,0xadb3cab4,0xb07dd7b8,0xefd86283,
  27368. 0x1be7c6b4,0xc7b9b762,0x015582de,0x2ef58741,0x299addf3,0xc970c52e },
  27369. { 0x22f24d66,0x78f02e2a,0x74cc100a,0xefec1d10,0x09316e1a,0xaf2a6a39,
  27370. 0x5849dd49,0xce7c2205,0x96bffc4c,0x9c1fe75c,0x7ba06ec0,0xcad98fd2 } },
  27371. /* 100 */
  27372. { { 0xb648b73e,0xed76e2d0,0x1cfd285e,0xa9f92ce5,0x2ed13de1,0xa8c86c06,
  27373. 0xa5191a93,0x1d3a574e,0x1ad1b8bf,0x385cdf8b,0x47d2cfe3,0xbbecc28a },
  27374. { 0x69cec548,0x98d326c0,0xf240a0b2,0x4f5bc1dd,0x29057236,0x241a7062,
  27375. 0xc68294a4,0x0fc6e9c5,0xa319f17a,0x4d04838b,0x9ffc1c6f,0x8b612cf1 } },
  27376. /* 101 */
  27377. { { 0x4c3830eb,0x9bb0b501,0x8ee0d0c5,0x3d08f83c,0x79ba9389,0xa4a62642,
  27378. 0x9cbc2914,0x5d5d4044,0x074c46f0,0xae9eb83e,0x74ead7d6,0x63bb758f },
  27379. { 0xc6bb29e0,0x1c40d2ea,0x4b02f41e,0x95aa2d87,0x53cb199a,0x92989175,
  27380. 0x51584f6d,0xdd91bafe,0x31a1aaec,0x3715efb9,0x46780f9e,0xc1b6ae5b } },
  27381. /* 102 */
  27382. { { 0x42772f41,0xcded3e4b,0x3bcb79d1,0x3a700d5d,0x80feee60,0x4430d50e,
  27383. 0xf5e5d4bb,0x444ef1fc,0xe6e358ff,0xc660194f,0x6a91b43c,0xe68a2f32 },
  27384. { 0x977fe4d2,0x5842775c,0x7e2a41eb,0x78fdef5c,0xff8df00e,0x5f3bec02,
  27385. 0x5852525d,0xf4b840cd,0x4e6988bd,0x0870483a,0xcc64b837,0x39499e39 } },
  27386. /* 103 */
  27387. { { 0xb08df5fe,0xfc05de80,0x63ba0362,0x0c12957c,0xd5cf1428,0xea379414,
  27388. 0x54ef6216,0xc559132a,0xb9e65cf8,0x33d5f12f,0x1695d663,0x09c60278 },
  27389. { 0x61f7a2fb,0x3ac1ced4,0xd4f5eeb8,0xdd838444,0x8318fcad,0x82a38c6c,
  27390. 0xe9f1a864,0x315be2e5,0x442daf47,0x317b5771,0x95aa5f9e,0x81b5904a } },
  27391. /* 104 */
  27392. { { 0x8b21d232,0x6b6b1c50,0x8c2cba75,0x87f3dbc0,0xae9f0faf,0xa7e74b46,
  27393. 0xbb7b8079,0x036a0985,0x8d974a25,0x4f185b90,0xd9af5ec9,0x5aa7cef0 },
  27394. { 0x57dcfffc,0xe0566a70,0xb8453225,0x6ea311da,0x23368aa9,0x72ea1a8d,
  27395. 0x48cd552d,0xed9b2083,0xc80ea435,0xb987967c,0x6c104173,0xad735c75 } },
  27396. /* 105 */
  27397. { { 0xcee76ef4,0xaea85ab3,0xaf1d2b93,0x44997444,0xeacb923f,0x0851929b,
  27398. 0x51e3bc0c,0xb080b590,0x59be68a2,0xc4ee1d86,0x64b26cda,0xf00de219 },
  27399. { 0xf2e90d4d,0x8d7fb5c0,0x77d9ec64,0x00e219a7,0x5d1c491c,0xc4e6febd,
  27400. 0x1a8f4585,0x080e3754,0x48d2af9c,0x4a9b86c8,0xb6679851,0x2ed70db6 } },
  27401. /* 106 */
  27402. { { 0x586f25cb,0xaee44116,0xa0fcf70f,0xf7b6861f,0x18a350e8,0x55d2cd20,
  27403. 0x92dc286f,0x861bf3e5,0x6226aba7,0x9ab18ffa,0xa9857b03,0xd15827be },
  27404. { 0x92e6acef,0x26c1f547,0xac1fbac3,0x422c63c8,0xfcbfd71d,0xa2d8760d,
  27405. 0xb2511224,0x35f6a539,0x048d1a21,0xbaa88fa1,0xebf999db,0x49f1abe9 } },
  27406. /* 107 */
  27407. { { 0xf7492b73,0x16f9f4f4,0xcb392b1a,0xcf28ec1e,0x69ca6ffc,0x45b130d4,
  27408. 0xb72efa58,0x28ba8d40,0x5ca066f5,0xace987c7,0x4ad022eb,0x3e399246 },
  27409. { 0x752555bb,0x63a2d84e,0x9c2ae394,0xaaa93b4a,0xc89539ca,0xcd80424e,
  27410. 0xaa119a99,0x6d6b5a6d,0x379f2629,0xbd50334c,0xef3cc7d3,0x899e925e } },
  27411. /* 108 */
  27412. { { 0xbf825dc4,0xb7ff3651,0x40b9c462,0x0f741cc4,0x5cc4fb5b,0x771ff5a9,
  27413. 0x47fd56fe,0xcb9e9c9b,0x5626c0d3,0xbdf053db,0xf7e14098,0xa97ce675 },
  27414. { 0x6c934f5e,0x68afe5a3,0xccefc46f,0x6cd5e148,0xd7a88586,0xc7758570,
  27415. 0xdd558d40,0x49978f5e,0x64ae00c1,0xa1d5088a,0xf1d65bb2,0x58f2a720 } },
  27416. /* 109 */
  27417. { { 0x3e4daedb,0x66fdda4a,0x65d1b052,0x38318c12,0x4c4bbf5c,0x28d910a2,
  27418. 0x78a9cd14,0x762fe5c4,0xd2cc0aee,0x08e5ebaa,0xca0c654c,0xd2cdf257 },
  27419. { 0x08b717d2,0x48f7c58b,0x386cd07a,0x3807184a,0xae7d0112,0x3240f626,
  27420. 0xc43917b0,0x03e9361b,0x20aea018,0xf261a876,0x7e1e6372,0x53f556a4 } },
  27421. /* 110 */
  27422. { { 0x2f512a90,0xc84cee56,0x1b0ea9f1,0x24b3c004,0xe26cc1ea,0x0ee15d2d,
  27423. 0xf0c9ef7d,0xd848762c,0xd5341435,0x1026e9c5,0xfdb16b31,0x8f5b73dc },
  27424. { 0xd2c75d95,0x1f69bef2,0xbe064dda,0x8d33d581,0x57ed35e6,0x8c024c12,
  27425. 0xc309c281,0xf8d435f9,0xd6960193,0xfd295061,0xe9e49541,0x66618d78 } },
  27426. /* 111 */
  27427. { { 0x8ce382de,0x571cfd45,0xde900dde,0x175806ee,0x34aba3b5,0x61849965,
  27428. 0xde7aec95,0xe899778a,0xff4aa97f,0xe8f00f6e,0x010b0c6d,0xae971cb5 },
  27429. { 0x3af788f1,0x1827eebc,0xe413fe2d,0xd46229ff,0x4741c9b4,0x8a15455b,
  27430. 0xf8e424eb,0x5f02e690,0xdae87712,0x40a1202e,0x64944f6d,0x49b3bda2 } },
  27431. /* 112 */
  27432. { { 0x035b2d69,0xd63c6067,0x6bed91b0,0xb507150d,0x7afb39b2,0x1f35f82f,
  27433. 0x16012b66,0xb9bd9c01,0xed0a5f50,0x00d97960,0x2716f7c9,0xed705451 },
  27434. { 0x127abdb4,0x1576eff4,0xf01e701c,0x6850d698,0x3fc87e2f,0x9fa7d749,
  27435. 0xb0ce3e48,0x0b6bcc6f,0xf7d8c1c0,0xf4fbe1f5,0x02719cc6,0xcf75230e } },
  27436. /* 113 */
  27437. { { 0x722d94ed,0x6761d6c2,0x3718820e,0xd1ec3f21,0x25d0e7c6,0x65a40b70,
  27438. 0xbaf3cf31,0xd67f830e,0xb93ea430,0x633b3807,0x0bc96c69,0x17faa0ea },
  27439. { 0xdf866b98,0xe6bf3482,0xa9db52d4,0x205c1ee9,0xff9ab869,0x51ef9bbd,
  27440. 0x75eeb985,0x3863dad1,0xd3cf442a,0xef216c3b,0xf9c8e321,0x3fb228e3 } },
  27441. /* 114 */
  27442. { { 0x0760ac07,0x94f9b70c,0x9d79bf4d,0xf3c9ccae,0xc5ffc83d,0x73cea084,
  27443. 0xdc49c38e,0xef50f943,0xbc9e7330,0xf467a2ae,0x44ea7fba,0x5ee534b6 },
  27444. { 0x03609e7f,0x20cb6272,0x62fdc9f0,0x09844355,0x0f1457f7,0xaf5c8e58,
  27445. 0xb4b25941,0xd1f50a6c,0x2ec82395,0x77cb247c,0xda3dca33,0xa5f3e1e5 } },
  27446. /* 115 */
  27447. { { 0x7d85fa94,0x023489d6,0x2db9ce47,0x0ba40537,0xaed7aad1,0x0fdf7a1f,
  27448. 0x9a4ccb40,0xa57b0d73,0x5b18967c,0x48fcec99,0xb7274d24,0xf30b5b6e },
  27449. { 0xc81c5338,0x7ccb4773,0xa3ed6bd0,0xb85639e6,0x1d56eada,0x7d9df95f,
  27450. 0x0a1607ad,0xe256d57f,0x957574d6,0x6da7ffdc,0x01c7a8c4,0x65f84046 } },
  27451. /* 116 */
  27452. { { 0xcba1e7f1,0x8d45d0cb,0x02b55f64,0xef0a08c0,0x17e19892,0x771ca31b,
  27453. 0x4885907e,0xe1843ecb,0x364ce16a,0x67797ebc,0x8df4b338,0x816d2b2d },
  27454. { 0x39aa8671,0xe870b0e5,0xc102b5f5,0x9f0db3e4,0x1720c697,0x34296659,
  27455. 0x613c0d2a,0x0ad4c89e,0x418ddd61,0x1af900b2,0xd336e20e,0xe087ca72 } },
  27456. /* 117 */
  27457. { { 0xaba10079,0x222831ff,0x6d64fff2,0x0dc5f87b,0x3e8cb330,0x44547907,
  27458. 0x702a33fb,0xe815aaa2,0x5fba3215,0x338d6b2e,0x79f549c8,0x0f7535cb },
  27459. { 0x2ee95923,0x471ecd97,0xc6d1c09f,0x1e868b37,0xc666ef4e,0x2bc7b8ec,
  27460. 0x808a4bfc,0xf5416589,0x3fbc4d2e,0xf23e9ee2,0x2d75125b,0x4357236c } },
  27461. /* 118 */
  27462. { { 0xba9cdb1b,0xfe176d95,0x2f82791e,0x45a1ca01,0x4de4cca2,0x97654af2,
  27463. 0x5cc4bcb9,0xbdbf9d0e,0xad97ac0a,0xf6a7df50,0x61359fd6,0xc52112b0 },
  27464. { 0x4f05eae3,0x696d9ce3,0xe943ac2b,0x903adc02,0x0848be17,0xa9075347,
  27465. 0x2a3973e5,0x1e20f170,0x6feb67e9,0xe1aacc1c,0xe16bc6b9,0x2ca0ac32 } },
  27466. /* 119 */
  27467. { { 0xef871eb5,0xffea12e4,0xa8bf0a7a,0x94c2f25d,0x78134eaa,0x4d1e4c2a,
  27468. 0x0360fb10,0x11ed16fb,0x85fc11be,0x4029b6db,0xf4d390fa,0x5e9f7ab7 },
  27469. { 0x30646612,0x5076d72f,0xdda1d0d8,0xa0afed1d,0x85a1d103,0x29022257,
  27470. 0x4e276bcd,0xcb499e17,0x51246c3d,0x16d1da71,0x589a0443,0xc72d56d3 } },
  27471. /* 120 */
  27472. { { 0xdae5bb45,0xdf5ffc74,0x261bd6dc,0x99068c4a,0xaa98ec7b,0xdc0afa7a,
  27473. 0xf121e96d,0xedd2ee00,0x1414045c,0x163cc7be,0x335af50e,0xb0b1bbce },
  27474. { 0x01a06293,0xd440d785,0x6552e644,0xcdebab7c,0x8c757e46,0x48cb8dbc,
  27475. 0x3cabe3cb,0x81f9cf78,0xb123f59a,0xddd02611,0xeeb3784d,0x3dc7b88e } },
  27476. /* 121 */
  27477. { { 0xc4741456,0xe1b8d398,0x6032a121,0xa9dfa902,0x1263245b,0x1cbfc86d,
  27478. 0x5244718c,0xf411c762,0x05b0fc54,0x96521d54,0xdbaa4985,0x1afab46e },
  27479. { 0x8674b4ad,0xa75902ba,0x5ad87d12,0x486b43ad,0x36e0d099,0x72b1c736,
  27480. 0xbb6cd6d6,0x39890e07,0x59bace4e,0x8128999c,0x7b535e33,0xd8da430b } },
  27481. /* 122 */
  27482. { { 0xc6b75791,0x39f65642,0x21806bfb,0x050947a6,0x1362ef84,0x0ca3e370,
  27483. 0x8c3d2391,0x9bc60aed,0x732e1ddc,0x9b488671,0xa98ee077,0x12d10d9e },
  27484. { 0x3651b7dc,0xb6f2822d,0x80abd138,0x6345a5ba,0x472d3c84,0x62033262,
  27485. 0xacc57527,0xd54a1d40,0x424447cb,0x6ea46b3a,0x2fb1a496,0x5bc41057 } },
  27486. /* 123 */
  27487. { { 0xa751cd0e,0xe70c57a3,0xeba3c7d6,0x190d8419,0x9d47d55a,0xb1c3bee7,
  27488. 0xf912c6d8,0xda941266,0x407a6ad6,0x12e9aacc,0x6e838911,0xd6ce5f11 },
  27489. { 0x70e1f2ce,0x063ca97b,0x8213d434,0xa3e47c72,0x84df810a,0xa016e241,
  27490. 0xdfd881a4,0x688ad7b0,0xa89bf0ad,0xa37d99fc,0xa23c2d23,0xd8e3f339 } },
  27491. /* 124 */
  27492. { { 0x750bed6f,0xbdf53163,0x83e68b0a,0x808abc32,0x5bb08a33,0x85a36627,
  27493. 0x6b0e4abe,0xf72a3a0f,0xfaf0c6ad,0xf7716d19,0x5379b25f,0x22dcc020 },
  27494. { 0xf9a56e11,0x7400bf8d,0x56a47f21,0x6cb8bad7,0x7a6eb644,0x7c97176f,
  27495. 0xd1f5b646,0xe8fd84f7,0x44ddb054,0x98320a94,0x1dde86f5,0x07071ba3 } },
  27496. /* 125 */
  27497. { { 0x98f8fcb9,0x6fdfa0e5,0x94d0d70c,0x89cec8e0,0x106d20a8,0xa0899397,
  27498. 0xba8acc9c,0x915bfb9a,0x5507e01c,0x1370c94b,0x8a821ffb,0x83246a60 },
  27499. { 0xbe3c378f,0xa8273a9f,0x35a25be9,0x7e544789,0x4dd929d7,0x6cfa4972,
  27500. 0x365bd878,0x987fed9d,0x5c29a7ae,0x4982ac94,0x5ddd7ec5,0x4589a5d7 } },
  27501. /* 126 */
  27502. { { 0xa95540a9,0x9fabb174,0x0162c5b0,0x7cfb886f,0xea3dee18,0x17be766b,
  27503. 0xe88e624c,0xff7da41f,0x8b919c38,0xad0b71eb,0xf31ff9a9,0x86a522e0 },
  27504. { 0x868bc259,0xbc8e6f72,0x3ccef9e4,0x6130c638,0x9a466555,0x09f1f454,
  27505. 0x19b2bfb4,0x8e6c0f09,0x0ca7bb22,0x945c46c9,0x4dafb67b,0xacd87168 } },
  27506. /* 127 */
  27507. { { 0x10c53841,0x090c72ca,0x55a4fced,0xc20ae01b,0xe10234ad,0x03f7ebd5,
  27508. 0x85892064,0xb3f42a6a,0xb4a14722,0xbdbc30c0,0x8ca124cc,0x971bc437 },
  27509. { 0x517ff2ff,0x6f79f46d,0xecba947b,0x6a9c96e2,0x62925122,0x5e79f2f4,
  27510. 0x6a4e91f1,0x30a96bb1,0x2d4c72da,0x1147c923,0x5811e4df,0x65bc311f } },
  27511. /* 128 */
  27512. { { 0x139b3239,0x87c7dd7d,0x4d833bae,0x8b57824e,0x9fff0015,0xbcbc4878,
  27513. 0x909eaf1a,0x8ffcef8b,0xf1443a78,0x9905f4ee,0xe15cbfed,0x020dd4a2 },
  27514. { 0xa306d695,0xca2969ec,0xb93caf60,0xdf940cad,0x87ea6e39,0x67f7fab7,
  27515. 0xf98c4fe5,0x0d0ee10f,0xc19cb91e,0xc646879a,0x7d1d7ab4,0x4b4ea50c } },
  27516. /* 129 */
  27517. { { 0x7a0db57e,0x19e40945,0x9a8c9702,0xe6017cad,0x1be5cff9,0xdbf739e5,
  27518. 0xa7a938a2,0x3646b3cd,0x68350dfc,0x04511085,0x56e098b5,0xad3bd6f3 },
  27519. { 0xee2e3e3e,0x935ebabf,0x473926cb,0xfbd01702,0x9e9fb5aa,0x7c735b02,
  27520. 0x2e3feff0,0xc52a1b85,0x046b405a,0x9199abd3,0x39039971,0xe306fcec } },
  27521. /* 130 */
  27522. { { 0x23e4712c,0xd6d9aec8,0xc3c198ee,0x7ca8376c,0x31bebd8a,0xe6d83187,
  27523. 0xd88bfef3,0xed57aff3,0xcf44edc7,0x72a645ee,0x5cbb1517,0xd4e63d0b },
  27524. { 0xceee0ecf,0x98ce7a1c,0x5383ee8e,0x8f012633,0xa6b455e8,0x3b879078,
  27525. 0xc7658c06,0xcbcd3d96,0x0783336a,0x721d6fe7,0x5a677136,0xf21a7263 } },
  27526. /* 131 */
  27527. { { 0x9586ba11,0x19d8b3cd,0x8a5c0480,0xd9e0aeb2,0x2230ef5c,0xe4261dbf,
  27528. 0x02e6bf09,0x095a9dee,0x80dc7784,0x8963723c,0x145157b1,0x5c97dbaf },
  27529. { 0x4bc4503e,0x97e74434,0x85a6b370,0x0fb1cb31,0xcd205d4b,0x3e8df2be,
  27530. 0xf8f765da,0x497dd1bc,0x6c988a1a,0x92ef95c7,0x64dc4cfa,0x3f924baa } },
  27531. /* 132 */
  27532. { { 0x7268b448,0x6bf1b8dd,0xefd79b94,0xd4c28ba1,0xe4e3551f,0x2fa1f8c8,
  27533. 0x5c9187a9,0x769e3ad4,0x40326c0d,0x28843b4d,0x50d5d669,0xfefc8094 },
  27534. { 0x90339366,0x30c85bfd,0x5ccf6c3a,0x4eeb56f1,0x28ccd1dc,0x0e72b149,
  27535. 0xf2ce978e,0x73ee85b5,0x3165bb23,0xcdeb2bf3,0x4e410abf,0x8106c923 } },
  27536. /* 133 */
  27537. { { 0x7d02f4ee,0xc8df0161,0x18e21225,0x8a781547,0x6acf9e40,0x4ea895eb,
  27538. 0x6e5a633d,0x8b000cb5,0x7e981ffb,0xf31d86d5,0x4475bc32,0xf5c8029c },
  27539. { 0x1b568973,0x764561ce,0xa62996ec,0x2f809b81,0xda085408,0x9e513d64,
  27540. 0xe61ce309,0xc27d815d,0x272999e0,0x0da6ff99,0xfead73f7,0xbd284779 } },
  27541. /* 134 */
  27542. { { 0x9b1cdf2b,0x6033c2f9,0xbc5fa151,0x2a99cf06,0x12177b3b,0x7d27d259,
  27543. 0xc4485483,0xb1f15273,0x102e2297,0x5fd57d81,0xc7f6acb7,0x3d43e017 },
  27544. { 0x3a70eb28,0x41a8bb0b,0x3e80b06b,0x67de2d8e,0x70c28de5,0x09245a41,
  27545. 0xa7b26023,0xad7dbcb1,0x2cbc6c1e,0x70b08a35,0x9b33041f,0xb504fb66 } },
  27546. /* 135 */
  27547. { { 0xf97a27c2,0xa8e85ab5,0xc10a011b,0x6ac5ec8b,0xffbcf161,0x55745533,
  27548. 0x65790a60,0x01780e85,0x99ee75b0,0xe451bf85,0x39c29881,0x8907a63b },
  27549. { 0x260189ed,0x76d46738,0x47bd35cb,0x284a4436,0x20cab61e,0xd74e8c40,
  27550. 0x416cf20a,0x6264bf8c,0x5fd820ce,0xfa5a6c95,0xf24bb5fc,0xfa7154d0 } },
  27551. /* 136 */
  27552. { { 0x9b3f5034,0x18482cec,0xcd9e68fd,0x962d445a,0x95746f23,0x266fb1d6,
  27553. 0x58c94a4b,0xc66ade5a,0xed68a5b6,0xdbbda826,0x7ab0d6ae,0x05664a4d },
  27554. { 0x025e32fc,0xbcd4fe51,0xa96df252,0x61a5aebf,0x31592a31,0xd88a07e2,
  27555. 0x98905517,0x5d9d94de,0x5fd440e7,0x96bb4010,0xe807db4c,0x1b0c47a2 } },
  27556. /* 137 */
  27557. { { 0x08223878,0x5c2a6ac8,0xe65a5558,0xba08c269,0x9bbc27fd,0xd22b1b9b,
  27558. 0x72b9607d,0x919171bf,0xe588dc58,0x9ab455f9,0x23662d93,0x6d54916e },
  27559. { 0x3b1de0c1,0x8da8e938,0x804f278f,0xa84d186a,0xd3461695,0xbf4988cc,
  27560. 0xe10eb0cb,0xf5eae3be,0xbf2a66ed,0x1ff8b68f,0xc305b570,0xa68daf67 } },
  27561. /* 138 */
  27562. { { 0x44b2e045,0xc1004cff,0x4b1c05d4,0x91b5e136,0x88a48a07,0x53ae4090,
  27563. 0xea11bb1a,0x73fb2995,0x3d93a4ea,0x32048570,0x3bfc8a5f,0xcce45de8 },
  27564. { 0xc2b3106e,0xaff4a97e,0xb6848b4f,0x9069c630,0xed76241c,0xeda837a6,
  27565. 0x6cc3f6cf,0x8a0daf13,0x3da018a8,0x199d049d,0xd9093ba3,0xf867c6b1 } },
  27566. /* 139 */
  27567. { { 0x56527296,0xe4d42a56,0xce71178d,0xae26c73d,0x6c251664,0x70a0adac,
  27568. 0x5dc0ae1d,0x813483ae,0xdaab2daf,0x7574eacd,0xc2d55f4f,0xc56b52dc },
  27569. { 0x95f32923,0x872bc167,0x5bdd2a89,0x4be17581,0xa7699f00,0x9b57f1e7,
  27570. 0x3ac2de02,0x5fcd9c72,0x92377739,0x83af3ba1,0xfc50b97f,0xa64d4e2b } },
  27571. /* 140 */
  27572. { { 0x0e552b40,0x2172dae2,0xd34d52e8,0x62f49725,0x07958f98,0x7930ee40,
  27573. 0x751fdd74,0x56da2a90,0xf53e48c3,0xf1192834,0x8e53c343,0x34d2ac26 },
  27574. { 0x13111286,0x1073c218,0xda9d9827,0x201dac14,0xee95d378,0xec2c29db,
  27575. 0x1f3ee0b1,0x9316f119,0x544ce71c,0x7890c9f0,0x27612127,0xd77138af } },
  27576. /* 141 */
  27577. { { 0x3b4ad1cd,0x78045e6d,0x4aa49bc1,0xcd86b94e,0xfd677a16,0x57e51f1d,
  27578. 0xfa613697,0xd9290935,0x34f4d893,0x7a3f9593,0x5d5fcf9b,0x8c9c248b },
  27579. { 0x6f70d4e9,0x9f23a482,0x63190ae9,0x17273454,0x5b081a48,0x4bdd7c13,
  27580. 0x28d65271,0x1e2de389,0xe5841d1f,0x0bbaaa25,0x746772e5,0xc4c18a79 } },
  27581. /* 142 */
  27582. { { 0x593375ac,0x10ee2681,0x7dd5e113,0x4f3288be,0x240f3538,0x9a97b2fb,
  27583. 0x1de6b1e2,0xfa11089f,0x1351bc58,0x516da562,0x2dfa85b5,0x573b6119 },
  27584. { 0x6cba7df5,0x89e96683,0x8c28ab40,0xf299be15,0xad43fcbf,0xe91c9348,
  27585. 0x9a1cefb3,0xe9bbc7cc,0x738b2775,0xc8add876,0x775eaa01,0x6e3b1f2e } },
  27586. /* 143 */
  27587. { { 0xb677788b,0x0365a888,0x3fd6173c,0x634ae8c4,0x9e498dbe,0x30498761,
  27588. 0xc8f779ab,0x08c43e6d,0x4c09aca9,0x068ae384,0x2018d170,0x2380c70b },
  27589. { 0xa297c5ec,0xcf77fbc3,0xca457948,0xdacbc853,0x336bec7e,0x3690de04,
  27590. 0x14eec461,0x26bbac64,0x1f713abf,0xd1c23c7e,0xe6fd569e,0xf08bbfcd } },
  27591. /* 144 */
  27592. { { 0x84770ee3,0x5f8163f4,0x744a1706,0x0e0c7f94,0xe1b2d46d,0x9c8f05f7,
  27593. 0xd01fd99a,0x417eafe7,0x11440e5b,0x2ba15df5,0x91a6fbcf,0xdc5c552a },
  27594. { 0xa270f721,0x86271d74,0xa004485b,0x32c0a075,0x8defa075,0x9d1a87e3,
  27595. 0xbf0d20fe,0xb590a7ac,0x8feda1f5,0x430c41c2,0x58f6ec24,0x454d2879 } },
  27596. /* 145 */
  27597. { { 0x7c525435,0x52b7a635,0x37c4bdbc,0x3d9ef57f,0xdffcc475,0x2bb93e9e,
  27598. 0x7710f3be,0xf7b8ba98,0x21b727de,0x42ee86da,0x2e490d01,0x55ac3f19 },
  27599. { 0xc0c1c390,0x487e3a6e,0x446cde7b,0x036fb345,0x496ae951,0x089eb276,
  27600. 0x71ed1234,0xedfed4d9,0x900f0b46,0x661b0dd5,0x8582f0d3,0x11bd6f1b } },
  27601. /* 146 */
  27602. { { 0x076bc9d1,0x5cf9350f,0xcf3cd2c3,0x15d903be,0x25af031c,0x21cfc8c2,
  27603. 0x8b1cc657,0xe0ad3248,0x70014e87,0xdd9fb963,0x297f1658,0xf0f3a5a1 },
  27604. { 0xf1f703aa,0xbb908fba,0x2f6760ba,0x2f9cc420,0x66a38b51,0x00ceec66,
  27605. 0x05d645da,0x4deda330,0xf7de3394,0xb9cf5c72,0x1ad4c906,0xaeef6502 } },
  27606. /* 147 */
  27607. { { 0x7a19045d,0x0583c8b1,0xd052824c,0xae7c3102,0xff6cfa58,0x2a234979,
  27608. 0x62c733c0,0xfe9dffc9,0x9c0c4b09,0x3a7fa250,0x4fe21805,0x516437bb },
  27609. { 0xc2a23ddb,0x9454e3d5,0x289c104e,0x0726d887,0x4fd15243,0x8977d918,
  27610. 0x6d7790ba,0xc559e73f,0x465af85f,0x8fd3e87d,0x5feee46b,0xa2615c74 } },
  27611. /* 148 */
  27612. { { 0x4335167d,0xc8d607a8,0xe0f5c887,0x8b42d804,0x398d11f9,0x5f9f13df,
  27613. 0x20740c67,0x5aaa5087,0xa3d9234b,0x83da9a6a,0x2a54bad1,0xbd3a5c4e },
  27614. { 0x2db0f658,0xdd13914c,0x5a3f373a,0x29dcb66e,0x5245a72b,0xbfd62df5,
  27615. 0x91e40847,0x19d18023,0xb136b1ae,0xd9df74db,0x3f93bc5b,0x72a06b6b } },
  27616. /* 149 */
  27617. { { 0xad19d96f,0x6da19ec3,0xfb2a4099,0xb342daa4,0x662271ea,0x0e61633a,
  27618. 0xce8c054b,0x3bcece81,0x8bd62dc6,0x7cc8e061,0xee578d8b,0xae189e19 },
  27619. { 0xdced1eed,0x73e7a25d,0x7875d3ab,0xc1257f0a,0x1cfef026,0x2cb2d5a2,
  27620. 0xb1fdf61c,0xd98ef39b,0x24e83e6c,0xcd8e6f69,0xc7b7088b,0xd71e7076 } },
  27621. /* 150 */
  27622. { { 0x9d4245bf,0x33936830,0x2ac2953b,0x22d96217,0x56c3c3cd,0xb3bf5a82,
  27623. 0x0d0699e8,0x50c9be91,0x8f366459,0xec094463,0x513b7c35,0x6c056dba },
  27624. { 0x045ab0e3,0x687a6a83,0x445c9295,0x8d40b57f,0xa16f5954,0x0f345048,
  27625. 0x3d8f0a87,0x64b5c639,0x9f71c5e2,0x106353a2,0x874f0dd4,0xdd58b475 } },
  27626. /* 151 */
  27627. { { 0x62230c72,0x67ec084f,0x481385e3,0xf14f6cca,0x4cda7774,0xf58bb407,
  27628. 0xaa2dbb6b,0xe15011b1,0x0c035ab1,0xd488369d,0x8245f2fd,0xef83c24a },
  27629. { 0x9fdc2538,0xfb57328f,0x191fe46a,0x79808293,0x32ede548,0xe28f5c44,
  27630. 0xea1a022c,0x1b3cda99,0x3df2ec7f,0x39e639b7,0x760e9a18,0x77b6272b } },
  27631. /* 152 */
  27632. { { 0xa65d56d5,0x2b1d51bd,0x7ea696e0,0x3a9b71f9,0x9904f4c4,0x95250ecc,
  27633. 0xe75774b7,0x8bc4d6eb,0xeaeeb9aa,0x0e343f8a,0x930e04cb,0xc473c1d1 },
  27634. { 0x064cd8ae,0x282321b1,0x5562221c,0xf4b4371e,0xd1bf1221,0xc1cc81ec,
  27635. 0xe2c8082f,0xa52a07a9,0xba64a958,0x350d8e59,0x6fb32c9a,0x29e4f3de } },
  27636. /* 153 */
  27637. { { 0xba89aaa5,0x0aa9d56c,0xc4c6059e,0xf0208ac0,0xbd6ddca4,0x7400d9c6,
  27638. 0xf2c2f74a,0xb384e475,0xb1562dd3,0x4c1061fc,0x2e153b8d,0x3924e248 },
  27639. { 0x849808ab,0xf38b8d98,0xa491aa36,0x29bf3260,0x88220ede,0x85159ada,
  27640. 0xbe5bc422,0x8b47915b,0xd7300967,0xa934d72e,0x2e515d0d,0xc4f30398 } },
  27641. /* 154 */
  27642. { { 0x1b1de38b,0xe3e9ee42,0x42636760,0xa124e25a,0x90165b1a,0x90bf73c0,
  27643. 0x146434c5,0x21802a34,0x2e1fa109,0x54aa83f2,0xed9c51e9,0x1d4bd03c },
  27644. { 0x798751e6,0xc2d96a38,0x8c3507f5,0xed27235f,0xc8c24f88,0xb5fb80e2,
  27645. 0xd37f4f78,0xf873eefa,0xf224ba96,0x7229fd74,0x9edd7149,0x9dcd9199 } },
  27646. /* 155 */
  27647. { { 0x4e94f22a,0xee9f81a6,0xf71ec341,0xe5609892,0xa998284e,0x6c818ddd,
  27648. 0x3b54b098,0x9fd47295,0x0e8a7cc9,0x47a6ac03,0xb207a382,0xde684e5e },
  27649. { 0x2b6b956b,0x4bdd1ecd,0xf01b3583,0x09084414,0x55233b14,0xe2f80b32,
  27650. 0xef5ebc5e,0x5a0fec54,0xbf8b29a2,0x74cf25e6,0x7f29e014,0x1c757fa0 } },
  27651. /* 156 */
  27652. { { 0xeb0fdfe4,0x1bcb5c4a,0xf0899367,0xd7c649b3,0x05bc083b,0xaef68e3f,
  27653. 0xa78aa607,0x57a06e46,0x21223a44,0xa2136ecc,0x52f5a50b,0x89bd6484 },
  27654. { 0x4455f15a,0x724411b9,0x08a9c0fd,0x23dfa970,0x6db63bef,0x7b0da4d1,
  27655. 0xfb162443,0x6f8a7ec1,0xe98284fb,0xc1ac9cee,0x33566022,0x085a582b } },
  27656. /* 157 */
  27657. { { 0xec1f138a,0x15cb61f9,0x668f0c28,0x11c9a230,0xdf93f38f,0xac829729,
  27658. 0x4048848d,0xcef25698,0x2bba8fbf,0x3f686da0,0x111c619a,0xed5fea78 },
  27659. { 0xd6d1c833,0x9b4f73bc,0x86e7bf80,0x50951606,0x042b1d51,0xa2a73508,
  27660. 0x5fb89ec2,0x9ef6ea49,0x5ef8b892,0xf1008ce9,0x9ae8568b,0x78a7e684 } },
  27661. /* 158 */
  27662. { { 0x10470cd8,0x3fe83a7c,0xf86df000,0x92734682,0xda9409b5,0xb5dac06b,
  27663. 0x94939c5f,0x1e7a9660,0x5cc116dc,0xdec6c150,0x66bac8cc,0x1a52b408 },
  27664. { 0x6e864045,0x5303a365,0x9139efc1,0x45eae72a,0x6f31d54f,0x83bec646,
  27665. 0x6e958a6d,0x2fb4a86f,0x4ff44030,0x6760718e,0xe91ae0df,0x008117e3 } },
  27666. /* 159 */
  27667. { { 0x384310a2,0x5d5833ba,0x1fd6c9fc,0xbdfb4edc,0x849c4fb8,0xb9a4f102,
  27668. 0x581c1e1f,0xe5fb239a,0xd0a9746d,0xba44b2e7,0x3bd942b9,0x78f7b768 },
  27669. { 0xc87607ae,0x076c8ca1,0xd5caaa7e,0x82b23c2e,0x2763e461,0x6a581f39,
  27670. 0x3886df11,0xca8a5e4a,0x264e7f22,0xc87e90cf,0x215cfcfc,0x04f74870 } },
  27671. /* 160 */
  27672. { { 0x141d161c,0x5285d116,0x93c4ed17,0x67cd2e0e,0x7c36187e,0x12c62a64,
  27673. 0xed2584ca,0xf5329539,0x42fbbd69,0xc4c777c4,0x1bdfc50a,0x107de776 },
  27674. { 0xe96beebd,0x9976dcc5,0xa865a151,0xbe2aff95,0x9d8872af,0x0e0a9da1,
  27675. 0xa63c17cc,0x5e357a3d,0xe15cc67c,0xd31fdfd8,0x7970c6d8,0xc44bbefd } },
  27676. /* 161 */
  27677. { { 0x4c0c62f1,0x703f83e2,0x4e195572,0x9b1e28ee,0xfe26cced,0x6a82858b,
  27678. 0xc43638fa,0xd381c84b,0xa5ba43d8,0x94f72867,0x10b82743,0x3b4a783d },
  27679. { 0x7576451e,0xee1ad7b5,0x14b6b5c8,0xc3d0b597,0xfcacc1b8,0x3dc30954,
  27680. 0x472c9d7b,0x55df110e,0x02f8a328,0x97c86ed7,0x88dc098f,0xd0433413 } },
  27681. /* 162 */
  27682. { { 0x2ca8f2fe,0x1a60d152,0x491bd41f,0x61640948,0x58dfe035,0x6dae29a5,
  27683. 0x278e4863,0x9a615bea,0x9ad7c8e5,0xbbdb4477,0x2ceac2fc,0x1c706630 },
  27684. { 0x99699b4b,0x5e2b54c6,0x239e17e8,0xb509ca6d,0xea063a82,0x728165fe,
  27685. 0xb6a22e02,0x6b5e609d,0xb26ee1df,0x12813905,0x439491fa,0x07b9f722 } },
  27686. /* 163 */
  27687. { { 0x48ff4e49,0x1592ec14,0x6d644129,0x3e4e9f17,0x1156acc0,0x7acf8288,
  27688. 0xbb092b0b,0x5aa34ba8,0x7d38393d,0xcd0f9022,0xea4f8187,0x416724dd },
  27689. { 0xc0139e73,0x3c4e641c,0x91e4d87d,0xe0fe46cf,0xcab61f8a,0xedb3c792,
  27690. 0xd3868753,0x4cb46de4,0x20f1098a,0xe449c21d,0xf5b8ea6e,0x5e5fd059 } },
  27691. /* 164 */
  27692. { { 0x75856031,0x7fcadd46,0xeaf2fbd0,0x89c7a4cd,0x7a87c480,0x1af523ce,
  27693. 0x61d9ae90,0xe5fc1095,0xbcdb95f5,0x3fb5864f,0xbb5b2c7d,0xbeb5188e },
  27694. { 0x3ae65825,0x3d1563c3,0x0e57d641,0x116854c4,0x1942ebd3,0x11f73d34,
  27695. 0xc06955b3,0x24dc5904,0x995a0a62,0x8a0d4c83,0x5d577b7d,0xfb26b86d } },
  27696. /* 165 */
  27697. { { 0xc686ae17,0xc53108e7,0xd1c1da56,0x9090d739,0x9aec50ae,0x4583b013,
  27698. 0xa49a6ab2,0xdd9a088b,0xf382f850,0x28192eea,0xf5fe910e,0xcc8df756 },
  27699. { 0x9cab7630,0x877823a3,0xfb8e7fc1,0x64984a9a,0x364bfc16,0x5448ef9c,
  27700. 0xc44e2a9a,0xbbb4f871,0x435c95e9,0x901a41ab,0xaaa50a06,0xc6c23e5f } },
  27701. /* 166 */
  27702. { { 0x9034d8dd,0xb78016c1,0x0b13e79b,0x856bb44b,0xb3241a05,0x85c6409a,
  27703. 0x2d78ed21,0x8d2fe19a,0x726eddf2,0xdcc7c26d,0x25104f04,0x3ccaff5f },
  27704. { 0x6b21f843,0x397d7edc,0xe975de4c,0xda88e4dd,0x4f5ab69e,0x5273d396,
  27705. 0x9aae6cc0,0x537680e3,0x3e6f9461,0xf749cce5,0x957bffd3,0x021ddbd9 } },
  27706. /* 167 */
  27707. { { 0x777233cf,0x7b64585f,0x0942a6f0,0xfe6771f6,0xdfe6eef0,0x636aba7a,
  27708. 0x86038029,0x63bbeb56,0xde8fcf36,0xacee5842,0xd4a20524,0x48d9aa99 },
  27709. { 0x0da5e57a,0xcff7a74c,0xe549d6c9,0xc232593c,0xf0f2287b,0x68504bcc,
  27710. 0xbc8360b5,0x6d7d098d,0x5b402f41,0xeac5f149,0xb87d1bf1,0x61936f11 } },
  27711. /* 168 */
  27712. { { 0xb8153a9d,0xaa9da167,0x9e83ecf0,0xa49fe3ac,0x1b661384,0x14c18f8e,
  27713. 0x38434de1,0x61c24dab,0x283dae96,0x3d973c3a,0x82754fc9,0xc99baa01 },
  27714. { 0x4c26b1e3,0x477d198f,0xa7516202,0x12e8e186,0x362addfa,0x386e52f6,
  27715. 0xc3962853,0x31e8f695,0x6aaedb60,0xdec2af13,0x29cf74ac,0xfcfdb4c6 } },
  27716. /* 169 */
  27717. { { 0xcca40298,0x6b3ee958,0xf2f5d195,0xc3878153,0xed2eae5b,0x0c565630,
  27718. 0x3a697cf2,0xd089b37e,0xad5029ea,0xc2ed2ac7,0x0f0dda6a,0x7e5cdfad },
  27719. { 0xd9b86202,0xf98426df,0x4335e054,0xed1960b1,0x3f14639e,0x1fdb0246,
  27720. 0x0db6c670,0x17f709c3,0x773421e1,0xbfc687ae,0x26c1a8ac,0x13fefc4a } },
  27721. /* 170 */
  27722. { { 0x7ffa0a5f,0xe361a198,0xc63fe109,0xf4b26102,0x6c74e111,0x264acbc5,
  27723. 0x77abebaf,0x4af445fa,0x24cddb75,0x448c4fdd,0x44506eea,0x0b13157d },
  27724. { 0x72e9993d,0x22a6b159,0x85e5ecbe,0x2c3c57e4,0xfd83e1a1,0xa673560b,
  27725. 0xc3b8c83b,0x6be23f82,0x40bbe38e,0x40b13a96,0xad17399b,0x66eea033 } },
  27726. /* 171 */
  27727. { { 0xb4c6c693,0x49fc6e95,0x36af7d38,0xefc735de,0x35fe42fc,0xe053343d,
  27728. 0x6a9ab7c3,0xf0aa427c,0x4a0fcb24,0xc79f0436,0x93ebbc50,0x16287243 },
  27729. { 0x16927e1e,0x5c3d6bd0,0x673b984c,0x40158ed2,0x4cd48b9a,0xa7f86fc8,
  27730. 0x60ea282d,0x1643eda6,0xe2a1beed,0x45b393ea,0x19571a94,0x664c839e } },
  27731. /* 172 */
  27732. { { 0x27eeaf94,0x57745750,0xea99e1e7,0x2875c925,0x5086adea,0xc127e7ba,
  27733. 0x86fe424f,0x765252a0,0x2b6c0281,0x1143cc6c,0xd671312d,0xc9bb2989 },
  27734. { 0x51acb0a5,0x880c337c,0xd3c60f78,0xa3710915,0x9262b6ed,0x496113c0,
  27735. 0x9ce48182,0x5d25d9f8,0xb3813586,0x53b6ad72,0x4c0e159c,0x0ea3bebc } },
  27736. /* 173 */
  27737. { { 0xc5e49bea,0xcaba450a,0x7c05da59,0x684e5415,0xde7ac36c,0xa2e9cab9,
  27738. 0x2e6f957b,0x4ca79b5f,0x09b817b1,0xef7b0247,0x7d89df0f,0xeb304990 },
  27739. { 0x46fe5096,0x508f7307,0x2e04eaaf,0x695810e8,0x3512f76c,0x88ef1bd9,
  27740. 0x3ebca06b,0x77661351,0xccf158b7,0xf7d4863a,0x94ee57da,0xb2a81e44 } },
  27741. /* 174 */
  27742. { { 0x6d53e6ba,0xff288e5b,0x14484ea2,0xa90de1a9,0xed33c8ec,0x2fadb60c,
  27743. 0x28b66a40,0x579d6ef3,0xec24372d,0x4f2dd6dd,0x1d66ec7d,0xe9e33fc9 },
  27744. { 0x039eab6e,0x110899d2,0x3e97bb5e,0xa31a667a,0xcfdce68e,0x6200166d,
  27745. 0x5137d54b,0xbe83ebae,0x4800acdf,0x085f7d87,0x0c6f8c86,0xcf4ab133 } },
  27746. /* 175 */
  27747. { { 0x931e08fb,0x03f65845,0x1506e2c0,0x6438551e,0x9c36961f,0x5791f0dc,
  27748. 0xe3dcc916,0x68107b29,0xf495d2ca,0x83242374,0x6ee5895b,0xd8cfb663 },
  27749. { 0xa0349b1b,0x525e0f16,0x4a0fab86,0x33cd2c6c,0x2af8dda9,0x46c12ee8,
  27750. 0x71e97ad3,0x7cc424ba,0x37621eb0,0x69766ddf,0xa5f0d390,0x95565f56 } },
  27751. /* 176 */
  27752. { { 0x1a0f5e94,0xe0e7bbf2,0x1d82d327,0xf771e115,0xceb111fa,0x10033e3d,
  27753. 0xd3426638,0xd269744d,0x00d01ef6,0xbdf2d9da,0xa049ceaf,0x1cb80c71 },
  27754. { 0x9e21c677,0x17f18328,0x19c8f98b,0x6452af05,0x80b67997,0x35b9c5f7,
  27755. 0x40f8f3d4,0x5c2e1cbe,0x66d667ca,0x43f91656,0xcf9d6e79,0x9faaa059 } },
  27756. /* 177 */
  27757. { { 0x0a078fe6,0x8ad24618,0x464fd1dd,0xf6cc73e6,0xc3e37448,0x4d2ce34d,
  27758. 0xe3271b5f,0x624950c5,0xefc5af72,0x62910f5e,0xaa132bc6,0x8b585bf8 },
  27759. { 0xa839327f,0x11723985,0x4aac252f,0x34e2d27d,0x6296cc4e,0x402f59ef,
  27760. 0x47053de9,0x00ae055c,0x28b4f09b,0xfc22a972,0xfa0c180e,0xa9e86264 } },
  27761. /* 178 */
  27762. { { 0xbc310ecc,0x0b7b6224,0x67fa14ed,0x8a1a74f1,0x7214395c,0x87dd0960,
  27763. 0xf5c91128,0xdf1b3d09,0x86b264a8,0x39ff23c6,0x3e58d4c5,0xdc2d49d0 },
  27764. { 0xa9d6f501,0x2152b7d3,0xc04094f7,0xf4c32e24,0xd938990f,0xc6366596,
  27765. 0x94fb207f,0x084d078f,0x328594cb,0xfd99f1d7,0xcb2d96b3,0x36defa64 } },
  27766. /* 179 */
  27767. { { 0x13ed7cbe,0x4619b781,0x9784bd0e,0x95e50015,0x2c7705fe,0x2a32251c,
  27768. 0x5f0dd083,0xa376af99,0x0361a45b,0x55425c6c,0x1f291e7b,0x812d2cef },
  27769. { 0x5fd94972,0xccf581a0,0xe56dc383,0x26e20e39,0x63dbfbf0,0x0093685d,
  27770. 0x36b8c575,0x1fc164cc,0x390ef5e7,0xb9c5ab81,0x26908c66,0x40086beb } },
  27771. /* 180 */
  27772. { { 0x37e3c115,0xe5e54f79,0xc1445a8a,0x69b8ee8c,0xb7659709,0x79aedff2,
  27773. 0x1b46fbe6,0xe288e163,0xd18d7bb7,0xdb4844f0,0x48aa6424,0xe0ea23d0 },
  27774. { 0xf3d80a73,0x714c0e4e,0x3bd64f98,0x87a0aa9e,0x2ec63080,0x8844b8a8,
  27775. 0x255d81a3,0xe0ac9c30,0x455397fc,0x86151237,0x2f820155,0x0b979464 } },
  27776. /* 181 */
  27777. { { 0x4ae03080,0x127a255a,0x580a89fb,0x232306b4,0x6416f539,0x04e8cd6a,
  27778. 0x13b02a0e,0xaeb70dee,0x4c09684a,0xa3038cf8,0x28e433ee,0xa710ec3c },
  27779. { 0x681b1f7d,0x77a72567,0x2fc28170,0x86fbce95,0xf5735ac8,0xd3408683,
  27780. 0x6bd68e93,0x3a324e2a,0xc027d155,0x7ec74353,0xd4427177,0xab60354c } },
  27781. /* 182 */
  27782. { { 0xef4c209d,0x32a5342a,0x08d62704,0x2ba75274,0xc825d5fe,0x4bb4af6f,
  27783. 0xd28e7ff1,0x1c3919ce,0xde0340f6,0x1dfc2fdc,0x29f33ba9,0xc6580baf },
  27784. { 0x41d442cb,0xae121e75,0x3a4724e4,0x4c7727fd,0x524f3474,0xe556d6a4,
  27785. 0x785642a2,0x87e13cc7,0xa17845fd,0x182efbb1,0x4e144857,0xdcec0cf1 } },
  27786. /* 183 */
  27787. { { 0xe9539819,0x1cb89541,0x9d94dbf1,0xc8cb3b4f,0x417da578,0x1d353f63,
  27788. 0x8053a09e,0xb7a697fb,0xc35d8b78,0x8d841731,0xb656a7a9,0x85748d6f },
  27789. { 0xc1859c5d,0x1fd03947,0x535d22a2,0x6ce965c1,0x0ca3aadc,0x1966a13e,
  27790. 0x4fb14eff,0x9802e41d,0x76dd3fcd,0xa9048cbb,0xe9455bba,0x89b182b5 } },
  27791. /* 184 */
  27792. { { 0x43360710,0xd777ad6a,0x55e9936b,0x841287ef,0x04a21b24,0xbaf5c670,
  27793. 0x35ad86f1,0xf2c0725f,0xc707e72e,0x338fa650,0xd8883e52,0x2bf8ed2e },
  27794. { 0xb56e0d6a,0xb0212cf4,0x6843290c,0x50537e12,0x98b3dc6f,0xd8b184a1,
  27795. 0x0210b722,0xd2be9a35,0x559781ee,0x407406db,0x0bc18534,0x5a78d591 } },
  27796. /* 185 */
  27797. { { 0xd748b02c,0x4d57aa2a,0xa12b3b95,0xbe5b3451,0x64711258,0xadca7a45,
  27798. 0x322153db,0x597e091a,0x32eb1eab,0xf3271006,0x2873f301,0xbd9adcba },
  27799. { 0x38543f7f,0xd1dc79d1,0x921b1fef,0x00022092,0x1e5df8ed,0x86db3ef5,
  27800. 0x9e6b944a,0x888cae04,0x791a32b4,0x71bd29ec,0xa6d1c13e,0xd3516206 } },
  27801. /* 186 */
  27802. { { 0x55924f43,0x2ef6b952,0x4f9de8d5,0xd2f401ae,0xadc68042,0xfc73e8d7,
  27803. 0x0d9d1bb4,0x627ea70c,0xbbf35679,0xc3bb3e3e,0xd882dee4,0x7e8a254a },
  27804. { 0xb5924407,0x08906f50,0xa1ad444a,0xf14a0e61,0x65f3738e,0xaa0efa21,
  27805. 0xae71f161,0xd60c7dd6,0xf175894d,0x9e8390fa,0x149f4c00,0xd115cd20 } },
  27806. /* 187 */
  27807. { { 0xa52abf77,0x2f2e2c1d,0x54232568,0xc2a0dca5,0x54966dcc,0xed423ea2,
  27808. 0xcd0dd039,0xe48c93c7,0x176405c7,0x1e54a225,0x70d58f2e,0x1efb5b16 },
  27809. { 0x94fb1471,0xa751f9d9,0x67d2941d,0xfdb31e1f,0x53733698,0xa6c74eb2,
  27810. 0x89a0f64a,0xd3155d11,0xa4b8d2b6,0x4414cfe4,0xf7a8e9e3,0x8d5a4be8 } },
  27811. /* 188 */
  27812. { { 0x52669e98,0x5c96b4d4,0x8fd42a03,0x4547f922,0xd285174e,0xcf5c1319,
  27813. 0x064bffa0,0x805cd1ae,0x246d27e7,0x50e8bc4f,0xd5781e11,0xf89ef98f },
  27814. { 0xdee0b63f,0xb4ff95f6,0x222663a4,0xad850047,0x4d23ce9c,0x02691860,
  27815. 0x50019f59,0x3e5309ce,0x69a508ae,0x27e6f722,0x267ba52c,0xe9376652 } },
  27816. /* 189 */
  27817. { { 0xc0368708,0xa04d289c,0x5e306e1d,0xc458872f,0x33112fea,0x76fa23de,
  27818. 0x6efde42e,0x718e3974,0x1d206091,0xf0c98cdc,0x14a71987,0x5fa3ca62 },
  27819. { 0xdcaa9f2a,0xeee8188b,0x589a860d,0x312cc732,0xc63aeb1f,0xf9808dd6,
  27820. 0x4ea62b53,0x70fd43db,0x890b6e97,0x2c2bfe34,0xfa426aa6,0x105f863c } },
  27821. /* 190 */
  27822. { { 0xb38059ad,0x0b29795d,0x90647ea0,0x5686b77e,0xdb473a3e,0xeff0470e,
  27823. 0xf9b6d1e2,0x278d2340,0xbd594ec7,0xebbff95b,0xd3a7f23d,0xf4b72334 },
  27824. { 0xa5a83f0b,0x2a285980,0x9716a8b3,0x0786c41a,0x22511812,0x138901bd,
  27825. 0xe2fede6e,0xd1b55221,0xdf4eb590,0x0806e264,0x762e462e,0x6c4c897e } },
  27826. /* 191 */
  27827. { { 0xb4b41d9d,0xd10b905f,0x4523a65b,0x826ca466,0xb699fa37,0x535bbd13,
  27828. 0x73bc8f90,0x5b9933d7,0xcd2118ad,0x9332d61f,0xd4a65fd0,0x158c693e },
  27829. { 0xe6806e63,0x4ddfb2a8,0xb5de651b,0xe31ed3ec,0x819bc69a,0xf9460e51,
  27830. 0x2c76b1f8,0x6229c0d6,0x901970a3,0xbb78f231,0x9cee72b8,0x31f3820f } },
  27831. /* 192 */
  27832. { { 0xc09e1c72,0xe931caf2,0x12990cf4,0x0715f298,0x943262d8,0x33aad81d,
  27833. 0x73048d3f,0x5d292b7a,0xdc7415f6,0xb152aaa4,0x0fd19587,0xc3d10fd9 },
  27834. { 0x75ddadd0,0xf76b35c5,0x1e7b694c,0x9f5f4a51,0xc0663025,0x2f1ab7eb,
  27835. 0x920260b0,0x01c9cc87,0x05d39da6,0xc4b1f61a,0xeb4a9c4e,0x6dcd76c4 } },
  27836. /* 193 */
  27837. { { 0xfdc83f01,0x0ba0916f,0x9553e4f9,0x354c8b44,0xffc5e622,0xa6cc511a,
  27838. 0xe95be787,0xb954726a,0x75b41a62,0xcb048115,0xebfde989,0xfa2ae6cd },
  27839. { 0x0f24659a,0x6376bbc7,0x4c289c43,0x13a999fd,0xec9abd8b,0xc7134184,
  27840. 0xa789ab04,0x28c02bf6,0xd3e526ec,0xff841ebc,0x640893a8,0x442b191e } },
  27841. /* 194 */
  27842. { { 0xfa2b6e20,0x4cac6c62,0xf6d69861,0x97f29e9b,0xbc96d12d,0x228ab1db,
  27843. 0x5e8e108d,0x6eb91327,0x40771245,0xd4b3d4d1,0xca8a803a,0x61b20623 },
  27844. { 0xa6a560b1,0x2c2f3b41,0x3859fcf4,0x879e1d40,0x024dbfc3,0x7cdb5145,
  27845. 0x3bfa5315,0x55d08f15,0xaa93823a,0x2f57d773,0xc6a2c9a2,0xa97f259c } },
  27846. /* 195 */
  27847. { { 0xe58edbbb,0xc306317b,0x79dfdf13,0x25ade51c,0x16d83dd6,0x6b5beaf1,
  27848. 0x1dd8f925,0xe8038a44,0xb2a87b6b,0x7f00143c,0xf5b438de,0xa885d00d },
  27849. { 0xcf9e48bd,0xe9f76790,0xa5162768,0xf0bdf9f0,0xad7b57cb,0x0436709f,
  27850. 0xf7c15db7,0x7e151c12,0x5d90ee3b,0x3514f022,0x2c361a8d,0x2e84e803 } },
  27851. /* 196 */
  27852. { { 0x563ec8d8,0x2277607d,0xe3934cb7,0xa661811f,0xf58fd5de,0x3ca72e7a,
  27853. 0x62294c6a,0x7989da04,0xf6bbefe9,0x88b3708b,0x53ed7c82,0x0d524cf7 },
  27854. { 0x2f30c073,0x69f699ca,0x9dc1dcf3,0xf0fa264b,0x05f0aaf6,0x44ca4568,
  27855. 0xd19b9baf,0x0f5b23c7,0xeabd1107,0x39193f41,0x2a7c9b83,0x9e3e10ad } },
  27856. /* 197 */
  27857. { { 0xd4ae972f,0xa90824f0,0xc6e846e7,0x43eef02b,0x29d2160a,0x7e460612,
  27858. 0xfe604e91,0x29a178ac,0x4eb184b2,0x23056f04,0xeb54cdf4,0x4fcad55f },
  27859. { 0xae728d15,0xa0ff96f3,0xc6a00331,0x8a2680c6,0x7ee52556,0x5f84cae0,
  27860. 0xc5a65dad,0x5e462c3a,0xe2d23f4f,0x5d2b81df,0xc5b1eb07,0x6e47301b } },
  27861. /* 198 */
  27862. { { 0xaf8219b9,0x77411d68,0x51b1907a,0xcb883ce6,0x101383b5,0x25c87e57,
  27863. 0x982f970d,0x9c7d9859,0x118305d2,0xaa6abca5,0x9013a5db,0x725fed2f },
  27864. { 0xababd109,0x487cdbaf,0x87586528,0xc0f8cf56,0x8ad58254,0xa02591e6,
  27865. 0xdebbd526,0xc071b1d1,0x961e7e31,0x927dfe8b,0x9263dfe1,0x55f895f9 } },
  27866. /* 199 */
  27867. { { 0xb175645b,0xf899b00d,0xb65b4b92,0x51f3a627,0xb67399ef,0xa2f3ac8d,
  27868. 0xe400bc20,0xe717867f,0x1967b952,0x42cc9020,0x3ecd1de1,0x3d596751 },
  27869. { 0xdb979775,0xd41ebcde,0x6a2e7e88,0x99ba61bc,0x321504f2,0x039149a5,
  27870. 0x27ba2fad,0xe7dc2314,0xb57d8368,0x9f556308,0x57da80a7,0x2b6d16c9 } },
  27871. /* 200 */
  27872. { { 0x279ad982,0x84af5e76,0x9c8b81a6,0x9bb4c92d,0x0e698e67,0xd79ad44e,
  27873. 0x265fc167,0xe8be9048,0x0c3a4ccc,0xf135f7e6,0xb8863a33,0xa0a10d38 },
  27874. { 0xd386efd9,0xe197247c,0xb52346c2,0x0eefd3f9,0x78607bc8,0xc22415f9,
  27875. 0x508674ce,0xa2a8f862,0xc8c9d607,0xa72ad09e,0x50fa764f,0xcd9f0ede } },
  27876. /* 201 */
  27877. { { 0xd1a46d4d,0x063391c7,0x9eb01693,0x2df51c11,0x849e83de,0xc5849800,
  27878. 0x8ad08382,0x48fd09aa,0xaa742736,0xa405d873,0xe1f9600c,0xee49e61e },
  27879. { 0x48c76f73,0xd76676be,0x01274b2a,0xd9c100f6,0x83f8718d,0x110bb67c,
  27880. 0x02fc0d73,0xec85a420,0x744656ad,0xc0449e1e,0x37d9939b,0x28ce7376 } },
  27881. /* 202 */
  27882. { { 0x44544ac7,0x97e9af72,0xba010426,0xf2c658d5,0xfb3adfbd,0x732dec39,
  27883. 0xa2df0b07,0xd12faf91,0x2171e208,0x8ac26725,0x5b24fa54,0xf820cdc8 },
  27884. { 0x94f4cf77,0x307a6eea,0x944a33c6,0x18c783d2,0x0b741ac5,0x4b939d4c,
  27885. 0x3ffbb6e4,0x1d7acd15,0x7a255e44,0x06a24858,0xce336d50,0x14fbc494 } },
  27886. /* 203 */
  27887. { { 0x51584e3c,0x9b920c0c,0xf7e54027,0xc7733c59,0x88422bbe,0xe24ce139,
  27888. 0x523bd6ab,0x11ada812,0xb88e6def,0xde068800,0xfe8c582d,0x7b872671 },
  27889. { 0x7de53510,0x4e746f28,0xf7971968,0x492f8b99,0x7d928ac2,0x1ec80bc7,
  27890. 0x432eb1b5,0xb3913e48,0x32028f6e,0xad084866,0x8fc2f38b,0x122bb835 } },
  27891. /* 204 */
  27892. { { 0x3b0b29c3,0x0a9f3b1e,0x4fa44151,0x837b6432,0x17b28ea7,0xb9905c92,
  27893. 0x98451750,0xf39bc937,0xce8b6da1,0xcd383c24,0x010620b2,0x299f57db },
  27894. { 0x58afdce3,0x7b6ac396,0x3d05ef47,0xa15206b3,0xb9bb02ff,0xa0ae37e2,
  27895. 0x9db3964c,0x107760ab,0x67954bea,0xe29de9a0,0x431c3f82,0x446a1ad8 } },
  27896. /* 205 */
  27897. { { 0x5c6b8195,0xc6fecea0,0xf49e71b9,0xd744a7c5,0x177a7ae7,0xa8e96acc,
  27898. 0x358773a7,0x1a05746c,0x37567369,0xa4162146,0x87d1c971,0xaa0217f7 },
  27899. { 0x77fd3226,0x61e9d158,0xe4f600be,0x0f6f2304,0x7a6dff07,0xa9c4cebc,
  27900. 0x09f12a24,0xd15afa01,0x8c863ee9,0x2bbadb22,0xe5eb8c78,0xa28290e4 } },
  27901. /* 206 */
  27902. { { 0x3e9de330,0x55b87fa0,0x195c145b,0x12b26066,0xa920bef0,0xe08536e0,
  27903. 0x4d195adc,0x7bff6f2c,0x945f4187,0x7f319e9d,0xf892ce47,0xf9848863 },
  27904. { 0x4fe37657,0xd0efc1d3,0x5cf0e45a,0x3c58de82,0x8b0ccbbe,0x626ad21a,
  27905. 0xaf952fc5,0xd2a31208,0xeb437357,0x81791995,0x98e95d4f,0x5f19d30f } },
  27906. /* 207 */
  27907. { { 0x0e6865bb,0x72e83d9a,0xf63456a6,0x22f5af3b,0x463c8d9e,0x409e9c73,
  27908. 0xdfe6970e,0x40e9e578,0x711b91ca,0x876b6efa,0x942625a3,0x895512cf },
  27909. { 0xcb4e462b,0x84c8eda8,0x4412e7c8,0x84c0154a,0xceb7b71f,0x04325db1,
  27910. 0x66f70877,0x1537dde3,0x1992b9ac,0xf3a09399,0xd498ae77,0xa7316606 } },
  27911. /* 208 */
  27912. { { 0xcad260f5,0x13990d2f,0xeec0e8c0,0x76c3be29,0x0f7bd7d5,0x7dc5bee0,
  27913. 0xefebda4b,0x9be167d2,0x9122b87e,0xcce3dde6,0x82b5415c,0x75a28b09 },
  27914. { 0xe84607a6,0xf6810bcd,0x6f4dbf0d,0xc6d58128,0x1b4dafeb,0xfead577d,
  27915. 0x066b28eb,0x9bc440b2,0x8b17e84b,0x53f1da97,0xcda9a575,0x0459504b } },
  27916. /* 209 */
  27917. { { 0x329e5836,0x13e39a02,0xf717269d,0x2c9e7d51,0xf26c963b,0xc5ac58d6,
  27918. 0x79967bf5,0x3b0c6c43,0x55908d9d,0x60bbea3f,0xf07c9ad1,0xd84811e7 },
  27919. { 0x5bd20e4a,0xfe7609a7,0x0a70baa8,0xe4325dd2,0xb3600386,0x3711f370,
  27920. 0xd0924302,0x97f9562f,0x4acc4436,0x040dc0c3,0xde79cdd4,0xfd6d725c } },
  27921. /* 210 */
  27922. { { 0xcf13eafb,0xb3efd0e3,0x5aa0ae5f,0x21009cbb,0x79022279,0xe480c553,
  27923. 0xb2fc9a6d,0x755cf334,0x07096ae7,0x8564a5bf,0xbd238139,0xddd649d0 },
  27924. { 0x8a045041,0xd0de10b1,0xc957d572,0x6e05b413,0x4e0fb25c,0x5c5ff806,
  27925. 0x641162fb,0xd933179b,0xe57439f9,0x42d48485,0x8a8d72aa,0x70c5bd0a } },
  27926. /* 211 */
  27927. { { 0x97bdf646,0xa7671738,0xab329f7c,0xaa1485b4,0xf8f25fdf,0xce3e11d6,
  27928. 0xc6221824,0x76a3fc7e,0xf3924740,0x045f281f,0x96d13a9a,0x24557d4e },
  27929. { 0xdd4c27cd,0x875c804b,0x0f5c7fea,0x11c5f0f4,0xdc55ff7e,0xac8c880b,
  27930. 0x1103f101,0x2acddec5,0xf99faa89,0x38341a21,0xce9d6b57,0xc7b67a2c } },
  27931. /* 212 */
  27932. { { 0x8e357586,0x9a0d724f,0xdf648da0,0x1d7f4ff5,0xfdee62a5,0x9c3e6c9b,
  27933. 0x0389b372,0x0499cef0,0x98eab879,0xe904050d,0x6c051617,0xe8eef1b6 },
  27934. { 0xc37e3ca9,0xebf5bfeb,0xa4e0b91d,0x7c5e946d,0x2c4bea28,0x79097314,
  27935. 0xee67b2b7,0x81f6c109,0xdafc5ede,0xaf237d9b,0x2abb04c7,0xd2e60201 } },
  27936. /* 213 */
  27937. { { 0x8a4f57bf,0x6156060c,0xff11182a,0xf9758696,0x6296ef00,0x8336773c,
  27938. 0xff666899,0x9c054bce,0x719cd11c,0xd6a11611,0xdbe1acfa,0x9824a641 },
  27939. { 0xba89fd01,0x0b7b7a5f,0x889f79d8,0xf8d3b809,0xf578285c,0xc5e1ea08,
  27940. 0xae6d8288,0x7ac74536,0x7521ef5f,0x5d37a200,0xb260a25d,0x5ecc4184 } },
  27941. /* 214 */
  27942. { { 0xa708c8d3,0xddcebb19,0xc63f81ec,0xe63ed04f,0x11873f95,0xd045f5a0,
  27943. 0x79f276d5,0x3b5ad544,0x425ae5b3,0x81272a3d,0x10ce1605,0x8bfeb501 },
  27944. { 0x888228bf,0x4233809c,0xb2aff7df,0x4bd82acf,0x0cbd4a7f,0x9c68f180,
  27945. 0x6b44323d,0xfcd77124,0x891db957,0x60c0fcf6,0x04da8f7f,0xcfbb4d89 } },
  27946. /* 215 */
  27947. { { 0x3b26139a,0x9a6a5df9,0xb2cc7eb8,0x3e076a83,0x5a964bcd,0x47a8e82d,
  27948. 0xb9278d6b,0x8a4e2a39,0xe4443549,0x93506c98,0xf1e0d566,0x06497a8f },
  27949. { 0x2b1efa05,0x3dee8d99,0x45393e33,0x2da63ca8,0xcf0579ad,0xa4af7277,
  27950. 0x3236d8ea,0xaf4b4639,0x32b617f5,0x6ccad95b,0xb88bb124,0xce76d8b8 } },
  27951. /* 216 */
  27952. { { 0x083843dc,0x63d2537a,0x1e4153b4,0x89eb3514,0xea9afc94,0x5175ebc4,
  27953. 0x8ed1aed7,0x7a652580,0xd85e8297,0x67295611,0xb584b73d,0x8dd2d68b },
  27954. { 0x0133c3a4,0x237139e6,0x4bd278ea,0x9de838ab,0xc062fcd9,0xe829b072,
  27955. 0x63ba8706,0x70730d4f,0xd3cd05ec,0x6080483f,0x0c85f84d,0x872ab5b8 } },
  27956. /* 217 */
  27957. { { 0x999d4d49,0xfc0776d3,0xec3f45e7,0xa3eb59de,0x0dae1fc1,0xbc990e44,
  27958. 0xa15371ff,0x33596b1e,0x9bc7ab25,0xd447dcb2,0x35979582,0xcd5b63e9 },
  27959. { 0x77d1ff11,0xae3366fa,0xedee6903,0x59f28f05,0xa4433bf2,0x6f43fed1,
  27960. 0xdf9ce00e,0x15409c9b,0xaca9c5dc,0x21b5cded,0x82d7bdb4,0xf9f33595 } },
  27961. /* 218 */
  27962. { { 0x9422c792,0x95944378,0xc958b8bf,0x239ea923,0xdf076541,0x4b61a247,
  27963. 0xbb9fc544,0x4d29ce85,0x0b424559,0x9a692a67,0x0e486900,0x6e0ca5a0 },
  27964. { 0x85b3bece,0x6b79a782,0xc61f9892,0x41f35e39,0xae747f82,0xff82099a,
  27965. 0xd0ca59d6,0x58c8ae3f,0x99406b5f,0x4ac930e2,0x9df24243,0x2ce04eb9 } },
  27966. /* 219 */
  27967. { { 0x1ac37b82,0x4366b994,0x25b04d83,0xff0c728d,0x19c47b7c,0x1f551361,
  27968. 0xbeff13e7,0xdbf2d5ed,0xe12a683d,0xf78efd51,0x989cf9c4,0x82cd85b9 },
  27969. { 0xe0cb5d37,0xe23c6db6,0x72ee1a15,0x818aeebd,0x28771b14,0x8212aafd,
  27970. 0x1def817d,0x7bc221d9,0x9445c51f,0xdac403a2,0x12c3746b,0x711b0517 } },
  27971. /* 220 */
  27972. { { 0x5ea99ecc,0x0ed9ed48,0xb8cab5e1,0xf799500d,0xb570cbdc,0xa8ec87dc,
  27973. 0xd35dfaec,0x52cfb2c2,0x6e4d80a4,0x8d31fae2,0xdcdeabe5,0xe6a37dc9 },
  27974. { 0x1deca452,0x5d365a34,0x0d68b44e,0x09a5f8a5,0xa60744b1,0x59238ea5,
  27975. 0xbb4249e9,0xf2fedc0d,0xa909b2e3,0xe395c74e,0x39388250,0xe156d1a5 } },
  27976. /* 221 */
  27977. { { 0x47181ae9,0xd796b3d0,0x44197808,0xbaf44ba8,0x34cf3fac,0xe6933094,
  27978. 0xc3bd5c46,0x41aa6ade,0xeed947c6,0x4fda75d8,0x9ea5a525,0xacd9d412 },
  27979. { 0xd430301b,0x65cc55a3,0x7b52ea49,0x3c9a5bcf,0x159507f0,0x22d319cf,
  27980. 0xde74a8dd,0x2ee0b9b5,0x877ac2b6,0x20c26a1e,0x92e7c314,0x387d73da } },
  27981. /* 222 */
  27982. { { 0x8cd3fdac,0x13c4833e,0x332e5b8e,0x76fcd473,0xe2fe1fd3,0xff671b4b,
  27983. 0x5d98d8ec,0x4d734e8b,0x514bbc11,0xb1ead3c6,0x7b390494,0xd14ca858 },
  27984. { 0x5d2d37e9,0x95a443af,0x00464622,0x73c6ea73,0x15755044,0xa44aeb4b,
  27985. 0xfab58fee,0xba3f8575,0xdc680a6f,0x9779dbc9,0x7b37ddfc,0xe1ee5f5a } },
  27986. /* 223 */
  27987. { { 0x12d29f46,0xcd0b4648,0x0ed53137,0x93295b0b,0x80bef6c9,0xbfe26094,
  27988. 0x54248b00,0xa6565788,0x80e7f9c4,0x69c43fca,0xbe141ea1,0x2190837b },
  27989. { 0xa1b26cfb,0x875e159a,0x7affe852,0x90ca9f87,0x92ca598e,0x15e6550d,
  27990. 0x1938ad11,0xe3e0945d,0x366ef937,0xef7636bb,0xb39869e5,0xb6034d0b } },
  27991. /* 224 */
  27992. { { 0x26d8356e,0x4d255e30,0xd314626f,0xf83666ed,0xd0c8ed64,0x421ddf61,
  27993. 0x26677b61,0x96e473c5,0x9e9b18b3,0xdad4af7e,0xa9393f75,0xfceffd4a },
  27994. { 0x11c731d5,0x843138a1,0xb2f141d9,0x05bcb3a1,0x617b7671,0x20e1fa95,
  27995. 0x88ccec7b,0xbefce812,0x90f1b568,0x582073dc,0x1f055cb7,0xf572261a } },
  27996. /* 225 */
  27997. { { 0x36973088,0xf3148277,0x86a9f980,0xc008e708,0xe046c261,0x1b795947,
  27998. 0xca76bca0,0xdf1e6a7d,0x71acddf0,0xabafd886,0x1364d8f4,0xff7054d9 },
  27999. { 0xe2260594,0x2cf63547,0xd73b277e,0x468a5372,0xef9bd35e,0xc7419e24,
  28000. 0x24043cc3,0x2b4a1c20,0x890b39cd,0xa28f047a,0x46f9a2e3,0xdca2cea1 } },
  28001. /* 226 */
  28002. { { 0x53277538,0xab788736,0xcf697738,0xa734e225,0x6b22e2c1,0x66ee1d1e,
  28003. 0xebe1d212,0x2c615389,0x02bb0766,0xf36cad40,0x3e64f207,0x120885c3 },
  28004. { 0x90fbfec2,0x59e77d56,0xd7a574ae,0xf9e781aa,0x5d045e53,0x801410b0,
  28005. 0xa91b5f0e,0xd3b5f0aa,0x7fbb3521,0xb3d1df00,0xc72bee9a,0x11c4b33e } },
  28006. /* 227 */
  28007. { { 0x83c3a7f3,0xd32b9832,0x88d8a354,0x8083abcf,0x50f4ec5a,0xdeb16404,
  28008. 0x641e2907,0x18d747f0,0xf1bbf03e,0x4e8978ae,0x88a0cd89,0x932447dc },
  28009. { 0xcf3d5897,0x561e0feb,0x13600e6d,0xfc3a682f,0xd16a6b73,0xc78b9d73,
  28010. 0xd29bf580,0xe713fede,0x08d69e5c,0x0a225223,0x1ff7fda4,0x3a924a57 } },
  28011. /* 228 */
  28012. { { 0xb4093bee,0xfb64554c,0xa58c6ec0,0xa6d65a25,0x43d0ed37,0x4126994d,
  28013. 0x55152d44,0xa5689a51,0x284caa8d,0xb8e5ea8c,0xd1f25538,0x33f05d4f },
  28014. { 0x1b615d6e,0xe0fdfe09,0x705507da,0x2ded7e8f,0x17bbcc80,0xdd5631e5,
  28015. 0x267fd11f,0x4f87453e,0xff89d62d,0xc6da723f,0xe3cda21d,0x55cbcae2 } },
  28016. /* 229 */
  28017. { { 0x6b4e84f3,0x336bc94e,0x4ef72c35,0x72863031,0xeeb57f99,0x6d85fdee,
  28018. 0xa42ece1b,0x7f4e3272,0x36f0320a,0x7f86cbb5,0x923331e6,0xf09b6a2b },
  28019. { 0x56778435,0x21d3ecf1,0x8323b2d2,0x2977ba99,0x1704bc0f,0x6a1b57fb,
  28020. 0x389f048a,0xd777cf8b,0xac6b42cd,0x9ce2174f,0x09e6c55a,0x404e2bff } },
  28021. /* 230 */
  28022. { { 0x204c5ddb,0x9b9b135e,0x3eff550e,0x9dbfe044,0xec3be0f6,0x35eab4bf,
  28023. 0x0a43e56f,0x8b4c3f0d,0x0e73f9b3,0x4c1c6673,0x2c78c905,0x92ed38bd },
  28024. { 0xa386e27c,0xc7003f6a,0xaced8507,0xb9c4f46f,0x59df5464,0xea024ec8,
  28025. 0x429572ea,0x4af96152,0xe1fc1194,0x279cd5e2,0x281e358c,0xaa376a03 } },
  28026. /* 231 */
  28027. { { 0x3cdbc95c,0x07859223,0xef2e337a,0xaae1aa6a,0x472a8544,0xc040108d,
  28028. 0x8d037b7d,0x80c853e6,0x8c7eee24,0xd221315c,0x8ee47752,0x195d3856 },
  28029. { 0xdacd7fbe,0xd4b1ba03,0xd3e0c52b,0x4b5ac61e,0x6aab7b52,0x68d3c052,
  28030. 0x660e3fea,0xf0d7248c,0x3145efb4,0xafdb3f89,0x8f40936d,0xa73fd9a3 } },
  28031. /* 232 */
  28032. { { 0xbb1b17ce,0x891b9ef3,0xc6127f31,0x14023667,0x305521fd,0x12b2e58d,
  28033. 0xe3508088,0x3a47e449,0xff751507,0xe49fc84b,0x5310d16e,0x4023f722 },
  28034. { 0xb73399fa,0xa608e5ed,0xd532aa3e,0xf12632d8,0x845e8415,0x13a2758e,
  28035. 0x1fc2d861,0xae4b6f85,0x339d02f2,0x3879f5b1,0x80d99ebd,0x446d22a6 } },
  28036. /* 233 */
  28037. { { 0x4be164f1,0x0f502302,0x88b81920,0x8d09d2d6,0x984aceff,0x514056f1,
  28038. 0x75e9e80d,0xa5c4ddf0,0xdf496a93,0x38cb47e6,0x38df6bf7,0x899e1d6b },
  28039. { 0xb59eb2a6,0x69e87e88,0x9b47f38b,0x280d9d63,0x3654e955,0x599411ea,
  28040. 0x969aa581,0xcf8dd4fd,0x530742a7,0xff5c2baf,0x1a373085,0xa4391536 } },
  28041. /* 234 */
  28042. { { 0xa8a4bdd2,0x6ace72a3,0xb68ef702,0xc656cdd1,0x90c4dad8,0xd4a33e7e,
  28043. 0x9d951c50,0x4aece08a,0x085d68e6,0xea8005ae,0x6f7502b8,0xfdd7a7d7 },
  28044. { 0x98d6fa45,0xce6fb0a6,0x1104eb8c,0x228f8672,0xda09d7dc,0xd23d8787,
  28045. 0x2ae93065,0x5521428b,0xea56c366,0x95faba3d,0x0a88aca5,0xedbe5039 } },
  28046. /* 235 */
  28047. { { 0xbfb26c82,0xd64da0ad,0x952c2f9c,0xe5d70b3c,0xf7e77f68,0xf5e8f365,
  28048. 0x08f2d695,0x7234e002,0xd12e7be6,0xfaf900ee,0x4acf734e,0x27dc6934 },
  28049. { 0xc260a46a,0x80e4ff5e,0x2dc31c28,0x7da5ebce,0xca69f552,0x485c5d73,
  28050. 0x69cc84c2,0xcdfb6b29,0xed6d4eca,0x031c5afe,0x22247637,0xc7bbf4c8 } },
  28051. /* 236 */
  28052. { { 0x49fe01b2,0x9d5b72c7,0x793a91b8,0x34785186,0xcf460438,0xa3ba3c54,
  28053. 0x3ab21b6f,0x73e8e43d,0xbe57b8ab,0x50cde8e0,0xdd204264,0x6488b3a7 },
  28054. { 0xdddc4582,0xa9e398b3,0x5bec46fe,0x1698c1a9,0x156d3843,0x7f1446ef,
  28055. 0x770329a2,0x3fd25dd8,0x2c710668,0x05b1221a,0xa72ee6cf,0x65b2dc2a } },
  28056. /* 237 */
  28057. { { 0xcd021d63,0x21a885f7,0xfea61f08,0x3f344b15,0xc5cf73e6,0xad5ba6dd,
  28058. 0x227a8b23,0x154d0d8f,0xdc559311,0x9b74373c,0x98620fa1,0x4feab715 },
  28059. { 0x7d9ec924,0x5098938e,0x6d47e550,0x84d54a5e,0x1b617506,0x1a2d1bdc,
  28060. 0x615868a4,0x99fe1782,0x3005a924,0x171da780,0x7d8f79b6,0xa70bf5ed } },
  28061. /* 238 */
  28062. { { 0xfe2216c5,0x0bc1250d,0x7601b351,0x2c37e250,0xd6f06b7e,0xb6300175,
  28063. 0x8bfeb9b7,0x4dde8ca1,0xb82f843d,0x4f210432,0xb1ac0afd,0x8d70e2f9 },
  28064. { 0xaae91abb,0x25c73b78,0x863028f2,0x0230dca3,0xe5cf30b7,0x8b923ecf,
  28065. 0x5506f265,0xed754ec2,0x729a5e39,0x8e41b88c,0xbabf889b,0xee67cec2 } },
  28066. /* 239 */
  28067. { { 0x1be46c65,0xe183acf5,0xe7565d7a,0x9789538f,0xd9627b4e,0x87873391,
  28068. 0x9f1d9187,0xbf4ac4c1,0x4691f5c8,0x5db99f63,0x74a1fb98,0xa68df803 },
  28069. { 0xbf92b5fa,0x3c448ed1,0x3e0bdc32,0xa098c841,0x79bf016c,0x8e74cd55,
  28070. 0x115e244d,0x5df0d09c,0x3410b66e,0x9418ad01,0x17a02130,0x8b6124cb } },
  28071. /* 240 */
  28072. { { 0xc26e3392,0x425ec3af,0xa1722e00,0xc07f8470,0xe2356b43,0xdcc28190,
  28073. 0xb1ef59a6,0x4ed97dff,0xc63028c1,0xc22b3ad1,0x68c18988,0x070723c2 },
  28074. { 0x4cf49e7d,0x70da302f,0x3f12a522,0xc5e87c93,0x18594148,0x74acdd1d,
  28075. 0xca74124c,0xad5f73ab,0xd69fd478,0xe72e4a3e,0x7b117cc3,0x61593868 } },
  28076. /* 241 */
  28077. { { 0xa9aa0486,0x7b7b9577,0xa063d557,0x6e41fb35,0xda9047d7,0xb017d5c7,
  28078. 0x68a87ba9,0x8c748280,0xdf08ad93,0xab45fa5c,0x4c288a28,0xcd9fb217 },
  28079. { 0x5747843d,0x59544642,0xa56111e3,0x34d64c6c,0x4bfce8d5,0x12e47ea1,
  28080. 0x6169267f,0x17740e05,0xeed03fb5,0x5c49438e,0x4fc3f513,0x9da30add } },
  28081. /* 242 */
  28082. { { 0xccfa5200,0xc4e85282,0x6a19b13d,0x2707608f,0xf5726e2f,0xdcb9a53d,
  28083. 0xe9427de5,0x612407c9,0xd54d582a,0x3e5a17e1,0x655ae118,0xb99877de },
  28084. { 0x015254de,0x6f0e972b,0xf0a6f7c5,0x92a56db1,0xa656f8b2,0xd297e4e1,
  28085. 0xad981983,0x99fe0052,0x07cfed84,0xd3652d2f,0x843c1738,0xc784352e } },
  28086. /* 243 */
  28087. { { 0x7e9b2d8a,0x6ee90af0,0x57cf1964,0xac8d7018,0x71f28efc,0xf6ed9031,
  28088. 0x6812b20e,0x7f70d5a9,0xf1c61eee,0x27b557f4,0xc6263758,0xf1c9bd57 },
  28089. { 0x2a1a6194,0x5cf7d014,0x1890ab84,0xdd614e0b,0x0e93c2a6,0x3ef9de10,
  28090. 0xe0cd91c5,0xf98cf575,0x14befc32,0x504ec0c6,0x6279d68c,0xd0513a66 } },
  28091. /* 244 */
  28092. { { 0xa859fb6a,0xa8eadbad,0xdb283666,0xcf8346e7,0x3e22e355,0x7b35e61a,
  28093. 0x99639c6b,0x293ece2c,0x56f241c8,0xfa0162e2,0xbf7a1dda,0xd2e6c7b9 },
  28094. { 0x40075e63,0xd0de6253,0xf9ec8286,0x2405aa61,0x8fe45494,0x2237830a,
  28095. 0x364e9c8c,0x4fd01ac7,0x904ba750,0x4d9c3d21,0xaf1b520b,0xd589be14 } },
  28096. /* 245 */
  28097. { { 0x4662e53b,0x13576a4f,0xf9077676,0x35ec2f51,0x97c0af97,0x66297d13,
  28098. 0x9e598b58,0xed3201fe,0x5e70f604,0x49bc752a,0xbb12d951,0xb54af535 },
  28099. { 0x212c1c76,0x36ea4c2b,0xeb250dfd,0x18f5bbc7,0x9a0a1a46,0xa0d466cc,
  28100. 0xdac2d917,0x52564da4,0x8e95fab5,0x206559f4,0x9ca67a33,0x7487c190 } },
  28101. /* 246 */
  28102. { { 0xdde98e9c,0x75abfe37,0x2a411199,0x99b90b26,0xdcdb1f7c,0x1b410996,
  28103. 0x8b3b5675,0xab346f11,0xf1f8ae1e,0x04852193,0x6b8b98c1,0x1ec4d227 },
  28104. { 0x45452baa,0xba3bc926,0xacc4a572,0x387d1858,0xe51f171e,0x9478eff6,
  28105. 0x931e1c00,0xf357077d,0xe54c8ca8,0xffee77cd,0x551dc9a4,0xfb4892ff } },
  28106. /* 247 */
  28107. { { 0x2db8dff8,0x5b1bdad0,0x5a2285a2,0xd462f4fd,0xda00b461,0x1d6aad8e,
  28108. 0x41306d1b,0x43fbefcf,0x6a13fe19,0x428e86f3,0x17f89404,0xc8b2f118 },
  28109. { 0xf0d51afb,0x762528aa,0x549b1d06,0xa3e2fea4,0xea3ddf66,0x86fad8f2,
  28110. 0x4fbdd206,0x0d9ccc4b,0xc189ff5a,0xcde97d4c,0x199f19a6,0xc36793d6 } },
  28111. /* 248 */
  28112. { { 0x51b85197,0xea38909b,0xb4c92895,0xffb17dd0,0x1ddb3f3f,0x0eb0878b,
  28113. 0xc57cf0f2,0xb05d28ff,0x1abd57e2,0xd8bde2e7,0xc40c1b20,0x7f2be28d },
  28114. { 0x299a2d48,0x6554dca2,0x8377982d,0x5130ba2e,0x1071971a,0x8863205f,
  28115. 0x7cf2825d,0x15ee6282,0x03748f2b,0xd4b6c57f,0x430385a0,0xa9e3f4da } },
  28116. /* 249 */
  28117. { { 0x83fbc9c6,0x33eb7cec,0x4541777e,0x24a311c7,0x4f0767fc,0xc81377f7,
  28118. 0x4ab702da,0x12adae36,0x2a779696,0xb7fcb6db,0x01cea6ad,0x4a6fb284 },
  28119. { 0xcdfc73de,0x5e8b1d2a,0x1b02fd32,0xd0efae8d,0xd81d8519,0x3f99c190,
  28120. 0xfc808971,0x3c18f7fa,0x51b7ae7b,0x41f713e7,0xf07fc3f8,0x0a4b3435 } },
  28121. /* 250 */
  28122. { { 0x019b7d2e,0x7dda3c4c,0xd4dc4b89,0x631c8d1a,0x1cdb313c,0x5489cd6e,
  28123. 0x4c07bb06,0xd44aed10,0x75f000d1,0x8f97e13a,0xdda5df4d,0x0e9ee64f },
  28124. { 0x3e346910,0xeaa99f3b,0xfa294ad7,0x622f6921,0x0d0b2fe9,0x22aaa20d,
  28125. 0x1e5881ba,0x4fed2f99,0xc1571802,0x9af3b2d6,0xdc7ee17c,0x919e67a8 } },
  28126. /* 251 */
  28127. { { 0x76250533,0xc724fe4c,0x7d817ef8,0x8a2080e5,0x172c9751,0xa2afb0f4,
  28128. 0x17c0702e,0x9b10cdeb,0xc9b7e3e9,0xbf3975e3,0x1cd0cdc5,0x206117df },
  28129. { 0xbe05ebd5,0xfb049e61,0x16c782c0,0xeb0bb55c,0xab7fed09,0x13a331b8,
  28130. 0x632863f0,0xf6c58b1d,0x4d3b6195,0x6264ef6e,0x9a53f116,0x92c51b63 } },
  28131. /* 252 */
  28132. { { 0x288b364d,0xa57c7bc8,0x7b41e5c4,0x4a562e08,0x698a9a11,0x699d21c6,
  28133. 0xf3f849b9,0xa4ed9581,0x9eb726ba,0xa223eef3,0xcc2884f9,0x13159c23 },
  28134. { 0x3a3f4963,0x73931e58,0x0ada6a81,0x96500389,0x5ab2950b,0x3ee8a1c6,
  28135. 0x775fab52,0xeedf4949,0x4f2671b6,0x63d652e1,0x3c4e2f55,0xfed4491c } },
  28136. /* 253 */
  28137. { { 0xf4eb453e,0x335eadc3,0xcadd1a5b,0x5ff74b63,0x5d84a91a,0x6933d0d7,
  28138. 0xb49ba337,0x9ca3eeb9,0xc04c15b8,0x1f6facce,0xdc09a7e4,0x4ef19326 },
  28139. { 0x3dca3233,0x53d2d324,0xa2259d4b,0x0ee40590,0x5546f002,0x18c22edb,
  28140. 0x09ea6b71,0x92429801,0xb0e91e61,0xaada0add,0x99963c50,0x5fe53ef4 } },
  28141. /* 254 */
  28142. { { 0x90c28c65,0x372dd06b,0x119ce47d,0x1765242c,0x6b22fc82,0xc041fb80,
  28143. 0xb0a7ccc1,0x667edf07,0x1261bece,0xc79599e7,0x19cff22a,0xbc69d9ba },
  28144. { 0x13c06819,0x009d77cd,0xe282b79d,0x635a66ae,0x225b1be8,0x4edac4a6,
  28145. 0x524008f9,0x57d4f4e4,0xb056af84,0xee299ac5,0x3a0bc386,0xcc38444c } },
  28146. /* 255 */
  28147. { { 0xcd4c2356,0x490643b1,0x750547be,0x740a4851,0xd4944c04,0x643eaf29,
  28148. 0x299a98a0,0xba572479,0xee05fdf9,0x48b29f16,0x089b2d7b,0x33fb4f61 },
  28149. { 0xa950f955,0x86704902,0xfedc3ddf,0x97e1034d,0x05fbb6a2,0x211320b6,
  28150. 0x432299bb,0x23d7b93f,0x8590e4a3,0x1fe1a057,0xf58c0ce6,0x8e1d0586 } },
  28151. };
  28152. /* Multiply the base point of P384 by the scalar and return the result.
  28153. * If map is true then convert result to affine coordinates.
  28154. *
  28155. * Stripe implementation.
  28156. * Pre-generated: 2^0, 2^48, ...
  28157. * Pre-generated: products of all combinations of above.
  28158. * 8 doubles and adds (with qz=1)
  28159. *
  28160. * r Resulting point.
  28161. * k Scalar to multiply by.
  28162. * map Indicates whether to convert result to affine.
  28163. * ct Constant time required.
  28164. * heap Heap to use for allocation.
  28165. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  28166. */
  28167. static int sp_384_ecc_mulmod_base_12(sp_point_384* r, const sp_digit* k,
  28168. int map, int ct, void* heap)
  28169. {
  28170. return sp_384_ecc_mulmod_stripe_12(r, &p384_base, p384_table,
  28171. k, map, ct, heap);
  28172. }
  28173. #endif
  28174. /* Multiply the base point of P384 by the scalar and return the result.
  28175. * If map is true then convert result to affine coordinates.
  28176. *
  28177. * km Scalar to multiply by.
  28178. * r Resulting point.
  28179. * map Indicates whether to convert result to affine.
  28180. * heap Heap to use for allocation.
  28181. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  28182. */
  28183. int sp_ecc_mulmod_base_384(const mp_int* km, ecc_point* r, int map, void* heap)
  28184. {
  28185. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28186. sp_point_384* point = NULL;
  28187. sp_digit* k = NULL;
  28188. #else
  28189. sp_point_384 point[1];
  28190. sp_digit k[12];
  28191. #endif
  28192. int err = MP_OKAY;
  28193. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28194. point = (sp_point_384*)XMALLOC(sizeof(sp_point_384), heap,
  28195. DYNAMIC_TYPE_ECC);
  28196. if (point == NULL)
  28197. err = MEMORY_E;
  28198. if (err == MP_OKAY) {
  28199. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 12, heap,
  28200. DYNAMIC_TYPE_ECC);
  28201. if (k == NULL)
  28202. err = MEMORY_E;
  28203. }
  28204. #endif
  28205. if (err == MP_OKAY) {
  28206. sp_384_from_mp(k, 12, km);
  28207. err = sp_384_ecc_mulmod_base_12(point, k, map, 1, heap);
  28208. }
  28209. if (err == MP_OKAY) {
  28210. err = sp_384_point_to_ecc_point_12(point, r);
  28211. }
  28212. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28213. if (k != NULL)
  28214. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  28215. if (point != NULL)
  28216. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  28217. #endif
  28218. return err;
  28219. }
  28220. /* Multiply the base point of P384 by the scalar, add point a and return
  28221. * the result. If map is true then convert result to affine coordinates.
  28222. *
  28223. * km Scalar to multiply by.
  28224. * am Point to add to scalar mulitply result.
  28225. * inMont Point to add is in montgomery form.
  28226. * r Resulting point.
  28227. * map Indicates whether to convert result to affine.
  28228. * heap Heap to use for allocation.
  28229. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  28230. */
  28231. int sp_ecc_mulmod_base_add_384(const mp_int* km, const ecc_point* am,
  28232. int inMont, ecc_point* r, int map, void* heap)
  28233. {
  28234. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28235. sp_point_384* point = NULL;
  28236. sp_digit* k = NULL;
  28237. #else
  28238. sp_point_384 point[2];
  28239. sp_digit k[12 + 12 * 2 * 6];
  28240. #endif
  28241. sp_point_384* addP = NULL;
  28242. sp_digit* tmp = NULL;
  28243. int err = MP_OKAY;
  28244. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28245. point = (sp_point_384*)XMALLOC(sizeof(sp_point_384) * 2, heap,
  28246. DYNAMIC_TYPE_ECC);
  28247. if (point == NULL)
  28248. err = MEMORY_E;
  28249. if (err == MP_OKAY) {
  28250. k = (sp_digit*)XMALLOC(
  28251. sizeof(sp_digit) * (12 + 12 * 2 * 6),
  28252. heap, DYNAMIC_TYPE_ECC);
  28253. if (k == NULL)
  28254. err = MEMORY_E;
  28255. }
  28256. #endif
  28257. if (err == MP_OKAY) {
  28258. addP = point + 1;
  28259. tmp = k + 12;
  28260. sp_384_from_mp(k, 12, km);
  28261. sp_384_point_from_ecc_point_12(addP, am);
  28262. }
  28263. if ((err == MP_OKAY) && (!inMont)) {
  28264. err = sp_384_mod_mul_norm_12(addP->x, addP->x, p384_mod);
  28265. }
  28266. if ((err == MP_OKAY) && (!inMont)) {
  28267. err = sp_384_mod_mul_norm_12(addP->y, addP->y, p384_mod);
  28268. }
  28269. if ((err == MP_OKAY) && (!inMont)) {
  28270. err = sp_384_mod_mul_norm_12(addP->z, addP->z, p384_mod);
  28271. }
  28272. if (err == MP_OKAY) {
  28273. err = sp_384_ecc_mulmod_base_12(point, k, 0, 0, heap);
  28274. }
  28275. if (err == MP_OKAY) {
  28276. sp_384_proj_point_add_12(point, point, addP, tmp);
  28277. if (map) {
  28278. sp_384_map_12(point, point, tmp);
  28279. }
  28280. err = sp_384_point_to_ecc_point_12(point, r);
  28281. }
  28282. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28283. if (k != NULL)
  28284. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  28285. if (point)
  28286. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  28287. #endif
  28288. return err;
  28289. }
  28290. #if defined(WOLFSSL_VALIDATE_ECC_KEYGEN) || defined(HAVE_ECC_SIGN) || \
  28291. defined(HAVE_ECC_VERIFY)
  28292. #endif /* WOLFSSL_VALIDATE_ECC_KEYGEN | HAVE_ECC_SIGN | HAVE_ECC_VERIFY */
  28293. /* Add 1 to a in place. (a = a + 1)
  28294. *
  28295. * a A single precision integer of 12 words (byte offsets 0..44), updated
         *   in place. The carry out of the last word is not returned.
  28296. */
  28297. SP_NOINLINE static void sp_384_add_one_12(sp_digit* a)
  28298. {
  28299. __asm__ __volatile__ (
  28300. "mov r2, #1\n\t" /* r2 = 1: the value added to word 0 */
  28301. "ldr r1, [%[a], #0]\n\t"
  28302. "adds r1, r1, r2\n\t" /* word 0 + 1, sets the carry flag */
  28303. "mov r2, #0\n\t" /* r2 = 0: later words only absorb the carry */
  28304. "str r1, [%[a], #0]\n\t"
  28305. "ldr r1, [%[a], #4]\n\t"
  28306. "adcs r1, r1, r2\n\t" /* word + 0 + carry, repeated for words 1..11 */
  28307. "str r1, [%[a], #4]\n\t"
  28308. "ldr r1, [%[a], #8]\n\t"
  28309. "adcs r1, r1, r2\n\t"
  28310. "str r1, [%[a], #8]\n\t"
  28311. "ldr r1, [%[a], #12]\n\t"
  28312. "adcs r1, r1, r2\n\t"
  28313. "str r1, [%[a], #12]\n\t"
  28314. "ldr r1, [%[a], #16]\n\t"
  28315. "adcs r1, r1, r2\n\t"
  28316. "str r1, [%[a], #16]\n\t"
  28317. "ldr r1, [%[a], #20]\n\t"
  28318. "adcs r1, r1, r2\n\t"
  28319. "str r1, [%[a], #20]\n\t"
  28320. "ldr r1, [%[a], #24]\n\t"
  28321. "adcs r1, r1, r2\n\t"
  28322. "str r1, [%[a], #24]\n\t"
  28323. "ldr r1, [%[a], #28]\n\t"
  28324. "adcs r1, r1, r2\n\t"
  28325. "str r1, [%[a], #28]\n\t"
  28326. "ldr r1, [%[a], #32]\n\t"
  28327. "adcs r1, r1, r2\n\t"
  28328. "str r1, [%[a], #32]\n\t"
  28329. "ldr r1, [%[a], #36]\n\t"
  28330. "adcs r1, r1, r2\n\t"
  28331. "str r1, [%[a], #36]\n\t"
  28332. "ldr r1, [%[a], #40]\n\t"
  28333. "adcs r1, r1, r2\n\t"
  28334. "str r1, [%[a], #40]\n\t"
  28335. "ldr r1, [%[a], #44]\n\t"
  28336. "adcs r1, r1, r2\n\t"
  28337. "str r1, [%[a], #44]\n\t"
  28338. :
  28339. : [a] "r" (a)
  28340. : "memory", "r1", "r2"
  28341. );
  28342. }
  28343. /* Read big endian unsigned byte array into r.
  28344. *
  28345. * r A single precision integer.
  28346. * size Maximum number of bytes to convert
  28347. * a Byte array.
  28348. * n Number of bytes in array to read.
  28349. */
  28350. static void sp_384_from_bin(sp_digit* r, int size, const byte* a, int n)
  28351. {
  28352. int i;
  28353. int j;
  28354. byte* d;
  28355. for (i = n - 1,j = 0; i >= 3; i -= 4) {
  28356. r[j] = ((sp_digit)a[i - 0] << 0) |
  28357. ((sp_digit)a[i - 1] << 8) |
  28358. ((sp_digit)a[i - 2] << 16) |
  28359. ((sp_digit)a[i - 3] << 24);
  28360. j++;
  28361. }
  28362. if (i >= 0) {
  28363. r[j] = 0;
  28364. d = (byte*)r;
  28365. switch (i) {
  28366. case 2: d[n - 1 - 2] = a[2]; //fallthrough
  28367. case 1: d[n - 1 - 1] = a[1]; //fallthrough
  28368. case 0: d[n - 1 - 0] = a[0]; //fallthrough
  28369. }
  28370. j++;
  28371. }
  28372. for (; j < size; j++) {
  28373. r[j] = 0;
  28374. }
  28375. }
  28376. /* Generates a scalar that is in the range 1..order-1.
  28377. *
  28378. * rng Random number generator.
  28379. * k Scalar value.
  28380. * returns RNG failures, MEMORY_E when memory allocation fails and
  28381. * MP_OKAY on success.
  28382. */
  28383. static int sp_384_ecc_gen_k_12(WC_RNG* rng, sp_digit* k)
  28384. {
  28385. int err;
  28386. byte buf[48];
  28387. do {
  28388. err = wc_RNG_GenerateBlock(rng, buf, sizeof(buf));
  28389. if (err == 0) {
  28390. sp_384_from_bin(k, 12, buf, (int)sizeof(buf));
  28391. if (sp_384_cmp_12(k, p384_order2) <= 0) {
  28392. sp_384_add_one_12(k);
  28393. break;
  28394. }
  28395. }
  28396. }
  28397. while (err == 0);
  28398. return err;
  28399. }
  28400. /* Makes a random EC key pair.
  28401. *
  28402. * rng Random number generator.
  28403. * priv Generated private value.
  28404. * pub Generated public point.
  28405. * heap Heap to use for allocation.
  28406. * returns ECC_INF_E when the point does not have the correct order, RNG
  28407. * failures, MEMORY_E when memory allocation fails and MP_OKAY on success.
  28408. */
  28409. int sp_ecc_make_key_384(WC_RNG* rng, mp_int* priv, ecc_point* pub, void* heap)
  28410. {
  28411. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28412. sp_point_384* point = NULL;
  28413. sp_digit* k = NULL;
  28414. #else
  28415. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  28416. sp_point_384 point[2];
  28417. #else
  28418. sp_point_384 point[1];
  28419. #endif
  28420. sp_digit k[12];
  28421. #endif
  28422. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  28423. sp_point_384* infinity = NULL;
  28424. #endif
  28425. int err = MP_OKAY;
  28426. (void)heap;
  28427. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28428. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  28429. point = (sp_point_384*)XMALLOC(sizeof(sp_point_384) * 2, heap, DYNAMIC_TYPE_ECC);
  28430. #else
  28431. point = (sp_point_384*)XMALLOC(sizeof(sp_point_384), heap, DYNAMIC_TYPE_ECC);
  28432. #endif
  28433. if (point == NULL)
  28434. err = MEMORY_E;
  28435. if (err == MP_OKAY) {
  28436. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 12, heap,
  28437. DYNAMIC_TYPE_ECC);
  28438. if (k == NULL)
  28439. err = MEMORY_E;
  28440. }
  28441. #endif
  28442. if (err == MP_OKAY) {
  28443. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  28444. infinity = point + 1;
  28445. #endif
  28446. err = sp_384_ecc_gen_k_12(rng, k);
  28447. }
  28448. if (err == MP_OKAY) {
  28449. err = sp_384_ecc_mulmod_base_12(point, k, 1, 1, NULL);
  28450. }
  28451. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  28452. if (err == MP_OKAY) {
  28453. err = sp_384_ecc_mulmod_12(infinity, point, p384_order, 1, 1, NULL);
  28454. }
  28455. if (err == MP_OKAY) {
  28456. if (sp_384_iszero_12(point->x) || sp_384_iszero_12(point->y)) {
  28457. err = ECC_INF_E;
  28458. }
  28459. }
  28460. #endif
  28461. if (err == MP_OKAY) {
  28462. err = sp_384_to_mp(k, priv);
  28463. }
  28464. if (err == MP_OKAY) {
  28465. err = sp_384_point_to_ecc_point_12(point, pub);
  28466. }
  28467. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28468. if (k != NULL)
  28469. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  28470. if (point != NULL) {
  28471. /* point is not sensitive, so no need to zeroize */
  28472. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  28473. }
  28474. #endif
  28475. return err;
  28476. }
  28477. #ifdef HAVE_ECC_DHE
  28478. /* Write r as big endian to byte array.
  28479. * Fixed length number of bytes written: 48
  28480. *
  28481. * r A single precision integer.
  28482. * a Byte array.
  28483. */
  28484. static void sp_384_to_bin_12(sp_digit* r, byte* a)
  28485. {
  28486. int i;
  28487. int j = 0;
  28488. for (i = 11; i >= 0; i--) {
  28489. a[j++] = r[i] >> 24;
  28490. a[j++] = r[i] >> 16;
  28491. a[j++] = r[i] >> 8;
  28492. a[j++] = r[i] >> 0;
  28493. }
  28494. }
  28495. /* Multiply the point by the scalar and serialize the X ordinate.
  28496. * The number is 0 padded to maximum size on output.
  28497. *
  28498. * priv Scalar to multiply the point by.
  28499. * pub Point to multiply.
  28500. * out Buffer to hold X ordinate.
  28501. * outLen On entry, size of the buffer in bytes.
  28502. * On exit, length of data in buffer in bytes.
  28503. * heap Heap to use for allocation.
  28504. * returns BUFFER_E if the buffer is to small for output size,
  28505. * MEMORY_E when memory allocation fails and MP_OKAY on success.
  28506. */
  28507. int sp_ecc_secret_gen_384(const mp_int* priv, const ecc_point* pub, byte* out,
  28508. word32* outLen, void* heap)
  28509. {
  28510. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28511. sp_point_384* point = NULL;
  28512. sp_digit* k = NULL;
  28513. #else
  28514. sp_point_384 point[1];
  28515. sp_digit k[12];
  28516. #endif
  28517. int err = MP_OKAY;
  28518. if (*outLen < 48U) {
  28519. err = BUFFER_E;
  28520. }
  28521. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28522. if (err == MP_OKAY) {
  28523. point = (sp_point_384*)XMALLOC(sizeof(sp_point_384), heap,
  28524. DYNAMIC_TYPE_ECC);
  28525. if (point == NULL)
  28526. err = MEMORY_E;
  28527. }
  28528. if (err == MP_OKAY) {
  28529. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 12, heap,
  28530. DYNAMIC_TYPE_ECC);
  28531. if (k == NULL)
  28532. err = MEMORY_E;
  28533. }
  28534. #endif
  28535. if (err == MP_OKAY) {
  28536. sp_384_from_mp(k, 12, priv);
  28537. sp_384_point_from_ecc_point_12(point, pub);
  28538. err = sp_384_ecc_mulmod_12(point, point, k, 1, 1, heap);
  28539. }
  28540. if (err == MP_OKAY) {
  28541. sp_384_to_bin_12(point->x, out);
  28542. *outLen = 48;
  28543. }
  28544. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  28545. if (k != NULL)
  28546. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  28547. if (point != NULL)
  28548. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  28549. #endif
  28550. return err;
  28551. }
  28552. #endif /* HAVE_ECC_DHE */
  28553. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  28554. #endif
  28555. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  28556. #endif
  28557. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  28558. #ifdef WOLFSSL_SP_SMALL
  28559. /* Sub b from a into a. (a -= b)
  28560. * Looping variant: two words are subtracted per iteration over 48 bytes.
  28561. * a A single precision integer; receives the difference.
  28562. * b A single precision integer.
         * returns 0 when no borrow occurred, otherwise a word with all bits set.
  28563. */
  28564. SP_NOINLINE static sp_digit sp_384_sub_in_place_12(sp_digit* a,
  28565. const sp_digit* b)
  28566. {
  28567. sp_digit c = 0;
  28568. __asm__ __volatile__ (
  28569. "mov r8, %[a]\n\t"
  28570. "add r8, r8, #48\n\t" /* r8 = end pointer: a + 48 bytes */
  28571. "\n1:\n\t"
  28572. "mov r5, #0\n\t"
  28573. "subs r5, r5, %[c]\n\t" /* 0 - c: restores the borrow state saved in c */
  28574. "ldr r3, [%[a]]\n\t"
  28575. "ldr r4, [%[a], #4]\n\t"
  28576. "ldr r5, [%[b]]\n\t"
  28577. "ldr r6, [%[b], #4]\n\t"
  28578. "sbcs r3, r3, r5\n\t"
  28579. "sbcs r4, r4, r6\n\t"
  28580. "str r3, [%[a]]\n\t"
  28581. "str r4, [%[a], #4]\n\t"
  28582. "sbc %[c], %[c], %[c]\n\t" /* c = 0 (no borrow) or all ones (borrow) */
  28583. "add %[a], %[a], #8\n\t"
  28584. "add %[b], %[b], #8\n\t"
  28585. "cmp %[a], r8\n\t"
  28586. #ifdef __GNUC__
  28587. "bne 1b\n\t"
  28588. #else
  28589. "bne.n 1b\n\t"
  28590. #endif /* __GNUC__ */
  28591. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  28592. :
  28593. : "memory", "r3", "r4", "r5", "r6", "r8"
  28594. );
  28595. return c;
  28596. }
  28597. #else
  28598. /* Sub b from a into a. (a -= b)
  28599. * Unrolled variant: six load/subtract/store groups of two words each.
  28600. *
  28601. * a A single precision integer; receives the difference.
  28602. * b A single precision integer.
         * returns 0 when no borrow occurred, otherwise a word with all bits set.
  28603. */
  28604. SP_NOINLINE static sp_digit sp_384_sub_in_place_12(sp_digit* a,
  28605. const sp_digit* b)
  28606. {
  28607. sp_digit c = 0;
  28608. __asm__ __volatile__ (
  28609. "ldm %[a], {r3, r4}\n\t" /* a is read without writeback ... */
  28610. "ldm %[b]!, {r5, r6}\n\t"
  28611. "subs r3, r3, r5\n\t" /* first word: plain subtract starts the borrow chain */
  28612. "sbcs r4, r4, r6\n\t"
  28613. "stm %[a]!, {r3, r4}\n\t" /* ... and advanced when the result is stored */
  28614. "ldm %[a], {r3, r4}\n\t"
  28615. "ldm %[b]!, {r5, r6}\n\t"
  28616. "sbcs r3, r3, r5\n\t"
  28617. "sbcs r4, r4, r6\n\t"
  28618. "stm %[a]!, {r3, r4}\n\t"
  28619. "ldm %[a], {r3, r4}\n\t"
  28620. "ldm %[b]!, {r5, r6}\n\t"
  28621. "sbcs r3, r3, r5\n\t"
  28622. "sbcs r4, r4, r6\n\t"
  28623. "stm %[a]!, {r3, r4}\n\t"
  28624. "ldm %[a], {r3, r4}\n\t"
  28625. "ldm %[b]!, {r5, r6}\n\t"
  28626. "sbcs r3, r3, r5\n\t"
  28627. "sbcs r4, r4, r6\n\t"
  28628. "stm %[a]!, {r3, r4}\n\t"
  28629. "ldm %[a], {r3, r4}\n\t"
  28630. "ldm %[b]!, {r5, r6}\n\t"
  28631. "sbcs r3, r3, r5\n\t"
  28632. "sbcs r4, r4, r6\n\t"
  28633. "stm %[a]!, {r3, r4}\n\t"
  28634. "ldm %[a], {r3, r4}\n\t"
  28635. "ldm %[b]!, {r5, r6}\n\t"
  28636. "sbcs r3, r3, r5\n\t"
  28637. "sbcs r4, r4, r6\n\t"
  28638. "stm %[a]!, {r3, r4}\n\t"
  28639. "sbc %[c], %[c], %[c]\n\t" /* c = 0 (no borrow) or all ones (borrow) */
  28640. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  28641. :
  28642. : "memory", "r3", "r4", "r5", "r6"
  28643. );
  28644. return c;
  28645. }
  28646. #endif /* WOLFSSL_SP_SMALL */
  28647. /* Mul a by digit b into r. (r = a * b)
  28648. *
  28649. * r A single precision integer; 13 words are written (12 product words
         *   plus the final carry word).
  28650. * a A single precision integer of 12 words.
  28651. * b A single precision digit.
  28652. */
  28653. SP_NOINLINE static void sp_384_mul_d_12(sp_digit* r, const sp_digit* a,
  28654. sp_digit b)
  28655. {
  28656. __asm__ __volatile__ (
  28657. "add r9, %[a], #48\n\t" /* r9 = end pointer: a + 48 bytes */
  28658. /* A[0] * B */
  28659. "ldr r6, [%[a]], #4\n\t"
  28660. "umull r5, r3, r6, %[b]\n\t" /* r5 = low word (stored), r3 = carry into next word */
  28661. "mov r4, #0\n\t"
  28662. "str r5, [%[r]], #4\n\t"
  28663. /* A[0] * B - Done */
  28664. "\n1:\n\t"
  28665. "mov r5, #0\n\t"
  28666. /* A[] * B */
  28667. "ldr r6, [%[a]], #4\n\t"
  28668. "umull r6, r8, r6, %[b]\n\t"
  28669. "adds r3, r3, r6\n\t" /* accumulate the product into the r3:r4:r5 window */
  28670. "adcs r4, r4, r8\n\t"
  28671. "adc r5, r5, #0\n\t"
  28672. /* A[] * B - Done */
  28673. "str r3, [%[r]], #4\n\t"
  28674. "mov r3, r4\n\t" /* slide the window down one word */
  28675. "mov r4, r5\n\t"
  28676. "cmp %[a], r9\n\t"
  28677. #ifdef __GNUC__
  28678. "blt 1b\n\t"
  28679. #else
  28680. "blt.n 1b\n\t"
  28681. #endif /* __GNUC__ */
  28682. "str r3, [%[r]]\n\t" /* final carry word (13th word of r) */
  28683. : [r] "+r" (r), [a] "+r" (a)
  28684. : [b] "r" (b)
  28685. : "memory", "r3", "r4", "r5", "r6", "r8", "r9"
  28686. );
  28687. }
  28688. /* Divide the double width number (d1|d0) by the divisor. (d1|d0 / div)
  28689. *
  28690. * d1 The high order half of the number to divide.
  28691. * d0 The low order half of the number to divide.
  28692. * div The divisor.
  28693. * returns the result of the division.
  28694. *
  28695. * Note that this is an approximate div. It may give an answer 1 larger.
  28696. */
  28697. SP_NOINLINE static sp_digit div_384_word_12(sp_digit d1, sp_digit d0,
  28698. sp_digit div)
  28699. {
  28700. sp_digit r = 0;
  28701. __asm__ __volatile__ (
  28702. "lsr r6, %[div], #16\n\t"
  28703. "add r6, r6, #1\n\t"
  28704. "udiv r4, %[d1], r6\n\t"
  28705. "lsl r8, r4, #16\n\t"
  28706. "umull r4, r5, %[div], r8\n\t"
  28707. "subs %[d0], %[d0], r4\n\t"
  28708. "sbc %[d1], %[d1], r5\n\t"
  28709. "udiv r5, %[d1], r6\n\t"
  28710. "lsl r4, r5, #16\n\t"
  28711. "add r8, r8, r4\n\t"
  28712. "umull r4, r5, %[div], r4\n\t"
  28713. "subs %[d0], %[d0], r4\n\t"
  28714. "sbc %[d1], %[d1], r5\n\t"
  28715. "lsl r4, %[d1], #16\n\t"
  28716. "orr r4, r4, %[d0], lsr #16\n\t"
  28717. "udiv r4, r4, r6\n\t"
  28718. "add r8, r8, r4\n\t"
  28719. "umull r4, r5, %[div], r4\n\t"
  28720. "subs %[d0], %[d0], r4\n\t"
  28721. "sbc %[d1], %[d1], r5\n\t"
  28722. "lsl r4, %[d1], #16\n\t"
  28723. "orr r4, r4, %[d0], lsr #16\n\t"
  28724. "udiv r4, r4, r6\n\t"
  28725. "add r8, r8, r4\n\t"
  28726. "umull r4, r5, %[div], r4\n\t"
  28727. "subs %[d0], %[d0], r4\n\t"
  28728. "sbc %[d1], %[d1], r5\n\t"
  28729. "udiv r4, %[d0], %[div]\n\t"
  28730. "add r8, r8, r4\n\t"
  28731. "mov %[r], r8\n\t"
  28732. : [r] "+r" (r)
  28733. : [d1] "r" (d1), [d0] "r" (d0), [div] "r" (div)
  28734. : "r4", "r5", "r6", "r8"
  28735. );
  28736. return r;
  28737. }
  28738. /* AND m into each word of a and store in r.
  28739. *
  28740. * r A single precision integer.
  28741. * a A single precision integer.
  28742. * m Mask to AND against each digit.
  28743. */
  28744. static void sp_384_mask_12(sp_digit* r, const sp_digit* a, sp_digit m)
  28745. {
  28746. #ifdef WOLFSSL_SP_SMALL
  28747. int i;
  28748. for (i=0; i<12; i++) {
  28749. r[i] = a[i] & m;
  28750. }
  28751. #else
  28752. r[0] = a[0] & m;
  28753. r[1] = a[1] & m;
  28754. r[2] = a[2] & m;
  28755. r[3] = a[3] & m;
  28756. r[4] = a[4] & m;
  28757. r[5] = a[5] & m;
  28758. r[6] = a[6] & m;
  28759. r[7] = a[7] & m;
  28760. r[8] = a[8] & m;
  28761. r[9] = a[9] & m;
  28762. r[10] = a[10] & m;
  28763. r[11] = a[11] & m;
  28764. #endif
  28765. }
  28766. /* Divide d in a and put remainder into r (m*d + r = a)
  28767. * m is not calculated as it is not needed at this time.
  28768. *
  28769. * a Number to be divided.
  28770. * d Number to divide with.
  28771. * m Multiplier result.
  28772. * r Remainder from the division.
  28773. * returns MP_OKAY indicating success.
  28774. */
  28775. static WC_INLINE int sp_384_div_12(const sp_digit* a, const sp_digit* d, sp_digit* m,
  28776. sp_digit* r)
  28777. {
  28778. sp_digit t1[24], t2[13];
  28779. sp_digit div, r1;
  28780. int i;
  28781. (void)m;
  28782. div = d[11];
  28783. XMEMCPY(t1, a, sizeof(*t1) * 2 * 12);
  28784. r1 = sp_384_cmp_12(&t1[12], d) >= 0;
  28785. sp_384_cond_sub_12(&t1[12], &t1[12], d, (sp_digit)0 - r1);
  28786. for (i = 11; i >= 0; i--) {
  28787. sp_digit mask = 0 - (t1[12 + i] == div);
  28788. sp_digit hi = t1[12 + i] + mask;
  28789. r1 = div_384_word_12(hi, t1[12 + i - 1], div);
  28790. r1 |= mask;
  28791. sp_384_mul_d_12(t2, d, r1);
  28792. t1[12 + i] += sp_384_sub_in_place_12(&t1[i], t2);
  28793. t1[12 + i] -= t2[12];
  28794. sp_384_mask_12(t2, d, t1[12 + i]);
  28795. t1[12 + i] += sp_384_add_12(&t1[i], &t1[i], t2);
  28796. sp_384_mask_12(t2, d, t1[12 + i]);
  28797. t1[12 + i] += sp_384_add_12(&t1[i], &t1[i], t2);
  28798. }
  28799. r1 = sp_384_cmp_12(t1, d) >= 0;
  28800. sp_384_cond_sub_12(r, t1, d, (sp_digit)0 - r1);
  28801. return MP_OKAY;
  28802. }
  28803. /* Reduce a modulo m into r. (r = a mod m)
  28804. *
  28805. * r A single precision number that is the reduced result.
  28806. * a A single precision number that is to be reduced.
  28807. * m A single precision number that is the modulus to reduce with.
  28808. * returns MP_OKAY indicating success.
  28809. */
  28810. static WC_INLINE int sp_384_mod_12(sp_digit* r, const sp_digit* a, const sp_digit* m)
  28811. {
  28812. return sp_384_div_12(a, m, NULL, r);
  28813. }
  28814. #endif
  28815. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  28816. /* Multiply two number mod the order of P384 curve. (r = a * b mod order)
  28817. *
  28818. * r Result of the multiplication.
  28819. * a First operand of the multiplication.
  28820. * b Second operand of the multiplication.
  28821. */
  28822. static void sp_384_mont_mul_order_12(sp_digit* r, const sp_digit* a, const sp_digit* b)
  28823. {
  28824. sp_384_mul_12(r, a, b);
  28825. sp_384_mont_reduce_order_12(r, p384_order, p384_mp_order);
  28826. }
  28827. #if defined(HAVE_ECC_SIGN) || (defined(HAVE_ECC_VERIFY) && defined(WOLFSSL_SP_SMALL))
  #ifdef WOLFSSL_SP_SMALL
  /* Order-2 for the P384 curve, least significant word first.
   * Used as the exponent when inverting modulo the order. */
  static const uint32_t p384_order_minus_2[12] = {
      0xccc52971U, 0xecec196aU, 0x48b0a77aU, 0x581a0db2U,
      0xf4372ddfU, 0xc7634d81U, 0xffffffffU, 0xffffffffU,
      0xffffffffU, 0xffffffffU, 0xffffffffU, 0xffffffffU
  };
  #else
  /* The low half (six words, least significant first) of the order-2 of the
   * P384 curve. */
  static const uint32_t p384_order_low[6] = {
      0xccc52971U, 0xecec196aU, 0x48b0a77aU,
      0x581a0db2U, 0xf4372ddfU, 0xc7634d81U
  };
  #endif /* WOLFSSL_SP_SMALL */
  28840. /* Square number mod the order of P384 curve. (r = a * a mod order)
  28841. *
  28842. * r Result of the squaring.
  28843. * a Number to square.
  28844. */
  28845. static void sp_384_mont_sqr_order_12(sp_digit* r, const sp_digit* a)
  28846. {
  28847. sp_384_sqr_12(r, a);
  28848. sp_384_mont_reduce_order_12(r, p384_order, p384_mp_order);
  28849. }
  28850. #ifndef WOLFSSL_SP_SMALL
  28851. /* Square number mod the order of P384 curve a number of times.
  28852. * (r = a ^ n mod order)
  28853. *
  28854. * r Result of the squaring.
  28855. * a Number to square.
  28856. */
  28857. static void sp_384_mont_sqr_n_order_12(sp_digit* r, const sp_digit* a, int n)
  28858. {
  28859. int i;
  28860. sp_384_mont_sqr_order_12(r, a);
  28861. for (i=1; i<n; i++) {
  28862. sp_384_mont_sqr_order_12(r, r);
  28863. }
  28864. }
  28865. #endif /* !WOLFSSL_SP_SMALL */
  28866. /* Invert the number, in Montgomery form, modulo the order of the P384 curve.
  28867. * (r = 1 / a mod order)
  28868. *
  28869. * r Inverse result.
  28870. * a Number to invert.
  28871. * td Temporary data.
  28872. */
  #ifdef WOLFSSL_SP_NONBLOCK
  /* Progress of a non-blocking inversion modulo the order. */
  typedef struct sp_384_mont_inv_order_12_ctx {
      int state;  /* Current step of the state machine (0..3). */
      int i;      /* Exponent bit to be processed next. */
  } sp_384_mont_inv_order_12_ctx;

  /* Non-blocking inversion, in Montgomery form, modulo the order of the P384
   * curve. (r = 1 / a mod order)
   *
   * Square-and-multiply over the bits of order-2, one squaring or one
   * conditional multiplication per call. Bits 382 down to 0 are processed,
   * the same range the blocking implementation iterates over; finishing as
   * soon as the bit index reaches 0 would leave out the lowest exponent bit.
   *
   * sp_ctx  Context holding the state between calls; zero it before the
   *         first call.
   * r       Inverse result.
   * a       Number to invert.
   * t       Temporary data.
   * returns FP_WOULDBLOCK while more calls are needed and MP_OKAY when the
   * result has been written to r.
   */
  static int sp_384_mont_inv_order_12_nb(sp_ecc_ctx_t* sp_ctx, sp_digit* r,
          const sp_digit* a, sp_digit* t)
  {
      int err = FP_WOULDBLOCK;
      sp_384_mont_inv_order_12_ctx* ctx = (sp_384_mont_inv_order_12_ctx*)sp_ctx;

      /* Compile-time check that the state fits in the generic context. */
      typedef char ctx_size_test[sizeof(sp_384_mont_inv_order_12_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
      (void)sizeof(ctx_size_test);

      switch (ctx->state) {
          case 0:
              /* Start from a: this accounts for the top exponent bit. */
              XMEMCPY(t, a, sizeof(sp_digit) * 12);
              ctx->i = 382;
              ctx->state = 1;
              break;
          case 1:
              sp_384_mont_sqr_order_12(t, t);
              ctx->state = 2;
              break;
          case 2:
              if ((p384_order_minus_2[ctx->i / 32] & ((sp_int_digit)1 << (ctx->i % 32))) != 0) {
                  sp_384_mont_mul_order_12(t, t, a);
              }
              ctx->i--;
              /* Done only once bit 0 has been handled as well. */
              ctx->state = (ctx->i < 0) ? 3 : 1;
              break;
          case 3:
              XMEMCPY(r, t, sizeof(sp_digit) * 12U);
              err = MP_OKAY;
              break;
      }

      return err;
  }
  #endif /* WOLFSSL_SP_NONBLOCK */
  28910. static void sp_384_mont_inv_order_12(sp_digit* r, const sp_digit* a,
  28911. sp_digit* td)
  28912. {
  28913. #ifdef WOLFSSL_SP_SMALL
  28914. sp_digit* t = td;
  28915. int i;
  28916. XMEMCPY(t, a, sizeof(sp_digit) * 12);
  28917. for (i=382; i>=0; i--) {
  28918. sp_384_mont_sqr_order_12(t, t);
  28919. if ((p384_order_minus_2[i / 32] & ((sp_int_digit)1 << (i % 32))) != 0) {
  28920. sp_384_mont_mul_order_12(t, t, a);
  28921. }
  28922. }
  28923. XMEMCPY(r, t, sizeof(sp_digit) * 12U);
  28924. #else
  28925. sp_digit* t = td;
  28926. sp_digit* t2 = td + 2 * 12;
  28927. sp_digit* t3 = td + 4 * 12;
  28928. int i;
  28929. /* t = a^2 */
  28930. sp_384_mont_sqr_order_12(t, a);
  28931. /* t = a^3 = t * a */
  28932. sp_384_mont_mul_order_12(t, t, a);
  28933. /* t2= a^c = t ^ 2 ^ 2 */
  28934. sp_384_mont_sqr_n_order_12(t2, t, 2);
  28935. /* t = a^f = t2 * t */
  28936. sp_384_mont_mul_order_12(t, t2, t);
  28937. /* t2= a^f0 = t ^ 2 ^ 4 */
  28938. sp_384_mont_sqr_n_order_12(t2, t, 4);
  28939. /* t = a^ff = t2 * t */
  28940. sp_384_mont_mul_order_12(t, t2, t);
  28941. /* t2= a^ff00 = t ^ 2 ^ 8 */
  28942. sp_384_mont_sqr_n_order_12(t2, t, 8);
  28943. /* t3= a^ffff = t2 * t */
  28944. sp_384_mont_mul_order_12(t3, t2, t);
  28945. /* t2= a^ffff0000 = t3 ^ 2 ^ 16 */
  28946. sp_384_mont_sqr_n_order_12(t2, t3, 16);
  28947. /* t = a^ffffffff = t2 * t3 */
  28948. sp_384_mont_mul_order_12(t, t2, t3);
  28949. /* t2= a^ffffffff0000 = t ^ 2 ^ 16 */
  28950. sp_384_mont_sqr_n_order_12(t2, t, 16);
  28951. /* t = a^ffffffffffff = t2 * t3 */
  28952. sp_384_mont_mul_order_12(t, t2, t3);
  28953. /* t2= a^ffffffffffff000000000000 = t ^ 2 ^ 48 */
  28954. sp_384_mont_sqr_n_order_12(t2, t, 48);
  28955. /* t= a^fffffffffffffffffffffffff = t2 * t */
  28956. sp_384_mont_mul_order_12(t, t2, t);
  28957. /* t2= a^ffffffffffffffffffffffff000000000000000000000000 */
  28958. sp_384_mont_sqr_n_order_12(t2, t, 96);
  28959. /* t2= a^ffffffffffffffffffffffffffffffffffffffffffffffff = t2 * t */
  28960. sp_384_mont_mul_order_12(t2, t2, t);
  28961. for (i=191; i>=1; i--) {
  28962. sp_384_mont_sqr_order_12(t2, t2);
  28963. if ((p384_order_low[i / 32] & ((sp_int_digit)1 << (i % 32))) != 0) {
  28964. sp_384_mont_mul_order_12(t2, t2, a);
  28965. }
  28966. }
  28967. sp_384_mont_sqr_order_12(t2, t2);
  28968. sp_384_mont_mul_order_12(r, t2, a);
  28969. #endif /* WOLFSSL_SP_SMALL */
  28970. }
  28971. #endif /* HAVE_ECC_SIGN || (HAVE_ECC_VERIFY && WOLFSSL_SP_SMALL) */
  28972. #endif /* HAVE_ECC_SIGN | HAVE_ECC_VERIFY */
  28973. #ifdef HAVE_ECC_SIGN
  28974. #ifndef SP_ECC_MAX_SIG_GEN
  28975. #define SP_ECC_MAX_SIG_GEN 64
  28976. #endif
  28977. /* Calculate second signature value S from R, k and private value.
  28978. *
  28979. * s = (r * x + e) / k
  28980. *
  28981. * s Signature value.
  28982. * r First signature value.
  28983. * k Ephemeral private key.
  28984. * x Private key as a number.
  28985. * e Hash of message as a number.
  28986. * tmp Temporary storage for intermediate numbers.
  28987. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  28988. */
  28989. static int sp_384_calc_s_12(sp_digit* s, const sp_digit* r, sp_digit* k,
  28990. sp_digit* x, const sp_digit* e, sp_digit* tmp)
  28991. {
  28992. int err;
  28993. sp_digit carry;
  28994. sp_int32 c;
  28995. sp_digit* kInv = k;
  28996. /* Conv k to Montgomery form (mod order) */
  28997. sp_384_mul_12(k, k, p384_norm_order);
  28998. err = sp_384_mod_12(k, k, p384_order);
  28999. if (err == MP_OKAY) {
  29000. sp_384_norm_12(k);
  29001. /* kInv = 1/k mod order */
  29002. sp_384_mont_inv_order_12(kInv, k, tmp);
  29003. sp_384_norm_12(kInv);
  29004. /* s = r * x + e */
  29005. sp_384_mul_12(x, x, r);
  29006. err = sp_384_mod_12(x, x, p384_order);
  29007. }
  29008. if (err == MP_OKAY) {
  29009. sp_384_norm_12(x);
  29010. carry = sp_384_add_12(s, e, x);
  29011. sp_384_cond_sub_12(s, s, p384_order, 0 - carry);
  29012. sp_384_norm_12(s);
  29013. c = sp_384_cmp_12(s, p384_order);
  29014. sp_384_cond_sub_12(s, s, p384_order,
  29015. (sp_digit)0 - (sp_digit)(c >= 0));
  29016. sp_384_norm_12(s);
  29017. /* s = s * k^-1 mod order */
  29018. sp_384_mont_mul_order_12(s, s, kInv);
  29019. sp_384_norm_12(s);
  29020. }
  29021. return err;
  29022. }
  29023. /* Sign the hash using the private key.
  29024. * e = [hash, 384 bits] from binary
  29025. * r = (k.G)->x mod order
  29026. * s = (r * x + e) / k mod order
  29027. * The hash is truncated to the first 384 bits.
  29028. *
  29029. * hash Hash to sign.
  29030. * hashLen Length of the hash data.
  29031. * rng Random number generator.
  29032. * priv Private part of key - scalar.
  29033. * rm First part of result as an mp_int.
  29034. * sm Second part of result as an mp_int.
  29035. * heap Heap to use for allocation.
  29036. * returns RNG failures, MEMORY_E when memory allocation fails and
  29037. * MP_OKAY on success.
  29038. */
  29039. #ifdef WOLFSSL_SP_NONBLOCK
  29040. typedef struct sp_ecc_sign_384_ctx { /* State kept between calls of sp_ecc_sign_384_nb */
  29041. int state; /* Step of the signing state machine to run next */
  29042. union { /* Contexts of the nested non-blocking operations; each is zeroed before use */
  29043. sp_384_ecc_mulmod_12_ctx mulmod_ctx; /* Scalar multiplication k.G */
  29044. sp_384_mont_inv_order_12_ctx mont_inv_order_ctx; /* Inversion of k mod order */
  29045. };
  29046. sp_digit e[2*12]; /* Hash of the message as a number */
  29047. sp_digit x[2*12]; /* Private key as a number; later multiplied by r */
  29048. sp_digit k[2*12]; /* Ephemeral scalar, converted to Montgomery form */
  29049. sp_digit r[2*12]; /* X ordinate of k.G reduced mod order */
  29050. sp_digit tmp[3 * 2*12]; /* Scratch passed to the inversion */
  29051. sp_point_384 point; /* Result of the scalar multiplication */
  29052. sp_digit* s; /* Set to e by the INIT state: s shares e's storage */
  29053. sp_digit* kInv; /* Set to k by the INIT state: the inverse overwrites k */
  29054. int i; /* Initialised to SP_ECC_MAX_SIG_GEN; presumably a retry counter - confirm */
  29055. } sp_ecc_sign_384_ctx;
  29056. int sp_ecc_sign_384_nb(sp_ecc_ctx_t* sp_ctx, const byte* hash, word32 hashLen, WC_RNG* rng,
  29057. mp_int* priv, mp_int* rm, mp_int* sm, mp_int* km, void* heap)
  29058. {
  29059. int err = FP_WOULDBLOCK;
  29060. sp_ecc_sign_384_ctx* ctx = (sp_ecc_sign_384_ctx*)sp_ctx->data;
  29061. typedef char ctx_size_test[sizeof(sp_ecc_sign_384_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  29062. (void)sizeof(ctx_size_test);
  29063. (void)heap;
  29064. switch (ctx->state) {
  29065. case 0: /* INIT */
  29066. ctx->s = ctx->e;
  29067. ctx->kInv = ctx->k;
  29068. ctx->i = SP_ECC_MAX_SIG_GEN;
  29069. ctx->state = 1;
  29070. break;
  29071. case 1: /* GEN */
  29072. /* New random point. */
  29073. if (km == NULL || mp_iszero(km)) {
  29074. err = sp_384_ecc_gen_k_12(rng, ctx->k);
  29075. }
  29076. else {
  29077. sp_384_from_mp(ctx->k, 12, km);
  29078. mp_zero(km);
  29079. }
  29080. XMEMSET(&ctx->mulmod_ctx, 0, sizeof(ctx->mulmod_ctx));
  29081. ctx->state = 2;
  29082. break;
  29083. case 2: /* MULMOD */
  29084. err = sp_384_ecc_mulmod_12_nb((sp_ecc_ctx_t*)&ctx->mulmod_ctx,
  29085. &ctx->point, &p384_base, ctx->k, 1, 1, heap);
  29086. if (err == MP_OKAY) {
  29087. ctx->state = 3;
  29088. }
  29089. break;
  29090. case 3: /* MODORDER */
  29091. {
  29092. sp_int32 c;
  29093. /* r = point->x mod order */
  29094. XMEMCPY(ctx->r, ctx->point.x, sizeof(sp_digit) * 12U);
  29095. sp_384_norm_12(ctx->r);
  29096. c = sp_384_cmp_12(ctx->r, p384_order);
  29097. sp_384_cond_sub_12(ctx->r, ctx->r, p384_order,
  29098. (sp_digit)0 - (sp_digit)(c >= 0));
  29099. sp_384_norm_12(ctx->r);
  29100. if (hashLen > 48U) {
  29101. hashLen = 48U;
  29102. }
  29103. sp_384_from_mp(ctx->x, 12, priv);
  29104. sp_384_from_bin(ctx->e, 12, hash, (int)hashLen);
  29105. ctx->state = 4;
  29106. break;
  29107. }
  29108. case 4: /* KMODORDER */
  29109. /* Conv k to Montgomery form (mod order) */
  29110. sp_384_mul_12(ctx->k, ctx->k, p384_norm_order);
  29111. err = sp_384_mod_12(ctx->k, ctx->k, p384_order);
  29112. if (err == MP_OKAY) {
  29113. sp_384_norm_12(ctx->k);
  29114. XMEMSET(&ctx->mont_inv_order_ctx, 0, sizeof(ctx->mont_inv_order_ctx));
  29115. ctx->state = 5;
  29116. }
  29117. break;
  29118. case 5: /* KINV */
  29119. /* kInv = 1/k mod order */
  29120. err = sp_384_mont_inv_order_12_nb((sp_ecc_ctx_t*)&ctx->mont_inv_order_ctx, ctx->kInv, ctx->k, ctx->tmp);
  29121. if (err == MP_OKAY) {
  29122. XMEMSET(&ctx->mont_inv_order_ctx, 0, sizeof(ctx->mont_inv_order_ctx));
  29123. ctx->state = 6;
  29124. }
  29125. break;
  29126. case 6: /* KINVNORM */
  29127. sp_384_norm_12(ctx->kInv);
  29128. ctx->state = 7;
  29129. break;
  29130. case 7: /* R */
  29131. /* s = r * x + e */
  29132. sp_384_mul_12(ctx->x, ctx->x, ctx->r);
  29133. ctx->state = 8;
  29134. break;
  29135. case 8: /* S1 */
  29136. err = sp_384_mod_12(ctx->x, ctx->x, p384_order);
  29137. if (err == MP_OKAY)
  29138. ctx->state = 9;
  29139. break;
  29140. case 9: /* S2 */
  29141. {
  29142. sp_digit carry;
  29143. sp_int32 c;
  29144. sp_384_norm_12(ctx->x);
  29145. carry = sp_384_add_12(ctx->s, ctx->e, ctx->x);
  29146. sp_384_cond_sub_12(ctx->s, ctx->s,
  29147. p384_order, 0 - carry);
  29148. sp_384_norm_12(ctx->s);
  29149. c = sp_384_cmp_12(ctx->s, p384_order);
  29150. sp_384_cond_sub_12(ctx->s, ctx->s, p384_order,
  29151. (sp_digit)0 - (sp_digit)(c >= 0));
  29152. sp_384_norm_12(ctx->s);
  29153. /* s = s * k^-1 mod order */
  29154. sp_384_mont_mul_order_12(ctx->s, ctx->s, ctx->kInv);
  29155. sp_384_norm_12(ctx->s);
  29156. /* Check that signature is usable. */
  29157. if (sp_384_iszero_12(ctx->s) == 0) {
  29158. ctx->state = 10;
  29159. break;
  29160. }
  29161. #ifdef WOLFSSL_ECDSA_SET_K_ONE_LOOP
  29162. ctx->i = 1;
  29163. #endif
  29164. /* not usable gen, try again */
  29165. ctx->i--;
  29166. if (ctx->i == 0) {
  29167. err = RNG_FAILURE_E;
  29168. }
  29169. ctx->state = 1;
  29170. break;
  29171. }
  29172. case 10: /* RES */
  29173. err = sp_384_to_mp(ctx->r, rm);
  29174. if (err == MP_OKAY) {
  29175. err = sp_384_to_mp(ctx->s, sm);
  29176. }
  29177. break;
  29178. }
  29179. if (err == MP_OKAY && ctx->state != 10) {
  29180. err = FP_WOULDBLOCK;
  29181. }
  29182. if (err != FP_WOULDBLOCK) {
  29183. XMEMSET(ctx->e, 0, sizeof(sp_digit) * 2U * 12U);
  29184. XMEMSET(ctx->x, 0, sizeof(sp_digit) * 2U * 12U);
  29185. XMEMSET(ctx->k, 0, sizeof(sp_digit) * 2U * 12U);
  29186. XMEMSET(ctx->r, 0, sizeof(sp_digit) * 2U * 12U);
  29187. XMEMSET(ctx->tmp, 0, sizeof(sp_digit) * 3U * 2U * 12U);
  29188. }
  29189. return err;
  29190. }
  29191. #endif /* WOLFSSL_SP_NONBLOCK */
  29192. int sp_ecc_sign_384(const byte* hash, word32 hashLen, WC_RNG* rng,
  29193. const mp_int* priv, mp_int* rm, mp_int* sm, mp_int* km, void* heap)
  29194. {
  29195. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29196. sp_digit* e = NULL;
  29197. sp_point_384* point = NULL;
  29198. #else
  29199. sp_digit e[7 * 2 * 12];
  29200. sp_point_384 point[1];
  29201. #endif
  29202. sp_digit* x = NULL;
  29203. sp_digit* k = NULL;
  29204. sp_digit* r = NULL;
  29205. sp_digit* tmp = NULL;
  29206. sp_digit* s = NULL;
  29207. sp_int32 c;
  29208. int err = MP_OKAY;
  29209. int i;
  29210. (void)heap;
  29211. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29212. if (err == MP_OKAY) {
  29213. point = (sp_point_384*)XMALLOC(sizeof(sp_point_384), heap,
  29214. DYNAMIC_TYPE_ECC);
  29215. if (point == NULL)
  29216. err = MEMORY_E;
  29217. }
  29218. if (err == MP_OKAY) {
  29219. e = (sp_digit*)XMALLOC(sizeof(sp_digit) * 7 * 2 * 12, heap,
  29220. DYNAMIC_TYPE_ECC);
  29221. if (e == NULL)
  29222. err = MEMORY_E;
  29223. }
  29224. #endif
  29225. if (err == MP_OKAY) {
  29226. x = e + 2 * 12;
  29227. k = e + 4 * 12;
  29228. r = e + 6 * 12;
  29229. tmp = e + 8 * 12;
  29230. s = e;
  29231. if (hashLen > 48U) {
  29232. hashLen = 48U;
  29233. }
  29234. }
  29235. for (i = SP_ECC_MAX_SIG_GEN; err == MP_OKAY && i > 0; i--) {
  29236. /* New random point. */
  29237. if (km == NULL || mp_iszero(km)) {
  29238. err = sp_384_ecc_gen_k_12(rng, k);
  29239. }
  29240. else {
  29241. sp_384_from_mp(k, 12, km);
  29242. mp_zero(km);
  29243. }
  29244. if (err == MP_OKAY) {
  29245. err = sp_384_ecc_mulmod_base_12(point, k, 1, 1, heap);
  29246. }
  29247. if (err == MP_OKAY) {
  29248. /* r = point->x mod order */
  29249. XMEMCPY(r, point->x, sizeof(sp_digit) * 12U);
  29250. sp_384_norm_12(r);
  29251. c = sp_384_cmp_12(r, p384_order);
  29252. sp_384_cond_sub_12(r, r, p384_order,
  29253. (sp_digit)0 - (sp_digit)(c >= 0));
  29254. sp_384_norm_12(r);
  29255. sp_384_from_mp(x, 12, priv);
  29256. sp_384_from_bin(e, 12, hash, (int)hashLen);
  29257. err = sp_384_calc_s_12(s, r, k, x, e, tmp);
  29258. }
  29259. /* Check that signature is usable. */
  29260. if ((err == MP_OKAY) && (sp_384_iszero_12(s) == 0)) {
  29261. break;
  29262. }
  29263. #ifdef WOLFSSL_ECDSA_SET_K_ONE_LOOP
  29264. i = 1;
  29265. #endif
  29266. }
  29267. if (i == 0) {
  29268. err = RNG_FAILURE_E;
  29269. }
  29270. if (err == MP_OKAY) {
  29271. err = sp_384_to_mp(r, rm);
  29272. }
  29273. if (err == MP_OKAY) {
  29274. err = sp_384_to_mp(s, sm);
  29275. }
  29276. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29277. if (e != NULL)
  29278. #endif
  29279. {
  29280. ForceZero(e, sizeof(sp_digit) * 7 * 2 * 12);
  29281. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29282. XFREE(e, heap, DYNAMIC_TYPE_ECC);
  29283. #endif
  29284. }
  29285. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29286. if (point != NULL)
  29287. #endif
  29288. {
  29289. ForceZero(point, sizeof(sp_point_384));
  29290. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29291. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  29292. #endif
  29293. }
  29294. return err;
  29295. }
  29296. #endif /* HAVE_ECC_SIGN */
  29297. #ifndef WOLFSSL_SP_SMALL
  29298. /* Divide the number by 2 mod the modulus. (r = a / 2 % m)
  29299. *
  29300. * r Result of division by 2.
  29301. * a Number to divide.
  29302. * m Modulus.
  29303. */
  29304. static void sp_384_div2_mod_12(sp_digit* r, const sp_digit* a, const sp_digit* m)
  29305. {
  29306. __asm__ __volatile__ (
  29307. "ldr r4, [%[a]]\n\t"
  29308. "ands r8, r4, #1\n\t"
  29309. "beq 1f\n\t"
  29310. "mov r12, #0\n\t"
  29311. "ldr r5, [%[a], #4]\n\t"
  29312. "ldr r6, [%[a], #8]\n\t"
  29313. "ldr r7, [%[a], #12]\n\t"
  29314. "ldr r8, [%[m], #0]\n\t"
  29315. "ldr r9, [%[m], #4]\n\t"
  29316. "ldr r10, [%[m], #8]\n\t"
  29317. "ldr r14, [%[m], #12]\n\t"
  29318. "adds r4, r4, r8\n\t"
  29319. "adcs r5, r5, r9\n\t"
  29320. "adcs r6, r6, r10\n\t"
  29321. "adcs r7, r7, r14\n\t"
  29322. "str r4, [%[r], #0]\n\t"
  29323. "str r5, [%[r], #4]\n\t"
  29324. "str r6, [%[r], #8]\n\t"
  29325. "str r7, [%[r], #12]\n\t"
  29326. "ldr r4, [%[a], #16]\n\t"
  29327. "ldr r5, [%[a], #20]\n\t"
  29328. "ldr r6, [%[a], #24]\n\t"
  29329. "ldr r7, [%[a], #28]\n\t"
  29330. "ldr r8, [%[m], #16]\n\t"
  29331. "ldr r9, [%[m], #20]\n\t"
  29332. "ldr r10, [%[m], #24]\n\t"
  29333. "ldr r14, [%[m], #28]\n\t"
  29334. "adcs r4, r4, r8\n\t"
  29335. "adcs r5, r5, r9\n\t"
  29336. "adcs r6, r6, r10\n\t"
  29337. "adcs r7, r7, r14\n\t"
  29338. "str r4, [%[r], #16]\n\t"
  29339. "str r5, [%[r], #20]\n\t"
  29340. "str r6, [%[r], #24]\n\t"
  29341. "str r7, [%[r], #28]\n\t"
  29342. "ldr r4, [%[a], #32]\n\t"
  29343. "ldr r5, [%[a], #36]\n\t"
  29344. "ldr r6, [%[a], #40]\n\t"
  29345. "ldr r7, [%[a], #44]\n\t"
  29346. "ldr r8, [%[m], #32]\n\t"
  29347. "ldr r9, [%[m], #36]\n\t"
  29348. "ldr r10, [%[m], #40]\n\t"
  29349. "ldr r14, [%[m], #44]\n\t"
  29350. "adcs r4, r4, r8\n\t"
  29351. "adcs r5, r5, r9\n\t"
  29352. "adcs r6, r6, r10\n\t"
  29353. "adcs r7, r7, r14\n\t"
  29354. "str r4, [%[r], #32]\n\t"
  29355. "str r5, [%[r], #36]\n\t"
  29356. "str r6, [%[r], #40]\n\t"
  29357. "str r7, [%[r], #44]\n\t"
  29358. "adc r8, r12, r12\n\t"
  29359. "b 2f\n\t"
  29360. "\n1:\n\t"
  29361. "ldr r5, [%[a], #2]\n\t"
  29362. "str r4, [%[r], #0]\n\t"
  29363. "str r5, [%[r], #2]\n\t"
  29364. "ldr r4, [%[a], #4]\n\t"
  29365. "ldr r5, [%[a], #6]\n\t"
  29366. "str r4, [%[r], #4]\n\t"
  29367. "str r5, [%[r], #6]\n\t"
  29368. "ldr r4, [%[a], #8]\n\t"
  29369. "ldr r5, [%[a], #10]\n\t"
  29370. "str r4, [%[r], #8]\n\t"
  29371. "str r5, [%[r], #10]\n\t"
  29372. "ldr r4, [%[a], #12]\n\t"
  29373. "ldr r5, [%[a], #14]\n\t"
  29374. "str r4, [%[r], #12]\n\t"
  29375. "str r5, [%[r], #14]\n\t"
  29376. "ldr r4, [%[a], #16]\n\t"
  29377. "ldr r5, [%[a], #18]\n\t"
  29378. "str r4, [%[r], #16]\n\t"
  29379. "str r5, [%[r], #18]\n\t"
  29380. "ldr r4, [%[a], #20]\n\t"
  29381. "ldr r5, [%[a], #22]\n\t"
  29382. "str r4, [%[r], #20]\n\t"
  29383. "str r5, [%[r], #22]\n\t"
  29384. "\n2:\n\t"
  29385. "ldr r3, [%[r]]\n\t"
  29386. "ldr r4, [%[r], #4]\n\t"
  29387. "lsr r3, r3, #1\n\t"
  29388. "orr r3, r3, r4, lsl #31\n\t"
  29389. "lsr r4, r4, #1\n\t"
  29390. "ldr r5, [%[a], #8]\n\t"
  29391. "str r3, [%[r], #0]\n\t"
  29392. "orr r4, r4, r5, lsl #31\n\t"
  29393. "lsr r5, r5, #1\n\t"
  29394. "ldr r3, [%[a], #12]\n\t"
  29395. "str r4, [%[r], #4]\n\t"
  29396. "orr r5, r5, r3, lsl #31\n\t"
  29397. "lsr r3, r3, #1\n\t"
  29398. "ldr r4, [%[a], #16]\n\t"
  29399. "str r5, [%[r], #8]\n\t"
  29400. "orr r3, r3, r4, lsl #31\n\t"
  29401. "lsr r4, r4, #1\n\t"
  29402. "ldr r5, [%[a], #20]\n\t"
  29403. "str r3, [%[r], #12]\n\t"
  29404. "orr r4, r4, r5, lsl #31\n\t"
  29405. "lsr r5, r5, #1\n\t"
  29406. "ldr r3, [%[a], #24]\n\t"
  29407. "str r4, [%[r], #16]\n\t"
  29408. "orr r5, r5, r3, lsl #31\n\t"
  29409. "lsr r3, r3, #1\n\t"
  29410. "ldr r4, [%[a], #28]\n\t"
  29411. "str r5, [%[r], #20]\n\t"
  29412. "orr r3, r3, r4, lsl #31\n\t"
  29413. "lsr r4, r4, #1\n\t"
  29414. "ldr r5, [%[a], #32]\n\t"
  29415. "str r3, [%[r], #24]\n\t"
  29416. "orr r4, r4, r5, lsl #31\n\t"
  29417. "lsr r5, r5, #1\n\t"
  29418. "ldr r3, [%[a], #36]\n\t"
  29419. "str r4, [%[r], #28]\n\t"
  29420. "orr r5, r5, r3, lsl #31\n\t"
  29421. "lsr r3, r3, #1\n\t"
  29422. "ldr r4, [%[a], #40]\n\t"
  29423. "str r5, [%[r], #32]\n\t"
  29424. "orr r3, r3, r4, lsl #31\n\t"
  29425. "lsr r4, r4, #1\n\t"
  29426. "ldr r5, [%[a], #44]\n\t"
  29427. "str r3, [%[r], #36]\n\t"
  29428. "orr r4, r4, r5, lsl #31\n\t"
  29429. "lsr r5, r5, #1\n\t"
  29430. "orr r5, r5, r8, lsl #31\n\t"
  29431. "str r4, [%[r], #40]\n\t"
  29432. "str r5, [%[r], #44]\n\t"
  29433. :
  29434. : [r] "r" (r), [a] "r" (a), [m] "r" (m)
  29435. : "memory", "r3", "r4", "r5", "r6", "r7", "r8", "r9", "r10", "r14"
  29436. );
  29437. }
  29438. static int sp_384_num_bits_12(sp_digit* a)
  29439. {
  29440. int r = 0;
  29441. __asm__ __volatile__ (
  29442. "ldr r2, [%[a], #44]\n\t"
  29443. "cmp r2, #0\n\t"
  29444. "beq 11f\n\t"
  29445. "mov r3, #384\n\t"
  29446. "clz %[r], r2\n\t"
  29447. "sub %[r], r3, %[r]\n\t"
  29448. "b 13f\n\t"
  29449. "\n11:\n\t"
  29450. "ldr r2, [%[a], #40]\n\t"
  29451. "cmp r2, #0\n\t"
  29452. "beq 10f\n\t"
  29453. "mov r3, #352\n\t"
  29454. "clz %[r], r2\n\t"
  29455. "sub %[r], r3, %[r]\n\t"
  29456. "b 13f\n\t"
  29457. "\n10:\n\t"
  29458. "ldr r2, [%[a], #36]\n\t"
  29459. "cmp r2, #0\n\t"
  29460. "beq 9f\n\t"
  29461. "mov r3, #320\n\t"
  29462. "clz %[r], r2\n\t"
  29463. "sub %[r], r3, %[r]\n\t"
  29464. "b 13f\n\t"
  29465. "\n9:\n\t"
  29466. "ldr r2, [%[a], #32]\n\t"
  29467. "cmp r2, #0\n\t"
  29468. "beq 8f\n\t"
  29469. "mov r3, #288\n\t"
  29470. "clz %[r], r2\n\t"
  29471. "sub %[r], r3, %[r]\n\t"
  29472. "b 13f\n\t"
  29473. "\n8:\n\t"
  29474. "ldr r2, [%[a], #28]\n\t"
  29475. "cmp r2, #0\n\t"
  29476. "beq 7f\n\t"
  29477. "mov r3, #256\n\t"
  29478. "clz %[r], r2\n\t"
  29479. "sub %[r], r3, %[r]\n\t"
  29480. "b 13f\n\t"
  29481. "\n7:\n\t"
  29482. "ldr r2, [%[a], #24]\n\t"
  29483. "cmp r2, #0\n\t"
  29484. "beq 6f\n\t"
  29485. "mov r3, #224\n\t"
  29486. "clz %[r], r2\n\t"
  29487. "sub %[r], r3, %[r]\n\t"
  29488. "b 13f\n\t"
  29489. "\n6:\n\t"
  29490. "ldr r2, [%[a], #20]\n\t"
  29491. "cmp r2, #0\n\t"
  29492. "beq 5f\n\t"
  29493. "mov r3, #192\n\t"
  29494. "clz %[r], r2\n\t"
  29495. "sub %[r], r3, %[r]\n\t"
  29496. "b 13f\n\t"
  29497. "\n5:\n\t"
  29498. "ldr r2, [%[a], #16]\n\t"
  29499. "cmp r2, #0\n\t"
  29500. "beq 4f\n\t"
  29501. "mov r3, #160\n\t"
  29502. "clz %[r], r2\n\t"
  29503. "sub %[r], r3, %[r]\n\t"
  29504. "b 13f\n\t"
  29505. "\n4:\n\t"
  29506. "ldr r2, [%[a], #12]\n\t"
  29507. "cmp r2, #0\n\t"
  29508. "beq 3f\n\t"
  29509. "mov r3, #128\n\t"
  29510. "clz %[r], r2\n\t"
  29511. "sub %[r], r3, %[r]\n\t"
  29512. "b 13f\n\t"
  29513. "\n3:\n\t"
  29514. "ldr r2, [%[a], #8]\n\t"
  29515. "cmp r2, #0\n\t"
  29516. "beq 2f\n\t"
  29517. "mov r3, #96\n\t"
  29518. "clz %[r], r2\n\t"
  29519. "sub %[r], r3, %[r]\n\t"
  29520. "b 13f\n\t"
  29521. "\n2:\n\t"
  29522. "ldr r2, [%[a], #4]\n\t"
  29523. "cmp r2, #0\n\t"
  29524. "beq 1f\n\t"
  29525. "mov r3, #64\n\t"
  29526. "clz %[r], r2\n\t"
  29527. "sub %[r], r3, %[r]\n\t"
  29528. "b 13f\n\t"
  29529. "\n1:\n\t"
  29530. "ldr r2, [%[a], #0]\n\t"
  29531. "mov r3, #32\n\t"
  29532. "clz %[r], r2\n\t"
  29533. "sub %[r], r3, %[r]\n\t"
  29534. "\n13:\n\t"
  29535. : [r] "+r" (r)
  29536. : [a] "r" (a)
  29537. : "r2", "r3"
  29538. );
  29539. return r;
  29540. }
  29541. /* Non-constant time modular inversion.
  29542. *
  29543. * @param [out] r Resulting number.
  29544. * @param [in] a Number to invert.
  29545. * @param [in] m Modulus.
  29546. * @return MP_OKAY on success.
  29547. */
  29548. static int sp_384_mod_inv_12(sp_digit* r, const sp_digit* a, const sp_digit* m)
  29549. {
  29550. sp_digit u[12];
  29551. sp_digit v[12];
  29552. sp_digit b[12];
  29553. sp_digit d[12];
  29554. int ut, vt;
  29555. sp_digit o;
  29556. XMEMCPY(u, m, sizeof(u));
  29557. XMEMCPY(v, a, sizeof(v));
  29558. ut = sp_384_num_bits_12(u);
  29559. vt = sp_384_num_bits_12(v);
  29560. XMEMSET(b, 0, sizeof(b));
  29561. if ((v[0] & 1) == 0) {
  29562. sp_384_rshift1_12(v, v);
  29563. XMEMCPY(d, m, sizeof(u));
  29564. d[0] += 1;
  29565. sp_384_rshift1_12(d, d);
  29566. vt--;
  29567. while ((v[0] & 1) == 0) {
  29568. sp_384_rshift1_12(v, v);
  29569. sp_384_div2_mod_12(d, d, m);
  29570. vt--;
  29571. }
  29572. }
  29573. else {
  29574. XMEMSET(d+1, 0, sizeof(d)-sizeof(sp_digit));
  29575. d[0] = 1;
  29576. }
  29577. while (ut > 1 && vt > 1) {
  29578. if (ut > vt || (ut == vt && sp_384_cmp_12(u, v) >= 0)) {
  29579. sp_384_sub_12(u, u, v);
  29580. o = sp_384_sub_12(b, b, d);
  29581. if (o != 0)
  29582. sp_384_add_12(b, b, m);
  29583. ut = sp_384_num_bits_12(u);
  29584. do {
  29585. sp_384_rshift1_12(u, u);
  29586. sp_384_div2_mod_12(b, b, m);
  29587. ut--;
  29588. }
  29589. while (ut > 0 && (u[0] & 1) == 0);
  29590. }
  29591. else {
  29592. sp_384_sub_12(v, v, u);
  29593. o = sp_384_sub_12(d, d, b);
  29594. if (o != 0)
  29595. sp_384_add_12(d, d, m);
  29596. vt = sp_384_num_bits_12(v);
  29597. do {
  29598. sp_384_rshift1_12(v, v);
  29599. sp_384_div2_mod_12(d, d, m);
  29600. vt--;
  29601. }
  29602. while (vt > 0 && (v[0] & 1) == 0);
  29603. }
  29604. }
  29605. if (ut == 1)
  29606. XMEMCPY(r, b, sizeof(b));
  29607. else
  29608. XMEMCPY(r, d, sizeof(d));
  29609. return MP_OKAY;
  29610. }
  29611. #endif /* WOLFSSL_SP_SMALL */
  29612. /* Add point p1 into point p2. Handles p1 == p2 and result at infinity.
  29613. *
  29614. * p1 First point to add and holds result.
  29615. * p2 Second point to add.
  29616. * tmp Temporary storage for intermediate numbers.
  29617. */
  29618. static void sp_384_add_points_12(sp_point_384* p1, const sp_point_384* p2,
  29619. sp_digit* tmp)
  29620. {
  29621. sp_384_proj_point_add_12(p1, p1, p2, tmp);
  29622. if (sp_384_iszero_12(p1->z)) {
  29623. if (sp_384_iszero_12(p1->x) && sp_384_iszero_12(p1->y)) {
  29624. sp_384_proj_point_dbl_12(p1, p2, tmp);
  29625. }
  29626. else {
  29627. /* Y ordinate is not used from here - don't set. */
  29628. p1->x[0] = 0;
  29629. p1->x[1] = 0;
  29630. p1->x[2] = 0;
  29631. p1->x[3] = 0;
  29632. p1->x[4] = 0;
  29633. p1->x[5] = 0;
  29634. p1->x[6] = 0;
  29635. p1->x[7] = 0;
  29636. p1->x[8] = 0;
  29637. p1->x[9] = 0;
  29638. p1->x[10] = 0;
  29639. p1->x[11] = 0;
  29640. XMEMCPY(p1->z, p384_norm_mod, sizeof(p384_norm_mod));
  29641. }
  29642. }
  29643. }
  29644. /* Calculate the verification point: [e/s]G + [r/s]Q
  29645. *
  29646. * p1 Calculated point.
  29647. * p2 Public point and temporary.
  29648. * s Second part of signature as a number.
  29649. * u1 Temporary number.
  29650. * u2 Temproray number.
  29651. * heap Heap to use for allocation.
  29652. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  29653. */
  29654. static int sp_384_calc_vfy_point_12(sp_point_384* p1, sp_point_384* p2,
  29655. sp_digit* s, sp_digit* u1, sp_digit* u2, sp_digit* tmp, void* heap)
  29656. {
  29657. int err;
  29658. #ifndef WOLFSSL_SP_SMALL
  29659. err = sp_384_mod_inv_12(s, s, p384_order);
  29660. if (err == MP_OKAY)
  29661. #endif /* !WOLFSSL_SP_SMALL */
  29662. {
  29663. sp_384_mul_12(s, s, p384_norm_order);
  29664. err = sp_384_mod_12(s, s, p384_order);
  29665. }
  29666. if (err == MP_OKAY) {
  29667. sp_384_norm_12(s);
  29668. #ifdef WOLFSSL_SP_SMALL
  29669. {
  29670. sp_384_mont_inv_order_12(s, s, tmp);
  29671. sp_384_mont_mul_order_12(u1, u1, s);
  29672. sp_384_mont_mul_order_12(u2, u2, s);
  29673. }
  29674. #else
  29675. {
  29676. sp_384_mont_mul_order_12(u1, u1, s);
  29677. sp_384_mont_mul_order_12(u2, u2, s);
  29678. }
  29679. #endif /* WOLFSSL_SP_SMALL */
  29680. {
  29681. err = sp_384_ecc_mulmod_base_12(p1, u1, 0, 0, heap);
  29682. }
  29683. }
  29684. if ((err == MP_OKAY) && sp_384_iszero_12(p1->z)) {
  29685. p1->infinity = 1;
  29686. }
  29687. if (err == MP_OKAY) {
  29688. err = sp_384_ecc_mulmod_12(p2, p2, u2, 0, 0, heap);
  29689. }
  29690. if ((err == MP_OKAY) && sp_384_iszero_12(p2->z)) {
  29691. p2->infinity = 1;
  29692. }
  29693. if (err == MP_OKAY) {
  29694. sp_384_add_points_12(p1, p2, tmp);
  29695. }
  29696. return err;
  29697. }
  29698. #ifdef HAVE_ECC_VERIFY
  29699. /* Verify the signature values with the hash and public key.
  29700. * e = Truncate(hash, 384)
  29701. * u1 = e/s mod order
  29702. * u2 = r/s mod order
  29703. * r == (u1.G + u2.Q)->x mod order
  29704. * Optimization: Leave point in projective form.
  29705. * (x, y, 1) == (x' / z'*z', y' / z'*z'*z', z' / z')
  29706. * (r + n*order).z'.z' mod prime == (u1.G + u2.Q)->x'
  29707. * The hash is truncated to the first 384 bits.
  29708. *
  29709. * hash Hash that was signed.
  29710. * hashLen Length of the hash data.
  29711. * pX, pY, pZ X, Y and Z ordinates of the public key point.
  29712. * rm First part of signature (r) as an mp_int.
  29713. * sm Second part of signature (s) as an mp_int.
  29714. * res Set to 1 when the signature verifies and 0 otherwise.
  29715. * heap Heap to use for allocation.
  29716. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  29717. */
  29718. #ifdef WOLFSSL_SP_NONBLOCK
  29719. typedef struct sp_ecc_verify_384_ctx {
  29720. int state;
  29721. union {
  29722. sp_384_ecc_mulmod_12_ctx mulmod_ctx;
  29723. sp_384_mont_inv_order_12_ctx mont_inv_order_ctx;
  29724. sp_384_proj_point_dbl_12_ctx dbl_ctx;
  29725. sp_384_proj_point_add_12_ctx add_ctx;
  29726. };
  29727. sp_digit u1[2*12];
  29728. sp_digit u2[2*12];
  29729. sp_digit s[2*12];
  29730. sp_digit tmp[2*12 * 6];
  29731. sp_point_384 p1;
  29732. sp_point_384 p2;
  29733. } sp_ecc_verify_384_ctx;
  29734. int sp_ecc_verify_384_nb(sp_ecc_ctx_t* sp_ctx, const byte* hash,
  29735. word32 hashLen, const mp_int* pX, const mp_int* pY, const mp_int* pZ,
  29736. const mp_int* rm, const mp_int* sm, int* res, void* heap)
  29737. {
  29738. int err = FP_WOULDBLOCK;
  29739. sp_ecc_verify_384_ctx* ctx = (sp_ecc_verify_384_ctx*)sp_ctx->data;
  29740. typedef char ctx_size_test[sizeof(sp_ecc_verify_384_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  29741. (void)sizeof(ctx_size_test);
  29742. switch (ctx->state) {
  29743. case 0: /* INIT */
  29744. if (hashLen > 48U) {
  29745. hashLen = 48U;
  29746. }
  29747. sp_384_from_bin(ctx->u1, 12, hash, (int)hashLen);
  29748. sp_384_from_mp(ctx->u2, 12, rm);
  29749. sp_384_from_mp(ctx->s, 12, sm);
  29750. sp_384_from_mp(ctx->p2.x, 12, pX);
  29751. sp_384_from_mp(ctx->p2.y, 12, pY);
  29752. sp_384_from_mp(ctx->p2.z, 12, pZ);
  29753. ctx->state = 1;
  29754. break;
  29755. case 1: /* NORMS0 */
  29756. sp_384_mul_12(ctx->s, ctx->s, p384_norm_order);
  29757. err = sp_384_mod_12(ctx->s, ctx->s, p384_order);
  29758. if (err == MP_OKAY)
  29759. ctx->state = 2;
  29760. break;
  29761. case 2: /* NORMS1 */
  29762. sp_384_norm_12(ctx->s);
  29763. XMEMSET(&ctx->mont_inv_order_ctx, 0, sizeof(ctx->mont_inv_order_ctx));
  29764. ctx->state = 3;
  29765. break;
  29766. case 3: /* NORMS2 */
  29767. err = sp_384_mont_inv_order_12_nb((sp_ecc_ctx_t*)&ctx->mont_inv_order_ctx, ctx->s, ctx->s, ctx->tmp);
  29768. if (err == MP_OKAY) {
  29769. ctx->state = 4;
  29770. }
  29771. break;
  29772. case 4: /* NORMS3 */
  29773. sp_384_mont_mul_order_12(ctx->u1, ctx->u1, ctx->s);
  29774. ctx->state = 5;
  29775. break;
  29776. case 5: /* NORMS4 */
  29777. sp_384_mont_mul_order_12(ctx->u2, ctx->u2, ctx->s);
  29778. XMEMSET(&ctx->mulmod_ctx, 0, sizeof(ctx->mulmod_ctx));
  29779. ctx->state = 6;
  29780. break;
  29781. case 6: /* MULBASE */
  29782. err = sp_384_ecc_mulmod_12_nb((sp_ecc_ctx_t*)&ctx->mulmod_ctx, &ctx->p1, &p384_base, ctx->u1, 0, 0, heap);
  29783. if (err == MP_OKAY) {
  29784. if (sp_384_iszero_12(ctx->p1.z)) {
  29785. ctx->p1.infinity = 1;
  29786. }
  29787. XMEMSET(&ctx->mulmod_ctx, 0, sizeof(ctx->mulmod_ctx));
  29788. ctx->state = 7;
  29789. }
  29790. break;
  29791. case 7: /* MULMOD */
  29792. err = sp_384_ecc_mulmod_12_nb((sp_ecc_ctx_t*)&ctx->mulmod_ctx, &ctx->p2, &ctx->p2, ctx->u2, 0, 0, heap);
  29793. if (err == MP_OKAY) {
  29794. if (sp_384_iszero_12(ctx->p2.z)) {
  29795. ctx->p2.infinity = 1;
  29796. }
  29797. XMEMSET(&ctx->add_ctx, 0, sizeof(ctx->add_ctx));
  29798. ctx->state = 8;
  29799. }
  29800. break;
  29801. case 8: /* ADD */
  29802. err = sp_384_proj_point_add_12_nb((sp_ecc_ctx_t*)&ctx->add_ctx, &ctx->p1, &ctx->p1, &ctx->p2, ctx->tmp);
  29803. if (err == MP_OKAY)
  29804. ctx->state = 9;
  29805. break;
  29806. case 9: /* MONT */
  29807. /* (r + n*order).z'.z' mod prime == (u1.G + u2.Q)->x' */
  29808. /* Reload r and convert to Montgomery form. */
  29809. sp_384_from_mp(ctx->u2, 12, rm);
  29810. err = sp_384_mod_mul_norm_12(ctx->u2, ctx->u2, p384_mod);
  29811. if (err == MP_OKAY)
  29812. ctx->state = 10;
  29813. break;
  29814. case 10: /* SQR */
  29815. /* u1 = r.z'.z' mod prime */
  29816. sp_384_mont_sqr_12(ctx->p1.z, ctx->p1.z, p384_mod, p384_mp_mod);
  29817. ctx->state = 11;
  29818. break;
  29819. case 11: /* MUL */
  29820. sp_384_mont_mul_12(ctx->u1, ctx->u2, ctx->p1.z, p384_mod, p384_mp_mod);
  29821. ctx->state = 12;
  29822. break;
  29823. case 12: /* RES */
  29824. {
  29825. sp_int32 c = 0;
  29826. err = MP_OKAY; /* math okay, now check result */
  29827. *res = (int)(sp_384_cmp_12(ctx->p1.x, ctx->u1) == 0);
  29828. if (*res == 0) {
  29829. sp_digit carry;
  29830. /* Reload r and add order. */
  29831. sp_384_from_mp(ctx->u2, 12, rm);
  29832. carry = sp_384_add_12(ctx->u2, ctx->u2, p384_order);
  29833. /* Carry means result is greater than mod and is not valid. */
  29834. if (carry == 0) {
  29835. sp_384_norm_12(ctx->u2);
  29836. /* Compare with mod and if greater or equal then not valid. */
  29837. c = sp_384_cmp_12(ctx->u2, p384_mod);
  29838. }
  29839. }
  29840. if ((*res == 0) && (c < 0)) {
  29841. /* Convert to Montogomery form */
  29842. err = sp_384_mod_mul_norm_12(ctx->u2, ctx->u2, p384_mod);
  29843. if (err == MP_OKAY) {
  29844. /* u1 = (r + 1*order).z'.z' mod prime */
  29845. sp_384_mont_mul_12(ctx->u1, ctx->u2, ctx->p1.z, p384_mod,
  29846. p384_mp_mod);
  29847. *res = (int)(sp_384_cmp_12(ctx->p1.x, ctx->u1) == 0);
  29848. }
  29849. }
  29850. break;
  29851. }
  29852. } /* switch */
  29853. if (err == MP_OKAY && ctx->state != 12) {
  29854. err = FP_WOULDBLOCK;
  29855. }
  29856. return err;
  29857. }
  29858. #endif /* WOLFSSL_SP_NONBLOCK */
  29859. int sp_ecc_verify_384(const byte* hash, word32 hashLen, const mp_int* pX,
  29860. const mp_int* pY, const mp_int* pZ, const mp_int* rm, const mp_int* sm,
  29861. int* res, void* heap)
  29862. {
  29863. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29864. sp_digit* u1 = NULL;
  29865. sp_point_384* p1 = NULL;
  29866. #else
  29867. sp_digit u1[18 * 12];
  29868. sp_point_384 p1[2];
  29869. #endif
  29870. sp_digit* u2 = NULL;
  29871. sp_digit* s = NULL;
  29872. sp_digit* tmp = NULL;
  29873. sp_point_384* p2 = NULL;
  29874. sp_digit carry;
  29875. sp_int32 c = 0;
  29876. int err = MP_OKAY;
  29877. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29878. if (err == MP_OKAY) {
  29879. p1 = (sp_point_384*)XMALLOC(sizeof(sp_point_384) * 2, heap,
  29880. DYNAMIC_TYPE_ECC);
  29881. if (p1 == NULL)
  29882. err = MEMORY_E;
  29883. }
  29884. if (err == MP_OKAY) {
  29885. u1 = (sp_digit*)XMALLOC(sizeof(sp_digit) * 18 * 12, heap,
  29886. DYNAMIC_TYPE_ECC);
  29887. if (u1 == NULL)
  29888. err = MEMORY_E;
  29889. }
  29890. #endif
  29891. if (err == MP_OKAY) {
  29892. u2 = u1 + 2 * 12;
  29893. s = u1 + 4 * 12;
  29894. tmp = u1 + 6 * 12;
  29895. p2 = p1 + 1;
  29896. if (hashLen > 48U) {
  29897. hashLen = 48U;
  29898. }
  29899. sp_384_from_bin(u1, 12, hash, (int)hashLen);
  29900. sp_384_from_mp(u2, 12, rm);
  29901. sp_384_from_mp(s, 12, sm);
  29902. sp_384_from_mp(p2->x, 12, pX);
  29903. sp_384_from_mp(p2->y, 12, pY);
  29904. sp_384_from_mp(p2->z, 12, pZ);
  29905. err = sp_384_calc_vfy_point_12(p1, p2, s, u1, u2, tmp, heap);
  29906. }
  29907. if (err == MP_OKAY) {
  29908. /* (r + n*order).z'.z' mod prime == (u1.G + u2.Q)->x' */
  29909. /* Reload r and convert to Montgomery form. */
  29910. sp_384_from_mp(u2, 12, rm);
  29911. err = sp_384_mod_mul_norm_12(u2, u2, p384_mod);
  29912. }
  29913. if (err == MP_OKAY) {
  29914. /* u1 = r.z'.z' mod prime */
  29915. sp_384_mont_sqr_12(p1->z, p1->z, p384_mod, p384_mp_mod);
  29916. sp_384_mont_mul_12(u1, u2, p1->z, p384_mod, p384_mp_mod);
  29917. *res = (int)(sp_384_cmp_12(p1->x, u1) == 0);
  29918. if (*res == 0) {
  29919. /* Reload r and add order. */
  29920. sp_384_from_mp(u2, 12, rm);
  29921. carry = sp_384_add_12(u2, u2, p384_order);
  29922. /* Carry means result is greater than mod and is not valid. */
  29923. if (carry == 0) {
  29924. sp_384_norm_12(u2);
  29925. /* Compare with mod and if greater or equal then not valid. */
  29926. c = sp_384_cmp_12(u2, p384_mod);
  29927. }
  29928. }
  29929. if ((*res == 0) && (c < 0)) {
  29930. /* Convert to Montogomery form */
  29931. err = sp_384_mod_mul_norm_12(u2, u2, p384_mod);
  29932. if (err == MP_OKAY) {
  29933. /* u1 = (r + 1*order).z'.z' mod prime */
  29934. {
  29935. sp_384_mont_mul_12(u1, u2, p1->z, p384_mod, p384_mp_mod);
  29936. }
  29937. *res = (sp_384_cmp_12(p1->x, u1) == 0);
  29938. }
  29939. }
  29940. }
  29941. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29942. if (u1 != NULL)
  29943. XFREE(u1, heap, DYNAMIC_TYPE_ECC);
  29944. if (p1 != NULL)
  29945. XFREE(p1, heap, DYNAMIC_TYPE_ECC);
  29946. #endif
  29947. return err;
  29948. }
  29949. #endif /* HAVE_ECC_VERIFY */
  29950. #ifdef HAVE_ECC_CHECK_KEY
  29951. /* Check that the x and y oridinates are a valid point on the curve.
  29952. *
  29953. * point EC point.
  29954. * heap Heap to use if dynamically allocating.
  29955. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  29956. * not on the curve and MP_OKAY otherwise.
  29957. */
  29958. static int sp_384_ecc_is_point_12(const sp_point_384* point,
  29959. void* heap)
  29960. {
  29961. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29962. sp_digit* t1 = NULL;
  29963. #else
  29964. sp_digit t1[12 * 4];
  29965. #endif
  29966. sp_digit* t2 = NULL;
  29967. int err = MP_OKAY;
  29968. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29969. t1 = (sp_digit*)XMALLOC(sizeof(sp_digit) * 12 * 4, heap, DYNAMIC_TYPE_ECC);
  29970. if (t1 == NULL)
  29971. err = MEMORY_E;
  29972. #endif
  29973. (void)heap;
  29974. if (err == MP_OKAY) {
  29975. t2 = t1 + 2 * 12;
  29976. sp_384_sqr_12(t1, point->y);
  29977. (void)sp_384_mod_12(t1, t1, p384_mod);
  29978. sp_384_sqr_12(t2, point->x);
  29979. (void)sp_384_mod_12(t2, t2, p384_mod);
  29980. sp_384_mul_12(t2, t2, point->x);
  29981. (void)sp_384_mod_12(t2, t2, p384_mod);
  29982. (void)sp_384_sub_12(t2, p384_mod, t2);
  29983. sp_384_mont_add_12(t1, t1, t2, p384_mod);
  29984. sp_384_mont_add_12(t1, t1, point->x, p384_mod);
  29985. sp_384_mont_add_12(t1, t1, point->x, p384_mod);
  29986. sp_384_mont_add_12(t1, t1, point->x, p384_mod);
  29987. if (sp_384_cmp_12(t1, p384_b) != 0) {
  29988. err = MP_VAL;
  29989. }
  29990. }
  29991. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  29992. if (t1 != NULL)
  29993. XFREE(t1, heap, DYNAMIC_TYPE_ECC);
  29994. #endif
  29995. return err;
  29996. }
  29997. /* Check that the x and y oridinates are a valid point on the curve.
  29998. *
  29999. * pX X ordinate of EC point.
  30000. * pY Y ordinate of EC point.
  30001. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  30002. * not on the curve and MP_OKAY otherwise.
  30003. */
  30004. int sp_ecc_is_point_384(const mp_int* pX, const mp_int* pY)
  30005. {
  30006. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30007. sp_point_384* pub = NULL;
  30008. #else
  30009. sp_point_384 pub[1];
  30010. #endif
  30011. const byte one[1] = { 1 };
  30012. int err = MP_OKAY;
  30013. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30014. pub = (sp_point_384*)XMALLOC(sizeof(sp_point_384), NULL,
  30015. DYNAMIC_TYPE_ECC);
  30016. if (pub == NULL)
  30017. err = MEMORY_E;
  30018. #endif
  30019. if (err == MP_OKAY) {
  30020. sp_384_from_mp(pub->x, 12, pX);
  30021. sp_384_from_mp(pub->y, 12, pY);
  30022. sp_384_from_bin(pub->z, 12, one, (int)sizeof(one));
  30023. err = sp_384_ecc_is_point_12(pub, NULL);
  30024. }
  30025. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30026. if (pub != NULL)
  30027. XFREE(pub, NULL, DYNAMIC_TYPE_ECC);
  30028. #endif
  30029. return err;
  30030. }
  30031. /* Check that the private scalar generates the EC point (px, py), the point is
  30032. * on the curve and the point has the correct order.
  30033. *
  30034. * pX X ordinate of EC point.
  30035. * pY Y ordinate of EC point.
  30036. * privm Private scalar that generates EC point.
  30037. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  30038. * not on the curve, ECC_INF_E if the point does not have the correct order,
  30039. * ECC_PRIV_KEY_E when the private scalar doesn't generate the EC point and
  30040. * MP_OKAY otherwise.
  30041. */
  30042. int sp_ecc_check_key_384(const mp_int* pX, const mp_int* pY,
  30043. const mp_int* privm, void* heap)
  30044. {
  30045. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30046. sp_digit* priv = NULL;
  30047. sp_point_384* pub = NULL;
  30048. #else
  30049. sp_digit priv[12];
  30050. sp_point_384 pub[2];
  30051. #endif
  30052. sp_point_384* p = NULL;
  30053. const byte one[1] = { 1 };
  30054. int err = MP_OKAY;
  30055. /* Quick check the lengs of public key ordinates and private key are in
  30056. * range. Proper check later.
  30057. */
  30058. if (((mp_count_bits(pX) > 384) ||
  30059. (mp_count_bits(pY) > 384) ||
  30060. ((privm != NULL) && (mp_count_bits(privm) > 384)))) {
  30061. err = ECC_OUT_OF_RANGE_E;
  30062. }
  30063. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30064. if (err == MP_OKAY) {
  30065. pub = (sp_point_384*)XMALLOC(sizeof(sp_point_384) * 2, heap,
  30066. DYNAMIC_TYPE_ECC);
  30067. if (pub == NULL)
  30068. err = MEMORY_E;
  30069. }
  30070. if (err == MP_OKAY && privm) {
  30071. priv = (sp_digit*)XMALLOC(sizeof(sp_digit) * 12, heap,
  30072. DYNAMIC_TYPE_ECC);
  30073. if (priv == NULL)
  30074. err = MEMORY_E;
  30075. }
  30076. #endif
  30077. if (err == MP_OKAY) {
  30078. p = pub + 1;
  30079. sp_384_from_mp(pub->x, 12, pX);
  30080. sp_384_from_mp(pub->y, 12, pY);
  30081. sp_384_from_bin(pub->z, 12, one, (int)sizeof(one));
  30082. if (privm)
  30083. sp_384_from_mp(priv, 12, privm);
  30084. /* Check point at infinitiy. */
  30085. if ((sp_384_iszero_12(pub->x) != 0) &&
  30086. (sp_384_iszero_12(pub->y) != 0)) {
  30087. err = ECC_INF_E;
  30088. }
  30089. }
  30090. /* Check range of X and Y */
  30091. if ((err == MP_OKAY) &&
  30092. ((sp_384_cmp_12(pub->x, p384_mod) >= 0) ||
  30093. (sp_384_cmp_12(pub->y, p384_mod) >= 0))) {
  30094. err = ECC_OUT_OF_RANGE_E;
  30095. }
  30096. if (err == MP_OKAY) {
  30097. /* Check point is on curve */
  30098. err = sp_384_ecc_is_point_12(pub, heap);
  30099. }
  30100. if (err == MP_OKAY) {
  30101. /* Point * order = infinity */
  30102. err = sp_384_ecc_mulmod_12(p, pub, p384_order, 1, 1, heap);
  30103. }
  30104. /* Check result is infinity */
  30105. if ((err == MP_OKAY) && ((sp_384_iszero_12(p->x) == 0) ||
  30106. (sp_384_iszero_12(p->y) == 0))) {
  30107. err = ECC_INF_E;
  30108. }
  30109. if (privm) {
  30110. if (err == MP_OKAY) {
  30111. /* Base * private = point */
  30112. err = sp_384_ecc_mulmod_base_12(p, priv, 1, 1, heap);
  30113. }
  30114. /* Check result is public key */
  30115. if ((err == MP_OKAY) &&
  30116. ((sp_384_cmp_12(p->x, pub->x) != 0) ||
  30117. (sp_384_cmp_12(p->y, pub->y) != 0))) {
  30118. err = ECC_PRIV_KEY_E;
  30119. }
  30120. }
  30121. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30122. if (pub != NULL)
  30123. XFREE(pub, heap, DYNAMIC_TYPE_ECC);
  30124. if (priv != NULL)
  30125. XFREE(priv, heap, DYNAMIC_TYPE_ECC);
  30126. #endif
  30127. return err;
  30128. }
  30129. #endif
  30130. #ifdef WOLFSSL_PUBLIC_ECC_ADD_DBL
  30131. /* Add two projective EC points together.
  30132. * (pX, pY, pZ) + (qX, qY, qZ) = (rX, rY, rZ)
  30133. *
  30134. * pX First EC point's X ordinate.
  30135. * pY First EC point's Y ordinate.
  30136. * pZ First EC point's Z ordinate.
  30137. * qX Second EC point's X ordinate.
  30138. * qY Second EC point's Y ordinate.
  30139. * qZ Second EC point's Z ordinate.
  30140. * rX Resultant EC point's X ordinate.
  30141. * rY Resultant EC point's Y ordinate.
  30142. * rZ Resultant EC point's Z ordinate.
  30143. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  30144. */
  30145. int sp_ecc_proj_add_point_384(mp_int* pX, mp_int* pY, mp_int* pZ,
  30146. mp_int* qX, mp_int* qY, mp_int* qZ,
  30147. mp_int* rX, mp_int* rY, mp_int* rZ)
  30148. {
  30149. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30150. sp_digit* tmp = NULL;
  30151. sp_point_384* p = NULL;
  30152. #else
  30153. sp_digit tmp[2 * 12 * 6];
  30154. sp_point_384 p[2];
  30155. #endif
  30156. sp_point_384* q = NULL;
  30157. int err = MP_OKAY;
  30158. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30159. if (err == MP_OKAY) {
  30160. p = (sp_point_384*)XMALLOC(sizeof(sp_point_384) * 2, NULL,
  30161. DYNAMIC_TYPE_ECC);
  30162. if (p == NULL)
  30163. err = MEMORY_E;
  30164. }
  30165. if (err == MP_OKAY) {
  30166. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 12 * 6, NULL,
  30167. DYNAMIC_TYPE_ECC);
  30168. if (tmp == NULL) {
  30169. err = MEMORY_E;
  30170. }
  30171. }
  30172. #endif
  30173. if (err == MP_OKAY) {
  30174. q = p + 1;
  30175. sp_384_from_mp(p->x, 12, pX);
  30176. sp_384_from_mp(p->y, 12, pY);
  30177. sp_384_from_mp(p->z, 12, pZ);
  30178. sp_384_from_mp(q->x, 12, qX);
  30179. sp_384_from_mp(q->y, 12, qY);
  30180. sp_384_from_mp(q->z, 12, qZ);
  30181. p->infinity = sp_384_iszero_12(p->x) &
  30182. sp_384_iszero_12(p->y);
  30183. q->infinity = sp_384_iszero_12(q->x) &
  30184. sp_384_iszero_12(q->y);
  30185. sp_384_proj_point_add_12(p, p, q, tmp);
  30186. }
  30187. if (err == MP_OKAY) {
  30188. err = sp_384_to_mp(p->x, rX);
  30189. }
  30190. if (err == MP_OKAY) {
  30191. err = sp_384_to_mp(p->y, rY);
  30192. }
  30193. if (err == MP_OKAY) {
  30194. err = sp_384_to_mp(p->z, rZ);
  30195. }
  30196. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30197. if (tmp != NULL)
  30198. XFREE(tmp, NULL, DYNAMIC_TYPE_ECC);
  30199. if (p != NULL)
  30200. XFREE(p, NULL, DYNAMIC_TYPE_ECC);
  30201. #endif
  30202. return err;
  30203. }
  30204. /* Double a projective EC point.
  30205. * (pX, pY, pZ) + (pX, pY, pZ) = (rX, rY, rZ)
  30206. *
  30207. * pX EC point's X ordinate.
  30208. * pY EC point's Y ordinate.
  30209. * pZ EC point's Z ordinate.
  30210. * rX Resultant EC point's X ordinate.
  30211. * rY Resultant EC point's Y ordinate.
  30212. * rZ Resultant EC point's Z ordinate.
  30213. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  30214. */
  30215. int sp_ecc_proj_dbl_point_384(mp_int* pX, mp_int* pY, mp_int* pZ,
  30216. mp_int* rX, mp_int* rY, mp_int* rZ)
  30217. {
  30218. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30219. sp_digit* tmp = NULL;
  30220. sp_point_384* p = NULL;
  30221. #else
  30222. sp_digit tmp[2 * 12 * 2];
  30223. sp_point_384 p[1];
  30224. #endif
  30225. int err = MP_OKAY;
  30226. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30227. if (err == MP_OKAY) {
  30228. p = (sp_point_384*)XMALLOC(sizeof(sp_point_384), NULL,
  30229. DYNAMIC_TYPE_ECC);
  30230. if (p == NULL)
  30231. err = MEMORY_E;
  30232. }
  30233. if (err == MP_OKAY) {
  30234. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 12 * 2, NULL,
  30235. DYNAMIC_TYPE_ECC);
  30236. if (tmp == NULL)
  30237. err = MEMORY_E;
  30238. }
  30239. #endif
  30240. if (err == MP_OKAY) {
  30241. sp_384_from_mp(p->x, 12, pX);
  30242. sp_384_from_mp(p->y, 12, pY);
  30243. sp_384_from_mp(p->z, 12, pZ);
  30244. p->infinity = sp_384_iszero_12(p->x) &
  30245. sp_384_iszero_12(p->y);
  30246. sp_384_proj_point_dbl_12(p, p, tmp);
  30247. }
  30248. if (err == MP_OKAY) {
  30249. err = sp_384_to_mp(p->x, rX);
  30250. }
  30251. if (err == MP_OKAY) {
  30252. err = sp_384_to_mp(p->y, rY);
  30253. }
  30254. if (err == MP_OKAY) {
  30255. err = sp_384_to_mp(p->z, rZ);
  30256. }
  30257. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30258. if (tmp != NULL)
  30259. XFREE(tmp, NULL, DYNAMIC_TYPE_ECC);
  30260. if (p != NULL)
  30261. XFREE(p, NULL, DYNAMIC_TYPE_ECC);
  30262. #endif
  30263. return err;
  30264. }
  30265. /* Map a projective EC point to affine in place.
  30266. * pZ will be one.
  30267. *
  30268. * pX EC point's X ordinate.
  30269. * pY EC point's Y ordinate.
  30270. * pZ EC point's Z ordinate.
  30271. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  30272. */
  30273. int sp_ecc_map_384(mp_int* pX, mp_int* pY, mp_int* pZ)
  30274. {
  30275. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30276. sp_digit* tmp = NULL;
  30277. sp_point_384* p = NULL;
  30278. #else
  30279. sp_digit tmp[2 * 12 * 6];
  30280. sp_point_384 p[1];
  30281. #endif
  30282. int err = MP_OKAY;
  30283. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30284. if (err == MP_OKAY) {
  30285. p = (sp_point_384*)XMALLOC(sizeof(sp_point_384), NULL,
  30286. DYNAMIC_TYPE_ECC);
  30287. if (p == NULL)
  30288. err = MEMORY_E;
  30289. }
  30290. if (err == MP_OKAY) {
  30291. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 12 * 6, NULL,
  30292. DYNAMIC_TYPE_ECC);
  30293. if (tmp == NULL)
  30294. err = MEMORY_E;
  30295. }
  30296. #endif
  30297. if (err == MP_OKAY) {
  30298. sp_384_from_mp(p->x, 12, pX);
  30299. sp_384_from_mp(p->y, 12, pY);
  30300. sp_384_from_mp(p->z, 12, pZ);
  30301. p->infinity = sp_384_iszero_12(p->x) &
  30302. sp_384_iszero_12(p->y);
  30303. sp_384_map_12(p, p, tmp);
  30304. }
  30305. if (err == MP_OKAY) {
  30306. err = sp_384_to_mp(p->x, pX);
  30307. }
  30308. if (err == MP_OKAY) {
  30309. err = sp_384_to_mp(p->y, pY);
  30310. }
  30311. if (err == MP_OKAY) {
  30312. err = sp_384_to_mp(p->z, pZ);
  30313. }
  30314. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30315. if (tmp != NULL)
  30316. XFREE(tmp, NULL, DYNAMIC_TYPE_ECC);
  30317. if (p != NULL)
  30318. XFREE(p, NULL, DYNAMIC_TYPE_ECC);
  30319. #endif
  30320. return err;
  30321. }
  30322. #endif /* WOLFSSL_PUBLIC_ECC_ADD_DBL */
  30323. #ifdef HAVE_COMP_KEY
  30324. /* Find the square root of a number mod the prime of the curve.
  30325. *
  30326. * y The number to operate on and the result.
  30327. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  30328. */
  30329. static int sp_384_mont_sqrt_12(sp_digit* y)
  30330. {
  30331. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30332. sp_digit* t1 = NULL;
  30333. #else
  30334. sp_digit t1[5 * 2 * 12];
  30335. #endif
  30336. sp_digit* t2 = NULL;
  30337. sp_digit* t3 = NULL;
  30338. sp_digit* t4 = NULL;
  30339. sp_digit* t5 = NULL;
  30340. int err = MP_OKAY;
  30341. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30342. t1 = (sp_digit*)XMALLOC(sizeof(sp_digit) * 5 * 2 * 12, NULL, DYNAMIC_TYPE_ECC);
  30343. if (t1 == NULL)
  30344. err = MEMORY_E;
  30345. #endif
  30346. if (err == MP_OKAY) {
  30347. t2 = t1 + 2 * 12;
  30348. t3 = t1 + 4 * 12;
  30349. t4 = t1 + 6 * 12;
  30350. t5 = t1 + 8 * 12;
  30351. {
  30352. /* t2 = y ^ 0x2 */
  30353. sp_384_mont_sqr_12(t2, y, p384_mod, p384_mp_mod);
  30354. /* t1 = y ^ 0x3 */
  30355. sp_384_mont_mul_12(t1, t2, y, p384_mod, p384_mp_mod);
  30356. /* t5 = y ^ 0xc */
  30357. sp_384_mont_sqr_n_12(t5, t1, 2, p384_mod, p384_mp_mod);
  30358. /* t1 = y ^ 0xf */
  30359. sp_384_mont_mul_12(t1, t1, t5, p384_mod, p384_mp_mod);
  30360. /* t2 = y ^ 0x1e */
  30361. sp_384_mont_sqr_12(t2, t1, p384_mod, p384_mp_mod);
  30362. /* t3 = y ^ 0x1f */
  30363. sp_384_mont_mul_12(t3, t2, y, p384_mod, p384_mp_mod);
  30364. /* t2 = y ^ 0x3e0 */
  30365. sp_384_mont_sqr_n_12(t2, t3, 5, p384_mod, p384_mp_mod);
  30366. /* t1 = y ^ 0x3ff */
  30367. sp_384_mont_mul_12(t1, t3, t2, p384_mod, p384_mp_mod);
  30368. /* t2 = y ^ 0x7fe0 */
  30369. sp_384_mont_sqr_n_12(t2, t1, 5, p384_mod, p384_mp_mod);
  30370. /* t3 = y ^ 0x7fff */
  30371. sp_384_mont_mul_12(t3, t3, t2, p384_mod, p384_mp_mod);
  30372. /* t2 = y ^ 0x3fff800 */
  30373. sp_384_mont_sqr_n_12(t2, t3, 15, p384_mod, p384_mp_mod);
  30374. /* t4 = y ^ 0x3ffffff */
  30375. sp_384_mont_mul_12(t4, t3, t2, p384_mod, p384_mp_mod);
  30376. /* t2 = y ^ 0xffffffc000000 */
  30377. sp_384_mont_sqr_n_12(t2, t4, 30, p384_mod, p384_mp_mod);
  30378. /* t1 = y ^ 0xfffffffffffff */
  30379. sp_384_mont_mul_12(t1, t4, t2, p384_mod, p384_mp_mod);
  30380. /* t2 = y ^ 0xfffffffffffffff000000000000000 */
  30381. sp_384_mont_sqr_n_12(t2, t1, 60, p384_mod, p384_mp_mod);
  30382. /* t1 = y ^ 0xffffffffffffffffffffffffffffff */
  30383. sp_384_mont_mul_12(t1, t1, t2, p384_mod, p384_mp_mod);
  30384. /* t2 = y ^ 0xffffffffffffffffffffffffffffff000000000000000000000000000000 */
  30385. sp_384_mont_sqr_n_12(t2, t1, 120, p384_mod, p384_mp_mod);
  30386. /* t1 = y ^ 0xffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff */
  30387. sp_384_mont_mul_12(t1, t1, t2, p384_mod, p384_mp_mod);
  30388. /* t2 = y ^ 0x7fffffffffffffffffffffffffffffffffffffffffffffffffffffffffff8000 */
  30389. sp_384_mont_sqr_n_12(t2, t1, 15, p384_mod, p384_mp_mod);
  30390. /* t1 = y ^ 0x7fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff */
  30391. sp_384_mont_mul_12(t1, t3, t2, p384_mod, p384_mp_mod);
  30392. /* t2 = y ^ 0x3fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff80000000 */
  30393. sp_384_mont_sqr_n_12(t2, t1, 31, p384_mod, p384_mp_mod);
  30394. /* t1 = y ^ 0x3fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffbfffffff */
  30395. sp_384_mont_mul_12(t1, t4, t2, p384_mod, p384_mp_mod);
  30396. /* t2 = y ^ 0x3fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffbfffffff0 */
  30397. sp_384_mont_sqr_n_12(t2, t1, 4, p384_mod, p384_mp_mod);
  30398. /* t1 = y ^ 0x3fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffbfffffffc */
  30399. sp_384_mont_mul_12(t1, t5, t2, p384_mod, p384_mp_mod);
  30400. /* t2 = y ^ 0xfffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffeffffffff0000000000000000 */
  30401. sp_384_mont_sqr_n_12(t2, t1, 62, p384_mod, p384_mp_mod);
  30402. /* t1 = y ^ 0xfffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffeffffffff0000000000000001 */
  30403. sp_384_mont_mul_12(t1, y, t2, p384_mod, p384_mp_mod);
  30404. /* t2 = y ^ 0x3fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffbfffffffc00000000000000040000000 */
  30405. sp_384_mont_sqr_n_12(y, t1, 30, p384_mod, p384_mp_mod);
  30406. }
  30407. }
  30408. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30409. if (t1 != NULL)
  30410. XFREE(t1, NULL, DYNAMIC_TYPE_ECC);
  30411. #endif
  30412. return err;
  30413. }
  30414. /* Uncompress the point given the X ordinate.
  30415. *
  30416. * xm X ordinate.
  30417. * odd Whether the Y ordinate is odd.
  30418. * ym Calculated Y ordinate.
  30419. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  30420. */
  30421. int sp_ecc_uncompress_384(mp_int* xm, int odd, mp_int* ym)
  30422. {
  30423. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30424. sp_digit* x = NULL;
  30425. #else
  30426. sp_digit x[4 * 12];
  30427. #endif
  30428. sp_digit* y = NULL;
  30429. int err = MP_OKAY;
  30430. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30431. x = (sp_digit*)XMALLOC(sizeof(sp_digit) * 4 * 12, NULL, DYNAMIC_TYPE_ECC);
  30432. if (x == NULL)
  30433. err = MEMORY_E;
  30434. #endif
  30435. if (err == MP_OKAY) {
  30436. y = x + 2 * 12;
  30437. sp_384_from_mp(x, 12, xm);
  30438. err = sp_384_mod_mul_norm_12(x, x, p384_mod);
  30439. }
  30440. if (err == MP_OKAY) {
  30441. /* y = x^3 */
  30442. {
  30443. sp_384_mont_sqr_12(y, x, p384_mod, p384_mp_mod);
  30444. sp_384_mont_mul_12(y, y, x, p384_mod, p384_mp_mod);
  30445. }
  30446. /* y = x^3 - 3x */
  30447. sp_384_mont_sub_12(y, y, x, p384_mod);
  30448. sp_384_mont_sub_12(y, y, x, p384_mod);
  30449. sp_384_mont_sub_12(y, y, x, p384_mod);
  30450. /* y = x^3 - 3x + b */
  30451. err = sp_384_mod_mul_norm_12(x, p384_b, p384_mod);
  30452. }
  30453. if (err == MP_OKAY) {
  30454. sp_384_mont_add_12(y, y, x, p384_mod);
  30455. /* y = sqrt(x^3 - 3x + b) */
  30456. err = sp_384_mont_sqrt_12(y);
  30457. }
  30458. if (err == MP_OKAY) {
  30459. XMEMSET(y + 12, 0, 12U * sizeof(sp_digit));
  30460. sp_384_mont_reduce_12(y, p384_mod, p384_mp_mod);
  30461. if ((((word32)y[0] ^ (word32)odd) & 1U) != 0U) {
  30462. sp_384_mont_sub_12(y, p384_mod, y, p384_mod);
  30463. }
  30464. err = sp_384_to_mp(y, ym);
  30465. }
  30466. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  30467. if (x != NULL)
  30468. XFREE(x, NULL, DYNAMIC_TYPE_ECC);
  30469. #endif
  30470. return err;
  30471. }
  30472. #endif
  30473. #endif /* WOLFSSL_SP_384 */
  30474. #ifdef WOLFSSL_SP_521
  30475. /* Point structure to use for the 521-bit curve code.
          *
          * Each ordinate is an array of 2 * 17 digits, i.e. twice the 17 digits
          * used for a single value elsewhere in this file.
          * NOTE(review): presumably the extra room lets a full 34-digit product
          * be held in an ordinate - confirm against the callers. */
  30476. typedef struct sp_point_521 {
  30477. /* X ordinate of point. */
  30478. sp_digit x[2 * 17];
  30479. /* Y ordinate of point. */
  30480. sp_digit y[2 * 17];
  30481. /* Z ordinate of point. */
  30482. sp_digit z[2 * 17];
  30483. /* Indicates point is at infinity (the base point constant stores 0). */
  30484. int infinity;
  30485. } sp_point_521;
  30486. /* The modulus (prime) of the curve P521.
          * All 521 bits are set, i.e. the value is 2^521 - 1. The 17 digits are
          * stored least-significant first, so the partial top digit (0x1ff) is
          * the last element. */
  30487. static const sp_digit p521_mod[17] = {
  30488. 0xffffffff,0xffffffff,0xffffffff,0xffffffff,0xffffffff,0xffffffff,
  30489. 0xffffffff,0xffffffff,0xffffffff,0xffffffff,0xffffffff,0xffffffff,
  30490. 0xffffffff,0xffffffff,0xffffffff,0xffffffff,0x000001ff
  30491. };
  30492. /* The Montgomery normalizer for modulus of the curve P521 (the value 1). */
  30493. static const sp_digit p521_norm_mod[17] = {
  30494. 0x00000001,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  30495. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  30496. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000
  30497. };
  30498. /* The Montgomery multiplier for modulus of the curve P521.
          * Unlike the tables above this single digit is not declared const. */
  30499. static sp_digit p521_mp_mod = 0x00000001;
  30500. #if defined(WOLFSSL_VALIDATE_ECC_KEYGEN) || defined(HAVE_ECC_SIGN) || \
  30501. defined(HAVE_ECC_VERIFY)
  30502. /* The order of the curve P521, least-significant digit first.
          * Only compiled in for key-generation validation, signing or verifying. */
  30503. static const sp_digit p521_order[17] = {
  30504. 0x91386409,0xbb6fb71e,0x899c47ae,0x3bb5c9b8,0xf709a5d0,0x7fcc0148,
  30505. 0xbf2f966b,0x51868783,0xfffffffa,0xffffffff,0xffffffff,0xffffffff,
  30506. 0xffffffff,0xffffffff,0xffffffff,0xffffffff,0x000001ff
  30507. };
  30508. #endif
  30509. /* The order of the curve P521 minus 2.
          * Identical to p521_order except for the lowest digit (...07 vs ...09).
          * NOTE(review): presumably the exponent for inversion modulo the order -
          * confirm at the point of use. */
  30510. static const sp_digit p521_order2[17] = {
  30511. 0x91386407,0xbb6fb71e,0x899c47ae,0x3bb5c9b8,0xf709a5d0,0x7fcc0148,
  30512. 0xbf2f966b,0x51868783,0xfffffffa,0xffffffff,0xffffffff,0xffffffff,
  30513. 0xffffffff,0xffffffff,0xffffffff,0xffffffff,0x000001ff
  30514. };
  30515. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  30516. /* The Montgomery normalizer for order of the curve P521.
          * Only compiled in for signing or verifying. */
  30517. static const sp_digit p521_norm_order[17] = {
  30518. 0x6ec79bf7,0x449048e1,0x7663b851,0xc44a3647,0x08f65a2f,0x8033feb7,
  30519. 0x40d06994,0xae79787c,0x00000005,0x00000000,0x00000000,0x00000000,
  30520. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000
  30521. };
  30522. #endif
  30523. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  30524. /* The Montgomery multiplier for order of the curve P521.
          * Only compiled in for signing or verifying; not declared const. */
  30525. static sp_digit p521_mp_order = 0x79a995c7;
  30526. #endif
  30527. /* The base point of curve P521.
          * Each ordinate fills the first 17 digits of its 2 * 17 digit array;
          * the remaining 17 digits are zero. Z is one and the infinity flag is
          * clear. */
  30528. static const sp_point_521 p521_base = {
  30529. /* X ordinate */
  30530. {
  30531. 0xc2e5bd66,0xf97e7e31,0x856a429b,0x3348b3c1,0xa2ffa8de,0xfe1dc127,
  30532. 0xefe75928,0xa14b5e77,0x6b4d3dba,0xf828af60,0x053fb521,0x9c648139,
  30533. 0x2395b442,0x9e3ecb66,0x0404e9cd,0x858e06b7,0x000000c6,
  30534. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  30535. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  30536. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  30537. (sp_digit)0, (sp_digit)0
  30538. },
  30539. /* Y ordinate */
  30540. {
  30541. 0x9fd16650,0x88be9476,0xa272c240,0x353c7086,0x3fad0761,0xc550b901,
  30542. 0x5ef42640,0x97ee7299,0x273e662c,0x17afbd17,0x579b4468,0x98f54449,
  30543. 0x2c7d1bd9,0x5c8a5fb4,0x9a3bc004,0x39296a78,0x00000118,
  30544. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  30545. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  30546. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  30547. (sp_digit)0, (sp_digit)0
  30548. },
  30549. /* Z ordinate (one) */
  30550. {
  30551. 0x00000001,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  30552. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  30553. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  30554. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  30555. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  30556. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  30557. (sp_digit)0, (sp_digit)0
  30558. },
  30559. /* infinity */
  30560. 0
  30561. };
  30562. #if defined(HAVE_ECC_CHECK_KEY) || defined(HAVE_COMP_KEY)
  30563. /* NOTE(review): presumably the b coefficient of the P521 curve equation,
          * mirroring how p384_b is used by the 384-bit key check and uncompress
          * code - confirm. Only compiled in for key checking or compressed keys. */
         static const sp_digit p521_b[17] = {
  30564. 0x6b503f00,0xef451fd4,0x3d2c34f1,0x3573df88,0x3bb1bf07,0x1652c0bd,
  30565. 0xec7e937b,0x56193951,0x8ef109e1,0xb8b48991,0x99b315f3,0xa2da725b,
  30566. 0xb68540ee,0x929a21a0,0x8e1c9a1f,0x953eb961,0x00000051
  30567. };
  30568. #endif
  30569. /* Multiply a and b into r. (r = a * b)
  30570. *
  30571. * r A single precision integer.
  30572. * a A single precision integer.
  30573. * b A single precision integer.
  30574. */
  30575. SP_NOINLINE static void sp_521_mul_17(sp_digit* r, const sp_digit* a,
  30576. const sp_digit* b)
  30577. {
  30578. sp_digit tmp_arr[17 * 2];
  30579. sp_digit* tmp = tmp_arr;
  30580. __asm__ __volatile__ (
  30581. "mov r3, #0\n\t"
  30582. "mov r4, #0\n\t"
  30583. "mov r9, r3\n\t"
  30584. "mov r12, %[r]\n\t"
  30585. "mov r10, %[a]\n\t"
  30586. "mov r11, %[b]\n\t"
  30587. "mov r6, #68\n\t"
  30588. "add r6, r6, r10\n\t"
  30589. "mov r14, r6\n\t"
  30590. "\n1:\n\t"
  30591. "mov %[r], #0\n\t"
  30592. "mov r5, #0\n\t"
  30593. "mov r6, #64\n\t"
  30594. "mov %[a], r9\n\t"
  30595. "subs %[a], %[a], r6\n\t"
  30596. "sbc r6, r6, r6\n\t"
  30597. "mvn r6, r6\n\t"
  30598. "and %[a], %[a], r6\n\t"
  30599. "mov %[b], r9\n\t"
  30600. "sub %[b], %[b], %[a]\n\t"
  30601. "add %[a], %[a], r10\n\t"
  30602. "add %[b], %[b], r11\n\t"
  30603. "\n2:\n\t"
  30604. /* Multiply Start */
  30605. "ldr r6, [%[a]]\n\t"
  30606. "ldr r8, [%[b]]\n\t"
  30607. "umull r6, r8, r6, r8\n\t"
  30608. "adds r3, r3, r6\n\t"
  30609. "adcs r4, r4, r8\n\t"
  30610. "adc r5, r5, %[r]\n\t"
  30611. /* Multiply Done */
  30612. "add %[a], %[a], #4\n\t"
  30613. "sub %[b], %[b], #4\n\t"
  30614. "cmp %[a], r14\n\t"
  30615. #ifdef __GNUC__
  30616. "beq 3f\n\t"
  30617. #else
  30618. "beq.n 3f\n\t"
  30619. #endif /* __GNUC__ */
  30620. "mov r6, r9\n\t"
  30621. "add r6, r6, r10\n\t"
  30622. "cmp %[a], r6\n\t"
  30623. #ifdef __GNUC__
  30624. "ble 2b\n\t"
  30625. #else
  30626. "ble.n 2b\n\t"
  30627. #endif /* __GNUC__ */
  30628. "\n3:\n\t"
  30629. "mov %[r], r12\n\t"
  30630. "mov r8, r9\n\t"
  30631. "str r3, [%[r], r8]\n\t"
  30632. "mov r3, r4\n\t"
  30633. "mov r4, r5\n\t"
  30634. "add r8, r8, #4\n\t"
  30635. "mov r9, r8\n\t"
  30636. "mov r6, #128\n\t"
  30637. "cmp r8, r6\n\t"
  30638. #ifdef __GNUC__
  30639. "ble 1b\n\t"
  30640. #else
  30641. "ble.n 1b\n\t"
  30642. #endif /* __GNUC__ */
  30643. "str r3, [%[r], r8]\n\t"
  30644. "mov %[a], r10\n\t"
  30645. "mov %[b], r11\n\t"
  30646. :
  30647. : [r] "r" (tmp), [a] "r" (a), [b] "r" (b)
  30648. : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  30649. );
  30650. XMEMCPY(r, tmp_arr, sizeof(tmp_arr));
  30651. }
  30652. /* Square a and put result in r. (r = a * a)
  30653. *
  30654. * r A single precision integer.
  30655. * a A single precision integer.
  30656. */
  30657. SP_NOINLINE static void sp_521_sqr_17(sp_digit* r, const sp_digit* a)
  30658. {
  30659. __asm__ __volatile__ (
  30660. "mov r3, #0\n\t"
  30661. "mov r4, #0\n\t"
  30662. "mov r5, #0\n\t"
  30663. "mov r9, r3\n\t"
  30664. "mov r12, %[r]\n\t"
  30665. "mov r6, #136\n\t"
  30666. "neg r6, r6\n\t"
  30667. "add sp, sp, r6\n\t"
  30668. "mov r11, sp\n\t"
  30669. "mov r10, %[a]\n\t"
  30670. "\n1:\n\t"
  30671. "mov %[r], #0\n\t"
  30672. "mov r6, #64\n\t"
  30673. "mov %[a], r9\n\t"
  30674. "subs %[a], %[a], r6\n\t"
  30675. "sbc r6, r6, r6\n\t"
  30676. "mvn r6, r6\n\t"
  30677. "and %[a], %[a], r6\n\t"
  30678. "mov r2, r9\n\t"
  30679. "sub r2, r2, %[a]\n\t"
  30680. "add %[a], %[a], r10\n\t"
  30681. "add r2, r2, r10\n\t"
  30682. "\n2:\n\t"
  30683. "cmp r2, %[a]\n\t"
  30684. #ifdef __GNUC__
  30685. "beq 4f\n\t"
  30686. #else
  30687. "beq.n 4f\n\t"
  30688. #endif /* __GNUC__ */
  30689. /* Multiply * 2: Start */
  30690. "ldr r6, [%[a]]\n\t"
  30691. "ldr r8, [r2]\n\t"
  30692. "umull r6, r8, r6, r8\n\t"
  30693. "adds r3, r3, r6\n\t"
  30694. "adcs r4, r4, r8\n\t"
  30695. "adc r5, r5, %[r]\n\t"
  30696. "adds r3, r3, r6\n\t"
  30697. "adcs r4, r4, r8\n\t"
  30698. "adc r5, r5, %[r]\n\t"
  30699. /* Multiply * 2: Done */
  30700. #ifdef __GNUC__
  30701. "bal 5f\n\t"
  30702. #else
  30703. "bal.n 5f\n\t"
  30704. #endif /* __GNUC__ */
  30705. "\n4:\n\t"
  30706. /* Square: Start */
  30707. "ldr r6, [%[a]]\n\t"
  30708. "umull r6, r8, r6, r6\n\t"
  30709. "adds r3, r3, r6\n\t"
  30710. "adcs r4, r4, r8\n\t"
  30711. "adc r5, r5, %[r]\n\t"
  30712. /* Square: Done */
  30713. "\n5:\n\t"
  30714. "add %[a], %[a], #4\n\t"
  30715. "sub r2, r2, #4\n\t"
  30716. "mov r6, #68\n\t"
  30717. "add r6, r6, r10\n\t"
  30718. "cmp %[a], r6\n\t"
  30719. #ifdef __GNUC__
  30720. "beq 3f\n\t"
  30721. #else
  30722. "beq.n 3f\n\t"
  30723. #endif /* __GNUC__ */
  30724. "cmp %[a], r2\n\t"
  30725. #ifdef __GNUC__
  30726. "bgt 3f\n\t"
  30727. #else
  30728. "bgt.n 3f\n\t"
  30729. #endif /* __GNUC__ */
  30730. "mov r8, r9\n\t"
  30731. "add r8, r8, r10\n\t"
  30732. "cmp %[a], r8\n\t"
  30733. #ifdef __GNUC__
  30734. "ble 2b\n\t"
  30735. #else
  30736. "ble.n 2b\n\t"
  30737. #endif /* __GNUC__ */
  30738. "\n3:\n\t"
  30739. "mov %[r], r11\n\t"
  30740. "mov r8, r9\n\t"
  30741. "str r3, [%[r], r8]\n\t"
  30742. "mov r3, r4\n\t"
  30743. "mov r4, r5\n\t"
  30744. "mov r5, #0\n\t"
  30745. "add r8, r8, #4\n\t"
  30746. "mov r9, r8\n\t"
  30747. "mov r6, #128\n\t"
  30748. "cmp r8, r6\n\t"
  30749. #ifdef __GNUC__
  30750. "ble 1b\n\t"
  30751. #else
  30752. "ble.n 1b\n\t"
  30753. #endif /* __GNUC__ */
  30754. "mov %[a], r10\n\t"
  30755. "str r3, [%[r], r8]\n\t"
  30756. "mov %[r], r12\n\t"
  30757. "mov %[a], r11\n\t"
  30758. "mov r3, #132\n\t"
  30759. "\n4:\n\t"
  30760. "ldr r6, [%[a], r3]\n\t"
  30761. "str r6, [%[r], r3]\n\t"
  30762. "subs r3, r3, #4\n\t"
  30763. #ifdef __GNUC__
  30764. "bge 4b\n\t"
  30765. #else
  30766. "bge.n 4b\n\t"
  30767. #endif /* __GNUC__ */
  30768. "mov r6, #136\n\t"
  30769. "add sp, sp, r6\n\t"
  30770. :
  30771. : [r] "r" (r), [a] "r" (a)
  30772. : "memory", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12"
  30773. );
  30774. }
  30775. #ifdef WOLFSSL_SP_SMALL
  30776. /* Add b to a into r. (r = a + b)
  30777. *
  30778. * r A single precision integer.
  30779. * a A single precision integer.
  30780. * b A single precision integer.
  30781. */
  30782. SP_NOINLINE static sp_digit sp_521_add_17(sp_digit* r, const sp_digit* a,
  30783. const sp_digit* b)
  30784. {
  30785. sp_digit c = 0;
  30786. __asm__ __volatile__ (
  30787. "mov r6, %[a]\n\t"
  30788. "mov r8, #0\n\t"
  30789. "add r6, r6, #68\n\t"
  30790. "sub r8, r8, #1\n\t"
  30791. "\n1:\n\t"
  30792. "adds %[c], %[c], r8\n\t"
  30793. "ldr r4, [%[a]]\n\t"
  30794. "ldr r5, [%[b]]\n\t"
  30795. "adcs r4, r4, r5\n\t"
  30796. "str r4, [%[r]]\n\t"
  30797. "mov %[c], #0\n\t"
  30798. "adc %[c], %[c], %[c]\n\t"
  30799. "add %[a], %[a], #4\n\t"
  30800. "add %[b], %[b], #4\n\t"
  30801. "add %[r], %[r], #4\n\t"
  30802. "cmp %[a], r6\n\t"
  30803. #ifdef __GNUC__
  30804. "bne 1b\n\t"
  30805. #else
  30806. "bne.n 1b\n\t"
  30807. #endif /* __GNUC__ */
  30808. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  30809. :
  30810. : "memory", "r4", "r5", "r6", "r8"
  30811. );
  30812. return c;
  30813. }
  30814. #else
  30815. /* Add b to a into r. (r = a + b)
  30816. *
  30817. * r A single precision integer.
  30818. * a A single precision integer.
  30819. * b A single precision integer.
  30820. */
  30821. SP_NOINLINE static sp_digit sp_521_add_17(sp_digit* r, const sp_digit* a,
  30822. const sp_digit* b)
  30823. {
  30824. sp_digit c = 0;
  30825. __asm__ __volatile__ (
  30826. "ldm %[a]!, {r4, r5}\n\t"
  30827. "ldm %[b]!, {r6, r8}\n\t"
  30828. "adds r4, r4, r6\n\t"
  30829. "adcs r5, r5, r8\n\t"
  30830. "stm %[r]!, {r4, r5}\n\t"
  30831. "ldm %[a]!, {r4, r5}\n\t"
  30832. "ldm %[b]!, {r6, r8}\n\t"
  30833. "adcs r4, r4, r6\n\t"
  30834. "adcs r5, r5, r8\n\t"
  30835. "stm %[r]!, {r4, r5}\n\t"
  30836. "ldm %[a]!, {r4, r5}\n\t"
  30837. "ldm %[b]!, {r6, r8}\n\t"
  30838. "adcs r4, r4, r6\n\t"
  30839. "adcs r5, r5, r8\n\t"
  30840. "stm %[r]!, {r4, r5}\n\t"
  30841. "ldm %[a]!, {r4, r5}\n\t"
  30842. "ldm %[b]!, {r6, r8}\n\t"
  30843. "adcs r4, r4, r6\n\t"
  30844. "adcs r5, r5, r8\n\t"
  30845. "stm %[r]!, {r4, r5}\n\t"
  30846. "ldm %[a]!, {r4, r5}\n\t"
  30847. "ldm %[b]!, {r6, r8}\n\t"
  30848. "adcs r4, r4, r6\n\t"
  30849. "adcs r5, r5, r8\n\t"
  30850. "stm %[r]!, {r4, r5}\n\t"
  30851. "ldm %[a]!, {r4, r5}\n\t"
  30852. "ldm %[b]!, {r6, r8}\n\t"
  30853. "adcs r4, r4, r6\n\t"
  30854. "adcs r5, r5, r8\n\t"
  30855. "stm %[r]!, {r4, r5}\n\t"
  30856. "ldm %[a]!, {r4, r5}\n\t"
  30857. "ldm %[b]!, {r6, r8}\n\t"
  30858. "adcs r4, r4, r6\n\t"
  30859. "adcs r5, r5, r8\n\t"
  30860. "stm %[r]!, {r4, r5}\n\t"
  30861. "ldm %[a]!, {r4, r5}\n\t"
  30862. "ldm %[b]!, {r6, r8}\n\t"
  30863. "adcs r4, r4, r6\n\t"
  30864. "adcs r5, r5, r8\n\t"
  30865. "stm %[r]!, {r4, r5}\n\t"
  30866. "ldr r4, [%[a]]\n\t"
  30867. "ldr r6, [%[b]]\n\t"
  30868. "adcs r4, r4, r6\n\t"
  30869. "str r4, [%[r]]\n\t"
  30870. "mov %[c], #0\n\t"
  30871. "adc %[c], %[c], %[c]\n\t"
  30872. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  30873. :
  30874. : "memory", "r4", "r5", "r6", "r8"
  30875. );
  30876. return c;
  30877. }
  30878. #endif /* WOLFSSL_SP_SMALL */
  30879. #ifdef WOLFSSL_SP_SMALL
  30880. /* Sub b from a into r. (r = a - b)
  30881. *
  30882. * r A single precision integer.
  30883. * a A single precision integer.
  30884. * b A single precision integer.
  30885. */
  30886. SP_NOINLINE static sp_digit sp_521_sub_17(sp_digit* r, const sp_digit* a,
  30887. const sp_digit* b)
  30888. {
  30889. sp_digit c = 0;
  30890. __asm__ __volatile__ (
  30891. "mov r6, %[a]\n\t"
  30892. "add r6, r6, #68\n\t"
  30893. "\n1:\n\t"
  30894. "mov r5, #0\n\t"
  30895. "subs r5, r5, %[c]\n\t"
  30896. "ldr r4, [%[a]]\n\t"
  30897. "ldr r5, [%[b]]\n\t"
  30898. "sbcs r4, r4, r5\n\t"
  30899. "str r4, [%[r]]\n\t"
  30900. "sbc %[c], %[c], %[c]\n\t"
  30901. "add %[a], %[a], #4\n\t"
  30902. "add %[b], %[b], #4\n\t"
  30903. "add %[r], %[r], #4\n\t"
  30904. "cmp %[a], r6\n\t"
  30905. #ifdef __GNUC__
  30906. "bne 1b\n\t"
  30907. #else
  30908. "bne.n 1b\n\t"
  30909. #endif /* __GNUC__ */
  30910. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  30911. :
  30912. : "memory", "r4", "r5", "r6"
  30913. );
  30914. return c;
  30915. }
  30916. #else
  30917. /* Sub b from a into r. (r = a - b)
  30918. *
  30919. * r A single precision integer.
  30920. * a A single precision integer.
  30921. * b A single precision integer.
  30922. */
  30923. SP_NOINLINE static sp_digit sp_521_sub_17(sp_digit* r, const sp_digit* a,
  30924. const sp_digit* b)
  30925. {
  30926. sp_digit c = 0;
  30927. __asm__ __volatile__ (
  30928. "ldm %[a]!, {r4, r5}\n\t"
  30929. "ldm %[b]!, {r6, r8}\n\t"
  30930. "subs r4, r4, r6\n\t"
  30931. "sbcs r5, r5, r8\n\t"
  30932. "stm %[r]!, {r4, r5}\n\t"
  30933. "ldm %[a]!, {r4, r5}\n\t"
  30934. "ldm %[b]!, {r6, r8}\n\t"
  30935. "sbcs r4, r4, r6\n\t"
  30936. "sbcs r5, r5, r8\n\t"
  30937. "stm %[r]!, {r4, r5}\n\t"
  30938. "ldm %[a]!, {r4, r5}\n\t"
  30939. "ldm %[b]!, {r6, r8}\n\t"
  30940. "sbcs r4, r4, r6\n\t"
  30941. "sbcs r5, r5, r8\n\t"
  30942. "stm %[r]!, {r4, r5}\n\t"
  30943. "ldm %[a]!, {r4, r5}\n\t"
  30944. "ldm %[b]!, {r6, r8}\n\t"
  30945. "sbcs r4, r4, r6\n\t"
  30946. "sbcs r5, r5, r8\n\t"
  30947. "stm %[r]!, {r4, r5}\n\t"
  30948. "ldm %[a]!, {r4, r5}\n\t"
  30949. "ldm %[b]!, {r6, r8}\n\t"
  30950. "sbcs r4, r4, r6\n\t"
  30951. "sbcs r5, r5, r8\n\t"
  30952. "stm %[r]!, {r4, r5}\n\t"
  30953. "ldm %[a]!, {r4, r5}\n\t"
  30954. "ldm %[b]!, {r6, r8}\n\t"
  30955. "sbcs r4, r4, r6\n\t"
  30956. "sbcs r5, r5, r8\n\t"
  30957. "stm %[r]!, {r4, r5}\n\t"
  30958. "ldm %[a]!, {r4, r5}\n\t"
  30959. "ldm %[b]!, {r6, r8}\n\t"
  30960. "sbcs r4, r4, r6\n\t"
  30961. "sbcs r5, r5, r8\n\t"
  30962. "stm %[r]!, {r4, r5}\n\t"
  30963. "ldm %[a]!, {r4, r5}\n\t"
  30964. "ldm %[b]!, {r6, r8}\n\t"
  30965. "sbcs r4, r4, r6\n\t"
  30966. "sbcs r5, r5, r8\n\t"
  30967. "stm %[r]!, {r4, r5}\n\t"
  30968. "ldr r4, [%[a]]\n\t"
  30969. "ldr r6, [%[b]]\n\t"
  30970. "sbcs r4, r4, r6\n\t"
  30971. "str r4, [%[r]]\n\t"
  30972. "sbc %[c], %[c], %[c]\n\t"
  30973. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  30974. :
  30975. : "memory", "r4", "r5", "r6", "r8"
  30976. );
  30977. return c;
  30978. }
  30979. #endif /* WOLFSSL_SP_SMALL */
  30980. /* Multiply a number by Montgomery normalizer mod modulus (prime).
  30981. *
  30982. * r The resulting Montgomery form number.
  30983. * a The number to convert.
  30984. * m The modulus (prime).
  30985. * returns MEMORY_E when memory allocation fails and MP_OKAY otherwise.
  30986. */
  30987. static int sp_521_mod_mul_norm_17(sp_digit* r, const sp_digit* a, const sp_digit* m)
  30988. {
  30989. (void)m;
  30990. if (r != a) {
  30991. XMEMCPY(r, a, 17 * sizeof(sp_digit));
  30992. }
  30993. return MP_OKAY;
  30994. }
  30995. /* Convert an mp_int to an array of sp_digit.
  30996. *
  30997. * r A single precision integer.
  30998. * size Maximum number of bytes to convert
  30999. * a A multi-precision integer.
  31000. */
  31001. static void sp_521_from_mp(sp_digit* r, int size, const mp_int* a)
  31002. {
  31003. #if DIGIT_BIT == 32
  31004. int j;
  31005. XMEMCPY(r, a->dp, sizeof(sp_digit) * a->used);
  31006. for (j = a->used; j < size; j++) {
  31007. r[j] = 0;
  31008. }
  31009. #elif DIGIT_BIT > 32
  31010. int i;
  31011. int j = 0;
  31012. word32 s = 0;
  31013. r[0] = 0;
  31014. for (i = 0; i < a->used && j < size; i++) {
  31015. r[j] |= ((sp_digit)a->dp[i] << s);
  31016. r[j] &= 0xffffffff;
  31017. s = 32U - s;
  31018. if (j + 1 >= size) {
  31019. break;
  31020. }
  31021. /* lint allow cast of mismatch word32 and mp_digit */
  31022. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  31023. while ((s + 32U) <= (word32)DIGIT_BIT) {
  31024. s += 32U;
  31025. r[j] &= 0xffffffff;
  31026. if (j + 1 >= size) {
  31027. break;
  31028. }
  31029. if (s < (word32)DIGIT_BIT) {
  31030. /* lint allow cast of mismatch word32 and mp_digit */
  31031. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  31032. }
  31033. else {
  31034. r[++j] = (sp_digit)0;
  31035. }
  31036. }
  31037. s = (word32)DIGIT_BIT - s;
  31038. }
  31039. for (j++; j < size; j++) {
  31040. r[j] = 0;
  31041. }
  31042. #else
  31043. int i;
  31044. int j = 0;
  31045. int s = 0;
  31046. r[0] = 0;
  31047. for (i = 0; i < a->used && j < size; i++) {
  31048. r[j] |= ((sp_digit)a->dp[i]) << s;
  31049. if (s + DIGIT_BIT >= 32) {
  31050. r[j] &= 0xffffffff;
  31051. if (j + 1 >= size) {
  31052. break;
  31053. }
  31054. s = 32 - s;
  31055. if (s == DIGIT_BIT) {
  31056. r[++j] = 0;
  31057. s = 0;
  31058. }
  31059. else {
  31060. r[++j] = a->dp[i] >> s;
  31061. s = DIGIT_BIT - s;
  31062. }
  31063. }
  31064. else {
  31065. s += DIGIT_BIT;
  31066. }
  31067. }
  31068. for (j++; j < size; j++) {
  31069. r[j] = 0;
  31070. }
  31071. #endif
  31072. }
  31073. /* Convert a point of type ecc_point to type sp_point_521.
  31074. *
  31075. * p Point of type sp_point_521 (result).
  31076. * pm Point of type ecc_point.
  31077. */
  31078. static void sp_521_point_from_ecc_point_17(sp_point_521* p,
  31079. const ecc_point* pm)
  31080. {
  31081. XMEMSET(p->x, 0, sizeof(p->x));
  31082. XMEMSET(p->y, 0, sizeof(p->y));
  31083. XMEMSET(p->z, 0, sizeof(p->z));
  31084. sp_521_from_mp(p->x, 17, pm->x);
  31085. sp_521_from_mp(p->y, 17, pm->y);
  31086. sp_521_from_mp(p->z, 17, pm->z);
  31087. p->infinity = 0;
  31088. }
  31089. /* Convert an array of sp_digit to an mp_int.
  31090. *
  31091. * a A single precision integer.
  31092. * r A multi-precision integer.
  31093. */
  31094. static int sp_521_to_mp(const sp_digit* a, mp_int* r)
  31095. {
  31096. int err;
  31097. err = mp_grow(r, (521 + DIGIT_BIT - 1) / DIGIT_BIT);
  31098. if (err == MP_OKAY) { /*lint !e774 case where err is always MP_OKAY*/
  31099. #if DIGIT_BIT == 32
  31100. XMEMCPY(r->dp, a, sizeof(sp_digit) * 17);
  31101. r->used = 17;
  31102. mp_clamp(r);
  31103. #elif DIGIT_BIT < 32
  31104. int i;
  31105. int j = 0;
  31106. int s = 0;
  31107. r->dp[0] = 0;
  31108. for (i = 0; i < 17; i++) {
  31109. r->dp[j] |= (mp_digit)(a[i] << s);
  31110. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  31111. s = DIGIT_BIT - s;
  31112. r->dp[++j] = (mp_digit)(a[i] >> s);
  31113. while (s + DIGIT_BIT <= 32) {
  31114. s += DIGIT_BIT;
  31115. r->dp[j++] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  31116. if (s == SP_WORD_SIZE) {
  31117. r->dp[j] = 0;
  31118. }
  31119. else {
  31120. r->dp[j] = (mp_digit)(a[i] >> s);
  31121. }
  31122. }
  31123. s = 32 - s;
  31124. }
  31125. r->used = (521 + DIGIT_BIT - 1) / DIGIT_BIT;
  31126. mp_clamp(r);
  31127. #else
  31128. int i;
  31129. int j = 0;
  31130. int s = 0;
  31131. r->dp[0] = 0;
  31132. for (i = 0; i < 17; i++) {
  31133. r->dp[j] |= ((mp_digit)a[i]) << s;
  31134. if (s + 32 >= DIGIT_BIT) {
  31135. #if DIGIT_BIT != 32 && DIGIT_BIT != 64
  31136. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  31137. #endif
  31138. s = DIGIT_BIT - s;
  31139. r->dp[++j] = a[i] >> s;
  31140. s = 32 - s;
  31141. }
  31142. else {
  31143. s += 32;
  31144. }
  31145. }
  31146. r->used = (521 + DIGIT_BIT - 1) / DIGIT_BIT;
  31147. mp_clamp(r);
  31148. #endif
  31149. }
  31150. return err;
  31151. }
  31152. /* Convert a point of type sp_point_521 to type ecc_point.
  31153. *
  31154. * p Point of type sp_point_521.
  31155. * pm Point of type ecc_point (result).
  31156. * returns MEMORY_E when allocation of memory in ecc_point fails otherwise
  31157. * MP_OKAY.
  31158. */
  31159. static int sp_521_point_to_ecc_point_17(const sp_point_521* p, ecc_point* pm)
  31160. {
  31161. int err;
  31162. err = sp_521_to_mp(p->x, pm->x);
  31163. if (err == MP_OKAY) {
  31164. err = sp_521_to_mp(p->y, pm->y);
  31165. }
  31166. if (err == MP_OKAY) {
  31167. err = sp_521_to_mp(p->z, pm->z);
  31168. }
  31169. return err;
  31170. }
  31171. /* Conditionally subtract b from a using the mask m.
  31172. * m is -1 to subtract and 0 when not copying.
  31173. *
  31174. * r A single precision number representing condition subtract result.
  31175. * a A single precision number to subtract from.
  31176. * b A single precision number to subtract.
  31177. * m Mask value to apply.
  31178. */
  31179. SP_NOINLINE static sp_digit sp_521_cond_sub_17(sp_digit* r, const sp_digit* a,
  31180. const sp_digit* b, sp_digit m)
  31181. {
  31182. sp_digit c = 0;
  31183. __asm__ __volatile__ (
  31184. "mov r5, #68\n\t"
  31185. "mov r9, r5\n\t"
  31186. "mov r8, #0\n\t"
  31187. "\n1:\n\t"
  31188. "ldr r6, [%[b], r8]\n\t"
  31189. "and r6, r6, %[m]\n\t"
  31190. "mov r5, #0\n\t"
  31191. "subs r5, r5, %[c]\n\t"
  31192. "ldr r5, [%[a], r8]\n\t"
  31193. "sbcs r5, r5, r6\n\t"
  31194. "sbcs %[c], %[c], %[c]\n\t"
  31195. "str r5, [%[r], r8]\n\t"
  31196. "add r8, r8, #4\n\t"
  31197. "cmp r8, r9\n\t"
  31198. #ifdef __GNUC__
  31199. "blt 1b\n\t"
  31200. #else
  31201. "blt.n 1b\n\t"
  31202. #endif /* __GNUC__ */
  31203. : [c] "+r" (c)
  31204. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  31205. : "memory", "r5", "r6", "r8", "r9"
  31206. );
  31207. return c;
  31208. }
  31209. /* Reduce the number back to 521 bits using Montgomery reduction.
  31210. *
  31211. * a A single precision number to reduce in place.
  31212. * m The single precision number representing the modulus.
  31213. * mp The digit representing the negative inverse of m mod 2^n.
  31214. */
  31215. SP_NOINLINE static void sp_521_mont_reduce_17(sp_digit* a, const sp_digit* m,
  31216. sp_digit mp)
  31217. {
  31218. (void)mp;
  31219. (void)m;
  31220. __asm__ __volatile__ (
  31221. "sub sp, sp, #68\n\t"
  31222. "mov r12, sp\n\t"
  31223. "add r14, %[a], #64\n\t"
  31224. "ldm r14!, {r1, r2, r3, r4, r5, r6, r7, r8, r9, r10}\n\t"
  31225. "lsr r1, r1, #9\n\t"
  31226. "orr r1, r1, r2, lsl #23\n\t"
  31227. "lsr r2, r2, #9\n\t"
  31228. "orr r2, r2, r3, lsl #23\n\t"
  31229. "lsr r3, r3, #9\n\t"
  31230. "orr r3, r3, r4, lsl #23\n\t"
  31231. "lsr r4, r4, #9\n\t"
  31232. "orr r4, r4, r5, lsl #23\n\t"
  31233. "lsr r5, r5, #9\n\t"
  31234. "orr r5, r5, r6, lsl #23\n\t"
  31235. "lsr r6, r6, #9\n\t"
  31236. "orr r6, r6, r7, lsl #23\n\t"
  31237. "lsr r7, r7, #9\n\t"
  31238. "orr r7, r7, r8, lsl #23\n\t"
  31239. "lsr r8, r8, #9\n\t"
  31240. "orr r8, r8, r9, lsl #23\n\t"
  31241. "lsr r9, r9, #9\n\t"
  31242. "orr r9, r9, r10, lsl #23\n\t"
  31243. "stm r12!, {r1, r2, r3, r4, r5, r6, r7, r8, r9}\n\t"
  31244. "mov r1, r10\n\t"
  31245. "ldm r14, {r2, r3, r4, r5, r6, r7, r8}\n\t"
  31246. "lsr r1, r1, #9\n\t"
  31247. "orr r1, r1, r2, lsl #23\n\t"
  31248. "lsr r2, r2, #9\n\t"
  31249. "orr r2, r2, r3, lsl #23\n\t"
  31250. "lsr r3, r3, #9\n\t"
  31251. "orr r3, r3, r4, lsl #23\n\t"
  31252. "lsr r4, r4, #9\n\t"
  31253. "orr r4, r4, r5, lsl #23\n\t"
  31254. "lsr r5, r5, #9\n\t"
  31255. "orr r5, r5, r6, lsl #23\n\t"
  31256. "lsr r6, r6, #9\n\t"
  31257. "orr r6, r6, r7, lsl #23\n\t"
  31258. "lsr r7, r7, #9\n\t"
  31259. "orr r7, r7, r8, lsl #23\n\t"
  31260. "lsr r8, r8, #9\n\t"
  31261. "stm r12!, {r1, r2, r3, r4, r5, r6, r7, r8}\n\t"
  31262. "mov r14, sp\n\t"
  31263. "ldm %[a], {r1, r2, r3, r4, r5, r6}\n\t"
  31264. "ldm r14!, {r7, r8, r9, r10, r11, r12}\n\t"
  31265. "adds r1, r1, r7\n\t"
  31266. "adcs r2, r2, r8\n\t"
  31267. "adcs r3, r3, r9\n\t"
  31268. "adcs r4, r4, r10\n\t"
  31269. "adcs r5, r5, r11\n\t"
  31270. "adcs r6, r6, r12\n\t"
  31271. "stm %[a]!, {r1, r2, r3, r4, r5, r6}\n\t"
  31272. "ldm %[a], {r1, r2, r3, r4, r5, r6}\n\t"
  31273. "ldm r14!, {r7, r8, r9, r10, r11, r12}\n\t"
  31274. "adcs r1, r1, r7\n\t"
  31275. "adcs r2, r2, r8\n\t"
  31276. "adcs r3, r3, r9\n\t"
  31277. "adcs r4, r4, r10\n\t"
  31278. "adcs r5, r5, r11\n\t"
  31279. "adcs r6, r6, r12\n\t"
  31280. "stm %[a]!, {r1, r2, r3, r4, r5, r6}\n\t"
  31281. "ldm %[a], {r1, r2, r3, r4, r5}\n\t"
  31282. "ldm r14!, {r7, r8, r9, r10, r11}\n\t"
  31283. "mov r14, #0x1ff\n\t"
  31284. "and r5, r5, r14\n\t"
  31285. "adcs r1, r1, r7\n\t"
  31286. "adcs r2, r2, r8\n\t"
  31287. "adcs r3, r3, r9\n\t"
  31288. "adcs r4, r4, r10\n\t"
  31289. "adcs r5, r5, r11\n\t"
  31290. "lsr r12, r5, #9\n\t"
  31291. "and r5, r5, r14\n\t"
  31292. "stm %[a]!, {r1, r2, r3, r4, r5}\n\t"
  31293. "sub %[a], %[a], #68\n\t"
  31294. "mov r11, #0\n\t"
  31295. "ldm %[a], {r1, r2, r3, r4, r5, r6, r7, r8, r9}\n\t"
  31296. "adds r1, r1, r12\n\t"
  31297. "adcs r2, r2, r11\n\t"
  31298. "adcs r3, r3, r11\n\t"
  31299. "adcs r4, r4, r11\n\t"
  31300. "adcs r5, r5, r11\n\t"
  31301. "adcs r6, r6, r11\n\t"
  31302. "adcs r7, r7, r11\n\t"
  31303. "adcs r8, r8, r11\n\t"
  31304. "adcs r9, r9, r11\n\t"
  31305. "stm %[a]!, {r1, r2, r3, r4, r5, r6, r7, r8, r9}\n\t"
  31306. "ldm %[a], {r1, r2, r3, r4, r5, r6, r7, r8}\n\t"
  31307. "adcs r1, r1, r11\n\t"
  31308. "adcs r2, r2, r11\n\t"
  31309. "adcs r3, r3, r11\n\t"
  31310. "adcs r4, r4, r11\n\t"
  31311. "adcs r5, r5, r11\n\t"
  31312. "adcs r6, r6, r11\n\t"
  31313. "adcs r7, r7, r11\n\t"
  31314. "adcs r8, r8, r11\n\t"
  31315. "stm %[a]!, {r1, r2, r3, r4, r5, r6, r7, r8}\n\t"
  31316. "add sp, sp, #68\n\t"
  31317. "sub %[a], %[a], #68\n\t"
  31318. : [a] "+r" (a)
  31319. :
  31320. : "memory", "r1", "r2", "r3", "r4", "r5", "r6", "r7", "r8", "r9", "r10", "r11", "r12", "r14"
  31321. );
  31322. }
  31323. /* Reduce the number back to 521 bits using Montgomery reduction.
  31324. *
  31325. * a A single precision number to reduce in place.
  31326. * m The single precision number representing the modulus.
  31327. * mp The digit representing the negative inverse of m mod 2^n.
  31328. */
  31329. SP_NOINLINE static void sp_521_mont_reduce_order_17(sp_digit* a, const sp_digit* m,
  31330. sp_digit mp)
  31331. {
  31332. sp_digit ca = 0;
  31333. __asm__ __volatile__ (
  31334. "mov r9, %[mp]\n\t"
  31335. "mov r12, %[m]\n\t"
  31336. "mov r10, %[a]\n\t"
  31337. "mov r4, #0\n\t"
  31338. "add r11, r10, #68\n\t"
  31339. "\n1:\n\t"
  31340. /* mu = a[i] * mp */
  31341. "mov %[mp], r9\n\t"
  31342. "ldr %[a], [r10]\n\t"
  31343. "mul %[mp], %[mp], %[a]\n\t"
  31344. "sub r14, r11, #4\n\t"
  31345. "cmp r10, r14\n\t"
  31346. "bne L_521_mont_reduce_17_nomask\n\t"
  31347. "mov r8, #0x1ff\n\t"
  31348. "and %[mp], %[mp], r8\n\t"
  31349. "L_521_mont_reduce_17_nomask:\n\t"
  31350. "mov %[m], r12\n\t"
  31351. "add r14, r10, #64\n\t"
  31352. "\n2:\n\t"
  31353. /* a[i+j] += m[j] * mu */
  31354. "ldr %[a], [r10]\n\t"
  31355. "mov r5, #0\n\t"
  31356. /* Multiply m[j] and mu - Start */
  31357. "ldr r8, [%[m]], #4\n\t"
  31358. "umull r6, r8, %[mp], r8\n\t"
  31359. "adds %[a], %[a], r6\n\t"
  31360. "adc r5, r5, r8\n\t"
  31361. /* Multiply m[j] and mu - Done */
  31362. "adds r4, r4, %[a]\n\t"
  31363. "adc r5, r5, #0\n\t"
  31364. "str r4, [r10], #4\n\t"
  31365. /* a[i+j+1] += m[j+1] * mu */
  31366. "ldr %[a], [r10]\n\t"
  31367. "mov r4, #0\n\t"
  31368. /* Multiply m[j] and mu - Start */
  31369. "ldr r8, [%[m]], #4\n\t"
  31370. "umull r6, r8, %[mp], r8\n\t"
  31371. "adds %[a], %[a], r6\n\t"
  31372. "adc r4, r4, r8\n\t"
  31373. /* Multiply m[j] and mu - Done */
  31374. "adds r5, r5, %[a]\n\t"
  31375. "adc r4, r4, #0\n\t"
  31376. "str r5, [r10], #4\n\t"
  31377. "cmp r10, r14\n\t"
  31378. #ifdef __GNUC__
  31379. "blt 2b\n\t"
  31380. #else
  31381. "blt.n 2b\n\t"
  31382. #endif /* __GNUC__ */
  31383. /* a[i+16] += m[16] * mu */
  31384. "mov r5, %[ca]\n\t"
  31385. "mov %[ca], #0\n\t"
  31386. /* Multiply m[16] and mu - Start */
  31387. "ldr r8, [%[m]]\n\t"
  31388. "umull r6, r8, %[mp], r8\n\t"
  31389. "adds r4, r4, r6\n\t"
  31390. "adcs r5, r5, r8\n\t"
  31391. "adc %[ca], %[ca], #0\n\t"
  31392. /* Multiply m[16] and mu - Done */
  31393. "ldr r6, [r10]\n\t"
  31394. "ldr r8, [r10, #4]\n\t"
  31395. "adds r6, r6, r4\n\t"
  31396. "adcs r8, r8, r5\n\t"
  31397. "adc %[ca], %[ca], #0\n\t"
  31398. "str r6, [r10]\n\t"
  31399. "str r8, [r10, #4]\n\t"
  31400. "mov r4, #0\n\t"
  31401. /* Next word in a */
  31402. "sub r10, r10, #60\n\t"
  31403. "cmp r10, r11\n\t"
  31404. #ifdef __GNUC__
  31405. "blt 1b\n\t"
  31406. #else
  31407. "blt.n 1b\n\t"
  31408. #endif /* __GNUC__ */
  31409. "sub r10, r10, #4\n\t"
  31410. "ldr r4, [r10], #4\n\t"
  31411. "ldr r5, [r10]\n\t"
  31412. "lsr r4, r4, #9\n\t"
  31413. "orr r4, r4, r5, lsl #23\n\t"
  31414. "str r4, [r10], #4\n\t"
  31415. "ldr r4, [r10]\n\t"
  31416. "lsr r5, r5, #9\n\t"
  31417. "orr r5, r5, r4, lsl #23\n\t"
  31418. "str r5, [r10], #4\n\t"
  31419. "ldr r5, [r10]\n\t"
  31420. "lsr r4, r4, #9\n\t"
  31421. "orr r4, r4, r5, lsl #23\n\t"
  31422. "str r4, [r10], #4\n\t"
  31423. "ldr r4, [r10]\n\t"
  31424. "lsr r5, r5, #9\n\t"
  31425. "orr r5, r5, r4, lsl #23\n\t"
  31426. "str r5, [r10], #4\n\t"
  31427. "ldr r5, [r10]\n\t"
  31428. "lsr r4, r4, #9\n\t"
  31429. "orr r4, r4, r5, lsl #23\n\t"
  31430. "str r4, [r10], #4\n\t"
  31431. "ldr r4, [r10]\n\t"
  31432. "lsr r5, r5, #9\n\t"
  31433. "orr r5, r5, r4, lsl #23\n\t"
  31434. "str r5, [r10], #4\n\t"
  31435. "ldr r5, [r10]\n\t"
  31436. "lsr r4, r4, #9\n\t"
  31437. "orr r4, r4, r5, lsl #23\n\t"
  31438. "str r4, [r10], #4\n\t"
  31439. "ldr r4, [r10]\n\t"
  31440. "lsr r5, r5, #9\n\t"
  31441. "orr r5, r5, r4, lsl #23\n\t"
  31442. "str r5, [r10], #4\n\t"
  31443. "ldr r5, [r10]\n\t"
  31444. "lsr r4, r4, #9\n\t"
  31445. "orr r4, r4, r5, lsl #23\n\t"
  31446. "str r4, [r10], #4\n\t"
  31447. "ldr r4, [r10]\n\t"
  31448. "lsr r5, r5, #9\n\t"
  31449. "orr r5, r5, r4, lsl #23\n\t"
  31450. "str r5, [r10], #4\n\t"
  31451. "ldr r5, [r10]\n\t"
  31452. "lsr r4, r4, #9\n\t"
  31453. "orr r4, r4, r5, lsl #23\n\t"
  31454. "str r4, [r10], #4\n\t"
  31455. "ldr r4, [r10]\n\t"
  31456. "lsr r5, r5, #9\n\t"
  31457. "orr r5, r5, r4, lsl #23\n\t"
  31458. "str r5, [r10], #4\n\t"
  31459. "ldr r5, [r10]\n\t"
  31460. "lsr r4, r4, #9\n\t"
  31461. "orr r4, r4, r5, lsl #23\n\t"
  31462. "str r4, [r10], #4\n\t"
  31463. "ldr r4, [r10]\n\t"
  31464. "lsr r5, r5, #9\n\t"
  31465. "orr r5, r5, r4, lsl #23\n\t"
  31466. "str r5, [r10], #4\n\t"
  31467. "ldr r5, [r10]\n\t"
  31468. "lsr r4, r4, #9\n\t"
  31469. "orr r4, r4, r5, lsl #23\n\t"
  31470. "str r4, [r10], #4\n\t"
  31471. "ldr r4, [r10]\n\t"
  31472. "lsr r5, r5, #9\n\t"
  31473. "orr r5, r5, r4, lsl #23\n\t"
  31474. "str r5, [r10], #4\n\t"
  31475. "lsr r4, r4, #9\n\t"
  31476. "str r4, [r10]\n\t"
  31477. "lsr %[ca], r4, #9\n\t"
  31478. "sub %[a], r10, #64\n\t"
  31479. "mov %[m], r12\n\t"
  31480. : [ca] "+r" (ca), [a] "+r" (a)
  31481. : [m] "r" (m), [mp] "r" (mp)
  31482. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  31483. );
  31484. sp_521_cond_sub_17(a - 17, a, m, (sp_digit)0 - ca);
  31485. }
  31486. /* Multiply two Montgomery form numbers mod the modulus (prime).
  31487. * (r = a * b mod m)
  31488. *
  31489. * r Result of multiplication.
  31490. * a First number to multiply in Montgomery form.
  31491. * b Second number to multiply in Montgomery form.
  31492. * m Modulus (prime).
  31493. * mp Montgomery mulitplier.
  31494. */
  31495. SP_NOINLINE static void sp_521_mont_mul_17(sp_digit* r, const sp_digit* a,
  31496. const sp_digit* b, const sp_digit* m, sp_digit mp)
  31497. {
  31498. sp_521_mul_17(r, a, b);
  31499. sp_521_mont_reduce_17(r, m, mp);
  31500. }
  31501. /* Square the Montgomery form number. (r = a * a mod m)
  31502. *
  31503. * r Result of squaring.
  31504. * a Number to square in Montgomery form.
  31505. * m Modulus (prime).
  31506. * mp Montgomery mulitplier.
  31507. */
  31508. SP_NOINLINE static void sp_521_mont_sqr_17(sp_digit* r, const sp_digit* a,
  31509. const sp_digit* m, sp_digit mp)
  31510. {
  31511. sp_521_sqr_17(r, a);
  31512. sp_521_mont_reduce_17(r, m, mp);
  31513. }
  31514. #if !defined(WOLFSSL_SP_SMALL) || defined(HAVE_COMP_KEY)
  31515. /* Square the Montgomery form number a number of times. (r = a ^ n mod m)
  31516. *
  31517. * r Result of squaring.
  31518. * a Number to square in Montgomery form.
  31519. * n Number of times to square.
  31520. * m Modulus (prime).
  31521. * mp Montgomery mulitplier.
  31522. */
  31523. static void sp_521_mont_sqr_n_17(sp_digit* r, const sp_digit* a, int n,
  31524. const sp_digit* m, sp_digit mp)
  31525. {
  31526. sp_521_mont_sqr_17(r, a, m, mp);
  31527. for (; n > 1; n--) {
  31528. sp_521_mont_sqr_17(r, r, m, mp);
  31529. }
  31530. }
  31531. #endif /* !WOLFSSL_SP_SMALL | HAVE_COMP_KEY */
  31532. #ifdef WOLFSSL_SP_SMALL
  /* The P521 prime minus 2 as 17 little-endian 32-bit words. Its bits are
   * scanned as the exponent by the small-code inversion. */
  static const uint32_t p521_mod_minus_2[17] = {
      0xfffffffdU, 0xffffffffU, 0xffffffffU, 0xffffffffU,
      0xffffffffU, 0xffffffffU, 0xffffffffU, 0xffffffffU,
      0xffffffffU, 0xffffffffU, 0xffffffffU, 0xffffffffU,
      0xffffffffU, 0xffffffffU, 0xffffffffU, 0xffffffffU,
      0x000001ffU
  };
  31539. #endif /* WOLFSSL_SP_SMALL */
  31540. /* Invert the number, in Montgomery form, modulo the modulus (prime) of the
  31541. * P521 curve. (r = 1 / a mod m)
  31542. *
  31543. * r Inverse result.
  31544. * a Number to invert.
  31545. * td Temporary data.
  31546. */
  31547. static void sp_521_mont_inv_17(sp_digit* r, const sp_digit* a, sp_digit* td)
  31548. {
  31549. #ifdef WOLFSSL_SP_SMALL
  31550. sp_digit* t = td;
  31551. int i;
  31552. XMEMCPY(t, a, sizeof(sp_digit) * 17);
  31553. for (i=519; i>=0; i--) {
  31554. sp_521_mont_sqr_17(t, t, p521_mod, p521_mp_mod);
  31555. if (p521_mod_minus_2[i / 32] & ((sp_digit)1 << (i % 32)))
  31556. sp_521_mont_mul_17(t, t, a, p521_mod, p521_mp_mod);
  31557. }
  31558. XMEMCPY(r, t, sizeof(sp_digit) * 17);
  31559. #else
  31560. sp_digit* t1 = td;
  31561. sp_digit* t2 = td + 2 * 17;
  31562. sp_digit* t3 = td + 4 * 17;
  31563. /* 0x2 */
  31564. sp_521_mont_sqr_17(t1, a, p521_mod, p521_mp_mod);
  31565. /* 0x3 */
  31566. sp_521_mont_mul_17(t2, t1, a, p521_mod, p521_mp_mod);
  31567. /* 0x6 */
  31568. sp_521_mont_sqr_17(t1, t2, p521_mod, p521_mp_mod);
  31569. /* 0x7 */
  31570. sp_521_mont_mul_17(t3, t1, a, p521_mod, p521_mp_mod);
  31571. /* 0xc */
  31572. sp_521_mont_sqr_n_17(t1, t2, 2, p521_mod, p521_mp_mod);
  31573. /* 0xf */
  31574. sp_521_mont_mul_17(t2, t2, t1, p521_mod, p521_mp_mod);
  31575. /* 0x78 */
  31576. sp_521_mont_sqr_n_17(t1, t2, 3, p521_mod, p521_mp_mod);
  31577. /* 0x7f */
  31578. sp_521_mont_mul_17(t3, t3, t1, p521_mod, p521_mp_mod);
  31579. /* 0xf0 */
  31580. sp_521_mont_sqr_n_17(t1, t2, 4, p521_mod, p521_mp_mod);
  31581. /* 0xff */
  31582. sp_521_mont_mul_17(t2, t2, t1, p521_mod, p521_mp_mod);
  31583. /* 0xff00 */
  31584. sp_521_mont_sqr_n_17(t1, t2, 8, p521_mod, p521_mp_mod);
  31585. /* 0xffff */
  31586. sp_521_mont_mul_17(t2, t2, t1, p521_mod, p521_mp_mod);
  31587. /* 0xffff0000 */
  31588. sp_521_mont_sqr_n_17(t1, t2, 16, p521_mod, p521_mp_mod);
  31589. /* 0xffffffff */
  31590. sp_521_mont_mul_17(t2, t2, t1, p521_mod, p521_mp_mod);
  31591. /* 0xffffffff00000000 */
  31592. sp_521_mont_sqr_n_17(t1, t2, 32, p521_mod, p521_mp_mod);
  31593. /* 0xffffffffffffffff */
  31594. sp_521_mont_mul_17(t2, t2, t1, p521_mod, p521_mp_mod);
  31595. /* 0xffffffffffffffff0000000000000000 */
  31596. sp_521_mont_sqr_n_17(t1, t2, 64, p521_mod, p521_mp_mod);
  31597. /* 0xffffffffffffffffffffffffffffffff */
  31598. sp_521_mont_mul_17(t2, t2, t1, p521_mod, p521_mp_mod);
  31599. /* 0xffffffffffffffffffffffffffffffff00000000000000000000000000000000 */
  31600. sp_521_mont_sqr_n_17(t1, t2, 128, p521_mod, p521_mp_mod);
  31601. /* 0xffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff */
  31602. sp_521_mont_mul_17(t2, t2, t1, p521_mod, p521_mp_mod);
  31603. /* 0xffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff0000000000000000000000000000000000000000000000000000000000000000 */
  31604. sp_521_mont_sqr_n_17(t1, t2, 256, p521_mod, p521_mp_mod);
  31605. /* 0xffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff */
  31606. sp_521_mont_mul_17(t2, t2, t1, p521_mod, p521_mp_mod);
  31607. /* 0x7fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff80 */
  31608. sp_521_mont_sqr_n_17(t1, t2, 7, p521_mod, p521_mp_mod);
  31609. /* 0x7fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff */
  31610. sp_521_mont_mul_17(t2, t3, t1, p521_mod, p521_mp_mod);
  31611. /* 0x1fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffc */
  31612. sp_521_mont_sqr_n_17(t1, t2, 2, p521_mod, p521_mp_mod);
  31613. /* 0x1fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffd */
  31614. sp_521_mont_mul_17(r, t1, a, p521_mod, p521_mp_mod);
  31615. #endif /* WOLFSSL_SP_SMALL */
  31616. }
  31617. /* Compare a with b in constant time.
  31618. *
  31619. * a A single precision integer.
  31620. * b A single precision integer.
  31621. * return -ve, 0 or +ve if a is less than, equal to or greater than b
  31622. * respectively.
  31623. */
  31624. SP_NOINLINE static sp_int32 sp_521_cmp_17(const sp_digit* a, const sp_digit* b)
  31625. {
  31626. sp_digit r = 0;
  31627. __asm__ __volatile__ (
  31628. "mov r3, #0\n\t"
  31629. "mvn r3, r3\n\t"
  31630. "mov r6, #64\n\t"
  31631. "\n1:\n\t"
  31632. "ldr r8, [%[a], r6]\n\t"
  31633. "ldr r5, [%[b], r6]\n\t"
  31634. "and r8, r8, r3\n\t"
  31635. "and r5, r5, r3\n\t"
  31636. "mov r4, r8\n\t"
  31637. "subs r8, r8, r5\n\t"
  31638. "sbc r8, r8, r8\n\t"
  31639. "add %[r], %[r], r8\n\t"
  31640. "mvn r8, r8\n\t"
  31641. "and r3, r3, r8\n\t"
  31642. "subs r5, r5, r4\n\t"
  31643. "sbc r8, r8, r8\n\t"
  31644. "sub %[r], %[r], r8\n\t"
  31645. "mvn r8, r8\n\t"
  31646. "and r3, r3, r8\n\t"
  31647. "sub r6, r6, #4\n\t"
  31648. "cmp r6, #0\n\t"
  31649. #ifdef __GNUC__
  31650. "bge 1b\n\t"
  31651. #else
  31652. "bge.n 1b\n\t"
  31653. #endif /* __GNUC__ */
  31654. : [r] "+r" (r)
  31655. : [a] "r" (a), [b] "r" (b)
  31656. : "r3", "r4", "r5", "r6", "r8"
  31657. );
  31658. return r;
  31659. }
  31660. /* Normalize the values in each word to 32 bits.
  31661. *
  31662. * a Array of sp_digit to normalize.
   *
   * The macro expands to nothing, so invoking it has no effect here.
   * NOTE(review): presumably digits in this implementation are already full
   * 32-bit words and need no normalization - confirm.
  31663. */
  31664. #define sp_521_norm_17(a)
  31665. /* Map the Montgomery form projective coordinate point to an affine point.
  31666. *
  31667. * r Resulting affine coordinate point.
  31668. * p Montgomery form projective coordinate point.
  31669. * t Temporary ordinate data.
  31670. */
  31671. static void sp_521_map_17(sp_point_521* r, const sp_point_521* p,
  31672. sp_digit* t)
  31673. {
  31674. sp_digit* t1 = t;
  31675. sp_digit* t2 = t + 2*17;
  31676. sp_int32 n;
  31677. sp_521_mont_inv_17(t1, p->z, t + 2*17);
  31678. sp_521_mont_sqr_17(t2, t1, p521_mod, p521_mp_mod);
  31679. sp_521_mont_mul_17(t1, t2, t1, p521_mod, p521_mp_mod);
  31680. /* x /= z^2 */
  31681. sp_521_mont_mul_17(r->x, p->x, t2, p521_mod, p521_mp_mod);
  31682. XMEMSET(r->x + 17, 0, sizeof(r->x) / 2U);
  31683. sp_521_mont_reduce_17(r->x, p521_mod, p521_mp_mod);
  31684. /* Reduce x to less than modulus */
  31685. n = sp_521_cmp_17(r->x, p521_mod);
  31686. sp_521_cond_sub_17(r->x, r->x, p521_mod, ~(n >> 31));
  31687. sp_521_norm_17(r->x);
  31688. /* y /= z^3 */
  31689. sp_521_mont_mul_17(r->y, p->y, t1, p521_mod, p521_mp_mod);
  31690. XMEMSET(r->y + 17, 0, sizeof(r->y) / 2U);
  31691. sp_521_mont_reduce_17(r->y, p521_mod, p521_mp_mod);
  31692. /* Reduce y to less than modulus */
  31693. n = sp_521_cmp_17(r->y, p521_mod);
  31694. sp_521_cond_sub_17(r->y, r->y, p521_mod, ~(n >> 31));
  31695. sp_521_norm_17(r->y);
  31696. XMEMSET(r->z, 0, sizeof(r->z) / 2);
  31697. r->z[0] = 1;
  31698. }
  31699. /* Add two Montgomery form numbers (r = a + b % m).
  31700. *
  31701. * r Result of addition.
  31702. * a First number to add in Montgomery form.
  31703. * b Second number to add in Montgomery form.
  31704. * m Modulus (prime).
  31705. */
  31706. SP_NOINLINE static void sp_521_mont_add_17(sp_digit* r, const sp_digit* a, const sp_digit* b,
  31707. const sp_digit* m)
  31708. {
  31709. (void)m;
  31710. __asm__ __volatile__ (
  31711. "mov r12, #0\n\t"
  31712. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31713. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  31714. "adds r4, r4, r8\n\t"
  31715. "adcs r5, r5, r9\n\t"
  31716. "adcs r6, r6, r10\n\t"
  31717. "adcs r7, r7, r14\n\t"
  31718. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31719. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31720. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  31721. "adcs r4, r4, r8\n\t"
  31722. "adcs r5, r5, r9\n\t"
  31723. "adcs r6, r6, r10\n\t"
  31724. "adcs r7, r7, r14\n\t"
  31725. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31726. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31727. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  31728. "adcs r4, r4, r8\n\t"
  31729. "adcs r5, r5, r9\n\t"
  31730. "adcs r6, r6, r10\n\t"
  31731. "adcs r7, r7, r14\n\t"
  31732. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31733. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31734. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  31735. "adcs r4, r4, r8\n\t"
  31736. "adcs r5, r5, r9\n\t"
  31737. "adcs r6, r6, r10\n\t"
  31738. "adcs r7, r7, r14\n\t"
  31739. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31740. "ldm %[a]!, {r4}\n\t"
  31741. "ldm %[b]!, {r8}\n\t"
  31742. "adcs r4, r4, r8\n\t"
  31743. "mov r14, #0x1ff\n\t"
  31744. "lsr r12, r4, #9\n\t"
  31745. "and r4, r4, r14\n\t"
  31746. "stm %[r]!, {r4}\n\t"
  31747. "sub %[r], %[r], #68\n\t"
  31748. "mov r14, #0\n\t"
  31749. "ldm %[r], {r4, r5, r6, r7}\n\t"
  31750. "adds r4, r4, r12\n\t"
  31751. "adcs r5, r5, r14\n\t"
  31752. "adcs r6, r6, r14\n\t"
  31753. "adcs r7, r7, r14\n\t"
  31754. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31755. "ldm %[r], {r4, r5, r6, r7}\n\t"
  31756. "adcs r4, r4, r14\n\t"
  31757. "adcs r5, r5, r14\n\t"
  31758. "adcs r6, r6, r14\n\t"
  31759. "adcs r7, r7, r14\n\t"
  31760. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31761. "ldm %[r], {r4, r5, r6, r7}\n\t"
  31762. "adcs r4, r4, r14\n\t"
  31763. "adcs r5, r5, r14\n\t"
  31764. "adcs r6, r6, r14\n\t"
  31765. "adcs r7, r7, r14\n\t"
  31766. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31767. "ldm %[r], {r4, r5, r6, r7}\n\t"
  31768. "adcs r4, r4, r14\n\t"
  31769. "adcs r5, r5, r14\n\t"
  31770. "adcs r6, r6, r14\n\t"
  31771. "adcs r7, r7, r14\n\t"
  31772. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31773. "ldm %[r], {r4}\n\t"
  31774. "adcs r4, r4, r14\n\t"
  31775. "stm %[r]!, {r4}\n\t"
  31776. "sub %[r], %[r], #68\n\t"
  31777. : [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  31778. :
  31779. : "memory", "r4", "r5", "r6", "r7", "r8", "r9", "r10", "r14", "r12"
  31780. );
  31781. }
  31782. /* Double a Montgomery form number (r = a + a % m).
  31783. *
  31784. * r Result of doubling.
  31785. * a Number to double in Montgomery form.
  31786. * m Modulus (prime).
  31787. */
  31788. SP_NOINLINE static void sp_521_mont_dbl_17(sp_digit* r, const sp_digit* a, const sp_digit* m)
  31789. {
  31790. (void)m;
  31791. __asm__ __volatile__ (
  31792. "mov r8, #0\n\t"
  31793. "ldm %[a]!, {r2, r3, r4, r5, r6, r7}\n\t"
  31794. "adds r2, r2, r2\n\t"
  31795. "adcs r3, r3, r3\n\t"
  31796. "adcs r4, r4, r4\n\t"
  31797. "adcs r5, r5, r5\n\t"
  31798. "adcs r6, r6, r6\n\t"
  31799. "adcs r7, r7, r7\n\t"
  31800. "str r2, [%[r], #0]\n\t"
  31801. "str r3, [%[r], #4]\n\t"
  31802. "str r4, [%[r], #8]\n\t"
  31803. "str r5, [%[r], #12]\n\t"
  31804. "str r6, [%[r], #16]\n\t"
  31805. "stm %[r]!, {r2, r3, r4, r5, r6, r7}\n\t"
  31806. "ldm %[a]!, {r2, r3, r4, r5, r6, r7}\n\t"
  31807. "adcs r2, r2, r2\n\t"
  31808. "adcs r3, r3, r3\n\t"
  31809. "adcs r4, r4, r4\n\t"
  31810. "adcs r5, r5, r5\n\t"
  31811. "adcs r6, r6, r6\n\t"
  31812. "adcs r7, r7, r7\n\t"
  31813. "str r2, [%[r], #0]\n\t"
  31814. "str r3, [%[r], #4]\n\t"
  31815. "str r4, [%[r], #8]\n\t"
  31816. "str r5, [%[r], #12]\n\t"
  31817. "str r6, [%[r], #16]\n\t"
  31818. "stm %[r]!, {r2, r3, r4, r5, r6, r7}\n\t"
  31819. "ldm %[a]!, {r2, r3, r4, r5, r6}\n\t"
  31820. "adcs r2, r2, r2\n\t"
  31821. "adcs r3, r3, r3\n\t"
  31822. "adcs r4, r4, r4\n\t"
  31823. "adcs r5, r5, r5\n\t"
  31824. "adcs r6, r6, r6\n\t"
  31825. "mov r9, #0x1ff\n\t"
  31826. "lsr r8, r6, #9\n\t"
  31827. "and r6, r6, r9\n\t"
  31828. "stm %[r]!, {r2, r3, r4, r5, r6}\n\t"
  31829. "sub %[r], %[r], #68\n\t"
  31830. "mov r9, #0\n\t"
  31831. "ldm %[r], {r2, r3, r4, r5, r6, r7}\n\t"
  31832. "adds r2, r2, r8\n\t"
  31833. "adcs r3, r3, r9\n\t"
  31834. "adcs r4, r4, r9\n\t"
  31835. "adcs r5, r5, r9\n\t"
  31836. "adcs r6, r6, r9\n\t"
  31837. "adcs r7, r7, r9\n\t"
  31838. "stm %[r]!, {r2, r3, r4, r5, r6, r7}\n\t"
  31839. "ldm %[r], {r2, r3, r4, r5, r6, r7}\n\t"
  31840. "adcs r2, r2, r9\n\t"
  31841. "adcs r3, r3, r9\n\t"
  31842. "adcs r4, r4, r9\n\t"
  31843. "adcs r5, r5, r9\n\t"
  31844. "adcs r6, r6, r9\n\t"
  31845. "adcs r7, r7, r9\n\t"
  31846. "stm %[r]!, {r2, r3, r4, r5, r6, r7}\n\t"
  31847. "ldm %[r], {r2, r3, r4, r5, r6}\n\t"
  31848. "adcs r2, r2, r9\n\t"
  31849. "adcs r3, r3, r9\n\t"
  31850. "adcs r4, r4, r9\n\t"
  31851. "adcs r5, r5, r9\n\t"
  31852. "adcs r6, r6, r9\n\t"
  31853. "stm %[r]!, {r2, r3, r4, r5, r6}\n\t"
  31854. "sub %[r], %[r], #68\n\t"
  31855. "sub %[a], %[a], #68\n\t"
  31856. : [r] "+r" (r), [a] "+r" (a)
  31857. :
  31858. : "memory", "r2", "r3", "r4", "r5", "r6", "r7", "r8", "r9"
  31859. );
  31860. }
  31861. /* Triple a Montgomery form number (r = (a + a + a) % m).
  31862. *
         * Works in three passes over the 17 words: r = a + a, then r = r + a,
         * then the bits at or above bit 521 are folded back into bit 0.
         * The modulus argument is never read; the fold relies on
         * 2^521 = 1 (mod 2^521 - 1).
         * NOTE(review): assumes m is 2^521 - 1 - confirm against callers.
         * r must not overlap a: the second pass re-reads a after the first pass
         * has already written r.
         *
  31863. * r Result of tripling.
  31864. * a Number to triple in Montgomery form.
  31865. * m Modulus (prime). Unused.
  31866. */
  31867. SP_NOINLINE static void sp_521_mont_tpl_17(sp_digit* r, const sp_digit* a, const sp_digit* m)
  31868. {
  31869. (void)m;
  31870. __asm__ __volatile__ (
         /* r12 is overwritten by the lsr further down before it is read. */
  31871. "mov r12, #0\n\t"
         /* Pass 1: r = a + a, four words per step, carry chained by adcs. */
  31872. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31873. "adds r4, r4, r4\n\t"
  31874. "adcs r5, r5, r5\n\t"
  31875. "adcs r6, r6, r6\n\t"
  31876. "adcs r7, r7, r7\n\t"
  31877. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31878. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31879. "adcs r4, r4, r4\n\t"
  31880. "adcs r5, r5, r5\n\t"
  31881. "adcs r6, r6, r6\n\t"
  31882. "adcs r7, r7, r7\n\t"
  31883. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31884. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31885. "adcs r4, r4, r4\n\t"
  31886. "adcs r5, r5, r5\n\t"
  31887. "adcs r6, r6, r6\n\t"
  31888. "adcs r7, r7, r7\n\t"
  31889. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31890. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31891. "adcs r4, r4, r4\n\t"
  31892. "adcs r5, r5, r5\n\t"
  31893. "adcs r6, r6, r6\n\t"
  31894. "adcs r7, r7, r7\n\t"
  31895. "stm %[r]!, {r4, r5, r6, r7}\n\t"
         /* Seventeenth (top) word. */
  31896. "ldm %[a]!, {r4}\n\t"
  31897. "adcs r4, r4, r4\n\t"
  31898. "stm %[r]!, {r4}\n\t"
         /* Rewind both pointers by 17 words (68 bytes). */
  31899. "sub %[r], %[r], #68\n\t"
  31900. "sub %[a], %[a], #68\n\t"
         /* Pass 2: r = r + a. r is read without write-back, then stored with
          * write-back, so it advances once per chunk. */
  31901. "ldm %[r], {r8, r9, r10, r14}\n\t"
  31902. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31903. "adds r8, r8, r4\n\t"
  31904. "adcs r9, r9, r5\n\t"
  31905. "adcs r10, r10, r6\n\t"
  31906. "adcs r14, r14, r7\n\t"
  31907. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  31908. "ldm %[r], {r8, r9, r10, r14}\n\t"
  31909. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31910. "adcs r8, r8, r4\n\t"
  31911. "adcs r9, r9, r5\n\t"
  31912. "adcs r10, r10, r6\n\t"
  31913. "adcs r14, r14, r7\n\t"
  31914. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  31915. "ldm %[r], {r8, r9, r10, r14}\n\t"
  31916. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31917. "adcs r8, r8, r4\n\t"
  31918. "adcs r9, r9, r5\n\t"
  31919. "adcs r10, r10, r6\n\t"
  31920. "adcs r14, r14, r7\n\t"
  31921. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  31922. "ldm %[r], {r8, r9, r10, r14}\n\t"
  31923. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31924. "adcs r8, r8, r4\n\t"
  31925. "adcs r9, r9, r5\n\t"
  31926. "adcs r10, r10, r6\n\t"
  31927. "adcs r14, r14, r7\n\t"
  31928. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  31929. "ldm %[r], {r8}\n\t"
  31930. "ldm %[a]!, {r4}\n\t"
  31931. "adcs r8, r8, r4\n\t"
         /* Split the top word: r12 = bits 9 and up (value bits >= 521),
          * r8 = low 9 bits, which is what gets stored. */
  31932. "mov r14, #0x1ff\n\t"
  31933. "lsr r12, r8, #9\n\t"
  31934. "and r8, r8, r14\n\t"
  31935. "stm %[r]!, {r8}\n\t"
  31936. "sub %[r], %[r], #68\n\t"
         /* Pass 3: add the overflow r12 into word 0 and ripple the carry
          * through every word (r14 = 0). */
  31937. "mov r14, #0\n\t"
  31938. "ldm %[r], {r4, r5, r6, r7}\n\t"
  31939. "adds r4, r4, r12\n\t"
  31940. "adcs r5, r5, r14\n\t"
  31941. "adcs r6, r6, r14\n\t"
  31942. "adcs r7, r7, r14\n\t"
  31943. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31944. "ldm %[r], {r4, r5, r6, r7}\n\t"
  31945. "adcs r4, r4, r14\n\t"
  31946. "adcs r5, r5, r14\n\t"
  31947. "adcs r6, r6, r14\n\t"
  31948. "adcs r7, r7, r14\n\t"
  31949. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31950. "ldm %[r], {r4, r5, r6, r7}\n\t"
  31951. "adcs r4, r4, r14\n\t"
  31952. "adcs r5, r5, r14\n\t"
  31953. "adcs r6, r6, r14\n\t"
  31954. "adcs r7, r7, r14\n\t"
  31955. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31956. "ldm %[r], {r4, r5, r6, r7}\n\t"
  31957. "adcs r4, r4, r14\n\t"
  31958. "adcs r5, r5, r14\n\t"
  31959. "adcs r6, r6, r14\n\t"
  31960. "adcs r7, r7, r14\n\t"
  31961. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31962. "ldm %[r], {r4}\n\t"
  31963. "adcs r4, r4, r14\n\t"
  31964. "stm %[r]!, {r4}\n\t"
         /* r is put back to the start of the result; a is left 68 bytes past
          * its start (it is only an in/out operand of this asm statement). */
  31965. "sub %[r], %[r], #68\n\t"
  31966. : [r] "+r" (r), [a] "+r" (a)
  31967. :
  31968. : "memory", "r4", "r5", "r6", "r7", "r8", "r9", "r10", "r14", "r12"
  31969. );
  31970. }
  31971. /* Subtract two Montgomery form numbers (r = (a - b) % m).
  31972. *
         * Two passes over the 17 words: a plain multi-word subtraction, then a
         * correction taken from the sign of the top word. The modulus argument
         * is never read.
         * NOTE(review): the correction (mask the top word to 9 bits, then
         * subtract 1 when the top word was negative) amounts to adding
         * 2^521 - 1 for inputs below 2^521 - confirm m is that prime.
         * Each chunk of a and b is loaded before the matching chunk of r is
         * stored; callers in this file pass r == a.
         *
  31973. * r Result of subtraction.
  31974. * a Number to subtract from in Montgomery form.
  31975. * b Number to subtract with in Montgomery form.
  31976. * m Modulus (prime). Unused.
  31977. */
  31978. SP_NOINLINE static void sp_521_mont_sub_17(sp_digit* r, const sp_digit* a, const sp_digit* b,
  31979. const sp_digit* m)
  31980. {
  31981. (void)m;
  31982. __asm__ __volatile__ (
         /* r12 is overwritten by the asr further down before it is read. */
  31983. "mov r12, #0\n\t"
         /* Pass 1: r = a - b, four words per step, borrow chained by sbcs. */
  31984. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31985. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  31986. "subs r4, r4, r8\n\t"
  31987. "sbcs r5, r5, r9\n\t"
  31988. "sbcs r6, r6, r10\n\t"
  31989. "sbcs r7, r7, r14\n\t"
  31990. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31991. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31992. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  31993. "sbcs r4, r4, r8\n\t"
  31994. "sbcs r5, r5, r9\n\t"
  31995. "sbcs r6, r6, r10\n\t"
  31996. "sbcs r7, r7, r14\n\t"
  31997. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  31998. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  31999. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  32000. "sbcs r4, r4, r8\n\t"
  32001. "sbcs r5, r5, r9\n\t"
  32002. "sbcs r6, r6, r10\n\t"
  32003. "sbcs r7, r7, r14\n\t"
  32004. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  32005. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  32006. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  32007. "sbcs r4, r4, r8\n\t"
  32008. "sbcs r5, r5, r9\n\t"
  32009. "sbcs r6, r6, r10\n\t"
  32010. "sbcs r7, r7, r14\n\t"
  32011. "stm %[r]!, {r4, r5, r6, r7}\n\t"
         /* Seventeenth (top) word. */
  32012. "ldm %[a]!, {r4}\n\t"
  32013. "ldm %[b]!, {r8}\n\t"
  32014. "sbcs r4, r4, r8\n\t"
         /* r12 = top word arithmetically shifted right by 9 and then negated;
          * r4 keeps only its low 9 bits and is what gets stored. */
  32015. "mov r14, #0x1ff\n\t"
  32016. "asr r12, r4, #9\n\t"
  32017. "and r4, r4, r14\n\t"
  32018. "neg r12, r12\n\t"
  32019. "stm %[r]!, {r4}\n\t"
  32020. "sub %[r], %[r], #68\n\t"
         /* Pass 2: subtract r12 from word 0 and ripple the borrow through
          * every word (r14 = 0). */
  32021. "mov r14, #0\n\t"
  32022. "ldm %[r], {r4, r5, r6, r7}\n\t"
  32023. "subs r4, r4, r12\n\t"
  32024. "sbcs r5, r5, r14\n\t"
  32025. "sbcs r6, r6, r14\n\t"
  32026. "sbcs r7, r7, r14\n\t"
  32027. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  32028. "ldm %[r], {r4, r5, r6, r7}\n\t"
  32029. "sbcs r4, r4, r14\n\t"
  32030. "sbcs r5, r5, r14\n\t"
  32031. "sbcs r6, r6, r14\n\t"
  32032. "sbcs r7, r7, r14\n\t"
  32033. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  32034. "ldm %[r], {r4, r5, r6, r7}\n\t"
  32035. "sbcs r4, r4, r14\n\t"
  32036. "sbcs r5, r5, r14\n\t"
  32037. "sbcs r6, r6, r14\n\t"
  32038. "sbcs r7, r7, r14\n\t"
  32039. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  32040. "ldm %[r], {r4, r5, r6, r7}\n\t"
  32041. "sbcs r4, r4, r14\n\t"
  32042. "sbcs r5, r5, r14\n\t"
  32043. "sbcs r6, r6, r14\n\t"
  32044. "sbcs r7, r7, r14\n\t"
  32045. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  32046. "ldm %[r], {r4}\n\t"
  32047. "sbcs r4, r4, r14\n\t"
  32048. "stm %[r]!, {r4}\n\t"
         /* r is put back to the start of the result; a and b are left 68 bytes
          * past their starts (in/out operands of this asm statement only). */
  32049. "sub %[r], %[r], #68\n\t"
  32050. : [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  32051. :
  32052. : "memory", "r4", "r5", "r6", "r7", "r8", "r9", "r10", "r14", "r12"
  32053. );
  32054. }
         /* The "lower" variant is just another name for the full subtraction. */
  32055. #define sp_521_mont_sub_lower_17 sp_521_mont_sub_17
  32056. /* Conditionally add b to a using the mask m (r = a + (b & m)).
  32057. * m is -1 to add and 0 when not.
         * Every word of a and b is read and every word of r is written whatever
         * the mask is; the mask only decides whether b contributes to the sum.
  32058. *
  32059. * r A single precision number representing conditional add result.
  32060. * a A single precision number to add with.
  32061. * b A single precision number to add.
  32062. * m Mask value to apply.
         * returns the carry out of the top (17th) word: 0 or 1.
  32063. */
  32064. SP_NOINLINE static sp_digit sp_521_cond_add_17(sp_digit* r, const sp_digit* a, const sp_digit* b,
  32065. sp_digit m)
  32066. {
         /* c holds the carry between loop iterations and is the return value. */
  32067. sp_digit c = 0;
  32068. __asm__ __volatile__ (
         /* r9 = 68, the byte length of 17 words; r8 = current byte offset. */
  32069. "mov r5, #68\n\t"
  32070. "mov r9, r5\n\t"
  32071. "mov r8, #0\n\t"
  32072. "\n1:\n\t"
         /* r6 = b word masked with m. */
  32073. "ldr r6, [%[b], r8]\n\t"
  32074. "and r6, r6, %[m]\n\t"
         /* c + 0xffffffff carries out exactly when c is non-zero, so this
          * reloads the carry flag from c; the r5 result is discarded. */
  32075. "adds r5, %[c], #-1\n\t"
  32076. "ldr r5, [%[a], r8]\n\t"
  32077. "adcs r5, r5, r6\n\t"
         /* Capture the new carry flag in c as 0 or 1. */
  32078. "mov %[c], #0\n\t"
  32079. "adcs %[c], %[c], %[c]\n\t"
  32080. "str r5, [%[r], r8]\n\t"
         /* Next word; loop while the offset is below 68. */
  32081. "add r8, r8, #4\n\t"
  32082. "cmp r8, r9\n\t"
  32083. #ifdef __GNUC__
  32084. "blt 1b\n\t"
  32085. #else
  32086. "blt.n 1b\n\t"
  32087. #endif /* __GNUC__ */
  32088. : [c] "+r" (c)
  32089. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  32090. : "memory", "r5", "r6", "r8", "r9"
  32091. );
  32092. return c;
  32093. }
  /* Shift a 17 word number right by one bit (r = a >> 1).
   *
   * Each result word is (a[i] >> 1) with bit 0 of a[i+1] moved into bit 31.
   * The top word gets a zero shifted in. r2, r3 and r4 take turns holding the
   * current word, the next word and the word being prefetched.
   * Words a[i] and a[i+1] are always loaded before r[i] is stored; the caller
   * in this file passes r == a.
   *
   * r Result of the shift (17 words).
   * a Number to shift (17 words).
   */
  32094. static void sp_521_rshift1_17(sp_digit* r, const sp_digit* a)
  32095. {
  32096. __asm__ __volatile__ (
  32097. "ldr r2, [%[a]]\n\t"
  32098. "ldr r3, [%[a], #4]\n\t"
         /* Word 0: shift down, then pull in bit 0 of word 1 as the new top bit. */
  32099. "lsr r2, r2, #1\n\t"
  32100. "orr r2, r2, r3, lsl #31\n\t"
  32101. "lsr r3, r3, #1\n\t"
  32102. "ldr r4, [%[a], #8]\n\t"
  32103. "str r2, [%[r], #0]\n\t"
         /* The same four-instruction pattern repeats for words 1..15. */
  32104. "orr r3, r3, r4, lsl #31\n\t"
  32105. "lsr r4, r4, #1\n\t"
  32106. "ldr r2, [%[a], #12]\n\t"
  32107. "str r3, [%[r], #4]\n\t"
  32108. "orr r4, r4, r2, lsl #31\n\t"
  32109. "lsr r2, r2, #1\n\t"
  32110. "ldr r3, [%[a], #16]\n\t"
  32111. "str r4, [%[r], #8]\n\t"
  32112. "orr r2, r2, r3, lsl #31\n\t"
  32113. "lsr r3, r3, #1\n\t"
  32114. "ldr r4, [%[a], #20]\n\t"
  32115. "str r2, [%[r], #12]\n\t"
  32116. "orr r3, r3, r4, lsl #31\n\t"
  32117. "lsr r4, r4, #1\n\t"
  32118. "ldr r2, [%[a], #24]\n\t"
  32119. "str r3, [%[r], #16]\n\t"
  32120. "orr r4, r4, r2, lsl #31\n\t"
  32121. "lsr r2, r2, #1\n\t"
  32122. "ldr r3, [%[a], #28]\n\t"
  32123. "str r4, [%[r], #20]\n\t"
  32124. "orr r2, r2, r3, lsl #31\n\t"
  32125. "lsr r3, r3, #1\n\t"
  32126. "ldr r4, [%[a], #32]\n\t"
  32127. "str r2, [%[r], #24]\n\t"
  32128. "orr r3, r3, r4, lsl #31\n\t"
  32129. "lsr r4, r4, #1\n\t"
  32130. "ldr r2, [%[a], #36]\n\t"
  32131. "str r3, [%[r], #28]\n\t"
  32132. "orr r4, r4, r2, lsl #31\n\t"
  32133. "lsr r2, r2, #1\n\t"
  32134. "ldr r3, [%[a], #40]\n\t"
  32135. "str r4, [%[r], #32]\n\t"
  32136. "orr r2, r2, r3, lsl #31\n\t"
  32137. "lsr r3, r3, #1\n\t"
  32138. "ldr r4, [%[a], #44]\n\t"
  32139. "str r2, [%[r], #36]\n\t"
  32140. "orr r3, r3, r4, lsl #31\n\t"
  32141. "lsr r4, r4, #1\n\t"
  32142. "ldr r2, [%[a], #48]\n\t"
  32143. "str r3, [%[r], #40]\n\t"
  32144. "orr r4, r4, r2, lsl #31\n\t"
  32145. "lsr r2, r2, #1\n\t"
  32146. "ldr r3, [%[a], #52]\n\t"
  32147. "str r4, [%[r], #44]\n\t"
  32148. "orr r2, r2, r3, lsl #31\n\t"
  32149. "lsr r3, r3, #1\n\t"
  32150. "ldr r4, [%[a], #56]\n\t"
  32151. "str r2, [%[r], #48]\n\t"
  32152. "orr r3, r3, r4, lsl #31\n\t"
  32153. "lsr r4, r4, #1\n\t"
  32154. "ldr r2, [%[a], #60]\n\t"
  32155. "str r3, [%[r], #52]\n\t"
  32156. "orr r4, r4, r2, lsl #31\n\t"
  32157. "lsr r2, r2, #1\n\t"
  32158. "ldr r3, [%[a], #64]\n\t"
  32159. "str r4, [%[r], #56]\n\t"
  32160. "orr r2, r2, r3, lsl #31\n\t"
         /* Word 16 is the last one: nothing above it to shift in. */
  32161. "lsr r3, r3, #1\n\t"
  32162. "str r2, [%[r], #60]\n\t"
  32163. "str r3, [%[r], #64]\n\t"
  32164. :
  32165. : [r] "r" (r), [a] "r" (a)
  32166. : "memory", "r2", "r3", "r4"
  32167. );
  32168. }
  32169. /* Divide the number by 2 mod the modulus (prime). (r = a / 2 % m)
  32170. *
  32171. * r Result of division by 2.
  32172. * a Number to divide.
  32173. * m Modulus (prime).
  32174. */
  32175. SP_NOINLINE static void sp_521_div2_17(sp_digit* r, const sp_digit* a, const sp_digit* m)
  32176. {
  32177. sp_digit o;
  32178. o = sp_521_cond_add_17(r, a, m, 0 - (a[0] & 1));
  32179. sp_521_rshift1_17(r, r);
  32180. r[16] |= o << 31;
  32181. }
  32182. /* Double the Montgomery form projective point p.
  32183. *
  32184. * r Result of doubling point.
  32185. * p Point to double.
  32186. * t Temporary ordinate data.
  32187. */
  32188. #ifdef WOLFSSL_SP_NONBLOCK
  32189. typedef struct sp_521_proj_point_dbl_17_ctx {
  32190. int state;
  32191. sp_digit* t1;
  32192. sp_digit* t2;
  32193. sp_digit* x;
  32194. sp_digit* y;
  32195. sp_digit* z;
  32196. } sp_521_proj_point_dbl_17_ctx;
  32197. static int sp_521_proj_point_dbl_17_nb(sp_ecc_ctx_t* sp_ctx, sp_point_521* r, const sp_point_521* p, sp_digit* t)
  32198. {
  32199. int err = FP_WOULDBLOCK;
  32200. sp_521_proj_point_dbl_17_ctx* ctx = (sp_521_proj_point_dbl_17_ctx*)sp_ctx->data;
  32201. typedef char ctx_size_test[sizeof(sp_521_proj_point_dbl_17_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  32202. (void)sizeof(ctx_size_test);
  32203. switch (ctx->state) {
  32204. case 0:
  32205. ctx->t1 = t;
  32206. ctx->t2 = t + 2*17;
  32207. ctx->x = r->x;
  32208. ctx->y = r->y;
  32209. ctx->z = r->z;
  32210. /* Put infinity into result. */
  32211. if (r != p) {
  32212. r->infinity = p->infinity;
  32213. }
  32214. ctx->state = 1;
  32215. break;
  32216. case 1:
  32217. /* T1 = Z * Z */
  32218. sp_521_mont_sqr_17(ctx->t1, p->z, p521_mod, p521_mp_mod);
  32219. ctx->state = 2;
  32220. break;
  32221. case 2:
  32222. /* Z = Y * Z */
  32223. sp_521_mont_mul_17(ctx->z, p->y, p->z, p521_mod, p521_mp_mod);
  32224. ctx->state = 3;
  32225. break;
  32226. case 3:
  32227. /* Z = 2Z */
  32228. sp_521_mont_dbl_17(ctx->z, ctx->z, p521_mod);
  32229. ctx->state = 4;
  32230. break;
  32231. case 4:
  32232. /* T2 = X - T1 */
  32233. sp_521_mont_sub_17(ctx->t2, p->x, ctx->t1, p521_mod);
  32234. ctx->state = 5;
  32235. break;
  32236. case 5:
  32237. /* T1 = X + T1 */
  32238. sp_521_mont_add_17(ctx->t1, p->x, ctx->t1, p521_mod);
  32239. ctx->state = 6;
  32240. break;
  32241. case 6:
  32242. /* T2 = T1 * T2 */
  32243. sp_521_mont_mul_17(ctx->t2, ctx->t1, ctx->t2, p521_mod, p521_mp_mod);
  32244. ctx->state = 7;
  32245. break;
  32246. case 7:
  32247. /* T1 = 3T2 */
  32248. sp_521_mont_tpl_17(ctx->t1, ctx->t2, p521_mod);
  32249. ctx->state = 8;
  32250. break;
  32251. case 8:
  32252. /* Y = 2Y */
  32253. sp_521_mont_dbl_17(ctx->y, p->y, p521_mod);
  32254. ctx->state = 9;
  32255. break;
  32256. case 9:
  32257. /* Y = Y * Y */
  32258. sp_521_mont_sqr_17(ctx->y, ctx->y, p521_mod, p521_mp_mod);
  32259. ctx->state = 10;
  32260. break;
  32261. case 10:
  32262. /* T2 = Y * Y */
  32263. sp_521_mont_sqr_17(ctx->t2, ctx->y, p521_mod, p521_mp_mod);
  32264. ctx->state = 11;
  32265. break;
  32266. case 11:
  32267. /* T2 = T2/2 */
  32268. sp_521_div2_17(ctx->t2, ctx->t2, p521_mod);
  32269. ctx->state = 12;
  32270. break;
  32271. case 12:
  32272. /* Y = Y * X */
  32273. sp_521_mont_mul_17(ctx->y, ctx->y, p->x, p521_mod, p521_mp_mod);
  32274. ctx->state = 13;
  32275. break;
  32276. case 13:
  32277. /* X = T1 * T1 */
  32278. sp_521_mont_sqr_17(ctx->x, ctx->t1, p521_mod, p521_mp_mod);
  32279. ctx->state = 14;
  32280. break;
  32281. case 14:
  32282. /* X = X - Y */
  32283. sp_521_mont_sub_17(ctx->x, ctx->x, ctx->y, p521_mod);
  32284. ctx->state = 15;
  32285. break;
  32286. case 15:
  32287. /* X = X - Y */
  32288. sp_521_mont_sub_17(ctx->x, ctx->x, ctx->y, p521_mod);
  32289. ctx->state = 16;
  32290. break;
  32291. case 16:
  32292. /* Y = Y - X */
  32293. sp_521_mont_sub_lower_17(ctx->y, ctx->y, ctx->x, p521_mod);
  32294. ctx->state = 17;
  32295. break;
  32296. case 17:
  32297. /* Y = Y * T1 */
  32298. sp_521_mont_mul_17(ctx->y, ctx->y, ctx->t1, p521_mod, p521_mp_mod);
  32299. ctx->state = 18;
  32300. break;
  32301. case 18:
  32302. /* Y = Y - T2 */
  32303. sp_521_mont_sub_17(ctx->y, ctx->y, ctx->t2, p521_mod);
  32304. ctx->state = 19;
  32305. /* fall-through */
  32306. case 19:
  32307. err = MP_OKAY;
  32308. break;
  32309. }
  32310. if (err == MP_OKAY && ctx->state != 19) {
  32311. err = FP_WOULDBLOCK;
  32312. }
  32313. return err;
  32314. }
  32315. #endif /* WOLFSSL_SP_NONBLOCK */
  32316. static void sp_521_proj_point_dbl_17(sp_point_521* r, const sp_point_521* p,
  32317. sp_digit* t)
  32318. {
  32319. sp_digit* t1 = t;
  32320. sp_digit* t2 = t + 2*17;
  32321. sp_digit* x;
  32322. sp_digit* y;
  32323. sp_digit* z;
  32324. x = r->x;
  32325. y = r->y;
  32326. z = r->z;
  32327. /* Put infinity into result. */
  32328. if (r != p) {
  32329. r->infinity = p->infinity;
  32330. }
  32331. /* T1 = Z * Z */
  32332. sp_521_mont_sqr_17(t1, p->z, p521_mod, p521_mp_mod);
  32333. /* Z = Y * Z */
  32334. sp_521_mont_mul_17(z, p->y, p->z, p521_mod, p521_mp_mod);
  32335. /* Z = 2Z */
  32336. sp_521_mont_dbl_17(z, z, p521_mod);
  32337. /* T2 = X - T1 */
  32338. sp_521_mont_sub_17(t2, p->x, t1, p521_mod);
  32339. /* T1 = X + T1 */
  32340. sp_521_mont_add_17(t1, p->x, t1, p521_mod);
  32341. /* T2 = T1 * T2 */
  32342. sp_521_mont_mul_17(t2, t1, t2, p521_mod, p521_mp_mod);
  32343. /* T1 = 3T2 */
  32344. sp_521_mont_tpl_17(t1, t2, p521_mod);
  32345. /* Y = 2Y */
  32346. sp_521_mont_dbl_17(y, p->y, p521_mod);
  32347. /* Y = Y * Y */
  32348. sp_521_mont_sqr_17(y, y, p521_mod, p521_mp_mod);
  32349. /* T2 = Y * Y */
  32350. sp_521_mont_sqr_17(t2, y, p521_mod, p521_mp_mod);
  32351. /* T2 = T2/2 */
  32352. sp_521_div2_17(t2, t2, p521_mod);
  32353. /* Y = Y * X */
  32354. sp_521_mont_mul_17(y, y, p->x, p521_mod, p521_mp_mod);
  32355. /* X = T1 * T1 */
  32356. sp_521_mont_sqr_17(x, t1, p521_mod, p521_mp_mod);
  32357. /* X = X - Y */
  32358. sp_521_mont_sub_17(x, x, y, p521_mod);
  32359. /* X = X - Y */
  32360. sp_521_mont_sub_17(x, x, y, p521_mod);
  32361. /* Y = Y - X */
  32362. sp_521_mont_sub_lower_17(y, y, x, p521_mod);
  32363. /* Y = Y * T1 */
  32364. sp_521_mont_mul_17(y, y, t1, p521_mod, p521_mp_mod);
  32365. /* Y = Y - T2 */
  32366. sp_521_mont_sub_17(y, y, t2, p521_mod);
  32367. }
  32368. /* Compare two numbers to determine if they are equal.
  32369. * Constant time implementation.
  32370. *
  32371. * a First number to compare.
  32372. * b Second number to compare.
  32373. * returns 1 when equal and 0 otherwise.
  32374. */
  32375. static int sp_521_cmp_equal_17(const sp_digit* a, const sp_digit* b)
  32376. {
  32377. return ((a[0] ^ b[0]) | (a[1] ^ b[1]) | (a[2] ^ b[2]) |
  32378. (a[3] ^ b[3]) | (a[4] ^ b[4]) | (a[5] ^ b[5]) |
  32379. (a[6] ^ b[6]) | (a[7] ^ b[7]) | (a[8] ^ b[8]) |
  32380. (a[9] ^ b[9]) | (a[10] ^ b[10]) | (a[11] ^ b[11]) |
  32381. (a[12] ^ b[12]) | (a[13] ^ b[13]) | (a[14] ^ b[14]) |
  32382. (a[15] ^ b[15]) | (a[16] ^ b[16])) == 0;
  32383. }
  32384. /* Returns 1 if the number of zero.
  32385. * Implementation is constant time.
  32386. *
  32387. * a Number to check.
  32388. * returns 1 if the number is zero and 0 otherwise.
  32389. */
  32390. static int sp_521_iszero_17(const sp_digit* a)
  32391. {
  32392. return (a[0] | a[1] | a[2] | a[3] | a[4] | a[5] | a[6] | a[7] |
  32393. a[8] | a[9] | a[10] | a[11] | a[12] | a[13] | a[14] | a[15] |
  32394. a[16]) == 0;
  32395. }
  32396. /* Add two Montgomery form projective points.
  32397. *
  32398. * r Result of addition.
  32399. * p First point to add.
  32400. * q Second point to add.
  32401. * t Temporary ordinate data.
  32402. */
  32403. #ifdef WOLFSSL_SP_NONBLOCK
  32404. typedef struct sp_521_proj_point_add_17_ctx {
  32405. int state;
  32406. sp_521_proj_point_dbl_17_ctx dbl_ctx;
  32407. const sp_point_521* ap[2];
  32408. sp_point_521* rp[2];
  32409. sp_digit* t1;
  32410. sp_digit* t2;
  32411. sp_digit* t3;
  32412. sp_digit* t4;
  32413. sp_digit* t5;
  32414. sp_digit* t6;
  32415. sp_digit* x;
  32416. sp_digit* y;
  32417. sp_digit* z;
  32418. } sp_521_proj_point_add_17_ctx;
  32419. static int sp_521_proj_point_add_17_nb(sp_ecc_ctx_t* sp_ctx, sp_point_521* r,
  32420. const sp_point_521* p, const sp_point_521* q, sp_digit* t)
  32421. {
  32422. int err = FP_WOULDBLOCK;
  32423. sp_521_proj_point_add_17_ctx* ctx = (sp_521_proj_point_add_17_ctx*)sp_ctx->data;
  32424. /* Ensure only the first point is the same as the result. */
  32425. if (q == r) {
  32426. const sp_point_521* a = p;
  32427. p = q;
  32428. q = a;
  32429. }
  32430. typedef char ctx_size_test[sizeof(sp_521_proj_point_add_17_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  32431. (void)sizeof(ctx_size_test);
  32432. switch (ctx->state) {
  32433. case 0: /* INIT */
  32434. ctx->t1 = t;
  32435. ctx->t2 = t + 2*17;
  32436. ctx->t3 = t + 4*17;
  32437. ctx->t4 = t + 6*17;
  32438. ctx->t5 = t + 8*17;
  32439. ctx->t6 = t + 10*17;
  32440. ctx->x = ctx->t6;
  32441. ctx->y = ctx->t1;
  32442. ctx->z = ctx->t2;
  32443. ctx->state = 1;
  32444. break;
  32445. case 1:
  32446. /* Check double */
  32447. (void)sp_521_sub_17(ctx->t1, p521_mod, q->y);
  32448. sp_521_norm_17(ctx->t1);
  32449. if ((~p->infinity & ~q->infinity &
  32450. sp_521_cmp_equal_17(p->x, q->x) & sp_521_cmp_equal_17(p->z, q->z) &
  32451. (sp_521_cmp_equal_17(p->y, q->y) | sp_521_cmp_equal_17(p->y, ctx->t1))) != 0)
  32452. {
  32453. XMEMSET(&ctx->dbl_ctx, 0, sizeof(ctx->dbl_ctx));
  32454. ctx->state = 2;
  32455. }
  32456. else {
  32457. ctx->state = 3;
  32458. }
  32459. break;
  32460. case 2:
  32461. err = sp_521_proj_point_dbl_17_nb((sp_ecc_ctx_t*)&ctx->dbl_ctx, r, p, t);
  32462. if (err == MP_OKAY)
  32463. ctx->state = 27; /* done */
  32464. break;
  32465. case 3:
  32466. {
  32467. ctx->state = 4;
  32468. break;
  32469. }
  32470. case 4:
  32471. /* U1 = X1*Z2^2 */
  32472. sp_521_mont_sqr_17(ctx->t1, q->z, p521_mod, p521_mp_mod);
  32473. ctx->state = 5;
  32474. break;
  32475. case 5:
  32476. sp_521_mont_mul_17(ctx->t3, ctx->t1, q->z, p521_mod, p521_mp_mod);
  32477. ctx->state = 6;
  32478. break;
  32479. case 6:
  32480. sp_521_mont_mul_17(ctx->t1, ctx->t1, p->x, p521_mod, p521_mp_mod);
  32481. ctx->state = 7;
  32482. break;
  32483. case 7:
  32484. /* U2 = X2*Z1^2 */
  32485. sp_521_mont_sqr_17(ctx->t2, p->z, p521_mod, p521_mp_mod);
  32486. ctx->state = 8;
  32487. break;
  32488. case 8:
  32489. sp_521_mont_mul_17(ctx->t4, ctx->t2, p->z, p521_mod, p521_mp_mod);
  32490. ctx->state = 9;
  32491. break;
  32492. case 9:
  32493. sp_521_mont_mul_17(ctx->t2, ctx->t2, q->x, p521_mod, p521_mp_mod);
  32494. ctx->state = 10;
  32495. break;
  32496. case 10:
  32497. /* S1 = Y1*Z2^3 */
  32498. sp_521_mont_mul_17(ctx->t3, ctx->t3, p->y, p521_mod, p521_mp_mod);
  32499. ctx->state = 11;
  32500. break;
  32501. case 11:
  32502. /* S2 = Y2*Z1^3 */
  32503. sp_521_mont_mul_17(ctx->t4, ctx->t4, q->y, p521_mod, p521_mp_mod);
  32504. ctx->state = 12;
  32505. break;
  32506. case 12:
  32507. /* H = U2 - U1 */
  32508. sp_521_mont_sub_17(ctx->t2, ctx->t2, ctx->t1, p521_mod);
  32509. ctx->state = 13;
  32510. break;
  32511. case 13:
  32512. /* R = S2 - S1 */
  32513. sp_521_mont_sub_17(ctx->t4, ctx->t4, ctx->t3, p521_mod);
  32514. ctx->state = 14;
  32515. break;
  32516. case 14:
  32517. /* X3 = R^2 - H^3 - 2*U1*H^2 */
  32518. sp_521_mont_sqr_17(ctx->t5, ctx->t2, p521_mod, p521_mp_mod);
  32519. ctx->state = 15;
  32520. break;
  32521. case 15:
  32522. sp_521_mont_mul_17(ctx->y, ctx->t1, ctx->t5, p521_mod, p521_mp_mod);
  32523. ctx->state = 16;
  32524. break;
  32525. case 16:
  32526. sp_521_mont_mul_17(ctx->t5, ctx->t5, ctx->t2, p521_mod, p521_mp_mod);
  32527. ctx->state = 17;
  32528. break;
  32529. case 17:
  32530. /* Z3 = H*Z1*Z2 */
  32531. sp_521_mont_mul_17(ctx->z, p->z, ctx->t2, p521_mod, p521_mp_mod);
  32532. ctx->state = 18;
  32533. break;
  32534. case 18:
  32535. sp_521_mont_mul_17(ctx->z, ctx->z, q->z, p521_mod, p521_mp_mod);
  32536. ctx->state = 19;
  32537. break;
  32538. case 19:
  32539. sp_521_mont_sqr_17(ctx->x, ctx->t4, p521_mod, p521_mp_mod);
  32540. ctx->state = 20;
  32541. break;
  32542. case 20:
  32543. sp_521_mont_sub_17(ctx->x, ctx->x, ctx->t5, p521_mod);
  32544. ctx->state = 21;
  32545. break;
  32546. case 21:
  32547. sp_521_mont_mul_17(ctx->t5, ctx->t5, ctx->t3, p521_mod, p521_mp_mod);
  32548. ctx->state = 22;
  32549. break;
  32550. case 22:
  32551. sp_521_mont_dbl_17(ctx->t3, ctx->y, p521_mod);
  32552. ctx->state = 23;
  32553. break;
  32554. case 23:
  32555. sp_521_mont_sub_17(ctx->x, ctx->x, ctx->t3, p521_mod);
  32556. ctx->state = 24;
  32557. break;
  32558. case 24:
  32559. /* Y3 = R*(U1*H^2 - X3) - S1*H^3 */
  32560. sp_521_mont_sub_lower_17(ctx->y, ctx->y, ctx->x, p521_mod);
  32561. ctx->state = 25;
  32562. break;
  32563. case 25:
  32564. sp_521_mont_mul_17(ctx->y, ctx->y, ctx->t4, p521_mod, p521_mp_mod);
  32565. ctx->state = 26;
  32566. break;
  32567. case 26:
  32568. sp_521_mont_sub_17(ctx->y, ctx->y, ctx->t5, p521_mod);
  32569. ctx->state = 27;
  32570. /* fall-through */
  32571. case 27:
  32572. {
  32573. int i;
  32574. sp_digit maskp = 0 - (q->infinity & (!p->infinity));
  32575. sp_digit maskq = 0 - (p->infinity & (!q->infinity));
  32576. sp_digit maskt = ~(maskp | maskq);
  32577. for (i = 0; i < 17; i++) {
  32578. r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) |
  32579. (ctx->x[i] & maskt);
  32580. }
  32581. for (i = 0; i < 17; i++) {
  32582. r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) |
  32583. (ctx->y[i] & maskt);
  32584. }
  32585. for (i = 0; i < 17; i++) {
  32586. r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) |
  32587. (ctx->z[i] & maskt);
  32588. }
  32589. r->z[0] |= p->infinity & q->infinity;
  32590. r->infinity = p->infinity & q->infinity;
  32591. err = MP_OKAY;
  32592. break;
  32593. }
  32594. }
  32595. if (err == MP_OKAY && ctx->state != 27) {
  32596. err = FP_WOULDBLOCK;
  32597. }
  32598. return err;
  32599. }
  32600. #endif /* WOLFSSL_SP_NONBLOCK */
  32601. static void sp_521_proj_point_add_17(sp_point_521* r,
  32602. const sp_point_521* p, const sp_point_521* q, sp_digit* t)
  32603. {
  32604. sp_digit* t1 = t;
  32605. sp_digit* t2 = t + 2*17;
  32606. sp_digit* t3 = t + 4*17;
  32607. sp_digit* t4 = t + 6*17;
  32608. sp_digit* t5 = t + 8*17;
  32609. sp_digit* t6 = t + 10*17;
  32610. /* Check double */
  32611. (void)sp_521_sub_17(t1, p521_mod, q->y);
  32612. sp_521_norm_17(t1);
  32613. if ((~p->infinity & ~q->infinity &
  32614. sp_521_cmp_equal_17(p->x, q->x) & sp_521_cmp_equal_17(p->z, q->z) &
  32615. (sp_521_cmp_equal_17(p->y, q->y) | sp_521_cmp_equal_17(p->y, t1))) != 0) {
  32616. sp_521_proj_point_dbl_17(r, p, t);
  32617. }
  32618. else {
  32619. sp_digit maskp;
  32620. sp_digit maskq;
  32621. sp_digit maskt;
  32622. sp_digit* x = t6;
  32623. sp_digit* y = t1;
  32624. sp_digit* z = t2;
  32625. int i;
  32626. maskp = 0 - (q->infinity & (!p->infinity));
  32627. maskq = 0 - (p->infinity & (!q->infinity));
  32628. maskt = ~(maskp | maskq);
  32629. /* U1 = X1*Z2^2 */
  32630. sp_521_mont_sqr_17(t1, q->z, p521_mod, p521_mp_mod);
  32631. sp_521_mont_mul_17(t3, t1, q->z, p521_mod, p521_mp_mod);
  32632. sp_521_mont_mul_17(t1, t1, p->x, p521_mod, p521_mp_mod);
  32633. /* U2 = X2*Z1^2 */
  32634. sp_521_mont_sqr_17(t2, p->z, p521_mod, p521_mp_mod);
  32635. sp_521_mont_mul_17(t4, t2, p->z, p521_mod, p521_mp_mod);
  32636. sp_521_mont_mul_17(t2, t2, q->x, p521_mod, p521_mp_mod);
  32637. /* S1 = Y1*Z2^3 */
  32638. sp_521_mont_mul_17(t3, t3, p->y, p521_mod, p521_mp_mod);
  32639. /* S2 = Y2*Z1^3 */
  32640. sp_521_mont_mul_17(t4, t4, q->y, p521_mod, p521_mp_mod);
  32641. /* H = U2 - U1 */
  32642. sp_521_mont_sub_17(t2, t2, t1, p521_mod);
  32643. /* R = S2 - S1 */
  32644. sp_521_mont_sub_17(t4, t4, t3, p521_mod);
  32645. if (~p->infinity & ~q->infinity &
  32646. sp_521_iszero_17(t2) & sp_521_iszero_17(t4) & maskt) {
  32647. sp_521_proj_point_dbl_17(r, p, t);
  32648. }
  32649. else {
  32650. /* X3 = R^2 - H^3 - 2*U1*H^2 */
  32651. sp_521_mont_sqr_17(t5, t2, p521_mod, p521_mp_mod);
  32652. sp_521_mont_mul_17(y, t1, t5, p521_mod, p521_mp_mod);
  32653. sp_521_mont_mul_17(t5, t5, t2, p521_mod, p521_mp_mod);
  32654. /* Z3 = H*Z1*Z2 */
  32655. sp_521_mont_mul_17(z, p->z, t2, p521_mod, p521_mp_mod);
  32656. sp_521_mont_mul_17(z, z, q->z, p521_mod, p521_mp_mod);
  32657. sp_521_mont_sqr_17(x, t4, p521_mod, p521_mp_mod);
  32658. sp_521_mont_sub_17(x, x, t5, p521_mod);
  32659. sp_521_mont_mul_17(t5, t5, t3, p521_mod, p521_mp_mod);
  32660. sp_521_mont_dbl_17(t3, y, p521_mod);
  32661. sp_521_mont_sub_17(x, x, t3, p521_mod);
  32662. /* Y3 = R*(U1*H^2 - X3) - S1*H^3 */
  32663. sp_521_mont_sub_lower_17(y, y, x, p521_mod);
  32664. sp_521_mont_mul_17(y, y, t4, p521_mod, p521_mp_mod);
  32665. sp_521_mont_sub_17(y, y, t5, p521_mod);
  32666. for (i = 0; i < 17; i++) {
  32667. r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) |
  32668. (x[i] & maskt);
  32669. }
  32670. for (i = 0; i < 17; i++) {
  32671. r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) |
  32672. (y[i] & maskt);
  32673. }
  32674. for (i = 0; i < 17; i++) {
  32675. r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) |
  32676. (z[i] & maskt);
  32677. }
  32678. r->z[0] |= p->infinity & q->infinity;
  32679. r->infinity = p->infinity & q->infinity;
  32680. }
  32681. }
  32682. }
  32683. #ifndef WC_NO_CACHE_RESISTANT
  32684. /* Touch each possible point that could be being copied.
  32685. *
  32686. * r Point to copy into.
  32687. * table Table - start of the entires to access
  32688. * idx Index of entry to retrieve.
  32689. */
  32690. static void sp_521_get_point_16_17(sp_point_521* r, const sp_point_521* table,
  32691. int idx)
  32692. {
  32693. int i;
  32694. sp_digit mask;
  32695. r->x[0] = 0;
  32696. r->x[1] = 0;
  32697. r->x[2] = 0;
  32698. r->x[3] = 0;
  32699. r->x[4] = 0;
  32700. r->x[5] = 0;
  32701. r->x[6] = 0;
  32702. r->x[7] = 0;
  32703. r->x[8] = 0;
  32704. r->x[9] = 0;
  32705. r->x[10] = 0;
  32706. r->x[11] = 0;
  32707. r->x[12] = 0;
  32708. r->x[13] = 0;
  32709. r->x[14] = 0;
  32710. r->x[15] = 0;
  32711. r->x[16] = 0;
  32712. r->y[0] = 0;
  32713. r->y[1] = 0;
  32714. r->y[2] = 0;
  32715. r->y[3] = 0;
  32716. r->y[4] = 0;
  32717. r->y[5] = 0;
  32718. r->y[6] = 0;
  32719. r->y[7] = 0;
  32720. r->y[8] = 0;
  32721. r->y[9] = 0;
  32722. r->y[10] = 0;
  32723. r->y[11] = 0;
  32724. r->y[12] = 0;
  32725. r->y[13] = 0;
  32726. r->y[14] = 0;
  32727. r->y[15] = 0;
  32728. r->y[16] = 0;
  32729. r->z[0] = 0;
  32730. r->z[1] = 0;
  32731. r->z[2] = 0;
  32732. r->z[3] = 0;
  32733. r->z[4] = 0;
  32734. r->z[5] = 0;
  32735. r->z[6] = 0;
  32736. r->z[7] = 0;
  32737. r->z[8] = 0;
  32738. r->z[9] = 0;
  32739. r->z[10] = 0;
  32740. r->z[11] = 0;
  32741. r->z[12] = 0;
  32742. r->z[13] = 0;
  32743. r->z[14] = 0;
  32744. r->z[15] = 0;
  32745. r->z[16] = 0;
  32746. for (i = 1; i < 16; i++) {
  32747. mask = 0 - (i == idx);
  32748. r->x[0] |= mask & table[i].x[0];
  32749. r->x[1] |= mask & table[i].x[1];
  32750. r->x[2] |= mask & table[i].x[2];
  32751. r->x[3] |= mask & table[i].x[3];
  32752. r->x[4] |= mask & table[i].x[4];
  32753. r->x[5] |= mask & table[i].x[5];
  32754. r->x[6] |= mask & table[i].x[6];
  32755. r->x[7] |= mask & table[i].x[7];
  32756. r->x[8] |= mask & table[i].x[8];
  32757. r->x[9] |= mask & table[i].x[9];
  32758. r->x[10] |= mask & table[i].x[10];
  32759. r->x[11] |= mask & table[i].x[11];
  32760. r->x[12] |= mask & table[i].x[12];
  32761. r->x[13] |= mask & table[i].x[13];
  32762. r->x[14] |= mask & table[i].x[14];
  32763. r->x[15] |= mask & table[i].x[15];
  32764. r->x[16] |= mask & table[i].x[16];
  32765. r->y[0] |= mask & table[i].y[0];
  32766. r->y[1] |= mask & table[i].y[1];
  32767. r->y[2] |= mask & table[i].y[2];
  32768. r->y[3] |= mask & table[i].y[3];
  32769. r->y[4] |= mask & table[i].y[4];
  32770. r->y[5] |= mask & table[i].y[5];
  32771. r->y[6] |= mask & table[i].y[6];
  32772. r->y[7] |= mask & table[i].y[7];
  32773. r->y[8] |= mask & table[i].y[8];
  32774. r->y[9] |= mask & table[i].y[9];
  32775. r->y[10] |= mask & table[i].y[10];
  32776. r->y[11] |= mask & table[i].y[11];
  32777. r->y[12] |= mask & table[i].y[12];
  32778. r->y[13] |= mask & table[i].y[13];
  32779. r->y[14] |= mask & table[i].y[14];
  32780. r->y[15] |= mask & table[i].y[15];
  32781. r->y[16] |= mask & table[i].y[16];
  32782. r->z[0] |= mask & table[i].z[0];
  32783. r->z[1] |= mask & table[i].z[1];
  32784. r->z[2] |= mask & table[i].z[2];
  32785. r->z[3] |= mask & table[i].z[3];
  32786. r->z[4] |= mask & table[i].z[4];
  32787. r->z[5] |= mask & table[i].z[5];
  32788. r->z[6] |= mask & table[i].z[6];
  32789. r->z[7] |= mask & table[i].z[7];
  32790. r->z[8] |= mask & table[i].z[8];
  32791. r->z[9] |= mask & table[i].z[9];
  32792. r->z[10] |= mask & table[i].z[10];
  32793. r->z[11] |= mask & table[i].z[11];
  32794. r->z[12] |= mask & table[i].z[12];
  32795. r->z[13] |= mask & table[i].z[13];
  32796. r->z[14] |= mask & table[i].z[14];
  32797. r->z[15] |= mask & table[i].z[15];
  32798. r->z[16] |= mask & table[i].z[16];
  32799. }
  32800. }
  32801. #endif /* !WC_NO_CACHE_RESISTANT */
  32802. /* Multiply the point by the scalar and return the result.
  32803. * If map is true then convert result to affine coordinates.
  32804. *
  32805. * Fast implementation that generates a pre-computation table.
  32806. * 4 bits of window (no sliding!).
  32807. * Uses add and double for calculating table.
  32808. * 521 doubles.
  32809. * 143 adds.
  32810. *
  32811. * r Resulting point.
  32812. * g Point to multiply.
  32813. * k Scalar to multiply by.
  32814. * map Indicates whether to convert result to affine.
  32815. * ct Constant time required.
  32816. * heap Heap to use for allocation.
  32817. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  32818. */
  32819. static int sp_521_ecc_mulmod_fast_17(sp_point_521* r, const sp_point_521* g, const sp_digit* k,
  32820. int map, int ct, void* heap)
  32821. {
  32822. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  32823. sp_point_521* t = NULL;
  32824. sp_digit* tmp = NULL;
  32825. #else
  32826. sp_point_521 t[16 + 1];
  32827. sp_digit tmp[2 * 17 * 6];
  32828. #endif
  32829. sp_point_521* rt = NULL;
  32830. #ifndef WC_NO_CACHE_RESISTANT
  32831. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  32832. sp_point_521* p = NULL;
  32833. #else
  32834. sp_point_521 p[1];
  32835. #endif
  32836. #endif /* !WC_NO_CACHE_RESISTANT */
  32837. sp_digit n;
  32838. int i;
  32839. int c;
  32840. int y;
  32841. int err = MP_OKAY;
  32842. /* Constant time used for cache attack resistance implementation. */
  32843. (void)ct;
  32844. (void)heap;
  32845. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  32846. t = (sp_point_521*)XMALLOC(sizeof(sp_point_521) * (16 + 1),
  32847. heap, DYNAMIC_TYPE_ECC);
  32848. if (t == NULL)
  32849. err = MEMORY_E;
  32850. #ifndef WC_NO_CACHE_RESISTANT
  32851. if (err == MP_OKAY) {
  32852. p = (sp_point_521*)XMALLOC(sizeof(sp_point_521),
  32853. heap, DYNAMIC_TYPE_ECC);
  32854. if (p == NULL)
  32855. err = MEMORY_E;
  32856. }
  32857. #endif
  32858. if (err == MP_OKAY) {
  32859. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 17 * 6, heap,
  32860. DYNAMIC_TYPE_ECC);
  32861. if (tmp == NULL)
  32862. err = MEMORY_E;
  32863. }
  32864. #endif
  32865. if (err == MP_OKAY) {
  32866. rt = t + 16;
  32867. /* t[0] = {0, 0, 1} * norm */
  32868. XMEMSET(&t[0], 0, sizeof(t[0]));
  32869. t[0].infinity = 1;
  32870. /* t[1] = {g->x, g->y, g->z} * norm */
  32871. (void)sp_521_mod_mul_norm_17(t[1].x, g->x, p521_mod);
  32872. (void)sp_521_mod_mul_norm_17(t[1].y, g->y, p521_mod);
  32873. (void)sp_521_mod_mul_norm_17(t[1].z, g->z, p521_mod);
  32874. t[1].infinity = 0;
  32875. sp_521_proj_point_dbl_17(&t[ 2], &t[ 1], tmp);
  32876. t[ 2].infinity = 0;
  32877. sp_521_proj_point_add_17(&t[ 3], &t[ 2], &t[ 1], tmp);
  32878. t[ 3].infinity = 0;
  32879. sp_521_proj_point_dbl_17(&t[ 4], &t[ 2], tmp);
  32880. t[ 4].infinity = 0;
  32881. sp_521_proj_point_add_17(&t[ 5], &t[ 3], &t[ 2], tmp);
  32882. t[ 5].infinity = 0;
  32883. sp_521_proj_point_dbl_17(&t[ 6], &t[ 3], tmp);
  32884. t[ 6].infinity = 0;
  32885. sp_521_proj_point_add_17(&t[ 7], &t[ 4], &t[ 3], tmp);
  32886. t[ 7].infinity = 0;
  32887. sp_521_proj_point_dbl_17(&t[ 8], &t[ 4], tmp);
  32888. t[ 8].infinity = 0;
  32889. sp_521_proj_point_add_17(&t[ 9], &t[ 5], &t[ 4], tmp);
  32890. t[ 9].infinity = 0;
  32891. sp_521_proj_point_dbl_17(&t[10], &t[ 5], tmp);
  32892. t[10].infinity = 0;
  32893. sp_521_proj_point_add_17(&t[11], &t[ 6], &t[ 5], tmp);
  32894. t[11].infinity = 0;
  32895. sp_521_proj_point_dbl_17(&t[12], &t[ 6], tmp);
  32896. t[12].infinity = 0;
  32897. sp_521_proj_point_add_17(&t[13], &t[ 7], &t[ 6], tmp);
  32898. t[13].infinity = 0;
  32899. sp_521_proj_point_dbl_17(&t[14], &t[ 7], tmp);
  32900. t[14].infinity = 0;
  32901. sp_521_proj_point_add_17(&t[15], &t[ 8], &t[ 7], tmp);
  32902. t[15].infinity = 0;
  32903. i = 15;
  32904. n = k[i+1] << 0;
  32905. c = 5;
  32906. y = (int)(n >> 5);
  32907. #ifndef WC_NO_CACHE_RESISTANT
  32908. if (ct) {
  32909. sp_521_get_point_16_17(rt, t, y);
  32910. rt->infinity = !y;
  32911. }
  32912. else
  32913. #endif
  32914. {
  32915. XMEMCPY(rt, &t[y], sizeof(sp_point_521));
  32916. }
  32917. n <<= 27;
  32918. for (; i>=0 || c>=4; ) {
  32919. if (c < 4) {
  32920. n = (k[i+1] << 31) | (k[i] >> 1);
  32921. i--;
  32922. c += 32;
  32923. }
  32924. y = (n >> 28) & 0xf;
  32925. n <<= 4;
  32926. c -= 4;
  32927. sp_521_proj_point_dbl_17(rt, rt, tmp);
  32928. sp_521_proj_point_dbl_17(rt, rt, tmp);
  32929. sp_521_proj_point_dbl_17(rt, rt, tmp);
  32930. sp_521_proj_point_dbl_17(rt, rt, tmp);
  32931. #ifndef WC_NO_CACHE_RESISTANT
  32932. if (ct) {
  32933. sp_521_get_point_16_17(p, t, y);
  32934. p->infinity = !y;
  32935. sp_521_proj_point_add_17(rt, rt, p, tmp);
  32936. }
  32937. else
  32938. #endif
  32939. {
  32940. sp_521_proj_point_add_17(rt, rt, &t[y], tmp);
  32941. }
  32942. }
  32943. y = k[0] & 0x1;
  32944. sp_521_proj_point_dbl_17(rt, rt, tmp);
  32945. sp_521_proj_point_add_17(rt, rt, &t[y], tmp);
  32946. if (map != 0) {
  32947. sp_521_map_17(r, rt, tmp);
  32948. }
  32949. else {
  32950. XMEMCPY(r, rt, sizeof(sp_point_521));
  32951. }
  32952. }
  32953. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  32954. if (tmp != NULL)
  32955. #endif
  32956. {
  32957. ForceZero(tmp, sizeof(sp_digit) * 2 * 17 * 6);
  32958. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  32959. XFREE(tmp, heap, DYNAMIC_TYPE_ECC);
  32960. #endif
  32961. }
  32962. #ifndef WC_NO_CACHE_RESISTANT
  32963. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  32964. if (p != NULL)
  32965. #endif
  32966. {
  32967. ForceZero(p, sizeof(sp_point_521));
  32968. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  32969. XFREE(p, heap, DYNAMIC_TYPE_ECC);
  32970. #endif
  32971. }
  32972. #endif /* !WC_NO_CACHE_RESISTANT */
  32973. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  32974. if (t != NULL)
  32975. #endif
  32976. {
  32977. ForceZero(t, sizeof(sp_point_521) * 17);
  32978. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  32979. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  32980. #endif
  32981. }
  32982. return err;
  32983. }
  32984. #ifdef FP_ECC
  32985. #define sp_521_mont_dbl_lower_17 sp_521_mont_dbl_17
  32986. #define sp_521_mont_tpl_lower_17 sp_521_mont_tpl_17
  32987. /* Double the Montgomery form projective point p a number of times.
  32988. *
  32989. * r Result of repeated doubling of point.
  32990. * p Point to double.
  32991. * n Number of times to double
  32992. * t Temporary ordinate data.
  32993. */
  32994. static void sp_521_proj_point_dbl_n_17(sp_point_521* p, int i,
  32995. sp_digit* t)
  32996. {
  32997. sp_digit* w = t;
  32998. sp_digit* a = t + 2*17;
  32999. sp_digit* b = t + 4*17;
  33000. sp_digit* t1 = t + 6*17;
  33001. sp_digit* t2 = t + 8*17;
  33002. sp_digit* x;
  33003. sp_digit* y;
  33004. sp_digit* z;
  33005. volatile int n = i;
  33006. x = p->x;
  33007. y = p->y;
  33008. z = p->z;
  33009. /* Y = 2*Y */
  33010. sp_521_mont_dbl_17(y, y, p521_mod);
  33011. /* W = Z^4 */
  33012. sp_521_mont_sqr_17(w, z, p521_mod, p521_mp_mod);
  33013. sp_521_mont_sqr_17(w, w, p521_mod, p521_mp_mod);
  33014. #ifndef WOLFSSL_SP_SMALL
  33015. while (--n > 0)
  33016. #else
  33017. while (--n >= 0)
  33018. #endif
  33019. {
  33020. /* A = 3*(X^2 - W) */
  33021. sp_521_mont_sqr_17(t1, x, p521_mod, p521_mp_mod);
  33022. sp_521_mont_sub_17(t1, t1, w, p521_mod);
  33023. sp_521_mont_tpl_lower_17(a, t1, p521_mod);
  33024. /* B = X*Y^2 */
  33025. sp_521_mont_sqr_17(t1, y, p521_mod, p521_mp_mod);
  33026. sp_521_mont_mul_17(b, t1, x, p521_mod, p521_mp_mod);
  33027. /* X = A^2 - 2B */
  33028. sp_521_mont_sqr_17(x, a, p521_mod, p521_mp_mod);
  33029. sp_521_mont_dbl_17(t2, b, p521_mod);
  33030. sp_521_mont_sub_17(x, x, t2, p521_mod);
  33031. /* b = 2.(B - X) */
  33032. sp_521_mont_sub_lower_17(t2, b, x, p521_mod);
  33033. sp_521_mont_dbl_lower_17(b, t2, p521_mod);
  33034. /* Z = Z*Y */
  33035. sp_521_mont_mul_17(z, z, y, p521_mod, p521_mp_mod);
  33036. /* t1 = Y^4 */
  33037. sp_521_mont_sqr_17(t1, t1, p521_mod, p521_mp_mod);
  33038. #ifdef WOLFSSL_SP_SMALL
  33039. if (n != 0)
  33040. #endif
  33041. {
  33042. /* W = W*Y^4 */
  33043. sp_521_mont_mul_17(w, w, t1, p521_mod, p521_mp_mod);
  33044. }
  33045. /* y = 2*A*(B - X) - Y^4 */
  33046. sp_521_mont_mul_17(y, b, a, p521_mod, p521_mp_mod);
  33047. sp_521_mont_sub_17(y, y, t1, p521_mod);
  33048. }
  33049. #ifndef WOLFSSL_SP_SMALL
  33050. /* A = 3*(X^2 - W) */
  33051. sp_521_mont_sqr_17(t1, x, p521_mod, p521_mp_mod);
  33052. sp_521_mont_sub_17(t1, t1, w, p521_mod);
  33053. sp_521_mont_tpl_lower_17(a, t1, p521_mod);
  33054. /* B = X*Y^2 */
  33055. sp_521_mont_sqr_17(t1, y, p521_mod, p521_mp_mod);
  33056. sp_521_mont_mul_17(b, t1, x, p521_mod, p521_mp_mod);
  33057. /* X = A^2 - 2B */
  33058. sp_521_mont_sqr_17(x, a, p521_mod, p521_mp_mod);
  33059. sp_521_mont_dbl_17(t2, b, p521_mod);
  33060. sp_521_mont_sub_17(x, x, t2, p521_mod);
  33061. /* b = 2.(B - X) */
  33062. sp_521_mont_sub_lower_17(t2, b, x, p521_mod);
  33063. sp_521_mont_dbl_lower_17(b, t2, p521_mod);
  33064. /* Z = Z*Y */
  33065. sp_521_mont_mul_17(z, z, y, p521_mod, p521_mp_mod);
  33066. /* t1 = Y^4 */
  33067. sp_521_mont_sqr_17(t1, t1, p521_mod, p521_mp_mod);
  33068. /* y = 2*A*(B - X) - Y^4 */
  33069. sp_521_mont_mul_17(y, b, a, p521_mod, p521_mp_mod);
  33070. sp_521_mont_sub_17(y, y, t1, p521_mod);
  33071. #endif
  33072. /* Y = Y/2 */
  33073. sp_521_div2_17(y, y, p521_mod);
  33074. }
  33075. /* Convert the projective point to affine.
  33076. * Ordinates are in Montgomery form.
  33077. *
  33078. * a Point to convert.
  33079. * t Temporary data.
  33080. */
  33081. static void sp_521_proj_to_affine_17(sp_point_521* a, sp_digit* t)
  33082. {
  33083. sp_digit* t1 = t;
  33084. sp_digit* t2 = t + 2 * 17;
  33085. sp_digit* tmp = t + 4 * 17;
  33086. sp_521_mont_inv_17(t1, a->z, tmp);
  33087. sp_521_mont_sqr_17(t2, t1, p521_mod, p521_mp_mod);
  33088. sp_521_mont_mul_17(t1, t2, t1, p521_mod, p521_mp_mod);
  33089. sp_521_mont_mul_17(a->x, a->x, t2, p521_mod, p521_mp_mod);
  33090. sp_521_mont_mul_17(a->y, a->y, t1, p521_mod, p521_mp_mod);
  33091. XMEMCPY(a->z, p521_norm_mod, sizeof(p521_norm_mod));
  33092. }
  33093. #endif /* FP_ECC */
  33094. /* A table entry for pre-computed points. */
  33095. typedef struct sp_table_entry_521 {
  33096. sp_digit x[17];
  33097. sp_digit y[17];
  33098. } sp_table_entry_521;
  33099. #ifdef FP_ECC
  33100. #endif /* FP_ECC */
  33101. /* Add two Montgomery form projective points. The second point has a q value of
  33102. * one.
  33103. * Only the first point can be the same pointer as the result point.
  33104. *
  33105. * r Result of addition.
  33106. * p First point to add.
  33107. * q Second point to add.
  33108. * t Temporary ordinate data.
  33109. */
  33110. static void sp_521_proj_point_add_qz1_17(sp_point_521* r, const sp_point_521* p,
  33111. const sp_point_521* q, sp_digit* t)
  33112. {
  33113. sp_digit* t1 = t;
  33114. sp_digit* t2 = t + 2*17;
  33115. sp_digit* t3 = t + 4*17;
  33116. sp_digit* t4 = t + 6*17;
  33117. sp_digit* t5 = t + 8*17;
  33118. sp_digit* t6 = t + 10*17;
  33119. /* Check double */
  33120. (void)sp_521_sub_17(t1, p521_mod, q->y);
  33121. sp_521_norm_17(t1);
  33122. if ((~p->infinity & ~q->infinity &
  33123. sp_521_cmp_equal_17(p->x, q->x) & sp_521_cmp_equal_17(p->z, q->z) &
  33124. (sp_521_cmp_equal_17(p->y, q->y) | sp_521_cmp_equal_17(p->y, t1))) != 0) {
  33125. sp_521_proj_point_dbl_17(r, p, t);
  33126. }
  33127. else {
  33128. sp_digit maskp;
  33129. sp_digit maskq;
  33130. sp_digit maskt;
  33131. sp_digit* x = t2;
  33132. sp_digit* y = t5;
  33133. sp_digit* z = t6;
  33134. int i;
  33135. /* U2 = X2*Z1^2 */
  33136. sp_521_mont_sqr_17(t2, p->z, p521_mod, p521_mp_mod);
  33137. sp_521_mont_mul_17(t4, t2, p->z, p521_mod, p521_mp_mod);
  33138. sp_521_mont_mul_17(t2, t2, q->x, p521_mod, p521_mp_mod);
  33139. /* S2 = Y2*Z1^3 */
  33140. sp_521_mont_mul_17(t4, t4, q->y, p521_mod, p521_mp_mod);
  33141. /* H = U2 - X1 */
  33142. sp_521_mont_sub_17(t2, t2, p->x, p521_mod);
  33143. /* R = S2 - Y1 */
  33144. sp_521_mont_sub_17(t4, t4, p->y, p521_mod);
  33145. /* Z3 = H*Z1 */
  33146. sp_521_mont_mul_17(z, p->z, t2, p521_mod, p521_mp_mod);
  33147. /* X3 = R^2 - H^3 - 2*X1*H^2 */
  33148. sp_521_mont_sqr_17(t1, t4, p521_mod, p521_mp_mod);
  33149. sp_521_mont_sqr_17(t5, t2, p521_mod, p521_mp_mod);
  33150. sp_521_mont_mul_17(t3, p->x, t5, p521_mod, p521_mp_mod);
  33151. sp_521_mont_mul_17(t5, t5, t2, p521_mod, p521_mp_mod);
  33152. sp_521_mont_sub_17(x, t1, t5, p521_mod);
  33153. sp_521_mont_dbl_17(t1, t3, p521_mod);
  33154. sp_521_mont_sub_17(x, x, t1, p521_mod);
  33155. /* Y3 = R*(X1*H^2 - X3) - Y1*H^3 */
  33156. sp_521_mont_sub_lower_17(t3, t3, x, p521_mod);
  33157. sp_521_mont_mul_17(t3, t3, t4, p521_mod, p521_mp_mod);
  33158. sp_521_mont_mul_17(t5, t5, p->y, p521_mod, p521_mp_mod);
  33159. sp_521_mont_sub_17(y, t3, t5, p521_mod);
  33160. maskp = 0 - (q->infinity & (!p->infinity));
  33161. maskq = 0 - (p->infinity & (!q->infinity));
  33162. maskt = ~(maskp | maskq);
  33163. for (i = 0; i < 17; i++) {
  33164. r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) | (x[i] & maskt);
  33165. }
  33166. for (i = 0; i < 17; i++) {
  33167. r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) | (y[i] & maskt);
  33168. }
  33169. for (i = 0; i < 17; i++) {
  33170. r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) | (z[i] & maskt);
  33171. }
  33172. r->z[0] |= p->infinity & q->infinity;
  33173. r->infinity = p->infinity & q->infinity;
  33174. }
  33175. }
  33176. #ifdef WOLFSSL_SP_SMALL
  33177. #ifdef FP_ECC
  33178. /* Generate the pre-computed table of points for the base point.
  33179. *
  33180. * width = 4
  33181. * 16 entries
  33182. * 130 bits between
  33183. *
  33184. * a The base point.
  33185. * table Place to store generated point data.
  33186. * tmp Temporary data.
  33187. * heap Heap to use for allocation.
  33188. */
  33189. static int sp_521_gen_stripe_table_17(const sp_point_521* a,
  33190. sp_table_entry_521* table, sp_digit* tmp, void* heap)
  33191. {
  33192. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33193. sp_point_521* t = NULL;
  33194. #else
  33195. sp_point_521 t[3];
  33196. #endif
  33197. sp_point_521* s1 = NULL;
  33198. sp_point_521* s2 = NULL;
  33199. int i;
  33200. int j;
  33201. int err = MP_OKAY;
  33202. (void)heap;
  33203. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33204. t = (sp_point_521*)XMALLOC(sizeof(sp_point_521) * 3, heap,
  33205. DYNAMIC_TYPE_ECC);
  33206. if (t == NULL)
  33207. err = MEMORY_E;
  33208. #endif
  33209. if (err == MP_OKAY) {
  33210. s1 = t + 1;
  33211. s2 = t + 2;
  33212. err = sp_521_mod_mul_norm_17(t->x, a->x, p521_mod);
  33213. }
  33214. if (err == MP_OKAY) {
  33215. err = sp_521_mod_mul_norm_17(t->y, a->y, p521_mod);
  33216. }
  33217. if (err == MP_OKAY) {
  33218. err = sp_521_mod_mul_norm_17(t->z, a->z, p521_mod);
  33219. }
  33220. if (err == MP_OKAY) {
  33221. t->infinity = 0;
  33222. sp_521_proj_to_affine_17(t, tmp);
  33223. XMEMCPY(s1->z, p521_norm_mod, sizeof(p521_norm_mod));
  33224. s1->infinity = 0;
  33225. XMEMCPY(s2->z, p521_norm_mod, sizeof(p521_norm_mod));
  33226. s2->infinity = 0;
  33227. /* table[0] = {0, 0, infinity} */
  33228. XMEMSET(&table[0], 0, sizeof(sp_table_entry_521));
  33229. /* table[1] = Affine version of 'a' in Montgomery form */
  33230. XMEMCPY(table[1].x, t->x, sizeof(table->x));
  33231. XMEMCPY(table[1].y, t->y, sizeof(table->y));
  33232. for (i=1; i<4; i++) {
  33233. sp_521_proj_point_dbl_n_17(t, 131, tmp);
  33234. sp_521_proj_to_affine_17(t, tmp);
  33235. XMEMCPY(table[1<<i].x, t->x, sizeof(table->x));
  33236. XMEMCPY(table[1<<i].y, t->y, sizeof(table->y));
  33237. }
  33238. for (i=1; i<4; i++) {
  33239. XMEMCPY(s1->x, table[1<<i].x, sizeof(table->x));
  33240. XMEMCPY(s1->y, table[1<<i].y, sizeof(table->y));
  33241. for (j=(1<<i)+1; j<(1<<(i+1)); j++) {
  33242. XMEMCPY(s2->x, table[j-(1<<i)].x, sizeof(table->x));
  33243. XMEMCPY(s2->y, table[j-(1<<i)].y, sizeof(table->y));
  33244. sp_521_proj_point_add_qz1_17(t, s1, s2, tmp);
  33245. sp_521_proj_to_affine_17(t, tmp);
  33246. XMEMCPY(table[j].x, t->x, sizeof(table->x));
  33247. XMEMCPY(table[j].y, t->y, sizeof(table->y));
  33248. }
  33249. }
  33250. }
  33251. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33252. if (t != NULL)
  33253. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  33254. #endif
  33255. return err;
  33256. }
  33257. #endif /* FP_ECC */
  33258. #ifndef WC_NO_CACHE_RESISTANT
  33259. /* Touch each possible entry that could be being copied.
  33260. *
  33261. * r Point to copy into.
  33262. * table Table - start of the entires to access
  33263. * idx Index of entry to retrieve.
  33264. */
  33265. static void sp_521_get_entry_16_17(sp_point_521* r,
  33266. const sp_table_entry_521* table, int idx)
  33267. {
  33268. int i;
  33269. sp_digit mask;
  33270. r->x[0] = 0;
  33271. r->x[1] = 0;
  33272. r->x[2] = 0;
  33273. r->x[3] = 0;
  33274. r->x[4] = 0;
  33275. r->x[5] = 0;
  33276. r->x[6] = 0;
  33277. r->x[7] = 0;
  33278. r->x[8] = 0;
  33279. r->x[9] = 0;
  33280. r->x[10] = 0;
  33281. r->x[11] = 0;
  33282. r->x[12] = 0;
  33283. r->x[13] = 0;
  33284. r->x[14] = 0;
  33285. r->x[15] = 0;
  33286. r->x[16] = 0;
  33287. r->y[0] = 0;
  33288. r->y[1] = 0;
  33289. r->y[2] = 0;
  33290. r->y[3] = 0;
  33291. r->y[4] = 0;
  33292. r->y[5] = 0;
  33293. r->y[6] = 0;
  33294. r->y[7] = 0;
  33295. r->y[8] = 0;
  33296. r->y[9] = 0;
  33297. r->y[10] = 0;
  33298. r->y[11] = 0;
  33299. r->y[12] = 0;
  33300. r->y[13] = 0;
  33301. r->y[14] = 0;
  33302. r->y[15] = 0;
  33303. r->y[16] = 0;
  33304. for (i = 1; i < 16; i++) {
  33305. mask = 0 - (i == idx);
  33306. r->x[0] |= mask & table[i].x[0];
  33307. r->x[1] |= mask & table[i].x[1];
  33308. r->x[2] |= mask & table[i].x[2];
  33309. r->x[3] |= mask & table[i].x[3];
  33310. r->x[4] |= mask & table[i].x[4];
  33311. r->x[5] |= mask & table[i].x[5];
  33312. r->x[6] |= mask & table[i].x[6];
  33313. r->x[7] |= mask & table[i].x[7];
  33314. r->x[8] |= mask & table[i].x[8];
  33315. r->x[9] |= mask & table[i].x[9];
  33316. r->x[10] |= mask & table[i].x[10];
  33317. r->x[11] |= mask & table[i].x[11];
  33318. r->x[12] |= mask & table[i].x[12];
  33319. r->x[13] |= mask & table[i].x[13];
  33320. r->x[14] |= mask & table[i].x[14];
  33321. r->x[15] |= mask & table[i].x[15];
  33322. r->x[16] |= mask & table[i].x[16];
  33323. r->y[0] |= mask & table[i].y[0];
  33324. r->y[1] |= mask & table[i].y[1];
  33325. r->y[2] |= mask & table[i].y[2];
  33326. r->y[3] |= mask & table[i].y[3];
  33327. r->y[4] |= mask & table[i].y[4];
  33328. r->y[5] |= mask & table[i].y[5];
  33329. r->y[6] |= mask & table[i].y[6];
  33330. r->y[7] |= mask & table[i].y[7];
  33331. r->y[8] |= mask & table[i].y[8];
  33332. r->y[9] |= mask & table[i].y[9];
  33333. r->y[10] |= mask & table[i].y[10];
  33334. r->y[11] |= mask & table[i].y[11];
  33335. r->y[12] |= mask & table[i].y[12];
  33336. r->y[13] |= mask & table[i].y[13];
  33337. r->y[14] |= mask & table[i].y[14];
  33338. r->y[15] |= mask & table[i].y[15];
  33339. r->y[16] |= mask & table[i].y[16];
  33340. }
  33341. }
  33342. #endif /* !WC_NO_CACHE_RESISTANT */
  33343. /* Multiply the point by the scalar and return the result.
  33344. * If map is true then convert result to affine coordinates.
  33345. *
  33346. * Stripe implementation.
  33347. * Pre-generated: 2^0, 2^130, ...
  33348. * Pre-generated: products of all combinations of above.
  33349. * 4 doubles and adds (with qz=1)
  33350. *
  33351. * r Resulting point.
  33352. * k Scalar to multiply by.
  33353. * table Pre-computed table.
  33354. * map Indicates whether to convert result to affine.
  33355. * ct Constant time required.
  33356. * heap Heap to use for allocation.
  33357. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  33358. */
  33359. static int sp_521_ecc_mulmod_stripe_17(sp_point_521* r, const sp_point_521* g,
  33360. const sp_table_entry_521* table, const sp_digit* k, int map,
  33361. int ct, void* heap)
  33362. {
  33363. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33364. sp_point_521* rt = NULL;
  33365. sp_digit* t = NULL;
  33366. #else
  33367. sp_point_521 rt[2];
  33368. sp_digit t[2 * 17 * 6];
  33369. #endif
  33370. sp_point_521* p = NULL;
  33371. int i;
  33372. int j;
  33373. int y;
  33374. int x;
  33375. int err = MP_OKAY;
  33376. (void)g;
  33377. /* Constant time used for cache attack resistance implementation. */
  33378. (void)ct;
  33379. (void)heap;
  33380. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33381. rt = (sp_point_521*)XMALLOC(sizeof(sp_point_521) * 2, heap,
  33382. DYNAMIC_TYPE_ECC);
  33383. if (rt == NULL)
  33384. err = MEMORY_E;
  33385. if (err == MP_OKAY) {
  33386. t = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 17 * 6, heap,
  33387. DYNAMIC_TYPE_ECC);
  33388. if (t == NULL)
  33389. err = MEMORY_E;
  33390. }
  33391. #endif
  33392. if (err == MP_OKAY) {
  33393. p = rt + 1;
  33394. XMEMCPY(p->z, p521_norm_mod, sizeof(p521_norm_mod));
  33395. XMEMCPY(rt->z, p521_norm_mod, sizeof(p521_norm_mod));
  33396. y = 0;
  33397. x = 130;
  33398. for (j=0; j<4 && x<521; j++) {
  33399. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  33400. x += 131;
  33401. }
  33402. #ifndef WC_NO_CACHE_RESISTANT
  33403. if (ct) {
  33404. sp_521_get_entry_16_17(rt, table, y);
  33405. } else
  33406. #endif
  33407. {
  33408. XMEMCPY(rt->x, table[y].x, sizeof(table[y].x));
  33409. XMEMCPY(rt->y, table[y].y, sizeof(table[y].y));
  33410. }
  33411. rt->infinity = !y;
  33412. for (i=129; i>=0; i--) {
  33413. y = 0;
  33414. x = i;
  33415. for (j=0; j<4 && x<521; j++) {
  33416. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  33417. x += 131;
  33418. }
  33419. sp_521_proj_point_dbl_17(rt, rt, t);
  33420. #ifndef WC_NO_CACHE_RESISTANT
  33421. if (ct) {
  33422. sp_521_get_entry_16_17(p, table, y);
  33423. }
  33424. else
  33425. #endif
  33426. {
  33427. XMEMCPY(p->x, table[y].x, sizeof(table[y].x));
  33428. XMEMCPY(p->y, table[y].y, sizeof(table[y].y));
  33429. }
  33430. p->infinity = !y;
  33431. sp_521_proj_point_add_qz1_17(rt, rt, p, t);
  33432. }
  33433. if (map != 0) {
  33434. sp_521_map_17(r, rt, t);
  33435. }
  33436. else {
  33437. XMEMCPY(r, rt, sizeof(sp_point_521));
  33438. }
  33439. }
  33440. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33441. if (t != NULL)
  33442. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  33443. if (rt != NULL)
  33444. XFREE(rt, heap, DYNAMIC_TYPE_ECC);
  33445. #endif
  33446. return err;
  33447. }
  33448. #ifdef FP_ECC
  33449. #ifndef FP_ENTRIES
  33450. #define FP_ENTRIES 16
  33451. #endif
  33452. /* Cache entry - holds precomputation tables for a point. */
  33453. typedef struct sp_cache_521_t {
  33454. /* X ordinate of point that table was generated from. */
  33455. sp_digit x[17];
  33456. /* Y ordinate of point that table was generated from. */
  33457. sp_digit y[17];
  33458. /* Precomputation table for point. */
  33459. sp_table_entry_521 table[16];
  33460. /* Count of entries in table. */
  33461. uint32_t cnt;
  33462. /* Point and table set in entry. */
  33463. int set;
  33464. } sp_cache_521_t;
  33465. /* Cache of tables. */
  33466. static THREAD_LS_T sp_cache_521_t sp_cache_521[FP_ENTRIES];
  33467. /* Index of last entry in cache. */
  33468. static THREAD_LS_T int sp_cache_521_last = -1;
  33469. /* Cache has been initialized. */
  33470. static THREAD_LS_T int sp_cache_521_inited = 0;
  33471. #ifndef HAVE_THREAD_LS
  33472. static volatile int initCacheMutex_521 = 0;
  33473. static wolfSSL_Mutex sp_cache_521_lock;
  33474. #endif
  33475. /* Get the cache entry for the point.
  33476. *
  33477. * g [in] Point scalar multipling.
  33478. * cache [out] Cache table to use.
  33479. */
  33480. static void sp_ecc_get_cache_521(const sp_point_521* g, sp_cache_521_t** cache)
  33481. {
  33482. int i;
  33483. int j;
  33484. uint32_t least;
  33485. if (sp_cache_521_inited == 0) {
  33486. for (i=0; i<FP_ENTRIES; i++) {
  33487. sp_cache_521[i].set = 0;
  33488. }
  33489. sp_cache_521_inited = 1;
  33490. }
  33491. /* Compare point with those in cache. */
  33492. for (i=0; i<FP_ENTRIES; i++) {
  33493. if (!sp_cache_521[i].set)
  33494. continue;
  33495. if (sp_521_cmp_equal_17(g->x, sp_cache_521[i].x) &
  33496. sp_521_cmp_equal_17(g->y, sp_cache_521[i].y)) {
  33497. sp_cache_521[i].cnt++;
  33498. break;
  33499. }
  33500. }
  33501. /* No match. */
  33502. if (i == FP_ENTRIES) {
  33503. /* Find empty entry. */
  33504. i = (sp_cache_521_last + 1) % FP_ENTRIES;
  33505. for (; i != sp_cache_521_last; i=(i+1)%FP_ENTRIES) {
  33506. if (!sp_cache_521[i].set) {
  33507. break;
  33508. }
  33509. }
  33510. /* Evict least used. */
  33511. if (i == sp_cache_521_last) {
  33512. least = sp_cache_521[0].cnt;
  33513. for (j=1; j<FP_ENTRIES; j++) {
  33514. if (sp_cache_521[j].cnt < least) {
  33515. i = j;
  33516. least = sp_cache_521[i].cnt;
  33517. }
  33518. }
  33519. }
  33520. XMEMCPY(sp_cache_521[i].x, g->x, sizeof(sp_cache_521[i].x));
  33521. XMEMCPY(sp_cache_521[i].y, g->y, sizeof(sp_cache_521[i].y));
  33522. sp_cache_521[i].set = 1;
  33523. sp_cache_521[i].cnt = 1;
  33524. }
  33525. *cache = &sp_cache_521[i];
  33526. sp_cache_521_last = i;
  33527. }
  33528. #endif /* FP_ECC */
  33529. /* Multiply the base point of P521 by the scalar and return the result.
  33530. * If map is true then convert result to affine coordinates.
  33531. *
  33532. * r Resulting point.
  33533. * g Point to multiply.
  33534. * k Scalar to multiply by.
  33535. * map Indicates whether to convert result to affine.
  33536. * ct Constant time required.
  33537. * heap Heap to use for allocation.
  33538. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  33539. */
  33540. static int sp_521_ecc_mulmod_17(sp_point_521* r, const sp_point_521* g, const sp_digit* k,
  33541. int map, int ct, void* heap)
  33542. {
  33543. #ifndef FP_ECC
  33544. return sp_521_ecc_mulmod_fast_17(r, g, k, map, ct, heap);
  33545. #else
  33546. sp_digit tmp[2 * 17 * 6];
  33547. sp_cache_521_t* cache;
  33548. int err = MP_OKAY;
  33549. #ifndef HAVE_THREAD_LS
  33550. if (initCacheMutex_521 == 0) {
  33551. wc_InitMutex(&sp_cache_521_lock);
  33552. initCacheMutex_521 = 1;
  33553. }
  33554. if (wc_LockMutex(&sp_cache_521_lock) != 0)
  33555. err = BAD_MUTEX_E;
  33556. #endif /* HAVE_THREAD_LS */
  33557. if (err == MP_OKAY) {
  33558. sp_ecc_get_cache_521(g, &cache);
  33559. if (cache->cnt == 2)
  33560. sp_521_gen_stripe_table_17(g, cache->table, tmp, heap);
  33561. #ifndef HAVE_THREAD_LS
  33562. wc_UnLockMutex(&sp_cache_521_lock);
  33563. #endif /* HAVE_THREAD_LS */
  33564. if (cache->cnt < 2) {
  33565. err = sp_521_ecc_mulmod_fast_17(r, g, k, map, ct, heap);
  33566. }
  33567. else {
  33568. err = sp_521_ecc_mulmod_stripe_17(r, g, cache->table, k,
  33569. map, ct, heap);
  33570. }
  33571. }
  33572. return err;
  33573. #endif
  33574. }
  33575. #else
  33576. #ifdef FP_ECC
  33577. /* Generate the pre-computed table of points for the base point.
  33578. *
  33579. * width = 8
  33580. * 256 entries
  33581. * 65 bits between
  33582. *
  33583. * a The base point.
  33584. * table Place to store generated point data.
  33585. * tmp Temporary data.
  33586. * heap Heap to use for allocation.
  33587. */
  33588. static int sp_521_gen_stripe_table_17(const sp_point_521* a,
  33589. sp_table_entry_521* table, sp_digit* tmp, void* heap)
  33590. {
  33591. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33592. sp_point_521* t = NULL;
  33593. #else
  33594. sp_point_521 t[3];
  33595. #endif
  33596. sp_point_521* s1 = NULL;
  33597. sp_point_521* s2 = NULL;
  33598. int i;
  33599. int j;
  33600. int err = MP_OKAY;
  33601. (void)heap;
  33602. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33603. t = (sp_point_521*)XMALLOC(sizeof(sp_point_521) * 3, heap,
  33604. DYNAMIC_TYPE_ECC);
  33605. if (t == NULL)
  33606. err = MEMORY_E;
  33607. #endif
  33608. if (err == MP_OKAY) {
  33609. s1 = t + 1;
  33610. s2 = t + 2;
  33611. err = sp_521_mod_mul_norm_17(t->x, a->x, p521_mod);
  33612. }
  33613. if (err == MP_OKAY) {
  33614. err = sp_521_mod_mul_norm_17(t->y, a->y, p521_mod);
  33615. }
  33616. if (err == MP_OKAY) {
  33617. err = sp_521_mod_mul_norm_17(t->z, a->z, p521_mod);
  33618. }
  33619. if (err == MP_OKAY) {
  33620. t->infinity = 0;
  33621. sp_521_proj_to_affine_17(t, tmp);
  33622. XMEMCPY(s1->z, p521_norm_mod, sizeof(p521_norm_mod));
  33623. s1->infinity = 0;
  33624. XMEMCPY(s2->z, p521_norm_mod, sizeof(p521_norm_mod));
  33625. s2->infinity = 0;
  33626. /* table[0] = {0, 0, infinity} */
  33627. XMEMSET(&table[0], 0, sizeof(sp_table_entry_521));
  33628. /* table[1] = Affine version of 'a' in Montgomery form */
  33629. XMEMCPY(table[1].x, t->x, sizeof(table->x));
  33630. XMEMCPY(table[1].y, t->y, sizeof(table->y));
  33631. for (i=1; i<8; i++) {
  33632. sp_521_proj_point_dbl_n_17(t, 66, tmp);
  33633. sp_521_proj_to_affine_17(t, tmp);
  33634. XMEMCPY(table[1<<i].x, t->x, sizeof(table->x));
  33635. XMEMCPY(table[1<<i].y, t->y, sizeof(table->y));
  33636. }
  33637. for (i=1; i<8; i++) {
  33638. XMEMCPY(s1->x, table[1<<i].x, sizeof(table->x));
  33639. XMEMCPY(s1->y, table[1<<i].y, sizeof(table->y));
  33640. for (j=(1<<i)+1; j<(1<<(i+1)); j++) {
  33641. XMEMCPY(s2->x, table[j-(1<<i)].x, sizeof(table->x));
  33642. XMEMCPY(s2->y, table[j-(1<<i)].y, sizeof(table->y));
  33643. sp_521_proj_point_add_qz1_17(t, s1, s2, tmp);
  33644. sp_521_proj_to_affine_17(t, tmp);
  33645. XMEMCPY(table[j].x, t->x, sizeof(table->x));
  33646. XMEMCPY(table[j].y, t->y, sizeof(table->y));
  33647. }
  33648. }
  33649. }
  33650. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33651. if (t != NULL)
  33652. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  33653. #endif
  33654. return err;
  33655. }
  33656. #endif /* FP_ECC */
  33657. #ifndef WC_NO_CACHE_RESISTANT
  33658. /* Touch each possible entry that could be being copied.
  33659. *
  33660. * r Point to copy into.
  33661. * table Table - start of the entires to access
  33662. * idx Index of entry to retrieve.
  33663. */
  33664. static void sp_521_get_entry_256_17(sp_point_521* r,
  33665. const sp_table_entry_521* table, int idx)
  33666. {
  33667. int i;
  33668. sp_digit mask;
  33669. r->x[0] = 0;
  33670. r->x[1] = 0;
  33671. r->x[2] = 0;
  33672. r->x[3] = 0;
  33673. r->x[4] = 0;
  33674. r->x[5] = 0;
  33675. r->x[6] = 0;
  33676. r->x[7] = 0;
  33677. r->x[8] = 0;
  33678. r->x[9] = 0;
  33679. r->x[10] = 0;
  33680. r->x[11] = 0;
  33681. r->x[12] = 0;
  33682. r->x[13] = 0;
  33683. r->x[14] = 0;
  33684. r->x[15] = 0;
  33685. r->x[16] = 0;
  33686. r->y[0] = 0;
  33687. r->y[1] = 0;
  33688. r->y[2] = 0;
  33689. r->y[3] = 0;
  33690. r->y[4] = 0;
  33691. r->y[5] = 0;
  33692. r->y[6] = 0;
  33693. r->y[7] = 0;
  33694. r->y[8] = 0;
  33695. r->y[9] = 0;
  33696. r->y[10] = 0;
  33697. r->y[11] = 0;
  33698. r->y[12] = 0;
  33699. r->y[13] = 0;
  33700. r->y[14] = 0;
  33701. r->y[15] = 0;
  33702. r->y[16] = 0;
  33703. for (i = 1; i < 256; i++) {
  33704. mask = 0 - (i == idx);
  33705. r->x[0] |= mask & table[i].x[0];
  33706. r->x[1] |= mask & table[i].x[1];
  33707. r->x[2] |= mask & table[i].x[2];
  33708. r->x[3] |= mask & table[i].x[3];
  33709. r->x[4] |= mask & table[i].x[4];
  33710. r->x[5] |= mask & table[i].x[5];
  33711. r->x[6] |= mask & table[i].x[6];
  33712. r->x[7] |= mask & table[i].x[7];
  33713. r->x[8] |= mask & table[i].x[8];
  33714. r->x[9] |= mask & table[i].x[9];
  33715. r->x[10] |= mask & table[i].x[10];
  33716. r->x[11] |= mask & table[i].x[11];
  33717. r->x[12] |= mask & table[i].x[12];
  33718. r->x[13] |= mask & table[i].x[13];
  33719. r->x[14] |= mask & table[i].x[14];
  33720. r->x[15] |= mask & table[i].x[15];
  33721. r->x[16] |= mask & table[i].x[16];
  33722. r->y[0] |= mask & table[i].y[0];
  33723. r->y[1] |= mask & table[i].y[1];
  33724. r->y[2] |= mask & table[i].y[2];
  33725. r->y[3] |= mask & table[i].y[3];
  33726. r->y[4] |= mask & table[i].y[4];
  33727. r->y[5] |= mask & table[i].y[5];
  33728. r->y[6] |= mask & table[i].y[6];
  33729. r->y[7] |= mask & table[i].y[7];
  33730. r->y[8] |= mask & table[i].y[8];
  33731. r->y[9] |= mask & table[i].y[9];
  33732. r->y[10] |= mask & table[i].y[10];
  33733. r->y[11] |= mask & table[i].y[11];
  33734. r->y[12] |= mask & table[i].y[12];
  33735. r->y[13] |= mask & table[i].y[13];
  33736. r->y[14] |= mask & table[i].y[14];
  33737. r->y[15] |= mask & table[i].y[15];
  33738. r->y[16] |= mask & table[i].y[16];
  33739. }
  33740. }
  33741. #endif /* !WC_NO_CACHE_RESISTANT */
  33742. /* Multiply the point by the scalar and return the result.
  33743. * If map is true then convert result to affine coordinates.
  33744. *
  33745. * Stripe implementation.
  33746. * Pre-generated: 2^0, 2^65, ...
  33747. * Pre-generated: products of all combinations of above.
  33748. * 8 doubles and adds (with qz=1)
  33749. *
  33750. * r Resulting point.
  33751. * k Scalar to multiply by.
  33752. * table Pre-computed table.
  33753. * map Indicates whether to convert result to affine.
  33754. * ct Constant time required.
  33755. * heap Heap to use for allocation.
  33756. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  33757. */
  33758. static int sp_521_ecc_mulmod_stripe_17(sp_point_521* r, const sp_point_521* g,
  33759. const sp_table_entry_521* table, const sp_digit* k, int map,
  33760. int ct, void* heap)
  33761. {
  33762. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33763. sp_point_521* rt = NULL;
  33764. sp_digit* t = NULL;
  33765. #else
  33766. sp_point_521 rt[2];
  33767. sp_digit t[2 * 17 * 6];
  33768. #endif
  33769. sp_point_521* p = NULL;
  33770. int i;
  33771. int j;
  33772. int y;
  33773. int x;
  33774. int err = MP_OKAY;
  33775. (void)g;
  33776. /* Constant time used for cache attack resistance implementation. */
  33777. (void)ct;
  33778. (void)heap;
  33779. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33780. rt = (sp_point_521*)XMALLOC(sizeof(sp_point_521) * 2, heap,
  33781. DYNAMIC_TYPE_ECC);
  33782. if (rt == NULL)
  33783. err = MEMORY_E;
  33784. if (err == MP_OKAY) {
  33785. t = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 17 * 6, heap,
  33786. DYNAMIC_TYPE_ECC);
  33787. if (t == NULL)
  33788. err = MEMORY_E;
  33789. }
  33790. #endif
  33791. if (err == MP_OKAY) {
  33792. p = rt + 1;
  33793. XMEMCPY(p->z, p521_norm_mod, sizeof(p521_norm_mod));
  33794. XMEMCPY(rt->z, p521_norm_mod, sizeof(p521_norm_mod));
  33795. y = 0;
  33796. x = 65;
  33797. for (j=0; j<8 && x<521; j++) {
  33798. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  33799. x += 66;
  33800. }
  33801. #ifndef WC_NO_CACHE_RESISTANT
  33802. if (ct) {
  33803. sp_521_get_entry_256_17(rt, table, y);
  33804. } else
  33805. #endif
  33806. {
  33807. XMEMCPY(rt->x, table[y].x, sizeof(table[y].x));
  33808. XMEMCPY(rt->y, table[y].y, sizeof(table[y].y));
  33809. }
  33810. rt->infinity = !y;
  33811. for (i=64; i>=0; i--) {
  33812. y = 0;
  33813. x = i;
  33814. for (j=0; j<8 && x<521; j++) {
  33815. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  33816. x += 66;
  33817. }
  33818. sp_521_proj_point_dbl_17(rt, rt, t);
  33819. #ifndef WC_NO_CACHE_RESISTANT
  33820. if (ct) {
  33821. sp_521_get_entry_256_17(p, table, y);
  33822. }
  33823. else
  33824. #endif
  33825. {
  33826. XMEMCPY(p->x, table[y].x, sizeof(table[y].x));
  33827. XMEMCPY(p->y, table[y].y, sizeof(table[y].y));
  33828. }
  33829. p->infinity = !y;
  33830. sp_521_proj_point_add_qz1_17(rt, rt, p, t);
  33831. }
  33832. if (map != 0) {
  33833. sp_521_map_17(r, rt, t);
  33834. }
  33835. else {
  33836. XMEMCPY(r, rt, sizeof(sp_point_521));
  33837. }
  33838. }
  33839. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33840. if (t != NULL)
  33841. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  33842. if (rt != NULL)
  33843. XFREE(rt, heap, DYNAMIC_TYPE_ECC);
  33844. #endif
  33845. return err;
  33846. }
  33847. #ifdef FP_ECC
  33848. #ifndef FP_ENTRIES
  33849. #define FP_ENTRIES 16
  33850. #endif
  33851. /* Cache entry - holds a point and the precomputation table for it. */
  33852. typedef struct sp_cache_521_t {
  33853. /* X ordinate of point that table was generated from. */
  33854. sp_digit x[17];
  33855. /* Y ordinate of point that table was generated from. */
  33856. sp_digit y[17];
  33857. /* Precomputation (stripe) table for point - 256 entries. */
  33858. sp_table_entry_521 table[256];
  33859. /* Use count: set to 1 when the point is stored, incremented on each cache hit. The table is generated when it is 2 and the lowest count is evicted. */
  33860. uint32_t cnt;
  33861. /* Non-zero when a point has been stored in this entry. */
  33862. int set;
  33863. } sp_cache_521_t;
  33864. /* Cache of points and their tables - FP_ENTRIES entries. */
  33865. static THREAD_LS_T sp_cache_521_t sp_cache_521[FP_ENTRIES];
  33866. /* Index of the entry returned by the most recent lookup; -1 before the first lookup. */
  33867. static THREAD_LS_T int sp_cache_521_last = -1;
  33868. /* Cache has been initialized. */
  33869. static THREAD_LS_T int sp_cache_521_inited = 0;
  33870. #ifndef HAVE_THREAD_LS
  33871. static volatile int initCacheMutex_521 = 0; /* Set to 1 once sp_cache_521_lock has been passed to wc_InitMutex. */
  33872. static wolfSSL_Mutex sp_cache_521_lock; /* Lock taken around cache lookup and table generation. */
  33873. #endif
  33874. /* Get the cache entry for the point.
  33875. *
  33876. * g [in] Point scalar multipling.
  33877. * cache [out] Cache table to use.
  33878. */
  33879. static void sp_ecc_get_cache_521(const sp_point_521* g, sp_cache_521_t** cache)
  33880. {
  33881. int i;
  33882. int j;
  33883. uint32_t least;
  33884. if (sp_cache_521_inited == 0) {
  33885. for (i=0; i<FP_ENTRIES; i++) {
  33886. sp_cache_521[i].set = 0;
  33887. }
  33888. sp_cache_521_inited = 1;
  33889. }
  33890. /* Compare point with those in cache. */
  33891. for (i=0; i<FP_ENTRIES; i++) {
  33892. if (!sp_cache_521[i].set)
  33893. continue;
  33894. if (sp_521_cmp_equal_17(g->x, sp_cache_521[i].x) &
  33895. sp_521_cmp_equal_17(g->y, sp_cache_521[i].y)) {
  33896. sp_cache_521[i].cnt++;
  33897. break;
  33898. }
  33899. }
  33900. /* No match. */
  33901. if (i == FP_ENTRIES) {
  33902. /* Find empty entry. */
  33903. i = (sp_cache_521_last + 1) % FP_ENTRIES;
  33904. for (; i != sp_cache_521_last; i=(i+1)%FP_ENTRIES) {
  33905. if (!sp_cache_521[i].set) {
  33906. break;
  33907. }
  33908. }
  33909. /* Evict least used. */
  33910. if (i == sp_cache_521_last) {
  33911. least = sp_cache_521[0].cnt;
  33912. for (j=1; j<FP_ENTRIES; j++) {
  33913. if (sp_cache_521[j].cnt < least) {
  33914. i = j;
  33915. least = sp_cache_521[i].cnt;
  33916. }
  33917. }
  33918. }
  33919. XMEMCPY(sp_cache_521[i].x, g->x, sizeof(sp_cache_521[i].x));
  33920. XMEMCPY(sp_cache_521[i].y, g->y, sizeof(sp_cache_521[i].y));
  33921. sp_cache_521[i].set = 1;
  33922. sp_cache_521[i].cnt = 1;
  33923. }
  33924. *cache = &sp_cache_521[i];
  33925. sp_cache_521_last = i;
  33926. }
  33927. #endif /* FP_ECC */
  33928. /* Multiply the base point of P521 by the scalar and return the result.
  33929. * If map is true then convert result to affine coordinates.
  33930. *
  33931. * r Resulting point.
  33932. * g Point to multiply.
  33933. * k Scalar to multiply by.
  33934. * map Indicates whether to convert result to affine.
  33935. * ct Constant time required.
  33936. * heap Heap to use for allocation.
  33937. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  33938. */
  33939. static int sp_521_ecc_mulmod_17(sp_point_521* r, const sp_point_521* g, const sp_digit* k,
  33940. int map, int ct, void* heap)
  33941. {
  33942. #ifndef FP_ECC
  33943. return sp_521_ecc_mulmod_fast_17(r, g, k, map, ct, heap);
  33944. #else
  33945. sp_digit tmp[2 * 17 * 6];
  33946. sp_cache_521_t* cache;
  33947. int err = MP_OKAY;
  33948. #ifndef HAVE_THREAD_LS
  33949. if (initCacheMutex_521 == 0) {
  33950. wc_InitMutex(&sp_cache_521_lock);
  33951. initCacheMutex_521 = 1;
  33952. }
  33953. if (wc_LockMutex(&sp_cache_521_lock) != 0)
  33954. err = BAD_MUTEX_E;
  33955. #endif /* HAVE_THREAD_LS */
  33956. if (err == MP_OKAY) {
  33957. sp_ecc_get_cache_521(g, &cache);
  33958. if (cache->cnt == 2)
  33959. sp_521_gen_stripe_table_17(g, cache->table, tmp, heap);
  33960. #ifndef HAVE_THREAD_LS
  33961. wc_UnLockMutex(&sp_cache_521_lock);
  33962. #endif /* HAVE_THREAD_LS */
  33963. if (cache->cnt < 2) {
  33964. err = sp_521_ecc_mulmod_fast_17(r, g, k, map, ct, heap);
  33965. }
  33966. else {
  33967. err = sp_521_ecc_mulmod_stripe_17(r, g, cache->table, k,
  33968. map, ct, heap);
  33969. }
  33970. }
  33971. return err;
  33972. #endif
  33973. }
  33974. #endif /* WOLFSSL_SP_SMALL */
  33975. /* Multiply the point by the scalar and return the result.
  33976. * If map is true then convert result to affine coordinates.
  33977. *
  33978. * km Scalar to multiply by.
  33979. * p Point to multiply.
  33980. * r Resulting point.
  33981. * map Indicates whether to convert result to affine.
  33982. * heap Heap to use for allocation.
  33983. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  33984. */
  33985. int sp_ecc_mulmod_521(const mp_int* km, const ecc_point* gm, ecc_point* r,
  33986. int map, void* heap)
  33987. {
  33988. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33989. sp_point_521* point = NULL;
  33990. sp_digit* k = NULL;
  33991. #else
  33992. sp_point_521 point[1];
  33993. sp_digit k[17];
  33994. #endif
  33995. int err = MP_OKAY;
  33996. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  33997. point = (sp_point_521*)XMALLOC(sizeof(sp_point_521), heap,
  33998. DYNAMIC_TYPE_ECC);
  33999. if (point == NULL)
  34000. err = MEMORY_E;
  34001. if (err == MP_OKAY) {
  34002. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 17, heap,
  34003. DYNAMIC_TYPE_ECC);
  34004. if (k == NULL)
  34005. err = MEMORY_E;
  34006. }
  34007. #endif
  34008. if (err == MP_OKAY) {
  34009. sp_521_from_mp(k, 17, km);
  34010. sp_521_point_from_ecc_point_17(point, gm);
  34011. err = sp_521_ecc_mulmod_17(point, point, k, map, 1, heap);
  34012. }
  34013. if (err == MP_OKAY) {
  34014. err = sp_521_point_to_ecc_point_17(point, r);
  34015. }
  34016. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  34017. if (k != NULL)
  34018. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  34019. if (point != NULL)
  34020. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  34021. #endif
  34022. return err;
  34023. }
  34024. /* Multiply the point by the scalar, add point a and return the result.
  34025. * If map is true then convert result to affine coordinates.
  34026. *
  34027. * km Scalar to multiply by.
  34028. * p Point to multiply.
  34029. * am Point to add to scalar mulitply result.
  34030. * inMont Point to add is in montgomery form.
  34031. * r Resulting point.
  34032. * map Indicates whether to convert result to affine.
  34033. * heap Heap to use for allocation.
  34034. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  34035. */
  34036. int sp_ecc_mulmod_add_521(const mp_int* km, const ecc_point* gm,
  34037. const ecc_point* am, int inMont, ecc_point* r, int map, void* heap)
  34038. {
  34039. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  34040. sp_point_521* point = NULL;
  34041. sp_digit* k = NULL;
  34042. #else
  34043. sp_point_521 point[2];
  34044. sp_digit k[17 + 17 * 2 * 6];
  34045. #endif
  34046. sp_point_521* addP = NULL;
  34047. sp_digit* tmp = NULL;
  34048. int err = MP_OKAY;
  34049. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  34050. point = (sp_point_521*)XMALLOC(sizeof(sp_point_521) * 2, heap,
  34051. DYNAMIC_TYPE_ECC);
  34052. if (point == NULL)
  34053. err = MEMORY_E;
  34054. if (err == MP_OKAY) {
  34055. k = (sp_digit*)XMALLOC(
  34056. sizeof(sp_digit) * (17 + 17 * 2 * 6), heap,
  34057. DYNAMIC_TYPE_ECC);
  34058. if (k == NULL)
  34059. err = MEMORY_E;
  34060. }
  34061. #endif
  34062. if (err == MP_OKAY) {
  34063. addP = point + 1;
  34064. tmp = k + 17;
  34065. sp_521_from_mp(k, 17, km);
  34066. sp_521_point_from_ecc_point_17(point, gm);
  34067. sp_521_point_from_ecc_point_17(addP, am);
  34068. }
  34069. if ((err == MP_OKAY) && (!inMont)) {
  34070. err = sp_521_mod_mul_norm_17(addP->x, addP->x, p521_mod);
  34071. }
  34072. if ((err == MP_OKAY) && (!inMont)) {
  34073. err = sp_521_mod_mul_norm_17(addP->y, addP->y, p521_mod);
  34074. }
  34075. if ((err == MP_OKAY) && (!inMont)) {
  34076. err = sp_521_mod_mul_norm_17(addP->z, addP->z, p521_mod);
  34077. }
  34078. if (err == MP_OKAY) {
  34079. err = sp_521_ecc_mulmod_17(point, point, k, 0, 0, heap);
  34080. }
  34081. if (err == MP_OKAY) {
  34082. sp_521_proj_point_add_17(point, point, addP, tmp);
  34083. if (map) {
  34084. sp_521_map_17(point, point, tmp);
  34085. }
  34086. err = sp_521_point_to_ecc_point_17(point, r);
  34087. }
  34088. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  34089. if (k != NULL)
  34090. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  34091. if (point != NULL)
  34092. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  34093. #endif
  34094. return err;
  34095. }
  34096. #ifdef WOLFSSL_SP_SMALL
  34097. /* Striping precomputation table used when WOLFSSL_SP_SMALL is defined.
  34098. * 4 points combined into a table of 16 points.
  34099. * Distance of 131 between points.
  34100. * Each entry holds two values of 17 words; entry 0 is all zero.
  34100. * Passed, with p521_base, to the stripe implementation by
  34100. * sp_521_ecc_mulmod_base_17.
  34100. */
  34101. static const sp_table_entry_521 p521_table[16] = {
  34102. /* 0 */
  34103. { { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  34104. 0x00, 0x00, 0x00, 0x00, 0x00 },
  34105. { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  34106. 0x00, 0x00, 0x00, 0x00, 0x00 } },
  34107. /* 1 */
  34108. { { 0xc2e5bd66,0xf97e7e31,0x856a429b,0x3348b3c1,0xa2ffa8de,0xfe1dc127,
  34109. 0xefe75928,0xa14b5e77,0x6b4d3dba,0xf828af60,0x053fb521,0x9c648139,
  34110. 0x2395b442,0x9e3ecb66,0x0404e9cd,0x858e06b7,0x000000c6 },
  34111. { 0x9fd16650,0x88be9476,0xa272c240,0x353c7086,0x3fad0761,0xc550b901,
  34112. 0x5ef42640,0x97ee7299,0x273e662c,0x17afbd17,0x579b4468,0x98f54449,
  34113. 0x2c7d1bd9,0x5c8a5fb4,0x9a3bc004,0x39296a78,0x00000118 } },
  34114. /* 2 */
  34115. { { 0x66fd07ca,0x1036eb9b,0x6b7fb490,0x6ca52cc1,0xd3e0c270,0x512e973e,
  34116. 0x73d92d11,0x889980bf,0xa4005eea,0x38b4cfe4,0x8ceb4313,0xb6f992cc,
  34117. 0x6daf7c23,0xd0ac2f8d,0xe32a93cb,0x1ccfbf17,0x000000c2 },
  34118. { 0x2f508cca,0x7bd9d6f1,0x595a72af,0xe82d7171,0x97512873,0x25d02976,
  34119. 0x8cf39fbc,0xefc1de8b,0x9a1237f4,0x25e6b77f,0xd4d98b5d,0x9f3b73e7,
  34120. 0xeccb07fe,0xe1fda62b,0x625350cf,0xdb813b03,0x00000014 } },
  34121. /* 3 */
  34122. { { 0x9b27bd61,0x415a1c9b,0x606854d6,0x74522753,0x92e73538,0x9e331ef4,
  34123. 0x817e7a6d,0x0b3dba85,0x49ac273b,0x55c4bd53,0xfcb5417f,0xad42c78d,
  34124. 0x92e08d38,0x528998b9,0xcc1914cc,0x14c2fff6,0x000000c1 },
  34125. { 0x767e9645,0x35b26fb0,0xc5e5a659,0x162b512f,0xcc47fbb8,0xa6e03696,
  34126. 0x0a29a69b,0x732db065,0xd56bdf5d,0x058a74ed,0x25c858d9,0x4b7b60a0,
  34127. 0xbd43373d,0x17f8a6d4,0xedf610b4,0x7b968f51,0x0000011f } },
  34128. /* 4 */
  34129. { { 0x1bc0fa77,0x5f56b5a4,0x64fd36f5,0x6cdd6bb5,0x8a5b7c7f,0xd0ac68b5,
  34130. 0x09919ef9,0x4a92d9bf,0x71c3c520,0xc305e12b,0xdb699aee,0x554a9d1c,
  34131. 0x61f54643,0x7fde0077,0x479115ce,0x99c13124,0x00000039 },
  34132. { 0xc271ac2d,0x25f890e1,0x94b370ac,0x1353ccd3,0x744d4011,0xc7b5adf6,
  34133. 0xbe378127,0x9ccd7687,0x06c4e3cd,0xa8489b5c,0x305505f9,0x1945580a,
  34134. 0x4ab3b12b,0x07190a20,0x1534ea4d,0x0ff53eb1,0x00000159 } },
  34135. /* 5 */
  34136. { { 0x91798548,0x877d4edd,0x031d657a,0xc43c7b25,0xfab18a04,0x47603671,
  34137. 0xf670b476,0x7e39e7f2,0xb02fcc03,0xf7b76431,0x877f46f5,0x7c5662f3,
  34138. 0x1c8b0c61,0x5bf8327e,0x4a8be322,0xe9cdb353,0x000001ae },
  34139. { 0x9d264420,0xa2d7092e,0x533ff3db,0x1f970352,0x99b5b52e,0x31dd232b,
  34140. 0x850f45e9,0x8a9ce16b,0xc3011849,0x01c99023,0xc8e9301e,0x4bc30989,
  34141. 0xcd95f64c,0x77a4de70,0x1026f289,0xbc8797bb,0x000000d7 } },
  34142. /* 6 */
  34143. { { 0x2be9edf8,0x98ea0934,0xfcb98199,0x6c2f3132,0xfaf83aeb,0xf579893d,
  34144. 0xc73fda0f,0x858e87bb,0x7a0b9d1c,0xd3c0b3fb,0x71ee68b1,0x21fe6305,
  34145. 0x66aa6f16,0x5bf8f01f,0xbca825ed,0x30934c99,0x000000d1 },
  34146. { 0x913022f2,0xe4309850,0xde5b80ce,0xfdc336c9,0x8b6130ef,0xb716d689,
  34147. 0xa758d2f4,0x8a58b405,0xaa5cbc1c,0x98879df8,0xc12ce0bb,0x847cfd06,
  34148. 0x8c02ff3c,0xa1006360,0x3438695b,0x836e906a,0x00000136 } },
  34149. /* 7 */
  34150. { { 0x259ce02d,0xac8fe351,0xdae5e0f7,0xa506da0c,0xf043421d,0x77b56e98,
  34151. 0xa1647490,0xe0d041c7,0x9cb90101,0xe41f0789,0xda3e72e6,0x29bbf572,
  34152. 0x04a14df0,0x6b635c47,0xe81ef5d3,0x56873f58,0x000001dd },
  34153. { 0x5cf9e33f,0x77abe79e,0x0a1117fd,0x91aab581,0xcbac2fe1,0x11edf3b1,
  34154. 0xd72113b7,0xef43e017,0x06b74002,0xf9ad685c,0x8fbd3b1a,0x7e6370ce,
  34155. 0x42f73a82,0x550dd50b,0xc5e64a9b,0x8f2146be,0x000001f2 } },
  34156. /* 8 */
  34157. { { 0x2934ed82,0x05a704cc,0x989edd8c,0x647089fb,0x0ce7c62d,0xe0b239d4,
  34158. 0x105a5eff,0x4c892ea6,0xd5ed6b04,0xa519395f,0x509ed794,0x806c7003,
  34159. 0xe70ce5c4,0x882e9886,0xff01f6a9,0x50730ca1,0x00000088 },
  34160. { 0xdbcc5484,0x90a78a16,0xfd454b50,0xc1ab078c,0xcb09e525,0x6f488252,
  34161. 0xe19b2ed7,0xdd663f53,0xa67bf59c,0x16b10da1,0x36bb770a,0xb47f6b95,
  34162. 0x777b2bce,0x6bdc8428,0x561553f8,0xcd02ae3d,0x00000017 } },
  34163. /* 9 */
  34164. { { 0x1579d15a,0x1e3633a0,0x3e98cd1f,0x574f0c23,0xc60f4f99,0x45969dca,
  34165. 0x49fb9f24,0x10062c93,0xd378f640,0xd29a29d7,0xd7d48c2f,0xec941760,
  34166. 0x31fbea5c,0xf0591c59,0xb40f9ebf,0xd6173e6b,0x00000063 },
  34167. { 0x5a984a72,0x220f4f39,0x32510f26,0x9a3f82ce,0x8c069a1d,0xf3d04c76,
  34168. 0x69a21e57,0xf1d6d891,0xdc4db601,0x6b96b30b,0x64dcf3e0,0x71eeb728,
  34169. 0xc7caaff3,0x6f80c483,0x571b66e4,0x45533092,0x000000b0 } },
  34170. /* 10 */
  34171. { { 0x87140dad,0x49ae4521,0x57e2803e,0xda73032b,0x026ea20a,0x13f5e5eb,
  34172. 0x6e00afb9,0x2d54c4b0,0x7a150474,0x4393b92b,0x13f1a7da,0xb5b41bf8,
  34173. 0x02b5867a,0x6d786907,0xaf2ea4d1,0x5193a9ac,0x000001b3 },
  34174. { 0xa6b186cb,0x2a1563f7,0xe28e57b6,0x73a70a44,0x78fc8a1d,0xd7c4fc6d,
  34175. 0xdf3d6d99,0x4c9b4581,0x1e373aab,0x544f5249,0xe913498e,0xe99434a2,
  34176. 0xc4700f4c,0x30159749,0xe5142766,0xb8ef02cc,0x000001d0 } },
  34177. /* 11 */
  34178. { { 0xb9e6ffc9,0xe99805a6,0xf74d977b,0x1a357f05,0x5c9941bc,0xc8ddef31,
  34179. 0xcbe842e7,0x4b6d66ca,0xa20dc12d,0x84e1f75f,0x5f0c02fc,0x8b1b2c50,
  34180. 0x037b493d,0x3fa1889e,0x95705046,0x720bd9e0,0x000001c2 },
  34181. { 0x93ab9309,0x1a1f3378,0x226a8f94,0xe05a30a2,0x4045f1bd,0x2c01a52d,
  34182. 0xab5f5115,0xf42e8fd5,0x0c05fecf,0x954d1d09,0x8d0650d3,0x47e964d1,
  34183. 0x3c860801,0x6866fa5d,0x5abbb4af,0xac2fecbf,0x0000012c } },
  34184. /* 12 */
  34185. { { 0xe5537747,0x846dc3d2,0x1f5f9f46,0xe28e00df,0x3f31e42d,0x041af624,
  34186. 0x256af225,0x4948947f,0xff4f9550,0x3896c61a,0x34bb5a3e,0xcb40c773,
  34187. 0xeceafacc,0xb9becb07,0x4d45e83e,0xfe29f049,0x000001aa },
  34188. { 0x6b5578db,0x83fb71b3,0x0a710526,0x3017f115,0x5f220d77,0x189ec946,
  34189. 0x48465e68,0xba87ae07,0x70e0cbea,0x1da474d5,0x2b2ba7c5,0xb92cb0a6,
  34190. 0x8b1fb7e2,0x35cb356d,0x2cc8cb18,0x1155296a,0x0000000f } },
  34191. /* 13 */
  34192. { { 0x6ed0f604,0x7f9c9d9b,0xcb49c6d7,0x765e43e9,0xae9be5ca,0x03c4dd67,
  34193. 0x405aed36,0x5480888b,0x920ccddb,0x3a69ebb2,0x03f0c7cc,0x44ec0573,
  34194. 0xce89b026,0x158e2437,0x4f179a17,0x86795029,0x0000003a },
  34195. { 0x9f193dd9,0xf7854032,0xdcc158a9,0x531e4068,0x3642b1a5,0x774171bf,
  34196. 0xc1e53aa3,0x12b4920f,0xfd87478d,0xd1c5fb53,0xa7cba7ca,0x48958c58,
  34197. 0x3f66f2c7,0x375b2cb2,0x598899bd,0x1b510d0f,0x000001b8 } },
  34198. /* 14 */
  34199. { { 0x52007e41,0xfe96299d,0xcd708dcd,0x997140b5,0xf655f6fa,0xe9294eed,
  34200. 0xd58b839d,0x7701d45d,0xb6f77cdb,0x5dbdf5ad,0x95a572f0,0x265189f4,
  34201. 0xb3515e7b,0xc162794e,0x72655e0b,0xbfb571e0,0x00000168 },
  34202. { 0xbda82a6b,0xf0d2b863,0x390a9cc7,0x3df5b283,0x700fcd7b,0xbab9995a,
  34203. 0xfa4e6c06,0xc01ef0af,0x76a392d4,0x10a98513,0x955392f0,0xa7e3fc72,
  34204. 0x1d7a8550,0x8e3c0128,0x361898a8,0xcbca551a,0x0000010f } },
  34205. /* 15 */
  34206. { { 0x3ab71115,0xc8a4cd40,0xbcb9b55b,0xb783170d,0xabd9b426,0x1be20f6a,
  34207. 0x5377b714,0x32d2ea64,0x6b358bbf,0xda342480,0x6e202211,0x782bc800,
  34208. 0xaa27c499,0xf80974c4,0x50341cde,0xc2e66fa9,0x0000004e },
  34209. { 0x24ae60c3,0x082cb95b,0x83ad7484,0xd4b80af4,0x6205256b,0x84b739ce,
  34210. 0xae1fe063,0x616f505e,0x342f218f,0xef14ea68,0x64a01186,0x2b17d66c,
  34211. 0x50858bce,0x60e889ce,0xd5881005,0xdb046c59,0x000001e1 } },
  34212. };
  34213. /* Multiply the base point of P521 by the scalar and return the result.
  34214. * If map is true then convert result to affine coordinates.
  34215. *
  34216. * Stripe implementation.
  34217. * Pre-generated: 2^0, 2^130, ...
  34218. * Pre-generated: products of all combinations of above.
  34219. * 4 doubles and adds (with qz=1)
  34220. *
  34221. * r Resulting point.
  34222. * k Scalar to multiply by.
  34223. * map Indicates whether to convert result to affine.
  34224. * ct Constant time required.
  34225. * heap Heap to use for allocation.
  34226. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  34227. */
  34228. static int sp_521_ecc_mulmod_base_17(sp_point_521* r, const sp_digit* k,
  34229. int map, int ct, void* heap)
  34230. {
  34231. return sp_521_ecc_mulmod_stripe_17(r, &p521_base, p521_table,
  34232. k, map, ct, heap);
  34233. }
  34234. #else
  34235. /* Striping precomputation table.
  34236. * 8 points combined into a table of 256 points.
  34237. * Distance of 66 between points.
  34238. */
  34239. static const sp_table_entry_521 p521_table[256] = {
  34240. /* 0 */
  34241. { { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  34242. 0x00, 0x00, 0x00, 0x00, 0x00 },
  34243. { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  34244. 0x00, 0x00, 0x00, 0x00, 0x00 } },
  34245. /* 1 */
  34246. { { 0xc2e5bd66,0xf97e7e31,0x856a429b,0x3348b3c1,0xa2ffa8de,0xfe1dc127,
  34247. 0xefe75928,0xa14b5e77,0x6b4d3dba,0xf828af60,0x053fb521,0x9c648139,
  34248. 0x2395b442,0x9e3ecb66,0x0404e9cd,0x858e06b7,0x000000c6 },
  34249. { 0x9fd16650,0x88be9476,0xa272c240,0x353c7086,0x3fad0761,0xc550b901,
  34250. 0x5ef42640,0x97ee7299,0x273e662c,0x17afbd17,0x579b4468,0x98f54449,
  34251. 0x2c7d1bd9,0x5c8a5fb4,0x9a3bc004,0x39296a78,0x00000118 } },
  34252. /* 2 */
  34253. { { 0x0f0ccb51,0x80398667,0x3654974a,0xb87e1d01,0xb2b29ed9,0x7f58cf21,
  34254. 0xa3add337,0x06c0e9aa,0xe9d08ffb,0xf13b35d0,0x96761627,0xdd8bf44c,
  34255. 0x758a3ef4,0xa4a18c14,0xa0043adb,0x96a576dd,0x0000013e },
  34256. { 0x632d95a3,0x2bde24f8,0x4c524829,0x79f15ef1,0x9bdaba19,0xaadd863e,
  34257. 0xa962b707,0xdde053f4,0x14258d98,0xc598a2de,0x061c235c,0x9fa5a19d,
  34258. 0xe8ffd32c,0x0ed46510,0xef78ceac,0x2aea9dd1,0x00000185 } },
  34259. /* 3 */
  34260. { { 0xeaaf1fe3,0xd0a91dd8,0x4400b52b,0x0db38662,0x21abf0d2,0xff6a06a9,
  34261. 0xa768c940,0x9412879a,0x9a1eec37,0xf3791abc,0x2738343c,0xc913fbe6,
  34262. 0xe222abc1,0x728b42ab,0x2b9ef313,0x874c0a86,0x00000157 },
  34263. { 0xe6f03d49,0x0ac8f184,0x1e48be03,0xa9c357e4,0x815cbdef,0x02ce5ef3,
  34264. 0x5fd8dc3c,0x7a41c7ab,0xfaeb109d,0x4bef67c9,0xa84f4d38,0x2f98cca1,
  34265. 0x672f0aae,0x7e03d47d,0x1d58968b,0x24b1ab58,0x00000007 } },
  34266. /* 4 */
  34267. { { 0xdf9314e0,0x904f2d4b,0xe7a00aac,0xdaae850d,0x582efb03,0x79231083,
  34268. 0xec7fe6d2,0x80f1c283,0x199d74a8,0x2d5b3996,0x395007e7,0x5f120b9b,
  34269. 0x4773f03e,0x30d23773,0x3b78b686,0xf4c19273,0x00000121 },
  34270. { 0xfa8b51f0,0xf103ff6d,0x40e2bdf0,0xae7afb51,0x83254171,0x1130380e,
  34271. 0xcda10d95,0xe83501b8,0x4f3a8c01,0x1057771e,0xac807069,0x8f52196a,
  34272. 0xa5623821,0x3609b0aa,0x94a0a7f1,0x8c257906,0x000001db } },
  34273. /* 5 */
  34274. { { 0xb2c0958d,0x300370cc,0x69a7b387,0x89aef166,0x480c9b38,0x2792f3cf,
  34275. 0xfab3e149,0x0b2984f2,0x50748967,0x9751e436,0xad33db2a,0x9cab99d5,
  34276. 0xb44a4daa,0x4d945d32,0x16c77325,0xa26cca52,0x0000000a },
  34277. { 0xf9e66d18,0xcdbe1d41,0xaa117e7a,0x80aeef96,0xddb0d24b,0x053214a2,
  34278. 0x5c98b7bf,0x6dcfb227,0xdfd3c848,0x613e7436,0x3ca4d52c,0x6e703fa1,
  34279. 0x18551e64,0x0c8e2977,0xbfa8527d,0xf5e90eac,0x000001c6 } },
  34280. /* 6 */
  34281. { { 0x4ab2d58f,0xa2c2f1e7,0x2a097802,0xc1bbf82c,0x770bb76a,0x6583eb24,
  34282. 0x5667f7bd,0x8e4ed9ed,0xfd96897e,0xd8c01d86,0x3fbe0f15,0x66395a13,
  34283. 0xd99cdcb1,0x51e4f39d,0x720deb25,0xde08424a,0x00000082 },
  34284. { 0x60ea91af,0x97aa53b2,0x7a31dfdd,0xa4384af7,0x5cd09bbe,0xcd82f239,
  34285. 0xf30058e1,0x997c19da,0xe5c78e97,0x443b60c6,0x575b1845,0xfaae9b5f,
  34286. 0x08c2ce16,0x5ce86f33,0x4f63fa86,0x983ce58f,0x00000073 } },
  34287. /* 7 */
  34288. { { 0x8217609d,0xaee93131,0x2412fc00,0x7f8a9dd4,0x286c6329,0xe117e64c,
  34289. 0x7bf1c65e,0xcc3782d6,0x8d03eee5,0xe8c144db,0x9ab93799,0x01acacb2,
  34290. 0xb07784c7,0x215eb1b5,0x1affcd87,0x2c409fa8,0x000000f8 },
  34291. { 0x378139a4,0x007d3766,0xb55bea93,0xc6d969eb,0x68c8bc9d,0xc7c60d6f,
  34292. 0x5f93f242,0x844e8461,0x741717d9,0x8461ca2a,0xf0bf120e,0x8e930e79,
  34293. 0x6b5699d7,0xe1554a02,0x6a4fb6de,0xe69c7702,0x0000007d } },
  34294. /* 8 */
  34295. { { 0x4bee80d7,0x61b51bb0,0x7692de69,0x0e1f6a1f,0xa0ebc3bd,0x8379e46c,
  34296. 0x930644f0,0x1c0bffa7,0x390db077,0x97c67b87,0xfada1ce9,0x095c33e1,
  34297. 0xac54b512,0x3c500add,0xd3118656,0xc231d360,0x000000b0 },
  34298. { 0x39bcab2f,0x06289298,0x64dd220a,0xc0c06780,0x763dc2a0,0x062f6084,
  34299. 0x1938c3e3,0x88e9da73,0x52e46eb9,0x69be8f2d,0x6a5de0fd,0xe55c8d2d,
  34300. 0xdb2c0e26,0xf3a3fd63,0x1e4bff57,0x899c6d9f,0x0000014a } },
  34301. /* 9 */
  34302. { { 0xec05ce88,0x9ff6e3a1,0xb6afd202,0xf8fc2496,0x6fbeb007,0x0b9d2077,
  34303. 0xeebded40,0xb50ec0bd,0x693700f7,0xaef97742,0x3f7b030e,0x806e37a1,
  34304. 0x1b901f77,0x5cf17d17,0xca95ae0f,0x9036e5df,0x00000159 },
  34305. { 0x000e8e0c,0x00af64b5,0x06fb4df9,0xd3f2ae04,0x449f23ba,0x5f61da67,
  34306. 0x255b25a9,0x0ca91842,0x8e33c650,0xfa6af3e6,0xc2c027c1,0x14373c00,
  34307. 0x972840a5,0x99f3cda1,0xd0e84240,0x98c62b79,0x000000e7 } },
  34308. /* 10 */
  34309. { { 0xae4d0f28,0xe8c7c4a8,0x566d006e,0x3a8a55ef,0x066e4023,0x37985f65,
  34310. 0x5d321b76,0x8deccab5,0xb8351b07,0x38b966d6,0x57d548ab,0x2e889e53,
  34311. 0xe631ab0b,0x7a9e8e2f,0xe75c537b,0x45c60f95,0x00000059 },
  34312. { 0x7867d79c,0xbca27d34,0x81c81980,0x7f460b15,0x976b8c51,0x7ec2d9ab,
  34313. 0x61b91ed9,0xfcd04486,0xd9c1d15f,0x730a7a25,0xf94c9db9,0x8a2cf259,
  34314. 0x5dec5a3b,0x8e784b87,0x3e5131ee,0x06252607,0x00000004 } },
  34315. /* 11 */
  34316. { { 0xf1631bba,0xdee04e5c,0x156f4524,0x40e6c1df,0xe4c30990,0x06603f30,
  34317. 0x6b6abec7,0xdb649a43,0xf6b94f6e,0x354f509c,0x36b7e0b5,0x7fecf469,
  34318. 0xba1e6dd2,0xa7a7107e,0x689450ca,0x889edac5,0x00000022 },
  34319. { 0xd05596f2,0x9012916e,0xb023cb8b,0xe3901dac,0xe7d4abe1,0x2501d3ec,
  34320. 0xa9c90313,0xb2815040,0xc6d146d0,0x9dbcd3f1,0x74ee1896,0x6fa1d5b1,
  34321. 0xa91226fb,0x49aea161,0xb8a80984,0x754ceedf,0x00000154 } },
  34322. /* 12 */
  34323. { { 0x4270b2f0,0xb64e27b0,0xbf4d74d7,0x84b34e48,0x0c2722ba,0xb186be8b,
  34324. 0x9ff9b71c,0xf54a589d,0x34fd6bc4,0x9887e4df,0x7412f49d,0xb7c669fd,
  34325. 0x77f89d16,0x4008d9bb,0xc902e074,0xafb9426b,0x000001cf },
  34326. { 0x662935ca,0xcca4f2d1,0x997dcc46,0x2847c703,0x353c79f8,0xc089e9e5,
  34327. 0x5215f0f4,0x9ed8d989,0x80911b9d,0x59cf08bc,0x6de27aa3,0x4b03540e,
  34328. 0xf69e320d,0x52f4d63e,0x94ef193b,0xa0217fd6,0x000000e6 } },
  34329. /* 13 */
  34330. { { 0x74214780,0xb77de627,0x207459ea,0xca066817,0xe9c7fb01,0xf78579b7,
  34331. 0xd6d4b7c7,0xe55548c1,0xa66caa39,0x45756190,0x98505a4f,0xf8141b03,
  34332. 0x4c8864eb,0xa5ca0d7c,0x9e129d3f,0xbf8af950,0x00000053 },
  34333. { 0x85285092,0xbc9b29d8,0x8eed5e5f,0x82f31daa,0xf618aab9,0x9c33690e,
  34334. 0xd2626ed1,0x0eee14f4,0x07ed8e09,0x4229570b,0x8736d040,0x1977920e,
  34335. 0xede7d01d,0x47ee25ff,0xbc7ab73b,0x3c921c3a,0x000001b9 } },
  34336. /* 14 */
  34337. { { 0xa08b2b14,0x0b6a07cc,0xbf174c7f,0xaa978deb,0xc40cb2a4,0x291cb828,
  34338. 0x90adc838,0x95c78272,0x8c1edde6,0x08da8b2a,0x90fbd220,0x741ceb2f,
  34339. 0x322db94e,0x5f89c9e5,0xb73c548e,0x18266085,0x0000007d },
  34340. { 0x2defd012,0x69ebf82a,0x5a1537ef,0x01ecb094,0x3ef0811d,0x3c557535,
  34341. 0xb2bd4dea,0x59c882a7,0x7bf969c8,0x00a1f972,0x0b25ad1b,0x063adf5e,
  34342. 0xf2536005,0x4c1ff306,0x4112fe18,0x8e515bec,0x00000117 } },
  34343. /* 15 */
  34344. { { 0xefe3d3d5,0x9314787f,0x9d897227,0x29e76f65,0xe0b6acf5,0x15c77ed1,
  34345. 0x1c5e8dd9,0x9c2b7b20,0x5f5667af,0x788038f1,0xf3576ef4,0xf38c766f,
  34346. 0x0040154a,0x9f0623c8,0xde883b53,0x47d3c44b,0x00000096 },
  34347. { 0xde1b21a4,0x32075638,0x571081c1,0xbb6399c1,0x75c03599,0x322e6067,
  34348. 0xade60cf5,0x5c7fde7f,0xefc19059,0x1b195440,0xdd7b3960,0x7e70ac8c,
  34349. 0x6a6fa73e,0x4aa5a83d,0x63080764,0x34f8cfac,0x00000042 } },
  34350. /* 16 */
  34351. { { 0x286492ad,0xee31e71a,0x65f86ac4,0x08f3de44,0xda713cb4,0xe89700d4,
  34352. 0xa86b7104,0x7ad0f5e9,0x2572c161,0xd9a62e4f,0x25cc1c99,0x77d223ef,
  34353. 0x3b962e0c,0xedff6961,0x81d8b205,0x818d28f3,0x0000008e },
  34354. { 0x8cdf1f60,0x721231cf,0x6717760f,0x8b640f2b,0xe045a403,0xbe726f8c,
  34355. 0x0370689f,0x422285dc,0x72ea0dcb,0x7196bf8f,0xc8086623,0xa16f7855,
  34356. 0xc326fe48,0xd4e19fc7,0x8f68bf44,0xfdbc856e,0x0000013e } },
  34357. /* 17 */
  34358. { { 0xe6a3ace5,0xde34d04f,0x896191c1,0x0dbb603e,0xf75ed0f4,0xb4dc0007,
  34359. 0x95b259b5,0x15e0e6bc,0x2615f020,0xdfbcba66,0xd31ea3f8,0xb2ec5433,
  34360. 0x103ff824,0x42b0b0e4,0xc480332e,0x19315060,0x00000111 },
  34361. { 0x045452f1,0x9997ea28,0x71f3f73b,0x80b678cf,0x41e9328e,0x4a52bddc,
  34362. 0xe6af1c23,0xb7f2656e,0xb44215e7,0xc43805b9,0xf0a4028b,0x3aa734f2,
  34363. 0x422476e2,0xe3c72479,0x68c60cf7,0x6dc2e8b0,0x000001f1 } },
  34364. /* 18 */
  34365. { { 0xfffc0de5,0xbcdfae6f,0xab4a5f24,0xa801814f,0xea2aa8dd,0x19013658,
  34366. 0xda4f0441,0xf3b1caf5,0x34100611,0xf24b9cdb,0x96e0cf88,0x48c324ed,
  34367. 0x23055c82,0x4b7ea334,0x89092e29,0x6e835b64,0x000001d3 },
  34368. { 0x07372f27,0x7eb77ae7,0x83bae19a,0x4779b4fa,0x65429ebb,0xa175dae1,
  34369. 0xfc03ef3f,0x942ec266,0x6991c7c4,0x0e5fc6a9,0x56253d3c,0xa0f61e4f,
  34370. 0xde74e738,0x7a11ff58,0x624de919,0x60524cd4,0x00000002 } },
  34371. /* 19 */
  34372. { { 0x01342e08,0x45b5d0ca,0xb749f0af,0x509ed4f0,0x6529d804,0xeb5502d9,
  34373. 0x6d80359c,0x5eb087db,0x4c384800,0xeaa66a87,0xc75a8784,0xe972c7a0,
  34374. 0x6874317e,0x8c169e21,0xe5c9fbf4,0x81c556e0,0x0000014f },
  34375. { 0xe120674d,0x26b0b12b,0x219f00ac,0xc6bf09b9,0xd658caa6,0x1e1e732d,
  34376. 0x8292d99e,0xc771c5af,0x25fdbf80,0x5d813529,0x3666c37d,0xe61bd798,
  34377. 0x1d0df680,0x8dac946a,0xc39f0983,0x58dcf684,0x0000009f } },
  34378. /* 20 */
  34379. { { 0x7b7dc837,0x14169102,0xb50eb1c4,0x2d719754,0xd7e6741b,0x04f4092a,
  34380. 0xbc824a38,0x1d0a7f1d,0xc8e20bcf,0x570b2056,0xda181db0,0x6732e3b9,
  34381. 0x0a7b508a,0x7880636e,0xc9f70492,0x11af502c,0x00000045 },
  34382. { 0xc56f4ffa,0x0b820d94,0xc4f0c0fa,0x1c6205a2,0xa1a0606a,0x99f33d4e,
  34383. 0x79b316fb,0x1bab6466,0xe4f240fc,0x05aa0852,0x92d7dc43,0x22539b78,
  34384. 0x06e3c073,0x03657f12,0xcedb6633,0x28405280,0x00000059 } },
  34385. /* 21 */
  34386. { { 0x4397760c,0x90d08711,0x1c9fcd06,0xb9020b76,0x987e24f7,0xc7fec7fa,
  34387. 0x522335a0,0x0e33b8a0,0xae21ca10,0x73dbeafd,0x3b032220,0x458c060a,
  34388. 0xee145da6,0x9b9c73b8,0x27ff62ef,0x31c661e5,0x000000aa },
  34389. { 0x81430b5e,0xaf518eb0,0x50ee0d69,0xb32f9cea,0xaa6ebe8b,0x0ecdb0b5,
  34390. 0x9fe1d689,0x1f15f7f2,0x1a59cc9a,0xce5d68f3,0x08ab2a63,0xf4d67994,
  34391. 0x4347ce54,0xe85b1cef,0x286d0776,0x8ff423c0,0x00000176 } },
  34392. /* 22 */
  34393. { { 0x33dcec23,0x8564104c,0xcdd07519,0xbaf0d61b,0x4c4f309a,0x486daf51,
  34394. 0xde488715,0xf01bc8f5,0xd3539ba3,0xddd6baf1,0x3a3be8ec,0xbb7e665d,
  34395. 0xcb5d865f,0xf919dac3,0xf12149a0,0xfe203da3,0x00000173 },
  34396. { 0x78d4a3d1,0x043ae9a1,0x865316d8,0xa4d5cf58,0x41176463,0xeaf026c0,
  34397. 0xf84afa44,0x316c638f,0xffea422d,0x512f2397,0x6622b613,0x691eaa04,
  34398. 0x97e7068d,0x48856ea3,0xf4a1b33c,0x42d1b2e3,0x000001b5 } },
  34399. /* 23 */
  34400. { { 0x1f487402,0xf51b2d5e,0x7aaf1dd5,0xe36016e6,0x6da9c20a,0x1eb3f1f5,
  34401. 0xece45bfd,0x25b7d361,0x027a9e18,0x42db0633,0xe8411649,0xbf228777,
  34402. 0x458773d0,0xf5fce0c4,0x2dd7a5f0,0xb2b3151d,0x0000001f },
  34403. { 0xfbaa096a,0x102773e8,0xe093a878,0x152726eb,0x2c7f1781,0x5c53cd07,
  34404. 0xab5dca76,0x38d3dfd0,0x87ef2d4a,0xbb4a7d85,0xb7eb11c2,0x5c9c2013,
  34405. 0x0b6da22f,0x5e353c34,0xa325ecad,0x846d50a5,0x00000039 } },
  34406. /* 24 */
  34407. { { 0x1677df58,0x76da7736,0x1cb50d6c,0x364bd567,0x0a080ff2,0x0443c7d7,
  34408. 0x86532430,0xa0a85429,0xc35101e7,0x82002dd2,0x48c5cd76,0xbebc6143,
  34409. 0xca6cf13f,0xff1591ae,0x98bf8dc0,0x91c7c2e6,0x000000fb },
  34410. { 0x12de14d5,0x6a7c5cad,0x6561c822,0xbc448c5f,0x7cdbb3da,0x9f8de430,
  34411. 0xc76811d7,0x9c58f011,0x75462049,0x1e89806e,0xc9a74e49,0xe52ad0a2,
  34412. 0xb2be37c3,0x2034685c,0x0a0bc72d,0x7a863245,0x000000ec } },
  34413. /* 25 */
  34414. { { 0x8a86786e,0x33818c21,0x2137e2c8,0xed537f74,0xa7e6eb20,0x5d9690d1,
  34415. 0x5cdc4803,0x9790ec70,0x24f7bd75,0x469162c8,0x4e1f0f14,0x09e7ef9d,
  34416. 0xce9915ca,0xd30c128b,0x6c71226f,0x810145f6,0x0000002d },
  34417. { 0xb71d87e5,0x312749f5,0x7b02ceda,0x25f3b141,0xe0baff16,0x02456d2e,
  34418. 0xfcae6627,0x97f7b3a9,0x37bd985f,0x0d6ebf8f,0x7fa6d0c1,0x20aa81b9,
  34419. 0x21f2f137,0xb29f1a01,0x5cc0ddb1,0xe326a2f8,0x0000003d } },
  34420. /* 26 */
  34421. { { 0x38c2ee78,0x26f3398b,0xa75a0bee,0x40c3d101,0x565a7f8e,0x35a31706,
  34422. 0x04019e5d,0xd12985e3,0xb8174b6e,0x21e2a642,0xaf80a52a,0x25a15ee8,
  34423. 0x8518d80e,0x5d1e0fe6,0x04f6ea9a,0x8cbbc138,0x00000084 },
  34424. { 0xdfd45169,0x76828690,0x59d3e8d0,0x38d7e098,0xcdb8bfc2,0x23758811,
  34425. 0x162cf648,0x8499547a,0xb4d15b8c,0x494bab3b,0xc60499a6,0x822cbc57,
  34426. 0xa8a1cfed,0xac43224e,0x57c6598b,0x43563469,0x000000d9 } },
  34427. /* 27 */
  34428. { { 0x68271323,0x2b069253,0x49cd04d7,0x24d9e0a8,0x2b31cc7d,0xaae35fbf,
  34429. 0x57a3e361,0x44f64b4f,0x0294e856,0x14904686,0x43ced4ae,0xddc82ee7,
  34430. 0x7e2cda47,0xcb92a6a5,0xbfc1f968,0x989c42ef,0x0000013f },
  34431. { 0xb8651600,0xbed98bdf,0x7a3cfaee,0x8c363434,0x35b1a226,0x93a12543,
  34432. 0xd5825507,0x558da7dd,0x852eb1e9,0xa5173b23,0x2295f545,0xdf5ae585,
  34433. 0x6646d101,0xe546e2ef,0x5d89f862,0xf7e16a2c,0x000001fa } },
  34434. /* 28 */
  34435. { { 0xc7ec136d,0x0d746c8e,0xcd11351b,0xf8e1d827,0xf187a116,0x764a3ad3,
  34436. 0x136e8465,0x2f1b968f,0x850983c2,0xd41aa294,0xbe717259,0x2123ecc4,
  34437. 0x763c149c,0xdcdcab52,0x1022b82d,0xa7f50b18,0x0000016d },
  34438. { 0x0ca5e258,0xf99e532d,0x97b62a7b,0xa148ad17,0xc77fddef,0x8d0a242e,
  34439. 0x74f9b6c4,0x58518bcd,0x7fd122d4,0xc53b30b8,0xfb50b2d7,0xbb8cd193,
  34440. 0xbc01aae9,0x1a169aee,0x1de26e09,0x7e49b10a,0x000001c5 } },
  34441. /* 29 */
  34442. { { 0x21210716,0x2cabe675,0x07e02400,0x81a296a3,0x8c83795b,0x94afc11d,
  34443. 0xdd9efa6a,0x68f20334,0x677d686f,0x5be2f9eb,0xbf5ce275,0x6a13f277,
  34444. 0xb9757c5c,0xf7d92241,0xc74f4b8c,0x70c3d2f4,0x00000132 },
  34445. { 0x8d209aa4,0xf9c8609c,0xdb2b5436,0x46f413a2,0x2992345d,0x96b72d1a,
  34446. 0x9487c34f,0x186f2aeb,0xb440a375,0x4fa72176,0x7da5358e,0x3a420936,
  34447. 0xff25b310,0xf11eade3,0x505d60b8,0x9a570153,0x000001a9 } },
  34448. /* 30 */
  34449. { { 0x6e7495bb,0xae151393,0x490879d1,0xebd2fd28,0x29fd76fc,0x9c232b0b,
  34450. 0xc60e721c,0xa1a0d49b,0x517a09e2,0x9f582b83,0x9d8badf8,0xac37809e,
  34451. 0x0ad48bb4,0x4aa4de9e,0xcb6cc487,0xfd041312,0x00000027 },
  34452. { 0xead4fb6d,0xc05502ee,0x0a602cbe,0x760c25ed,0xbd7f4a07,0x58ba6841,
  34453. 0x54edce14,0xc28b6032,0x0397614c,0xb9d41e39,0x181eed93,0x4221b71d,
  34454. 0x332d4b0b,0xd010e3c2,0xdab0e419,0xdfe58a27,0x00000096 } },
  34455. /* 31 */
  34456. { { 0x7debd24e,0x4cd6fcd6,0x9ae2b075,0xbe3fca60,0xf217c26c,0xa7d8c22e,
  34457. 0xb9620e3f,0xd42d03e0,0xc7f9f87d,0x634bf216,0x8972ffee,0x22b1ec53,
  34458. 0xd60d3e77,0x83a957c1,0x0f6a537e,0xedfe5f86,0x00000162 },
  34459. { 0xf0ea20b8,0x40a05400,0x1d796900,0x2872ac7e,0x0edb0cac,0x7765a5c9,
  34460. 0xb62939a7,0x9df5b930,0xaf2cb708,0xf78a676e,0x52febc12,0x030732bf,
  34461. 0xba190ad3,0x3a6640de,0x93e7e341,0x36eae15f,0x000000d5 } },
  34462. /* 32 */
  34463. { { 0xa1c88f3c,0x6c6119f6,0x2ec6944a,0x924e5fec,0x5742ff2a,0x4c8aac60,
  34464. 0xddb22c7c,0x60adde1e,0xfa5d25bb,0x9728938c,0xec117de0,0xfa5ac4f7,
  34465. 0x482929c1,0x41f35ab7,0x0afd95f5,0xd1c4e8f9,0x00000180 },
  34466. { 0xa7cd8358,0x2fc4e73d,0xf2a1c920,0x39361a57,0xad94d288,0xf6f2f130,
  34467. 0x2b6a78e2,0xe37e2466,0x79c262cd,0x0babff8b,0x61b597b9,0x6cae01ef,
  34468. 0xa60d4e64,0x9c1e33f0,0xdd01f845,0x52a42280,0x0000000e } },
  34469. /* 33 */
  34470. { { 0x0f013755,0x72d640a4,0xfb8380e9,0x0b6dce77,0x7eb64b31,0x2789ce79,
  34471. 0x93ca5a36,0x8e704b0b,0x58bdffc9,0x18c360ff,0xb230c372,0x53b1f323,
  34472. 0x5a7385d1,0xd6b39088,0x56b93bf7,0x071130f5,0x0000004a },
  34473. { 0xfeef3f88,0x29a2096b,0xb82b3945,0x22eba869,0x872664a7,0x7fe2184a,
  34474. 0x858ff942,0xa0dc0ba1,0x7490c9da,0x33799eb5,0x81588ce8,0x1d356f62,
  34475. 0xa7b2cee2,0x7dd9bc7f,0xa3cfaee9,0x1e61a4e8,0x000000d2 } },
  34476. /* 34 */
  34477. { { 0xe9068656,0xec5db629,0x9fede4df,0x623bd70c,0xfcd45546,0xc78ad5bd,
  34478. 0x6291a741,0xf7981dd2,0x761e688e,0x3ac53d92,0x55b9272f,0x6a96892a,
  34479. 0x06546fec,0x4217e7b8,0xab9e2f56,0x793c03cb,0x0000015e },
  34480. { 0x6eff39be,0x08fd9543,0xdbff4f68,0x5a1af07e,0xb0241616,0x83d47abd,
  34481. 0xd4798029,0x37c5d2fd,0x60b2e6fb,0x9d86d978,0xce8db998,0xe3e3284e,
  34482. 0xd868b9bb,0x9f049eb5,0x9dad18b3,0x3b3e8a78,0x0000018e } },
  34483. /* 35 */
  34484. { { 0xe51e61f0,0x57026c56,0x307f2757,0xdddbcaa3,0xb1aeaf41,0x92a026eb,
  34485. 0xe2d7f5ba,0xa33e937c,0xbc5ead91,0x1f7cc01e,0x2e46807d,0x90ab665d,
  34486. 0x53419519,0xc2a44f55,0x79664049,0x099c1ca6,0x000000aa },
  34487. { 0x8f97e387,0xb561a909,0x45e1dd69,0xf6051778,0x7ff1d6ab,0x1ffa512b,
  34488. 0xd09a9c89,0x42da55a4,0xd2282e2b,0x5e5a7c71,0xe74185ad,0xdfa5a203,
  34489. 0xea0baeff,0x19b1369d,0x1ecc0a16,0xa5eef914,0x000001a3 } },
  34490. /* 36 */
  34491. { { 0x7a573b81,0x2af20d0a,0x66194cef,0x7eac1ca8,0x0b711c34,0xef0d2d8d,
  34492. 0xba099d42,0x6aea016c,0x5067a8ca,0xa6609d28,0x7a1351ef,0x6a52c600,
  34493. 0xb11c2634,0xdab85818,0xbb1c033c,0xf17fa45d,0x00000121 },
  34494. { 0xfc3279d6,0x9fb8b87a,0xc201f1e1,0xe30e76ab,0x806c21dd,0x02af6a83,
  34495. 0xc63f824f,0xeafd7e2b,0x46bd1a53,0x7b074e26,0xa2139164,0xcd6f4931,
  34496. 0xc172d9bf,0xab2cfd39,0x4db59cf1,0x62f3eb4b,0x0000010a } },
  34497. /* 37 */
  34498. { { 0xe0689a1b,0xe402de36,0x7dcafe72,0x9dccc9fd,0x255d0bfb,0xe4dead7e,
  34499. 0x4ada04d9,0xd7ee87ee,0xbfd2e774,0x5a85039e,0x770b2b9b,0x282c6657,
  34500. 0xba103bba,0xa7aca826,0xc7cd5071,0xac7028ba,0x0000011a },
  34501. { 0x680c8f04,0x2e61d39c,0xb48b3b5e,0x2f09c4cc,0x95744f3c,0x131609bd,
  34502. 0xaaccb593,0x6d72e4b4,0x5adfb209,0xdb7060ca,0x1fd3eccf,0xc67d9e43,
  34503. 0xe1752a73,0x1487a26f,0x64d0857c,0x3d953663,0x000001e3 } },
  34504. /* 38 */
  34505. { { 0x4cec9e7f,0xe664506b,0x30aab98f,0xa44564b4,0x173fa284,0x5e1b501f,
  34506. 0x15c97472,0xe7b7bd7e,0x82dec033,0xd6cc67a8,0x0a63b762,0x1fe2e934,
  34507. 0x3f8e2fcd,0x3a084e1b,0x9ae6e752,0xccce4da8,0x000000fd },
  34508. { 0xc12fd820,0x0797f8ee,0x96da4733,0x325f892a,0x55997bf4,0x597d241d,
  34509. 0x02b753cf,0x3aef35ac,0xf677ceba,0x8a73f95d,0xd1bbac6c,0x5b2892b7,
  34510. 0xcc5278b0,0x90751583,0xa47f45f6,0x2f5ed53f,0x0000001c } },
  34511. /* 39 */
  34512. { { 0xab40b79c,0x3914165e,0x25b489a8,0xbfb6eed8,0x8a6c107f,0xda136b7d,
  34513. 0x8e01f28b,0xd431db8b,0xa4d79907,0x84e5d0dd,0xa471e685,0x69a91472,
  34514. 0x98376ff8,0x58d06969,0xc46311fd,0xce369b74,0x00000006 },
  34515. { 0x1add1452,0x6c0773d1,0xed8e9a2a,0x2e4e9c95,0xca15a40c,0xe8ff8e32,
  34516. 0xaf62f18f,0x3fcb7d36,0xeec9484b,0x2ca336ee,0x3b20405b,0xa4d6e7a9,
  34517. 0x956d8352,0x6d90d031,0xd9ca03e7,0xdd375603,0x000000e5 } },
  34518. /* 40 */
  34519. { { 0x8b481bf7,0xcc5f297d,0x2a13383c,0x06a2a3e4,0xdc40b96c,0x9e14528c,
  34520. 0x1189da3c,0x9a2bf35f,0x6cd57fa7,0xb8adb989,0x9357d32b,0xc1a4935c,
  34521. 0xc2d76fad,0x51fb2580,0x24f23de1,0x98721eb4,0x000001ba },
  34522. { 0x52a4b397,0x8c02daaf,0x0d0b4e54,0xc3c5f4cc,0x7b7e79cd,0x29be4db3,
  34523. 0xb33970b6,0xf34336ec,0x92808c7f,0xed3dcb7c,0x02288db1,0xec290eff,
  34524. 0xe96ed59a,0x2a479d51,0x76d8fa5f,0x9d7ed870,0x00000092 } },
  34525. /* 41 */
  34526. { { 0xe660043c,0xd8edaf0b,0x016e074d,0x84aa2ccb,0xe2cc3b3d,0x9d2368e7,
  34527. 0x5c269fc4,0x47b50130,0x3de33e36,0xd0194ee1,0x789ca504,0xdb3361b9,
  34528. 0x984db11d,0x8cd51833,0xc8ec92f0,0xd5b801ec,0x000000c6 },
  34529. { 0x47ab9887,0x33f91c15,0x6b5ab011,0x2f285e2a,0x133fc818,0x9b734e5a,
  34530. 0x38d8692c,0x5c435a74,0x43282e81,0x3c92b47c,0x9c7bcdaa,0x191231f5,
  34531. 0x4d158c86,0x3ae425c3,0xc5a23cca,0x7f568feb,0x00000011 } },
  34532. /* 42 */
  34533. { { 0xbf5caa87,0x8ccbd9d5,0x68dd8c9d,0x17bfc60f,0xc7d4dede,0x63eb4dbb,
  34534. 0x8270b5bf,0xbf6e5945,0xcc098fe7,0x887137a5,0x05d7b8f5,0xca5eb687,
  34535. 0x4b25a533,0x4b7deeee,0x4a700a6c,0x8e045c32,0x000000ef },
  34536. { 0x70cf52bc,0x160c1c92,0x90cc6298,0x4bf3f63a,0xbf3028fb,0x5fff421c,
  34537. 0x523beff1,0x0a8102d7,0x8b9ce105,0xff3309a3,0x06621b1e,0x8e9da4d0,
  34538. 0xcc0a7807,0x9775f89f,0x00178612,0x59044865,0x000000eb } },
  34539. /* 43 */
  34540. { { 0xebbd33ec,0x8a6664fd,0xce5ad579,0x0cf9a660,0x50fb56ed,0xecd06c05,
  34541. 0x1d5aaa6e,0xb4ca5fad,0x948a7f07,0x36daee5b,0xefe1c11a,0xd2e37887,
  34542. 0x91d2544b,0x41f61ac4,0x2bffd8ea,0x49df7071,0x000000be },
  34543. { 0x65acdb56,0x60e2f1f5,0x5e5e5bde,0xf2f13c84,0xe17a0412,0xb97fd354,
  34544. 0xd9c93bef,0x8a2867cf,0x25a957e4,0x9ca9d16b,0x4a18635f,0x1f55c19b,
  34545. 0x8d26ae71,0x9b3868f5,0x4c94541d,0xac448041,0x00000000 } },
  34546. /* 44 */
  34547. { { 0xd4ad38db,0x6c1bcf89,0x3d714511,0x1180f381,0xcb70243a,0x5b4c2759,
  34548. 0x163a716c,0x5dd64d63,0x13648bdb,0xbbd2efea,0xe4de9969,0xa47187f9,
  34549. 0xe2de8c45,0x65de6912,0x4bdad0a7,0xe075f29c,0x00000048 },
  34550. { 0x5e4dd88d,0x00335474,0x80577afc,0x18283638,0x227288f7,0xe4b35c01,
  34551. 0xe68989de,0xd008fd91,0xcd3f71ba,0x42142315,0x3e4da1e2,0x5cb023ff,
  34552. 0xb5662bb1,0x7e6b9c35,0x7fb04fe5,0x143f4165,0x00000072 } },
  34553. /* 45 */
  34554. { { 0x26f40f2c,0xb06b046c,0x6cd7c31d,0xbd5d246c,0x1953a9b7,0xaaa56270,
  34555. 0x8f00436f,0x5ac929b8,0x21d0660d,0x1937392c,0x9bd6dbe6,0xd279ed15,
  34556. 0xd17c43f9,0x377c4d5a,0xb8fcd025,0x800eda50,0x00000179 },
  34557. { 0x36132f31,0xb88ddc0b,0x2ade73a3,0x6f8f4f01,0x203de2b9,0x38859ec3,
  34558. 0x231b6533,0xedb03814,0xa14093ca,0xad08cd20,0x5c2be2f9,0xb9f86d44,
  34559. 0xf6ebc09f,0xfd3d9532,0x1aef478d,0x757b5899,0x0000013d } },
  34560. /* 46 */
  34561. { { 0x580f894b,0x7d9ad100,0xd925e46f,0xb612488a,0x2e5a6865,0x45497e14,
  34562. 0x17f9a813,0xc86e1053,0xf8a33541,0xd8aa820a,0x7a66d578,0xa6790660,
  34563. 0x5f758e23,0x47df60ae,0xa7f8ab5c,0xcadd4c90,0x00000107 },
  34564. { 0x6764ad0e,0x356b044f,0x250189b3,0xf69fe0e1,0x5f14db6a,0x2deaca62,
  34565. 0x1bd77d54,0xe9f2779f,0x5cfa895c,0x979911f2,0xb6f19ac3,0xd4e94ced,
  34566. 0x01af44b1,0xc3533417,0x50c727f5,0xcac43fff,0x0000003b } },
  34567. /* 47 */
  34568. { { 0x83c1d4cf,0x1742951c,0xb245c34f,0xe03791d0,0x9c2dcc71,0xea8f8ef6,
  34569. 0x2a310767,0x2ea57a29,0xb12948bd,0x255b46bb,0x0feaeb83,0x2adc1e09,
  34570. 0x449abf59,0xa0d2d18c,0xc4a8a689,0x9e8c9ff5,0x00000019 },
  34571. { 0xeb28171a,0xc9f7b9cd,0xd576987b,0xefd78403,0x22ff824c,0x58b4f3bf,
  34572. 0xbf333cc5,0xee09b393,0xb01ceb72,0xebff83a2,0x220299cd,0x5bb34c45,
  34573. 0x66ebf751,0xa3c3e8a0,0x49d05cf3,0x5dee07bb,0x000001a6 } },
  34574. /* 48 */
  34575. { { 0xb114257b,0x09a958d6,0xd4975e30,0x729afd41,0x3aae7b11,0x072879b5,
  34576. 0xedd1ac83,0x0791b093,0x1eb67975,0xcfefc7d1,0xe2675b4a,0x0e54bd37,
  34577. 0x8d69517f,0x89a62d7e,0x202109a3,0x96f805d8,0x0000006b },
  34578. { 0x57b5f9f4,0x4815d517,0x405b44d1,0xe5c9e436,0xe4870160,0x3442dde0,
  34579. 0x1ef6b3f8,0x953fef95,0xf7497faf,0x919e4cf5,0x016ef0b7,0x24e3cc4d,
  34580. 0x2512eeed,0xfc5caa87,0xa3bd1703,0xf1ba4029,0x000001b6 } },
  34581. /* 49 */
  34582. { { 0x529252ac,0x2a668435,0x74e7b0d8,0x3da626c0,0xe0be86ab,0x55080cc1,
  34583. 0x4ed5dc53,0x534a53f7,0x0cd41fd0,0xa9eff140,0x5674891c,0x0e7c945c,
  34584. 0xec53b5ad,0xdea4b895,0x15150988,0xefc67bef,0x000001ff },
  34585. { 0x306033fd,0x988dc109,0xf36875d9,0x1b287979,0xe3c335c5,0x4d39af26,
  34586. 0x124e29d6,0xa47259fd,0xc41dbdfc,0x5d60c570,0x0cc0d895,0x06224b61,
  34587. 0xeea8ff86,0xa041d4e5,0xae4d8707,0x2920e15c,0x000001fd } },
  34588. /* 50 */
  34589. { { 0xcd67da85,0x66d15f0c,0x5ac54a15,0xae98b6f4,0xf1ac71c3,0x2f05e021,
  34590. 0x47559224,0x1feb2226,0x66e856dc,0x2a2f1561,0x6fb4ba47,0x65eb1456,
  34591. 0xa29d920b,0x34688bd2,0xf9d4cb9b,0x943ce86e,0x00000061 },
  34592. { 0xaac91174,0xb4696218,0x41dd9234,0x85b519ec,0x9f0763a4,0xb7efadf2,
  34593. 0x712c8b33,0x98517f27,0xb0538630,0xa02e7ec3,0x1ff3e3e4,0x46bc45bb,
  34594. 0x29496486,0x46ae896f,0xebd2b93f,0x2aeb1649,0x00000146 } },
  34595. /* 51 */
  34596. { { 0xe8e4d3c3,0x1f34f41f,0x5bb7e9db,0xc80d87ff,0xd910b579,0xf0216c0a,
  34597. 0xb87349ae,0x2a24b761,0x2b0a6cc0,0x054bc528,0xaf2d1957,0x3b4c7029,
  34598. 0xadbe6cdd,0x0e4b90e2,0x26060a34,0x8e774f81,0x000000cf },
  34599. { 0x2e229950,0x3c7f9dbc,0xd9f82b70,0xab11f846,0xf10c05f3,0x2b7ad9a3,
  34600. 0x0f1820ca,0x203ead4f,0xccbfb332,0x51dbcbc8,0x066706f1,0x3bd9caf0,
  34601. 0x06059d5e,0x5a39be25,0xdcafe64e,0x984387c8,0x0000014c } },
  34602. /* 52 */
  34603. { { 0x8e011531,0x708a757f,0xc3dcd57c,0x7f45b172,0xc2d99e29,0xa8eac9fd,
  34604. 0xb93b6415,0x9d4ee81f,0xa5488e86,0xa5833b54,0x0bb7ab70,0xddd561c3,
  34605. 0xb3bdf3a9,0xb5bda384,0x1ddf332b,0xf909f8e0,0x00000124 },
  34606. { 0xab41e782,0xc5b8aa84,0x851ddb87,0x1de20126,0x99482bd2,0xf49baa7d,
  34607. 0xf4b6413b,0x05963deb,0x7cd1e224,0xed369fbb,0x1bad60ee,0xdcf495dd,
  34608. 0x892e30ed,0xeb475693,0xaf0a212d,0xaaf11bd8,0x0000010b } },
  34609. /* 53 */
  34610. { { 0x16ec64e2,0x71460174,0x7d7c6ebe,0xbfd14acf,0x668b7176,0x1e3504a3,
  34611. 0x741b041c,0x72e3f3f3,0x2d3b67b0,0x651fa54a,0xe57d928d,0x623edca3,
  34612. 0x72c8f419,0x29b74e8b,0x327abaef,0x3d99cb47,0x00000038 },
  34613. { 0xda342a3f,0x808dd0b3,0xdef4a954,0x12002462,0xeab5a860,0x1b1c642e,
  34614. 0x06e54b6d,0x5e1e2a05,0x10c6cf1a,0x9ba1710f,0x0f903cd0,0x334fc366,
  34615. 0x134166f5,0x969e0001,0x155c4353,0xfaa26074,0x000000fa } },
  34616. /* 54 */
  34617. { { 0x712de285,0xc85cd0e6,0x869f5dc5,0xcd2ff8b0,0xdf4ed389,0x372a2b92,
  34618. 0x55b99c84,0x63524d30,0xe07a0033,0x46fef5a2,0xd6e09493,0x0a2c82da,
  34619. 0x72a8952b,0xb3626621,0xaf217eb6,0x9afcb188,0x0000002c },
  34620. { 0x9a64c5b5,0xd3b9d476,0x44c4cfe1,0xa0d8d5de,0x11c6dbff,0x560858ef,
  34621. 0x41c14aed,0xce1d978f,0x35efe854,0x251f9e72,0x0474575d,0xf9d0c14c,
  34622. 0xbda89c03,0x0d2c838e,0x36cc9dc0,0xa25f040b,0x0000016f } },
  34623. /* 55 */
  34624. { { 0x9cad682d,0xb23d9dea,0x46369391,0x87acb1b3,0x5c0f24d7,0x9f5c1988,
  34625. 0xd41883ce,0xdff62fc7,0x53555e46,0xd1ab29df,0x891cda05,0x569b1cb2,
  34626. 0x52c633ed,0xdb14dbc4,0x2a345428,0x1acbb86c,0x00000194 },
  34627. { 0x24db8127,0xd86a70c8,0x41b7cf5b,0x84a6563f,0xb908d9b4,0x8d84dabe,
  34628. 0x899c260a,0xaaeaae63,0x44436957,0x13ed6b2b,0xd0a92c8d,0x3bc94f99,
  34629. 0xd04bcb97,0x978f2e2b,0x716a565f,0x56a388ef,0x00000074 } },
  34630. /* 56 */
  34631. { { 0x96fc1f77,0x6082dfe4,0x1347ad6a,0xb04c435f,0x25ebe457,0xf42694dc,
  34632. 0xb6f764aa,0x64a17069,0x04d83da1,0xe03873d5,0xe0c82330,0xb0b9db52,
  34633. 0xd4239b3e,0x9886b34e,0x598814da,0x76587f2a,0x0000016a },
  34634. { 0xebc71a5d,0x6918f8e8,0x85405233,0x49141a42,0xc182cbcc,0xd63f09cc,
  34635. 0xe09057a7,0x4afe59d3,0xe239d8eb,0xe633db0d,0xfd9494b2,0xbac8582d,
  34636. 0x4704fd61,0x8b915a41,0xfceaefd9,0xe0866a9d,0x0000010e } },
  34637. /* 57 */
  34638. { { 0x52e07a4d,0x2b50c470,0xe5d745d0,0x7f6d38b8,0xe1af1226,0xb414c47c,
  34639. 0x39c505f7,0x03e4b44b,0x86f739be,0x59f3d795,0xe7c2f1bc,0xca19bca7,
  34640. 0xc063fad4,0x1c51c01e,0x7f428afb,0xda3937a5,0x00000080 },
  34641. { 0x102369fa,0xe9d8ca9d,0x706c0e35,0xe009bffb,0x96b55d80,0x2e0a19a7,
  34642. 0xac0d094c,0xda0e42de,0x787c187a,0x6c1be2c5,0x9cfa04b6,0x6d4ae2cc,
  34643. 0x76577340,0x5b0cea60,0xc7c96285,0x2d525245,0x000000d8 } },
  34644. /* 58 */
  34645. { { 0xae93de69,0x6dcb238c,0x3bfdae9b,0x4963c833,0xe8b79836,0x33c81f4d,
  34646. 0xae8bf8ae,0xe13a2244,0x4c3ebacc,0x0bc6e786,0x555a5ad6,0xa837a53c,
  34647. 0xbc7e9459,0x875d8d35,0xf9f46fcd,0xb3705534,0x0000001f },
  34648. { 0x7fb974a1,0x78e9270c,0xe9ed2481,0x23448fa0,0x64bffbd4,0x14166c3d,
  34649. 0xd79f4b3c,0xa05aa443,0x3b9f32a0,0xd855a4f1,0xac90235e,0x4bebcf8d,
  34650. 0x8db52b48,0x65849987,0xe48d09d1,0xaa4d59f1,0x00000183 } },
  34651. /* 59 */
  34652. { { 0xdbffad9f,0xee585d75,0xf419d8fc,0x64df6174,0xe6c69345,0x6f73bf59,
  34653. 0x83d59b0c,0xb80793d1,0x929c8950,0x6baf4fc3,0x29962bab,0xbd445a95,
  34654. 0xeaa91273,0x52b61945,0x3d1c785b,0x4fccdfff,0x000001be },
  34655. { 0x7cb2857f,0x05c384d9,0x06b7abf4,0x4cf83058,0x43ace6b2,0xf528dd17,
  34656. 0xbc43d6b6,0x2c7b8fa2,0x14e564b9,0x8f0e28bf,0xd2b9f01a,0x1b69bc73,
  34657. 0x3dd383e6,0xab8beb40,0x9791946b,0xaccea0c5,0x000000ae } },
  34658. /* 60 */
  34659. { { 0x0163c2de,0x9a68baee,0xeb2768a4,0xc42d0b2b,0xffdae767,0x5686f124,
  34660. 0x0aaca943,0x926da5d5,0xe01091cf,0x699c34ce,0x5324becd,0x3d254540,
  34661. 0x4193a0a9,0x1b6b58f1,0xd611cc9d,0xf144925e,0x0000014f },
  34662. { 0xc1ed9259,0x7f61a60c,0x2f1d5a7f,0x1be37aa3,0x07aef431,0x0384713d,
  34663. 0x4e6fa7ba,0x99f33d49,0x8bd3730c,0x43928c16,0x5b9557dc,0x73cf8ccf,
  34664. 0xd1a2bee5,0x0bc6d460,0x83b15610,0x27cd1943,0x00000145 } },
  34665. /* 61 */
  34666. { { 0x3427af4e,0x4be65135,0x310d937d,0x2e6c0bb1,0xcaa671c3,0xbd8ea76a,
  34667. 0xd3a9c376,0x9d7b3fd4,0x471709aa,0x124ce863,0x018051c0,0x225ce41d,
  34668. 0xf9e8ee1c,0x5489284f,0x535c4ec8,0x22d829c9,0x0000013d },
  34669. { 0xa1b15e02,0x6b01ed9d,0x301e5868,0x1d092bac,0x5764135b,0xbfa7a183,
  34670. 0x6f7159a4,0xc0ee59b7,0x18090d0d,0x9171a051,0xb8052196,0x5c1531bb,
  34671. 0x20927904,0x740930fc,0x76337685,0x963b48cc,0x00000008 } },
  34672. /* 62 */
  34673. { { 0xf4aaaed5,0x0fe8b620,0xfe871ee8,0x1068de7d,0xfebfcb4b,0x2b22030f,
  34674. 0xc3a2155b,0xd4dfbee7,0x2769b805,0xa7a26a8c,0x6d39eaf0,0x377de770,
  34675. 0xf615f032,0xf1a92447,0x42d9b731,0xa1b81a84,0x0000012a },
  34676. { 0xb1152e8f,0x299e67d0,0x92b5e14c,0x2e773d97,0xf1cb57a2,0xe0d81073,
  34677. 0xbf1da4a2,0x03af0a9c,0xc22b449a,0x169b160e,0xdd2d7d1d,0xb82c1ac8,
  34678. 0xbfc98ee4,0x7508aca6,0xe3cbea15,0x54992440,0x00000150 } },
  34679. /* 63 */
  34680. { { 0xa13a4602,0x70004a0a,0xd0d2c60e,0x505c71a3,0xa6d79bc5,0xa4fe2463,
  34681. 0xd54d9df4,0xe878eb3a,0x73d3c7b8,0x7ecca907,0x244ecfa5,0x5b3bb278,
  34682. 0xb124d179,0x8a30f61f,0x4f632af0,0x5b7e5001,0x00000115 },
  34683. { 0x9ef0021a,0x62c42ecc,0xf856c9d4,0x58017fd7,0x2e6478bc,0x10e243b8,
  34684. 0x1505a4db,0xaf074669,0x4cd7eea5,0xd9bb0a1c,0xd52aed0a,0xe8ba39a2,
  34685. 0xb549f09d,0x0747449a,0x9e57fa64,0xd5c8f7bd,0x0000013f } },
  34686. /* 64 */
  34687. { { 0x5a53c22b,0x1bd8ce7b,0x7cab446a,0x78733fcd,0x48acb394,0xc44ca4e2,
  34688. 0xa38c790f,0xa9888b1e,0x15c34237,0x36afb6eb,0xfb702063,0xb913b8a8,
  34689. 0x917508fa,0x34b77cc5,0xf9e4732b,0xa931d7a7,0x00000050 },
  34690. { 0x56d21d18,0xa90a4290,0x55b410a1,0x82666307,0x894a6b05,0xb4684a8b,
  34691. 0x828cf75c,0x8a1ade63,0x127702a3,0x4fb2f85a,0xadf7b709,0x83ff7d05,
  34692. 0xa68d1db6,0x1d3f5a92,0xc093cd5c,0x243ce1db,0x000000f5 } },
  34693. /* 65 */
  34694. { { 0xd37d7891,0x8fc183c3,0xfd865eca,0x17b50149,0x8f218441,0x0f6e43d6,
  34695. 0x5a07f658,0xaf51ec25,0xad303202,0x8fe5a6cb,0x10676ef5,0x95de68f3,
  34696. 0xca4e000c,0x7508e31f,0x77735254,0x783e5a95,0x00000159 },
  34697. { 0x2e537ad9,0xbc1db571,0x35be9cf7,0x5e87112d,0xd57f9bcb,0xbb522b48,
  34698. 0xa8b3cbc7,0x1eff7890,0xe5ecdb5c,0x4f306e11,0x3387e7ed,0x30da8392,
  34699. 0x72321e3d,0x4d91fcf4,0xe412a67c,0x8487bb62,0x0000009f } },
  34700. /* 66 */
  34701. { { 0x8cb8e08e,0x86f5f80f,0x2496fed6,0x7cfd2c41,0x60b7dcdf,0x0061b743,
  34702. 0x57f4d05f,0x4dbaffdf,0x458061f2,0xb1993c2a,0x9de994c4,0x6c6ca8d0,
  34703. 0x2747e062,0xef70d24d,0xb9995cbc,0xd4e5d4e3,0x000000ff },
  34704. { 0xc6f40077,0x3171e245,0x0723e506,0x1592e045,0x6a6bfd88,0x35c86f7e,
  34705. 0x6d9d9ce0,0xba0959d1,0x3eb5770c,0x2e7f8fe8,0xc40d63dd,0x58eb0881,
  34706. 0xeb9e4419,0x56333bda,0x3afd1f4d,0xfb0397df,0x00000034 } },
  34707. /* 67 */
  34708. { { 0xb358815c,0x7b84e05e,0xe41087d9,0x3abcb2d4,0x07f05d7a,0x87a75889,
  34709. 0x7a9d481c,0x350778d5,0x42d64cbd,0x9d34cff8,0xccf289fe,0x0859cd5a,
  34710. 0xdd2b2c6e,0x8372d591,0x18b40b62,0xc06d482e,0x0000006b },
  34711. { 0xda4ed375,0xd10695a0,0x298daaea,0x51baf588,0xf4b7092c,0xb028a1b4,
  34712. 0x7a335b35,0x8ab87dae,0x0567efd8,0xa7359362,0x3320c374,0x7a49fc10,
  34713. 0xa3558b30,0x737acac4,0x4c0fce9b,0xd30696a3,0x0000001e } },
  34714. /* 68 */
  34715. { { 0xbd3902fe,0xd9550ab0,0x86a9d3b3,0x9bba4b4b,0x975cac37,0x3a59e0a9,
  34716. 0x333605dc,0x045e8731,0x1afc2c58,0xf2c598c2,0xeef9cbf1,0x81ff8d6f,
  34717. 0x9bf83c42,0x82bed5d0,0x528131d5,0x9d1d9d5b,0x00000157 },
  34718. { 0x5519258e,0x687da305,0x027de2a8,0x73f539f9,0xd6a230d6,0x69fa9747,
  34719. 0x5f5d1684,0xab1aeb23,0x5f7e41f5,0x5bbfe947,0x16a7feb3,0xbd546abb,
  34720. 0xe16d5187,0x2afbd4e8,0xbcc953dd,0x7437be13,0x00000160 } },
  34721. /* 69 */
  34722. { { 0xee9755a3,0x55f165a9,0xb82c9ab1,0x0c8d5a1a,0xab6b97e6,0x65a1e45a,
  34723. 0xab05e271,0x3004cdb0,0x6db0830f,0x9e0c3b52,0x75acbdeb,0xaae1ec1a,
  34724. 0x761e8498,0x413d4484,0xb1b9c62e,0x589e09bb,0x000001e9 },
  34725. { 0x9c72258d,0x67512081,0x5c1593d4,0x61dcd734,0x91c11fdb,0x6c627a7b,
  34726. 0x8857908e,0xd1d3e9bf,0x530bc68e,0x9aac06fe,0x6b5b44ff,0x125c16bb,
  34727. 0xdb90edd5,0x38860bb6,0xfbbedb5c,0x96fe8b08,0x000001aa } },
  34728. /* 70 */
  34729. { { 0xf257c0f8,0x323a5dd8,0xdd3a10d9,0x4884dc92,0xbbb8ce03,0x03f379ce,
  34730. 0xa47262a9,0x6217ad53,0x52e06c6d,0xa1df2017,0xc32428cd,0xf5b723e0,
  34731. 0x2c30c62c,0x1e5d3889,0x477f82cc,0xd9a90f1f,0x000001fd },
  34732. { 0x1763ab59,0x830d27ba,0x723783e9,0xcf27d93e,0x945968aa,0x81558264,
  34733. 0x1700d5d5,0x63251a32,0x03146d9f,0xcf6bbe73,0xe65bf0f2,0x6cdcf455,
  34734. 0x632323fb,0x80aa00ce,0xd96a4744,0x6e49e62c,0x00000149 } },
  34735. /* 71 */
  34736. { { 0x40574c09,0xbeff0b7e,0x3fe80e96,0xb76f2643,0xeb237d91,0x0b3bd352,
  34737. 0x7edc3102,0x3c0c62b7,0x424a36dc,0xf989394b,0x7c6c435e,0xe9ea64c2,
  34738. 0xe388d076,0x2dfc21c4,0xa4e69e4b,0xcc3852f6,0x00000139 },
  34739. { 0xbb096b91,0x5238a3ff,0x73d8d43e,0xee72c9e5,0x8c577558,0xc116db11,
  34740. 0xdc47d4b4,0x54ec89d2,0x42e1955f,0x2006dd35,0x7437475c,0x004aed6a,
  34741. 0x2bee9041,0xc1ddc32a,0xed9332c9,0x597417a2,0x000001fb } },
  34742. /* 72 */
  34743. { { 0x859bae66,0x3c0f1981,0x845d7c1b,0xab48e9b1,0x452a3c1e,0xc6ce9c03,
  34744. 0xff810339,0x2384a00c,0x5f98d6fe,0xcd7ede11,0x38a0dd5b,0xf7a00e3d,
  34745. 0x3c7e1c06,0x56dd948a,0x8e53a61f,0x9d21a7d1,0x000000d0 },
  34746. { 0x880eb3fb,0xf9cfdbaf,0x5e83f7c9,0x64cfd297,0xa28a74b4,0x61ba7d6f,
  34747. 0xdfb13e03,0xb8200d5f,0x232a6128,0x03bc8f4b,0x81a8d86e,0xd1fb92c2,
  34748. 0x706d6ea7,0x68675fae,0xefab18c2,0x9b08608a,0x0000011d } },
  34749. /* 73 */
  34750. { { 0xbbd2f539,0x17cf6146,0x76e26ba2,0x96052fc0,0xd4be4a67,0x36821d18,
  34751. 0x9f3f39a8,0x8f823422,0x433f873a,0x68b846b9,0x716f4568,0x7a1d3f36,
  34752. 0x2fd47750,0xdf603e28,0x6975e226,0x77cb02c5,0x00000003 },
  34753. { 0x8c01dd59,0xf275add3,0xb9c1a37a,0x9c213a9e,0x4dfc5403,0x690ad104,
  34754. 0x07ee0d86,0x202ee206,0x661fc40e,0x896ede95,0xd0b02f56,0x6b4d7398,
  34755. 0xe5af1a24,0xccb96991,0xc13f7125,0xd5c281af,0x0000009f } },
  34756. /* 74 */
  34757. { { 0xd7073a5a,0xc858c54b,0x861eac7d,0x87c81a5c,0xe720201a,0x51f84a39,
  34758. 0x40e003ce,0x952a9f8e,0x58f199de,0x76bdc4ab,0xd56cc02b,0x1cf12322,
  34759. 0x83f162f3,0xb6634e63,0x8f969e11,0x84c017ee,0x00000169 },
  34760. { 0x5c89f1fa,0xf1f43362,0xb697b078,0x4a02a630,0x4b05b7f4,0x33311e5c,
  34761. 0x4fede4cc,0xa7ccae51,0x4b025aa4,0x0d26e874,0xf84db7ad,0x7d5b77bb,
  34762. 0xf571c1fe,0x39ef1aa8,0x418ccd20,0x65eba928,0x0000018d } },
  34763. /* 75 */
  34764. { { 0x8abb2537,0xa37866ab,0x65b3096f,0x14ac4cbb,0x2a428ad3,0x827fa7ed,
  34765. 0x10e9e196,0x95d19f62,0x89801b4e,0x31eb97a0,0xaae8b823,0xaae77a62,
  34766. 0x5f5c9642,0x9693d62a,0x3e368b84,0xff5bfe97,0x000000ad },
  34767. { 0x492b0dee,0xa3efae21,0x9602c2ce,0x2143e9ee,0x6f3b99e5,0x21367c99,
  34768. 0xe93b8f59,0xdd78b2b0,0x1064c13e,0x8d541c38,0xf5738e7a,0xe6b970da,
  34769. 0x8373b1a4,0xaf6ecc16,0x74ae208f,0xdbfa3f4f,0x00000180 } },
  34770. /* 76 */
  34771. { { 0x907a6aa0,0xb024621a,0x407879f6,0xef56cb68,0x8168a934,0x44c38b68,
  34772. 0x9b9a9048,0x70d638d3,0x82541f20,0x6968caa0,0x1fc88b50,0x0c597053,
  34773. 0xaf635784,0x5564ded5,0xc4d494cf,0xe7e898c7,0x00000097 },
  34774. { 0x6b6ebb2f,0xe1dc98d9,0x7aa9e126,0x292a17fc,0xfa2a2c68,0xb60f0fdb,
  34775. 0xb2e1851b,0x9c63270c,0x81ca4cfe,0x898db265,0xb11959d5,0x94082638,
  34776. 0xa54b8d19,0xe44f308e,0x44e63094,0x96399eb8,0x000000d6 } },
  34777. /* 77 */
  34778. { { 0xb83769ee,0xfa00f362,0x3efc4cb3,0x72d040ac,0x57abd687,0xc3933889,
  34779. 0x940a7128,0x62264425,0xec242a31,0x909c4c8f,0x65a1a551,0xd1e48f1e,
  34780. 0x049c2172,0x68bd70f1,0x709b7fd4,0xc8692d2b,0x00000041 },
  34781. { 0xdf816784,0x4e388aa1,0x01be75ce,0x4a58c8a5,0x02a67812,0x9b49dffb,
  34782. 0xeda721e0,0xa73299e0,0xe67a65ec,0x8a0bd1f5,0x856c71b6,0xd81e91e8,
  34783. 0xc005aa30,0x37aee2f4,0x0595bbf2,0xd9400750,0x00000073 } },
  34784. /* 78 */
  34785. { { 0x010c0ef3,0xa912ac4a,0x4e81b1a0,0x0e654bd8,0x4f353509,0x8f0563dc,
  34786. 0xb47d189a,0x10dc41f3,0xf238c09c,0x122edd06,0xc41acf67,0x224c16af,
  34787. 0x83758520,0x1ccb9334,0x2275ae6f,0x1a4b5f29,0x00000127 },
  34788. { 0x3ce688b5,0x792fd473,0xdca9c68b,0x14566d37,0x541711d0,0xfce9326e,
  34789. 0x3cc341a8,0xe3ba14ee,0x2122c11f,0x6b8ab4cc,0xf5d379b5,0xc0fa763b,
  34790. 0xf1522f91,0x95e2d2ae,0x31cf95a5,0xd4e21b3d,0x000000ac } },
  34791. /* 79 */
  34792. { { 0x1d8e061a,0x4013a779,0xacc84a30,0x62707e70,0xeb2f636a,0x6ac08266,
  34793. 0x77b25c9d,0xe917ea21,0x70ff35cf,0xddb78bbd,0x041898be,0x5008db2b,
  34794. 0xce0ae445,0x0f58a4fc,0x2257d0e7,0xed092397,0x00000043 },
  34795. { 0xe2e129e6,0x2cad77b3,0x0f1be4d7,0xfb8c4a87,0x20056333,0xaee50dff,
  34796. 0x2a691543,0xbc2658c1,0xb8fe2640,0x95dc0cca,0x1965a0af,0x694eb584,
  34797. 0xedd1d99e,0x7d3baa53,0x8a1edc87,0x2df13b20,0x00000083 } },
  34798. /* 80 */
  34799. { { 0xd181c3f2,0xfead2247,0xf337b23f,0x915d35be,0x74890672,0xdb4cfcba,
  34800. 0xfda7a3a1,0xe4f70d8f,0x79275686,0x226b6419,0x6ff1f79e,0xe8040863,
  34801. 0xcf5fa4e8,0x98e84b39,0xd8a09f60,0x57aa0be9,0x000000da },
  34802. { 0x4efcea66,0xd40cecf5,0xafc76fae,0x98df2aec,0xc91585a8,0x63f19a48,
  34803. 0x13f00aa5,0xb111bda7,0x44b5cb9f,0x6687afab,0x652620d1,0xc6d5fb12,
  34804. 0xbacb35ab,0xaf953f1b,0xff94c4d2,0x99709370,0x000000ed } },
  34805. /* 81 */
  34806. { { 0x68b54c89,0xac9f56e0,0xce737c22,0x08ecc17d,0xab089b53,0x208ee83f,
  34807. 0x543fbd1b,0xb0f3a129,0x844dd706,0x1b204cf8,0xdec2e40d,0x80975c89,
  34808. 0x9399914a,0x08b011ae,0x74674df7,0x6b4ba170,0x00000017 },
  34809. { 0x8fdfc175,0x71216ea9,0x7e0f5b0c,0x77b7fc63,0xceb33a34,0x88d0285f,
  34810. 0x0223eab7,0xb679814f,0x51c6d922,0x9078720b,0x9c13f51d,0x5859d5a4,
  34811. 0xfaed60b5,0xe69f850b,0x6d0ccab2,0x2499a844,0x0000005c } },
  34812. /* 82 */
  34813. { { 0x73e7bcf1,0x41d581fb,0xdd3c17be,0x16dde61c,0xfa199fd9,0xc62997ec,
  34814. 0xc159db97,0x1a758873,0x64132830,0x4ed77896,0x2942a918,0x9672ce89,
  34815. 0x816ba4bb,0xf3ee4587,0xce54dd7f,0x4fb7a148,0x00000123 },
  34816. { 0xf009be8c,0xf05d80af,0x78df1ba1,0x62e938d7,0x312de620,0xa7e22e84,
  34817. 0x6070c4b9,0x48d29e7f,0xa1b5da37,0x5cd9c3eb,0xa4717453,0x1e51bd2f,
  34818. 0x56ab9e67,0x94098ab0,0x49f7c6a1,0xbb584abc,0x00000049 } },
  34819. /* 83 */
  34820. { { 0x1ea470f7,0xa9f25530,0xe9254e30,0xa01bf808,0x71a0038d,0x098569ea,
  34821. 0x5913ca87,0x0d2b2ee1,0xb8281fdb,0xae17004b,0x118e5c2a,0xdb5c6eb0,
  34822. 0x1fa943ab,0xa56ac64c,0x1a92d501,0x1aaf6477,0x00000053 },
  34823. { 0x06345730,0x9679ef49,0x846f37c2,0x946aaa4e,0x1a7c3aab,0xf81726b0,
  34824. 0x8166df4e,0xcb808da2,0x4e04dc3e,0xe9fb3fc2,0x76ec19b4,0x9e0b61db,
  34825. 0xeed6d13e,0x6e7f665e,0x86a75384,0x70ed8c07,0x000000e5 } },
  34826. /* 84 */
  34827. { { 0x108ce13f,0x66456e58,0x0e397813,0xb5bfc58d,0xea3949e9,0x04b6a84b,
  34828. 0x75af667d,0xea9b66bc,0xa891566b,0x7cb4d6dc,0xbf61595a,0x1b3cecf0,
  34829. 0x002e2520,0x4312c73d,0x6135a5fa,0x81d76898,0x0000014b },
  34830. { 0x841078ec,0x4047bc25,0x179c454d,0x75aa9c96,0x4851f8fc,0x6a160609,
  34831. 0xce34091f,0x998d4e3e,0x88e54102,0x9a9f6704,0x5da8ac5e,0xbf280f88,
  34832. 0x8fec230c,0xc64caca0,0x5094b775,0x0ac864b0,0x0000002b } },
  34833. /* 85 */
  34834. { { 0x8f5daf7f,0x6b606e39,0x10927506,0x48385489,0x08c58a72,0xa2255c5c,
  34835. 0xc90f3ee3,0x2f362fd0,0x08795f02,0xc9633af4,0x0425f5aa,0x71710bd1,
  34836. 0xec06dbfb,0xc2017e05,0xc1b8bbcd,0xd9c7dc82,0x000001c8 },
  34837. { 0x18b8bed9,0x7db41fdf,0xe3a23125,0xe9483308,0x7291c4bb,0xbcf91de7,
  34838. 0x41448aaf,0x9b0b972b,0xc44da462,0x95dfc633,0x01bf50a2,0x90b9c463,
  34839. 0x869e3131,0x18b66f77,0x121baad9,0xa8a4e2fa,0x000000f5 } },
  34840. /* 86 */
  34841. { { 0xca0251ea,0x8ca55109,0x27a6c9b0,0xf2aeed8b,0x5620f528,0x901a8beb,
  34842. 0xae13fc56,0x9a8421e8,0x85993c07,0x1349f1c4,0x0d1ab0d7,0x29e08359,
  34843. 0xaeb5d909,0x96e2929b,0xf599a66f,0x96c2f1f8,0x000000ce },
  34844. { 0x12be8bd7,0xe4bc4b51,0x3c67e99b,0xf4846a0f,0x4d3a3864,0xd89cc7d3,
  34845. 0x73f43981,0x1f647112,0x26dce567,0xc32bc324,0xf02b096b,0xf7134ebf,
  34846. 0x0d0682b7,0x5604f00b,0xe3ce8b59,0xfd23d7ea,0x0000011c } },
  34847. /* 87 */
  34848. { { 0xa27689a6,0xf89646cc,0x5564172b,0xd6a7dc43,0xb57cbfcc,0x30bda48e,
  34849. 0x5b1adfe5,0x9b11fffb,0x711d8bf4,0x9f2d80db,0xb70e5a5b,0xe879fdf0,
  34850. 0x6bd18a1d,0x97534183,0x8cbfd504,0xc8c526bd,0x00000114 },
  34851. { 0xef7388bd,0xd5fe725b,0xe7ffaea7,0xf1c3dbdf,0x7e6de2ac,0x78395b89,
  34852. 0x9ebf1bfb,0x81a72c9a,0x69785146,0x65265707,0xf52670af,0x3925ecd9,
  34853. 0x83d57d48,0x437bcdd2,0xc80ecb02,0xb5d732a7,0x000001ce } },
  34854. /* 88 */
  34855. { { 0xcfd376d7,0xa7f9fcce,0xa66b084d,0x6b4eab3e,0xd5b91bd8,0x6ac90d08,
  34856. 0x8aa304d8,0xaa3d5b7e,0x7f866a4f,0x27f3d42b,0xbb813ae1,0x95d19fa8,
  34857. 0xe34a9206,0xd38798d7,0xa32c1cdd,0xdf7c0a69,0x00000073 },
  34858. { 0x38315b16,0xbe2c01bb,0x9e18c8f9,0x1daa7c89,0x08b6b853,0xa3d43fb4,
  34859. 0x68092a81,0xb159e48c,0x836faad4,0x77e93d9e,0xa4699730,0xd4ed6361,
  34860. 0x6297e476,0x569cb3f6,0xe7811fa6,0xb69d8183,0x00000185 } },
  34861. /* 89 */
  34862. { { 0xab9cb764,0x18f27eb3,0x8ebc1d6d,0xbbbefc21,0x0479aa79,0x47760ddb,
  34863. 0x09e542f5,0xb4d16d24,0xbc699b96,0xe35c38d1,0x8c8d8c8a,0x13b2ae25,
  34864. 0x67a3a45d,0x8579c152,0x6c554c04,0x773b7357,0x000000d9 },
  34865. { 0x0218c299,0x9620a473,0x99f78a33,0x69be29b3,0x484f414f,0x4684a009,
  34866. 0x9a2ca4d4,0xb2c74937,0x68db7ab3,0x09c0773e,0x935c357f,0x6181f059,
  34867. 0x8b7de3f2,0x0931303d,0xe0fb6e08,0xf3effcd0,0x00000060 } },
  34868. /* 90 */
  34869. { { 0xb25d6530,0x723c14be,0x9a97d40f,0x5e015b39,0xfbf7f622,0x209c3c4b,
  34870. 0x14b4f0f1,0x83d8c59c,0x3f7e8ecf,0xcf002fde,0x1eb1ef0f,0x35d353c9,
  34871. 0x201f0c60,0x394c42a5,0x7be8ee34,0x787128ab,0x000001b5 },
  34872. { 0xb70110cd,0xa0937d3a,0x477911b5,0xe0fa4efc,0xc53a4c19,0xc6acaf5b,
  34873. 0x38d509f2,0xbd3010f3,0xe54ac1c6,0x3ee2a82b,0xe4f2a3bf,0x31ea67c3,
  34874. 0xf089c7b9,0x7a4ca66e,0x34a2362f,0x5bda2c4f,0x000000b0 } },
  34875. /* 91 */
  34876. { { 0xd1f575cd,0xb424a071,0xa5237182,0x15693b01,0x9a2c9d40,0x14133602,
  34877. 0x9c914a60,0x50c4348b,0x095b31c1,0x9024573d,0x22fd4962,0x6f975fd2,
  34878. 0xe210b277,0xa1704886,0x6dba937b,0xac29b813,0x000001f6 },
  34879. { 0x775da491,0x09edef55,0x2b6aad82,0x25953f9e,0x1bb40d5b,0x6696a106,
  34880. 0x4d5127d8,0xcfc45311,0x81ead062,0x2f21dca9,0xaf3b7123,0x3f3e4f07,
  34881. 0x9646f20d,0x12cd06b8,0x6910f5bb,0x24136369,0x0000015e } },
  34882. /* 92 */
  34883. { { 0x3ecfc44e,0x0c844fd0,0x5043b3d5,0x4095f2c8,0xc9bd059a,0x9a5fe7db,
  34884. 0xf65becdf,0x239328fa,0xa67961cd,0xe3102471,0xbbb5dfdd,0xea9e39bf,
  34885. 0x133dc5ba,0x8022b6d0,0x5f12c379,0xbed7aa9b,0x00000141 },
  34886. { 0xfd94d941,0x096f0059,0x7d4ff018,0xfc6e9f00,0x779f05e3,0xe63af598,
  34887. 0x00483c99,0x4c40f0b3,0x72a19870,0x04d2feef,0x464a4a71,0xdb773b5b,
  34888. 0x49367f1e,0x00b6770f,0x2a9fbd2a,0x4f7e0301,0x00000169 } },
  34889. /* 93 */
  34890. { { 0x8a9095fd,0x0df5dd73,0xd3ce857a,0xc4b7a021,0xe5edc767,0x90aa796b,
  34891. 0x180a0808,0x56497eff,0x66f10aab,0xb9856e1f,0x39879766,0x31298824,
  34892. 0x3ba80601,0x61748cf7,0x555da929,0x07d9076c,0x00000012 },
  34893. { 0x1c44394d,0x0b049a01,0x0ce49e45,0xf5f25ef7,0xb1694265,0x1e3a09f0,
  34894. 0x109b33f8,0x2c5bd9fe,0xa30932e4,0x07f2a43f,0xc6cf8af2,0x736abfca,
  34895. 0xf3366722,0xadf7fa04,0xfa9d26b0,0x2f1e92fb,0x000000e0 } },
  34896. /* 94 */
  34897. { { 0x63be4d4a,0x9524e4a6,0x66f3cc91,0x1fa57bed,0x7e7a7ccd,0xdd7c93fa,
  34898. 0x88c5d1d3,0x70e8cf6a,0x3f251f1e,0xb257997a,0xe3554cf5,0x0a5ec58e,
  34899. 0x065a7109,0x68d268d7,0x085089ea,0x7c23d4d2,0x0000004c },
  34900. { 0xbd52d132,0x63ae575b,0x38c81cc5,0x0fb8daa7,0xe4e63b99,0x096a6e51,
  34901. 0xb239d387,0x51d6b366,0xa5d49fed,0xed5f8874,0x43a8c07a,0x025091d9,
  34902. 0xe4686ae2,0x100f845a,0x7eb4ef5a,0x1af59d74,0x000001c2 } },
  34903. /* 95 */
  34904. { { 0xdd441308,0x5f7bc01e,0x86308890,0x0dc34944,0x759611cd,0x2af38a74,
  34905. 0x4c23ce66,0x11a71261,0xf8bafed2,0x37f317b5,0x4c93e079,0x4efbb9ff,
  34906. 0x8ecc52cf,0x880f0edd,0xddc9d82a,0x480cdd2c,0x00000028 },
  34907. { 0xc3f807ac,0xe8f1ca0d,0xbd070549,0x6a3e4fc2,0x91f8bb6c,0xad3d0a14,
  34908. 0x3d6dfacd,0xe3ee1cfd,0x5fb46ffb,0xee46b1b9,0x7dd5cfbc,0x5207b3ac,
  34909. 0xb1b8e8b7,0xd580c0d9,0xc7bdd11a,0x52c669f4,0x00000084 } },
  34910. /* 96 */
  34911. { { 0xc0ace6d5,0xa42b4747,0xbe7287ad,0xd5acb64b,0x89bc2614,0xf3304899,
  34912. 0xff05c71e,0x817fe836,0xd35ac450,0x772eb246,0x375a9c3c,0x7f5fc216,
  34913. 0xcbc0d6fd,0xfb6f9e1a,0x720e9733,0x7643c315,0x0000009a },
  34914. { 0xf3845ccf,0x4b2216b4,0x90bc05bd,0x9c174e80,0xd6049037,0x7a550c74,
  34915. 0x6358c806,0xbd7220a1,0xaa677b6d,0x838f9c41,0x66e2e08e,0x37332c19,
  34916. 0x496f6da5,0xb032875e,0x9c30630d,0x52b274cf,0x0000000c } },
  34917. /* 97 */
  34918. { { 0x8ea58beb,0x6ec2e782,0x3665fa48,0x2b404c1d,0x20b40ff0,0x546d5fad,
  34919. 0x29d3e6a5,0xfb5df7b6,0x66c81991,0xf186846d,0x6e2cfe3e,0xbe690bde,
  34920. 0x1410d16b,0x97aeb9a0,0xbacc8e92,0x59d81548,0x000000cb },
  34921. { 0xbaf66a23,0xd905d3ad,0x40dfb081,0xc3337387,0x4b00f432,0x6d5535de,
  34922. 0x07d3a03e,0xe17fe8e8,0x066bca80,0x29544ff7,0xbadffa55,0x60c2b96c,
  34923. 0x45a26ea4,0x9f018d94,0x24a34ffc,0xd5438167,0x0000011e } },
  34924. /* 98 */
  34925. { { 0xbd7f8a61,0x62a873fb,0xbbe580bb,0x5e18cd71,0x667f6980,0xfd5c9eb3,
  34926. 0x571d3dc0,0xab8d4f61,0x783f9bc8,0xe2e45215,0x24398b14,0x36c3774b,
  34927. 0x74d811b5,0x2db4a363,0x2debe3c3,0x9f7f1297,0x00000138 },
  34928. { 0x798fefb2,0xbb97f21c,0x107baa72,0x9c76fcb5,0xfadbb568,0x12fbf760,
  34929. 0xd33ea6c5,0x1a648be7,0x236134a5,0x412a2993,0x8985893b,0x4a3d8169,
  34930. 0x3e66ada4,0x6144958f,0x7687b457,0xb4dfc79b,0x00000140 } },
  34931. /* 99 */
  34932. { { 0x7abe5bb9,0x83b14570,0xe51d81be,0xae0cbfd8,0xc9827aff,0x20dadf49,
  34933. 0xa687b554,0xc3a72548,0xeeb41733,0x080263fb,0xd3827c63,0x7014fdc3,
  34934. 0xb5e3b70e,0x7d018f84,0xfbcf7168,0x1d483e00,0x00000015 },
  34935. { 0x6b578aa3,0x154e3c7c,0xd3043dae,0x511ce9b5,0xb6008101,0x55f89e9b,
  34936. 0xf405ac6f,0x4ec31112,0x2008ac7b,0x7e66a4d8,0x25c52fa6,0x73c00d39,
  34937. 0x8acac2eb,0xee1b9998,0x60b57453,0xdfa31d95,0x0000008f } },
  34938. /* 100 */
  34939. { { 0x251cf8d8,0xcc74a0e0,0x041f2bd2,0xd4d8949d,0x33ebce52,0x0b734a49,
  34940. 0x5c5bcdae,0xe1ac5f51,0x16200b93,0xd3ecdfcc,0xa793736e,0x2506a266,
  34941. 0xea6e6940,0x585a1c8b,0x9190f935,0x081cdd53,0x0000000e },
  34942. { 0x53e28412,0x055f9956,0xdb27164b,0x0d1526f2,0x1df3adc7,0xcd5625eb,
  34943. 0xdd35dedd,0xd2c453ca,0xa838ffe2,0xed442849,0x5c0ce589,0xad20c137,
  34944. 0xbd99b609,0x2d5fba81,0x622efb07,0x5be41dcc,0x000001ad } },
  34945. /* 101 */
  34946. { { 0x8f850756,0x563af667,0x52f3b597,0x86d37aae,0x796842f5,0x10d38a53,
  34947. 0xf743f997,0xcdaaf99f,0x93f1a8ba,0x2fa755e5,0x409f7cd9,0x1af04e15,
  34948. 0xd6d0650b,0x63bf9a0a,0x55abfd9a,0x67b1cead,0x0000000e },
  34949. { 0xb5f43178,0x3660a8e0,0x9cc35b33,0x56bd412d,0x880f6808,0x3d7bfa63,
  34950. 0x2e622c71,0x7f372d66,0x6ff82445,0xad7b7be7,0x8db04e51,0x0f2bde80,
  34951. 0x4bd15c8d,0xe1e781fe,0xb8e502f2,0x1f475bfb,0x00000194 } },
  34952. /* 102 */
  34953. { { 0xd63543ec,0x79482bf9,0xa117ef3e,0x985cb67c,0x160ccc63,0x8ac50638,
  34954. 0x729bdc1e,0x556cbed5,0xa22686df,0xd62ed97d,0xc81eb77c,0xb124cb5f,
  34955. 0x72fa2ed9,0x4d7b4f66,0x78335b96,0x60b29aa7,0x00000172 },
  34956. { 0xa43df7c6,0x21bfc7b6,0xbc20706c,0x85acac23,0x345d9580,0xeb6f37bc,
  34957. 0xa32a08bc,0x9d8f20d2,0xd1953c5e,0xf08924f6,0xc4f680d0,0x7d25d7c6,
  34958. 0x2de9912c,0x64e6a237,0x52ce644c,0xda1c06c4,0x000000eb } },
  34959. /* 103 */
  34960. { { 0x411dd110,0x26677c5c,0x2c991c4a,0x0d6787aa,0xa45666d6,0x53be6a41,
  34961. 0xc15f9f15,0x73e716aa,0x0e0cc7b2,0xa93b863f,0x2a624ab0,0xa4057117,
  34962. 0x1a39c260,0xe5e7656e,0x2ef6f130,0xaf8d78b5,0x00000046 },
  34963. { 0x70f38dff,0x796214b1,0x123a1105,0x3e35d828,0x957ed812,0x046a44d4,
  34964. 0x0da60161,0x618fa9ba,0x54f84413,0xe7cdd2a5,0x19ea95ab,0xf1c2563e,
  34965. 0xcb2a30b4,0xc4459e14,0x61ff9aa9,0xc748add6,0x00000183 } },
  34966. /* 104 */
  34967. { { 0x9de58caf,0x32981f39,0x8753ea64,0x05bb80fd,0x2d119486,0xc83f9f24,
  34968. 0x03eeb00a,0xf490cf06,0x7c73d79c,0x4037f251,0x724d461b,0x844209fd,
  34969. 0x272420cf,0x6b03f6d2,0xb3438fa2,0x6f4bd29e,0x00000152 },
  34970. { 0xc389e51c,0x964d034a,0x6db7d98e,0xacda55e9,0xe913c583,0xb2ae97de,
  34971. 0xfeb03440,0x0793077b,0x9d461e29,0xaa16e378,0x043bf8be,0xb0a67533,
  34972. 0xba7d8c3f,0x9d749a42,0x6bb925dc,0x7c41e6d6,0x000000ec } },
  34973. /* 105 */
  34974. { { 0xc5da8398,0x2e9b345d,0xbb38c430,0xbc66841f,0x7c3bb47a,0xce3ac562,
  34975. 0x738d2cdd,0x8fbeb12b,0x68731185,0xd4bc2ad7,0xbbd4f4f4,0x9521db1c,
  34976. 0xfe4e1b0e,0x2a690cae,0x7bfebe3e,0x375215eb,0x00000194 },
  34977. { 0x2edfd661,0x4cb234f1,0xed52c1f4,0x0149984e,0xd8f8f98c,0x32d27260,
  34978. 0x7be38590,0xfe76e4e4,0x95e8b672,0x5435873d,0xf2b00e82,0x916c397f,
  34979. 0xbad61eb8,0x3b9bf705,0xae131bbe,0x7ee90182,0x00000000 } },
  34980. /* 106 */
  34981. { { 0x93fbcb5c,0xd36fea9e,0x9fa8529b,0x382be583,0xfd611ba0,0x0b243125,
  34982. 0xcd8a2637,0xa59ae37f,0x3d8d4704,0xab78c60e,0x44c41b79,0x1bac243d,
  34983. 0xeda49cc5,0xc4001fea,0x83dc7e9f,0x988ea44a,0x000000f6 },
  34984. { 0xf077f79e,0x4d90caa4,0xd9e2590d,0xf4d17601,0xd21b4b77,0x11debbb3,
  34985. 0x9037e1b6,0x031b3f60,0x135becf0,0xf113ed82,0xf2903dda,0xf6c01379,
  34986. 0xa6f19296,0x36bde7ca,0x9dbbad85,0x57d3b684,0x0000006c } },
  34987. /* 107 */
  34988. { { 0x9abfccb0,0x963fee38,0xb9676e63,0x6c6e2a24,0x84ba6d27,0xf8768f02,
  34989. 0x465853d1,0xc38ba3ba,0x1b8ab9b6,0x6e3ab36d,0x47a07331,0x01fc9742,
  34990. 0x25233f32,0xfdd41718,0xac61de7a,0x4dacfa81,0x00000021 },
  34991. { 0xeaa3198c,0x365a9f37,0xfc8b99d5,0xcbe8a345,0xd4f5ecbc,0xa427f12a,
  34992. 0x0c237514,0xe841ff60,0x28a27b05,0x5d9e8c5a,0x62859ff3,0x2d377444,
  34993. 0xea8bde37,0x1c0460ff,0x29cf5bf8,0x0a0e49a1,0x00000181 } },
  34994. /* 108 */
  34995. { { 0x45843c3e,0x688203af,0xaabebae7,0x4601e303,0x624df62b,0x397b08f3,
  34996. 0xd21e5aa8,0x5687348a,0x9a242b0e,0x2cf12c73,0x32a76c6d,0xc848ed01,
  34997. 0xf52751a2,0xb72aa1c2,0x92c02d05,0xb63296c3,0x000000f3 },
  34998. { 0xc6f3d1f0,0xce4b42ad,0x2f532b94,0x2f0dcc53,0x83443d9c,0x57813335,
  34999. 0xdc8dd9cb,0xb50118ee,0xee87192f,0x3039e1a5,0x557419c2,0x9977267d,
  35000. 0x30f96b0c,0x462efa4c,0x3cd3c35a,0x454fb796,0x000001f7 } },
  35001. /* 109 */
  35002. { { 0x9d153926,0x10f28194,0x82b57548,0x42e28c91,0x509e94c9,0x4b423b30,
  35003. 0xde9d6b57,0xc5acc52a,0x8b3ca314,0xaa746c39,0xc63d5bc5,0x0f4ea307,
  35004. 0xe1ccc989,0x425553a2,0xf76d9194,0x271198bf,0x0000008e },
  35005. { 0x3c8e672b,0xc7900e46,0x3f2dfc27,0x703675cd,0xaf2163c9,0x704951f7,
  35006. 0x7aceaab0,0x74d69908,0x7e8d2369,0x482f21a9,0x813dc115,0xdcfbc1dc,
  35007. 0x04f6cd13,0x0ce2bc80,0x82bfaff2,0x2a54662c,0x0000003f } },
  35008. /* 110 */
  35009. { { 0x1588a8bc,0x0dcf41e6,0x210c52cb,0x6f48cd0e,0x758e7a45,0x338562bd,
  35010. 0x48b9b957,0x1600d54b,0xa6b89b9e,0x461df80b,0x098cc82f,0xf7fd4f17,
  35011. 0x14977147,0x167f01cd,0x6116c5f9,0xb1338511,0x00000048 },
  35012. { 0x5d2617f0,0xdeb76333,0x6ecb8606,0x3f9a5772,0x1b91fce9,0xa93c032d,
  35013. 0x6c84b997,0xf7a4388b,0x823ca5be,0xbfe80225,0x35a32f6b,0x6f19c028,
  35014. 0xe3cb5c58,0xf26cd5ad,0x6d0c1dd9,0x7f5ddc77,0x000001e7 } },
  35015. /* 111 */
  35016. { { 0x6ee764c9,0x3c9feec8,0xb07c82cc,0xd1bec836,0xa005b142,0x6bf1b2e6,
  35017. 0x29e8a5ea,0x70ef51a3,0x3ffe241c,0x517d298e,0x72966c28,0xbb389e28,
  35018. 0x2c7acc76,0x3a2da8a9,0x732a21b5,0x902c9126,0x0000004a },
  35019. { 0x8f7ce110,0x96c51b9c,0xaeb036f1,0xdcc33a87,0x0a6a59e2,0x82695098,
  35020. 0xe78db500,0xceaf26a7,0xc95bb030,0x82f3c384,0x24c42f42,0x6dd6e9f7,
  35021. 0x70ac4a0a,0x768dde29,0x03d22efc,0x4aedce4b,0x0000016f } },
  35022. /* 112 */
  35023. { { 0xeded03c0,0x077f032a,0x588ddd4d,0x2684a052,0x9a85be0f,0x6d09bc4f,
  35024. 0xe0b9b6bb,0xbdda0c7f,0xf2fb5887,0x19689c7e,0xec3cce7e,0xf8a96960,
  35025. 0x768d2ae5,0xb043d9d5,0xdb21219a,0x29c8081b,0x00000068 },
  35026. { 0xde59f006,0x6bf872fa,0xcb97ef5a,0xc2b9ffc6,0x58ae7ef8,0x371915db,
  35027. 0xf4ccaa1f,0xc2e23ca1,0x89c27cc4,0x1af8c60e,0xc86bdcc6,0xeee5d7e7,
  35028. 0x9bd8de43,0x9225b47f,0x4b24f08b,0x53e7f463,0x000000b4 } },
  35029. /* 113 */
  35030. { { 0xe3048bda,0x54c496d0,0x43c3de4e,0xe2b67499,0x4c2d509e,0xac2049f7,
  35031. 0x543c5089,0xb01f691e,0x105a365b,0xcd9960a3,0x78b17049,0x34d93ffe,
  35032. 0xf82c9467,0x029f99b3,0x0161a755,0x785c5ea2,0x00000091 },
  35033. { 0x953dbdb6,0xb455f978,0x97eca19f,0xea9e84d9,0x36d4d75a,0x473bd029,
  35034. 0xc15276fa,0xa9c17ca8,0x47c76356,0x9cf66133,0x039738d2,0x4a68360b,
  35035. 0x69733609,0xd3e430a8,0xe2b27f21,0x0ae532de,0x000001b4 } },
  35036. /* 114 */
  35037. { { 0x5164cb8b,0x68110e82,0x2552a67d,0x6979af4f,0x8d185527,0xe10d6d0e,
  35038. 0xfb64eac4,0xcf6c5787,0xac424592,0x8408163b,0xfce0d810,0x5d8fff37,
  35039. 0xda84c15c,0x8b284e49,0x32663ec9,0xed805567,0x00000010 },
  35040. { 0x51f3ee9e,0x106f4030,0xb38adf1e,0x2e8e3ee9,0xa13d6449,0xd3c87a6e,
  35041. 0x80e1abb1,0x27b49f45,0x0bfd7298,0xc283d179,0xafc7a35f,0x8fe50fa5,
  35042. 0xade3ad4f,0x773da545,0xd9a21df2,0x78bfaae4,0x000001f8 } },
  35043. /* 115 */
  35044. { { 0xabad5678,0xae60d8e8,0xe600c25b,0x0afa72ce,0x4c288e21,0xb9d4e0b4,
  35045. 0xd254cf9f,0x64447f76,0x959e2ba5,0x1fb36bc4,0x2961132c,0x393c44d7,
  35046. 0xfc140f19,0xd7a8881f,0x8d096648,0x27a86128,0x00000091 },
  35047. { 0x8a9e690c,0xb536c021,0xeab4fa15,0x85dcc521,0xb00ee54c,0x09af4423,
  35048. 0xaf3a8e48,0xb3793525,0xb7731d85,0xe1f36308,0x141cfb55,0xb5361d78,
  35049. 0xeffc4529,0xea41f29e,0x9f7d2634,0xcf5755b1,0x000000e8 } },
  35050. /* 116 */
  35051. { { 0xd212b398,0x01edb80d,0xd53dd373,0xd0396181,0x8a52fa95,0x0e086047,
  35052. 0xa7825e6d,0xad1e6432,0x330ece4f,0xe0185bc5,0xb078936f,0x508f7313,
  35053. 0x9e7f6ea3,0x1dc982fd,0xd5556b60,0xdbf3a602,0x000000e8 },
  35054. { 0x279e05bc,0xc3763234,0xf44453d3,0x7f5f40ec,0x7fa30793,0x310c5f4d,
  35055. 0x108d7e22,0x5cffad36,0xc2a98bbc,0xf2f01ef3,0xd7d47f80,0x30ab1719,
  35056. 0xa9b22e1c,0x7bc9f918,0xe834df94,0xf53dc52a,0x000001f9 } },
  35057. /* 117 */
  35058. { { 0xc183f89b,0xf266b49e,0x5f5806d4,0xd3fb5f02,0x94ec3080,0xd30a42b5,
  35059. 0x371cd917,0x4b6b1940,0xb7f7e26d,0xf7541aab,0x2d5b7b64,0xe55269eb,
  35060. 0x7f8036c5,0x0e1a85c1,0xda5f2675,0xa0ff0f22,0x000001ce },
  35061. { 0x3a8e11f8,0x602bd56a,0xf5f9ab54,0x29864021,0x0ccc92d7,0xc6742c5a,
  35062. 0x523f650b,0xd64569e6,0xf7fabfb4,0xc8e4681b,0xc3c9e6cb,0xb4275947,
  35063. 0x38f5ff20,0x2b3952d5,0x1f04aea2,0x818f8e38,0x000001b0 } },
  35064. /* 118 */
  35065. { { 0xe50d90f0,0x3be5bffa,0xf5011cdc,0x4cb3b11b,0xa691dfac,0xe10ca711,
  35066. 0x4ea1a773,0x62ec211d,0xe586eeb6,0x5a979ebb,0xa0c2f1fd,0x4df16ab1,
  35067. 0xc57bbfea,0xfe9e3f7e,0x5ae526f6,0x1b05960e,0x0000015e },
  35068. { 0x8630e62e,0x1c8e04a5,0x6447e1b7,0x3d00310e,0x43b4447a,0xcf1e6b61,
  35069. 0x7462e7a3,0x92abb851,0x0002724d,0x8309ea08,0xe45296df,0x1d805d70,
  35070. 0x3d4ed812,0x0f3849b3,0x6834d44e,0x2d6bffbc,0x00000096 } },
  35071. /* 119 */
  35072. { { 0x48e07711,0xd13fe58d,0xd270a3b2,0x70f83648,0x8cdff04c,0x1517892d,
  35073. 0x51411f14,0x15bb6578,0x3e4f8a55,0x6c31cd90,0x0413362f,0x73f87152,
  35074. 0xeca06d4d,0x2fe025ee,0x954e317f,0x32a6e417,0x000000ad },
  35075. { 0x69d147df,0x7e38c63f,0x710bf37b,0xb69bb06e,0x28d514de,0xb94debef,
  35076. 0x8d11c3d9,0x4b2307fb,0x0385c604,0x3b369df9,0xe7800e83,0x68ea2f49,
  35077. 0x7d501c1c,0xf028b258,0x5cef7818,0x97078221,0x00000055 } },
  35078. /* 120 */
  35079. { { 0x54c1d751,0x10c351db,0xba0f9512,0x81445301,0xbfdc8bed,0xa77eb34f,
  35080. 0xcf23680a,0x498d8138,0xe04f2860,0x928c14a4,0x16a5b6da,0x96192dba,
  35081. 0x5f9a9103,0x49dea95b,0x01724102,0x80dd4578,0x00000085 },
  35082. { 0x0e09221c,0xe9072500,0xf21de056,0x62e05b21,0xe0e60950,0x448cafa1,
  35083. 0x6f775129,0x657fb97b,0xf1f34aca,0x5d2991bd,0x49ff15d6,0xa66cd5ac,
  35084. 0xd049ec79,0xdc1d6897,0xe72baea8,0x388fca84,0x00000067 } },
  35085. /* 121 */
  35086. { { 0xa6ef1dd3,0x6520b49d,0x3ba6cd76,0x391a045e,0xf33d5f48,0x9c84980a,
  35087. 0xef07474a,0xe53cf5b2,0x78bfb1ea,0xa35b2e9a,0xeda906fa,0xeca97fd6,
  35088. 0x1b9f2cf4,0xf1a93789,0x3ab28589,0x66753369,0x0000010d },
  35089. { 0x73691faf,0x5b510496,0xd57ec618,0xdc73d3a9,0x930a8525,0x7e2921bb,
  35090. 0x40b05b69,0x094f571e,0x413bedca,0x5e96a017,0x8d1a6b98,0x9e7d4f72,
  35091. 0x3eade8b7,0x55143fda,0xd16e454d,0x859b8444,0x000000fb } },
  35092. /* 122 */
  35093. { { 0x7c667aaf,0x7c22083e,0x4a91ccba,0x33545cb9,0x8ca0e94a,0xca1e9931,
  35094. 0xe4eaa0c7,0xc3afff23,0x42f56844,0xa21ac436,0x60d52d0b,0xfcc68a8b,
  35095. 0x6a9301d4,0x401a585b,0x907abce1,0x547f762c,0x000000a3 },
  35096. { 0xfbe260ce,0x63dd3ed3,0x80dc01fa,0x2717752d,0x6f1da3e4,0xd5fab75d,
  35097. 0x5261f10e,0x5f16864a,0xd20cd6bb,0xbe7b1f63,0x221ac656,0x9d638c10,
  35098. 0x673b918e,0x3137b8f6,0x4ada2fb8,0x23eb4438,0x00000174 } },
  35099. /* 123 */
  35100. { { 0x2a1fbcf4,0x194e27c4,0x5facd5ee,0x4c0d285b,0x915e6607,0x75c2ebdd,
  35101. 0xef0a6a9a,0x1e696510,0x067cf458,0x13c5afa1,0x7bee1fba,0x2be013c1,
  35102. 0xdad279e7,0x85a406d6,0x5142cf59,0x0042951d,0x00000031 },
  35103. { 0xa22bbc45,0x6a735ec1,0x7f56f4d8,0x4ee5391a,0x236001de,0x305af9d0,
  35104. 0xaa2f8d25,0xa8b21851,0x187db78a,0x0e2c36d8,0xa1a888c3,0xcfcc083f,
  35105. 0xbd3e7d5b,0xb91dab7f,0xf4fdd023,0x62d85460,0x000000f4 } },
  35106. /* 124 */
  35107. { { 0x4972d703,0xf568ba02,0x39098a03,0xfc44ca1d,0xae28c855,0xe9b8e542,
  35108. 0x5b1b4536,0x4fd4f360,0x4c7f7e48,0x2e08b07b,0x2230823d,0x042f3b98,
  35109. 0x1889fd13,0xc9ffd313,0xc6c68359,0x56af0652,0x000001bb },
  35110. { 0x06e0f16a,0xedbf05e2,0xd74644a5,0xfc1ac2fa,0x0f92c71a,0xe59a0a98,
  35111. 0x36c800a1,0x13ae37d7,0x236178dc,0x5f20efc6,0x2b46ef10,0x443a58b8,
  35112. 0x442509e4,0xc9517dcf,0x640ed9b0,0x7d0bb415,0x00000166 } },
  35113. /* 125 */
  35114. { { 0x3d22842d,0x3aa30a61,0xb3c4ece0,0x8c6e00f5,0x6df82b79,0x8764cf87,
  35115. 0x78d208c5,0xda92d86d,0xe788854a,0x0a52d391,0xa59b0994,0x499b26fb,
  35116. 0x04c5fc9a,0x5dc133ad,0x34e3f134,0xa5c09269,0x000001dd },
  35117. { 0xfad6d673,0x6f0dcac2,0x00f3b3fe,0x6d8fdf05,0x631756e9,0xece71941,
  35118. 0x0a4d80e3,0x3990f493,0x31d13001,0xf2aca936,0x75581638,0xee91966c,
  35119. 0xe6dd5679,0x6df0f574,0xccd71cda,0xbe124868,0x00000111 } },
  35120. /* 126 */
  35121. { { 0x475cc1b4,0xf644c726,0x2b73978c,0x915fc2f9,0x0e3d7eb7,0x65a7e6d1,
  35122. 0xf40c38e0,0xbb44e21a,0xe1ad24fc,0x988662b9,0xc35606e5,0x270ba4dd,
  35123. 0x1a4f93f7,0xc3834a2c,0x3362a4d7,0x93d0c9a2,0x00000021 },
  35124. { 0xf769fd7f,0xe2cb7b8c,0x89a213b9,0x1815da97,0x6b910fef,0x7b4f8c56,
  35125. 0x26931438,0x2088b309,0x925b37c0,0x477b71bd,0x26a640e5,0xa049a921,
  35126. 0xfd21c6ef,0xd3ddf1bd,0x232a56b2,0x9b5f9d7d,0x00000064 } },
  35127. /* 127 */
  35128. { { 0x679a9c35,0xd640adf8,0xcb74d796,0xcdad98e3,0x5f8e9daf,0x464b8ebb,
  35129. 0xad4a073c,0x4738614e,0x2edde557,0xbd86c0ee,0x576ce0b9,0x77331738,
  35130. 0x4095fb96,0x9b5d3327,0xee09aead,0x72f0aeb3,0x00000136 },
  35131. { 0x64e54ba5,0xa388c76d,0xdc474d21,0x63fe7af1,0xb2a77081,0x7fa3e9d1,
  35132. 0xde1240ad,0x0447b49e,0xc720303a,0xd9f64b66,0xe6bd0213,0xb1c78029,
  35133. 0x0aa03ea5,0x1caf1c70,0x3bb85d2b,0x179180eb,0x00000103 } },
  35134. /* 128 */
  35135. { { 0xaf2ed12f,0xadbf4f9f,0xf380fd8a,0xce1d19e4,0xa39e81ae,0x0957bdb5,
  35136. 0x626ef6bc,0xf9833321,0x0cf5b28d,0x110ae5ea,0x20392cd4,0xab159450,
  35137. 0x6bc67855,0x67c49887,0xa3fd61c6,0xce7e5938,0x0000004a },
  35138. { 0x28c7dea9,0x59c5b9ef,0x0a6a7184,0xd02f95ba,0x8202769c,0x034dc257,
  35139. 0x94dd6896,0x213b0b08,0xb5dea95a,0x03730b7f,0x617ca889,0xfe243ed0,
  35140. 0xfb1ba052,0x16cf4d17,0x226f96da,0xd8691d6b,0x000001c0 } },
  35141. /* 129 */
  35142. { { 0xbf8015c2,0xaa2edf3f,0xc49502d8,0xe7f8236d,0xa6a43157,0xe890f6e0,
  35143. 0xa2d04b0c,0x318ef325,0xa809dbab,0x9cc0668d,0xda67ca21,0xdd26937a,
  35144. 0x83febc49,0x8f27c12c,0x3c9b9844,0x87b3db2f,0x00000029 },
  35145. { 0xfd2e3dc7,0x37e7aed0,0x7415fd55,0x498e8bdb,0x58a45f25,0xfc0d6c9a,
  35146. 0x209c85d0,0x83d5baba,0xd579e1ee,0x31ec8dc6,0xa502bfed,0x1f4cad0b,
  35147. 0x1f41bef1,0xc432e6ce,0xbbffca65,0x3b10afaa,0x00000191 } },
  35148. /* 130 */
  35149. { { 0x53053af7,0xbd9f7df0,0xb28a1cf4,0x60304765,0x7ce90438,0x441778fc,
  35150. 0xac8c5ddd,0x8fbed36e,0xfb59ec61,0x27b1313b,0xa1b1becf,0x9d2656ff,
  35151. 0x945973a9,0x334e1345,0xc362b595,0x3261888c,0x0000018c },
  35152. { 0xaa7f6ff8,0xf413a414,0x3fab7c7a,0x092aeb88,0x7cc307ba,0xfa1d886b,
  35153. 0x2346100e,0xdc81c125,0x02140c93,0x93d4d273,0xe6104835,0xa1ed7e3c,
  35154. 0xdf1795f3,0xe2b91ecf,0x369ed416,0x160dc11a,0x00000191 } },
  35155. /* 131 */
  35156. { { 0x8b57d7cc,0x9a72f46e,0x4bf02386,0x3140b0e5,0x05b3a91d,0x886c396e,
  35157. 0xa4ec26e0,0x1b9ab3a9,0xc50f58e9,0x742feaeb,0x55e26af0,0x1592c608,
  35158. 0xbb1cd9f7,0x943cd476,0xc7f02c89,0x3ed97fd4,0x0000017c },
  35159. { 0xe6d54964,0x53b02503,0xc6a318c0,0xd9bd1162,0x9cc28c22,0x18ff6cf4,
  35160. 0x03534640,0xa45c7840,0xb4cc0668,0x8ea3335e,0xf42dbe03,0x7ad727f8,
  35161. 0xfdf6c3cd,0xb157e911,0xec992d76,0xa7f894c9,0x000001b3 } },
  35162. /* 132 */
  35163. { { 0xaf09ea77,0x91e6e397,0x75dc25c5,0x26a760b9,0xb94a197b,0x8c040c08,
  35164. 0xb68ce619,0x041baca8,0x5bd23564,0xa19a0d15,0xd977b33f,0x86ca5b94,
  35165. 0xe5fbd029,0xf31f87f8,0xb1901f99,0xf76c55a6,0x000000b8 },
  35166. { 0x3846ec9f,0x175bf8c3,0x9deaca46,0xf462205c,0xa3108df0,0x92cb5ec0,
  35167. 0xcfaed928,0x879db283,0x65049fb2,0x477dc004,0x96ee5031,0x48d24bac,
  35168. 0x56adce45,0xa7db6b16,0xab1c684f,0x0110cdab,0x000000fc } },
  35169. /* 133 */
  35170. { { 0x4d308bf2,0x151b66d8,0xd6638004,0x99013c9f,0xfd383bf9,0x6892df92,
  35171. 0x3ffc8efc,0xa10efd84,0x313ea287,0x527e316c,0x3a0df740,0x8ef6e3cd,
  35172. 0xf6ebd2a1,0xcb96e430,0xa70ee4ce,0xc1ebecf2,0x0000018c },
  35173. { 0x1a70404c,0x80d14ad7,0xf9ce2a30,0x6ad21dd0,0x3aa3e072,0xb94cbcde,
  35174. 0x6363a690,0x0ab59611,0xc6b1e2b4,0xe70bff45,0x66ceec5b,0x1296dd0b,
  35175. 0x747757c0,0xd4cb2a74,0x3d7d91e8,0x08988ca6,0x000000aa } },
  35176. /* 134 */
  35177. { { 0xf8db0396,0xaa2dcfca,0xb422da76,0xe8ae8f37,0x96485724,0x652f8349,
  35178. 0x7bf1493f,0xf647c3c4,0xb0247a4e,0x8b600b46,0x7aebda8e,0xabf3e439,
  35179. 0xa7958df0,0x2e1d231f,0xf881bab2,0x38e692b1,0x000000ef },
  35180. { 0x26cf3047,0x1f3c1689,0x59539858,0xdad14f94,0x293f20b6,0xfde85d1c,
  35181. 0xf57abb17,0x2ea5436e,0x1794de38,0x0d1a8ffc,0x2bfecd2f,0x9ba508e2,
  35182. 0xdb786042,0x110f0a7f,0x7cde31f8,0x2ade6f64,0x00000196 } },
  35183. /* 135 */
  35184. { { 0xfec78898,0xc996a537,0xde0fa77f,0x0b39de72,0xd34cb08f,0xf6d076ac,
  35185. 0xda78d353,0xacd8bb82,0xa0392cc1,0x5fe804d3,0xe581549d,0xab7adede,
  35186. 0xc067c6d9,0x883901a0,0x4ed93f37,0x5855ffa2,0x00000191 },
  35187. { 0xbf9ebef3,0x29570e36,0xdf4b3177,0xe21046a5,0xa6816b5c,0xf9b89a95,
  35188. 0x288d0e11,0xadf39281,0x3979159a,0xd6baabe5,0x5c8fabb2,0x411afee0,
  35189. 0xe5c7af10,0xf192c3af,0xd7dce37b,0xaa72e81c,0x000000f7 } },
  35190. /* 136 */
  35191. { { 0x16c386ee,0x20fa3c0f,0xd4c09839,0xb33b0469,0x876a3136,0x79e0d722,
  35192. 0x3c406c06,0x343c0a92,0x4debe27d,0xef220e3e,0x196f00ea,0x09d7b1e1,
  35193. 0x24a9dcff,0x4a0f5dd8,0x99c1d085,0x53582ec5,0x000001e2 },
  35194. { 0x5138c7ed,0xcc8ef262,0x6547f88d,0xdec43194,0xdd0a9488,0x2b6e53ad,
  35195. 0x8257ebdc,0xeb9f1efa,0x1f08c989,0xc583c6eb,0x40163768,0xf1736911,
  35196. 0xdbc20e3d,0x6282ff8b,0x9cbd514e,0x26b81005,0x000000d5 } },
  35197. /* 137 */
  35198. { { 0xa0025949,0x2449522f,0x0bbd8945,0xb26d888f,0xe637216f,0x33442f5f,
  35199. 0x472827f6,0xd8ec3b64,0x99fc2681,0x91d8a1a3,0x68c7710d,0x6d232ead,
  35200. 0xe51b2762,0x8e5bfe2f,0xfd109fa7,0x0f9f4fed,0x00000004 },
  35201. { 0x6b4a05e0,0x1952ea51,0xf21c78eb,0xcb0d48ee,0x1997dfdb,0x64d36619,
  35202. 0x8b4c21fd,0x0d11b204,0xbe92303a,0xa6f569b6,0x78c5e809,0x2b8f6096,
  35203. 0x36805d8e,0x7226b5ab,0xdb349ca2,0xd6cff180,0x000001bd } },
  35204. /* 138 */
  35205. { { 0x943cc612,0xa49f8576,0x832b31c7,0xc914319e,0xcccadebd,0x9225e297,
  35206. 0xb0619821,0x4918fb42,0x25b1cc7c,0xaccb3084,0xa646e5f0,0x751d3347,
  35207. 0x590e3e22,0xeafb4aae,0x2c4a0008,0x82146038,0x00000151 },
  35208. { 0xbf96a461,0x3c2481db,0xb52a3ba4,0x51c122e9,0x464db08b,0x21c2858e,
  35209. 0x6d6a081d,0xb1014b78,0xf533cef7,0x167d3ed4,0x81545f7c,0x6cfb3294,
  35210. 0x449b7b9f,0xea46d31c,0x9621c299,0xcfad7613,0x00000081 } },
  35211. /* 139 */
  35212. { { 0x478a7f0e,0xef796327,0xde17705d,0x914183e2,0x572117e8,0xd24a26df,
  35213. 0xb7cd52cf,0x3cdb1b09,0xad83c160,0x9e42b9fb,0x709ef8c9,0x6971d2ea,
  35214. 0x8ee54ccd,0x1894fc5b,0x34a520fc,0xf757b4e5,0x000000fc },
  35215. { 0x86b62347,0x5a5518cc,0x7bc2a928,0xec51c9d2,0x2966727f,0x2eea2b05,
  35216. 0x0ae43e6f,0xbc8a8e3a,0x05ca066b,0x80535b5e,0x8833986d,0x91ffcdb1,
  35217. 0x32374cdd,0x2f4a5bba,0x0d202243,0x08763a49,0x00000124 } },
  35218. /* 140 */
  35219. { { 0x4efac14d,0xe498b972,0xa79a9d3c,0xb6f4bf8d,0xd6e07c29,0x0f1e8dbd,
  35220. 0x71771538,0xfac30cfd,0x71b03263,0x4c91ed22,0x19b455f5,0xbf938335,
  35221. 0x127092bf,0x76a5e789,0xb4813bd9,0xa97674e1,0x00000128 },
  35222. { 0x583e5924,0x29b63c41,0x8f171d06,0x61f9aff1,0xab227a28,0x2b45b3cd,
  35223. 0x8a11ab70,0x939d5dda,0xe8db6971,0x2bfb47b0,0x0ec10805,0x562379df,
  35224. 0x24ce1801,0xaf5a6481,0x34f94aba,0x8d98c434,0x00000150 } },
  35225. /* 141 */
  35226. { { 0xcfffc80f,0xdea9fe73,0xd43473f6,0xe23e2e9b,0xc9d37ba7,0x27fb3ed3,
  35227. 0x7a3fc357,0x733766d2,0x8e04a03d,0xd0db4cf3,0x2bbe0f43,0x8ce01752,
  35228. 0xda986f4f,0xd87eb719,0x2fe6b037,0x6d1b50ae,0x00000153 },
  35229. { 0xda40bab1,0x371f5def,0x9b2bda63,0x07d6a8af,0x0d4aca87,0x5e8a5c89,
  35230. 0x643ff8ab,0x4d72f0ff,0x4bf8ec2f,0x9c4c10d9,0x0eb93e22,0x36b0eaba,
  35231. 0x1d2dfd01,0xbc4b0e8f,0x9d34a082,0x9f252e5a,0x00000142 } },
  35232. /* 142 */
  35233. { { 0x7d0e7020,0x4affd4c1,0xb5482168,0x9b169aaa,0x588f348f,0xdbe01708,
  35234. 0x885986bb,0xdaebf6ff,0x15f9c381,0xb33987f5,0x04a94a7b,0x7e455f2c,
  35235. 0xa0ed6849,0x39a41442,0x1ef7798c,0x1c1ad4a6,0x00000154 },
  35236. { 0x072709c4,0x7647b628,0x8810e5fe,0xb330d68b,0xe92e0f63,0xd1bd8874,
  35237. 0xf8bea9ba,0x144e4fb9,0x8318981a,0xc15afc18,0xb68c6a07,0xe19c5c82,
  35238. 0x36e00b66,0x858c57a2,0x07cb7aec,0x9b255110,0x00000011 } },
  35239. /* 143 */
  35240. { { 0xc887027d,0x121ced27,0x2bfab286,0x6050f335,0x19d511e2,0x6e373c1c,
  35241. 0x7f4c69f5,0x02d4c3a9,0x25226bb4,0xe6f356af,0x83e7ac30,0x3b9011c3,
  35242. 0x33d8fdfb,0x43b0c23d,0xaf2ea363,0xa8c390f7,0x0000000b },
  35243. { 0x7e851bac,0xc430c3d6,0xa5f544fc,0x8991c389,0x67fba061,0x006bbc64,
  35244. 0x97cbdbf4,0xd49d024e,0x7734adad,0x4539b7dd,0x28cb6d2a,0x90ba8f9f,
  35245. 0x4de4b3ad,0x7a921830,0xa7b96928,0xb28732ef,0x0000006a } },
  35246. /* 144 */
  35247. { { 0x22ed5986,0x71dab52d,0x58533e06,0xdeee627a,0xcf155fe3,0xe8fee37a,
  35248. 0x7ae8b132,0xcd61490d,0x34a08b94,0x2706e185,0xf9c15c30,0xa85ffd52,
  35249. 0x51a5ad46,0xd5a224f3,0x54d700bb,0x44d1b6d5,0x000001e6 },
  35250. { 0x862e4e9c,0x96830686,0x48763fe4,0xfe5cd76c,0xc0839caa,0x60309679,
  35251. 0x8d83d62d,0xc0e4cbeb,0x11bc4ae2,0x911e254e,0x64fca062,0x96a0d7c8,
  35252. 0xe9a27045,0xf5785dd5,0xf3e0412c,0x2f4677d0,0x000001be } },
  35253. /* 145 */
  35254. { { 0xab01a6dc,0x4c0012dd,0xae1adb69,0x391bd6c1,0xb9b05079,0x3ae7daec,
  35255. 0x62a1061f,0xc2714f9e,0xa96536b7,0x71978ee7,0x5e17654b,0xeec11bd0,
  35256. 0xefab3dd4,0xc71166e0,0x87edbf61,0x0f7aa572,0x000001d7 },
  35257. { 0x51eb5932,0x26ea6f7d,0x5f882ca4,0x354ea0aa,0x7739f7dc,0x175b6097,
  35258. 0x9be57934,0xd335192a,0x78545ecc,0x9801f423,0x7b643c9d,0x32b8e256,
  35259. 0x23e3abec,0xb9411dd7,0xcf1c6509,0x656dea68,0x000000ee } },
  35260. /* 146 */
  35261. { { 0xa0890deb,0x4d38e140,0xbceb84bd,0xbf7bd87d,0xba041dec,0x51f0ff72,
  35262. 0xa6820be9,0xafeec70a,0x8c486298,0x755190a3,0xe7010ec4,0xecdba558,
  35263. 0x8c7879b1,0xced91db8,0xef5e215c,0x08de3e4c,0x0000014c },
  35264. { 0x16266da2,0x9c1534ed,0x7b4c9009,0x9ce322eb,0x69927688,0x37decaef,
  35265. 0x05c2844d,0x6525097f,0x1ac519ab,0xd23b7e13,0x65a3cc86,0x682ebb72,
  35266. 0x628c4575,0x0c531db9,0x73805373,0x2e00e8b8,0x000000be } },
  35267. /* 147 */
  35268. { { 0x57ed32e9,0x3807c800,0x7c024997,0x427e40cf,0xabb54830,0x58506abb,
  35269. 0xce820bf4,0x5649776f,0xb2c43e81,0xb5353293,0xcfef6648,0x671e8353,
  35270. 0x903bdca5,0x27217d3f,0xa813fd79,0x40a9c109,0x000001dc },
  35271. { 0x3db21a38,0x6beaa6c3,0xd73ef7e4,0xcae222e1,0xbd1d507f,0x1ff684e7,
  35272. 0x587a77ab,0xf5bac664,0x0c64a4d6,0x58c74f62,0x6a7c378a,0x4ca837d9,
  35273. 0x3e42e409,0xf43df531,0xfb49e14f,0x8a9a4347,0x0000013f } },
  35274. /* 148 */
  35275. { { 0x992f8923,0x85ab4edf,0x6fd209f3,0xe24aa5e0,0x1b1340ee,0x27be9b87,
  35276. 0x91e0bb40,0x2957d11f,0xf3d4c62c,0x425afad2,0xc7ff7aaf,0x2d231286,
  35277. 0x0114cbe9,0x96412b2b,0xc3e23529,0x6706a231,0x0000019f },
  35278. { 0x225c02af,0x06b3bbd2,0x3fa3e98d,0x53ebc166,0xb84f482e,0xa6df2b75,
  35279. 0x2bfc55df,0x912b4521,0x512a73da,0x30bdbd40,0x3d53eaa4,0xac0f43d9,
  35280. 0x0c27fd53,0xfc358fe4,0x919424b4,0x2cb183be,0x000000a3 } },
  35281. /* 149 */
  35282. { { 0x3fa6a746,0xe39b0c2d,0x1d5a24a8,0xe84a7922,0x78cdf2b5,0x70a58914,
  35283. 0x30666cb3,0x8a88067d,0xf6d71d06,0xb09a709e,0x0065d184,0x50007a3e,
  35284. 0xb8dc9448,0x7046af4b,0xc65493ac,0x2b6a3129,0x000001fd },
  35285. { 0xe45f2771,0xd3d5d5bd,0xf432ed95,0x8542b08a,0xf232a6bb,0x2ecd40fb,
  35286. 0xe8beccb2,0x0fcb6143,0xbf8e247f,0xcecc513a,0x8da3039b,0x955d56f7,
  35287. 0x56c2a0df,0x9157c619,0x3031fe2a,0xa6d35cbf,0x0000018c } },
  35288. /* 150 */
  35289. { { 0xbe0c4923,0xdd800b1b,0x6902907b,0x046ae740,0x957bd0c7,0x2398b37f,
  35290. 0x9655f8b8,0xaa8e1a9d,0x500f4150,0xcd2927fa,0x202e7aee,0x826a9c6d,
  35291. 0x9f29692e,0xb4cf58b3,0xbf41577c,0x3093868c,0x0000011f },
  35292. { 0x333ed442,0xadcb5e7a,0x906fef7b,0xae5c8e2f,0x3d98f228,0x2d9b0123,
  35293. 0x7ffe125c,0x4632f2da,0xba231835,0x59487731,0x12d2c512,0xa0caae5b,
  35294. 0x9857d9c4,0xbf00e658,0x54f200f6,0xc5d10086,0x00000172 } },
  35295. /* 151 */
  35296. { { 0x2fc283e0,0x58954046,0x7ee0880e,0xf7633984,0xb7fd1622,0xfaf1b40e,
  35297. 0xf598c5ed,0xecf5151e,0x7e00d9bb,0x6b4d92f7,0xa8c43fd4,0x7543e3b3,
  35298. 0x6511d1d2,0x3994e12c,0xaf05b6d3,0xdd841a1d,0x000000c6 },
  35299. { 0x23b991ad,0x23da17e0,0x71fba514,0xaab2b213,0x0ddc1879,0xb417ec5a,
  35300. 0x5f63acdc,0x173bc8ad,0x1e2a7d50,0x2fcf5210,0x6106d008,0x63373fd0,
  35301. 0x7db012cf,0x1e8211de,0x576545ef,0xa07766d9,0x0000018c } },
  35302. /* 152 */
  35303. { { 0xaf80dfaf,0x8e4347b9,0x9c4667f3,0xa80b631f,0x6ddbc238,0x6ff1db26,
  35304. 0xaa8718a0,0x6161e365,0xaf31c35f,0xe7f7ac90,0xfc6846e8,0xc03831d1,
  35305. 0x684175b4,0x1e669d10,0x934b731a,0x6da9d620,0x000000c7 },
  35306. { 0xa3e4e78b,0x981f597b,0x55099f9a,0x2c14dedc,0x93088c61,0xbf373995,
  35307. 0x9b207458,0x7c568307,0xa2276900,0xc4440c47,0xf7e6daf3,0xb6df23c8,
  35308. 0x42929103,0x4f662c25,0x8b3b7963,0xf4ea6db1,0x000000f9 } },
  35309. /* 153 */
  35310. { { 0xced36049,0xc669eb88,0xf41b99f8,0x87a4ffe1,0x6a72e108,0x690b7563,
  35311. 0x65a0bb8a,0x67dd6a8c,0x96e42955,0x42cf8c58,0x1aabffad,0x5286b5f3,
  35312. 0x8f6f26a4,0x1f7dfaf2,0x0e1ae503,0xc5d9e0ac,0x00000120 },
  35313. { 0xacc10da7,0xafbee3ff,0x944946e5,0x67e2d5f9,0x3c4220ff,0x8ec17e86,
  35314. 0xbd6f632e,0xfe6f7414,0xc3fc9ef4,0x4a9e3c0f,0x03bfb870,0x25ff3cba,
  35315. 0xbb03342d,0x18fd3600,0x0050cd2e,0x1e63e753,0x000001ac } },
  35316. /* 154 */
  35317. { { 0x8f3d6a02,0xdd83d07c,0x7ef4d0d1,0x71fc143c,0xd4c7af61,0xca994bf0,
  35318. 0x827c5cf0,0xc8a93e98,0x2b697882,0x4a102c7b,0x8a55e8ba,0x633c87d5,
  35319. 0xcc2d64f0,0x1ae8822f,0x986d01fc,0x2ce9b53f,0x000001c1 },
  35320. { 0x95dc1b79,0x859639fd,0x3f4e616a,0x2728f754,0xede2fb9f,0x6e703c4c,
  35321. 0xd50fae9e,0x042f7680,0xc2d530ed,0x0546bc3b,0xcdd598ac,0x00a4006b,
  35322. 0xe1294910,0x3f3286c9,0xb6bf9629,0x77782255,0x00000146 } },
  35323. /* 155 */
  35324. { { 0xe30c98fe,0xaf81421e,0xfc2cd705,0xdeb0feb0,0x14df6ad2,0x9b2c4ca6,
  35325. 0x9ba314e8,0xd38134de,0x4f04b16d,0xa443deb8,0xf07f8ca8,0xfc556ee0,
  35326. 0x3a4f3917,0x3c1c83bb,0xb1adcd41,0x8397dd24,0x00000199 },
  35327. { 0xdf4781e6,0xca01e17e,0x46f1f901,0x32d7c319,0xb53090da,0xa227a613,
  35328. 0xa7c8c607,0x2495b1dc,0xddc69709,0x1cf2fbee,0x45608098,0x1d3d82bb,
  35329. 0x085134d7,0xcfcddda3,0x96798c41,0x3dd171b5,0x000000d2 } },
  35330. /* 156 */
  35331. { { 0xd4dd7e96,0x97a40f84,0x8409fc0c,0x7114c8ea,0xa9d11393,0xc56f29e6,
  35332. 0x8fd8c6d6,0x3b606621,0x00269e7c,0xad3baa86,0x05929d5f,0x1413c6b0,
  35333. 0x222e365b,0xc1ad7e40,0x4798aaec,0x6a82621a,0x000001d3 },
  35334. { 0xc1003c81,0xaeac45c4,0xf43d8602,0x9ef9ef5a,0x60f77469,0x36a65f5e,
  35335. 0xbf5d2858,0xf312e7ab,0xc84acef1,0x2f53ec81,0x9d248b52,0x63e32ca2,
  35336. 0x81e65c60,0xfe9aa7c5,0x52841973,0xe3686c9a,0x00000017 } },
  35337. /* 157 */
  35338. { { 0x9e90de99,0x0b2efe65,0xad05ab63,0xbe4485bc,0xe14e4892,0xc48a6a52,
  35339. 0x22628687,0x2ad85430,0x5eb3db54,0x261f0e95,0xd45e5841,0x48e81863,
  35340. 0x8ed75739,0xcfe1ce0f,0x7d84ade4,0xbd6f1ff5,0x0000003f },
  35341. { 0xd1bf968c,0xd43711dd,0x48dfa472,0xd558d7cd,0xe425a566,0x49f09223,
  35342. 0x5c26d041,0x0cf83338,0x7c2c1743,0xbe7b81f1,0x5143d9d9,0xe3bdc33e,
  35343. 0x94fd3fae,0xf385ac35,0x9fd1811a,0x7551cf42,0x00000113 } },
  35344. /* 158 */
  35345. { { 0x20193bb2,0x4928f55b,0x7310b872,0x96e579d0,0xd345d276,0x5ee06309,
  35346. 0xa871868a,0x9a43e432,0x11038683,0x28c113e1,0xa332f108,0x8286ecf3,
  35347. 0x0385cbb4,0x3348aa37,0xef158daf,0x698ffcaa,0x000000c6 },
  35348. { 0xf6908745,0xa044c54a,0x6a3353fb,0xa6b336e4,0xd561e821,0x694c2852,
  35349. 0x3634917f,0x1b297970,0x81f61315,0x6e1023b9,0xef46a5ef,0x6817dc2b,
  35350. 0x8e114f7f,0x93dea0af,0xed72c5bf,0xc3cf3cd5,0x00000136 } },
  35351. /* 159 */
  35352. { { 0x7b080de4,0xbb8799ab,0xd69d8396,0x3b8f781d,0x986f8f63,0x76b42aaa,
  35353. 0xa54bc5ca,0x5d74c038,0xa9c2fbb9,0x76fcb605,0x80178930,0x8451b440,
  35354. 0x9d286f0d,0x40f00c38,0x0c543263,0x3038e952,0x0000014c },
  35355. { 0x6977aad9,0xc94bc381,0xd7087be3,0xadbfd082,0x875fed08,0x06d0820c,
  35356. 0x345656fc,0xe1ce84d4,0x0fd6dd4e,0x71c4d8e0,0x6a5fab40,0x23338b22,
  35357. 0x0baeeb6f,0xd477eac1,0x5f80c26c,0xe4db08bb,0x00000078 } },
  35358. /* 160 */
  35359. { { 0x1078342a,0x0111d12a,0x559a1064,0x0534725e,0x0fd3ffdd,0xea459d59,
  35360. 0x06f0ac1f,0xcf694a9f,0x3e19bc69,0xf6d24adb,0xb9ddcd00,0x3ce38f5e,
  35361. 0xb632dd4e,0x38400f66,0xe15e1c55,0xcab8fdfb,0x00000085 },
  35362. { 0x8d09422f,0x0a943f6b,0x0f988c3b,0x17d29756,0x2ef2e4d9,0x55a441fa,
  35363. 0x35f7c13f,0x6743523b,0xedaad3ff,0x274d3407,0x9347242d,0x59411435,
  35364. 0x3bb8615d,0x1cb27301,0xbd7794cd,0xa0437004,0x0000007d } },
  35365. /* 161 */
  35366. { { 0x2d712c44,0x824b99a6,0xa6962577,0x148368f8,0xd65e2287,0x8ed68432,
  35367. 0x6f5bc5f8,0x14028306,0x4ec3479d,0xe6cf3121,0x9326db70,0x96db6f44,
  35368. 0xca32936b,0xca5ac098,0x2fea21af,0x69e248c7,0x0000004d },
  35369. { 0xa71269fb,0x0aa89092,0x18650b60,0x2f6bdba8,0x9fb55db2,0x1d9cc2a3,
  35370. 0x6311e9d0,0x0fceb0df,0x90ac2c1d,0x6faeb79c,0xcb1f372a,0x2393b222,
  35371. 0xbc8c4193,0x62a6f3df,0x2fe8e674,0x9dea30b2,0x00000001 } },
  35372. /* 162 */
  35373. { { 0x12b3118b,0x7df689ac,0x6cb6ea56,0xd06ee39d,0x187cd978,0xcfcc22c2,
  35374. 0x8d537d87,0xb985b681,0xe9f56db2,0x75845152,0x5e098c15,0x0f839871,
  35375. 0x3b212cd2,0xbe96a5c8,0xd9ac1c47,0x3dda0338,0x000001fb },
  35376. { 0xcfa0a9b8,0xf06b7fe0,0xe22dcf75,0x9478bac7,0x136887c8,0xf3815e04,
  35377. 0x914c54bc,0xed811dde,0x0f51ea64,0xc8c24160,0x4c870577,0x63914d83,
  35378. 0xa8abbcb4,0xed24e552,0x2644f52e,0x9e5eb9e8,0x00000001 } },
  35379. /* 163 */
  35380. { { 0x66d52313,0x1f65a04e,0x4d3f72bd,0xfd694545,0xa6b7ae11,0x2bc0ddaf,
  35381. 0x571ab247,0x921f79d8,0xae5a8d68,0xd4c5f966,0xaec5ce13,0xfde17716,
  35382. 0xb764bd39,0x70e6eda4,0x990d6783,0xffe94085,0x000001ef },
  35383. { 0xd88f92e8,0xf3fa0e27,0x9c77123c,0xa21ef0fd,0x89274dba,0x6259974c,
  35384. 0xb9ba2762,0xd4cfa4a5,0x46ebcaf6,0x10c909d2,0x8f8e2870,0x0317a10d,
  35385. 0x453aeea2,0xb0771de1,0x68c6b0a3,0xdf0c4791,0x000000ea } },
  35386. /* 164 */
  35387. { { 0x4c854477,0x11bc1e48,0x8638e47c,0x2bec25b4,0x869c54d9,0x43d4e02b,
  35388. 0xbe1e7ed2,0xe318de32,0x6b460c4a,0xf5471eb0,0xaa426afe,0x38ae7bf3,
  35389. 0xd8452dc1,0x23ae26dd,0x5782de9d,0x9d3fc1d5,0x00000164 },
  35390. { 0x0ade1979,0xd87cae31,0x3b4bc728,0xa847041d,0x56c3c9be,0x38923c40,
  35391. 0xd74ae467,0x36fe182a,0xecbe49ae,0x92bff6f4,0xdc41f9f5,0x6680db80,
  35392. 0xe4630715,0x35bac06f,0xd6d07307,0x6d68b4c7,0x000000c0 } },
  35393. /* 165 */
  35394. { { 0x854dfcf2,0xdbe22be7,0xa6ae3bd0,0xee21a7df,0xa521ec46,0xf4633ad1,
  35395. 0x41a9484c,0xee94527a,0x2aa123f3,0x1145eb9b,0xcae3ca92,0x5634a82a,
  35396. 0xfc85d925,0xe176aca0,0x19082d8c,0x504cf7fc,0x00000078 },
  35397. { 0x3799793c,0xd74ce7c4,0xb5519fb5,0x74ddd618,0x95ff9808,0x2cf6df93,
  35398. 0xb8bf61e6,0x00ea45d1,0xdcfcf54f,0x26863613,0x030035b0,0x67423b76,
  35399. 0x4028a9cb,0x9fbc7534,0x051a077e,0x7b52ce37,0x000000f4 } },
  35400. /* 166 */
  35401. { { 0x96bec962,0xebf7d8ad,0x17e0107a,0xd1cc81f6,0x214e1058,0x64c44509,
  35402. 0x42394c9f,0x6c298c43,0x1a660513,0xd910052d,0x90df8243,0xc3643754,
  35403. 0xfe5cdea4,0x2313be1e,0xd27fb7b1,0x249a60f7,0x00000076 },
  35404. { 0x1cf593a0,0x74975838,0x8364c59e,0x0c9ceefb,0xe05c9991,0x2f5a1333,
  35405. 0x421808e3,0x30ea5e1f,0x4f5e8f4f,0x56fb3a4f,0xb6c0cb47,0x2cae6e2e,
  35406. 0x08bdcc6a,0x60b307fd,0x0ff8c117,0xee17901c,0x0000001a } },
  35407. /* 167 */
  35408. { { 0x89aa9e14,0xc048336b,0xf676700f,0x66634271,0x906b6980,0x4daa0433,
  35409. 0xebb7ab23,0x30247ee1,0xeb59a053,0x969b4aa7,0x8000f4d5,0xd78ef825,
  35410. 0x46026b5b,0xe5db38eb,0x7d6856c4,0x06a43e5d,0x0000003b },
  35411. { 0xed2a0ee7,0xaa0ae838,0xf16e8813,0x04bbe528,0x4ea64137,0x8ab6df5c,
  35412. 0x06e29867,0x5be80cb6,0xf459ed2b,0xf19b1b72,0x1761521a,0x7a9cce4d,
  35413. 0xaa516f3b,0x39aff994,0xb3416925,0x97d92e86,0x00000007 } },
  35414. /* 168 */
  35415. { { 0x5af3a8ca,0x25aeede1,0xa5c351ec,0x33924782,0xf93ec080,0x41e7a3fb,
  35416. 0xe6f425b4,0xb04f93c4,0x81e76009,0xe4ec12ec,0x5180ffc6,0x797366d4,
  35417. 0x0e0aef3a,0xd293cbb5,0x68d71d91,0xa1496944,0x00000061 },
  35418. { 0x675a67a1,0xf52c541c,0x8f5fe906,0x67d38d30,0xf6be988e,0x2a70bccc,
  35419. 0x18589886,0xae03ecbe,0x7067045b,0xecd02616,0x10ca8d96,0x1facdd99,
  35420. 0x30c0735d,0x7aa10a82,0x3328f21c,0x2a27e554,0x00000015 } },
  35421. /* 169 */
  35422. { { 0xe6057e27,0x3dd609e0,0xc7a454da,0x87e8b6a7,0x1f32dd5b,0xff599145,
  35423. 0xd0ef51e2,0xea397a88,0x25567546,0xc49866a1,0x3228b480,0xea45c8b1,
  35424. 0xdd01997a,0x3dbe0e77,0xc51867d2,0x0e2ea28f,0x000001f8 },
  35425. { 0x69d0820b,0x6295412d,0x1ea65a18,0x03173127,0xeb06380d,0xc27c8221,
  35426. 0x75fe9706,0x7ffd4efc,0x5a71d250,0x7b396a57,0xc7cb7543,0x61c80051,
  35427. 0xad4dbee3,0xe07db4d7,0x9b192d45,0x1c7481f4,0x00000143 } },
  35428. /* 170 */
  35429. { { 0x08e1cc4d,0x5eab2d04,0xad2dc1ee,0xe93758d3,0x5c9c7393,0x0ceb7dfe,
  35430. 0xd3379683,0x530d86a9,0xe24f86d7,0xef5283ca,0xf0b1bb0b,0xab5d1a64,
  35431. 0x54db4e3c,0x96aabc1f,0x3bc00c59,0x3e3d87cc,0x00000144 },
  35432. { 0x1d60e7b0,0xe50a8213,0x5d33d018,0xfc9b629b,0xfd05338d,0xc54aee42,
  35433. 0xe821c6ea,0x0678f2c0,0x06ac09cb,0xe5c9d75f,0x53018df6,0x83357513,
  35434. 0x0bf8c667,0x81ca6fac,0x9d0ae2dd,0x7fc8020e,0x000000e1 } },
  35435. /* 171 */
  35436. { { 0x1baaa5eb,0x8add4741,0x79bd8036,0x02cbb759,0xcdffed22,0xd8680c40,
  35437. 0x4e091141,0x1c23a8f0,0x20748b87,0x65d141ed,0x659e9289,0x586a1575,
  35438. 0x5006dbfe,0x7c68d7cd,0x22569a74,0xda0ad0df,0x00000148 },
  35439. { 0x7f9069d7,0xc8fcc5db,0x5c0531a4,0x2487d245,0xe9a2db3a,0xc5ab4899,
  35440. 0xb4fe9720,0x52bfd538,0xd27f35e4,0x73a04ca4,0xee2dac93,0x7cbbc549,
  35441. 0xff3ee7e2,0x0287229d,0x28da9360,0x3179878d,0x000000d0 } },
  35442. /* 172 */
  35443. { { 0x3b66c047,0x89b7e9bb,0x602a3e1d,0x22e65869,0xc8db9c00,0x44f82297,
  35444. 0xd08a74a3,0x0e76aca3,0xfcd398de,0xfbf1a71d,0x8320e66a,0x2fbb6eaa,
  35445. 0x179c9fc5,0xa82d0ebc,0x4e7ab2b4,0x4e00cf6f,0x0000000f },
  35446. { 0x4890c439,0x424c0e9a,0xbc35a6b2,0x37564a2b,0xd9b7497d,0x95a4479d,
  35447. 0x612de942,0xa1ff3f0d,0xe60d0033,0x358627fc,0x522417da,0x815da8c0,
  35448. 0xef6b8385,0x506104d4,0xf16e96aa,0x800728d2,0x00000120 } },
  35449. /* 173 */
  35450. { { 0xab039042,0x976f2372,0x9fa084ed,0x10e6978c,0x58bec143,0xd03fdd2f,
  35451. 0xfe2045c3,0x3200c101,0xb0a5a928,0xe6868f7a,0xe61faff8,0x26c95d1d,
  35452. 0xb7b12265,0xa1e20127,0xc2a5ed17,0x8e63dd78,0x00000089 },
  35453. { 0x22bba4ee,0xbb6533da,0xf496a574,0x3eff6397,0x14f2a6b9,0x409329f7,
  35454. 0x1dfdd73f,0xa08248bd,0x69bca1b1,0x62f33f2e,0xba2e0327,0x9a177e64,
  35455. 0x75ddf741,0xbc50e993,0x4a56bd1c,0xb87a979f,0x00000095 } },
  35456. /* 174 */
  35457. { { 0x67c1f177,0xe83736a9,0x600133c9,0x1b6d3508,0x6eac9a5b,0x9424bb92,
  35458. 0xc27ef31c,0x7a9c01a6,0x122b4870,0xad93bba5,0x9d1ac985,0x9eb94e2a,
  35459. 0xd53f175b,0x511c0206,0x5102d914,0xd13eb252,0x000000b1 },
  35460. { 0x675a1171,0xcfe7dbeb,0x16c0d2b1,0xb228295c,0x057c88ca,0x8db25b5a,
  35461. 0xd300e9cf,0x73ea9e96,0x269552eb,0xb0e0037f,0x9e0f98df,0xea9d035c,
  35462. 0xd290480f,0x860e49b8,0xc036b319,0xa35e9512,0x00000037 } },
  35463. /* 175 */
  35464. { { 0x8f00df48,0xc56729ee,0x11ac8304,0xb89ca7b6,0x8b3a8123,0x497a57f9,
  35465. 0xc21ca3ea,0xe0431b19,0xe2bb3ce7,0x45a73deb,0xadc77819,0x2f86cc2b,
  35466. 0xe5eb3df1,0x5ff005e4,0xdd27dcf0,0xf955dd7a,0x0000005e },
  35467. { 0x00ee402f,0xe0c22ffa,0x3b30bb4c,0x5b335e2a,0x643cb101,0x542551d0,
  35468. 0x3cd19688,0xc6183f45,0xf0be54b4,0xc6664f22,0x4c20cde4,0xa5f4cfee,
  35469. 0x80a4c475,0xdcaa972f,0x59111ed9,0xde4af200,0x0000019c } },
  35470. /* 176 */
  35471. { { 0xd771f428,0x9e9d0bc8,0xe43ca382,0x3ac1ecd9,0xeb93acf0,0x8d5ee480,
  35472. 0x065a2a3f,0x16232f81,0x2f0b8a73,0x1fc04faa,0x025474a2,0x4a8df7e7,
  35473. 0x3bb15f6f,0x51ac4ff2,0xe0950e52,0x66e21b73,0x0000006b },
  35474. { 0x67a41dee,0x59c98480,0x7b3e2b3f,0x2cfa95ae,0x891454e1,0x54d98386,
  35475. 0xeefca6a4,0xf0dddbdf,0x11e9cb75,0x5f691b24,0xfef208c3,0xa9b9e766,
  35476. 0x18b33cf6,0xe8df1000,0xd1c174a9,0xb8a55ac9,0x000001c4 } },
  35477. /* 177 */
  35478. { { 0x5c4cccb8,0xa99f5862,0x2ef4d3ef,0x70bf5209,0x89efc878,0x28f4e576,
  35479. 0xda14206e,0xa2366f96,0x7c52107d,0x90331a00,0xd4a0f0f0,0x478d4cea,
  35480. 0x472a47b0,0xb2899ee2,0x64207549,0xae96534e,0x00000110 },
  35481. { 0xcced05b0,0x2cc1d655,0x01759543,0xabac3f09,0x8e577cd7,0xbaeb70a4,
  35482. 0x40e98d6d,0x84b00893,0x603d24f1,0x26983653,0x2572173d,0x6e145883,
  35483. 0x611141de,0x1d348b26,0xefa27f34,0xe52257dc,0x0000006b } },
  35484. /* 178 */
  35485. { { 0xc947e655,0x92678f33,0x08923795,0xff0fb76a,0x790239d1,0xb2dfe745,
  35486. 0x3cdbb7ce,0xea087492,0x05f6d41c,0x21326db9,0x79dc5588,0x5b1ae9ae,
  35487. 0xe9c31702,0xe145340c,0xa2c38a9c,0x07502c29,0x000000c3 },
  35488. { 0xc156ace2,0x0c124f11,0x79ff2529,0x2c170fe7,0x6e1171b2,0x60df9a81,
  35489. 0x55de2797,0xa19bca83,0x7c6cc79d,0x1ad927ea,0x1d61f770,0x28590112,
  35490. 0x261c06bb,0xfe80c826,0xaa2642bb,0x4050d338,0x0000015e } },
  35491. /* 179 */
  35492. { { 0xeaad87bc,0xc9397829,0x81e84cbd,0xe0ac9367,0x6ade4fde,0xb579c24d,
  35493. 0x690d7f56,0x50b9aba5,0xd14fb0b9,0xf09b29d3,0x25a0e7b6,0xd0684f23,
  35494. 0x606f4ff3,0x0514e9d3,0xe8ad733b,0xe63bdd26,0x00000077 },
  35495. { 0xe0d25c6d,0x0afd06ec,0x00ba2dcf,0xdd90021a,0x8c5bb398,0x1b025770,
  35496. 0x198ff8fc,0x077f06d8,0xb7e2cd68,0x87d50ff1,0x263a3572,0xef75e057,
  35497. 0xfa925a9a,0xbf257892,0x739d0e95,0x847d3df0,0x00000111 } },
  35498. /* 180 */
  35499. { { 0xfec82924,0x52ab9cc7,0xa7220d69,0x1c76dd69,0xa06ef0e2,0xa63527de,
  35500. 0x27183904,0xab3e51c2,0x716807c8,0xf4db35ea,0x748f1246,0x8f3ede0a,
  35501. 0x41156095,0xf1493644,0x874b38de,0x5f6583d1,0x000000f7 },
  35502. { 0x0b927eb7,0xa39189e1,0xc2e2f127,0xa87c6359,0x7fe966f4,0x0b72c233,
  35503. 0x105e5585,0x102b8382,0xe58c39f9,0x63fee006,0x991b5329,0x3f052ee3,
  35504. 0xcbaff97b,0x7f5b854c,0x5f805060,0x935e5f6c,0x0000016a } },
  35505. /* 181 */
  35506. { { 0xdfd88d38,0xf19a0355,0xc549df40,0x555cd8e3,0x04d006e1,0x322729e3,
  35507. 0xfd0b0ce6,0xf16b706c,0x35f2ad31,0xf156dc09,0xf7a3df9f,0xb30c5213,
  35508. 0xa55e5fb5,0x9f29cc92,0x2b858da2,0xa0ecfdd4,0x00000144 },
  35509. { 0x52658a92,0xb5c115df,0xc4281616,0xbce3ed17,0x7fd92a91,0xa5595f70,
  35510. 0x9cd5d896,0x663c8bfd,0x5a9472b1,0x0776343f,0xb033e1bd,0x14e44ca8,
  35511. 0x1e5c02fb,0x27a1c986,0xcc4ffb32,0xece0f2c4,0x000001b5 } },
  35512. /* 182 */
  35513. { { 0x31211943,0x17127bab,0x5684325c,0x44a8cac6,0xd855fc3e,0xd2fe0b88,
  35514. 0xce91eea5,0x47abab0c,0x78ec7d12,0x5d23ddc4,0x0cd9fefa,0xa3986de7,
  35515. 0x82655766,0x32c7b867,0xeeaec7fa,0x3e54018b,0x00000087 },
  35516. { 0xb38d17c1,0xc96e86f2,0x71fa040d,0x9cbfbd0c,0xf88499cb,0xe111ab79,
  35517. 0xf71ec80b,0x1d47c5ce,0x46c89692,0xacaa3bc1,0x3d316331,0x5f921c0e,
  35518. 0xe768765b,0x31fa081e,0x41eff270,0xd5dafd5f,0x000000fe } },
  35519. /* 183 */
  35520. { { 0x4cda1348,0x8af10b9d,0x25c3013a,0xb0769fd2,0x8957c22b,0x450aa5b1,
  35521. 0xf5acf1c4,0x5cafd6c7,0x9fef8029,0xcf71a140,0xee089f5d,0xe12029f5,
  35522. 0x0fbd2ba8,0x9752a8fb,0x6f70cb58,0x61e2275f,0x00000090 },
  35523. { 0x1fbda16a,0xb70a4ac5,0xf1dfa2a2,0x79910e79,0xd9945f6f,0xba2ce132,
  35524. 0xeb4ba4ef,0x450d59ae,0x4bf2d53d,0x6a8e09b3,0xe620c7a8,0x76010204,
  35525. 0x0a53c6f4,0x63f8943d,0x87eaf56a,0x14c91d19,0x00000132 } },
  35526. /* 184 */
  35527. { { 0x490d66c3,0xe54fb120,0xa0dc8204,0xeaed7328,0x04b4294d,0xba014c38,
  35528. 0x31ddc467,0x3f2fa2ab,0x8342ed11,0x70ff55ea,0x23034e0e,0xb18da72f,
  35529. 0xbd8ae3c1,0xadc30dbe,0x3e945a02,0x179bdf6f,0x0000009c },
  35530. { 0x7484c26f,0x46c928ef,0xef2adbb1,0x206b7db1,0x3f58dda7,0x0887f548,
  35531. 0x4bc7edb6,0xfde4e20c,0x975cafdc,0x484d121d,0x86beec20,0xc5b59670,
  35532. 0xa6d6db67,0xb579aa88,0x41187488,0x22c6d87e,0x00000015 } },
  35533. /* 185 */
  35534. { { 0xc471d4ae,0x0a890757,0x43a1da76,0xfef4b1a5,0x6aa701a1,0xb892b182,
  35535. 0x59c65f93,0xbf4d4e52,0xd789df35,0x923af929,0x0b79c3f2,0x3ccb46c6,
  35536. 0xcf4cf130,0x95582ce7,0x257f0ec4,0x7da081b4,0x0000011c },
  35537. { 0x9aeef274,0xf92c6ae5,0x1437c083,0xe6c5bf4f,0xe13c86af,0xaa74b023,
  35538. 0x2a225360,0xd21dace6,0x22589fa5,0xb3d572b8,0xdfa74b0f,0x3d4a3916,
  35539. 0xb12891a9,0xe76cd8dc,0x59f4cfbd,0xa0391a3f,0x0000019a } },
  35540. /* 186 */
  35541. { { 0x203fc3f1,0x054ba69e,0x62106a29,0x09168ccb,0xaad5fa9f,0xb0818540,
  35542. 0xbff7ed6f,0xecb8f20e,0xbef94afd,0x2c80a618,0xb0abd1db,0xe25d8ca0,
  35543. 0x028e0a7c,0x75e67a41,0xd6e95b9a,0xdd7662dd,0x000001b2 },
  35544. { 0xf289d7ee,0x87dff279,0xeea2205c,0x4d755d59,0xc18adac6,0xaeb0fd54,
  35545. 0x7ec01019,0x3a8c46cf,0xb48d70a4,0x6fc90e7e,0x10b39ef8,0x965c53c1,
  35546. 0x38545a20,0x455777cc,0x57dd023e,0xa33430f7,0x0000016e } },
  35547. /* 187 */
  35548. { { 0x0ff53d2c,0xfa9f3949,0xb00349b9,0x8dc91596,0xd5997967,0xf10a5014,
  35549. 0xa8a6b78a,0x4dd72dab,0x8b517b10,0xef5de540,0xa6d39be0,0x142b90bc,
  35550. 0xeda17f70,0xcaeaa3e9,0x06b31118,0xa01689d6,0x0000016d },
  35551. { 0xf46afff7,0xea6ca563,0x34a5e5f3,0x3945c7ba,0xaa998fd8,0xc1ffe4c8,
  35552. 0xb63f535e,0x42a60146,0xd1f509e5,0x50816888,0x9f8cd0db,0xd1918daa,
  35553. 0x78a36772,0x6505e6bb,0x9cc6dc66,0x4ab03a81,0x000001ef } },
  35554. /* 188 */
  35555. { { 0xd376d986,0x06089d14,0xa2dc35b0,0xd0f4e077,0x53ff2c86,0x1c11709a,
  35556. 0x123c3fc8,0xfef4ba45,0x1b656fc2,0x852cd5a7,0x1fefa8bb,0xb57c7489,
  35557. 0x48110b77,0x8f05383e,0x52c5a129,0x4b55d3ad,0x0000004c },
  35558. { 0xf3827633,0x5110cff3,0xe00afe96,0x086784d5,0x3ead32fa,0xcb387882,
  35559. 0x2b91cd86,0x3dcf4d16,0xe6f3638a,0x078b6a58,0xe8b7fd42,0x33792112,
  35560. 0xee5683e7,0x6964044d,0x28e28433,0x3b84210f,0x00000122 } },
  35561. /* 189 */
  35562. { { 0xc3ebeb27,0x6c28a9a9,0x3ef590f8,0xd7bcdcb5,0x4dae7f37,0xe88a2e11,
  35563. 0x726ea7c9,0x033522e4,0x8c141388,0x99d50386,0x61621575,0x59b1aeca,
  35564. 0xfcc564d8,0x719fcfeb,0x1aeb8e36,0x3a577af1,0x00000043 },
  35565. { 0x6feba922,0xc3f26ce0,0x475a5693,0x5f6c83ee,0x28bf378e,0x7f796740,
  35566. 0xbdc3f6f1,0xd2a5e368,0xa6ed90ae,0x3d034a0a,0x4a47cbd5,0x3b1c3a4c,
  35567. 0x4dce2bc8,0xa4f0aa6e,0x74ca00eb,0x97c7af43,0x000001c0 } },
  35568. /* 190 */
  35569. { { 0x79c28de7,0x00377178,0xab9c330c,0x617aa2aa,0x66bc61eb,0x43081826,
  35570. 0x4d78b504,0xe0b5b5cf,0x9870fc72,0xd76a752d,0xd40b7bc5,0x3b4689f5,
  35571. 0x87f2d03a,0xa97fd867,0xfd6060a9,0x6ab7b5ee,0x000001c0 },
  35572. { 0xffb71704,0xe99eadb1,0x390fe3b1,0x436e58bb,0xab4f19aa,0xeecab82c,
  35573. 0xe0f3d9dc,0xda492dfa,0x6e20ad12,0x2a0f54bd,0x7dbbd262,0xaf89fa0f,
  35574. 0xe8d2eb54,0xdcc50a1a,0xef7d0758,0x9799f816,0x000000b7 } },
  35575. /* 191 */
  35576. { { 0x104f98cc,0x9ec46462,0x72aedeae,0x45115922,0x7e62186f,0x7ae93dd0,
  35577. 0x8d6d69b6,0xd17ce026,0xfd43a8f3,0xb5347608,0x7c0ab797,0xe87f1c13,
  35578. 0x139f991d,0x3bf597a8,0xe547e0d6,0xe293a85b,0x0000008d },
  35579. { 0x8ef668b1,0x0982add3,0x611c9764,0xc54e6b2d,0x1c1d4263,0x3ce76b12,
  35580. 0xeff64e73,0x3134b28e,0x2871612a,0xaf71a9ac,0xba093594,0x31c88af2,
  35581. 0xba9108e8,0x0b649112,0x5cf437da,0x8febc5c5,0x00000113 } },
  35582. /* 192 */
  35583. { { 0xc4a2daa2,0x7e9ca589,0x400f608c,0x18ea703c,0xd5175103,0x6f8cd058,
  35584. 0x4abb6f29,0x26493472,0x94296ab4,0x0be553e1,0xac51657d,0x9af9398f,
  35585. 0x4f880ea8,0xe232deec,0x67b1e1b1,0x2f81761e,0x00000137 },
  35586. { 0x3a20f662,0x51014bc7,0x49ed9502,0x1fb7e77c,0xb62b9652,0x89f5096f,
  35587. 0xa2e8d37e,0x3a659c67,0x5804170e,0x0f2b2a26,0x9ed50a34,0x1674fce6,
  35588. 0xfdc3c00f,0xaaa4537e,0x4ce99d93,0xf3c3bfda,0x00000198 } },
  35589. /* 193 */
  35590. { { 0x81614189,0xbab1f5cd,0x24b259f7,0xc7d56c45,0x45fb415e,0xc7baa4b2,
  35591. 0x7af6bef9,0x302bc8dc,0x74b48e82,0x91b770e0,0x9b6d1b1f,0x4a1336e0,
  35592. 0xe6680c97,0x285c1357,0xc7ccb625,0x59bcb813,0x0000012d },
  35593. { 0x7c019927,0xddad83b4,0x630dfd5b,0xe10f2667,0x31e05d23,0x15dbec5a,
  35594. 0x456ac460,0x2aa6e5fa,0x243cac82,0x46956529,0x4dc8c9e9,0xc69c9c7f,
  35595. 0xe24a4065,0xadb27e09,0xae41301b,0xdfa7a34e,0x000001cc } },
  35596. /* 194 */
  35597. { { 0x59cb1a7d,0x176a864d,0x6aefb8ee,0x4d864ca3,0x1c22b0d8,0x0ee83acb,
  35598. 0xd980df1d,0x7e80a6eb,0x7f94ced9,0xf582acc4,0x3a72c115,0xa29cd123,
  35599. 0xc7107bb7,0xce12a2a8,0x4ed80a30,0x0229ca56,0x00000150 },
  35600. { 0x2f1c180b,0x9774bad5,0xd749aa10,0xd08be998,0x56dbd1ba,0x978c48ab,
  35601. 0x0afbea9a,0x6ed3e3e4,0x153dc5fc,0x8a8be97b,0x9be93ed0,0xadc7f095,
  35602. 0x2cee23bd,0x8d242908,0xdc2729de,0x417523c6,0x00000016 } },
  35603. /* 195 */
  35604. { { 0x6c14a31e,0x74eeccf1,0xb2de3c2d,0x488e2534,0x7cec43c3,0xf9bb3599,
  35605. 0x916ac936,0x4210459d,0x9f7e4400,0x71d15c02,0x44553583,0x8c9c7c12,
  35606. 0xec94a467,0xcc97548d,0x3167bad9,0x4ca67818,0x0000014e },
  35607. { 0x8d0312bf,0x033af055,0x54161e66,0xbd1bf4f5,0xfa41781d,0x259945a7,
  35608. 0x00eef1d5,0x33494da8,0x79c3b8d0,0x6c505ec0,0x1c9f6e69,0x70ae1ade,
  35609. 0x76830aaa,0x0288f0c1,0xa62a060c,0x7f4cfe3b,0x0000000c } },
  35610. /* 196 */
  35611. { { 0x057d6006,0x0d8b447d,0xfd71c8b0,0x38b976e6,0xabcf40f5,0x5e77e029,
  35612. 0xf103a783,0x13bee386,0x5e472c4b,0x20a6ac20,0x31fcb194,0x43b045f6,
  35613. 0xc00abf49,0xe5dc1d9f,0xa5556b79,0x28c0bc70,0x000001b5 },
  35614. { 0x8a8640b8,0xba9d07ee,0xd0e34012,0x25611023,0xbe24ae89,0xc7ce655b,
  35615. 0xfa579dcd,0xe358e524,0x377bbfe5,0x57ce2715,0x3c0947e4,0x64651c6c,
  35616. 0xf4a97826,0x5fbd8d50,0xe2e1c15a,0x6fcdd28f,0x0000008d } },
  35617. /* 197 */
  35618. { { 0x5c7202c8,0xb564a2f6,0x5a54b0d8,0x7d634052,0x1434fbf5,0x8414d672,
  35619. 0x1d9830a3,0x8114215e,0x5ef0fbe1,0xc7a758d5,0xe6f57f9f,0x5705dcf8,
  35620. 0xd92269d3,0x5dd49a56,0xbdb49f97,0x8f015d7a,0x000000f1 },
  35621. { 0xb4799ce6,0x07131110,0x2cbcb7db,0x35bbfb99,0xf7ba21e2,0xc1f00c9f,
  35622. 0xb18f49fe,0x009d6913,0xabcf959b,0x8da61951,0x0d42146e,0x0e687213,
  35623. 0xae5f23f1,0x55832817,0x9ae7386b,0xc9b5bb68,0x00000143 } },
  35624. /* 198 */
  35625. { { 0x48c74424,0x423328db,0xd19cb2eb,0x32616e11,0x40d6e217,0xe534192a,
  35626. 0x0cbdc752,0xdd83a94c,0xd733bb01,0x5c623050,0x5b7a4520,0xcd0d631a,
  35627. 0x9a4011c8,0xccdc0a25,0x646e7cd5,0x22f112cc,0x000001e6 },
  35628. { 0x3e1e4c4b,0x47d6e29a,0x9fb1548a,0xd5f82538,0x4fd3e319,0x7e3705b5,
  35629. 0x0a08b966,0x8c4ce59a,0xd8cbe8db,0xbca749e7,0xaeec3d75,0xcc4496ea,
  35630. 0x8a1a313d,0x17dc723a,0x8ceb9360,0x250ff77a,0x000001a5 } },
  35631. /* 199 */
  35632. { { 0xfe29bd79,0xa55a0726,0x4f990b34,0x6574a810,0xaad56983,0x6906946d,
  35633. 0x50d41fef,0x0e580ab9,0x6e6f7f45,0xbc75b514,0xf0f3718a,0x508cc97b,
  35634. 0xa5634087,0x51ba2ca4,0xe64d8910,0x75c39077,0x00000172 },
  35635. { 0xf77ca6bd,0xf37cccaf,0xbdb18df5,0xe0a0df41,0x019e01f7,0x9f46cff8,
  35636. 0xaa65d72b,0xbe4f3d44,0x6e3663e9,0x7822d8ac,0x3ef9db6d,0x5f37f922,
  35637. 0xabe4a9aa,0x7f0ad39d,0xf69cc8ba,0xa0a57c70,0x00000098 } },
  35638. /* 200 */
  35639. { { 0x00fd5286,0xd9c50cf4,0x72a4b03c,0x1ea5b9d5,0x051ae73e,0xf5e60f9e,
  35640. 0x951b3824,0xfe9b5142,0x9fb4d667,0xb034b2d0,0xedc50856,0x4b537a80,
  35641. 0x8cb0022e,0x69ee1012,0x6a548aee,0x7c8b9e5c,0x000000ed },
  35642. { 0xd933619b,0x746007bc,0x2b9dfe19,0x0ce7668e,0xcc6e2a2e,0xa9eed5d3,
  35643. 0x7eebf32f,0x35a14f5f,0x67cc4f64,0x75cb898d,0x7850c16c,0xcb2185fc,
  35644. 0x45f79c96,0x09874a76,0x27db4744,0x7468f8ae,0x00000139 } },
  35645. /* 201 */
  35646. { { 0xc88684f6,0xc5de68ad,0x619a7dbf,0x7c1edaab,0xb27a18f5,0x258d1735,
  35647. 0x8ecd89eb,0xb27e7b65,0xd879f7ea,0x3d8889c6,0x67d5befb,0xa8fdc96d,
  35648. 0x37bad73c,0xc84d86ae,0xce8e56d7,0xc7e91976,0x000001a4 },
  35649. { 0x6319ffa6,0x5001a540,0x134ec04c,0x0cae64ec,0xd541242c,0x1f69a96c,
  35650. 0xbf2caeee,0x9da259ee,0x28bee805,0x88e7978c,0xb8e890e4,0xe9484beb,
  35651. 0xfb227fd9,0x0e5246d0,0x625d6318,0x8be2a54a,0x000001b7 } },
  35652. /* 202 */
  35653. { { 0xf472f13a,0xa223554a,0x5733e91c,0xfac993b7,0x96c168a2,0x26afe9f0,
  35654. 0x4b127535,0x7cfe761d,0xe77070ca,0x84301873,0xc7e7cdf6,0x66b6aaad,
  35655. 0xa1562ed4,0xda2dd5ea,0x39faf8d8,0xa81a2e00,0x00000016 },
  35656. { 0x4e3de3bf,0xa880759c,0x52f3088a,0x0c1e2e11,0xaa7eba5b,0xcb2ded9a,
  35657. 0x9f9c11ca,0x4c65d553,0xb0dc5c19,0x0ab9bd87,0xca3f4b61,0xd32f8c96,
  35658. 0x28cb5f9f,0x49842fcc,0xb90e21df,0x31ae27cc,0x000000f4 } },
  35659. /* 203 */
  35660. { { 0x6a0ccd0a,0x3b2a0a0d,0x5993b555,0xa3eeec82,0x9de672a6,0xb13486fd,
  35661. 0x0da05dcf,0x8d9c5148,0x6739874d,0xc4aa444d,0xe29a35c9,0xd9cf35b2,
  35662. 0x89177ead,0xd6bd9b5f,0x2a0470a1,0x9af0f59d,0x000001d6 },
  35663. { 0xba7535fd,0xb2f844c7,0xa842ff39,0x45bd4c3d,0xe951974b,0x5fe149ed,
  35664. 0xfd4453ec,0x6982e997,0xe6c37c0e,0xa63f705d,0xd2c3ef6a,0x09b0f6a9,
  35665. 0x1776a8d6,0xbedd3586,0xede11b78,0x4048a46a,0x00000176 } },
  35666. /* 204 */
  35667. { { 0x51a251d1,0xa47c6ee5,0x0d279dfd,0xbef4bf12,0xec518a28,0x4c2d538c,
  35668. 0x3880be6e,0x1b2b7887,0x1be9b20b,0xc69ccf8e,0x3796a19e,0xe41dfeae,
  35669. 0xfb50bdea,0x25676fc9,0x03e180c0,0x8b815a05,0x0000016a },
  35670. { 0x53f5ef65,0x2ca085f6,0x77b25105,0x61dfbbf9,0xa3346fe6,0x88ea87e3,
  35671. 0x1b95f7ef,0x25ddfdee,0x5b65eaec,0x22074e69,0x4c2e023b,0x11869a15,
  35672. 0x42e83bb5,0x8601b577,0xfa877e7d,0x1464652c,0x00000015 } },
  35673. /* 205 */
  35674. { { 0x57fa58f1,0x250853c8,0x4ca4c670,0xb58a4e68,0x1b81f40d,0x07b96d0a,
  35675. 0x558e8cbd,0xa4651e10,0x42e388cf,0x1a64046e,0x44436088,0x51b0d539,
  35676. 0xe26b8fd0,0xc2bf35b3,0x5702cfce,0x4ae78709,0x000000fd },
  35677. { 0xdf53d498,0x3c79bc29,0x1137f624,0x4cf31c4e,0x17a3cedf,0x93b6856c,
  35678. 0x6cd9115d,0x2461131c,0x9228cddb,0xab30a453,0x8d202bf1,0xe97757b6,
  35679. 0xe6108612,0xa666de7c,0x4f6026b4,0xc200fe65,0x00000051 } },
  35680. /* 206 */
  35681. { { 0xb1a2b4b5,0xea96103c,0x843c0968,0x98dccbfe,0x986ffb5b,0x6a37072d,
  35682. 0x169d3ac2,0x2fa07af2,0x771371f1,0x8bb85b9a,0xe7c299ef,0xeae10d34,
  35683. 0xe2372efc,0x3d4bdc69,0x8dd856f1,0x378df75d,0x00000039 },
  35684. { 0xde7ff5d9,0x31e902ff,0x325a09ca,0x0e9a85d2,0xf4192fcd,0xd71b93a6,
  35685. 0x15b076b3,0xf52a5737,0x6e711d1c,0xd726aa86,0x2c292819,0x0b61b1df,
  35686. 0xc8015de6,0x224e575c,0x18b79e47,0x68e893e1,0x000001dc } },
  35687. /* 207 */
  35688. { { 0x6ffeda73,0xb7924ff9,0xa0da2018,0xe709f406,0xf89584df,0x368e20ea,
  35689. 0x8355a040,0x0095112e,0xfd777d7c,0x259d4528,0x2bf8f2c8,0xb0c49565,
  35690. 0x44c5311b,0x7f631928,0x8466d9d5,0x698d0e4f,0x000000d5 },
  35691. { 0x015d204d,0xe10d64fa,0x6dd10c53,0x7b626bfa,0xa7698c94,0x087f8e63,
  35692. 0x05337a56,0x525a6547,0xdf5c782f,0x558e2244,0x855fbaff,0x48aa1e41,
  35693. 0x47ee3830,0x48f2218e,0x138463d3,0xf2523959,0x0000004d } },
  35694. /* 208 */
  35695. { { 0xd8695310,0x76f4fd69,0x7e8768ea,0xe28eb09f,0xe0d532a8,0x039c1812,
  35696. 0xc572ac79,0xdda67744,0x785d6293,0x1f9800e0,0x3da76bb2,0x2bfe2a5a,
  35697. 0xa2bc7217,0x6ed15b90,0xd1788a8e,0xd80e61bf,0x0000004c },
  35698. { 0x16730056,0xb9f40370,0xdced3d43,0x46f45fef,0x1aa50742,0x0afd763c,
  35699. 0xff92ae73,0x21e5c652,0x1bb2063f,0x6ef0830d,0x12d22540,0x18306ecc,
  35700. 0x1f15001c,0x4edd9b3a,0xc0cc5424,0xe4eb25b8,0x000001f4 } },
  35701. /* 209 */
  35702. { { 0xa1db5c18,0xed61a714,0x7677074c,0x9454e61e,0x7bf685de,0xe970fbe5,
  35703. 0xd2145be5,0x221b0c53,0xee49a5f2,0xb931881b,0x14b11d03,0x00b91afa,
  35704. 0x3ec22137,0xc6aefe49,0x526200af,0x50554e94,0x0000013c },
  35705. { 0x7364c92e,0xd42c45e7,0x735218e8,0xe0500265,0x84d3f3c5,0xd281da02,
  35706. 0xdbf7646b,0x312f8424,0x485f304f,0xe1a88f2a,0x1127a513,0x583f5631,
  35707. 0x1a60e0bc,0xed7950c7,0x4b7b70a4,0x92855e10,0x000000c6 } },
  35708. /* 210 */
  35709. { { 0x644614e7,0x8d06185c,0x4749a424,0x2e906cae,0x2587e528,0x585412ea,
  35710. 0xd12857cd,0x3763990a,0xba5593b5,0x770c7f70,0xdd5d2a46,0xc2cf6dc4,
  35711. 0x3b69a1ba,0x564da456,0x187895da,0x639f7e14,0x000001c8 },
  35712. { 0xf8589620,0x05c96b02,0x41e44054,0x2fe468a3,0x096ad09c,0xbf22da11,
  35713. 0x9c652aee,0xbc73c298,0x547e1b8f,0xcdef9f8b,0x977dbf73,0x7073785a,
  35714. 0x7e13552d,0x0a92a1aa,0x3a393d3f,0x22761140,0x0000015b } },
  35715. /* 211 */
  35716. { { 0x1fbfaf32,0x89a5a7b0,0xbe661d21,0x5c5a62d0,0xf5e3b44d,0x47970f5e,
  35717. 0xf43bbf62,0x3ea001ed,0x260ae5a0,0xa8e74285,0x2697c62c,0xeb899ebd,
  35718. 0x751a7643,0x36a003e6,0xba0725a6,0xef178c51,0x000000ea },
  35719. { 0x9bd51f28,0xaacf8e9f,0xa8712044,0x39febbdb,0x5bfc8365,0x8780ad3a,
  35720. 0x10e6f08f,0x408a34cd,0x8241ab0e,0x8104ca10,0x98a662a1,0x843e71ce,
  35721. 0x232048d6,0x9dce8514,0x1cf3d187,0x5cba23be,0x000001fa } },
  35722. /* 212 */
  35723. { { 0x2973a15c,0x2fe8c9d2,0xd42979f3,0x66fec8dd,0x0b6afb3e,0x39af4a39,
  35724. 0xab65ef22,0x0bb1e436,0x66c5fcdb,0x8f26201e,0x5af4870b,0x3cffe8a3,
  35725. 0x2bb44e24,0x65ae286f,0x51dd1722,0xda2e283a,0x00000114 },
  35726. { 0xc1e3d708,0x4a9c9a56,0x1cb0efa6,0x4fe62d3f,0x97e87540,0xf0702984,
  35727. 0x3cea46fa,0x138b7d6b,0x83886263,0x0780634e,0x71c30909,0x27e84280,
  35728. 0xe5838647,0xf0af79d7,0xb236a267,0xc1b86582,0x00000104 } },
  35729. /* 213 */
  35730. { { 0xa526c894,0x32ff09ed,0x14ac7d23,0x95abf120,0x3cd92934,0xb6f94dcd,
  35731. 0x92e6b556,0xffaaeb12,0x1036c31b,0x193796ea,0x707ff32e,0xa9d237e7,
  35732. 0x829d67b8,0xd65a5b0d,0xdb29248b,0x48edb556,0x000001b3 },
  35733. { 0xded46575,0x6ee9f9b2,0xffa69acf,0x496ca08a,0xf16d37d1,0xd5aeb3a1,
  35734. 0x789e5d01,0x4a507db1,0xc827cc45,0x05e2ce29,0x2964e677,0x29b6e4a5,
  35735. 0x4c0e46f2,0x0563b0ba,0x4bc46485,0xe75c2448,0x000000a3 } },
  35736. /* 214 */
  35737. { { 0xd2f6615d,0x0fcb476f,0xd98da9a9,0x4b7f9b78,0xd2bdf107,0xe2fddf1c,
  35738. 0x9b956f31,0x2bda3086,0xb596eadf,0xf3cca2f7,0x355b2538,0x91c09f8b,
  35739. 0xc6c846db,0x46f3f6f3,0x2a14642e,0x9bb9398e,0x000001ff },
  35740. { 0xa17bd645,0x5118d4f5,0xdbd6d552,0x57033eab,0x734d0957,0x007e86fc,
  35741. 0x5f53c435,0x98ca065f,0xfd27dd19,0x9949d9bf,0x6952d1ca,0xddc4e304,
  35742. 0x81ac101c,0x84cab4fb,0x4a56b007,0x46d079f9,0x00000003 } },
  35743. /* 215 */
  35744. { { 0xa6bfdedd,0x95eb8e4f,0x7a74c6f9,0x993a285e,0x3d09a252,0x8bd5d4d1,
  35745. 0x19a5f767,0xeaa10be6,0x0cebb340,0xd3db083e,0x1dbf7a83,0xc633a78b,
  35746. 0xc30f23e1,0x2664bc3e,0x07a08379,0x6630f8f1,0x000001c9 },
  35747. { 0xdef86a80,0xbbf4cb4b,0x3f8259ab,0x1fa4ec78,0x609532c8,0xa4bf7604,
  35748. 0x8b909e92,0x71bb7acc,0x17884160,0xca1d7317,0xca1ab928,0x7f7f14be,
  35749. 0x5f8455a5,0xbfea016e,0xbf21e899,0x7b8c76b9,0x0000002d } },
  35750. /* 216 */
  35751. { { 0x4b9f8e7d,0x46860563,0x63fc58a8,0x201176b7,0x2feed68a,0xe7a5da7e,
  35752. 0x65183190,0xcc67763e,0xe9377ad6,0x7d7d0102,0x77032321,0xccfc4720,
  35753. 0x534bb505,0x573ee031,0x0f1a2769,0x1bf1ef8c,0x000000f3 },
  35754. { 0x0c935667,0x635f5c4b,0x060d2b8b,0x74152c39,0x37c3a574,0xeffaac2e,
  35755. 0x0b72e0cd,0xfd5fcc4c,0xf4f60247,0xb743f9b9,0x79e16f33,0x05c2e354,
  35756. 0x3074ef9c,0xa2234c47,0x495aace3,0x4092f279,0x00000124 } },
  35757. /* 217 */
  35758. { { 0xb30f9170,0x5bfd7851,0x37fce5b1,0x715aa1e9,0x928437b9,0xcffd55e0,
  35759. 0xc32f1273,0x88acd259,0x48be1e34,0x5a145cf2,0x7a5bc62b,0x3a340860,
  35760. 0x18156f46,0x6296eb15,0x2774e1c3,0x397fad19,0x000001e7 },
  35761. { 0x9c8225b5,0x362f99f4,0x46b77c4d,0x33efce49,0x8541e91b,0x451df530,
  35762. 0x38f3d693,0x0bd2d934,0xe727b54e,0x0b5de2d6,0x7622d940,0x42d929c2,
  35763. 0x56f6a94b,0x36ace723,0xfccaf205,0x64a18cd5,0x00000044 } },
  35764. /* 218 */
  35765. { { 0xaba95d63,0x8dbe0aab,0x7b4b346d,0x92780c61,0x0e0d8142,0x6430f863,
  35766. 0xb56ef04c,0x875be02a,0x785e3633,0xc28feb95,0xc12c93e4,0xd5401795,
  35767. 0xe36f82a3,0x89ff51c1,0x10eeafd6,0x3c48c895,0x0000016b },
  35768. { 0xd4f064be,0x79287eba,0x54ebda99,0x1a77d555,0x623727ea,0x46745ef2,
  35769. 0x89f366c6,0xa911f591,0xc59d6ebd,0x7e5435cd,0x7524d213,0x3a84daea,
  35770. 0x4395b38d,0xc7b1dd1c,0x1a823c49,0xca13e704,0x0000001c } },
  35771. /* 219 */
  35772. { { 0x874d64b0,0x6399860c,0x1653ce0c,0x3375b092,0xeaa11986,0x16700000,
  35773. 0x621cd15d,0x62c67909,0x77d70dcd,0xbe1d7dd6,0x305bd4cd,0xeff0f270,
  35774. 0x362f8f30,0x076ec621,0x7e445b78,0x81204816,0x000001d8 },
  35775. { 0x161f9758,0x81749a0e,0xa3c4fce2,0xe60915fe,0x911dd8af,0xf537ce41,
  35776. 0x79a51a09,0xfe36a8ac,0x2ca5cf8e,0x67fb54b4,0xe49057f5,0x1bdcae07,
  35777. 0xa4244b64,0xb71ff0c5,0x4b606583,0x4815a536,0x00000106 } },
  35778. /* 220 */
  35779. { { 0xef39cc39,0x78c69c3e,0xfa6356d1,0x98304564,0x412fb990,0xbd3c3542,
  35780. 0x79dbb2a5,0xa1d531d3,0xe7e75e3d,0x4865f188,0x0b0147b1,0x2dac4e22,
  35781. 0x33d29ab0,0xf59e51ca,0x37b074ef,0xc964f7fe,0x000000f1 },
  35782. { 0x0e301262,0x7080c0a6,0x5390a22d,0x9a458060,0xcc8a9029,0xda677f9a,
  35783. 0x14c0f1c2,0xdfae9057,0x6e66d9f7,0x3665ff16,0x47846924,0xc866dd8c,
  35784. 0xc4cc307c,0xc5afe98f,0xe0bf50e4,0x60e3ba63,0x00000039 } },
  35785. /* 221 */
  35786. { { 0x959ecdb3,0x1a785136,0xf9e959be,0x289af617,0xcde0dc88,0x5145b2b8,
  35787. 0x7c079e15,0xfe9070b0,0x50e22415,0xf77f04d3,0x358d6d42,0xb3ab7372,
  35788. 0xba7b629a,0x14fd41b9,0x7400fd25,0x7b32d80e,0x00000193 },
  35789. { 0x7147886f,0xe5d80d4d,0x576c81ca,0xe08ced61,0x642717bb,0xe14e8692,
  35790. 0xabb4bd21,0x9dcdf198,0x6530308b,0x658be646,0xd99d19c7,0xfbf192da,
  35791. 0x304ab126,0x55a3d1b3,0xfa24de31,0x943f4be5,0x0000000e } },
  35792. /* 222 */
  35793. { { 0x7fe9ea48,0xc5424058,0x61b57486,0xaf24f825,0x78719740,0x9d2c413c,
  35794. 0x70eb874d,0x27a9be79,0xb62ba3aa,0x43fef8e0,0x2c1bf0ac,0x0a23f286,
  35795. 0x4af130e1,0x51c276f3,0xae55cebf,0xf6cd1e9a,0x00000185 },
  35796. { 0x40369093,0x24defa7f,0x58581e0a,0x11f1d9d6,0xe512ed9e,0x9900bf33,
  35797. 0xed120896,0xbf8a8459,0x8b73c399,0x8324555e,0x8f6f54fe,0x54a30569,
  35798. 0x3c252355,0x2a9d6da5,0x2a093b31,0xe6a6f904,0x0000016a } },
  35799. /* 223 */
  35800. { { 0x152cdd35,0xb2e123c9,0x86402ef1,0xae6e43a8,0xb9ce5bd5,0x892bf0df,
  35801. 0x75804914,0xb4acb84a,0xf502eec2,0x8c7f55ff,0xaa33ef4e,0x9c8a7b93,
  35802. 0xfd9d2001,0x06b10357,0x0ba3bceb,0x3e319ff0,0x00000027 },
  35803. { 0xabe360a3,0x182c2f77,0xadfefca6,0x57ef5c84,0x650b6fcc,0x9a4f0ca6,
  35804. 0xaaf0b202,0x3f4f8e56,0xa24ef156,0x5c8508a0,0x1ea45f13,0xd8f62fd9,
  35805. 0x28036dbe,0xf2c923a0,0x1a4d103b,0x4a9ca4c0,0x0000018a } },
  35806. /* 224 */
  35807. { { 0x5448e339,0x2a3fb798,0x18a39976,0xde8770cf,0x7a69170c,0x1160574d,
  35808. 0x2b6067ac,0x4bb05c59,0x848138ab,0xde0d2db0,0x4909e794,0x149dab92,
  35809. 0x790315f7,0x83a336b6,0xa335a258,0xcd9074d9,0x0000013c },
  35810. { 0xac1b784d,0xe839c5e0,0xee527ae1,0xab65c8c6,0xa1c88ec0,0xd3c86146,
  35811. 0x46c1bf58,0x2201f790,0x3fda502a,0x71cec627,0x225b9065,0xff3f88eb,
  35812. 0xc556dfcd,0x6c1f0c98,0x484fa5cc,0xaa3222aa,0x000000ac } },
  35813. /* 225 */
  35814. { { 0xc9b4dfd6,0x17e74bc3,0xf8e76293,0x25ba8053,0x9d8c3520,0x0307dc05,
  35815. 0xb85a20b4,0x1c9036cc,0x23871359,0xf2c63f0a,0xca95fb4e,0x1a99d9d8,
  35816. 0x9850c6c6,0x3d7c4f39,0x68299668,0x162969c9,0x00000169 },
  35817. { 0xcb63ee53,0x7d13c267,0x75eac353,0x67b12e61,0x191abfca,0xb3369a11,
  35818. 0xee1af69f,0x5ad0649d,0x11dc11e7,0x4d7a6f00,0xdb9f9765,0x80f030b8,
  35819. 0xf0ab1332,0xa20001a3,0x39d8cc62,0xe17c98d2,0x00000194 } },
  35820. /* 226 */
  35821. { { 0x1d8fe898,0x720d80b4,0x32184534,0x8d7a28b7,0x04f21740,0xf1f3c385,
  35822. 0x166aa6af,0x5d381cd5,0xcc560e35,0x9cde6084,0x5e61e2cd,0xcb041f0a,
  35823. 0xd9b4951a,0x621116f5,0x7ee2ac2c,0x509e16d3,0x000000c4 },
  35824. { 0x2c6fd79e,0xb82a20c4,0x3af78b0e,0x95b7ee4e,0xbad819ca,0x3d9b63c1,
  35825. 0x98552569,0x10d674de,0xf9c19d0f,0x17de64b2,0x47c5e6a9,0xa03fabaf,
  35826. 0x2ce2db6f,0x858bc4ad,0x1fc9d18e,0x76c2380a,0x000000c9 } },
  35827. /* 227 */
  35828. { { 0xb064f114,0x91171ef8,0x4f2f0f4c,0x83cb1565,0x57b262b7,0x30525854,
  35829. 0x0f34936c,0x468c6701,0x99a41fed,0xef26d2fe,0xa7f7f6a9,0xf6da2267,
  35830. 0xa01bfc1b,0x2563b8db,0xc340ed40,0x14b36c85,0x0000000e },
  35831. { 0x25db67e6,0x5e57e264,0x7f2e905f,0x85df4e89,0x026c4268,0x7832e514,
  35832. 0x3e875093,0x312be262,0x3c538691,0x856b5bd8,0x95734f9d,0x5b1cae55,
  35833. 0xd5aa4861,0x5a07bfe2,0xce8abb58,0x7a4c96f0,0x000001d0 } },
  35834. /* 228 */
  35835. { { 0x523aa2e9,0x7bf54d05,0xed3d0860,0xc8841e0c,0x7f9bfb69,0x5683f6e2,
  35836. 0x162bdf85,0xdcb07f44,0x07b0dcc9,0x62d17839,0x657a536e,0xa2cbb8ab,
  35837. 0x7cf47d3c,0x98b9a0d2,0x5eea6370,0xff154d68,0x000001f2 },
  35838. { 0x56b232ac,0x568b768a,0x3f2a52ab,0x4e8d6e36,0x8837fc60,0xbae87a16,
  35839. 0xd10a7691,0xebc58a83,0xf9455fbe,0xad5e4af0,0x7d654e2e,0x1a20d6c3,
  35840. 0xda7c8255,0x8c40fcb9,0x60d9b931,0x6d7b3cd7,0x000000b2 } },
  35841. /* 229 */
  35842. { { 0xbb2eaf45,0x7b090c3e,0x62ffb92f,0xed24d91c,0xa736f23d,0xbf2a3ea4,
  35843. 0x6ff0fde3,0xb5b99ebd,0xca1102f5,0xbca2b55d,0x07e032a8,0xf6203cd8,
  35844. 0xa8bf17a8,0x5410b448,0xe1dc55b1,0xb86660a7,0x00000109 },
  35845. { 0x02a2fbd8,0xb148b1da,0x3b22e8a5,0xfed85e8b,0x8712b509,0x1378a0e4,
  35846. 0xc6a3e516,0x68560148,0x1633b503,0x7100921c,0x25512711,0x93925143,
  35847. 0x07d31047,0x7b4931d2,0x8542e0bb,0x623e722b,0x000000ea } },
  35848. /* 230 */
  35849. { { 0x24972688,0x084823d3,0x003f5762,0x58b83c12,0x6d0d4528,0x194d6690,
  35850. 0x2c6f747e,0x84219584,0x0146d89a,0xc8f8a2e9,0x7451bbc2,0x29ec1de7,
  35851. 0xf7f284fa,0xf622b6b8,0x7b71e44f,0x83f1dbe9,0x00000060 },
  35852. { 0x999dd56b,0x99649333,0x97a47de9,0x2cfac0ba,0xbbe8fb20,0x6660d8ae,
  35853. 0xf61d7bca,0x47c29dd8,0x85adc14d,0x6f5fb51d,0x4f9fd41c,0xe65ac788,
  35854. 0xff513e6c,0x1ce69dd4,0xffe59d3e,0x1ace591e,0x00000023 } },
  35855. /* 231 */
  35856. { { 0xa9fda771,0x2e67a438,0x8663100e,0x626f652c,0xe133f23b,0xdfb19e48,
  35857. 0x035d2d1f,0x599f88f2,0x8d13e878,0x1723a112,0xfb51ce07,0x890aa292,
  35858. 0xbbd9ba82,0xe5f3a70e,0x374514b4,0xdde82673,0x00000155 },
  35859. { 0xd6f59a95,0x08b2b77e,0x02020420,0x93f853e3,0xebac7797,0x52252ac1,
  35860. 0xb56b6676,0x6ecdcb99,0x9722a500,0x4abdb9f9,0x04e2bad0,0x26210f3f,
  35861. 0x3034dd4d,0x0ca5a0ff,0xdac0b80d,0x333d8080,0x00000041 } },
  35862. /* 232 */
  35863. { { 0x35a85a06,0xe8510709,0x42ef1b44,0x4e166e76,0xa07b3a6d,0x84a90b71,
  35864. 0x30329e6a,0xd6dd6c00,0x3d555259,0x20c4ba65,0x6f8ad05e,0xee3b26af,
  35865. 0x2ab4cccd,0x20e3d541,0xa9406424,0x79798934,0x000001bd },
  35866. { 0x8e0c7ff0,0xf2a1d184,0x9543b340,0xbae85efc,0xf51d318b,0xe96431ae,
  35867. 0x75878fa6,0xe5d3ed4e,0xc2895f52,0x4d2a29db,0x1f11067c,0x3af27877,
  35868. 0x9e7f4ee5,0x6ccde964,0xa56d74da,0x35188da1,0x00000192 } },
  35869. /* 233 */
  35870. { { 0x03d310ed,0xb0832120,0x987b0311,0xd20ee8cc,0x84c558a8,0x9e549d26,
  35871. 0xb7167ec8,0x5e25f3ce,0x4bf55bb5,0xacf114f4,0x061c9017,0x819edc77,
  35872. 0xdeb343c0,0x759a44e6,0x04c9b5ed,0x58df9f7e,0x00000078 },
  35873. { 0x3bf13222,0x4fa47ebb,0xea07da11,0x1e451dcd,0xc0d8242f,0x1be9fac3,
  35874. 0x36eb871e,0x93257d4d,0xbea3190d,0xf49e775a,0x4ebe2b33,0x406d191f,
  35875. 0x0c110096,0x67aac53c,0xd381ac78,0x5215cf8b,0x000001f4 } },
  35876. /* 234 */
  35877. { { 0xfa493b79,0x387e8a8e,0x4eb1c2ac,0xb20e270b,0x9ff22320,0x9f393fa0,
  35878. 0xa91c393d,0x5ee1baae,0x138a8d96,0xdeda961a,0x97bd50e4,0x69ab238c,
  35879. 0x2363c8e0,0xff68d48a,0xce4c4c16,0xaf8e00e5,0x00000158 },
  35880. { 0xcfc509a1,0x6ccdcf06,0xc26cc075,0x60f411ef,0x4d9c57f0,0x6d0cdfd6,
  35881. 0x32e99cac,0xa9514853,0x8b8e9510,0x58f9ab3d,0xb10dc3fd,0xa7e98709,
  35882. 0x75ef3509,0x8390843d,0x5a9312c7,0x28ccc9d0,0x000001b6 } },
  35883. /* 235 */
  35884. { { 0xe341463f,0x1d934f00,0x150da7a0,0x14c8a6ce,0x4109553f,0xdb4860fc,
  35885. 0xa93f4a91,0xc23bde5a,0x2cd58067,0x9f47c787,0x8433dc80,0x1d330054,
  35886. 0x75a32a7d,0x0c0be7f9,0x88c75da9,0x08b777d5,0x0000012e },
  35887. { 0x61a10d37,0xdfc12817,0x5c50f5a5,0xed7b6181,0x79477c60,0x28af95db,
  35888. 0x33c5310b,0xa0aa2b77,0x53118267,0x905faab8,0x6b41959f,0xf40e9816,
  35889. 0x16b37784,0x9ccb4252,0x69866acc,0x6835d77c,0x000000c5 } },
  35890. /* 236 */
  35891. { { 0x2b450a66,0xe9d714cb,0x7dbfdc14,0x1318885c,0xb466a0c0,0x655a8d85,
  35892. 0x5bdfc1a6,0x02a21e99,0xe67792d1,0x7a0d7c98,0xb550a797,0x2a01bb57,
  35893. 0x5d74d337,0x42c46233,0x88dad495,0x7be4e1c0,0x0000008b },
  35894. { 0x95812273,0x1873b03f,0xee3f757f,0x2e26ed32,0x6da6217a,0x2c710eae,
  35895. 0x261d9f4f,0x9b50b574,0xb7c1da2d,0x43971fa9,0xc4a85de7,0x22c4fb87,
  35896. 0xec22137b,0xf72c3451,0x77ba1926,0x1345668c,0x00000173 } },
  35897. /* 237 */
  35898. { { 0x8a3ba183,0x3e3e8c7a,0xfe389fa7,0x4e8cebbb,0x0f9ba60f,0x8ea44687,
  35899. 0xcb601a83,0x55176e35,0x12e52db4,0xf90bdc26,0x8f712bf1,0x95f9e459,
  35900. 0xbea054cd,0x9bd3200f,0xdd5fd40b,0x2cf19bf6,0x0000017a },
  35901. { 0x66736feb,0x71cf6ca2,0xde7cfe2f,0xbde86f49,0xfc290563,0xc60abce8,
  35902. 0x726b6e4f,0xaae8a3ce,0x3f29235b,0xd2382445,0x650ffa5e,0xa4b557f5,
  35903. 0x113ef744,0xa1453e54,0x3e426dd2,0x7c676a53,0x000001b0 } },
  35904. /* 238 */
  35905. { { 0x35d96872,0xf5e603f2,0x3fa5b8ca,0xab1a23cc,0xe988dc5f,0x5459871b,
  35906. 0xd430c0bd,0xe32e8489,0x764d9cc3,0x7ec269e0,0xf2c0c40d,0xf7238212,
  35907. 0x887b83b4,0x2d946183,0x2f18a411,0x281fa671,0x00000010 },
  35908. { 0x64858b37,0x8028048f,0x357de5d9,0xe0e149af,0x619ebb18,0xb2218791,
  35909. 0x9f2b0ba0,0x210200b3,0x1039cbae,0x5a87eae6,0x39579d1d,0x4efdcddb,
  35910. 0x2788515e,0x1b388eaa,0xc81878aa,0x1a552c3c,0x0000002c } },
  35911. /* 239 */
  35912. { { 0x0ea723dc,0x7ac7f500,0x42b15231,0x0a5f04f4,0xbe885c86,0x63d49445,
  35913. 0xff119702,0x61f9993f,0xc4c58cea,0xc3fba45c,0xb9cd6036,0xe6d151e6,
  35914. 0x57b923bb,0x75a3ab15,0xceb2fd46,0x4ec07c52,0x00000147 },
  35915. { 0xed88239d,0xc46a3d32,0x835ae694,0x0d1b8ae6,0x9feeb2e7,0xf4fde325,
  35916. 0x43bc0bb5,0x223bf71c,0x8f62a705,0x3cd220b7,0x9fe799a5,0x2224860e,
  35917. 0x24ab7f93,0xd8558703,0xb594958b,0x8e0f7330,0x0000010f } },
  35918. /* 240 */
  35919. { { 0x3c67d520,0xaf35c7bb,0x23fca9ec,0xd8f4958b,0x8bbaa808,0x0778f194,
  35920. 0x2135e8ae,0x418c30ce,0xc888eff7,0xcdd8d9a9,0xf73144ab,0x72075df0,
  35921. 0x4506a534,0xb549c895,0x5fbb7fc5,0x4ef38979,0x0000011c },
  35922. { 0x43f5e698,0x3fe2c9ac,0xe38a5e3a,0xce77fcbc,0x3089c2e1,0x6d05c90e,
  35923. 0xac1d5801,0x5a74f3ff,0x381b9d2a,0xaeeda220,0xf5f3960b,0xd958b143,
  35924. 0x0db7abbe,0x65ffd051,0x7a05b718,0x8e97e680,0x000000ce } },
  35925. /* 241 */
  35926. { { 0x8ce86a83,0x2251e61b,0xbf7e7160,0x8604159f,0x48f03377,0xfc127dd7,
  35927. 0x45052242,0x87cb2c37,0x934ea09b,0xbd4950f4,0xc4679441,0x5146c403,
  35928. 0x23ba416a,0xe8ad4710,0xaf638eb1,0x89b81a60,0x000001b3 },
  35929. { 0xe8150c69,0xe699934e,0xe27c14bc,0x74f75908,0x6a0194ff,0x5dc0a891,
  35930. 0x1bd51b76,0x38f49d32,0x18779630,0x6bc3305e,0xfd3b4a68,0xfe2f3fbf,
  35931. 0xd7caf189,0x1409b377,0x9b8f109b,0x029ea13b,0x000001b3 } },
  35932. /* 242 */
  35933. { { 0x25a2fd88,0xef7938d2,0xceba0603,0x890f2f7c,0xd7a6dff4,0x4c3e1c80,
  35934. 0x2883f986,0x00c78f36,0x998e5305,0xed92b592,0x325ddc73,0x018a8f1b,
  35935. 0xd5d3708a,0x6dffd987,0x0d1f28bb,0xdcd3554f,0x00000059 },
  35936. { 0x23a74e7d,0x17c6e41d,0x5db32df6,0x94b61ebe,0x9e7ffa0b,0x3c2fffa7,
  35937. 0x2ebb7a0d,0x473662b7,0x01adf9c3,0xa86415ee,0x54679264,0x1502c326,
  35938. 0x2fa09c57,0x16911349,0x24749086,0x897f34aa,0x00000195 } },
  35939. /* 243 */
  35940. { { 0xabadc253,0x4845d359,0xc797c95e,0xe054b92c,0x9a218212,0x22a9b5bd,
  35941. 0xa52b8827,0x9bb80a5e,0x2e61c676,0xea38e78e,0x08b0f8b3,0xfb274b1a,
  35942. 0xdb9d854c,0xb6aa42e3,0x56012d73,0x8ba22523,0x00000163 },
  35943. { 0x75c8c576,0x7cec0e6f,0xe4bc7dd2,0xabb20e7c,0x69d80726,0x0958a0c8,
  35944. 0x8a023eb7,0xa908c66a,0x76110b15,0xca9f50ea,0x186f61a6,0x668c9994,
  35945. 0x2a0a69d8,0x9ddf22ed,0xbbf8a10f,0xbfee1897,0x000001e0 } },
  35946. /* 244 */
  35947. { { 0x48319e4f,0x26d86818,0x5a586fa0,0x6be6f6b5,0x26713265,0xbef5d886,
  35948. 0x98529cfa,0xac252ac5,0x62b29cfb,0xe7cc45f1,0xa2a6358d,0xee050609,
  35949. 0x2940ac70,0xf7cb9ca4,0xa885b1f0,0xfb44aaec,0x000001ad },
  35950. { 0xe798678e,0x66b7a936,0x99540438,0xca01e103,0x816860b7,0xf2491e37,
  35951. 0xb745d857,0xeeffd483,0xa4705ed6,0x5dbb3628,0xb2a5d0f7,0x57d68d49,
  35952. 0x2389fee3,0xd1a8529a,0x1a7fd686,0xdbbc2549,0x000001ad } },
  35953. /* 245 */
  35954. { { 0x969686a3,0xe10cba20,0xe3c053f5,0x308b1c55,0x26f47102,0x1712b134,
  35955. 0x49033038,0x1f9165b1,0x2d01527b,0x45b72017,0xaa9a34e2,0x6fcf6647,
  35956. 0xb0be35c8,0x51f54b94,0x5a15e382,0xfccb22a5,0x000000e3 },
  35957. { 0x5b4dc0be,0xaa71e4ec,0xdb1cd5c4,0xbb136248,0x046e1007,0xf36bff43,
  35958. 0xda9c99a3,0x5a6806d7,0x8349bc50,0x9cbfc6ee,0xe13e0850,0x26871e73,
  35959. 0x67f448c1,0x5e6aa227,0x2da7baf9,0xba77787c,0x000001b9 } },
  35960. /* 246 */
  35961. { { 0xc5a73375,0x1abe58ee,0x7a8ac438,0x175df69d,0xceca835a,0x2cf3150a,
  35962. 0xf507d30f,0xb87b0609,0xc60b0424,0x9ae53a2b,0x410f90ec,0x4931e182,
  35963. 0xadd689bb,0x452c7d0f,0x47631a8e,0xab453491,0x00000013 },
  35964. { 0x8c84f3af,0xaf2dd856,0x1baae33e,0x829dc092,0x8b96b070,0x46542a85,
  35965. 0xe8a82516,0x42260d40,0x5c35322b,0xb9e5edac,0x39eda0d2,0xbca79560,
  35966. 0xb962b90a,0x86bd07c6,0xb1ec5302,0x2e22dac7,0x0000010a } },
  35967. /* 247 */
  35968. { { 0x239d8f0a,0x665fc09d,0xab8a1021,0x92b2e03c,0x0173477b,0xe4369768,
  35969. 0x8e361604,0xab38ed9f,0x9eb061be,0x79b0091d,0x3e845670,0xcd422654,
  35970. 0x2fe1a2e0,0xa0f77ec7,0x760a030f,0x1d242162,0x00000093 },
  35971. { 0xf8646bc3,0xfa9f834c,0x40ae96f9,0x7df94a52,0x379177d1,0x901c3890,
  35972. 0xffeb66cd,0x9dfd0644,0x77b92465,0x81aec2ec,0xcd981d4f,0x2df3b7f2,
  35973. 0xf377b093,0xc9bc3f69,0xdd859d8b,0xdaef34f3,0x00000125 } },
  35974. /* 248 */
  35975. { { 0xa2c123bc,0xac08451b,0x0818fa54,0xd1e83a68,0x98957b8a,0x56dd5702,
  35976. 0xf0f12f16,0xcc7f2e34,0x0a9fa14d,0x1f6a9c33,0xb2fe782c,0xefc9a2bb,
  35977. 0x709f54dd,0xd319c697,0xd6460a53,0x0b8238cb,0x000001dc },
  35978. { 0x44dfb6f6,0xf6492901,0x6e401d26,0x270d7cb4,0x48537ad8,0x1a70a40e,
  35979. 0x70d8dbd9,0x84d661b5,0xf170d58b,0xca27223a,0x6344e1d2,0xeeb4cf14,
  35980. 0xab9de1fa,0x2255fc95,0xdbdc5ea7,0xcd6e110a,0x000001f8 } },
  35981. /* 249 */
  35982. { { 0x78b8a0a7,0x2a57c6b9,0xe833edea,0x24b4aeb6,0x4bd13fe7,0x9e4617c1,
  35983. 0xfc2e8ee4,0xc4186888,0xfb147eef,0x8d398a49,0x2e662cfb,0xe9f191f1,
  35984. 0x958ba2ec,0x61872289,0x00b8d50d,0xbd6d0f1b,0x0000002d },
  35985. { 0x24c93cc9,0x895cfdfe,0xb9e718e7,0x29ed7780,0x38baf7eb,0x01c8ba58,
  35986. 0x4ddcbf69,0x0225387e,0xa180d6bb,0x64b250bf,0xc947c7c2,0x6d68e548,
  35987. 0x9923f3cd,0x82a7b632,0x2d103cd2,0xb8f03613,0x0000000f } },
  35988. /* 250 */
  35989. { { 0x8cd9d494,0x8198b3f0,0x94f4f9f3,0x9b2065b9,0x3c738fa9,0x7664a220,
  35990. 0xd8d229cb,0x199f4c14,0xc51c54b3,0xddad75c4,0xd213a332,0x9a32ce0b,
  35991. 0x888c7b2f,0xf3a21085,0x5b1ff20a,0x6defa362,0x000000d1 },
  35992. { 0x19a296eb,0x44e00548,0xd1a91313,0x1d94ff15,0xfeaa454f,0xd7dead2b,
  35993. 0x4d40bd7f,0xae65a803,0x1801a4af,0x604f147e,0xa5e0de77,0x983048f9,
  35994. 0xff572ca0,0xa3b19ca5,0x1821d117,0xa237dba7,0x000000e0 } },
  35995. /* 251 */
  35996. { { 0x91630ee8,0xedbabf84,0x05eb5301,0xde6589c2,0xa051f47b,0x9f7d2b2d,
  35997. 0x212bbe81,0xaeaa9f96,0x94292124,0xdced3d5e,0xf4435e5b,0x691f5b89,
  35998. 0x9411f66f,0x19604c33,0x4356f0da,0xb7fc09ca,0x000000e6 },
  35999. { 0xf74f811c,0x1294e413,0xdf8d8ddb,0x1a42d831,0x963418c9,0x27f57217,
  36000. 0x88ebcdec,0x5fde5218,0xea305bc9,0xfdd5e06e,0xac668b61,0xed1e6088,
  36001. 0xeb811861,0x333af016,0x15ddcebc,0x5ecb192d,0x000001c9 } },
  36002. /* 252 */
  36003. { { 0xe0bde442,0x927b37a3,0x66f7a73e,0xe0543fe8,0x8ed10c2e,0xd30d9d20,
  36004. 0xa6617a32,0xaf79c341,0xd1d5cf8b,0xe7367870,0xe3abcf8b,0x02d0dce9,
  36005. 0x772b5e7b,0xfe23d2dd,0x1ffc70c5,0x29fceea0,0x0000010b },
  36006. { 0x62d803ff,0x31bcae4d,0xdbc306a9,0x93ee913f,0xd8c10662,0xaf1de7ab,
  36007. 0xe7a6d658,0xd485782a,0x102f4e06,0x9126592e,0x136fafe6,0x91a3127f,
  36008. 0x88371213,0x46b93440,0xa31e1634,0x53bb4380,0x000000ba } },
  36009. /* 253 */
  36010. { { 0xca5636b0,0x62e517fc,0x6aba15c7,0x4296e021,0x212e7b2d,0x5aa8fd7c,
  36011. 0x5717ad84,0x9517ce6d,0x98b2f357,0xe762b85b,0xdf59b07c,0x42f996b5,
  36012. 0xf37ef6f0,0xf3732abb,0x4542b489,0xa5d145ea,0x0000015d },
  36013. { 0xaa7f6e3f,0x1e77c55e,0xaa4a05bc,0x3f4d99a7,0x45828227,0xa56d7d77,
  36014. 0x77b748fb,0xdb0895fb,0x0629f5d1,0x1c484cce,0x359803fb,0xf5b1c90a,
  36015. 0x1720b8d0,0x43ac4f29,0x72ac13f2,0x8c10bfe8,0x000000e9 } },
  36016. /* 254 */
  36017. { { 0xc06c4fd6,0x9d1c4785,0xd25c2b9d,0xbf4b9025,0xd4982f24,0x04135eb1,
  36018. 0xba4fef2b,0x3ab3edc2,0x98de07ab,0x55a5239f,0x096f4b7d,0xd5fc49ab,
  36019. 0x3844c815,0xc50a2960,0x15676b2b,0xdb1148d0,0x00000047 },
  36020. { 0x10f3bad9,0xc49f9cc5,0x022901d4,0x490888fc,0xc47b44df,0x917a55eb,
  36021. 0xf39f2b68,0x20b2ebc6,0x04e9962a,0x0c58e3af,0x573dd5b7,0x52ab7c1b,
  36022. 0xa329f76c,0x2b54add6,0x82f4ca3b,0x59dad1eb,0x00000108 } },
  36023. /* 255 */
  36024. { { 0xa182d1ad,0x662c4128,0x20916c45,0x7751796e,0xba681647,0xa7704272,
  36025. 0xb92c85c1,0xfac8b0fa,0xaefb2e07,0x207ab2df,0x7861b32d,0xc73530a0,
  36026. 0x88aed145,0x63dbed65,0x0a53a49d,0x547bcdca,0x000000bd },
  36027. { 0x87056b51,0xa7c1382f,0x130f9912,0xc3d91edb,0xd3805b42,0xf7c7de46,
  36028. 0xfd31a995,0x456101eb,0xcd3fb8aa,0x1efd22b4,0x9eb17bce,0xfe391df7,
  36029. 0x616c0c32,0xb4d4c0c6,0x711beef4,0x19f023be,0x00000112 } },
  36030. };
  36031. /* Multiply the base point of P521 by the scalar and return the result.
  36032. * If map is true then convert result to affine coordinates.
  36033. *
  36034. * Stripe implementation.
  36035. * Pre-generated: 2^0, 2^65, ...
  36036. * Pre-generated: products of all combinations of above.
  36037. * 8 doubles and adds (with qz=1)
  36038. *
  36039. * r Resulting point.
  36040. * k Scalar to multiply by.
  36041. * map Indicates whether to convert result to affine.
  36042. * ct Constant time required.
  36043. * heap Heap to use for allocation.
  36044. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  36045. */
  36046. static int sp_521_ecc_mulmod_base_17(sp_point_521* r, const sp_digit* k,
  36047. int map, int ct, void* heap)
  36048. {
  36049. return sp_521_ecc_mulmod_stripe_17(r, &p521_base, p521_table,
  36050. k, map, ct, heap);
  36051. }
  36052. #endif
  36053. /* Multiply the base point of P521 by the scalar and return the result.
  36054. * If map is true then convert result to affine coordinates.
  36055. *
  36056. * km Scalar to multiply by.
  36057. * r Resulting point.
  36058. * map Indicates whether to convert result to affine.
  36059. * heap Heap to use for allocation.
  36060. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  36061. */
  36062. int sp_ecc_mulmod_base_521(const mp_int* km, ecc_point* r, int map, void* heap)
  36063. {
  36064. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36065. sp_point_521* point = NULL;
  36066. sp_digit* k = NULL;
  36067. #else
  36068. sp_point_521 point[1];
  36069. sp_digit k[17];
  36070. #endif
  36071. int err = MP_OKAY;
  36072. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36073. point = (sp_point_521*)XMALLOC(sizeof(sp_point_521), heap,
  36074. DYNAMIC_TYPE_ECC);
  36075. if (point == NULL)
  36076. err = MEMORY_E;
  36077. if (err == MP_OKAY) {
  36078. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 17, heap,
  36079. DYNAMIC_TYPE_ECC);
  36080. if (k == NULL)
  36081. err = MEMORY_E;
  36082. }
  36083. #endif
  36084. if (err == MP_OKAY) {
  36085. sp_521_from_mp(k, 17, km);
  36086. err = sp_521_ecc_mulmod_base_17(point, k, map, 1, heap);
  36087. }
  36088. if (err == MP_OKAY) {
  36089. err = sp_521_point_to_ecc_point_17(point, r);
  36090. }
  36091. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36092. if (k != NULL)
  36093. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  36094. if (point != NULL)
  36095. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  36096. #endif
  36097. return err;
  36098. }
  36099. /* Multiply the base point of P521 by the scalar, add point a and return
  36100. * the result. If map is true then convert result to affine coordinates.
  36101. *
  36102. * km Scalar to multiply by.
  36103. * am Point to add to scalar mulitply result.
  36104. * inMont Point to add is in montgomery form.
  36105. * r Resulting point.
  36106. * map Indicates whether to convert result to affine.
  36107. * heap Heap to use for allocation.
  36108. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  36109. */
  36110. int sp_ecc_mulmod_base_add_521(const mp_int* km, const ecc_point* am,
  36111. int inMont, ecc_point* r, int map, void* heap)
  36112. {
  36113. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36114. sp_point_521* point = NULL;
  36115. sp_digit* k = NULL;
  36116. #else
  36117. sp_point_521 point[2];
  36118. sp_digit k[17 + 17 * 2 * 6];
  36119. #endif
  36120. sp_point_521* addP = NULL;
  36121. sp_digit* tmp = NULL;
  36122. int err = MP_OKAY;
  36123. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36124. point = (sp_point_521*)XMALLOC(sizeof(sp_point_521) * 2, heap,
  36125. DYNAMIC_TYPE_ECC);
  36126. if (point == NULL)
  36127. err = MEMORY_E;
  36128. if (err == MP_OKAY) {
  36129. k = (sp_digit*)XMALLOC(
  36130. sizeof(sp_digit) * (17 + 17 * 2 * 6),
  36131. heap, DYNAMIC_TYPE_ECC);
  36132. if (k == NULL)
  36133. err = MEMORY_E;
  36134. }
  36135. #endif
  36136. if (err == MP_OKAY) {
  36137. addP = point + 1;
  36138. tmp = k + 17;
  36139. sp_521_from_mp(k, 17, km);
  36140. sp_521_point_from_ecc_point_17(addP, am);
  36141. }
  36142. if ((err == MP_OKAY) && (!inMont)) {
  36143. err = sp_521_mod_mul_norm_17(addP->x, addP->x, p521_mod);
  36144. }
  36145. if ((err == MP_OKAY) && (!inMont)) {
  36146. err = sp_521_mod_mul_norm_17(addP->y, addP->y, p521_mod);
  36147. }
  36148. if ((err == MP_OKAY) && (!inMont)) {
  36149. err = sp_521_mod_mul_norm_17(addP->z, addP->z, p521_mod);
  36150. }
  36151. if (err == MP_OKAY) {
  36152. err = sp_521_ecc_mulmod_base_17(point, k, 0, 0, heap);
  36153. }
  36154. if (err == MP_OKAY) {
  36155. sp_521_proj_point_add_17(point, point, addP, tmp);
  36156. if (map) {
  36157. sp_521_map_17(point, point, tmp);
  36158. }
  36159. err = sp_521_point_to_ecc_point_17(point, r);
  36160. }
  36161. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36162. if (k != NULL)
  36163. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  36164. if (point)
  36165. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  36166. #endif
  36167. return err;
  36168. }
  36169. #if defined(WOLFSSL_VALIDATE_ECC_KEYGEN) || defined(HAVE_ECC_SIGN) || \
  36170. defined(HAVE_ECC_VERIFY)
  36171. #endif /* WOLFSSL_VALIDATE_ECC_KEYGEN | HAVE_ECC_SIGN | HAVE_ECC_VERIFY */
  36172. /* Add 1 to a in place. (a = a + 1)
  36173. *
  36174. * a A single precision integer: 17 32-bit words read and written at byte
         * offsets 0..64, least significant word at offset 0. The carry is passed
         * from word to word in the processor carry flag; a carry out of the last
         * word (offset 64) is not stored anywhere.
  36175. */
  36176. SP_NOINLINE static void sp_521_add_one_17(sp_digit* a)
  36177. {
  36178. __asm__ __volatile__ (
  36179. "mov r2, #1\n\t" /* r2 = 1: the value added to the lowest word */
  36180. "ldr r1, [%[a], #0]\n\t"
  36181. "adds r1, r1, r2\n\t" /* a[0] + 1, starts the carry chain */
  36182. "mov r2, #0\n\t" /* r2 = 0: every adcs below adds r2 plus the carry */
  36183. "str r1, [%[a], #0]\n\t"
  36184. "ldr r1, [%[a], #4]\n\t" /* same load / adcs / store pattern for each remaining word */
  36185. "adcs r1, r1, r2\n\t"
  36186. "str r1, [%[a], #4]\n\t"
  36187. "ldr r1, [%[a], #8]\n\t"
  36188. "adcs r1, r1, r2\n\t"
  36189. "str r1, [%[a], #8]\n\t"
  36190. "ldr r1, [%[a], #12]\n\t"
  36191. "adcs r1, r1, r2\n\t"
  36192. "str r1, [%[a], #12]\n\t"
  36193. "ldr r1, [%[a], #16]\n\t"
  36194. "adcs r1, r1, r2\n\t"
  36195. "str r1, [%[a], #16]\n\t"
  36196. "ldr r1, [%[a], #20]\n\t"
  36197. "adcs r1, r1, r2\n\t"
  36198. "str r1, [%[a], #20]\n\t"
  36199. "ldr r1, [%[a], #24]\n\t"
  36200. "adcs r1, r1, r2\n\t"
  36201. "str r1, [%[a], #24]\n\t"
  36202. "ldr r1, [%[a], #28]\n\t"
  36203. "adcs r1, r1, r2\n\t"
  36204. "str r1, [%[a], #28]\n\t"
  36205. "ldr r1, [%[a], #32]\n\t"
  36206. "adcs r1, r1, r2\n\t"
  36207. "str r1, [%[a], #32]\n\t"
  36208. "ldr r1, [%[a], #36]\n\t"
  36209. "adcs r1, r1, r2\n\t"
  36210. "str r1, [%[a], #36]\n\t"
  36211. "ldr r1, [%[a], #40]\n\t"
  36212. "adcs r1, r1, r2\n\t"
  36213. "str r1, [%[a], #40]\n\t"
  36214. "ldr r1, [%[a], #44]\n\t"
  36215. "adcs r1, r1, r2\n\t"
  36216. "str r1, [%[a], #44]\n\t"
  36217. "ldr r1, [%[a], #48]\n\t"
  36218. "adcs r1, r1, r2\n\t"
  36219. "str r1, [%[a], #48]\n\t"
  36220. "ldr r1, [%[a], #52]\n\t"
  36221. "adcs r1, r1, r2\n\t"
  36222. "str r1, [%[a], #52]\n\t"
  36223. "ldr r1, [%[a], #56]\n\t"
  36224. "adcs r1, r1, r2\n\t"
  36225. "str r1, [%[a], #56]\n\t"
  36226. "ldr r1, [%[a], #60]\n\t"
  36227. "adcs r1, r1, r2\n\t"
  36228. "str r1, [%[a], #60]\n\t"
  36229. "ldr r1, [%[a], #64]\n\t"
  36230. "adcs r1, r1, r2\n\t"
  36231. "str r1, [%[a], #64]\n\t" /* last (17th) word; no further carry is kept */
  36232. :
  36233. : [a] "r" (a)
  36234. : "memory", "r1", "r2" /* r1 and r2 are scratch; memory at a is modified */
  36235. );
  36236. }
  /* Read big endian unsigned byte array into r.
   *
   * Bytes are consumed from the end of a (least significant byte) towards its
   * start, four at a time, filling r from word 0 upwards. Up to three left
   * over most significant bytes form one further word. At most size words are
   * written: when the array holds more than size * 4 bytes the excess most
   * significant bytes are ignored instead of being written past the end of r.
   * Words of r not covered by the input are set to zero.
   *
   * Each word is assembled with shifts only, so the result does not depend on
   * the byte order of the host.
   *
   * r     A single precision integer.
   * size  Number of words in r (maximum number of words written).
   * a     Byte array.
   * n     Number of bytes in array to read.
   */
  static void sp_521_from_bin(sp_digit* r, int size, const byte* a, int n)
  {
      int i = n - 1;
      int j = 0;

      /* Whole 32-bit words, starting with the least significant four bytes. */
      while ((i >= 3) && (j < size)) {
          r[j] = ((sp_digit)a[i - 0] <<  0) |
                 ((sp_digit)a[i - 1] <<  8) |
                 ((sp_digit)a[i - 2] << 16) |
                 ((sp_digit)a[i - 3] << 24);
          j++;
          i -= 4;
      }

      /* One to three bytes remain (i is 0..2 whenever j < size holds here);
       * a[0] is the most significant of them. */
      if ((i >= 0) && (j < size)) {
          sp_digit top = 0;
          int shift = 0;

          for (; i >= 0; i--) {
              top |= (sp_digit)a[i] << shift;
              shift += 8;
          }
          r[j] = top;
          j++;
      }

      /* Clear the unused high words. */
      for (; j < size; j++) {
          r[j] = 0;
      }
  }
  36270. /* Generates a scalar that is in the range 1..order-1.
  36271. *
  36272. * rng Random number generator.
  36273. * k Scalar value.
  36274. * returns RNG failures, MEMORY_E when memory allocation fails and
  36275. * MP_OKAY on success.
  36276. */
  36277. static int sp_521_ecc_gen_k_17(WC_RNG* rng, sp_digit* k)
  36278. {
  36279. int err;
  36280. byte buf[66];
  36281. do {
  36282. err = wc_RNG_GenerateBlock(rng, buf, sizeof(buf));
  36283. if (err == 0) {
  36284. buf[0] &= 0x1;
  36285. sp_521_from_bin(k, 17, buf, (int)sizeof(buf));
  36286. if (sp_521_cmp_17(k, p521_order2) <= 0) {
  36287. sp_521_add_one_17(k);
  36288. break;
  36289. }
  36290. }
  36291. }
  36292. while (err == 0);
  36293. return err;
  36294. }
  36295. /* Makes a random EC key pair.
  36296. *
  36297. * rng Random number generator.
  36298. * priv Generated private value.
  36299. * pub Generated public point.
  36300. * heap Heap to use for allocation.
  36301. * returns ECC_INF_E when the point does not have the correct order, RNG
  36302. * failures, MEMORY_E when memory allocation fails and MP_OKAY on success.
  36303. */
  36304. int sp_ecc_make_key_521(WC_RNG* rng, mp_int* priv, ecc_point* pub, void* heap)
  36305. {
  36306. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36307. sp_point_521* point = NULL;
  36308. sp_digit* k = NULL;
  36309. #else
  36310. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  36311. sp_point_521 point[2];
  36312. #else
  36313. sp_point_521 point[1];
  36314. #endif
  36315. sp_digit k[17];
  36316. #endif
  36317. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  36318. sp_point_521* infinity = NULL;
  36319. #endif
  36320. int err = MP_OKAY;
  36321. (void)heap;
  36322. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36323. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  36324. point = (sp_point_521*)XMALLOC(sizeof(sp_point_521) * 2, heap, DYNAMIC_TYPE_ECC);
  36325. #else
  36326. point = (sp_point_521*)XMALLOC(sizeof(sp_point_521), heap, DYNAMIC_TYPE_ECC);
  36327. #endif
  36328. if (point == NULL)
  36329. err = MEMORY_E;
  36330. if (err == MP_OKAY) {
  36331. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 17, heap,
  36332. DYNAMIC_TYPE_ECC);
  36333. if (k == NULL)
  36334. err = MEMORY_E;
  36335. }
  36336. #endif
  36337. if (err == MP_OKAY) {
  36338. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  36339. infinity = point + 1;
  36340. #endif
  36341. err = sp_521_ecc_gen_k_17(rng, k);
  36342. }
  36343. if (err == MP_OKAY) {
  36344. err = sp_521_ecc_mulmod_base_17(point, k, 1, 1, NULL);
  36345. }
  36346. #ifdef WOLFSSL_VALIDATE_ECC_KEYGEN
  36347. if (err == MP_OKAY) {
  36348. err = sp_521_ecc_mulmod_17(infinity, point, p521_order, 1, 1, NULL);
  36349. }
  36350. if (err == MP_OKAY) {
  36351. if (sp_521_iszero_17(point->x) || sp_521_iszero_17(point->y)) {
  36352. err = ECC_INF_E;
  36353. }
  36354. }
  36355. #endif
  36356. if (err == MP_OKAY) {
  36357. err = sp_521_to_mp(k, priv);
  36358. }
  36359. if (err == MP_OKAY) {
  36360. err = sp_521_point_to_ecc_point_17(point, pub);
  36361. }
  36362. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36363. if (k != NULL)
  36364. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  36365. if (point != NULL) {
  36366. /* point is not sensitive, so no need to zeroize */
  36367. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  36368. }
  36369. #endif
  36370. return err;
  36371. }
  36372. #ifdef HAVE_ECC_DHE
  /* Write r as big endian to byte array.
   * Fixed length number of bytes written: 66
   *
   * The low 16 bits of the top word r[16] give the first two bytes; the
   * remaining sixteen words follow, most significant word and byte first.
   *
   * r  A single precision integer.
   * a  Byte array.
   */
  static void sp_521_to_bin_17(sp_digit* r, byte* a)
  {
      byte* out = a;
      int w;

      /* Top word: only two bytes of it are emitted. */
      *out++ = (byte)(r[16] >> 8);
      *out++ = (byte)(r[16] >> 0);

      /* Remaining words, four bytes each, highest word first. */
      for (w = 15; w >= 0; w--) {
          sp_digit d = r[w];

          out[0] = (byte)(d >> 24);
          out[1] = (byte)(d >> 16);
          out[2] = (byte)(d >> 8);
          out[3] = (byte)(d >> 0);
          out += 4;
      }
  }
  36392. /* Multiply the point by the scalar and serialize the X ordinate.
  36393. * The number is 0 padded to maximum size on output.
  36394. *
  36395. * priv Scalar to multiply the point by.
  36396. * pub Point to multiply.
  36397. * out Buffer to hold X ordinate.
  36398. * outLen On entry, size of the buffer in bytes.
  36399. * On exit, length of data in buffer in bytes.
  36400. * heap Heap to use for allocation.
  36401. * returns BUFFER_E if the buffer is to small for output size,
  36402. * MEMORY_E when memory allocation fails and MP_OKAY on success.
  36403. */
  36404. int sp_ecc_secret_gen_521(const mp_int* priv, const ecc_point* pub, byte* out,
  36405. word32* outLen, void* heap)
  36406. {
  36407. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36408. sp_point_521* point = NULL;
  36409. sp_digit* k = NULL;
  36410. #else
  36411. sp_point_521 point[1];
  36412. sp_digit k[17];
  36413. #endif
  36414. int err = MP_OKAY;
  36415. if (*outLen < 65U) {
  36416. err = BUFFER_E;
  36417. }
  36418. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36419. if (err == MP_OKAY) {
  36420. point = (sp_point_521*)XMALLOC(sizeof(sp_point_521), heap,
  36421. DYNAMIC_TYPE_ECC);
  36422. if (point == NULL)
  36423. err = MEMORY_E;
  36424. }
  36425. if (err == MP_OKAY) {
  36426. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 17, heap,
  36427. DYNAMIC_TYPE_ECC);
  36428. if (k == NULL)
  36429. err = MEMORY_E;
  36430. }
  36431. #endif
  36432. if (err == MP_OKAY) {
  36433. sp_521_from_mp(k, 17, priv);
  36434. sp_521_point_from_ecc_point_17(point, pub);
  36435. err = sp_521_ecc_mulmod_17(point, point, k, 1, 1, heap);
  36436. }
  36437. if (err == MP_OKAY) {
  36438. sp_521_to_bin_17(point->x, out);
  36439. *outLen = 66;
  36440. }
  36441. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  36442. if (k != NULL)
  36443. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  36444. if (point != NULL)
  36445. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  36446. #endif
  36447. return err;
  36448. }
  36449. #endif /* HAVE_ECC_DHE */
  36450. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  /* Shift the 17 word number a right by n bits and store the result in r.
   *
   * For i = 0..15: r[i] = (a[i] >> n) | (a[i + 1] << (32 - n)), and
   * r[16] = a[16] >> n. Words are 32 bits wide, word 0 being the least
   * significant.
   *
   * r  Result of the shift (17 words are written).
   * a  Number to shift (17 words are read).
   * n  Number of bits to shift by.
   *    NOTE(review): presumably 0..31 - confirm against the callers.
   */
  36451. SP_NOINLINE static void sp_521_rshift_17(sp_digit* r, const sp_digit* a, byte n)
  36452. {
  36453. __asm__ __volatile__ (
  36454. "mov r6, #32\n\t"
  36455. "sub r6, r6, %[n]\n\t" /* r6 = 32 - n: left shift that brings in bits from the next word */
  36456. "ldrd r2, r3, [%[a]]\n\t" /* r2 = a[0], r3 = a[1] */
  36457. "lsr r2, r2, %[n]\n\t"
  36458. "lsl r5, r3, r6\n\t" /* r5 = low n bits of the next word, moved to the top */
  36459. "lsr r3, r3, %[n]\n\t"
  36460. "orr r2, r2, r5\n\t" /* r2 now holds r[0] */
  36461. "ldr r4, [%[a], #8]\n\t" /* the next input word is loaded before the finished word is stored */
  36462. "str r2, [%[r], #0]\n\t"
  36463. "lsl r5, r4, r6\n\t" /* same pattern from here on, rotating through r2, r3 and r4 */
  36464. "lsr r4, r4, %[n]\n\t"
  36465. "orr r3, r3, r5\n\t"
  36466. "ldr r2, [%[a], #12]\n\t"
  36467. "str r3, [%[r], #4]\n\t"
  36468. "lsl r5, r2, r6\n\t"
  36469. "lsr r2, r2, %[n]\n\t"
  36470. "orr r4, r4, r5\n\t"
  36471. "ldr r3, [%[a], #16]\n\t"
  36472. "str r4, [%[r], #8]\n\t"
  36473. "lsl r5, r3, r6\n\t"
  36474. "lsr r3, r3, %[n]\n\t"
  36475. "orr r2, r2, r5\n\t"
  36476. "ldr r4, [%[a], #20]\n\t"
  36477. "str r2, [%[r], #12]\n\t"
  36478. "lsl r5, r4, r6\n\t"
  36479. "lsr r4, r4, %[n]\n\t"
  36480. "orr r3, r3, r5\n\t"
  36481. "ldr r2, [%[a], #24]\n\t"
  36482. "str r3, [%[r], #16]\n\t"
  36483. "lsl r5, r2, r6\n\t"
  36484. "lsr r2, r2, %[n]\n\t"
  36485. "orr r4, r4, r5\n\t"
  36486. "ldr r3, [%[a], #28]\n\t"
  36487. "str r4, [%[r], #20]\n\t"
  36488. "lsl r5, r3, r6\n\t"
  36489. "lsr r3, r3, %[n]\n\t"
  36490. "orr r2, r2, r5\n\t"
  36491. "ldr r4, [%[a], #32]\n\t"
  36492. "str r2, [%[r], #24]\n\t"
  36493. "lsl r5, r4, r6\n\t"
  36494. "lsr r4, r4, %[n]\n\t"
  36495. "orr r3, r3, r5\n\t"
  36496. "ldr r2, [%[a], #36]\n\t"
  36497. "str r3, [%[r], #28]\n\t"
  36498. "lsl r5, r2, r6\n\t"
  36499. "lsr r2, r2, %[n]\n\t"
  36500. "orr r4, r4, r5\n\t"
  36501. "ldr r3, [%[a], #40]\n\t"
  36502. "str r4, [%[r], #32]\n\t"
  36503. "lsl r5, r3, r6\n\t"
  36504. "lsr r3, r3, %[n]\n\t"
  36505. "orr r2, r2, r5\n\t"
  36506. "ldr r4, [%[a], #44]\n\t"
  36507. "str r2, [%[r], #36]\n\t"
  36508. "lsl r5, r4, r6\n\t"
  36509. "lsr r4, r4, %[n]\n\t"
  36510. "orr r3, r3, r5\n\t"
  36511. "ldr r2, [%[a], #48]\n\t"
  36512. "str r3, [%[r], #40]\n\t"
  36513. "lsl r5, r2, r6\n\t"
  36514. "lsr r2, r2, %[n]\n\t"
  36515. "orr r4, r4, r5\n\t"
  36516. "ldr r3, [%[a], #52]\n\t"
  36517. "str r4, [%[r], #44]\n\t"
  36518. "lsl r5, r3, r6\n\t"
  36519. "lsr r3, r3, %[n]\n\t"
  36520. "orr r2, r2, r5\n\t"
  36521. "ldr r4, [%[a], #56]\n\t"
  36522. "str r2, [%[r], #48]\n\t"
  36523. "lsl r5, r4, r6\n\t"
  36524. "lsr r4, r4, %[n]\n\t"
  36525. "orr r3, r3, r5\n\t"
  36526. "ldr r2, [%[a], #60]\n\t"
  36527. "str r3, [%[r], #52]\n\t"
  36528. "lsl r5, r2, r6\n\t"
  36529. "lsr r2, r2, %[n]\n\t"
  36530. "orr r4, r4, r5\n\t"
  36531. "ldr r3, [%[a], #64]\n\t" /* last input word, a[16] */
  36532. "str r4, [%[r], #56]\n\t"
  36533. "lsl r5, r3, r6\n\t"
  36534. "lsr r3, r3, %[n]\n\t" /* r3 = a[16] >> n: nothing is shifted in from above */
  36535. "orr r2, r2, r5\n\t"
  36536. "strd r2, r3, [%[r], #60]\n\t" /* stores r[15] and r[16] together */
  36537. :
  36538. : [r] "r" (r), [a] "r" (a), [n] "r" (n)
  36539. : "memory", "r2", "r3", "r4", "r5", "r6" /* r2-r6 are scratch; memory at r is written */
  36540. );
  36541. }
  36542. #endif
  36543. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  36544. #endif
  36545. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  /* Shift a 17-word number left by n bits. (r = a << n)
   *
   * Eighteen words are written: r[0..16] hold the shifted number and r[17]
   * receives the bits shifted out of a[16]. Words are processed from the most
   * significant down, and every input word is loaded before the matching slot
   * of r is stored, so r may be the same buffer as a.
   *
   * r  Result of the shift; needs room for 18 words.
   * a  Number to shift; 17 words are read.
   * n  Number of bits to shift by. The code uses 31 - n as a shift count, so
   *    n is expected to be in the range 0..31.
   */
  36546. static void sp_521_lshift_17(sp_digit* r, const sp_digit* a, byte n)
  36547. {
  36548. __asm__ __volatile__ (
  /* r6 = 31 - n. Combined with the fixed ">> 1" below, (x >> 1) >> r6 gives
   * the top n bits of x, i.e. x >> (32 - n). */
  36549. "mov r6, #31\n\t"
  36550. "sub r6, r6, %[n]\n\t"
  /* Top word a[16]: its overflow bits become r[17]. */
  36551. "ldr r3, [%[a], #64]\n\t"
  36552. "lsr r4, r3, #1\n\t"
  36553. "lsl r3, r3, %[n]\n\t"
  36554. "lsr r4, r4, r6\n\t"
  /* Each following group loads the next lower word, stores the finished word
   * above it, and ORs the lower word's top bits into the pending word.
   * r2, r3 and r4 take turns holding the pending words. */
  36555. "ldr r2, [%[a], #60]\n\t"
  36556. "str r4, [%[r], #68]\n\t"
  36557. "lsr r5, r2, #1\n\t"
  36558. "lsl r2, r2, %[n]\n\t"
  36559. "lsr r5, r5, r6\n\t"
  36560. "orr r3, r3, r5\n\t"
  36561. "ldr r4, [%[a], #56]\n\t"
  36562. "str r3, [%[r], #64]\n\t"
  36563. "lsr r5, r4, #1\n\t"
  36564. "lsl r4, r4, %[n]\n\t"
  36565. "lsr r5, r5, r6\n\t"
  36566. "orr r2, r2, r5\n\t"
  36567. "ldr r3, [%[a], #52]\n\t"
  36568. "str r2, [%[r], #60]\n\t"
  36569. "lsr r5, r3, #1\n\t"
  36570. "lsl r3, r3, %[n]\n\t"
  36571. "lsr r5, r5, r6\n\t"
  36572. "orr r4, r4, r5\n\t"
  36573. "ldr r2, [%[a], #48]\n\t"
  36574. "str r4, [%[r], #56]\n\t"
  36575. "lsr r5, r2, #1\n\t"
  36576. "lsl r2, r2, %[n]\n\t"
  36577. "lsr r5, r5, r6\n\t"
  36578. "orr r3, r3, r5\n\t"
  36579. "ldr r4, [%[a], #44]\n\t"
  36580. "str r3, [%[r], #52]\n\t"
  36581. "lsr r5, r4, #1\n\t"
  36582. "lsl r4, r4, %[n]\n\t"
  36583. "lsr r5, r5, r6\n\t"
  36584. "orr r2, r2, r5\n\t"
  36585. "ldr r3, [%[a], #40]\n\t"
  36586. "str r2, [%[r], #48]\n\t"
  36587. "lsr r5, r3, #1\n\t"
  36588. "lsl r3, r3, %[n]\n\t"
  36589. "lsr r5, r5, r6\n\t"
  36590. "orr r4, r4, r5\n\t"
  36591. "ldr r2, [%[a], #36]\n\t"
  36592. "str r4, [%[r], #44]\n\t"
  36593. "lsr r5, r2, #1\n\t"
  36594. "lsl r2, r2, %[n]\n\t"
  36595. "lsr r5, r5, r6\n\t"
  36596. "orr r3, r3, r5\n\t"
  36597. "ldr r4, [%[a], #32]\n\t"
  36598. "str r3, [%[r], #40]\n\t"
  36599. "lsr r5, r4, #1\n\t"
  36600. "lsl r4, r4, %[n]\n\t"
  36601. "lsr r5, r5, r6\n\t"
  36602. "orr r2, r2, r5\n\t"
  36603. "ldr r3, [%[a], #28]\n\t"
  36604. "str r2, [%[r], #36]\n\t"
  36605. "lsr r5, r3, #1\n\t"
  36606. "lsl r3, r3, %[n]\n\t"
  36607. "lsr r5, r5, r6\n\t"
  36608. "orr r4, r4, r5\n\t"
  36609. "ldr r2, [%[a], #24]\n\t"
  36610. "str r4, [%[r], #32]\n\t"
  36611. "lsr r5, r2, #1\n\t"
  36612. "lsl r2, r2, %[n]\n\t"
  36613. "lsr r5, r5, r6\n\t"
  36614. "orr r3, r3, r5\n\t"
  36615. "ldr r4, [%[a], #20]\n\t"
  36616. "str r3, [%[r], #28]\n\t"
  36617. "lsr r5, r4, #1\n\t"
  36618. "lsl r4, r4, %[n]\n\t"
  36619. "lsr r5, r5, r6\n\t"
  36620. "orr r2, r2, r5\n\t"
  36621. "ldr r3, [%[a], #16]\n\t"
  36622. "str r2, [%[r], #24]\n\t"
  36623. "lsr r5, r3, #1\n\t"
  36624. "lsl r3, r3, %[n]\n\t"
  36625. "lsr r5, r5, r6\n\t"
  36626. "orr r4, r4, r5\n\t"
  36627. "ldr r2, [%[a], #12]\n\t"
  36628. "str r4, [%[r], #20]\n\t"
  36629. "lsr r5, r2, #1\n\t"
  36630. "lsl r2, r2, %[n]\n\t"
  36631. "lsr r5, r5, r6\n\t"
  36632. "orr r3, r3, r5\n\t"
  36633. "ldr r4, [%[a], #8]\n\t"
  36634. "str r3, [%[r], #16]\n\t"
  36635. "lsr r5, r4, #1\n\t"
  36636. "lsl r4, r4, %[n]\n\t"
  36637. "lsr r5, r5, r6\n\t"
  36638. "orr r2, r2, r5\n\t"
  36639. "ldr r3, [%[a], #4]\n\t"
  36640. "str r2, [%[r], #12]\n\t"
  36641. "lsr r5, r3, #1\n\t"
  36642. "lsl r3, r3, %[n]\n\t"
  36643. "lsr r5, r5, r6\n\t"
  36644. "orr r4, r4, r5\n\t"
  36645. "ldr r2, [%[a], #0]\n\t"
  36646. "str r4, [%[r], #8]\n\t"
  36647. "lsr r5, r2, #1\n\t"
  36648. "lsl r2, r2, %[n]\n\t"
  36649. "lsr r5, r5, r6\n\t"
  36650. "orr r3, r3, r5\n\t"
  /* Store the two lowest result words, r[0] and r[1]. */
  36651. "str r2, [%[r]]\n\t"
  36652. "str r3, [%[r], #4]\n\t"
  36653. :
  36654. : [r] "r" (r), [a] "r" (a), [n] "r" (n)
  36655. : "memory", "r2", "r3", "r4", "r5", "r6"
  36656. );
  36657. }
  /* Shift a 34-word number left by n bits. (r = a << n)
   *
   * Thirty-five words are written: r[0..33] hold the shifted number and r[34]
   * receives the bits shifted out of a[33]. Words are processed from the most
   * significant down, and every input word is loaded before the matching slot
   * of r is stored, so r may be the same buffer as a.
   *
   * r  Result of the shift; needs room for 35 words.
   * a  Number to shift; 34 words are read.
   * n  Number of bits to shift by. The code uses 31 - n as a shift count, so
   *    n is expected to be in the range 0..31.
   */
  36658. static void sp_521_lshift_34(sp_digit* r, const sp_digit* a, byte n)
  36659. {
  36660. __asm__ __volatile__ (
  /* r6 = 31 - n. Combined with the fixed ">> 1" below, (x >> 1) >> r6 gives
   * the top n bits of x, i.e. x >> (32 - n). */
  36661. "mov r6, #31\n\t"
  36662. "sub r6, r6, %[n]\n\t"
  /* Top word a[33]: its overflow bits become r[34]. */
  36663. "ldr r3, [%[a], #132]\n\t"
  36664. "lsr r4, r3, #1\n\t"
  36665. "lsl r3, r3, %[n]\n\t"
  36666. "lsr r4, r4, r6\n\t"
  /* Each following group loads the next lower word, stores the finished word
   * above it, and ORs the lower word's top bits into the pending word.
   * r2, r3 and r4 take turns holding the pending words. */
  36667. "ldr r2, [%[a], #128]\n\t"
  36668. "str r4, [%[r], #136]\n\t"
  36669. "lsr r5, r2, #1\n\t"
  36670. "lsl r2, r2, %[n]\n\t"
  36671. "lsr r5, r5, r6\n\t"
  36672. "orr r3, r3, r5\n\t"
  36673. "ldr r4, [%[a], #124]\n\t"
  36674. "str r3, [%[r], #132]\n\t"
  36675. "lsr r5, r4, #1\n\t"
  36676. "lsl r4, r4, %[n]\n\t"
  36677. "lsr r5, r5, r6\n\t"
  36678. "orr r2, r2, r5\n\t"
  36679. "ldr r3, [%[a], #120]\n\t"
  36680. "str r2, [%[r], #128]\n\t"
  36681. "lsr r5, r3, #1\n\t"
  36682. "lsl r3, r3, %[n]\n\t"
  36683. "lsr r5, r5, r6\n\t"
  36684. "orr r4, r4, r5\n\t"
  36685. "ldr r2, [%[a], #116]\n\t"
  36686. "str r4, [%[r], #124]\n\t"
  36687. "lsr r5, r2, #1\n\t"
  36688. "lsl r2, r2, %[n]\n\t"
  36689. "lsr r5, r5, r6\n\t"
  36690. "orr r3, r3, r5\n\t"
  36691. "ldr r4, [%[a], #112]\n\t"
  36692. "str r3, [%[r], #120]\n\t"
  36693. "lsr r5, r4, #1\n\t"
  36694. "lsl r4, r4, %[n]\n\t"
  36695. "lsr r5, r5, r6\n\t"
  36696. "orr r2, r2, r5\n\t"
  36697. "ldr r3, [%[a], #108]\n\t"
  36698. "str r2, [%[r], #116]\n\t"
  36699. "lsr r5, r3, #1\n\t"
  36700. "lsl r3, r3, %[n]\n\t"
  36701. "lsr r5, r5, r6\n\t"
  36702. "orr r4, r4, r5\n\t"
  36703. "ldr r2, [%[a], #104]\n\t"
  36704. "str r4, [%[r], #112]\n\t"
  36705. "lsr r5, r2, #1\n\t"
  36706. "lsl r2, r2, %[n]\n\t"
  36707. "lsr r5, r5, r6\n\t"
  36708. "orr r3, r3, r5\n\t"
  36709. "ldr r4, [%[a], #100]\n\t"
  36710. "str r3, [%[r], #108]\n\t"
  36711. "lsr r5, r4, #1\n\t"
  36712. "lsl r4, r4, %[n]\n\t"
  36713. "lsr r5, r5, r6\n\t"
  36714. "orr r2, r2, r5\n\t"
  36715. "ldr r3, [%[a], #96]\n\t"
  36716. "str r2, [%[r], #104]\n\t"
  36717. "lsr r5, r3, #1\n\t"
  36718. "lsl r3, r3, %[n]\n\t"
  36719. "lsr r5, r5, r6\n\t"
  36720. "orr r4, r4, r5\n\t"
  36721. "ldr r2, [%[a], #92]\n\t"
  36722. "str r4, [%[r], #100]\n\t"
  36723. "lsr r5, r2, #1\n\t"
  36724. "lsl r2, r2, %[n]\n\t"
  36725. "lsr r5, r5, r6\n\t"
  36726. "orr r3, r3, r5\n\t"
  36727. "ldr r4, [%[a], #88]\n\t"
  36728. "str r3, [%[r], #96]\n\t"
  36729. "lsr r5, r4, #1\n\t"
  36730. "lsl r4, r4, %[n]\n\t"
  36731. "lsr r5, r5, r6\n\t"
  36732. "orr r2, r2, r5\n\t"
  36733. "ldr r3, [%[a], #84]\n\t"
  36734. "str r2, [%[r], #92]\n\t"
  36735. "lsr r5, r3, #1\n\t"
  36736. "lsl r3, r3, %[n]\n\t"
  36737. "lsr r5, r5, r6\n\t"
  36738. "orr r4, r4, r5\n\t"
  36739. "ldr r2, [%[a], #80]\n\t"
  36740. "str r4, [%[r], #88]\n\t"
  36741. "lsr r5, r2, #1\n\t"
  36742. "lsl r2, r2, %[n]\n\t"
  36743. "lsr r5, r5, r6\n\t"
  36744. "orr r3, r3, r5\n\t"
  36745. "ldr r4, [%[a], #76]\n\t"
  36746. "str r3, [%[r], #84]\n\t"
  36747. "lsr r5, r4, #1\n\t"
  36748. "lsl r4, r4, %[n]\n\t"
  36749. "lsr r5, r5, r6\n\t"
  36750. "orr r2, r2, r5\n\t"
  36751. "ldr r3, [%[a], #72]\n\t"
  36752. "str r2, [%[r], #80]\n\t"
  36753. "lsr r5, r3, #1\n\t"
  36754. "lsl r3, r3, %[n]\n\t"
  36755. "lsr r5, r5, r6\n\t"
  36756. "orr r4, r4, r5\n\t"
  36757. "ldr r2, [%[a], #68]\n\t"
  36758. "str r4, [%[r], #76]\n\t"
  36759. "lsr r5, r2, #1\n\t"
  36760. "lsl r2, r2, %[n]\n\t"
  36761. "lsr r5, r5, r6\n\t"
  36762. "orr r3, r3, r5\n\t"
  36763. "ldr r4, [%[a], #64]\n\t"
  36764. "str r3, [%[r], #72]\n\t"
  36765. "lsr r5, r4, #1\n\t"
  36766. "lsl r4, r4, %[n]\n\t"
  36767. "lsr r5, r5, r6\n\t"
  36768. "orr r2, r2, r5\n\t"
  36769. "ldr r3, [%[a], #60]\n\t"
  36770. "str r2, [%[r], #68]\n\t"
  36771. "lsr r5, r3, #1\n\t"
  36772. "lsl r3, r3, %[n]\n\t"
  36773. "lsr r5, r5, r6\n\t"
  36774. "orr r4, r4, r5\n\t"
  36775. "ldr r2, [%[a], #56]\n\t"
  36776. "str r4, [%[r], #64]\n\t"
  36777. "lsr r5, r2, #1\n\t"
  36778. "lsl r2, r2, %[n]\n\t"
  36779. "lsr r5, r5, r6\n\t"
  36780. "orr r3, r3, r5\n\t"
  36781. "ldr r4, [%[a], #52]\n\t"
  36782. "str r3, [%[r], #60]\n\t"
  36783. "lsr r5, r4, #1\n\t"
  36784. "lsl r4, r4, %[n]\n\t"
  36785. "lsr r5, r5, r6\n\t"
  36786. "orr r2, r2, r5\n\t"
  36787. "ldr r3, [%[a], #48]\n\t"
  36788. "str r2, [%[r], #56]\n\t"
  36789. "lsr r5, r3, #1\n\t"
  36790. "lsl r3, r3, %[n]\n\t"
  36791. "lsr r5, r5, r6\n\t"
  36792. "orr r4, r4, r5\n\t"
  36793. "ldr r2, [%[a], #44]\n\t"
  36794. "str r4, [%[r], #52]\n\t"
  36795. "lsr r5, r2, #1\n\t"
  36796. "lsl r2, r2, %[n]\n\t"
  36797. "lsr r5, r5, r6\n\t"
  36798. "orr r3, r3, r5\n\t"
  36799. "ldr r4, [%[a], #40]\n\t"
  36800. "str r3, [%[r], #48]\n\t"
  36801. "lsr r5, r4, #1\n\t"
  36802. "lsl r4, r4, %[n]\n\t"
  36803. "lsr r5, r5, r6\n\t"
  36804. "orr r2, r2, r5\n\t"
  36805. "ldr r3, [%[a], #36]\n\t"
  36806. "str r2, [%[r], #44]\n\t"
  36807. "lsr r5, r3, #1\n\t"
  36808. "lsl r3, r3, %[n]\n\t"
  36809. "lsr r5, r5, r6\n\t"
  36810. "orr r4, r4, r5\n\t"
  36811. "ldr r2, [%[a], #32]\n\t"
  36812. "str r4, [%[r], #40]\n\t"
  36813. "lsr r5, r2, #1\n\t"
  36814. "lsl r2, r2, %[n]\n\t"
  36815. "lsr r5, r5, r6\n\t"
  36816. "orr r3, r3, r5\n\t"
  36817. "ldr r4, [%[a], #28]\n\t"
  36818. "str r3, [%[r], #36]\n\t"
  36819. "lsr r5, r4, #1\n\t"
  36820. "lsl r4, r4, %[n]\n\t"
  36821. "lsr r5, r5, r6\n\t"
  36822. "orr r2, r2, r5\n\t"
  36823. "ldr r3, [%[a], #24]\n\t"
  36824. "str r2, [%[r], #32]\n\t"
  36825. "lsr r5, r3, #1\n\t"
  36826. "lsl r3, r3, %[n]\n\t"
  36827. "lsr r5, r5, r6\n\t"
  36828. "orr r4, r4, r5\n\t"
  36829. "ldr r2, [%[a], #20]\n\t"
  36830. "str r4, [%[r], #28]\n\t"
  36831. "lsr r5, r2, #1\n\t"
  36832. "lsl r2, r2, %[n]\n\t"
  36833. "lsr r5, r5, r6\n\t"
  36834. "orr r3, r3, r5\n\t"
  36835. "ldr r4, [%[a], #16]\n\t"
  36836. "str r3, [%[r], #24]\n\t"
  36837. "lsr r5, r4, #1\n\t"
  36838. "lsl r4, r4, %[n]\n\t"
  36839. "lsr r5, r5, r6\n\t"
  36840. "orr r2, r2, r5\n\t"
  36841. "ldr r3, [%[a], #12]\n\t"
  36842. "str r2, [%[r], #20]\n\t"
  36843. "lsr r5, r3, #1\n\t"
  36844. "lsl r3, r3, %[n]\n\t"
  36845. "lsr r5, r5, r6\n\t"
  36846. "orr r4, r4, r5\n\t"
  36847. "ldr r2, [%[a], #8]\n\t"
  36848. "str r4, [%[r], #16]\n\t"
  36849. "lsr r5, r2, #1\n\t"
  36850. "lsl r2, r2, %[n]\n\t"
  36851. "lsr r5, r5, r6\n\t"
  36852. "orr r3, r3, r5\n\t"
  36853. "ldr r4, [%[a], #4]\n\t"
  36854. "str r3, [%[r], #12]\n\t"
  36855. "lsr r5, r4, #1\n\t"
  36856. "lsl r4, r4, %[n]\n\t"
  36857. "lsr r5, r5, r6\n\t"
  36858. "orr r2, r2, r5\n\t"
  36859. "ldr r3, [%[a], #0]\n\t"
  36860. "str r2, [%[r], #8]\n\t"
  36861. "lsr r5, r3, #1\n\t"
  36862. "lsl r3, r3, %[n]\n\t"
  36863. "lsr r5, r5, r6\n\t"
  36864. "orr r4, r4, r5\n\t"
  /* Store the two lowest result words, r[0] and r[1]. */
  36865. "str r3, [%[r]]\n\t"
  36866. "str r4, [%[r], #4]\n\t"
  36867. :
  36868. : [r] "r" (r), [a] "r" (a), [n] "r" (n)
  36869. : "memory", "r2", "r3", "r4", "r5", "r6"
  36870. );
  36871. }
  36872. #ifdef WOLFSSL_SP_SMALL
  36873. /* Sub b from a into a. (a -= b)
  36874. *
  36875. * a A single precision integer.
  36876. * b A single precision integer.
  36877. */
  36878. SP_NOINLINE static sp_digit sp_521_sub_in_place_17(sp_digit* a,
  36879. const sp_digit* b)
  36880. {
  36881. sp_digit c = 0;
  36882. __asm__ __volatile__ (
  36883. "mov r8, %[a]\n\t"
  36884. "add r8, r8, #64\n\t"
  36885. "\n1:\n\t"
  36886. "mov r5, #0\n\t"
  36887. "subs r5, r5, %[c]\n\t"
  36888. "ldr r3, [%[a]]\n\t"
  36889. "ldr r4, [%[a], #4]\n\t"
  36890. "ldr r5, [%[b]]\n\t"
  36891. "ldr r6, [%[b], #4]\n\t"
  36892. "sbcs r3, r3, r5\n\t"
  36893. "sbcs r4, r4, r6\n\t"
  36894. "str r3, [%[a]]\n\t"
  36895. "str r4, [%[a], #4]\n\t"
  36896. "sbc %[c], %[c], %[c]\n\t"
  36897. "add %[a], %[a], #8\n\t"
  36898. "add %[b], %[b], #8\n\t"
  36899. "cmp %[a], r8\n\t"
  36900. #ifdef __GNUC__
  36901. "bne 1b\n\t"
  36902. #else
  36903. "bne.n 1b\n\t"
  36904. #endif /* __GNUC__ */
  36905. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  36906. :
  36907. : "memory", "r3", "r4", "r5", "r6", "r8"
  36908. );
  36909. return c;
  36910. }
  36911. #else
  36912. /* Sub b from a into r. (r = a - b)
  36913. *
  36914. * r A single precision integer.
  36915. * a A single precision integer.
  36916. * b A single precision integer.
  36917. */
  36918. SP_NOINLINE static sp_digit sp_521_sub_in_place_17(sp_digit* a,
  36919. const sp_digit* b)
  36920. {
  36921. sp_digit c = 0;
  36922. __asm__ __volatile__ (
  36923. "ldm %[a], {r3, r4}\n\t"
  36924. "ldm %[b]!, {r5, r6}\n\t"
  36925. "subs r3, r3, r5\n\t"
  36926. "sbcs r4, r4, r6\n\t"
  36927. "stm %[a]!, {r3, r4}\n\t"
  36928. "ldm %[a], {r3, r4}\n\t"
  36929. "ldm %[b]!, {r5, r6}\n\t"
  36930. "sbcs r3, r3, r5\n\t"
  36931. "sbcs r4, r4, r6\n\t"
  36932. "stm %[a]!, {r3, r4}\n\t"
  36933. "ldm %[a], {r3, r4}\n\t"
  36934. "ldm %[b]!, {r5, r6}\n\t"
  36935. "sbcs r3, r3, r5\n\t"
  36936. "sbcs r4, r4, r6\n\t"
  36937. "stm %[a]!, {r3, r4}\n\t"
  36938. "ldm %[a], {r3, r4}\n\t"
  36939. "ldm %[b]!, {r5, r6}\n\t"
  36940. "sbcs r3, r3, r5\n\t"
  36941. "sbcs r4, r4, r6\n\t"
  36942. "stm %[a]!, {r3, r4}\n\t"
  36943. "ldm %[a], {r3, r4}\n\t"
  36944. "ldm %[b]!, {r5, r6}\n\t"
  36945. "sbcs r3, r3, r5\n\t"
  36946. "sbcs r4, r4, r6\n\t"
  36947. "stm %[a]!, {r3, r4}\n\t"
  36948. "ldm %[a], {r3, r4}\n\t"
  36949. "ldm %[b]!, {r5, r6}\n\t"
  36950. "sbcs r3, r3, r5\n\t"
  36951. "sbcs r4, r4, r6\n\t"
  36952. "stm %[a]!, {r3, r4}\n\t"
  36953. "ldm %[a], {r3, r4}\n\t"
  36954. "ldm %[b]!, {r5, r6}\n\t"
  36955. "sbcs r3, r3, r5\n\t"
  36956. "sbcs r4, r4, r6\n\t"
  36957. "stm %[a]!, {r3, r4}\n\t"
  36958. "ldm %[a], {r3, r4}\n\t"
  36959. "ldm %[b]!, {r5, r6}\n\t"
  36960. "sbcs r3, r3, r5\n\t"
  36961. "sbcs r4, r4, r6\n\t"
  36962. "stm %[a]!, {r3, r4}\n\t"
  36963. "ldr r3, [%[a]]\n\t"
  36964. "ldr r5, [%[b]]\n\t"
  36965. "sbcs r3, r3, r5\n\t"
  36966. "str r3, [%[a]]\n\t"
  36967. "sbc %[c], %[c], %[c]\n\t"
  36968. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  36969. :
  36970. : "memory", "r3", "r4", "r5", "r6"
  36971. );
  36972. return c;
  36973. }
  36974. #endif /* WOLFSSL_SP_SMALL */
  36975. /* Mul a by digit b into r. (r = a * b)
  36976. *
  36977. * r A single precision integer.
  36978. * a A single precision integer.
  36979. * b A single precision digit.
  36980. */
  36981. SP_NOINLINE static void sp_521_mul_d_17(sp_digit* r, const sp_digit* a,
  36982. sp_digit b)
  36983. {
  36984. __asm__ __volatile__ (
  36985. "add r9, %[a], #68\n\t"
  36986. /* A[0] * B */
  36987. "ldr r6, [%[a]], #4\n\t"
  36988. "umull r5, r3, r6, %[b]\n\t"
  36989. "mov r4, #0\n\t"
  36990. "str r5, [%[r]], #4\n\t"
  36991. /* A[0] * B - Done */
  36992. "\n1:\n\t"
  36993. "mov r5, #0\n\t"
  36994. /* A[] * B */
  36995. "ldr r6, [%[a]], #4\n\t"
  36996. "umull r6, r8, r6, %[b]\n\t"
  36997. "adds r3, r3, r6\n\t"
  36998. "adcs r4, r4, r8\n\t"
  36999. "adc r5, r5, #0\n\t"
  37000. /* A[] * B - Done */
  37001. "str r3, [%[r]], #4\n\t"
  37002. "mov r3, r4\n\t"
  37003. "mov r4, r5\n\t"
  37004. "cmp %[a], r9\n\t"
  37005. #ifdef __GNUC__
  37006. "blt 1b\n\t"
  37007. #else
  37008. "blt.n 1b\n\t"
  37009. #endif /* __GNUC__ */
  37010. "str r3, [%[r]]\n\t"
  37011. : [r] "+r" (r), [a] "+r" (a)
  37012. : [b] "r" (b)
  37013. : "memory", "r3", "r4", "r5", "r6", "r8", "r9"
  37014. );
  37015. }
  37016. /* Divide the double width number (d1|d0) by the divisor. (d1|d0 / div)
  37017. *
  37018. * d1 The high order half of the number to divide.
  37019. * d0 The low order half of the number to divide.
  37020. * div The divisor.
  37021. * returns the result of the division.
  37022. *
  37023. * Note that this is an approximate div. It may give an answer 1 larger.
  37024. */
  37025. SP_NOINLINE static sp_digit div_521_word_17(sp_digit d1, sp_digit d0,
  37026. sp_digit div)
  37027. {
  37028. sp_digit r = 0;
  37029. __asm__ __volatile__ (
  37030. "lsr r6, %[div], #16\n\t"
  37031. "add r6, r6, #1\n\t"
  37032. "udiv r4, %[d1], r6\n\t"
  37033. "lsl r8, r4, #16\n\t"
  37034. "umull r4, r5, %[div], r8\n\t"
  37035. "subs %[d0], %[d0], r4\n\t"
  37036. "sbc %[d1], %[d1], r5\n\t"
  37037. "udiv r5, %[d1], r6\n\t"
  37038. "lsl r4, r5, #16\n\t"
  37039. "add r8, r8, r4\n\t"
  37040. "umull r4, r5, %[div], r4\n\t"
  37041. "subs %[d0], %[d0], r4\n\t"
  37042. "sbc %[d1], %[d1], r5\n\t"
  37043. "lsl r4, %[d1], #16\n\t"
  37044. "orr r4, r4, %[d0], lsr #16\n\t"
  37045. "udiv r4, r4, r6\n\t"
  37046. "add r8, r8, r4\n\t"
  37047. "umull r4, r5, %[div], r4\n\t"
  37048. "subs %[d0], %[d0], r4\n\t"
  37049. "sbc %[d1], %[d1], r5\n\t"
  37050. "lsl r4, %[d1], #16\n\t"
  37051. "orr r4, r4, %[d0], lsr #16\n\t"
  37052. "udiv r4, r4, r6\n\t"
  37053. "add r8, r8, r4\n\t"
  37054. "umull r4, r5, %[div], r4\n\t"
  37055. "subs %[d0], %[d0], r4\n\t"
  37056. "sbc %[d1], %[d1], r5\n\t"
  37057. "udiv r4, %[d0], %[div]\n\t"
  37058. "add r8, r8, r4\n\t"
  37059. "mov %[r], r8\n\t"
  37060. : [r] "+r" (r)
  37061. : [d1] "r" (d1), [d0] "r" (d0), [div] "r" (div)
  37062. : "r4", "r5", "r6", "r8"
  37063. );
  37064. return r;
  37065. }
  37066. /* AND m into each word of a and store in r.
  37067. *
  37068. * r A single precision integer.
  37069. * a A single precision integer.
  37070. * m Mask to AND against each digit.
  37071. */
  37072. static void sp_521_mask_17(sp_digit* r, const sp_digit* a, sp_digit m)
  37073. {
  37074. #ifdef WOLFSSL_SP_SMALL
  37075. int i;
  37076. for (i=0; i<17; i++) {
  37077. r[i] = a[i] & m;
  37078. }
  37079. #else
  37080. int i;
  37081. for (i = 0; i < 16; i += 8) {
  37082. r[i+0] = a[i+0] & m;
  37083. r[i+1] = a[i+1] & m;
  37084. r[i+2] = a[i+2] & m;
  37085. r[i+3] = a[i+3] & m;
  37086. r[i+4] = a[i+4] & m;
  37087. r[i+5] = a[i+5] & m;
  37088. r[i+6] = a[i+6] & m;
  37089. r[i+7] = a[i+7] & m;
  37090. }
  37091. r[16] = a[16] & m;
  37092. #endif
  37093. }
  37094. /* Divide d in a and put remainder into r (m*d + r = a)
  37095. * m is not calculated as it is not needed at this time.
  37096. *
  37097. * a Number to be divided.
  37098. * d Number to divide with.
  37099. * m Multiplier result.
  37100. * r Remainder from the division.
  37101. * returns MP_OKAY indicating success.
  37102. */
  37103. static WC_INLINE int sp_521_div_17(const sp_digit* a, const sp_digit* d, sp_digit* m,
  37104. sp_digit* r)
  37105. {
  37106. sp_digit t1[35];
  37107. sp_digit t2[18];
  37108. sp_digit sd[18];
  37109. sp_digit div;
  37110. sp_digit r1;
  37111. int i;
  37112. ASSERT_SAVED_VECTOR_REGISTERS();
  37113. (void)m;
  37114. div = (d[16] << 23) | (d[15] >> 9);
  37115. XMEMCPY(t1, a, sizeof(*t1) * 2 * 17);
  37116. r1 = sp_521_cmp_17(&t1[17], d) >= 0;
  37117. sp_521_cond_sub_17(&t1[17], &t1[17], d, (sp_digit)0 - r1);
  37118. sp_521_lshift_17(sd, d, 23);
  37119. sp_521_lshift_34(t1, t1, 23);
  37120. for (i = 16; i >= 0; i--) {
  37121. sp_digit hi = t1[17 + i] - (t1[17 + i] == div);
  37122. r1 = div_521_word_17(hi, t1[17 + i - 1], div);
  37123. sp_521_mul_d_17(t2, sd, r1);
  37124. t1[17 + i] += sp_521_sub_in_place_17(&t1[i], t2);
  37125. t1[17 + i] -= t2[17];
  37126. sp_521_mask_17(t2, sd, t1[17 + i]);
  37127. t1[17 + i] += sp_521_add_17(&t1[i], &t1[i], t2);
  37128. sp_521_mask_17(t2, sd, t1[17 + i]);
  37129. t1[17 + i] += sp_521_add_17(&t1[i], &t1[i], t2);
  37130. }
  37131. r1 = sp_521_cmp_17(t1, sd) >= 0;
  37132. sp_521_cond_sub_17(r, t1, sd, (sp_digit)0 - r1);
  37133. sp_521_rshift_17(r, r, 23);
  37134. return MP_OKAY;
  37135. }
  37136. /* Reduce a modulo m into r. (r = a mod m)
  37137. *
  37138. * r A single precision number that is the reduced result.
  37139. * a A single precision number that is to be reduced.
  37140. * m A single precision number that is the modulus to reduce with.
  37141. * returns MP_OKAY indicating success.
  37142. */
  37143. static WC_INLINE int sp_521_mod_17(sp_digit* r, const sp_digit* a, const sp_digit* m)
  37144. {
  37145. return sp_521_div_17(a, m, NULL, r);
  37146. }
  37147. #endif
  37148. #if defined(HAVE_ECC_SIGN) || defined(HAVE_ECC_VERIFY)
  37149. /* Multiply two number mod the order of P521 curve. (r = a * b mod order)
  37150. *
  37151. * r Result of the multiplication.
  37152. * a First operand of the multiplication.
  37153. * b Second operand of the multiplication.
  37154. */
  37155. static void sp_521_mont_mul_order_17(sp_digit* r, const sp_digit* a, const sp_digit* b)
  37156. {
  37157. sp_521_mul_17(r, a, b);
  37158. sp_521_mont_reduce_order_17(r, p521_order, p521_mp_order);
  37159. }
  37160. #if defined(HAVE_ECC_SIGN) || (defined(HAVE_ECC_VERIFY) && defined(WOLFSSL_SP_SMALL))
  #ifdef WOLFSSL_SP_SMALL
  /* Order-2 for the P521 curve: 17 words of 32 bits, least significant
   * word first. */
  static const uint32_t p521_order_minus_2[17] = {
      0x91386407U, 0xbb6fb71eU, 0x899c47aeU, 0x3bb5c9b8U,
      0xf709a5d0U, 0x7fcc0148U, 0xbf2f966bU, 0x51868783U,
      0xfffffffaU, 0xffffffffU, 0xffffffffU, 0xffffffffU,
      0xffffffffU, 0xffffffffU, 0xffffffffU, 0xffffffffU,
      0x000001ffU
  };
  #else
  /* The low half of the order-2 of the P521 curve: the 9 least significant
   * 32-bit words, least significant word first. */
  static const uint32_t p521_order_low[9] = {
      0x91386407U, 0xbb6fb71eU, 0x899c47aeU,
      0x3bb5c9b8U, 0xf709a5d0U, 0x7fcc0148U,
      0xbf2f966bU, 0x51868783U, 0xfffffffaU
  };
  #endif /* WOLFSSL_SP_SMALL */
  37175. /* Square number mod the order of P521 curve. (r = a * a mod order)
  37176. *
  37177. * r Result of the squaring.
  37178. * a Number to square.
  37179. */
  37180. static void sp_521_mont_sqr_order_17(sp_digit* r, const sp_digit* a)
  37181. {
  37182. sp_521_sqr_17(r, a);
  37183. sp_521_mont_reduce_order_17(r, p521_order, p521_mp_order);
  37184. }
  37185. #ifndef WOLFSSL_SP_SMALL
  37186. /* Square number mod the order of P521 curve a number of times.
  37187. * (r = a ^ n mod order)
  37188. *
  37189. * r Result of the squaring.
  37190. * a Number to square.
  37191. */
  37192. static void sp_521_mont_sqr_n_order_17(sp_digit* r, const sp_digit* a, int n)
  37193. {
  37194. int i;
  37195. sp_521_mont_sqr_order_17(r, a);
  37196. for (i=1; i<n; i++) {
  37197. sp_521_mont_sqr_order_17(r, r);
  37198. }
  37199. }
  37200. #endif /* !WOLFSSL_SP_SMALL */
  37201. /* Invert the number, in Montgomery form, modulo the order of the P521 curve.
  37202. * (r = 1 / a mod order)
  37203. *
  37204. * r Inverse result.
  37205. * a Number to invert.
  37206. * td Temporary data.
  37207. */
  37208. #ifdef WOLFSSL_SP_NONBLOCK
  37209. typedef struct sp_521_mont_inv_order_17_ctx {
  37210. int state;
  37211. int i;
  37212. } sp_521_mont_inv_order_17_ctx;
  37213. static int sp_521_mont_inv_order_17_nb(sp_ecc_ctx_t* sp_ctx, sp_digit* r, const sp_digit* a,
  37214. sp_digit* t)
  37215. {
  37216. int err = FP_WOULDBLOCK;
  37217. sp_521_mont_inv_order_17_ctx* ctx = (sp_521_mont_inv_order_17_ctx*)sp_ctx;
  37218. typedef char ctx_size_test[sizeof(sp_521_mont_inv_order_17_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  37219. (void)sizeof(ctx_size_test);
  37220. switch (ctx->state) {
  37221. case 0:
  37222. XMEMCPY(t, a, sizeof(sp_digit) * 17);
  37223. ctx->i = 519;
  37224. ctx->state = 1;
  37225. break;
  37226. case 1:
  37227. sp_521_mont_sqr_order_17(t, t);
  37228. ctx->state = 2;
  37229. break;
  37230. case 2:
  37231. if ((p521_order_minus_2[ctx->i / 32] & ((sp_int_digit)1 << (ctx->i % 32))) != 0) {
  37232. sp_521_mont_mul_order_17(t, t, a);
  37233. }
  37234. ctx->i--;
  37235. ctx->state = (ctx->i == 0) ? 3 : 1;
  37236. break;
  37237. case 3:
  37238. XMEMCPY(r, t, sizeof(sp_digit) * 17U);
  37239. err = MP_OKAY;
  37240. break;
  37241. }
  37242. return err;
  37243. }
  37244. #endif /* WOLFSSL_SP_NONBLOCK */
  37245. static void sp_521_mont_inv_order_17(sp_digit* r, const sp_digit* a,
  37246. sp_digit* td)
  37247. {
  37248. #ifdef WOLFSSL_SP_SMALL
  37249. sp_digit* t = td;
  37250. int i;
  37251. XMEMCPY(t, a, sizeof(sp_digit) * 17);
  37252. for (i=519; i>=0; i--) {
  37253. sp_521_mont_sqr_order_17(t, t);
  37254. if ((p521_order_minus_2[i / 32] & ((sp_int_digit)1 << (i % 32))) != 0) {
  37255. sp_521_mont_mul_order_17(t, t, a);
  37256. }
  37257. }
  37258. XMEMCPY(r, t, sizeof(sp_digit) * 17U);
  37259. #else
  37260. sp_digit* t = td;
  37261. sp_digit* t2 = td + 2 * 17;
  37262. sp_digit* t3 = td + 4 * 17;
  37263. int i;
  37264. /* t = a^2 */
  37265. sp_521_mont_sqr_order_17(t, a);
  37266. /* t = a^3 = t * a */
  37267. sp_521_mont_mul_order_17(t, t, a);
  37268. /* t= a^c = t ^ 2 ^ 2 */
  37269. sp_521_mont_sqr_n_order_17(t2, t, 2);
  37270. /* t = a^f = t2 * t */
  37271. sp_521_mont_mul_order_17(t, t2, t);
  37272. /* t3 = a^1e */
  37273. sp_521_mont_sqr_order_17(t3, t);
  37274. /* t3 = a^1f = t3 * a */
  37275. sp_521_mont_mul_order_17(t3, t3, a);
  37276. /* t2= a^f0 = t ^ 2 ^ 4 */
  37277. sp_521_mont_sqr_n_order_17(t2, t, 4);
  37278. /* t = a^ff = t2 * t */
  37279. sp_521_mont_mul_order_17(t, t2, t);
  37280. /* t2= a^ff00 = t ^ 2 ^ 8 */
  37281. sp_521_mont_sqr_n_order_17(t2, t, 8);
  37282. /* t3= a^ffff = t2 * t */
  37283. sp_521_mont_mul_order_17(t, t2, t);
  37284. /* t2= a^ffff0000 = t ^ 2 ^ 16 */
  37285. sp_521_mont_sqr_n_order_17(t2, t, 16);
  37286. /* t = a^ffffffff = t2 * t */
  37287. sp_521_mont_mul_order_17(t, t2, t);
  37288. /* t2= a^ffffffff00000000 = t ^ 2 ^ 32 */
  37289. sp_521_mont_sqr_n_order_17(t2, t, 32);
  37290. /* t = a^ffffffffffffffff = t2 * t */
  37291. sp_521_mont_mul_order_17(t, t2, t);
  37292. /* t2= a^ffffffffffffffff0000000000000000 = t ^ 2 ^ 64 */
  37293. sp_521_mont_sqr_n_order_17(t2, t, 64);
  37294. /* t = a^ffffffffffffffffffffffffffffffff = t2 * t */
  37295. sp_521_mont_mul_order_17(t, t2, t);
  37296. /* t2= a^ffffffffffffffffffffffffffffffff00000000000000000000000000000000 = t ^ 2 ^ 128 */
  37297. sp_521_mont_sqr_n_order_17(t2, t, 128);
  37298. /* t = a^ffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff = t2 * t */
  37299. sp_521_mont_mul_order_17(t, t2, t);
  37300. /* t2 = a^1fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffe0 */
  37301. sp_521_mont_sqr_n_order_17(t2, t, 5);
  37302. /* t2 = a^1fffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff = t * t3 */
  37303. sp_521_mont_mul_order_17(t2, t2, t3);
  37304. for (i=259; i>=1; i--) {
  37305. sp_521_mont_sqr_order_17(t2, t2);
  37306. if ((p521_order_low[i / 32] & ((sp_int_digit)1 << (i % 32))) != 0) {
  37307. sp_521_mont_mul_order_17(t2, t2, a);
  37308. }
  37309. }
  37310. sp_521_mont_sqr_order_17(t2, t2);
  37311. sp_521_mont_mul_order_17(r, t2, a);
  37312. #endif /* WOLFSSL_SP_SMALL */
  37313. }
  37314. #endif /* HAVE_ECC_SIGN || (HAVE_ECC_VERIFY && WOLFSSL_SP_SMALL) */
  37315. #endif /* HAVE_ECC_SIGN | HAVE_ECC_VERIFY */
  37316. #ifdef HAVE_ECC_SIGN
  37317. #ifndef SP_ECC_MAX_SIG_GEN
  37318. #define SP_ECC_MAX_SIG_GEN 64
  37319. #endif
  37320. /* Calculate second signature value S from R, k and private value.
  37321. *
  37322. * s = (r * x + e) / k
  37323. *
  37324. * s Signature value.
  37325. * r First signature value.
  37326. * k Ephemeral private key.
  37327. * x Private key as a number.
  37328. * e Hash of message as a number.
  37329. * tmp Temporary storage for intermediate numbers.
  37330. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  37331. */
  37332. static int sp_521_calc_s_17(sp_digit* s, const sp_digit* r, sp_digit* k,
  37333. sp_digit* x, const sp_digit* e, sp_digit* tmp)
  37334. {
  37335. int err;
  37336. sp_digit carry;
  37337. sp_int32 c;
  37338. sp_digit* kInv = k;
  37339. /* Conv k to Montgomery form (mod order) */
  37340. sp_521_mul_17(k, k, p521_norm_order);
  37341. err = sp_521_mod_17(k, k, p521_order);
  37342. if (err == MP_OKAY) {
  37343. sp_521_norm_17(k);
  37344. /* kInv = 1/k mod order */
  37345. sp_521_mont_inv_order_17(kInv, k, tmp);
  37346. sp_521_norm_17(kInv);
  37347. /* s = r * x + e */
  37348. sp_521_mul_17(x, x, r);
  37349. err = sp_521_mod_17(x, x, p521_order);
  37350. }
  37351. if (err == MP_OKAY) {
  37352. sp_521_norm_17(x);
  37353. carry = sp_521_add_17(s, e, x);
  37354. sp_521_cond_sub_17(s, s, p521_order, 0 - carry);
  37355. sp_521_norm_17(s);
  37356. c = sp_521_cmp_17(s, p521_order);
  37357. sp_521_cond_sub_17(s, s, p521_order,
  37358. (sp_digit)0 - (sp_digit)(c >= 0));
  37359. sp_521_norm_17(s);
  37360. /* s = s * k^-1 mod order */
  37361. sp_521_mont_mul_order_17(s, s, kInv);
  37362. sp_521_norm_17(s);
  37363. }
  37364. return err;
  37365. }
  37366. /* Sign the hash using the private key.
  37367. * e = [hash, 521 bits] from binary
  37368. * r = (k.G)->x mod order
  37369. * s = (r * x + e) / k mod order
  37370. * The hash is truncated to the first 521 bits.
  37371. *
  37372. * hash Hash to sign.
  37373. * hashLen Length of the hash data.
  37374. * rng Random number generator.
  37375. * priv Private part of key - scalar.
  37376. * rm First part of result as an mp_int.
  37377. * sm Second part of result as an mp_int.
  37378. * heap Heap to use for allocation.
  37379. * returns RNG failures, MEMORY_E when memory allocation fails and
  37380. * MP_OKAY on success.
  37381. */
  37382. #ifdef WOLFSSL_SP_NONBLOCK
  /* State kept between calls of the non-blocking P-521 sign operation. */
  37383. typedef struct sp_ecc_sign_521_ctx {
  /* Step of the sign state machine to run on the next call (0..10). */
  37384. int state;
  /* Contexts of the nested non-blocking operations. They share storage and
   * each is zeroed before the step that uses it. */
  37385. union {
  37386. sp_521_ecc_mulmod_17_ctx mulmod_ctx;
  37387. sp_521_mont_inv_order_17_ctx mont_inv_order_ctx;
  37388. };
  /* Hash of the message as a number; also used as the buffer for s. */
  37389. sp_digit e[2*17];
  /* Private key as a number; later holds r * x mod order. */
  37390. sp_digit x[2*17];
  /* Ephemeral private key; also used as the buffer for its inverse. */
  37391. sp_digit k[2*17];
  /* First signature value: x-ordinate of the point mod order. */
  37392. sp_digit r[2*17];
  /* Temporary storage passed to the inversion. */
  37393. sp_digit tmp[3 * 2*17];
  /* Result of multiplying the base point by k. */
  37394. sp_point_521 point;
  /* Second signature value; set to point at e. */
  37395. sp_digit* s;
  /* Inverse of k; set to point at k. */
  37396. sp_digit* kInv;
  /* Generation attempts left, starting from SP_ECC_MAX_SIG_GEN. */
  37397. int i;
  37398. } sp_ecc_sign_521_ctx;
  37399. int sp_ecc_sign_521_nb(sp_ecc_ctx_t* sp_ctx, const byte* hash, word32 hashLen, WC_RNG* rng,
  37400. mp_int* priv, mp_int* rm, mp_int* sm, mp_int* km, void* heap)
  37401. {
  37402. int err = FP_WOULDBLOCK;
  37403. sp_ecc_sign_521_ctx* ctx = (sp_ecc_sign_521_ctx*)sp_ctx->data;
  37404. typedef char ctx_size_test[sizeof(sp_ecc_sign_521_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  37405. (void)sizeof(ctx_size_test);
  37406. (void)heap;
  37407. switch (ctx->state) {
  37408. case 0: /* INIT */
  37409. ctx->s = ctx->e;
  37410. ctx->kInv = ctx->k;
  37411. ctx->i = SP_ECC_MAX_SIG_GEN;
  37412. ctx->state = 1;
  37413. break;
  37414. case 1: /* GEN */
  37415. /* New random point. */
  37416. if (km == NULL || mp_iszero(km)) {
  37417. err = sp_521_ecc_gen_k_17(rng, ctx->k);
  37418. }
  37419. else {
  37420. sp_521_from_mp(ctx->k, 17, km);
  37421. mp_zero(km);
  37422. }
  37423. XMEMSET(&ctx->mulmod_ctx, 0, sizeof(ctx->mulmod_ctx));
  37424. ctx->state = 2;
  37425. break;
  37426. case 2: /* MULMOD */
  37427. err = sp_521_ecc_mulmod_17_nb((sp_ecc_ctx_t*)&ctx->mulmod_ctx,
  37428. &ctx->point, &p521_base, ctx->k, 1, 1, heap);
  37429. if (err == MP_OKAY) {
  37430. ctx->state = 3;
  37431. }
  37432. break;
  37433. case 3: /* MODORDER */
  37434. {
  37435. sp_int32 c;
  37436. /* r = point->x mod order */
  37437. XMEMCPY(ctx->r, ctx->point.x, sizeof(sp_digit) * 17U);
  37438. sp_521_norm_17(ctx->r);
  37439. c = sp_521_cmp_17(ctx->r, p521_order);
  37440. sp_521_cond_sub_17(ctx->r, ctx->r, p521_order,
  37441. (sp_digit)0 - (sp_digit)(c >= 0));
  37442. sp_521_norm_17(ctx->r);
  37443. if (hashLen > 66U) {
  37444. hashLen = 66U;
  37445. }
  37446. sp_521_from_mp(ctx->x, 17, priv);
  37447. sp_521_from_bin(ctx->e, 17, hash, (int)hashLen);
  37448. if (hashLen == 66U) {
  37449. sp_521_rshift_17(ctx->e, ctx->e, 7);
  37450. }
  37451. ctx->state = 4;
  37452. break;
  37453. }
  37454. case 4: /* KMODORDER */
  37455. /* Conv k to Montgomery form (mod order) */
  37456. sp_521_mul_17(ctx->k, ctx->k, p521_norm_order);
  37457. err = sp_521_mod_17(ctx->k, ctx->k, p521_order);
  37458. if (err == MP_OKAY) {
  37459. sp_521_norm_17(ctx->k);
  37460. XMEMSET(&ctx->mont_inv_order_ctx, 0, sizeof(ctx->mont_inv_order_ctx));
  37461. ctx->state = 5;
  37462. }
  37463. break;
  37464. case 5: /* KINV */
  37465. /* kInv = 1/k mod order */
  37466. err = sp_521_mont_inv_order_17_nb((sp_ecc_ctx_t*)&ctx->mont_inv_order_ctx, ctx->kInv, ctx->k, ctx->tmp);
  37467. if (err == MP_OKAY) {
  37468. XMEMSET(&ctx->mont_inv_order_ctx, 0, sizeof(ctx->mont_inv_order_ctx));
  37469. ctx->state = 6;
  37470. }
  37471. break;
  37472. case 6: /* KINVNORM */
  37473. sp_521_norm_17(ctx->kInv);
  37474. ctx->state = 7;
  37475. break;
  37476. case 7: /* R */
  37477. /* s = r * x + e */
  37478. sp_521_mul_17(ctx->x, ctx->x, ctx->r);
  37479. ctx->state = 8;
  37480. break;
  37481. case 8: /* S1 */
  37482. err = sp_521_mod_17(ctx->x, ctx->x, p521_order);
  37483. if (err == MP_OKAY)
  37484. ctx->state = 9;
  37485. break;
  37486. case 9: /* S2 */
  37487. {
  37488. sp_digit carry;
  37489. sp_int32 c;
  37490. sp_521_norm_17(ctx->x);
  37491. carry = sp_521_add_17(ctx->s, ctx->e, ctx->x);
  37492. sp_521_cond_sub_17(ctx->s, ctx->s,
  37493. p521_order, 0 - carry);
  37494. sp_521_norm_17(ctx->s);
  37495. c = sp_521_cmp_17(ctx->s, p521_order);
  37496. sp_521_cond_sub_17(ctx->s, ctx->s, p521_order,
  37497. (sp_digit)0 - (sp_digit)(c >= 0));
  37498. sp_521_norm_17(ctx->s);
  37499. /* s = s * k^-1 mod order */
  37500. sp_521_mont_mul_order_17(ctx->s, ctx->s, ctx->kInv);
  37501. sp_521_norm_17(ctx->s);
  37502. /* Check that signature is usable. */
  37503. if (sp_521_iszero_17(ctx->s) == 0) {
  37504. ctx->state = 10;
  37505. break;
  37506. }
  37507. #ifdef WOLFSSL_ECDSA_SET_K_ONE_LOOP
  37508. ctx->i = 1;
  37509. #endif
  37510. /* not usable gen, try again */
  37511. ctx->i--;
  37512. if (ctx->i == 0) {
  37513. err = RNG_FAILURE_E;
  37514. }
  37515. ctx->state = 1;
  37516. break;
  37517. }
  37518. case 10: /* RES */
  37519. err = sp_521_to_mp(ctx->r, rm);
  37520. if (err == MP_OKAY) {
  37521. err = sp_521_to_mp(ctx->s, sm);
  37522. }
  37523. break;
  37524. }
  37525. if (err == MP_OKAY && ctx->state != 10) {
  37526. err = FP_WOULDBLOCK;
  37527. }
  37528. if (err != FP_WOULDBLOCK) {
  37529. XMEMSET(ctx->e, 0, sizeof(sp_digit) * 2U * 17U);
  37530. XMEMSET(ctx->x, 0, sizeof(sp_digit) * 2U * 17U);
  37531. XMEMSET(ctx->k, 0, sizeof(sp_digit) * 2U * 17U);
  37532. XMEMSET(ctx->r, 0, sizeof(sp_digit) * 2U * 17U);
  37533. XMEMSET(ctx->tmp, 0, sizeof(sp_digit) * 3U * 2U * 17U);
  37534. }
  37535. return err;
  37536. }
  37537. #endif /* WOLFSSL_SP_NONBLOCK */
  37538. int sp_ecc_sign_521(const byte* hash, word32 hashLen, WC_RNG* rng,
  37539. const mp_int* priv, mp_int* rm, mp_int* sm, mp_int* km, void* heap)
  37540. {
  37541. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  37542. sp_digit* e = NULL;
  37543. sp_point_521* point = NULL;
  37544. #else
  37545. sp_digit e[7 * 2 * 17];
  37546. sp_point_521 point[1];
  37547. #endif
  37548. sp_digit* x = NULL;
  37549. sp_digit* k = NULL;
  37550. sp_digit* r = NULL;
  37551. sp_digit* tmp = NULL;
  37552. sp_digit* s = NULL;
  37553. sp_int32 c;
  37554. int err = MP_OKAY;
  37555. int i;
  37556. (void)heap;
  37557. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  37558. if (err == MP_OKAY) {
  37559. point = (sp_point_521*)XMALLOC(sizeof(sp_point_521), heap,
  37560. DYNAMIC_TYPE_ECC);
  37561. if (point == NULL)
  37562. err = MEMORY_E;
  37563. }
  37564. if (err == MP_OKAY) {
  37565. e = (sp_digit*)XMALLOC(sizeof(sp_digit) * 7 * 2 * 17, heap,
  37566. DYNAMIC_TYPE_ECC);
  37567. if (e == NULL)
  37568. err = MEMORY_E;
  37569. }
  37570. #endif
  37571. if (err == MP_OKAY) {
  37572. x = e + 2 * 17;
  37573. k = e + 4 * 17;
  37574. r = e + 6 * 17;
  37575. tmp = e + 8 * 17;
  37576. s = e;
  37577. if (hashLen > 66U) {
  37578. hashLen = 66U;
  37579. }
  37580. }
  37581. for (i = SP_ECC_MAX_SIG_GEN; err == MP_OKAY && i > 0; i--) {
  37582. /* New random point. */
  37583. if (km == NULL || mp_iszero(km)) {
  37584. err = sp_521_ecc_gen_k_17(rng, k);
  37585. }
  37586. else {
  37587. sp_521_from_mp(k, 17, km);
  37588. mp_zero(km);
  37589. }
  37590. if (err == MP_OKAY) {
  37591. err = sp_521_ecc_mulmod_base_17(point, k, 1, 1, heap);
  37592. }
  37593. if (err == MP_OKAY) {
  37594. /* r = point->x mod order */
  37595. XMEMCPY(r, point->x, sizeof(sp_digit) * 17U);
  37596. sp_521_norm_17(r);
  37597. c = sp_521_cmp_17(r, p521_order);
  37598. sp_521_cond_sub_17(r, r, p521_order,
  37599. (sp_digit)0 - (sp_digit)(c >= 0));
  37600. sp_521_norm_17(r);
  37601. sp_521_from_mp(x, 17, priv);
  37602. sp_521_from_bin(e, 17, hash, (int)hashLen);
  37603. if (hashLen == 66U) {
  37604. sp_521_rshift_17(e, e, 7);
  37605. }
  37606. err = sp_521_calc_s_17(s, r, k, x, e, tmp);
  37607. }
  37608. /* Check that signature is usable. */
  37609. if ((err == MP_OKAY) && (sp_521_iszero_17(s) == 0)) {
  37610. break;
  37611. }
  37612. #ifdef WOLFSSL_ECDSA_SET_K_ONE_LOOP
  37613. i = 1;
  37614. #endif
  37615. }
  37616. if (i == 0) {
  37617. err = RNG_FAILURE_E;
  37618. }
  37619. if (err == MP_OKAY) {
  37620. err = sp_521_to_mp(r, rm);
  37621. }
  37622. if (err == MP_OKAY) {
  37623. err = sp_521_to_mp(s, sm);
  37624. }
  37625. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  37626. if (e != NULL)
  37627. #endif
  37628. {
  37629. ForceZero(e, sizeof(sp_digit) * 7 * 2 * 17);
  37630. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  37631. XFREE(e, heap, DYNAMIC_TYPE_ECC);
  37632. #endif
  37633. }
  37634. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  37635. if (point != NULL)
  37636. #endif
  37637. {
  37638. ForceZero(point, sizeof(sp_point_521));
  37639. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  37640. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  37641. #endif
  37642. }
  37643. return err;
  37644. }
  37645. #endif /* HAVE_ECC_SIGN */
  37646. #ifndef WOLFSSL_SP_SMALL
  37647. /* Divide the number by 2 mod the modulus. (r = a / 2 % m)
  37648. *
  37649. * r Result of division by 2.
  37650. * a Number to divide.
  37651. * m Modulus.
  37652. */
  37653. static void sp_521_div2_mod_17(sp_digit* r, const sp_digit* a, const sp_digit* m)
  37654. {
  37655. __asm__ __volatile__ (
  37656. "ldr r4, [%[a]]\n\t"
  37657. "ands r8, r4, #1\n\t"
  37658. "beq 1f\n\t"
  37659. "mov r12, #0\n\t"
  37660. "ldr r5, [%[a], #4]\n\t"
  37661. "ldr r6, [%[a], #8]\n\t"
  37662. "ldr r7, [%[a], #12]\n\t"
  37663. "ldr r8, [%[m], #0]\n\t"
  37664. "ldr r9, [%[m], #4]\n\t"
  37665. "ldr r10, [%[m], #8]\n\t"
  37666. "ldr r14, [%[m], #12]\n\t"
  37667. "adds r4, r4, r8\n\t"
  37668. "adcs r5, r5, r9\n\t"
  37669. "adcs r6, r6, r10\n\t"
  37670. "adcs r7, r7, r14\n\t"
  37671. "str r4, [%[r], #0]\n\t"
  37672. "str r5, [%[r], #4]\n\t"
  37673. "str r6, [%[r], #8]\n\t"
  37674. "str r7, [%[r], #12]\n\t"
  37675. "ldr r4, [%[a], #16]\n\t"
  37676. "ldr r5, [%[a], #20]\n\t"
  37677. "ldr r6, [%[a], #24]\n\t"
  37678. "ldr r7, [%[a], #28]\n\t"
  37679. "ldr r8, [%[m], #16]\n\t"
  37680. "ldr r9, [%[m], #20]\n\t"
  37681. "ldr r10, [%[m], #24]\n\t"
  37682. "ldr r14, [%[m], #28]\n\t"
  37683. "adcs r4, r4, r8\n\t"
  37684. "adcs r5, r5, r9\n\t"
  37685. "adcs r6, r6, r10\n\t"
  37686. "adcs r7, r7, r14\n\t"
  37687. "str r4, [%[r], #16]\n\t"
  37688. "str r5, [%[r], #20]\n\t"
  37689. "str r6, [%[r], #24]\n\t"
  37690. "str r7, [%[r], #28]\n\t"
  37691. "ldr r4, [%[a], #32]\n\t"
  37692. "ldr r5, [%[a], #36]\n\t"
  37693. "ldr r6, [%[a], #40]\n\t"
  37694. "ldr r7, [%[a], #44]\n\t"
  37695. "ldr r8, [%[m], #32]\n\t"
  37696. "ldr r9, [%[m], #36]\n\t"
  37697. "ldr r10, [%[m], #40]\n\t"
  37698. "ldr r14, [%[m], #44]\n\t"
  37699. "adcs r4, r4, r8\n\t"
  37700. "adcs r5, r5, r9\n\t"
  37701. "adcs r6, r6, r10\n\t"
  37702. "adcs r7, r7, r14\n\t"
  37703. "str r4, [%[r], #32]\n\t"
  37704. "str r5, [%[r], #36]\n\t"
  37705. "str r6, [%[r], #40]\n\t"
  37706. "str r7, [%[r], #44]\n\t"
  37707. "ldr r4, [%[a], #48]\n\t"
  37708. "ldr r5, [%[a], #52]\n\t"
  37709. "ldr r6, [%[a], #56]\n\t"
  37710. "ldr r7, [%[a], #60]\n\t"
  37711. "ldr r8, [%[m], #48]\n\t"
  37712. "ldr r9, [%[m], #52]\n\t"
  37713. "ldr r10, [%[m], #56]\n\t"
  37714. "ldr r14, [%[m], #60]\n\t"
  37715. "adcs r4, r4, r8\n\t"
  37716. "adcs r5, r5, r9\n\t"
  37717. "adcs r6, r6, r10\n\t"
  37718. "adcs r7, r7, r14\n\t"
  37719. "str r4, [%[r], #48]\n\t"
  37720. "str r5, [%[r], #52]\n\t"
  37721. "str r6, [%[r], #56]\n\t"
  37722. "str r7, [%[r], #60]\n\t"
  37723. "ldr r4, [%[a], #64]\n\t"
  37724. "ldr r8, [%[m], #64]\n\t"
  37725. "adcs r4, r4, r8\n\t"
  37726. "str r4, [%[r], #64]\n\t"
  37727. "adc r8, r12, r12\n\t"
  37728. "b 2f\n\t"
  37729. "\n1:\n\t"
  37730. "ldr r5, [%[a], #2]\n\t"
  37731. "str r4, [%[r], #0]\n\t"
  37732. "str r5, [%[r], #2]\n\t"
  37733. "ldr r4, [%[a], #4]\n\t"
  37734. "ldr r5, [%[a], #6]\n\t"
  37735. "str r4, [%[r], #4]\n\t"
  37736. "str r5, [%[r], #6]\n\t"
  37737. "ldr r4, [%[a], #8]\n\t"
  37738. "ldr r5, [%[a], #10]\n\t"
  37739. "str r4, [%[r], #8]\n\t"
  37740. "str r5, [%[r], #10]\n\t"
  37741. "ldr r4, [%[a], #12]\n\t"
  37742. "ldr r5, [%[a], #14]\n\t"
  37743. "str r4, [%[r], #12]\n\t"
  37744. "str r5, [%[r], #14]\n\t"
  37745. "ldr r4, [%[a], #16]\n\t"
  37746. "ldr r5, [%[a], #18]\n\t"
  37747. "str r4, [%[r], #16]\n\t"
  37748. "str r5, [%[r], #18]\n\t"
  37749. "ldr r4, [%[a], #20]\n\t"
  37750. "ldr r5, [%[a], #22]\n\t"
  37751. "str r4, [%[r], #20]\n\t"
  37752. "str r5, [%[r], #22]\n\t"
  37753. "ldr r4, [%[a], #24]\n\t"
  37754. "ldr r5, [%[a], #26]\n\t"
  37755. "str r4, [%[r], #24]\n\t"
  37756. "str r5, [%[r], #26]\n\t"
  37757. "ldr r4, [%[a], #28]\n\t"
  37758. "ldr r5, [%[a], #30]\n\t"
  37759. "str r4, [%[r], #28]\n\t"
  37760. "str r5, [%[r], #30]\n\t"
  37761. "\n2:\n\t"
  37762. "ldr r3, [%[r]]\n\t"
  37763. "ldr r4, [%[r], #4]\n\t"
  37764. "lsr r3, r3, #1\n\t"
  37765. "orr r3, r3, r4, lsl #31\n\t"
  37766. "lsr r4, r4, #1\n\t"
  37767. "ldr r5, [%[a], #8]\n\t"
  37768. "str r3, [%[r], #0]\n\t"
  37769. "orr r4, r4, r5, lsl #31\n\t"
  37770. "lsr r5, r5, #1\n\t"
  37771. "ldr r3, [%[a], #12]\n\t"
  37772. "str r4, [%[r], #4]\n\t"
  37773. "orr r5, r5, r3, lsl #31\n\t"
  37774. "lsr r3, r3, #1\n\t"
  37775. "ldr r4, [%[a], #16]\n\t"
  37776. "str r5, [%[r], #8]\n\t"
  37777. "orr r3, r3, r4, lsl #31\n\t"
  37778. "lsr r4, r4, #1\n\t"
  37779. "ldr r5, [%[a], #20]\n\t"
  37780. "str r3, [%[r], #12]\n\t"
  37781. "orr r4, r4, r5, lsl #31\n\t"
  37782. "lsr r5, r5, #1\n\t"
  37783. "ldr r3, [%[a], #24]\n\t"
  37784. "str r4, [%[r], #16]\n\t"
  37785. "orr r5, r5, r3, lsl #31\n\t"
  37786. "lsr r3, r3, #1\n\t"
  37787. "ldr r4, [%[a], #28]\n\t"
  37788. "str r5, [%[r], #20]\n\t"
  37789. "orr r3, r3, r4, lsl #31\n\t"
  37790. "lsr r4, r4, #1\n\t"
  37791. "ldr r5, [%[a], #32]\n\t"
  37792. "str r3, [%[r], #24]\n\t"
  37793. "orr r4, r4, r5, lsl #31\n\t"
  37794. "lsr r5, r5, #1\n\t"
  37795. "ldr r3, [%[a], #36]\n\t"
  37796. "str r4, [%[r], #28]\n\t"
  37797. "orr r5, r5, r3, lsl #31\n\t"
  37798. "lsr r3, r3, #1\n\t"
  37799. "ldr r4, [%[a], #40]\n\t"
  37800. "str r5, [%[r], #32]\n\t"
  37801. "orr r3, r3, r4, lsl #31\n\t"
  37802. "lsr r4, r4, #1\n\t"
  37803. "ldr r5, [%[a], #44]\n\t"
  37804. "str r3, [%[r], #36]\n\t"
  37805. "orr r4, r4, r5, lsl #31\n\t"
  37806. "lsr r5, r5, #1\n\t"
  37807. "ldr r3, [%[a], #48]\n\t"
  37808. "str r4, [%[r], #40]\n\t"
  37809. "orr r5, r5, r3, lsl #31\n\t"
  37810. "lsr r3, r3, #1\n\t"
  37811. "ldr r4, [%[a], #52]\n\t"
  37812. "str r5, [%[r], #44]\n\t"
  37813. "orr r3, r3, r4, lsl #31\n\t"
  37814. "lsr r4, r4, #1\n\t"
  37815. "ldr r5, [%[a], #56]\n\t"
  37816. "str r3, [%[r], #48]\n\t"
  37817. "orr r4, r4, r5, lsl #31\n\t"
  37818. "lsr r5, r5, #1\n\t"
  37819. "ldr r3, [%[a], #60]\n\t"
  37820. "str r4, [%[r], #52]\n\t"
  37821. "orr r5, r5, r3, lsl #31\n\t"
  37822. "lsr r3, r3, #1\n\t"
  37823. "ldr r4, [%[a], #64]\n\t"
  37824. "str r5, [%[r], #56]\n\t"
  37825. "orr r3, r3, r4, lsl #31\n\t"
  37826. "lsr r4, r4, #1\n\t"
  37827. "orr r4, r4, r8, lsl #31\n\t"
  37828. "str r3, [%[r], #60]\n\t"
  37829. "str r4, [%[r], #64]\n\t"
  37830. :
  37831. : [r] "r" (r), [a] "r" (a), [m] "r" (m)
  37832. : "memory", "r3", "r4", "r5", "r6", "r7", "r8", "r9", "r10", "r14"
  37833. );
  37834. }
  37835. static int sp_521_num_bits_17(sp_digit* a)
  37836. {
  37837. int r = 0;
  37838. __asm__ __volatile__ (
  37839. "ldr r2, [%[a], #64]\n\t"
  37840. "cmp r2, #0\n\t"
  37841. "beq 16f\n\t"
  37842. "mov r3, #544\n\t"
  37843. "clz %[r], r2\n\t"
  37844. "sub %[r], r3, %[r]\n\t"
  37845. "b 18f\n\t"
  37846. "\n16:\n\t"
  37847. "ldr r2, [%[a], #60]\n\t"
  37848. "cmp r2, #0\n\t"
  37849. "beq 15f\n\t"
  37850. "mov r3, #512\n\t"
  37851. "clz %[r], r2\n\t"
  37852. "sub %[r], r3, %[r]\n\t"
  37853. "b 18f\n\t"
  37854. "\n15:\n\t"
  37855. "ldr r2, [%[a], #56]\n\t"
  37856. "cmp r2, #0\n\t"
  37857. "beq 14f\n\t"
  37858. "mov r3, #480\n\t"
  37859. "clz %[r], r2\n\t"
  37860. "sub %[r], r3, %[r]\n\t"
  37861. "b 18f\n\t"
  37862. "\n14:\n\t"
  37863. "ldr r2, [%[a], #52]\n\t"
  37864. "cmp r2, #0\n\t"
  37865. "beq 13f\n\t"
  37866. "mov r3, #448\n\t"
  37867. "clz %[r], r2\n\t"
  37868. "sub %[r], r3, %[r]\n\t"
  37869. "b 18f\n\t"
  37870. "\n13:\n\t"
  37871. "ldr r2, [%[a], #48]\n\t"
  37872. "cmp r2, #0\n\t"
  37873. "beq 12f\n\t"
  37874. "mov r3, #416\n\t"
  37875. "clz %[r], r2\n\t"
  37876. "sub %[r], r3, %[r]\n\t"
  37877. "b 18f\n\t"
  37878. "\n12:\n\t"
  37879. "ldr r2, [%[a], #44]\n\t"
  37880. "cmp r2, #0\n\t"
  37881. "beq 11f\n\t"
  37882. "mov r3, #384\n\t"
  37883. "clz %[r], r2\n\t"
  37884. "sub %[r], r3, %[r]\n\t"
  37885. "b 18f\n\t"
  37886. "\n11:\n\t"
  37887. "ldr r2, [%[a], #40]\n\t"
  37888. "cmp r2, #0\n\t"
  37889. "beq 10f\n\t"
  37890. "mov r3, #352\n\t"
  37891. "clz %[r], r2\n\t"
  37892. "sub %[r], r3, %[r]\n\t"
  37893. "b 18f\n\t"
  37894. "\n10:\n\t"
  37895. "ldr r2, [%[a], #36]\n\t"
  37896. "cmp r2, #0\n\t"
  37897. "beq 9f\n\t"
  37898. "mov r3, #320\n\t"
  37899. "clz %[r], r2\n\t"
  37900. "sub %[r], r3, %[r]\n\t"
  37901. "b 18f\n\t"
  37902. "\n9:\n\t"
  37903. "ldr r2, [%[a], #32]\n\t"
  37904. "cmp r2, #0\n\t"
  37905. "beq 8f\n\t"
  37906. "mov r3, #288\n\t"
  37907. "clz %[r], r2\n\t"
  37908. "sub %[r], r3, %[r]\n\t"
  37909. "b 18f\n\t"
  37910. "\n8:\n\t"
  37911. "ldr r2, [%[a], #28]\n\t"
  37912. "cmp r2, #0\n\t"
  37913. "beq 7f\n\t"
  37914. "mov r3, #256\n\t"
  37915. "clz %[r], r2\n\t"
  37916. "sub %[r], r3, %[r]\n\t"
  37917. "b 18f\n\t"
  37918. "\n7:\n\t"
  37919. "ldr r2, [%[a], #24]\n\t"
  37920. "cmp r2, #0\n\t"
  37921. "beq 6f\n\t"
  37922. "mov r3, #224\n\t"
  37923. "clz %[r], r2\n\t"
  37924. "sub %[r], r3, %[r]\n\t"
  37925. "b 18f\n\t"
  37926. "\n6:\n\t"
  37927. "ldr r2, [%[a], #20]\n\t"
  37928. "cmp r2, #0\n\t"
  37929. "beq 5f\n\t"
  37930. "mov r3, #192\n\t"
  37931. "clz %[r], r2\n\t"
  37932. "sub %[r], r3, %[r]\n\t"
  37933. "b 18f\n\t"
  37934. "\n5:\n\t"
  37935. "ldr r2, [%[a], #16]\n\t"
  37936. "cmp r2, #0\n\t"
  37937. "beq 4f\n\t"
  37938. "mov r3, #160\n\t"
  37939. "clz %[r], r2\n\t"
  37940. "sub %[r], r3, %[r]\n\t"
  37941. "b 18f\n\t"
  37942. "\n4:\n\t"
  37943. "ldr r2, [%[a], #12]\n\t"
  37944. "cmp r2, #0\n\t"
  37945. "beq 3f\n\t"
  37946. "mov r3, #128\n\t"
  37947. "clz %[r], r2\n\t"
  37948. "sub %[r], r3, %[r]\n\t"
  37949. "b 18f\n\t"
  37950. "\n3:\n\t"
  37951. "ldr r2, [%[a], #8]\n\t"
  37952. "cmp r2, #0\n\t"
  37953. "beq 2f\n\t"
  37954. "mov r3, #96\n\t"
  37955. "clz %[r], r2\n\t"
  37956. "sub %[r], r3, %[r]\n\t"
  37957. "b 18f\n\t"
  37958. "\n2:\n\t"
  37959. "ldr r2, [%[a], #4]\n\t"
  37960. "cmp r2, #0\n\t"
  37961. "beq 1f\n\t"
  37962. "mov r3, #64\n\t"
  37963. "clz %[r], r2\n\t"
  37964. "sub %[r], r3, %[r]\n\t"
  37965. "b 18f\n\t"
  37966. "\n1:\n\t"
  37967. "ldr r2, [%[a], #0]\n\t"
  37968. "mov r3, #32\n\t"
  37969. "clz %[r], r2\n\t"
  37970. "sub %[r], r3, %[r]\n\t"
  37971. "\n18:\n\t"
  37972. : [r] "+r" (r)
  37973. : [a] "r" (a)
  37974. : "r2", "r3"
  37975. );
  37976. return r;
  37977. }
  37978. /* Non-constant time modular inversion.
  37979. *
  37980. * @param [out] r Resulting number.
  37981. * @param [in] a Number to invert.
  37982. * @param [in] m Modulus.
  37983. * @return MP_OKAY on success.
  37984. */
  37985. static int sp_521_mod_inv_17(sp_digit* r, const sp_digit* a, const sp_digit* m)
  37986. {
  37987. sp_digit u[17];
  37988. sp_digit v[17];
  37989. sp_digit b[17];
  37990. sp_digit d[17];
  37991. int ut, vt;
  37992. sp_digit o;
  37993. XMEMCPY(u, m, sizeof(u));
  37994. XMEMCPY(v, a, sizeof(v));
  37995. ut = sp_521_num_bits_17(u);
  37996. vt = sp_521_num_bits_17(v);
  37997. XMEMSET(b, 0, sizeof(b));
  37998. if ((v[0] & 1) == 0) {
  37999. sp_521_rshift1_17(v, v);
  38000. XMEMCPY(d, m, sizeof(u));
  38001. d[0] += 1;
  38002. sp_521_rshift1_17(d, d);
  38003. vt--;
  38004. while ((v[0] & 1) == 0) {
  38005. sp_521_rshift1_17(v, v);
  38006. sp_521_div2_mod_17(d, d, m);
  38007. vt--;
  38008. }
  38009. }
  38010. else {
  38011. XMEMSET(d+1, 0, sizeof(d)-sizeof(sp_digit));
  38012. d[0] = 1;
  38013. }
  38014. while (ut > 1 && vt > 1) {
  38015. if (ut > vt || (ut == vt && sp_521_cmp_17(u, v) >= 0)) {
  38016. sp_521_sub_17(u, u, v);
  38017. o = sp_521_sub_17(b, b, d);
  38018. if (o != 0)
  38019. sp_521_add_17(b, b, m);
  38020. ut = sp_521_num_bits_17(u);
  38021. do {
  38022. sp_521_rshift1_17(u, u);
  38023. sp_521_div2_mod_17(b, b, m);
  38024. ut--;
  38025. }
  38026. while (ut > 0 && (u[0] & 1) == 0);
  38027. }
  38028. else {
  38029. sp_521_sub_17(v, v, u);
  38030. o = sp_521_sub_17(d, d, b);
  38031. if (o != 0)
  38032. sp_521_add_17(d, d, m);
  38033. vt = sp_521_num_bits_17(v);
  38034. do {
  38035. sp_521_rshift1_17(v, v);
  38036. sp_521_div2_mod_17(d, d, m);
  38037. vt--;
  38038. }
  38039. while (vt > 0 && (v[0] & 1) == 0);
  38040. }
  38041. }
  38042. if (ut == 1)
  38043. XMEMCPY(r, b, sizeof(b));
  38044. else
  38045. XMEMCPY(r, d, sizeof(d));
  38046. return MP_OKAY;
  38047. }
  38048. #endif /* WOLFSSL_SP_SMALL */
  38049. /* Add point p1 into point p2. Handles p1 == p2 and result at infinity.
  38050. *
  38051. * p1 First point to add and holds result.
  38052. * p2 Second point to add.
  38053. * tmp Temporary storage for intermediate numbers.
  38054. */
  38055. static void sp_521_add_points_17(sp_point_521* p1, const sp_point_521* p2,
  38056. sp_digit* tmp)
  38057. {
  38058. sp_521_proj_point_add_17(p1, p1, p2, tmp);
  38059. if (sp_521_iszero_17(p1->z)) {
  38060. if (sp_521_iszero_17(p1->x) && sp_521_iszero_17(p1->y)) {
  38061. sp_521_proj_point_dbl_17(p1, p2, tmp);
  38062. }
  38063. else {
  38064. /* Y ordinate is not used from here - don't set. */
  38065. p1->x[0] = 0;
  38066. p1->x[1] = 0;
  38067. p1->x[2] = 0;
  38068. p1->x[3] = 0;
  38069. p1->x[4] = 0;
  38070. p1->x[5] = 0;
  38071. p1->x[6] = 0;
  38072. p1->x[7] = 0;
  38073. p1->x[8] = 0;
  38074. p1->x[9] = 0;
  38075. p1->x[10] = 0;
  38076. p1->x[11] = 0;
  38077. p1->x[12] = 0;
  38078. p1->x[13] = 0;
  38079. p1->x[14] = 0;
  38080. p1->x[15] = 0;
  38081. p1->x[16] = 0;
  38082. XMEMCPY(p1->z, p521_norm_mod, sizeof(p521_norm_mod));
  38083. }
  38084. }
  38085. }
  38086. /* Calculate the verification point: [e/s]G + [r/s]Q
  38087. *
  38088. * p1 Calculated point.
  38089. * p2 Public point and temporary.
  38090. * s Second part of signature as a number.
  38091. * u1 Temporary number.
  38092. * u2 Temproray number.
  38093. * heap Heap to use for allocation.
  38094. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  38095. */
  38096. static int sp_521_calc_vfy_point_17(sp_point_521* p1, sp_point_521* p2,
  38097. sp_digit* s, sp_digit* u1, sp_digit* u2, sp_digit* tmp, void* heap)
  38098. {
  38099. int err;
  38100. #ifndef WOLFSSL_SP_SMALL
  38101. err = sp_521_mod_inv_17(s, s, p521_order);
  38102. if (err == MP_OKAY)
  38103. #endif /* !WOLFSSL_SP_SMALL */
  38104. {
  38105. sp_521_mul_17(s, s, p521_norm_order);
  38106. err = sp_521_mod_17(s, s, p521_order);
  38107. }
  38108. if (err == MP_OKAY) {
  38109. sp_521_norm_17(s);
  38110. #ifdef WOLFSSL_SP_SMALL
  38111. {
  38112. sp_521_mont_inv_order_17(s, s, tmp);
  38113. sp_521_mont_mul_order_17(u1, u1, s);
  38114. sp_521_mont_mul_order_17(u2, u2, s);
  38115. }
  38116. #else
  38117. {
  38118. sp_521_mont_mul_order_17(u1, u1, s);
  38119. sp_521_mont_mul_order_17(u2, u2, s);
  38120. }
  38121. #endif /* WOLFSSL_SP_SMALL */
  38122. {
  38123. err = sp_521_ecc_mulmod_base_17(p1, u1, 0, 0, heap);
  38124. }
  38125. }
  38126. if ((err == MP_OKAY) && sp_521_iszero_17(p1->z)) {
  38127. p1->infinity = 1;
  38128. }
  38129. if (err == MP_OKAY) {
  38130. err = sp_521_ecc_mulmod_17(p2, p2, u2, 0, 0, heap);
  38131. }
  38132. if ((err == MP_OKAY) && sp_521_iszero_17(p2->z)) {
  38133. p2->infinity = 1;
  38134. }
  38135. if (err == MP_OKAY) {
  38136. sp_521_add_points_17(p1, p2, tmp);
  38137. }
  38138. return err;
  38139. }
  38140. #ifdef HAVE_ECC_VERIFY
  /* Verify the signature values with the hash and public key.
   *   e = Truncate(hash, 521)
   *   u1 = e/s mod order
   *   u2 = r/s mod order
   *   r == (u1.G + u2.Q)->x mod order
   * Optimization: Leave point in projective form.
   *   (x, y, 1) == (x' / z'*z', y' / z'*z'*z', z' / z')
   *   (r + n*order).z'.z' mod prime == (u1.G + u2.Q)->x'
   * The hash is truncated to the first 521 bits.
   *
   * hash     Hash that was signed.
   * hashLen  Length of the hash data.
   * pX       X ordinate of the public key point.
   * pY       Y ordinate of the public key point.
   * pZ       Z ordinate of the public key point.
   * rm       First part of the signature (r) as an mp_int.
   * sm       Second part of the signature (s) as an mp_int.
   * res      Set to 1 when the signature verifies and 0 when it does not.
   * heap     Heap to use for allocation.
   * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
   */
  38160. #ifdef WOLFSSL_SP_NONBLOCK
  38161. typedef struct sp_ecc_verify_521_ctx {
  38162. int state;
  38163. union {
  38164. sp_521_ecc_mulmod_17_ctx mulmod_ctx;
  38165. sp_521_mont_inv_order_17_ctx mont_inv_order_ctx;
  38166. sp_521_proj_point_dbl_17_ctx dbl_ctx;
  38167. sp_521_proj_point_add_17_ctx add_ctx;
  38168. };
  38169. sp_digit u1[2*17];
  38170. sp_digit u2[2*17];
  38171. sp_digit s[2*17];
  38172. sp_digit tmp[2*17 * 6];
  38173. sp_point_521 p1;
  38174. sp_point_521 p2;
  38175. } sp_ecc_verify_521_ctx;
  38176. int sp_ecc_verify_521_nb(sp_ecc_ctx_t* sp_ctx, const byte* hash,
  38177. word32 hashLen, const mp_int* pX, const mp_int* pY, const mp_int* pZ,
  38178. const mp_int* rm, const mp_int* sm, int* res, void* heap)
  38179. {
  38180. int err = FP_WOULDBLOCK;
  38181. sp_ecc_verify_521_ctx* ctx = (sp_ecc_verify_521_ctx*)sp_ctx->data;
  38182. typedef char ctx_size_test[sizeof(sp_ecc_verify_521_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  38183. (void)sizeof(ctx_size_test);
  38184. switch (ctx->state) {
  38185. case 0: /* INIT */
  38186. if (hashLen > 66U) {
  38187. hashLen = 66U;
  38188. }
  38189. sp_521_from_bin(ctx->u1, 17, hash, (int)hashLen);
  38190. sp_521_from_mp(ctx->u2, 17, rm);
  38191. sp_521_from_mp(ctx->s, 17, sm);
  38192. sp_521_from_mp(ctx->p2.x, 17, pX);
  38193. sp_521_from_mp(ctx->p2.y, 17, pY);
  38194. sp_521_from_mp(ctx->p2.z, 17, pZ);
  38195. if (hashLen == 66U) {
  38196. sp_521_rshift_17(ctx->u1, ctx->u1, 7);
  38197. }
  38198. ctx->state = 1;
  38199. break;
  38200. case 1: /* NORMS0 */
  38201. sp_521_mul_17(ctx->s, ctx->s, p521_norm_order);
  38202. err = sp_521_mod_17(ctx->s, ctx->s, p521_order);
  38203. if (err == MP_OKAY)
  38204. ctx->state = 2;
  38205. break;
  38206. case 2: /* NORMS1 */
  38207. sp_521_norm_17(ctx->s);
  38208. XMEMSET(&ctx->mont_inv_order_ctx, 0, sizeof(ctx->mont_inv_order_ctx));
  38209. ctx->state = 3;
  38210. break;
  38211. case 3: /* NORMS2 */
  38212. err = sp_521_mont_inv_order_17_nb((sp_ecc_ctx_t*)&ctx->mont_inv_order_ctx, ctx->s, ctx->s, ctx->tmp);
  38213. if (err == MP_OKAY) {
  38214. ctx->state = 4;
  38215. }
  38216. break;
  38217. case 4: /* NORMS3 */
  38218. sp_521_mont_mul_order_17(ctx->u1, ctx->u1, ctx->s);
  38219. ctx->state = 5;
  38220. break;
  38221. case 5: /* NORMS4 */
  38222. sp_521_mont_mul_order_17(ctx->u2, ctx->u2, ctx->s);
  38223. XMEMSET(&ctx->mulmod_ctx, 0, sizeof(ctx->mulmod_ctx));
  38224. ctx->state = 6;
  38225. break;
  38226. case 6: /* MULBASE */
  38227. err = sp_521_ecc_mulmod_17_nb((sp_ecc_ctx_t*)&ctx->mulmod_ctx, &ctx->p1, &p521_base, ctx->u1, 0, 0, heap);
  38228. if (err == MP_OKAY) {
  38229. if (sp_521_iszero_17(ctx->p1.z)) {
  38230. ctx->p1.infinity = 1;
  38231. }
  38232. XMEMSET(&ctx->mulmod_ctx, 0, sizeof(ctx->mulmod_ctx));
  38233. ctx->state = 7;
  38234. }
  38235. break;
  38236. case 7: /* MULMOD */
  38237. err = sp_521_ecc_mulmod_17_nb((sp_ecc_ctx_t*)&ctx->mulmod_ctx, &ctx->p2, &ctx->p2, ctx->u2, 0, 0, heap);
  38238. if (err == MP_OKAY) {
  38239. if (sp_521_iszero_17(ctx->p2.z)) {
  38240. ctx->p2.infinity = 1;
  38241. }
  38242. XMEMSET(&ctx->add_ctx, 0, sizeof(ctx->add_ctx));
  38243. ctx->state = 8;
  38244. }
  38245. break;
  38246. case 8: /* ADD */
  38247. err = sp_521_proj_point_add_17_nb((sp_ecc_ctx_t*)&ctx->add_ctx, &ctx->p1, &ctx->p1, &ctx->p2, ctx->tmp);
  38248. if (err == MP_OKAY)
  38249. ctx->state = 9;
  38250. break;
  38251. case 9: /* MONT */
  38252. /* (r + n*order).z'.z' mod prime == (u1.G + u2.Q)->x' */
  38253. /* Reload r and convert to Montgomery form. */
  38254. sp_521_from_mp(ctx->u2, 17, rm);
  38255. err = sp_521_mod_mul_norm_17(ctx->u2, ctx->u2, p521_mod);
  38256. if (err == MP_OKAY)
  38257. ctx->state = 10;
  38258. break;
  38259. case 10: /* SQR */
  38260. /* u1 = r.z'.z' mod prime */
  38261. sp_521_mont_sqr_17(ctx->p1.z, ctx->p1.z, p521_mod, p521_mp_mod);
  38262. ctx->state = 11;
  38263. break;
  38264. case 11: /* MUL */
  38265. sp_521_mont_mul_17(ctx->u1, ctx->u2, ctx->p1.z, p521_mod, p521_mp_mod);
  38266. ctx->state = 12;
  38267. break;
  38268. case 12: /* RES */
  38269. {
  38270. sp_int32 c = 0;
  38271. err = MP_OKAY; /* math okay, now check result */
  38272. *res = (int)(sp_521_cmp_17(ctx->p1.x, ctx->u1) == 0);
  38273. if (*res == 0) {
  38274. sp_digit carry;
  38275. /* Reload r and add order. */
  38276. sp_521_from_mp(ctx->u2, 17, rm);
  38277. carry = sp_521_add_17(ctx->u2, ctx->u2, p521_order);
  38278. /* Carry means result is greater than mod and is not valid. */
  38279. if (carry == 0) {
  38280. sp_521_norm_17(ctx->u2);
  38281. /* Compare with mod and if greater or equal then not valid. */
  38282. c = sp_521_cmp_17(ctx->u2, p521_mod);
  38283. }
  38284. }
  38285. if ((*res == 0) && (c < 0)) {
  38286. /* Convert to Montogomery form */
  38287. err = sp_521_mod_mul_norm_17(ctx->u2, ctx->u2, p521_mod);
  38288. if (err == MP_OKAY) {
  38289. /* u1 = (r + 1*order).z'.z' mod prime */
  38290. sp_521_mont_mul_17(ctx->u1, ctx->u2, ctx->p1.z, p521_mod,
  38291. p521_mp_mod);
  38292. *res = (int)(sp_521_cmp_17(ctx->p1.x, ctx->u1) == 0);
  38293. }
  38294. }
  38295. break;
  38296. }
  38297. } /* switch */
  38298. if (err == MP_OKAY && ctx->state != 12) {
  38299. err = FP_WOULDBLOCK;
  38300. }
  38301. return err;
  38302. }
  38303. #endif /* WOLFSSL_SP_NONBLOCK */
  38304. int sp_ecc_verify_521(const byte* hash, word32 hashLen, const mp_int* pX,
  38305. const mp_int* pY, const mp_int* pZ, const mp_int* rm, const mp_int* sm,
  38306. int* res, void* heap)
  38307. {
  38308. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38309. sp_digit* u1 = NULL;
  38310. sp_point_521* p1 = NULL;
  38311. #else
  38312. sp_digit u1[18 * 17];
  38313. sp_point_521 p1[2];
  38314. #endif
  38315. sp_digit* u2 = NULL;
  38316. sp_digit* s = NULL;
  38317. sp_digit* tmp = NULL;
  38318. sp_point_521* p2 = NULL;
  38319. sp_digit carry;
  38320. sp_int32 c = 0;
  38321. int err = MP_OKAY;
  38322. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38323. if (err == MP_OKAY) {
  38324. p1 = (sp_point_521*)XMALLOC(sizeof(sp_point_521) * 2, heap,
  38325. DYNAMIC_TYPE_ECC);
  38326. if (p1 == NULL)
  38327. err = MEMORY_E;
  38328. }
  38329. if (err == MP_OKAY) {
  38330. u1 = (sp_digit*)XMALLOC(sizeof(sp_digit) * 18 * 17, heap,
  38331. DYNAMIC_TYPE_ECC);
  38332. if (u1 == NULL)
  38333. err = MEMORY_E;
  38334. }
  38335. #endif
  38336. if (err == MP_OKAY) {
  38337. u2 = u1 + 2 * 17;
  38338. s = u1 + 4 * 17;
  38339. tmp = u1 + 6 * 17;
  38340. p2 = p1 + 1;
  38341. if (hashLen > 66U) {
  38342. hashLen = 66U;
  38343. }
  38344. sp_521_from_bin(u1, 17, hash, (int)hashLen);
  38345. sp_521_from_mp(u2, 17, rm);
  38346. sp_521_from_mp(s, 17, sm);
  38347. sp_521_from_mp(p2->x, 17, pX);
  38348. sp_521_from_mp(p2->y, 17, pY);
  38349. sp_521_from_mp(p2->z, 17, pZ);
  38350. if (hashLen == 66U) {
  38351. sp_521_rshift_17(u1, u1, 7);
  38352. }
  38353. err = sp_521_calc_vfy_point_17(p1, p2, s, u1, u2, tmp, heap);
  38354. }
  38355. if (err == MP_OKAY) {
  38356. /* (r + n*order).z'.z' mod prime == (u1.G + u2.Q)->x' */
  38357. /* Reload r and convert to Montgomery form. */
  38358. sp_521_from_mp(u2, 17, rm);
  38359. err = sp_521_mod_mul_norm_17(u2, u2, p521_mod);
  38360. }
  38361. if (err == MP_OKAY) {
  38362. /* u1 = r.z'.z' mod prime */
  38363. sp_521_mont_sqr_17(p1->z, p1->z, p521_mod, p521_mp_mod);
  38364. sp_521_mont_mul_17(u1, u2, p1->z, p521_mod, p521_mp_mod);
  38365. *res = (int)(sp_521_cmp_17(p1->x, u1) == 0);
  38366. if (*res == 0) {
  38367. /* Reload r and add order. */
  38368. sp_521_from_mp(u2, 17, rm);
  38369. carry = sp_521_add_17(u2, u2, p521_order);
  38370. /* Carry means result is greater than mod and is not valid. */
  38371. if (carry == 0) {
  38372. sp_521_norm_17(u2);
  38373. /* Compare with mod and if greater or equal then not valid. */
  38374. c = sp_521_cmp_17(u2, p521_mod);
  38375. }
  38376. }
  38377. if ((*res == 0) && (c < 0)) {
  38378. /* Convert to Montogomery form */
  38379. err = sp_521_mod_mul_norm_17(u2, u2, p521_mod);
  38380. if (err == MP_OKAY) {
  38381. /* u1 = (r + 1*order).z'.z' mod prime */
  38382. {
  38383. sp_521_mont_mul_17(u1, u2, p1->z, p521_mod, p521_mp_mod);
  38384. }
  38385. *res = (sp_521_cmp_17(p1->x, u1) == 0);
  38386. }
  38387. }
  38388. }
  38389. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38390. if (u1 != NULL)
  38391. XFREE(u1, heap, DYNAMIC_TYPE_ECC);
  38392. if (p1 != NULL)
  38393. XFREE(p1, heap, DYNAMIC_TYPE_ECC);
  38394. #endif
  38395. return err;
  38396. }
  38397. #endif /* HAVE_ECC_VERIFY */
  38398. #ifdef HAVE_ECC_CHECK_KEY
  38399. /* Check that the x and y oridinates are a valid point on the curve.
  38400. *
  38401. * point EC point.
  38402. * heap Heap to use if dynamically allocating.
  38403. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  38404. * not on the curve and MP_OKAY otherwise.
  38405. */
  38406. static int sp_521_ecc_is_point_17(const sp_point_521* point,
  38407. void* heap)
  38408. {
  38409. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38410. sp_digit* t1 = NULL;
  38411. #else
  38412. sp_digit t1[17 * 4];
  38413. #endif
  38414. sp_digit* t2 = NULL;
  38415. int err = MP_OKAY;
  38416. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38417. t1 = (sp_digit*)XMALLOC(sizeof(sp_digit) * 17 * 4, heap, DYNAMIC_TYPE_ECC);
  38418. if (t1 == NULL)
  38419. err = MEMORY_E;
  38420. #endif
  38421. (void)heap;
  38422. if (err == MP_OKAY) {
  38423. t2 = t1 + 2 * 17;
  38424. sp_521_sqr_17(t1, point->y);
  38425. (void)sp_521_mod_17(t1, t1, p521_mod);
  38426. sp_521_sqr_17(t2, point->x);
  38427. (void)sp_521_mod_17(t2, t2, p521_mod);
  38428. sp_521_mul_17(t2, t2, point->x);
  38429. (void)sp_521_mod_17(t2, t2, p521_mod);
  38430. (void)sp_521_sub_17(t2, p521_mod, t2);
  38431. sp_521_mont_add_17(t1, t1, t2, p521_mod);
  38432. sp_521_mont_add_17(t1, t1, point->x, p521_mod);
  38433. sp_521_mont_add_17(t1, t1, point->x, p521_mod);
  38434. sp_521_mont_add_17(t1, t1, point->x, p521_mod);
  38435. if (sp_521_cmp_17(t1, p521_b) != 0) {
  38436. err = MP_VAL;
  38437. }
  38438. }
  38439. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38440. if (t1 != NULL)
  38441. XFREE(t1, heap, DYNAMIC_TYPE_ECC);
  38442. #endif
  38443. return err;
  38444. }
  38445. /* Check that the x and y oridinates are a valid point on the curve.
  38446. *
  38447. * pX X ordinate of EC point.
  38448. * pY Y ordinate of EC point.
  38449. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  38450. * not on the curve and MP_OKAY otherwise.
  38451. */
  38452. int sp_ecc_is_point_521(const mp_int* pX, const mp_int* pY)
  38453. {
  38454. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38455. sp_point_521* pub = NULL;
  38456. #else
  38457. sp_point_521 pub[1];
  38458. #endif
  38459. const byte one[1] = { 1 };
  38460. int err = MP_OKAY;
  38461. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38462. pub = (sp_point_521*)XMALLOC(sizeof(sp_point_521), NULL,
  38463. DYNAMIC_TYPE_ECC);
  38464. if (pub == NULL)
  38465. err = MEMORY_E;
  38466. #endif
  38467. if (err == MP_OKAY) {
  38468. sp_521_from_mp(pub->x, 17, pX);
  38469. sp_521_from_mp(pub->y, 17, pY);
  38470. sp_521_from_bin(pub->z, 17, one, (int)sizeof(one));
  38471. err = sp_521_ecc_is_point_17(pub, NULL);
  38472. }
  38473. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38474. if (pub != NULL)
  38475. XFREE(pub, NULL, DYNAMIC_TYPE_ECC);
  38476. #endif
  38477. return err;
  38478. }
  38479. /* Check that the private scalar generates the EC point (px, py), the point is
  38480. * on the curve and the point has the correct order.
  38481. *
  38482. * pX X ordinate of EC point.
  38483. * pY Y ordinate of EC point.
  38484. * privm Private scalar that generates EC point.
  38485. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  38486. * not on the curve, ECC_INF_E if the point does not have the correct order,
  38487. * ECC_PRIV_KEY_E when the private scalar doesn't generate the EC point and
  38488. * MP_OKAY otherwise.
  38489. */
  38490. int sp_ecc_check_key_521(const mp_int* pX, const mp_int* pY,
  38491. const mp_int* privm, void* heap)
  38492. {
  38493. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38494. sp_digit* priv = NULL;
  38495. sp_point_521* pub = NULL;
  38496. #else
  38497. sp_digit priv[17];
  38498. sp_point_521 pub[2];
  38499. #endif
  38500. sp_point_521* p = NULL;
  38501. const byte one[1] = { 1 };
  38502. int err = MP_OKAY;
  38503. /* Quick check the lengs of public key ordinates and private key are in
  38504. * range. Proper check later.
  38505. */
  38506. if (((mp_count_bits(pX) > 521) ||
  38507. (mp_count_bits(pY) > 521) ||
  38508. ((privm != NULL) && (mp_count_bits(privm) > 521)))) {
  38509. err = ECC_OUT_OF_RANGE_E;
  38510. }
  38511. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38512. if (err == MP_OKAY) {
  38513. pub = (sp_point_521*)XMALLOC(sizeof(sp_point_521) * 2, heap,
  38514. DYNAMIC_TYPE_ECC);
  38515. if (pub == NULL)
  38516. err = MEMORY_E;
  38517. }
  38518. if (err == MP_OKAY && privm) {
  38519. priv = (sp_digit*)XMALLOC(sizeof(sp_digit) * 17, heap,
  38520. DYNAMIC_TYPE_ECC);
  38521. if (priv == NULL)
  38522. err = MEMORY_E;
  38523. }
  38524. #endif
  38525. if (err == MP_OKAY) {
  38526. p = pub + 1;
  38527. sp_521_from_mp(pub->x, 17, pX);
  38528. sp_521_from_mp(pub->y, 17, pY);
  38529. sp_521_from_bin(pub->z, 17, one, (int)sizeof(one));
  38530. if (privm)
  38531. sp_521_from_mp(priv, 17, privm);
  38532. /* Check point at infinitiy. */
  38533. if ((sp_521_iszero_17(pub->x) != 0) &&
  38534. (sp_521_iszero_17(pub->y) != 0)) {
  38535. err = ECC_INF_E;
  38536. }
  38537. }
  38538. /* Check range of X and Y */
  38539. if ((err == MP_OKAY) &&
  38540. ((sp_521_cmp_17(pub->x, p521_mod) >= 0) ||
  38541. (sp_521_cmp_17(pub->y, p521_mod) >= 0))) {
  38542. err = ECC_OUT_OF_RANGE_E;
  38543. }
  38544. if (err == MP_OKAY) {
  38545. /* Check point is on curve */
  38546. err = sp_521_ecc_is_point_17(pub, heap);
  38547. }
  38548. if (err == MP_OKAY) {
  38549. /* Point * order = infinity */
  38550. err = sp_521_ecc_mulmod_17(p, pub, p521_order, 1, 1, heap);
  38551. }
  38552. /* Check result is infinity */
  38553. if ((err == MP_OKAY) && ((sp_521_iszero_17(p->x) == 0) ||
  38554. (sp_521_iszero_17(p->y) == 0))) {
  38555. err = ECC_INF_E;
  38556. }
  38557. if (privm) {
  38558. if (err == MP_OKAY) {
  38559. /* Base * private = point */
  38560. err = sp_521_ecc_mulmod_base_17(p, priv, 1, 1, heap);
  38561. }
  38562. /* Check result is public key */
  38563. if ((err == MP_OKAY) &&
  38564. ((sp_521_cmp_17(p->x, pub->x) != 0) ||
  38565. (sp_521_cmp_17(p->y, pub->y) != 0))) {
  38566. err = ECC_PRIV_KEY_E;
  38567. }
  38568. }
  38569. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38570. if (pub != NULL)
  38571. XFREE(pub, heap, DYNAMIC_TYPE_ECC);
  38572. if (priv != NULL)
  38573. XFREE(priv, heap, DYNAMIC_TYPE_ECC);
  38574. #endif
  38575. return err;
  38576. }
  38577. #endif
  38578. #ifdef WOLFSSL_PUBLIC_ECC_ADD_DBL
  38579. /* Add two projective EC points together.
  38580. * (pX, pY, pZ) + (qX, qY, qZ) = (rX, rY, rZ)
  38581. *
  38582. * pX First EC point's X ordinate.
  38583. * pY First EC point's Y ordinate.
  38584. * pZ First EC point's Z ordinate.
  38585. * qX Second EC point's X ordinate.
  38586. * qY Second EC point's Y ordinate.
  38587. * qZ Second EC point's Z ordinate.
  38588. * rX Resultant EC point's X ordinate.
  38589. * rY Resultant EC point's Y ordinate.
  38590. * rZ Resultant EC point's Z ordinate.
  38591. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  38592. */
  38593. int sp_ecc_proj_add_point_521(mp_int* pX, mp_int* pY, mp_int* pZ,
  38594. mp_int* qX, mp_int* qY, mp_int* qZ,
  38595. mp_int* rX, mp_int* rY, mp_int* rZ)
  38596. {
  38597. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38598. sp_digit* tmp = NULL;
  38599. sp_point_521* p = NULL;
  38600. #else
  38601. sp_digit tmp[2 * 17 * 6];
  38602. sp_point_521 p[2];
  38603. #endif
  38604. sp_point_521* q = NULL;
  38605. int err = MP_OKAY;
  38606. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38607. if (err == MP_OKAY) {
  38608. p = (sp_point_521*)XMALLOC(sizeof(sp_point_521) * 2, NULL,
  38609. DYNAMIC_TYPE_ECC);
  38610. if (p == NULL)
  38611. err = MEMORY_E;
  38612. }
  38613. if (err == MP_OKAY) {
  38614. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 17 * 6, NULL,
  38615. DYNAMIC_TYPE_ECC);
  38616. if (tmp == NULL) {
  38617. err = MEMORY_E;
  38618. }
  38619. }
  38620. #endif
  38621. if (err == MP_OKAY) {
  38622. q = p + 1;
  38623. sp_521_from_mp(p->x, 17, pX);
  38624. sp_521_from_mp(p->y, 17, pY);
  38625. sp_521_from_mp(p->z, 17, pZ);
  38626. sp_521_from_mp(q->x, 17, qX);
  38627. sp_521_from_mp(q->y, 17, qY);
  38628. sp_521_from_mp(q->z, 17, qZ);
  38629. p->infinity = sp_521_iszero_17(p->x) &
  38630. sp_521_iszero_17(p->y);
  38631. q->infinity = sp_521_iszero_17(q->x) &
  38632. sp_521_iszero_17(q->y);
  38633. sp_521_proj_point_add_17(p, p, q, tmp);
  38634. }
  38635. if (err == MP_OKAY) {
  38636. err = sp_521_to_mp(p->x, rX);
  38637. }
  38638. if (err == MP_OKAY) {
  38639. err = sp_521_to_mp(p->y, rY);
  38640. }
  38641. if (err == MP_OKAY) {
  38642. err = sp_521_to_mp(p->z, rZ);
  38643. }
  38644. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38645. if (tmp != NULL)
  38646. XFREE(tmp, NULL, DYNAMIC_TYPE_ECC);
  38647. if (p != NULL)
  38648. XFREE(p, NULL, DYNAMIC_TYPE_ECC);
  38649. #endif
  38650. return err;
  38651. }
  38652. /* Double a projective EC point.
  38653. * (pX, pY, pZ) + (pX, pY, pZ) = (rX, rY, rZ)
  38654. *
  38655. * pX EC point's X ordinate.
  38656. * pY EC point's Y ordinate.
  38657. * pZ EC point's Z ordinate.
  38658. * rX Resultant EC point's X ordinate.
  38659. * rY Resultant EC point's Y ordinate.
  38660. * rZ Resultant EC point's Z ordinate.
  38661. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  38662. */
  38663. int sp_ecc_proj_dbl_point_521(mp_int* pX, mp_int* pY, mp_int* pZ,
  38664. mp_int* rX, mp_int* rY, mp_int* rZ)
  38665. {
  38666. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38667. sp_digit* tmp = NULL;
  38668. sp_point_521* p = NULL;
  38669. #else
  38670. sp_digit tmp[2 * 17 * 2];
  38671. sp_point_521 p[1];
  38672. #endif
  38673. int err = MP_OKAY;
  38674. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38675. if (err == MP_OKAY) {
  38676. p = (sp_point_521*)XMALLOC(sizeof(sp_point_521), NULL,
  38677. DYNAMIC_TYPE_ECC);
  38678. if (p == NULL)
  38679. err = MEMORY_E;
  38680. }
  38681. if (err == MP_OKAY) {
  38682. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 17 * 2, NULL,
  38683. DYNAMIC_TYPE_ECC);
  38684. if (tmp == NULL)
  38685. err = MEMORY_E;
  38686. }
  38687. #endif
  38688. if (err == MP_OKAY) {
  38689. sp_521_from_mp(p->x, 17, pX);
  38690. sp_521_from_mp(p->y, 17, pY);
  38691. sp_521_from_mp(p->z, 17, pZ);
  38692. p->infinity = sp_521_iszero_17(p->x) &
  38693. sp_521_iszero_17(p->y);
  38694. sp_521_proj_point_dbl_17(p, p, tmp);
  38695. }
  38696. if (err == MP_OKAY) {
  38697. err = sp_521_to_mp(p->x, rX);
  38698. }
  38699. if (err == MP_OKAY) {
  38700. err = sp_521_to_mp(p->y, rY);
  38701. }
  38702. if (err == MP_OKAY) {
  38703. err = sp_521_to_mp(p->z, rZ);
  38704. }
  38705. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38706. if (tmp != NULL)
  38707. XFREE(tmp, NULL, DYNAMIC_TYPE_ECC);
  38708. if (p != NULL)
  38709. XFREE(p, NULL, DYNAMIC_TYPE_ECC);
  38710. #endif
  38711. return err;
  38712. }
  38713. /* Map a projective EC point to affine in place.
  38714. * pZ will be one.
  38715. *
  38716. * pX EC point's X ordinate.
  38717. * pY EC point's Y ordinate.
  38718. * pZ EC point's Z ordinate.
  38719. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  38720. */
  38721. int sp_ecc_map_521(mp_int* pX, mp_int* pY, mp_int* pZ)
  38722. {
  38723. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38724. sp_digit* tmp = NULL;
  38725. sp_point_521* p = NULL;
  38726. #else
  38727. sp_digit tmp[2 * 17 * 5];
  38728. sp_point_521 p[1];
  38729. #endif
  38730. int err = MP_OKAY;
  38731. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38732. if (err == MP_OKAY) {
  38733. p = (sp_point_521*)XMALLOC(sizeof(sp_point_521), NULL,
  38734. DYNAMIC_TYPE_ECC);
  38735. if (p == NULL)
  38736. err = MEMORY_E;
  38737. }
  38738. if (err == MP_OKAY) {
  38739. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 17 * 5, NULL,
  38740. DYNAMIC_TYPE_ECC);
  38741. if (tmp == NULL)
  38742. err = MEMORY_E;
  38743. }
  38744. #endif
  38745. if (err == MP_OKAY) {
  38746. sp_521_from_mp(p->x, 17, pX);
  38747. sp_521_from_mp(p->y, 17, pY);
  38748. sp_521_from_mp(p->z, 17, pZ);
  38749. p->infinity = sp_521_iszero_17(p->x) &
  38750. sp_521_iszero_17(p->y);
  38751. sp_521_map_17(p, p, tmp);
  38752. }
  38753. if (err == MP_OKAY) {
  38754. err = sp_521_to_mp(p->x, pX);
  38755. }
  38756. if (err == MP_OKAY) {
  38757. err = sp_521_to_mp(p->y, pY);
  38758. }
  38759. if (err == MP_OKAY) {
  38760. err = sp_521_to_mp(p->z, pZ);
  38761. }
  38762. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38763. if (tmp != NULL)
  38764. XFREE(tmp, NULL, DYNAMIC_TYPE_ECC);
  38765. if (p != NULL)
  38766. XFREE(p, NULL, DYNAMIC_TYPE_ECC);
  38767. #endif
  38768. return err;
  38769. }
  38770. #endif /* WOLFSSL_PUBLIC_ECC_ADD_DBL */
  38771. #ifdef HAVE_COMP_KEY
/* Square root power for the P521 curve.
 *
 * Stored as 17 32-bit words, least significant word first. Only bit 7 of
 * word 16 is set, so the exponent is 2^519. For the P-521 prime
 * p = 2^521 - 1 that is (p + 1) / 4.
 */
static const uint32_t p521_sqrt_power[17] = {
    0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
    0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
    0x00000000,0x00000000,0x00000080
};
  38778. /* Find the square root of a number mod the prime of the curve.
  38779. *
  38780. * y The number to operate on and the result.
  38781. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  38782. */
  38783. static int sp_521_mont_sqrt_17(sp_digit* y)
  38784. {
  38785. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38786. sp_digit* t = NULL;
  38787. #else
  38788. sp_digit t[2 * 17];
  38789. #endif
  38790. int err = MP_OKAY;
  38791. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38792. t = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 17, NULL, DYNAMIC_TYPE_ECC);
  38793. if (t == NULL)
  38794. err = MEMORY_E;
  38795. #endif
  38796. if (err == MP_OKAY) {
  38797. {
  38798. int i;
  38799. XMEMCPY(t, y, sizeof(sp_digit) * 17);
  38800. for (i=518; i>=0; i--) {
  38801. sp_521_mont_sqr_17(t, t, p521_mod, p521_mp_mod);
  38802. if (p521_sqrt_power[i / 32] & ((sp_digit)1 << (i % 32)))
  38803. sp_521_mont_mul_17(t, t, y, p521_mod, p521_mp_mod);
  38804. }
  38805. XMEMCPY(y, t, sizeof(sp_digit) * 17);
  38806. }
  38807. }
  38808. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38809. if (t != NULL)
  38810. XFREE(t, NULL, DYNAMIC_TYPE_ECC);
  38811. #endif
  38812. return err;
  38813. }
  38814. /* Uncompress the point given the X ordinate.
  38815. *
  38816. * xm X ordinate.
  38817. * odd Whether the Y ordinate is odd.
  38818. * ym Calculated Y ordinate.
  38819. * returns MEMORY_E if dynamic memory allocation fails and MP_OKAY otherwise.
  38820. */
  38821. int sp_ecc_uncompress_521(mp_int* xm, int odd, mp_int* ym)
  38822. {
  38823. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38824. sp_digit* x = NULL;
  38825. #else
  38826. sp_digit x[4 * 17];
  38827. #endif
  38828. sp_digit* y = NULL;
  38829. int err = MP_OKAY;
  38830. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38831. x = (sp_digit*)XMALLOC(sizeof(sp_digit) * 4 * 17, NULL, DYNAMIC_TYPE_ECC);
  38832. if (x == NULL)
  38833. err = MEMORY_E;
  38834. #endif
  38835. if (err == MP_OKAY) {
  38836. y = x + 2 * 17;
  38837. sp_521_from_mp(x, 17, xm);
  38838. err = sp_521_mod_mul_norm_17(x, x, p521_mod);
  38839. }
  38840. if (err == MP_OKAY) {
  38841. /* y = x^3 */
  38842. {
  38843. sp_521_mont_sqr_17(y, x, p521_mod, p521_mp_mod);
  38844. sp_521_mont_mul_17(y, y, x, p521_mod, p521_mp_mod);
  38845. }
  38846. /* y = x^3 - 3x */
  38847. sp_521_mont_sub_17(y, y, x, p521_mod);
  38848. sp_521_mont_sub_17(y, y, x, p521_mod);
  38849. sp_521_mont_sub_17(y, y, x, p521_mod);
  38850. /* y = x^3 - 3x + b */
  38851. err = sp_521_mod_mul_norm_17(x, p521_b, p521_mod);
  38852. }
  38853. if (err == MP_OKAY) {
  38854. sp_521_mont_add_17(y, y, x, p521_mod);
  38855. /* y = sqrt(x^3 - 3x + b) */
  38856. err = sp_521_mont_sqrt_17(y);
  38857. }
  38858. if (err == MP_OKAY) {
  38859. XMEMSET(y + 17, 0, 17U * sizeof(sp_digit));
  38860. sp_521_mont_reduce_17(y, p521_mod, p521_mp_mod);
  38861. if ((((word32)y[0] ^ (word32)odd) & 1U) != 0U) {
  38862. sp_521_mont_sub_17(y, p521_mod, y, p521_mod);
  38863. }
  38864. err = sp_521_to_mp(y, ym);
  38865. }
  38866. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  38867. if (x != NULL)
  38868. XFREE(x, NULL, DYNAMIC_TYPE_ECC);
  38869. #endif
  38870. return err;
  38871. }
  38872. #endif
  38873. #endif /* WOLFSSL_SP_521 */
  38874. #ifdef WOLFSSL_SP_1024
/* Point structure to use.
 *
 * Each ordinate buffer holds 2 * 32 digits.
 */
typedef struct sp_point_1024 {
    /* X ordinate of point. */
    sp_digit x[2 * 32];
    /* Y ordinate of point. */
    sp_digit y[2 * 32];
    /* Z ordinate of point. */
    sp_digit z[2 * 32];
    /* Indicates point is at infinity. */
    int infinity;
} sp_point_1024;
  38886. #ifndef WOLFSSL_SP_SMALL
/* Multiply a and b into r. (r = a * b)
 *
 * The product is computed one output word (column) at a time: for each
 * column every a[i] * b[j] pair belonging to it is accumulated into
 * r3:r4:r5, the low word is stored, and the accumulator is shifted down one
 * word. The result is built in a local 32-word buffer and copied to r after
 * the assembly completes.
 *
 * NOTE(review): %[r], %[a] and %[b] are declared as input operands but are
 * used as scratch registers inside the asm; all three hold their original
 * values again when the asm ends.
 *
 * r  A single precision integer. Receives 32 words.
 * a  A single precision integer. 16 words are read.
 * b  A single precision integer. 16 words are read.
 */
SP_NOINLINE static void sp_1024_mul_16(sp_digit* r, const sp_digit* a,
        const sp_digit* b)
{
    sp_digit tmp_arr[16 * 2];
    sp_digit* tmp = tmp_arr;
    __asm__ __volatile__ (
        /* r3:r4 = running sum, r9 = byte offset of the current column. */
        "mov r3, #0\n\t"
        "mov r4, #0\n\t"
        "mov r9, r3\n\t"
        /* Save the output and operand base pointers. */
        "mov r12, %[r]\n\t"
        "mov r10, %[a]\n\t"
        "mov r11, %[b]\n\t"
        /* r14 = a + 64 bytes: one past the last word of a. */
        "mov r6, #64\n\t"
        "add r6, r6, r10\n\t"
        "mov r14, r6\n\t"
        "\n1:\n\t"
        /* %[r] is used as a zero register for the carry adds below. */
        "mov %[r], #0\n\t"
        "mov r5, #0\n\t"
        /* a offset = (column >= 60) ? column - 60 : 0, without a branch. */
        "mov r6, #60\n\t"
        "mov %[a], r9\n\t"
        "subs %[a], %[a], r6\n\t"
        "sbc r6, r6, r6\n\t"
        "mvn r6, r6\n\t"
        "and %[a], %[a], r6\n\t"
        /* b offset = column - a offset. */
        "mov %[b], r9\n\t"
        "sub %[b], %[b], %[a]\n\t"
        "add %[a], %[a], r10\n\t"
        "add %[b], %[b], r11\n\t"
        "\n2:\n\t"
        /* Multiply Start */
        "ldr r6, [%[a]]\n\t"
        "ldr r8, [%[b]]\n\t"
        "umull r6, r8, r6, r8\n\t"
        "adds r3, r3, r6\n\t"
        "adcs r4, r4, r8\n\t"
        "adc r5, r5, %[r]\n\t"
        /* Multiply Done */
        /* Next pair in this column: a moves up a word, b moves down. */
        "add %[a], %[a], #4\n\t"
        "sub %[b], %[b], #4\n\t"
        /* Column is finished when a runs off its end ... */
        "cmp %[a], r14\n\t"
#ifdef __GNUC__
        "beq 3f\n\t"
#else
        "beq.n 3f\n\t"
#endif /* __GNUC__ */
        /* ... or when the a pointer has passed a + column offset. */
        "mov r6, r9\n\t"
        "add r6, r6, r10\n\t"
        "cmp %[a], r6\n\t"
#ifdef __GNUC__
        "ble 2b\n\t"
#else
        "ble.n 2b\n\t"
#endif /* __GNUC__ */
        "\n3:\n\t"
        /* Store the low word of the column and shift the accumulator. */
        "mov %[r], r12\n\t"
        "mov r8, r9\n\t"
        "str r3, [%[r], r8]\n\t"
        "mov r3, r4\n\t"
        "mov r4, r5\n\t"
        "add r8, r8, #4\n\t"
        "mov r9, r8\n\t"
        /* Columns at byte offsets 0..120 are computed by the loop. */
        "mov r6, #120\n\t"
        "cmp r8, r6\n\t"
#ifdef __GNUC__
        "ble 1b\n\t"
#else
        "ble.n 1b\n\t"
#endif /* __GNUC__ */
        /* Final word (byte offset 124) is the remaining carry. */
        "str r3, [%[r], r8]\n\t"
        /* Put the operand pointers back. */
        "mov %[a], r10\n\t"
        "mov %[b], r11\n\t"
        :
        : [r] "r" (tmp), [a] "r" (a), [b] "r" (b)
        : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
    );
    XMEMCPY(r, tmp_arr, sizeof(tmp_arr));
}
/* Square a and put result in r. (r = a * a)
 *
 * The square is computed one output word (column) at a time. Within a
 * column one pointer walks up through a and another walks down; each
 * product of two different words is added twice and the product of a word
 * with itself is added once. The result is built in a 128-byte scratch area
 * obtained by moving sp down inside the asm, then copied to r and sp is
 * moved back.
 *
 * NOTE(review): %[r] and %[a] are declared as input operands but are written
 * inside the asm. %[r] holds its original value again at the end; %[a] is
 * left holding the scratch buffer address. sp is modified and restored by
 * the asm itself. Confirm the compiler never relies on %[a] or on
 * sp-relative addressing across this statement.
 *
 * r  A single precision integer. Receives 32 words.
 * a  A single precision integer. 16 words are read.
 */
SP_NOINLINE static void sp_1024_sqr_16(sp_digit* r, const sp_digit* a)
{
    __asm__ __volatile__ (
        /* r3:r4:r5 = running sum, r9 = byte offset of the current column. */
        "mov r3, #0\n\t"
        "mov r4, #0\n\t"
        "mov r5, #0\n\t"
        "mov r9, r3\n\t"
        "mov r12, %[r]\n\t"
        /* Reserve 128 bytes below sp for the result; r11 points at it. */
        "mov r6, #128\n\t"
        "neg r6, r6\n\t"
        "add sp, sp, r6\n\t"
        "mov r11, sp\n\t"
        "mov r10, %[a]\n\t"
        "\n1:\n\t"
        /* %[r] is used as a zero register for the carry adds below. */
        "mov %[r], #0\n\t"
        /* Low offset = (column >= 60) ? column - 60 : 0, without a branch. */
        "mov r6, #60\n\t"
        "mov %[a], r9\n\t"
        "subs %[a], %[a], r6\n\t"
        "sbc r6, r6, r6\n\t"
        "mvn r6, r6\n\t"
        "and %[a], %[a], r6\n\t"
        /* High offset = column - low offset; r2 is the descending pointer. */
        "mov r2, r9\n\t"
        "sub r2, r2, %[a]\n\t"
        "add %[a], %[a], r10\n\t"
        "add r2, r2, r10\n\t"
        "\n2:\n\t"
        /* Same word from both ends: square it once instead. */
        "cmp r2, %[a]\n\t"
#ifdef __GNUC__
        "beq 4f\n\t"
#else
        "beq.n 4f\n\t"
#endif /* __GNUC__ */
        /* Multiply * 2: Start */
        "ldr r6, [%[a]]\n\t"
        "ldr r8, [r2]\n\t"
        "umull r6, r8, r6, r8\n\t"
        "adds r3, r3, r6\n\t"
        "adcs r4, r4, r8\n\t"
        "adc r5, r5, %[r]\n\t"
        "adds r3, r3, r6\n\t"
        "adcs r4, r4, r8\n\t"
        "adc r5, r5, %[r]\n\t"
        /* Multiply * 2: Done */
#ifdef __GNUC__
        "bal 5f\n\t"
#else
        "bal.n 5f\n\t"
#endif /* __GNUC__ */
        "\n4:\n\t"
        /* Square: Start */
        "ldr r6, [%[a]]\n\t"
        "umull r6, r8, r6, r6\n\t"
        "adds r3, r3, r6\n\t"
        "adcs r4, r4, r8\n\t"
        "adc r5, r5, %[r]\n\t"
        /* Square: Done */
        "\n5:\n\t"
        /* Move the two pointers towards each other. */
        "add %[a], %[a], #4\n\t"
        "sub r2, r2, #4\n\t"
        /* Column is finished when the rising pointer runs off the end of a, */
        "mov r6, #64\n\t"
        "add r6, r6, r10\n\t"
        "cmp %[a], r6\n\t"
#ifdef __GNUC__
        "beq 3f\n\t"
#else
        "beq.n 3f\n\t"
#endif /* __GNUC__ */
        /* when the two pointers have crossed, */
        "cmp %[a], r2\n\t"
#ifdef __GNUC__
        "bgt 3f\n\t"
#else
        "bgt.n 3f\n\t"
#endif /* __GNUC__ */
        /* or when the rising pointer has passed a + column offset. */
        "mov r8, r9\n\t"
        "add r8, r8, r10\n\t"
        "cmp %[a], r8\n\t"
#ifdef __GNUC__
        "ble 2b\n\t"
#else
        "ble.n 2b\n\t"
#endif /* __GNUC__ */
        "\n3:\n\t"
        /* Store the low word in the scratch area, shift the accumulator. */
        "mov %[r], r11\n\t"
        "mov r8, r9\n\t"
        "str r3, [%[r], r8]\n\t"
        "mov r3, r4\n\t"
        "mov r4, r5\n\t"
        "mov r5, #0\n\t"
        "add r8, r8, #4\n\t"
        "mov r9, r8\n\t"
        /* Columns at byte offsets 0..120 are computed by the loop. */
        "mov r6, #120\n\t"
        "cmp r8, r6\n\t"
#ifdef __GNUC__
        "ble 1b\n\t"
#else
        "ble.n 1b\n\t"
#endif /* __GNUC__ */
        "mov %[a], r10\n\t"
        /* Final word (byte offset 124) is the remaining carry. */
        "str r3, [%[r], r8]\n\t"
        /* Copy the 32 result words from the scratch area to r, top down. */
        "mov %[r], r12\n\t"
        "mov %[a], r11\n\t"
        "mov r3, #124\n\t"
        "\n4:\n\t"
        "ldr r6, [%[a], r3]\n\t"
        "str r6, [%[r], r3]\n\t"
        "subs r3, r3, #4\n\t"
#ifdef __GNUC__
        "bge 4b\n\t"
#else
        "bge.n 4b\n\t"
#endif /* __GNUC__ */
        /* Release the scratch area. */
        "mov r6, #128\n\t"
        "add sp, sp, r6\n\t"
        :
        : [r] "r" (r), [a] "r" (a)
        : "memory", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12"
    );
}
/* Add b to a into r. (r = a + b)
 *
 * Fully unrolled: eight groups of two words, with the carry flag chained
 * from one group to the next.
 *
 * r  A single precision integer. Receives 16 words.
 * a  A single precision integer. 16 words are read.
 * b  A single precision integer. 16 words are read.
 * returns the carry out of the top word (0 or 1).
 */
SP_NOINLINE static sp_digit sp_1024_add_16(sp_digit* r, const sp_digit* a,
        const sp_digit* b)
{
    sp_digit c = 0;
    __asm__ __volatile__ (
        /* Words 0-1: first add starts the carry chain. */
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adds r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        /* Words 2-15: add with carry in. */
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        /* c = 0 + 0 + carry; relies on this mov leaving the carry flag
         * untouched. */
        "mov %[c], #0\n\t"
        "adc %[c], %[c], %[c]\n\t"
        : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
        :
        : "memory", "r4", "r5", "r6", "r8"
    );
    return c;
}
/* Sub b from a in place. (a = a - b)
 *
 * Fully unrolled: sixteen groups of two words, with the borrow chained
 * from one group to the next through the carry flag.
 *
 * a  A single precision integer. 32 words, overwritten with the difference.
 * b  A single precision integer. 32 words are read.
 * returns 0 when there was no borrow out of the top word and all ones
 * (that is, -1) when there was.
 */
SP_NOINLINE static sp_digit sp_1024_sub_in_place_32(sp_digit* a,
        const sp_digit* b)
{
    sp_digit c = 0;
    __asm__ __volatile__ (
        /* Words 0-1: first subtract starts the borrow chain. a is loaded
         * without write-back so the following stm can advance it. */
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "subs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        /* Words 2-31: subtract with borrow in. */
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        "ldm %[a], {r3, r4}\n\t"
        "ldm %[b]!, {r5, r6}\n\t"
        "sbcs r3, r3, r5\n\t"
        "sbcs r4, r4, r6\n\t"
        "stm %[a]!, {r3, r4}\n\t"
        /* c - c - borrow: turns the final borrow into 0 or all ones. */
        "sbc %[c], %[c], %[c]\n\t"
        : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
        :
        : "memory", "r3", "r4", "r5", "r6"
    );
    return c;
}
/* Add b to a into r. (r = a + b)
 *
 * Fully unrolled: sixteen groups of two words, with the carry flag chained
 * from one group to the next.
 *
 * r  A single precision integer. Receives 32 words.
 * a  A single precision integer. 32 words are read.
 * b  A single precision integer. 32 words are read.
 * returns the carry out of the top word (0 or 1).
 */
SP_NOINLINE static sp_digit sp_1024_add_32(sp_digit* r, const sp_digit* a,
        const sp_digit* b)
{
    sp_digit c = 0;
    __asm__ __volatile__ (
        /* Words 0-1: first add starts the carry chain. */
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adds r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        /* Words 2-31: add with carry in. */
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        "ldm %[a]!, {r4, r5}\n\t"
        "ldm %[b]!, {r6, r8}\n\t"
        "adcs r4, r4, r6\n\t"
        "adcs r5, r5, r8\n\t"
        "stm %[r]!, {r4, r5}\n\t"
        /* c = 0 + 0 + carry; relies on this mov leaving the carry flag
         * untouched. */
        "mov %[c], #0\n\t"
        "adc %[c], %[c], %[c]\n\t"
        : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
        :
        : "memory", "r4", "r5", "r6", "r8"
    );
    return c;
}
  39349. /* AND m into each word of a and store in r.
  39350. *
  39351. * r A single precision integer.
  39352. * a A single precision integer.
  39353. * m Mask to AND against each digit.
  39354. */
  39355. static void sp_1024_mask_16(sp_digit* r, const sp_digit* a, sp_digit m)
  39356. {
  39357. #ifdef WOLFSSL_SP_SMALL
  39358. int i;
  39359. for (i=0; i<16; i++) {
  39360. r[i] = a[i] & m;
  39361. }
  39362. #else
  39363. int i;
  39364. for (i = 0; i < 16; i += 8) {
  39365. r[i+0] = a[i+0] & m;
  39366. r[i+1] = a[i+1] & m;
  39367. r[i+2] = a[i+2] & m;
  39368. r[i+3] = a[i+3] & m;
  39369. r[i+4] = a[i+4] & m;
  39370. r[i+5] = a[i+5] & m;
  39371. r[i+6] = a[i+6] & m;
  39372. r[i+7] = a[i+7] & m;
  39373. }
  39374. #endif
  39375. }
  39376. /* Multiply a and b into r. (r = a * b)
  39377. *
  39378. * r A single precision integer.
  39379. * a A single precision integer.
  39380. * b A single precision integer.
  39381. */
  39382. SP_NOINLINE static void sp_1024_mul_32(sp_digit* r, const sp_digit* a,
  39383. const sp_digit* b)
  39384. {
  39385. sp_digit* z0 = r;
  39386. sp_digit z1[32];
  39387. sp_digit a1[16];
  39388. sp_digit b1[16];
  39389. sp_digit* z2 = r + 32;
  39390. sp_digit u;
  39391. sp_digit ca;
  39392. sp_digit cb;
  39393. ca = sp_1024_add_16(a1, a, &a[16]);
  39394. cb = sp_1024_add_16(b1, b, &b[16]);
  39395. u = ca & cb;
  39396. sp_1024_mul_16(z2, &a[16], &b[16]);
  39397. sp_1024_mul_16(z0, a, b);
  39398. sp_1024_mul_16(z1, a1, b1);
  39399. u += sp_1024_sub_in_place_32(z1, z0);
  39400. u += sp_1024_sub_in_place_32(z1, z2);
  39401. sp_1024_mask_16(a1, a1, 0 - cb);
  39402. u += sp_1024_add_16(z1 + 16, z1 + 16, a1);
  39403. sp_1024_mask_16(b1, b1, 0 - ca);
  39404. u += sp_1024_add_16(z1 + 16, z1 + 16, b1);
  39405. u += sp_1024_add_32(r + 16, r + 16, z1);
  39406. XMEMSET(a1 + 1, 0, sizeof(sp_digit) * (16 - 1));
  39407. a1[0] = u;
  39408. (void)sp_1024_add_16(r + 48, r + 48, a1);
  39409. }
  39410. /* Sub b from a into r. (r = a - b)
  39411. *
  39412. * r A single precision integer.
  39413. * a A single precision integer.
  39414. * b A single precision integer.
  39415. */
  39416. SP_NOINLINE static sp_digit sp_1024_sub_16(sp_digit* r, const sp_digit* a,
  39417. const sp_digit* b)
  39418. {
  39419. sp_digit c = 0;
  39420. __asm__ __volatile__ (
  39421. "ldm %[a]!, {r4, r5}\n\t"
  39422. "ldm %[b]!, {r6, r8}\n\t"
  39423. "subs r4, r4, r6\n\t"
  39424. "sbcs r5, r5, r8\n\t"
  39425. "stm %[r]!, {r4, r5}\n\t"
  39426. "ldm %[a]!, {r4, r5}\n\t"
  39427. "ldm %[b]!, {r6, r8}\n\t"
  39428. "sbcs r4, r4, r6\n\t"
  39429. "sbcs r5, r5, r8\n\t"
  39430. "stm %[r]!, {r4, r5}\n\t"
  39431. "ldm %[a]!, {r4, r5}\n\t"
  39432. "ldm %[b]!, {r6, r8}\n\t"
  39433. "sbcs r4, r4, r6\n\t"
  39434. "sbcs r5, r5, r8\n\t"
  39435. "stm %[r]!, {r4, r5}\n\t"
  39436. "ldm %[a]!, {r4, r5}\n\t"
  39437. "ldm %[b]!, {r6, r8}\n\t"
  39438. "sbcs r4, r4, r6\n\t"
  39439. "sbcs r5, r5, r8\n\t"
  39440. "stm %[r]!, {r4, r5}\n\t"
  39441. "ldm %[a]!, {r4, r5}\n\t"
  39442. "ldm %[b]!, {r6, r8}\n\t"
  39443. "sbcs r4, r4, r6\n\t"
  39444. "sbcs r5, r5, r8\n\t"
  39445. "stm %[r]!, {r4, r5}\n\t"
  39446. "ldm %[a]!, {r4, r5}\n\t"
  39447. "ldm %[b]!, {r6, r8}\n\t"
  39448. "sbcs r4, r4, r6\n\t"
  39449. "sbcs r5, r5, r8\n\t"
  39450. "stm %[r]!, {r4, r5}\n\t"
  39451. "ldm %[a]!, {r4, r5}\n\t"
  39452. "ldm %[b]!, {r6, r8}\n\t"
  39453. "sbcs r4, r4, r6\n\t"
  39454. "sbcs r5, r5, r8\n\t"
  39455. "stm %[r]!, {r4, r5}\n\t"
  39456. "ldm %[a]!, {r4, r5}\n\t"
  39457. "ldm %[b]!, {r6, r8}\n\t"
  39458. "sbcs r4, r4, r6\n\t"
  39459. "sbcs r5, r5, r8\n\t"
  39460. "stm %[r]!, {r4, r5}\n\t"
  39461. "sbc %[c], %[c], %[c]\n\t"
  39462. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  39463. :
  39464. : "memory", "r4", "r5", "r6", "r8"
  39465. );
  39466. return c;
  39467. }
  39468. /* Square a and put result in r. (r = a * a)
  39469. *
  39470. * r A single precision integer.
  39471. * a A single precision integer.
  39472. */
  39473. SP_NOINLINE static void sp_1024_sqr_32(sp_digit* r, const sp_digit* a)
  39474. {
  39475. sp_digit* z0 = r;
  39476. sp_digit* z2 = r + 32;
  39477. sp_digit z1[32];
  39478. sp_digit* a1 = z1;
  39479. sp_digit zero[16];
  39480. sp_digit u;
  39481. sp_digit mask;
  39482. sp_digit* p1;
  39483. sp_digit* p2;
  39484. XMEMSET(zero, 0, sizeof(sp_digit) * 16);
  39485. mask = sp_1024_sub_16(a1, a, &a[16]);
  39486. p1 = (sp_digit*)(((sp_digit)zero & mask ) | ((sp_digit)a1 & (~mask)));
  39487. p2 = (sp_digit*)(((sp_digit)zero & (~mask)) | ((sp_digit)a1 & mask ));
  39488. (void)sp_1024_sub_16(a1, p1, p2);
  39489. sp_1024_sqr_16(z2, &a[16]);
  39490. sp_1024_sqr_16(z0, a);
  39491. sp_1024_sqr_16(z1, a1);
  39492. u = 0;
  39493. u -= sp_1024_sub_in_place_32(z1, z2);
  39494. u -= sp_1024_sub_in_place_32(z1, z0);
  39495. u += sp_1024_sub_in_place_32(r + 16, z1);
  39496. zero[0] = u;
  39497. (void)sp_1024_add_16(r + 48, r + 48, zero);
  39498. }
  39499. #else
  39500. /* Multiply a and b into r. (r = a * b)
  39501. *
  39502. * r A single precision integer.
  39503. * a A single precision integer.
  39504. * b A single precision integer.
  39505. */
  39506. SP_NOINLINE static void sp_1024_mul_32(sp_digit* r, const sp_digit* a,
  39507. const sp_digit* b)
  39508. {
  39509. sp_digit tmp_arr[32 * 2];
  39510. sp_digit* tmp = tmp_arr;
  39511. __asm__ __volatile__ (
  39512. "mov r3, #0\n\t"
  39513. "mov r4, #0\n\t"
  39514. "mov r9, r3\n\t"
  39515. "mov r12, %[r]\n\t"
  39516. "mov r10, %[a]\n\t"
  39517. "mov r11, %[b]\n\t"
  39518. "mov r6, #128\n\t"
  39519. "add r6, r6, r10\n\t"
  39520. "mov r14, r6\n\t"
  39521. "\n1:\n\t"
  39522. "mov %[r], #0\n\t"
  39523. "mov r5, #0\n\t"
  39524. "mov r6, #124\n\t"
  39525. "mov %[a], r9\n\t"
  39526. "subs %[a], %[a], r6\n\t"
  39527. "sbc r6, r6, r6\n\t"
  39528. "mvn r6, r6\n\t"
  39529. "and %[a], %[a], r6\n\t"
  39530. "mov %[b], r9\n\t"
  39531. "sub %[b], %[b], %[a]\n\t"
  39532. "add %[a], %[a], r10\n\t"
  39533. "add %[b], %[b], r11\n\t"
  39534. "\n2:\n\t"
  39535. /* Multiply Start */
  39536. "ldr r6, [%[a]]\n\t"
  39537. "ldr r8, [%[b]]\n\t"
  39538. "umull r6, r8, r6, r8\n\t"
  39539. "adds r3, r3, r6\n\t"
  39540. "adcs r4, r4, r8\n\t"
  39541. "adc r5, r5, %[r]\n\t"
  39542. /* Multiply Done */
  39543. "add %[a], %[a], #4\n\t"
  39544. "sub %[b], %[b], #4\n\t"
  39545. "cmp %[a], r14\n\t"
  39546. #ifdef __GNUC__
  39547. "beq 3f\n\t"
  39548. #else
  39549. "beq.n 3f\n\t"
  39550. #endif /* __GNUC__ */
  39551. "mov r6, r9\n\t"
  39552. "add r6, r6, r10\n\t"
  39553. "cmp %[a], r6\n\t"
  39554. #ifdef __GNUC__
  39555. "ble 2b\n\t"
  39556. #else
  39557. "ble.n 2b\n\t"
  39558. #endif /* __GNUC__ */
  39559. "\n3:\n\t"
  39560. "mov %[r], r12\n\t"
  39561. "mov r8, r9\n\t"
  39562. "str r3, [%[r], r8]\n\t"
  39563. "mov r3, r4\n\t"
  39564. "mov r4, r5\n\t"
  39565. "add r8, r8, #4\n\t"
  39566. "mov r9, r8\n\t"
  39567. "mov r6, #248\n\t"
  39568. "cmp r8, r6\n\t"
  39569. #ifdef __GNUC__
  39570. "ble 1b\n\t"
  39571. #else
  39572. "ble.n 1b\n\t"
  39573. #endif /* __GNUC__ */
  39574. "str r3, [%[r], r8]\n\t"
  39575. "mov %[a], r10\n\t"
  39576. "mov %[b], r11\n\t"
  39577. :
  39578. : [r] "r" (tmp), [a] "r" (a), [b] "r" (b)
  39579. : "memory", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  39580. );
  39581. XMEMCPY(r, tmp_arr, sizeof(tmp_arr));
  39582. }
  39583. /* Square a and put result in r. (r = a * a)
  39584. *
  39585. * r A single precision integer.
  39586. * a A single precision integer.
  39587. */
  39588. SP_NOINLINE static void sp_1024_sqr_32(sp_digit* r, const sp_digit* a)
  39589. {
  39590. __asm__ __volatile__ (
  39591. "mov r3, #0\n\t"
  39592. "mov r4, #0\n\t"
  39593. "mov r5, #0\n\t"
  39594. "mov r9, r3\n\t"
  39595. "mov r12, %[r]\n\t"
  39596. "mov r6, #1\n\t"
  39597. "lsl r6, r6, #8\n\t"
  39598. "neg r6, r6\n\t"
  39599. "add sp, sp, r6\n\t"
  39600. "mov r11, sp\n\t"
  39601. "mov r10, %[a]\n\t"
  39602. "\n1:\n\t"
  39603. "mov %[r], #0\n\t"
  39604. "mov r6, #124\n\t"
  39605. "mov %[a], r9\n\t"
  39606. "subs %[a], %[a], r6\n\t"
  39607. "sbc r6, r6, r6\n\t"
  39608. "mvn r6, r6\n\t"
  39609. "and %[a], %[a], r6\n\t"
  39610. "mov r2, r9\n\t"
  39611. "sub r2, r2, %[a]\n\t"
  39612. "add %[a], %[a], r10\n\t"
  39613. "add r2, r2, r10\n\t"
  39614. "\n2:\n\t"
  39615. "cmp r2, %[a]\n\t"
  39616. #ifdef __GNUC__
  39617. "beq 4f\n\t"
  39618. #else
  39619. "beq.n 4f\n\t"
  39620. #endif /* __GNUC__ */
  39621. /* Multiply * 2: Start */
  39622. "ldr r6, [%[a]]\n\t"
  39623. "ldr r8, [r2]\n\t"
  39624. "umull r6, r8, r6, r8\n\t"
  39625. "adds r3, r3, r6\n\t"
  39626. "adcs r4, r4, r8\n\t"
  39627. "adc r5, r5, %[r]\n\t"
  39628. "adds r3, r3, r6\n\t"
  39629. "adcs r4, r4, r8\n\t"
  39630. "adc r5, r5, %[r]\n\t"
  39631. /* Multiply * 2: Done */
  39632. #ifdef __GNUC__
  39633. "bal 5f\n\t"
  39634. #else
  39635. "bal.n 5f\n\t"
  39636. #endif /* __GNUC__ */
  39637. "\n4:\n\t"
  39638. /* Square: Start */
  39639. "ldr r6, [%[a]]\n\t"
  39640. "umull r6, r8, r6, r6\n\t"
  39641. "adds r3, r3, r6\n\t"
  39642. "adcs r4, r4, r8\n\t"
  39643. "adc r5, r5, %[r]\n\t"
  39644. /* Square: Done */
  39645. "\n5:\n\t"
  39646. "add %[a], %[a], #4\n\t"
  39647. "sub r2, r2, #4\n\t"
  39648. "mov r6, #128\n\t"
  39649. "add r6, r6, r10\n\t"
  39650. "cmp %[a], r6\n\t"
  39651. #ifdef __GNUC__
  39652. "beq 3f\n\t"
  39653. #else
  39654. "beq.n 3f\n\t"
  39655. #endif /* __GNUC__ */
  39656. "cmp %[a], r2\n\t"
  39657. #ifdef __GNUC__
  39658. "bgt 3f\n\t"
  39659. #else
  39660. "bgt.n 3f\n\t"
  39661. #endif /* __GNUC__ */
  39662. "mov r8, r9\n\t"
  39663. "add r8, r8, r10\n\t"
  39664. "cmp %[a], r8\n\t"
  39665. #ifdef __GNUC__
  39666. "ble 2b\n\t"
  39667. #else
  39668. "ble.n 2b\n\t"
  39669. #endif /* __GNUC__ */
  39670. "\n3:\n\t"
  39671. "mov %[r], r11\n\t"
  39672. "mov r8, r9\n\t"
  39673. "str r3, [%[r], r8]\n\t"
  39674. "mov r3, r4\n\t"
  39675. "mov r4, r5\n\t"
  39676. "mov r5, #0\n\t"
  39677. "add r8, r8, #4\n\t"
  39678. "mov r9, r8\n\t"
  39679. "mov r6, #248\n\t"
  39680. "cmp r8, r6\n\t"
  39681. #ifdef __GNUC__
  39682. "ble 1b\n\t"
  39683. #else
  39684. "ble.n 1b\n\t"
  39685. #endif /* __GNUC__ */
  39686. "mov %[a], r10\n\t"
  39687. "str r3, [%[r], r8]\n\t"
  39688. "mov %[r], r12\n\t"
  39689. "mov %[a], r11\n\t"
  39690. "mov r3, #252\n\t"
  39691. "\n4:\n\t"
  39692. "ldr r6, [%[a], r3]\n\t"
  39693. "str r6, [%[r], r3]\n\t"
  39694. "subs r3, r3, #4\n\t"
  39695. #ifdef __GNUC__
  39696. "bge 4b\n\t"
  39697. #else
  39698. "bge.n 4b\n\t"
  39699. #endif /* __GNUC__ */
  39700. "mov r6, #1\n\t"
  39701. "lsl r6, r6, #8\n\t"
  39702. "add sp, sp, r6\n\t"
  39703. :
  39704. : [r] "r" (r), [a] "r" (a)
  39705. : "memory", "r2", "r3", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12"
  39706. );
  39707. }
  39708. #endif /* !WOLFSSL_SP_SMALL */
  39709. /* The modulus (prime) of the curve P1024. */
  39710. static const sp_digit p1024_mod[32] = {
  39711. 0xfea85feb,0x666d807a,0xac7ace87,0x80c5df10,0x89857db0,0xfce3e823,
  39712. 0x56971f1f,0x9f94d6af,0x1c3c09aa,0xa7cf3c52,0x31852a82,0xb6aff4a8,
  39713. 0x65681ce1,0x512ac5cd,0x326b4cd4,0xe26c6487,0xa666a6d0,0x356d27f4,
  39714. 0xf7c88a19,0xe791b39f,0x31a59cb0,0x228730d5,0xe2fc0f1b,0xf40aab27,
  39715. 0xb3e01a2e,0xbe9ae358,0x9cb48261,0x416c0ce1,0xdad0657a,0x65c61198,
  39716. 0x0a563fda,0x997abb1f
  39717. };
  39718. /* The Montgomery normalizer for modulus of the curve P1024. */
  39719. static const sp_digit p1024_norm_mod[32] = {
  39720. 0x0157a015,0x99927f85,0x53853178,0x7f3a20ef,0x767a824f,0x031c17dc,
  39721. 0xa968e0e0,0x606b2950,0xe3c3f655,0x5830c3ad,0xce7ad57d,0x49500b57,
  39722. 0x9a97e31e,0xaed53a32,0xcd94b32b,0x1d939b78,0x5999592f,0xca92d80b,
  39723. 0x083775e6,0x186e4c60,0xce5a634f,0xdd78cf2a,0x1d03f0e4,0x0bf554d8,
  39724. 0x4c1fe5d1,0x41651ca7,0x634b7d9e,0xbe93f31e,0x252f9a85,0x9a39ee67,
  39725. 0xf5a9c025,0x668544e0
  39726. };
  39727. /* The Montgomery multiplier for modulus of the curve P1024. */
  39728. static sp_digit p1024_mp_mod = 0x7c8f2f3d;
  #if defined(WOLFSSL_SP_SMALL) || defined(HAVE_ECC_CHECK_KEY)
  /* Order of curve P1024, least significant word first. Only built for the
   * small code-size configuration or when key checking is enabled. */
  static const sp_digit p1024_order[32] = {
      0xbfaa17fb, 0xd99b601e, 0x2b1eb3a1, 0x203177c4,
      0xe2615f6c, 0xff38fa08, 0xd5a5c7c7, 0xa7e535ab,
      0x870f026a, 0xa9f3cf14, 0x0c614aa0, 0x6dabfd2a,
      0x595a0738, 0x144ab173, 0xcc9ad335, 0x389b1921,
      0x2999a9b4, 0x4d5b49fd, 0xfdf22286, 0x39e46ce7,
      0x4c69672c, 0xc8a1cc35, 0xf8bf03c6, 0xbd02aac9,
      0x2cf8068b, 0x6fa6b8d6, 0x672d2098, 0x905b0338,
      0x36b4195e, 0x99718466, 0xc2958ff6, 0x265eaec7
  };
  #endif
  39740. /* The base point of curve P1024. */
  39741. static const sp_point_1024 p1024_base = {
  39742. /* X ordinate */
  39743. {
  39744. 0xeae63895,0x880dc8ab,0x967e0979,0x80ec46c4,0xb63f73ec,0xee9163a5,
  39745. 0x80728d87,0xd5cfb4cc,0xba66910d,0xa7c1514d,0x7a60de74,0xa702c339,
  39746. 0x8b72f2e1,0x337c8654,0x5dd5bccb,0x9760af76,0x406ce890,0x718bd9e7,
  39747. 0xdb9dfa55,0x43d5f22c,0x30b09e10,0xab10db90,0xf6ce2308,0xb5edb6c0,
  39748. 0xb6ff7cbf,0x98b2f204,0x0aec69c6,0x2b1a2fd6,0x3ed9b52a,0x0a799005,
  39749. 0x332c29ad,0x53fc09ee,
  39750. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39751. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39752. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39753. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39754. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39755. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39756. (sp_digit)0, (sp_digit)0
  39757. },
  39758. /* Y ordinate */
  39759. {
  39760. 0x1bef16d7,0x75573fd7,0x6a67dcde,0xadb9b570,0xd5bb4636,0x80bdad5a,
  39761. 0xe9cb99a9,0x13515ad7,0xc5a4d5f2,0x492d979f,0x164aa989,0xac6f1e80,
  39762. 0xb7652fe0,0xcad696b5,0xad547c6c,0x70dae117,0xa9e032b9,0x416cff0c,
  39763. 0x9a140b2e,0x6b598ccf,0xf0de55f6,0xe7f7f5e5,0x654ec2b9,0xf5ea69f4,
  39764. 0x1e141178,0x3d778d82,0x02990696,0xd3e82016,0x3634a135,0xf9f1f053,
  39765. 0x3f6009f1,0x0a824906,
  39766. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39767. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39768. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39769. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39770. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39771. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39772. (sp_digit)0, (sp_digit)0
  39773. },
  39774. /* Z ordinate */
  39775. {
  39776. 0x00000001,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  39777. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  39778. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  39779. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  39780. 0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
  39781. 0x00000000,0x00000000,
  39782. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39783. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39784. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39785. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39786. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39787. (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0, (sp_digit)0,
  39788. (sp_digit)0, (sp_digit)0
  39789. },
  39790. /* infinity */
  39791. 0
  39792. };
  39793. #ifdef WOLFSSL_SP_SMALL
  39794. /* Sub b from a into a. (a -= b)
  39795. *
  39796. * a A single precision integer.
  39797. * b A single precision integer.
  39798. */
  39799. SP_NOINLINE static sp_digit sp_1024_sub_in_place_32(sp_digit* a,
  39800. const sp_digit* b)
  39801. {
  39802. sp_digit c = 0;
  39803. __asm__ __volatile__ (
  39804. "mov r8, %[a]\n\t"
  39805. "add r8, r8, #128\n\t"
  39806. "\n1:\n\t"
  39807. "mov r5, #0\n\t"
  39808. "subs r5, r5, %[c]\n\t"
  39809. "ldr r3, [%[a]]\n\t"
  39810. "ldr r4, [%[a], #4]\n\t"
  39811. "ldr r5, [%[b]]\n\t"
  39812. "ldr r6, [%[b], #4]\n\t"
  39813. "sbcs r3, r3, r5\n\t"
  39814. "sbcs r4, r4, r6\n\t"
  39815. "str r3, [%[a]]\n\t"
  39816. "str r4, [%[a], #4]\n\t"
  39817. "sbc %[c], %[c], %[c]\n\t"
  39818. "add %[a], %[a], #8\n\t"
  39819. "add %[b], %[b], #8\n\t"
  39820. "cmp %[a], r8\n\t"
  39821. #ifdef __GNUC__
  39822. "bne 1b\n\t"
  39823. #else
  39824. "bne.n 1b\n\t"
  39825. #endif /* __GNUC__ */
  39826. : [c] "+r" (c), [a] "+r" (a), [b] "+r" (b)
  39827. :
  39828. : "memory", "r3", "r4", "r5", "r6", "r8"
  39829. );
  39830. return c;
  39831. }
  39832. #endif /* WOLFSSL_SP_SMALL */
  39833. /* Conditionally subtract b from a using the mask m.
  39834. * m is -1 to subtract and 0 when not copying.
  39835. *
  39836. * r A single precision number representing condition subtract result.
  39837. * a A single precision number to subtract from.
  39838. * b A single precision number to subtract.
  39839. * m Mask value to apply.
  39840. */
  39841. SP_NOINLINE static sp_digit sp_1024_cond_sub_32(sp_digit* r, const sp_digit* a,
  39842. const sp_digit* b, sp_digit m)
  39843. {
  39844. sp_digit c = 0;
  39845. __asm__ __volatile__ (
  39846. "mov r5, #128\n\t"
  39847. "mov r9, r5\n\t"
  39848. "mov r8, #0\n\t"
  39849. "\n1:\n\t"
  39850. "ldr r6, [%[b], r8]\n\t"
  39851. "and r6, r6, %[m]\n\t"
  39852. "mov r5, #0\n\t"
  39853. "subs r5, r5, %[c]\n\t"
  39854. "ldr r5, [%[a], r8]\n\t"
  39855. "sbcs r5, r5, r6\n\t"
  39856. "sbcs %[c], %[c], %[c]\n\t"
  39857. "str r5, [%[r], r8]\n\t"
  39858. "add r8, r8, #4\n\t"
  39859. "cmp r8, r9\n\t"
  39860. #ifdef __GNUC__
  39861. "blt 1b\n\t"
  39862. #else
  39863. "blt.n 1b\n\t"
  39864. #endif /* __GNUC__ */
  39865. : [c] "+r" (c)
  39866. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  39867. : "memory", "r5", "r6", "r8", "r9"
  39868. );
  39869. return c;
  39870. }
  39871. #ifdef WOLFSSL_SP_SMALL
  39872. /* Add b to a into r. (r = a + b)
  39873. *
  39874. * r A single precision integer.
  39875. * a A single precision integer.
  39876. * b A single precision integer.
  39877. */
  39878. SP_NOINLINE static sp_digit sp_1024_add_32(sp_digit* r, const sp_digit* a,
  39879. const sp_digit* b)
  39880. {
  39881. sp_digit c = 0;
  39882. __asm__ __volatile__ (
  39883. "mov r6, %[a]\n\t"
  39884. "mov r8, #0\n\t"
  39885. "add r6, r6, #128\n\t"
  39886. "sub r8, r8, #1\n\t"
  39887. "\n1:\n\t"
  39888. "adds %[c], %[c], r8\n\t"
  39889. "ldr r4, [%[a]]\n\t"
  39890. "ldr r5, [%[b]]\n\t"
  39891. "adcs r4, r4, r5\n\t"
  39892. "str r4, [%[r]]\n\t"
  39893. "mov %[c], #0\n\t"
  39894. "adc %[c], %[c], %[c]\n\t"
  39895. "add %[a], %[a], #4\n\t"
  39896. "add %[b], %[b], #4\n\t"
  39897. "add %[r], %[r], #4\n\t"
  39898. "cmp %[a], r6\n\t"
  39899. #ifdef __GNUC__
  39900. "bne 1b\n\t"
  39901. #else
  39902. "bne.n 1b\n\t"
  39903. #endif /* __GNUC__ */
  39904. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  39905. :
  39906. : "memory", "r4", "r5", "r6", "r8"
  39907. );
  39908. return c;
  39909. }
  39910. #endif /* WOLFSSL_SP_SMALL */
  39911. /* Mul a by digit b into r. (r = a * b)
  39912. *
  39913. * r A single precision integer.
  39914. * a A single precision integer.
  39915. * b A single precision digit.
  39916. */
  39917. SP_NOINLINE static void sp_1024_mul_d_32(sp_digit* r, const sp_digit* a,
  39918. sp_digit b)
  39919. {
  39920. __asm__ __volatile__ (
  39921. "add r9, %[a], #128\n\t"
  39922. /* A[0] * B */
  39923. "ldr r6, [%[a]], #4\n\t"
  39924. "umull r5, r3, r6, %[b]\n\t"
  39925. "mov r4, #0\n\t"
  39926. "str r5, [%[r]], #4\n\t"
  39927. /* A[0] * B - Done */
  39928. "\n1:\n\t"
  39929. "mov r5, #0\n\t"
  39930. /* A[] * B */
  39931. "ldr r6, [%[a]], #4\n\t"
  39932. "umull r6, r8, r6, %[b]\n\t"
  39933. "adds r3, r3, r6\n\t"
  39934. "adcs r4, r4, r8\n\t"
  39935. "adc r5, r5, #0\n\t"
  39936. /* A[] * B - Done */
  39937. "str r3, [%[r]], #4\n\t"
  39938. "mov r3, r4\n\t"
  39939. "mov r4, r5\n\t"
  39940. "cmp %[a], r9\n\t"
  39941. #ifdef __GNUC__
  39942. "blt 1b\n\t"
  39943. #else
  39944. "blt.n 1b\n\t"
  39945. #endif /* __GNUC__ */
  39946. "str r3, [%[r]]\n\t"
  39947. : [r] "+r" (r), [a] "+r" (a)
  39948. : [b] "r" (b)
  39949. : "memory", "r3", "r4", "r5", "r6", "r8", "r9"
  39950. );
  39951. }
  39952. /* Divide the double width number (d1|d0) by the divisor. (d1|d0 / div)
  39953. *
  39954. * d1 The high order half of the number to divide.
  39955. * d0 The low order half of the number to divide.
  39956. * div The divisor.
  39957. * returns the result of the division.
  39958. *
  39959. * Note that this is an approximate div. It may give an answer 1 larger.
  39960. */
  39961. SP_NOINLINE static sp_digit div_1024_word_32(sp_digit d1, sp_digit d0,
  39962. sp_digit div)
  39963. {
  39964. sp_digit r = 0;
  39965. __asm__ __volatile__ (
  39966. "lsr r6, %[div], #16\n\t"
  39967. "add r6, r6, #1\n\t"
  39968. "udiv r4, %[d1], r6\n\t"
  39969. "lsl r8, r4, #16\n\t"
  39970. "umull r4, r5, %[div], r8\n\t"
  39971. "subs %[d0], %[d0], r4\n\t"
  39972. "sbc %[d1], %[d1], r5\n\t"
  39973. "udiv r5, %[d1], r6\n\t"
  39974. "lsl r4, r5, #16\n\t"
  39975. "add r8, r8, r4\n\t"
  39976. "umull r4, r5, %[div], r4\n\t"
  39977. "subs %[d0], %[d0], r4\n\t"
  39978. "sbc %[d1], %[d1], r5\n\t"
  39979. "lsl r4, %[d1], #16\n\t"
  39980. "orr r4, r4, %[d0], lsr #16\n\t"
  39981. "udiv r4, r4, r6\n\t"
  39982. "add r8, r8, r4\n\t"
  39983. "umull r4, r5, %[div], r4\n\t"
  39984. "subs %[d0], %[d0], r4\n\t"
  39985. "sbc %[d1], %[d1], r5\n\t"
  39986. "lsl r4, %[d1], #16\n\t"
  39987. "orr r4, r4, %[d0], lsr #16\n\t"
  39988. "udiv r4, r4, r6\n\t"
  39989. "add r8, r8, r4\n\t"
  39990. "umull r4, r5, %[div], r4\n\t"
  39991. "subs %[d0], %[d0], r4\n\t"
  39992. "sbc %[d1], %[d1], r5\n\t"
  39993. "udiv r4, %[d0], %[div]\n\t"
  39994. "add r8, r8, r4\n\t"
  39995. "mov %[r], r8\n\t"
  39996. : [r] "+r" (r)
  39997. : [d1] "r" (d1), [d0] "r" (d0), [div] "r" (div)
  39998. : "r4", "r5", "r6", "r8"
  39999. );
  40000. return r;
  40001. }
  40002. /* AND m into each word of a and store in r.
  40003. *
  40004. * r A single precision integer.
  40005. * a A single precision integer.
  40006. * m Mask to AND against each digit.
  40007. */
  40008. static void sp_1024_mask_32(sp_digit* r, const sp_digit* a, sp_digit m)
  40009. {
  40010. #ifdef WOLFSSL_SP_SMALL
  40011. int i;
  40012. for (i=0; i<32; i++) {
  40013. r[i] = a[i] & m;
  40014. }
  40015. #else
  40016. int i;
  40017. for (i = 0; i < 32; i += 8) {
  40018. r[i+0] = a[i+0] & m;
  40019. r[i+1] = a[i+1] & m;
  40020. r[i+2] = a[i+2] & m;
  40021. r[i+3] = a[i+3] & m;
  40022. r[i+4] = a[i+4] & m;
  40023. r[i+5] = a[i+5] & m;
  40024. r[i+6] = a[i+6] & m;
  40025. r[i+7] = a[i+7] & m;
  40026. }
  40027. #endif
  40028. }
  40029. /* Compare a with b in constant time.
  40030. *
  40031. * a A single precision integer.
  40032. * b A single precision integer.
  40033. * return -ve, 0 or +ve if a is less than, equal to or greater than b
  40034. * respectively.
  40035. */
  40036. SP_NOINLINE static sp_int32 sp_1024_cmp_32(const sp_digit* a, const sp_digit* b)
  40037. {
  40038. sp_digit r = 0;
  40039. __asm__ __volatile__ (
  40040. "mov r3, #0\n\t"
  40041. "mvn r3, r3\n\t"
  40042. "mov r6, #124\n\t"
  40043. "\n1:\n\t"
  40044. "ldr r8, [%[a], r6]\n\t"
  40045. "ldr r5, [%[b], r6]\n\t"
  40046. "and r8, r8, r3\n\t"
  40047. "and r5, r5, r3\n\t"
  40048. "mov r4, r8\n\t"
  40049. "subs r8, r8, r5\n\t"
  40050. "sbc r8, r8, r8\n\t"
  40051. "add %[r], %[r], r8\n\t"
  40052. "mvn r8, r8\n\t"
  40053. "and r3, r3, r8\n\t"
  40054. "subs r5, r5, r4\n\t"
  40055. "sbc r8, r8, r8\n\t"
  40056. "sub %[r], %[r], r8\n\t"
  40057. "mvn r8, r8\n\t"
  40058. "and r3, r3, r8\n\t"
  40059. "sub r6, r6, #4\n\t"
  40060. "cmp r6, #0\n\t"
  40061. #ifdef __GNUC__
  40062. "bge 1b\n\t"
  40063. #else
  40064. "bge.n 1b\n\t"
  40065. #endif /* __GNUC__ */
  40066. : [r] "+r" (r)
  40067. : [a] "r" (a), [b] "r" (b)
  40068. : "r3", "r4", "r5", "r6", "r8"
  40069. );
  40070. return r;
  40071. }
  40072. /* Divide d in a and put remainder into r (m*d + r = a)
  40073. * m is not calculated as it is not needed at this time.
  40074. *
  40075. * a Number to be divided.
  40076. * d Number to divide with.
  40077. * m Multiplier result.
  40078. * r Remainder from the division.
  40079. * returns MP_OKAY indicating success.
  40080. */
  40081. static WC_INLINE int sp_1024_div_32(const sp_digit* a, const sp_digit* d, sp_digit* m,
  40082. sp_digit* r)
  40083. {
  40084. sp_digit t1[64], t2[33];
  40085. sp_digit div, r1;
  40086. int i;
  40087. (void)m;
  40088. div = d[31];
  40089. XMEMCPY(t1, a, sizeof(*t1) * 2 * 32);
  40090. r1 = sp_1024_cmp_32(&t1[32], d) >= 0;
  40091. sp_1024_cond_sub_32(&t1[32], &t1[32], d, (sp_digit)0 - r1);
  40092. for (i = 31; i >= 0; i--) {
  40093. sp_digit mask = 0 - (t1[32 + i] == div);
  40094. sp_digit hi = t1[32 + i] + mask;
  40095. r1 = div_1024_word_32(hi, t1[32 + i - 1], div);
  40096. r1 |= mask;
  40097. sp_1024_mul_d_32(t2, d, r1);
  40098. t1[32 + i] += sp_1024_sub_in_place_32(&t1[i], t2);
  40099. t1[32 + i] -= t2[32];
  40100. sp_1024_mask_32(t2, d, t1[32 + i]);
  40101. t1[32 + i] += sp_1024_add_32(&t1[i], &t1[i], t2);
  40102. sp_1024_mask_32(t2, d, t1[32 + i]);
  40103. t1[32 + i] += sp_1024_add_32(&t1[i], &t1[i], t2);
  40104. }
  40105. r1 = sp_1024_cmp_32(t1, d) >= 0;
  40106. sp_1024_cond_sub_32(r, t1, d, (sp_digit)0 - r1);
  40107. return MP_OKAY;
  40108. }
  40109. /* Reduce a modulo m into r. (r = a mod m)
  40110. *
  40111. * r A single precision number that is the reduced result.
  40112. * a A single precision number that is to be reduced.
  40113. * m A single precision number that is the modulus to reduce with.
  40114. * returns MP_OKAY indicating success.
  40115. */
  40116. static WC_INLINE int sp_1024_mod_32(sp_digit* r, const sp_digit* a, const sp_digit* m)
  40117. {
  40118. return sp_1024_div_32(a, m, NULL, r);
  40119. }
  40120. /* Multiply a number by Montgomery normalizer mod modulus (prime).
  40121. *
  40122. * r The resulting Montgomery form number.
  40123. * a The number to convert.
  40124. * m The modulus (prime).
  40125. * returns MEMORY_E when memory allocation fails and MP_OKAY otherwise.
  40126. */
  40127. static int sp_1024_mod_mul_norm_32(sp_digit* r, const sp_digit* a,
  40128. const sp_digit* m)
  40129. {
  40130. sp_1024_mul_32(r, a, p1024_norm_mod);
  40131. return sp_1024_mod_32(r, r, m);
  40132. }
  40133. #ifdef WOLFCRYPT_HAVE_SAKKE
  40134. /* Create a new point.
  40135. *
  40136. * heap [in] Buffer to allocate dynamic memory from.
  40137. * sp [in] Data for point - only if not allocating.
  40138. * p [out] New point.
  40139. * returns MEMORY_E when dynamic memory allocation fails and 0 otherwise.
  40140. */
  40141. static int sp_1024_point_new_ex_32(void* heap, sp_point_1024* sp,
  40142. sp_point_1024** p)
  40143. {
  40144. int ret = MP_OKAY;
  40145. (void)heap;
  40146. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && !defined(WOLFSSL_SP_NO_MALLOC)
  40147. (void)sp;
  40148. *p = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024), heap, DYNAMIC_TYPE_ECC);
  40149. #else
  40150. *p = sp;
  40151. #endif
  40152. if (*p == NULL) {
  40153. ret = MEMORY_E;
  40154. }
  40155. return ret;
  40156. }
  40157. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && !defined(WOLFSSL_SP_NO_MALLOC)
  40158. /* Allocate memory for point and return error. */
  40159. #define sp_1024_point_new_32(heap, sp, p) sp_1024_point_new_ex_32((heap), NULL, &(p))
  40160. #else
  40161. /* Set pointer to data and return no error. */
  40162. #define sp_1024_point_new_32(heap, sp, p) sp_1024_point_new_ex_32((heap), &(sp), &(p))
  40163. #endif
  40164. #endif /* WOLFCRYPT_HAVE_SAKKE */
  40165. #ifdef WOLFCRYPT_HAVE_SAKKE
  40166. /* Free the point.
  40167. *
  40168. * p [in,out] Point to free.
  40169. * clear [in] Indicates whether to zeroize point.
  40170. * heap [in] Buffer from which dynamic memory was allocate from.
  40171. */
  40172. static void sp_1024_point_free_32(sp_point_1024* p, int clear, void* heap)
  40173. {
  40174. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && !defined(WOLFSSL_SP_NO_MALLOC)
  40175. /* If valid pointer then clear point data if requested and free data. */
  40176. if (p != NULL) {
  40177. if (clear != 0) {
  40178. XMEMSET(p, 0, sizeof(*p));
  40179. }
  40180. XFREE(p, heap, DYNAMIC_TYPE_ECC);
  40181. }
  40182. #else
  40183. /* Clear point data if requested. */
  40184. if ((p != NULL) && (clear != 0)) {
  40185. XMEMSET(p, 0, sizeof(*p));
  40186. }
  40187. #endif
  40188. (void)heap;
  40189. }
  40190. #endif /* WOLFCRYPT_HAVE_SAKKE */
  40191. /* Convert an mp_int to an array of sp_digit.
  40192. *
  40193. * r A single precision integer.
  40194. * size Maximum number of bytes to convert
  40195. * a A multi-precision integer.
  40196. */
  40197. static void sp_1024_from_mp(sp_digit* r, int size, const mp_int* a)
  40198. {
  40199. #if DIGIT_BIT == 32
  40200. int j;
  40201. XMEMCPY(r, a->dp, sizeof(sp_digit) * a->used);
  40202. for (j = a->used; j < size; j++) {
  40203. r[j] = 0;
  40204. }
  40205. #elif DIGIT_BIT > 32
  40206. int i;
  40207. int j = 0;
  40208. word32 s = 0;
  40209. r[0] = 0;
  40210. for (i = 0; i < a->used && j < size; i++) {
  40211. r[j] |= ((sp_digit)a->dp[i] << s);
  40212. r[j] &= 0xffffffff;
  40213. s = 32U - s;
  40214. if (j + 1 >= size) {
  40215. break;
  40216. }
  40217. /* lint allow cast of mismatch word32 and mp_digit */
  40218. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  40219. while ((s + 32U) <= (word32)DIGIT_BIT) {
  40220. s += 32U;
  40221. r[j] &= 0xffffffff;
  40222. if (j + 1 >= size) {
  40223. break;
  40224. }
  40225. if (s < (word32)DIGIT_BIT) {
  40226. /* lint allow cast of mismatch word32 and mp_digit */
  40227. r[++j] = (sp_digit)(a->dp[i] >> s); /*lint !e9033*/
  40228. }
  40229. else {
  40230. r[++j] = (sp_digit)0;
  40231. }
  40232. }
  40233. s = (word32)DIGIT_BIT - s;
  40234. }
  40235. for (j++; j < size; j++) {
  40236. r[j] = 0;
  40237. }
  40238. #else
  40239. int i;
  40240. int j = 0;
  40241. int s = 0;
  40242. r[0] = 0;
  40243. for (i = 0; i < a->used && j < size; i++) {
  40244. r[j] |= ((sp_digit)a->dp[i]) << s;
  40245. if (s + DIGIT_BIT >= 32) {
  40246. r[j] &= 0xffffffff;
  40247. if (j + 1 >= size) {
  40248. break;
  40249. }
  40250. s = 32 - s;
  40251. if (s == DIGIT_BIT) {
  40252. r[++j] = 0;
  40253. s = 0;
  40254. }
  40255. else {
  40256. r[++j] = a->dp[i] >> s;
  40257. s = DIGIT_BIT - s;
  40258. }
  40259. }
  40260. else {
  40261. s += DIGIT_BIT;
  40262. }
  40263. }
  40264. for (j++; j < size; j++) {
  40265. r[j] = 0;
  40266. }
  40267. #endif
  40268. }
  40269. /* Convert a point of type ecc_point to type sp_point_1024.
  40270. *
  40271. * p Point of type sp_point_1024 (result).
  40272. * pm Point of type ecc_point.
  40273. */
  40274. static void sp_1024_point_from_ecc_point_32(sp_point_1024* p,
  40275. const ecc_point* pm)
  40276. {
  40277. XMEMSET(p->x, 0, sizeof(p->x));
  40278. XMEMSET(p->y, 0, sizeof(p->y));
  40279. XMEMSET(p->z, 0, sizeof(p->z));
  40280. sp_1024_from_mp(p->x, 32, pm->x);
  40281. sp_1024_from_mp(p->y, 32, pm->y);
  40282. sp_1024_from_mp(p->z, 32, pm->z);
  40283. p->infinity = 0;
  40284. }
  40285. /* Convert an array of sp_digit to an mp_int.
  40286. *
  40287. * a A single precision integer.
  40288. * r A multi-precision integer.
  40289. */
  40290. static int sp_1024_to_mp(const sp_digit* a, mp_int* r)
  40291. {
  40292. int err;
  40293. err = mp_grow(r, (1024 + DIGIT_BIT - 1) / DIGIT_BIT);
  40294. if (err == MP_OKAY) { /*lint !e774 case where err is always MP_OKAY*/
  40295. #if DIGIT_BIT == 32
  40296. XMEMCPY(r->dp, a, sizeof(sp_digit) * 32);
  40297. r->used = 32;
  40298. mp_clamp(r);
  40299. #elif DIGIT_BIT < 32
  40300. int i;
  40301. int j = 0;
  40302. int s = 0;
  40303. r->dp[0] = 0;
  40304. for (i = 0; i < 32; i++) {
  40305. r->dp[j] |= (mp_digit)(a[i] << s);
  40306. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  40307. s = DIGIT_BIT - s;
  40308. r->dp[++j] = (mp_digit)(a[i] >> s);
  40309. while (s + DIGIT_BIT <= 32) {
  40310. s += DIGIT_BIT;
  40311. r->dp[j++] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  40312. if (s == SP_WORD_SIZE) {
  40313. r->dp[j] = 0;
  40314. }
  40315. else {
  40316. r->dp[j] = (mp_digit)(a[i] >> s);
  40317. }
  40318. }
  40319. s = 32 - s;
  40320. }
  40321. r->used = (1024 + DIGIT_BIT - 1) / DIGIT_BIT;
  40322. mp_clamp(r);
  40323. #else
  40324. int i;
  40325. int j = 0;
  40326. int s = 0;
  40327. r->dp[0] = 0;
  40328. for (i = 0; i < 32; i++) {
  40329. r->dp[j] |= ((mp_digit)a[i]) << s;
  40330. if (s + 32 >= DIGIT_BIT) {
  40331. #if DIGIT_BIT != 32 && DIGIT_BIT != 64
  40332. r->dp[j] &= ((sp_digit)1 << DIGIT_BIT) - 1;
  40333. #endif
  40334. s = DIGIT_BIT - s;
  40335. r->dp[++j] = a[i] >> s;
  40336. s = 32 - s;
  40337. }
  40338. else {
  40339. s += 32;
  40340. }
  40341. }
  40342. r->used = (1024 + DIGIT_BIT - 1) / DIGIT_BIT;
  40343. mp_clamp(r);
  40344. #endif
  40345. }
  40346. return err;
  40347. }
  40348. /* Convert a point of type sp_point_1024 to type ecc_point.
  40349. *
  40350. * p Point of type sp_point_1024.
  40351. * pm Point of type ecc_point (result).
  40352. * returns MEMORY_E when allocation of memory in ecc_point fails otherwise
  40353. * MP_OKAY.
  40354. */
  40355. static int sp_1024_point_to_ecc_point_32(const sp_point_1024* p, ecc_point* pm)
  40356. {
  40357. int err;
  40358. err = sp_1024_to_mp(p->x, pm->x);
  40359. if (err == MP_OKAY) {
  40360. err = sp_1024_to_mp(p->y, pm->y);
  40361. }
  40362. if (err == MP_OKAY) {
  40363. err = sp_1024_to_mp(p->z, pm->z);
  40364. }
  40365. return err;
  40366. }
  40367. /* Reduce the number back to 1024 bits using Montgomery reduction.
  40368. *
  40369. * a A single precision number to reduce in place.
  40370. * m The single precision number representing the modulus.
  40371. * mp The digit representing the negative inverse of m mod 2^n.
  40372. */
  40373. SP_NOINLINE static void sp_1024_mont_reduce_32(sp_digit* a, const sp_digit* m,
  40374. sp_digit mp)
  40375. {
  40376. sp_digit ca = 0;
  40377. __asm__ __volatile__ (
  40378. "mov r9, %[mp]\n\t"
  40379. "mov r12, %[m]\n\t"
  40380. "mov r10, %[a]\n\t"
  40381. "mov r4, #0\n\t"
  40382. "add r11, r10, #128\n\t"
  40383. "\n1:\n\t"
  40384. /* mu = a[i] * mp */
  40385. "mov %[mp], r9\n\t"
  40386. "ldr %[a], [r10]\n\t"
  40387. "mul %[mp], %[mp], %[a]\n\t"
  40388. "mov %[m], r12\n\t"
  40389. "add r14, r10, #120\n\t"
  40390. "\n2:\n\t"
  40391. /* a[i+j] += m[j] * mu */
  40392. "ldr %[a], [r10]\n\t"
  40393. "mov r5, #0\n\t"
  40394. /* Multiply m[j] and mu - Start */
  40395. "ldr r8, [%[m]], #4\n\t"
  40396. "umull r6, r8, %[mp], r8\n\t"
  40397. "adds %[a], %[a], r6\n\t"
  40398. "adc r5, r5, r8\n\t"
  40399. /* Multiply m[j] and mu - Done */
  40400. "adds r4, r4, %[a]\n\t"
  40401. "adc r5, r5, #0\n\t"
  40402. "str r4, [r10], #4\n\t"
  40403. /* a[i+j+1] += m[j+1] * mu */
  40404. "ldr %[a], [r10]\n\t"
  40405. "mov r4, #0\n\t"
  40406. /* Multiply m[j] and mu - Start */
  40407. "ldr r8, [%[m]], #4\n\t"
  40408. "umull r6, r8, %[mp], r8\n\t"
  40409. "adds %[a], %[a], r6\n\t"
  40410. "adc r4, r4, r8\n\t"
  40411. /* Multiply m[j] and mu - Done */
  40412. "adds r5, r5, %[a]\n\t"
  40413. "adc r4, r4, #0\n\t"
  40414. "str r5, [r10], #4\n\t"
  40415. "cmp r10, r14\n\t"
  40416. #ifdef __GNUC__
  40417. "blt 2b\n\t"
  40418. #else
  40419. "blt.n 2b\n\t"
  40420. #endif /* __GNUC__ */
  40421. /* a[i+30] += m[30] * mu */
  40422. "ldr %[a], [r10]\n\t"
  40423. "mov r5, #0\n\t"
  40424. /* Multiply m[j] and mu - Start */
  40425. "ldr r8, [%[m]], #4\n\t"
  40426. "umull r6, r8, %[mp], r8\n\t"
  40427. "adds %[a], %[a], r6\n\t"
  40428. "adc r5, r5, r8\n\t"
  40429. /* Multiply m[j] and mu - Done */
  40430. "adds r4, r4, %[a]\n\t"
  40431. "adc r5, r5, #0\n\t"
  40432. "str r4, [r10], #4\n\t"
  40433. /* a[i+31] += m[31] * mu */
  40434. "mov r4, %[ca]\n\t"
  40435. "mov %[ca], #0\n\t"
  40436. /* Multiply m[31] and mu - Start */
  40437. "ldr r8, [%[m]]\n\t"
  40438. "umull r6, r8, %[mp], r8\n\t"
  40439. "adds r5, r5, r6\n\t"
  40440. "adcs r4, r4, r8\n\t"
  40441. "adc %[ca], %[ca], #0\n\t"
  40442. /* Multiply m[31] and mu - Done */
  40443. "ldr r6, [r10]\n\t"
  40444. "ldr r8, [r10, #4]\n\t"
  40445. "adds r6, r6, r5\n\t"
  40446. "adcs r8, r8, r4\n\t"
  40447. "adc %[ca], %[ca], #0\n\t"
  40448. "str r6, [r10]\n\t"
  40449. "str r8, [r10, #4]\n\t"
  40450. /* Next word in a */
  40451. "sub r10, r10, #120\n\t"
  40452. "cmp r10, r11\n\t"
  40453. #ifdef __GNUC__
  40454. "blt 1b\n\t"
  40455. #else
  40456. "blt.n 1b\n\t"
  40457. #endif /* __GNUC__ */
  40458. "ldr r6, [%[m]]\n\t"
  40459. "subs r6, r6, r8\n\t"
  40460. "neg %[ca], %[ca]\n\t"
  40461. "sbc r6, r6, r6\n\t"
  40462. "orr %[ca], %[ca], r6\n\t"
  40463. "mov %[a], r10\n\t"
  40464. "mov %[m], r12\n\t"
  40465. : [ca] "+r" (ca), [a] "+r" (a)
  40466. : [m] "r" (m), [mp] "r" (mp)
  40467. : "memory", "r4", "r5", "r6", "r8", "r9", "r10", "r11", "r12", "r14"
  40468. );
  40469. sp_1024_cond_sub_32(a - 32, a, m, ca);
  40470. }
  40471. /* Multiply two Montgomery form numbers mod the modulus (prime).
  40472. * (r = a * b mod m)
  40473. *
  40474. * r Result of multiplication.
  40475. * a First number to multiply in Montgomery form.
  40476. * b Second number to multiply in Montgomery form.
  40477. * m Modulus (prime).
  40478. * mp Montgomery mulitplier.
  40479. */
  40480. SP_NOINLINE static void sp_1024_mont_mul_32(sp_digit* r, const sp_digit* a,
  40481. const sp_digit* b, const sp_digit* m, sp_digit mp)
  40482. {
  40483. sp_1024_mul_32(r, a, b);
  40484. sp_1024_mont_reduce_32(r, m, mp);
  40485. }
  40486. /* Square the Montgomery form number. (r = a * a mod m)
  40487. *
  40488. * r Result of squaring.
  40489. * a Number to square in Montgomery form.
  40490. * m Modulus (prime).
  40491. * mp Montgomery mulitplier.
  40492. */
  40493. SP_NOINLINE static void sp_1024_mont_sqr_32(sp_digit* r, const sp_digit* a,
  40494. const sp_digit* m, sp_digit mp)
  40495. {
  40496. sp_1024_sqr_32(r, a);
  40497. sp_1024_mont_reduce_32(r, m, mp);
  40498. }
  /* Mod-2 for the P1024 curve.
   *
   * Stored as byte pairs. sp_1024_mont_inv_32() reads the first byte of a
   * pair as a number of squarings to perform and the second byte as the
   * index of the precomputed table entry to multiply by afterwards.
   */
  static const uint8_t p1024_mod_minus_2[] = {
       6,0x06,  7,0x0f,  7,0x0b,  6,0x0c,  7,0x1e,  9,0x09,  7,0x0c,  7,0x1f,
       6,0x16,  6,0x06,  7,0x0e,  8,0x10,  6,0x03,  8,0x11,  6,0x0d,  7,0x14,
       9,0x12,  6,0x0f,  7,0x04,  9,0x0d,  6,0x00,  7,0x13,  6,0x01,  6,0x07,
       8,0x0d,  8,0x00,  6,0x06,  9,0x17,  6,0x14,  6,0x15,  6,0x11,  6,0x0b,
       9,0x0c,  6,0x1e, 13,0x14,  7,0x0e,  6,0x1d, 12,0x0a,  6,0x0b,  8,0x07,
       6,0x18,  6,0x0f,  6,0x10,  8,0x1c,  7,0x16,  7,0x02,  6,0x01,  6,0x13,
      10,0x15,  7,0x06,  8,0x14,  6,0x0c,  6,0x19,  7,0x10,  6,0x19,  6,0x19,
       9,0x16,  7,0x19,  6,0x1f,  6,0x17,  6,0x12,  8,0x02,  6,0x01,  6,0x04,
       6,0x15,  7,0x16,  6,0x04,  6,0x1f,  6,0x09,  7,0x06,  7,0x13,  7,0x09,
       6,0x0d, 10,0x18,  6,0x06,  6,0x11,  6,0x04,  6,0x01,  6,0x13,  8,0x06,
       6,0x0d,  8,0x13,  7,0x08,  6,0x08,  6,0x05,  7,0x0c,  7,0x0e,  7,0x15,
       6,0x05,  7,0x14, 10,0x19,  6,0x10,  6,0x16,  6,0x15,  7,0x1f,  6,0x14,
       6,0x0a, 10,0x11,  6,0x01,  7,0x05,  7,0x08,  8,0x0a,  7,0x1e,  7,0x1c,
       6,0x1c,  7,0x09, 10,0x18,  7,0x1c, 10,0x06,  6,0x0a,  6,0x07,  6,0x19,
       7,0x06,  6,0x0d,  7,0x0f,  7,0x0b,  7,0x05,  6,0x11,  6,0x1c,  7,0x1f,
       6,0x1e,  7,0x18,  6,0x1e,  6,0x00,  6,0x03,  6,0x02,  7,0x10,  6,0x0b,
       6,0x1b,  7,0x10,  6,0x00,  8,0x11,  7,0x1b,  6,0x18,  6,0x01,  7,0x0c,
       7,0x1d,  7,0x13,  6,0x08,  7,0x1b,  8,0x13,  7,0x16, 13,0x1d,  7,0x1f,
       6,0x0a,  6,0x01,  7,0x1f,  6,0x14,  1,0x01
  };
  40521. /* Invert the number, in Montgomery form, modulo the modulus (prime) of the
  40522. * P1024 curve. (r = 1 / a mod m)
  40523. *
  40524. * r Inverse result.
  40525. * a Number to invert.
  40526. * td Temporary data.
  40527. */
  40528. static void sp_1024_mont_inv_32(sp_digit* r, const sp_digit* a,
  40529. sp_digit* td)
  40530. {
  40531. sp_digit* t = td;
  40532. int i;
  40533. int j;
  40534. sp_digit table[32][2 * 32];
  40535. XMEMCPY(table[0], a, sizeof(sp_digit) * 32);
  40536. for (i = 1; i < 6; i++) {
  40537. sp_1024_mont_sqr_32(table[0], table[0], p1024_mod, p1024_mp_mod);
  40538. }
  40539. for (i = 1; i < 32; i++) {
  40540. sp_1024_mont_mul_32(table[i], table[i-1], a, p1024_mod, p1024_mp_mod);
  40541. }
  40542. XMEMCPY(t, table[p1024_mod_minus_2[1]], sizeof(sp_digit) * 32);
  40543. for (i = 2; i < (int)sizeof(p1024_mod_minus_2) - 2; i += 2) {
  40544. for (j = 0; j < p1024_mod_minus_2[i]; j++) {
  40545. sp_1024_mont_sqr_32(t, t, p1024_mod, p1024_mp_mod);
  40546. }
  40547. sp_1024_mont_mul_32(t, t, table[p1024_mod_minus_2[i+1]], p1024_mod,
  40548. p1024_mp_mod);
  40549. }
  40550. sp_1024_mont_sqr_32(t, t, p1024_mod, p1024_mp_mod);
  40551. sp_1024_mont_mul_32(r, t, a, p1024_mod, p1024_mp_mod);
  40552. }
  /* Normalize the values in each word to 32 bits.
   *
   * Expands to nothing in this implementation.
   *
   * a  Array of sp_digit to normalize.
   */
  #define sp_1024_norm_32(a)
  40558. /* Map the Montgomery form projective coordinate point to an affine point.
  40559. *
  40560. * r Resulting affine coordinate point.
  40561. * p Montgomery form projective coordinate point.
  40562. * t Temporary ordinate data.
  40563. */
  40564. static void sp_1024_map_32(sp_point_1024* r, const sp_point_1024* p,
  40565. sp_digit* t)
  40566. {
  40567. sp_digit* t1 = t;
  40568. sp_digit* t2 = t + 2*32;
  40569. sp_int32 n;
  40570. sp_1024_mont_inv_32(t1, p->z, t + 2*32);
  40571. sp_1024_mont_sqr_32(t2, t1, p1024_mod, p1024_mp_mod);
  40572. sp_1024_mont_mul_32(t1, t2, t1, p1024_mod, p1024_mp_mod);
  40573. /* x /= z^2 */
  40574. sp_1024_mont_mul_32(r->x, p->x, t2, p1024_mod, p1024_mp_mod);
  40575. XMEMSET(r->x + 32, 0, sizeof(r->x) / 2U);
  40576. sp_1024_mont_reduce_32(r->x, p1024_mod, p1024_mp_mod);
  40577. /* Reduce x to less than modulus */
  40578. n = sp_1024_cmp_32(r->x, p1024_mod);
  40579. sp_1024_cond_sub_32(r->x, r->x, p1024_mod, ~(n >> 31));
  40580. sp_1024_norm_32(r->x);
  40581. /* y /= z^3 */
  40582. sp_1024_mont_mul_32(r->y, p->y, t1, p1024_mod, p1024_mp_mod);
  40583. XMEMSET(r->y + 32, 0, sizeof(r->y) / 2U);
  40584. sp_1024_mont_reduce_32(r->y, p1024_mod, p1024_mp_mod);
  40585. /* Reduce y to less than modulus */
  40586. n = sp_1024_cmp_32(r->y, p1024_mod);
  40587. sp_1024_cond_sub_32(r->y, r->y, p1024_mod, ~(n >> 31));
  40588. sp_1024_norm_32(r->y);
  40589. XMEMSET(r->z, 0, sizeof(r->z) / 2);
  40590. r->z[0] = 1;
  40591. }
  40592. /* Add two Montgomery form numbers (r = a + b % m).
  40593. *
  40594. * r Result of addition.
  40595. * a First number to add in Montgomery form.
  40596. * b Second number to add in Montgomery form.
  40597. * m Modulus (prime).
  40598. */
  40599. SP_NOINLINE static void sp_1024_mont_add_32(sp_digit* r, const sp_digit* a, const sp_digit* b,
  40600. const sp_digit* m)
  40601. {
  40602. __asm__ __volatile__ (
  40603. "mov r12, #0\n\t"
  40604. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  40605. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  40606. "adds r4, r4, r8\n\t"
  40607. "adcs r5, r5, r9\n\t"
  40608. "adcs r6, r6, r10\n\t"
  40609. "adcs r7, r7, r14\n\t"
  40610. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40611. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  40612. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  40613. "adcs r4, r4, r8\n\t"
  40614. "adcs r5, r5, r9\n\t"
  40615. "adcs r6, r6, r10\n\t"
  40616. "adcs r7, r7, r14\n\t"
  40617. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40618. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  40619. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  40620. "adcs r4, r4, r8\n\t"
  40621. "adcs r5, r5, r9\n\t"
  40622. "adcs r6, r6, r10\n\t"
  40623. "adcs r7, r7, r14\n\t"
  40624. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40625. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  40626. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  40627. "adcs r4, r4, r8\n\t"
  40628. "adcs r5, r5, r9\n\t"
  40629. "adcs r6, r6, r10\n\t"
  40630. "adcs r7, r7, r14\n\t"
  40631. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40632. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  40633. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  40634. "adcs r4, r4, r8\n\t"
  40635. "adcs r5, r5, r9\n\t"
  40636. "adcs r6, r6, r10\n\t"
  40637. "adcs r7, r7, r14\n\t"
  40638. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40639. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  40640. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  40641. "adcs r4, r4, r8\n\t"
  40642. "adcs r5, r5, r9\n\t"
  40643. "adcs r6, r6, r10\n\t"
  40644. "adcs r7, r7, r14\n\t"
  40645. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40646. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  40647. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  40648. "adcs r4, r4, r8\n\t"
  40649. "adcs r5, r5, r9\n\t"
  40650. "adcs r6, r6, r10\n\t"
  40651. "adcs r7, r7, r14\n\t"
  40652. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40653. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  40654. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  40655. "adcs r4, r4, r8\n\t"
  40656. "adcs r5, r5, r9\n\t"
  40657. "adcs r6, r6, r10\n\t"
  40658. "adcs r7, r7, r14\n\t"
  40659. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40660. "ldr r14, [%[m], #124]\n\t"
  40661. "adc r12, r12, #0\n\t"
  40662. "subs r14, r14, r7\n\t"
  40663. "neg r12, r12\n\t"
  40664. "sbc r14, r14, r14\n\t"
  40665. "sub %[r], %[r], #128\n\t"
  40666. "orr r12, r14\n\t"
  40667. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40668. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40669. "and r8, r8, r12\n\t"
  40670. "and r9, r9, r12\n\t"
  40671. "and r10, r10, r12\n\t"
  40672. "and r14, r14, r12\n\t"
  40673. "subs r4, r4, r8\n\t"
  40674. "sbcs r5, r5, r9\n\t"
  40675. "sbcs r6, r6, r10\n\t"
  40676. "sbcs r7, r7, r14\n\t"
  40677. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40678. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40679. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40680. "and r8, r8, r12\n\t"
  40681. "and r9, r9, r12\n\t"
  40682. "and r10, r10, r12\n\t"
  40683. "and r14, r14, r12\n\t"
  40684. "sbcs r4, r4, r8\n\t"
  40685. "sbcs r5, r5, r9\n\t"
  40686. "sbcs r6, r6, r10\n\t"
  40687. "sbcs r7, r7, r14\n\t"
  40688. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40689. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40690. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40691. "and r8, r8, r12\n\t"
  40692. "and r9, r9, r12\n\t"
  40693. "and r10, r10, r12\n\t"
  40694. "and r14, r14, r12\n\t"
  40695. "sbcs r4, r4, r8\n\t"
  40696. "sbcs r5, r5, r9\n\t"
  40697. "sbcs r6, r6, r10\n\t"
  40698. "sbcs r7, r7, r14\n\t"
  40699. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40700. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40701. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40702. "and r8, r8, r12\n\t"
  40703. "and r9, r9, r12\n\t"
  40704. "and r10, r10, r12\n\t"
  40705. "and r14, r14, r12\n\t"
  40706. "sbcs r4, r4, r8\n\t"
  40707. "sbcs r5, r5, r9\n\t"
  40708. "sbcs r6, r6, r10\n\t"
  40709. "sbcs r7, r7, r14\n\t"
  40710. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40711. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40712. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40713. "and r8, r8, r12\n\t"
  40714. "and r9, r9, r12\n\t"
  40715. "and r10, r10, r12\n\t"
  40716. "and r14, r14, r12\n\t"
  40717. "sbcs r4, r4, r8\n\t"
  40718. "sbcs r5, r5, r9\n\t"
  40719. "sbcs r6, r6, r10\n\t"
  40720. "sbcs r7, r7, r14\n\t"
  40721. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40722. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40723. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40724. "and r8, r8, r12\n\t"
  40725. "and r9, r9, r12\n\t"
  40726. "and r10, r10, r12\n\t"
  40727. "and r14, r14, r12\n\t"
  40728. "sbcs r4, r4, r8\n\t"
  40729. "sbcs r5, r5, r9\n\t"
  40730. "sbcs r6, r6, r10\n\t"
  40731. "sbcs r7, r7, r14\n\t"
  40732. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40733. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40734. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40735. "and r8, r8, r12\n\t"
  40736. "and r9, r9, r12\n\t"
  40737. "and r10, r10, r12\n\t"
  40738. "and r14, r14, r12\n\t"
  40739. "sbcs r4, r4, r8\n\t"
  40740. "sbcs r5, r5, r9\n\t"
  40741. "sbcs r6, r6, r10\n\t"
  40742. "sbcs r7, r7, r14\n\t"
  40743. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40744. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40745. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40746. "and r8, r8, r12\n\t"
  40747. "and r9, r9, r12\n\t"
  40748. "and r10, r10, r12\n\t"
  40749. "and r14, r14, r12\n\t"
  40750. "sbcs r4, r4, r8\n\t"
  40751. "sbcs r5, r5, r9\n\t"
  40752. "sbcs r6, r6, r10\n\t"
  40753. "sbc r7, r7, r14\n\t"
  40754. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40755. "sub %[r], %[r], #128\n\t"
  40756. : [r] "+r" (r), [a] "+r" (a), [b] "+r" (b), [m] "+r" (m)
  40757. :
  40758. : "memory", "r4", "r5", "r6", "r7", "r8", "r9", "r10", "r14", "r12"
  40759. );
  40760. }
  40761. /* Double a Montgomery form number (r = a + a % m).
  40762. *
  40763. * r Result of doubling.
  40764. * a Number to double in Montgomery form.
  40765. * m Modulus (prime).
  40766. */
  40767. SP_NOINLINE static void sp_1024_mont_dbl_32(sp_digit* r, const sp_digit* a, const sp_digit* m)
  40768. {
  40769. __asm__ __volatile__ (
  40770. "mov r12, #0\n\t"
  40771. "ldm %[a]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40772. "adds r4, r4, r4\n\t"
  40773. "adcs r5, r5, r5\n\t"
  40774. "adcs r6, r6, r6\n\t"
  40775. "adcs r7, r7, r7\n\t"
  40776. "adcs r8, r8, r8\n\t"
  40777. "adcs r9, r9, r9\n\t"
  40778. "adcs r10, r10, r10\n\t"
  40779. "adcs r14, r14, r14\n\t"
  40780. "stm %[r]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40781. "ldm %[a]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40782. "adcs r4, r4, r4\n\t"
  40783. "adcs r5, r5, r5\n\t"
  40784. "adcs r6, r6, r6\n\t"
  40785. "adcs r7, r7, r7\n\t"
  40786. "adcs r8, r8, r8\n\t"
  40787. "adcs r9, r9, r9\n\t"
  40788. "adcs r10, r10, r10\n\t"
  40789. "adcs r14, r14, r14\n\t"
  40790. "stm %[r]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40791. "ldm %[a]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40792. "adcs r4, r4, r4\n\t"
  40793. "adcs r5, r5, r5\n\t"
  40794. "adcs r6, r6, r6\n\t"
  40795. "adcs r7, r7, r7\n\t"
  40796. "adcs r8, r8, r8\n\t"
  40797. "adcs r9, r9, r9\n\t"
  40798. "adcs r10, r10, r10\n\t"
  40799. "adcs r14, r14, r14\n\t"
  40800. "stm %[r]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40801. "ldm %[a]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40802. "adcs r4, r4, r4\n\t"
  40803. "adcs r5, r5, r5\n\t"
  40804. "adcs r6, r6, r6\n\t"
  40805. "adcs r7, r7, r7\n\t"
  40806. "adcs r8, r8, r8\n\t"
  40807. "adcs r9, r9, r9\n\t"
  40808. "adcs r10, r10, r10\n\t"
  40809. "adcs r14, r14, r14\n\t"
  40810. "stm %[r]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40811. "ldr r4, [%[m], #124]\n\t"
  40812. "adc r12, r12, #0\n\t"
  40813. "subs r4, r4, r14\n\t"
  40814. "neg r12, r12\n\t"
  40815. "sbc r4, r4, r4\n\t"
  40816. "sub %[r], %[r], #128\n\t"
  40817. "orr r12, r4\n\t"
  40818. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40819. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40820. "and r8, r8, r12\n\t"
  40821. "and r9, r9, r12\n\t"
  40822. "and r10, r10, r12\n\t"
  40823. "and r14, r14, r12\n\t"
  40824. "subs r4, r4, r8\n\t"
  40825. "sbcs r5, r5, r9\n\t"
  40826. "sbcs r6, r6, r10\n\t"
  40827. "sbcs r7, r7, r14\n\t"
  40828. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40829. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40830. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40831. "and r8, r8, r12\n\t"
  40832. "and r9, r9, r12\n\t"
  40833. "and r10, r10, r12\n\t"
  40834. "and r14, r14, r12\n\t"
  40835. "sbcs r4, r4, r8\n\t"
  40836. "sbcs r5, r5, r9\n\t"
  40837. "sbcs r6, r6, r10\n\t"
  40838. "sbcs r7, r7, r14\n\t"
  40839. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40840. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40841. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40842. "and r8, r8, r12\n\t"
  40843. "and r9, r9, r12\n\t"
  40844. "and r10, r10, r12\n\t"
  40845. "and r14, r14, r12\n\t"
  40846. "sbcs r4, r4, r8\n\t"
  40847. "sbcs r5, r5, r9\n\t"
  40848. "sbcs r6, r6, r10\n\t"
  40849. "sbcs r7, r7, r14\n\t"
  40850. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40851. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40852. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40853. "and r8, r8, r12\n\t"
  40854. "and r9, r9, r12\n\t"
  40855. "and r10, r10, r12\n\t"
  40856. "and r14, r14, r12\n\t"
  40857. "sbcs r4, r4, r8\n\t"
  40858. "sbcs r5, r5, r9\n\t"
  40859. "sbcs r6, r6, r10\n\t"
  40860. "sbcs r7, r7, r14\n\t"
  40861. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40862. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40863. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40864. "and r8, r8, r12\n\t"
  40865. "and r9, r9, r12\n\t"
  40866. "and r10, r10, r12\n\t"
  40867. "and r14, r14, r12\n\t"
  40868. "sbcs r4, r4, r8\n\t"
  40869. "sbcs r5, r5, r9\n\t"
  40870. "sbcs r6, r6, r10\n\t"
  40871. "sbcs r7, r7, r14\n\t"
  40872. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40873. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40874. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40875. "and r8, r8, r12\n\t"
  40876. "and r9, r9, r12\n\t"
  40877. "and r10, r10, r12\n\t"
  40878. "and r14, r14, r12\n\t"
  40879. "sbcs r4, r4, r8\n\t"
  40880. "sbcs r5, r5, r9\n\t"
  40881. "sbcs r6, r6, r10\n\t"
  40882. "sbcs r7, r7, r14\n\t"
  40883. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40884. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40885. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40886. "and r8, r8, r12\n\t"
  40887. "and r9, r9, r12\n\t"
  40888. "and r10, r10, r12\n\t"
  40889. "and r14, r14, r12\n\t"
  40890. "sbcs r4, r4, r8\n\t"
  40891. "sbcs r5, r5, r9\n\t"
  40892. "sbcs r6, r6, r10\n\t"
  40893. "sbcs r7, r7, r14\n\t"
  40894. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40895. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40896. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40897. "and r8, r8, r12\n\t"
  40898. "and r9, r9, r12\n\t"
  40899. "and r10, r10, r12\n\t"
  40900. "and r14, r14, r12\n\t"
  40901. "sbcs r4, r4, r8\n\t"
  40902. "sbcs r5, r5, r9\n\t"
  40903. "sbcs r6, r6, r10\n\t"
  40904. "sbc r7, r7, r14\n\t"
  40905. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40906. "sub %[r], %[r], #128\n\t"
  40907. : [r] "+r" (r), [a] "+r" (a), [m] "+r" (m)
  40908. :
  40909. : "memory", "r4", "r5", "r6", "r7", "r8", "r9", "r10", "r14", "r12"
  40910. );
  40911. }
  40912. /* Triple a Montgomery form number (r = a + a + a % m).
  40913. *
  40914. * r Result of Tripling.
  40915. * a Number to triple in Montgomery form.
  40916. * m Modulus (prime).
  40917. */
  40918. SP_NOINLINE static void sp_1024_mont_tpl_32(sp_digit* r, const sp_digit* a, const sp_digit* m)
  40919. {
  40920. __asm__ __volatile__ (
  40921. "mov r12, #0\n\t"
  40922. "ldm %[a]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40923. "adds r4, r4, r4\n\t"
  40924. "adcs r5, r5, r5\n\t"
  40925. "adcs r6, r6, r6\n\t"
  40926. "adcs r7, r7, r7\n\t"
  40927. "adcs r8, r8, r8\n\t"
  40928. "adcs r9, r9, r9\n\t"
  40929. "adcs r10, r10, r10\n\t"
  40930. "adcs r14, r14, r14\n\t"
  40931. "stm %[r]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40932. "ldm %[a]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40933. "adcs r4, r4, r4\n\t"
  40934. "adcs r5, r5, r5\n\t"
  40935. "adcs r6, r6, r6\n\t"
  40936. "adcs r7, r7, r7\n\t"
  40937. "adcs r8, r8, r8\n\t"
  40938. "adcs r9, r9, r9\n\t"
  40939. "adcs r10, r10, r10\n\t"
  40940. "adcs r14, r14, r14\n\t"
  40941. "stm %[r]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40942. "ldm %[a]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40943. "adcs r4, r4, r4\n\t"
  40944. "adcs r5, r5, r5\n\t"
  40945. "adcs r6, r6, r6\n\t"
  40946. "adcs r7, r7, r7\n\t"
  40947. "adcs r8, r8, r8\n\t"
  40948. "adcs r9, r9, r9\n\t"
  40949. "adcs r10, r10, r10\n\t"
  40950. "adcs r14, r14, r14\n\t"
  40951. "stm %[r]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40952. "ldm %[a]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40953. "adcs r4, r4, r4\n\t"
  40954. "adcs r5, r5, r5\n\t"
  40955. "adcs r6, r6, r6\n\t"
  40956. "adcs r7, r7, r7\n\t"
  40957. "adcs r8, r8, r8\n\t"
  40958. "adcs r9, r9, r9\n\t"
  40959. "adcs r10, r10, r10\n\t"
  40960. "adcs r14, r14, r14\n\t"
  40961. "stm %[r]!, {r4, r5, r6, r7, r8, r9, r10, r14}\n\t"
  40962. "ldr r4, [%[m], #124]\n\t"
  40963. "adc r12, r12, #0\n\t"
  40964. "subs r4, r4, r14\n\t"
  40965. "neg r12, r12\n\t"
  40966. "sbc r4, r4, r4\n\t"
  40967. "sub %[r], %[r], #128\n\t"
  40968. "orr r12, r4\n\t"
  40969. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40970. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40971. "and r8, r8, r12\n\t"
  40972. "and r9, r9, r12\n\t"
  40973. "and r10, r10, r12\n\t"
  40974. "and r14, r14, r12\n\t"
  40975. "subs r4, r4, r8\n\t"
  40976. "sbcs r5, r5, r9\n\t"
  40977. "sbcs r6, r6, r10\n\t"
  40978. "sbcs r7, r7, r14\n\t"
  40979. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40980. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40981. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40982. "and r8, r8, r12\n\t"
  40983. "and r9, r9, r12\n\t"
  40984. "and r10, r10, r12\n\t"
  40985. "and r14, r14, r12\n\t"
  40986. "sbcs r4, r4, r8\n\t"
  40987. "sbcs r5, r5, r9\n\t"
  40988. "sbcs r6, r6, r10\n\t"
  40989. "sbcs r7, r7, r14\n\t"
  40990. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  40991. "ldm %[r], {r4, r5, r6, r7}\n\t"
  40992. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  40993. "and r8, r8, r12\n\t"
  40994. "and r9, r9, r12\n\t"
  40995. "and r10, r10, r12\n\t"
  40996. "and r14, r14, r12\n\t"
  40997. "sbcs r4, r4, r8\n\t"
  40998. "sbcs r5, r5, r9\n\t"
  40999. "sbcs r6, r6, r10\n\t"
  41000. "sbcs r7, r7, r14\n\t"
  41001. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41002. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41003. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41004. "and r8, r8, r12\n\t"
  41005. "and r9, r9, r12\n\t"
  41006. "and r10, r10, r12\n\t"
  41007. "and r14, r14, r12\n\t"
  41008. "sbcs r4, r4, r8\n\t"
  41009. "sbcs r5, r5, r9\n\t"
  41010. "sbcs r6, r6, r10\n\t"
  41011. "sbcs r7, r7, r14\n\t"
  41012. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41013. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41014. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41015. "and r8, r8, r12\n\t"
  41016. "and r9, r9, r12\n\t"
  41017. "and r10, r10, r12\n\t"
  41018. "and r14, r14, r12\n\t"
  41019. "sbcs r4, r4, r8\n\t"
  41020. "sbcs r5, r5, r9\n\t"
  41021. "sbcs r6, r6, r10\n\t"
  41022. "sbcs r7, r7, r14\n\t"
  41023. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41024. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41025. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41026. "and r8, r8, r12\n\t"
  41027. "and r9, r9, r12\n\t"
  41028. "and r10, r10, r12\n\t"
  41029. "and r14, r14, r12\n\t"
  41030. "sbcs r4, r4, r8\n\t"
  41031. "sbcs r5, r5, r9\n\t"
  41032. "sbcs r6, r6, r10\n\t"
  41033. "sbcs r7, r7, r14\n\t"
  41034. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41035. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41036. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41037. "and r8, r8, r12\n\t"
  41038. "and r9, r9, r12\n\t"
  41039. "and r10, r10, r12\n\t"
  41040. "and r14, r14, r12\n\t"
  41041. "sbcs r4, r4, r8\n\t"
  41042. "sbcs r5, r5, r9\n\t"
  41043. "sbcs r6, r6, r10\n\t"
  41044. "sbcs r7, r7, r14\n\t"
  41045. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41046. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41047. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41048. "and r8, r8, r12\n\t"
  41049. "and r9, r9, r12\n\t"
  41050. "and r10, r10, r12\n\t"
  41051. "and r14, r14, r12\n\t"
  41052. "sbcs r4, r4, r8\n\t"
  41053. "sbcs r5, r5, r9\n\t"
  41054. "sbcs r6, r6, r10\n\t"
  41055. "sbc r7, r7, r14\n\t"
  41056. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41057. "sub %[r], %[r], #128\n\t"
  41058. "sub %[m], %[m], #128\n\t"
  41059. "sub %[a], %[a], #128\n\t"
  41060. "mov r12, #0\n\t"
  41061. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41062. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41063. "adds r8, r8, r4\n\t"
  41064. "adcs r9, r9, r5\n\t"
  41065. "adcs r10, r10, r6\n\t"
  41066. "adcs r14, r14, r7\n\t"
  41067. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41068. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41069. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41070. "adcs r8, r8, r4\n\t"
  41071. "adcs r9, r9, r5\n\t"
  41072. "adcs r10, r10, r6\n\t"
  41073. "adcs r14, r14, r7\n\t"
  41074. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41075. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41076. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41077. "adcs r8, r8, r4\n\t"
  41078. "adcs r9, r9, r5\n\t"
  41079. "adcs r10, r10, r6\n\t"
  41080. "adcs r14, r14, r7\n\t"
  41081. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41082. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41083. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41084. "adcs r8, r8, r4\n\t"
  41085. "adcs r9, r9, r5\n\t"
  41086. "adcs r10, r10, r6\n\t"
  41087. "adcs r14, r14, r7\n\t"
  41088. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41089. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41090. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41091. "adcs r8, r8, r4\n\t"
  41092. "adcs r9, r9, r5\n\t"
  41093. "adcs r10, r10, r6\n\t"
  41094. "adcs r14, r14, r7\n\t"
  41095. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41096. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41097. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41098. "adcs r8, r8, r4\n\t"
  41099. "adcs r9, r9, r5\n\t"
  41100. "adcs r10, r10, r6\n\t"
  41101. "adcs r14, r14, r7\n\t"
  41102. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41103. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41104. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41105. "adcs r8, r8, r4\n\t"
  41106. "adcs r9, r9, r5\n\t"
  41107. "adcs r10, r10, r6\n\t"
  41108. "adcs r14, r14, r7\n\t"
  41109. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41110. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41111. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41112. "adcs r8, r8, r4\n\t"
  41113. "adcs r9, r9, r5\n\t"
  41114. "adcs r10, r10, r6\n\t"
  41115. "adcs r14, r14, r7\n\t"
  41116. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41117. "ldr r7, [%[m], #124]\n\t"
  41118. "adc r12, r12, #0\n\t"
  41119. "subs r7, r7, r14\n\t"
  41120. "neg r12, r12\n\t"
  41121. "sbc r7, r7, r7\n\t"
  41122. "sub %[r], %[r], #128\n\t"
  41123. "orr r12, r7\n\t"
  41124. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41125. "ldm %[m]!, {r4, r5, r6, r7}\n\t"
  41126. "and r4, r4, r12\n\t"
  41127. "and r5, r5, r12\n\t"
  41128. "and r6, r6, r12\n\t"
  41129. "and r7, r7, r12\n\t"
  41130. "subs r8, r8, r4\n\t"
  41131. "sbcs r9, r9, r5\n\t"
  41132. "sbcs r10, r10, r6\n\t"
  41133. "sbcs r14, r14, r7\n\t"
  41134. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41135. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41136. "ldm %[m]!, {r4, r5, r6, r7}\n\t"
  41137. "and r4, r4, r12\n\t"
  41138. "and r5, r5, r12\n\t"
  41139. "and r6, r6, r12\n\t"
  41140. "and r7, r7, r12\n\t"
  41141. "sbcs r8, r8, r4\n\t"
  41142. "sbcs r9, r9, r5\n\t"
  41143. "sbcs r10, r10, r6\n\t"
  41144. "sbcs r14, r14, r7\n\t"
  41145. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41146. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41147. "ldm %[m]!, {r4, r5, r6, r7}\n\t"
  41148. "and r4, r4, r12\n\t"
  41149. "and r5, r5, r12\n\t"
  41150. "and r6, r6, r12\n\t"
  41151. "and r7, r7, r12\n\t"
  41152. "sbcs r8, r8, r4\n\t"
  41153. "sbcs r9, r9, r5\n\t"
  41154. "sbcs r10, r10, r6\n\t"
  41155. "sbcs r14, r14, r7\n\t"
  41156. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41157. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41158. "ldm %[m]!, {r4, r5, r6, r7}\n\t"
  41159. "and r4, r4, r12\n\t"
  41160. "and r5, r5, r12\n\t"
  41161. "and r6, r6, r12\n\t"
  41162. "and r7, r7, r12\n\t"
  41163. "sbcs r8, r8, r4\n\t"
  41164. "sbcs r9, r9, r5\n\t"
  41165. "sbcs r10, r10, r6\n\t"
  41166. "sbcs r14, r14, r7\n\t"
  41167. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41168. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41169. "ldm %[m]!, {r4, r5, r6, r7}\n\t"
  41170. "and r4, r4, r12\n\t"
  41171. "and r5, r5, r12\n\t"
  41172. "and r6, r6, r12\n\t"
  41173. "and r7, r7, r12\n\t"
  41174. "sbcs r8, r8, r4\n\t"
  41175. "sbcs r9, r9, r5\n\t"
  41176. "sbcs r10, r10, r6\n\t"
  41177. "sbcs r14, r14, r7\n\t"
  41178. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41179. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41180. "ldm %[m]!, {r4, r5, r6, r7}\n\t"
  41181. "and r4, r4, r12\n\t"
  41182. "and r5, r5, r12\n\t"
  41183. "and r6, r6, r12\n\t"
  41184. "and r7, r7, r12\n\t"
  41185. "sbcs r8, r8, r4\n\t"
  41186. "sbcs r9, r9, r5\n\t"
  41187. "sbcs r10, r10, r6\n\t"
  41188. "sbcs r14, r14, r7\n\t"
  41189. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41190. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41191. "ldm %[m]!, {r4, r5, r6, r7}\n\t"
  41192. "and r4, r4, r12\n\t"
  41193. "and r5, r5, r12\n\t"
  41194. "and r6, r6, r12\n\t"
  41195. "and r7, r7, r12\n\t"
  41196. "sbcs r8, r8, r4\n\t"
  41197. "sbcs r9, r9, r5\n\t"
  41198. "sbcs r10, r10, r6\n\t"
  41199. "sbcs r14, r14, r7\n\t"
  41200. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41201. "ldm %[r], {r8, r9, r10, r14}\n\t"
  41202. "ldm %[m]!, {r4, r5, r6, r7}\n\t"
  41203. "and r4, r4, r12\n\t"
  41204. "and r5, r5, r12\n\t"
  41205. "and r6, r6, r12\n\t"
  41206. "and r7, r7, r12\n\t"
  41207. "sbcs r8, r8, r4\n\t"
  41208. "sbcs r9, r9, r5\n\t"
  41209. "sbcs r10, r10, r6\n\t"
  41210. "sbc r14, r14, r7\n\t"
  41211. "stm %[r]!, {r8, r9, r10, r14}\n\t"
  41212. "sub %[r], %[r], #128\n\t"
  41213. : [r] "+r" (r), [a] "+r" (a), [m] "+r" (m)
  41214. :
  41215. : "memory", "r4", "r5", "r6", "r7", "r8", "r9", "r10", "r14", "r12"
  41216. );
  41217. }
  41218. /* Subtract two Montgomery form numbers (r = a - b % m).
  41219. *
  41220. * r Result of subtration.
  41221. * a Number to subtract from in Montgomery form.
  41222. * b Number to subtract with in Montgomery form.
  41223. * m Modulus (prime).
  41224. */
  41225. SP_NOINLINE static void sp_1024_mont_sub_32(sp_digit* r, const sp_digit* a, const sp_digit* b,
  41226. const sp_digit* m)
  41227. {
  41228. __asm__ __volatile__ (
  41229. "mov r12, #0\n\t"
  41230. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41231. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  41232. "subs r4, r4, r8\n\t"
  41233. "sbcs r5, r5, r9\n\t"
  41234. "sbcs r6, r6, r10\n\t"
  41235. "sbcs r7, r7, r14\n\t"
  41236. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41237. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41238. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  41239. "sbcs r4, r4, r8\n\t"
  41240. "sbcs r5, r5, r9\n\t"
  41241. "sbcs r6, r6, r10\n\t"
  41242. "sbcs r7, r7, r14\n\t"
  41243. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41244. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41245. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  41246. "sbcs r4, r4, r8\n\t"
  41247. "sbcs r5, r5, r9\n\t"
  41248. "sbcs r6, r6, r10\n\t"
  41249. "sbcs r7, r7, r14\n\t"
  41250. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41251. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41252. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  41253. "sbcs r4, r4, r8\n\t"
  41254. "sbcs r5, r5, r9\n\t"
  41255. "sbcs r6, r6, r10\n\t"
  41256. "sbcs r7, r7, r14\n\t"
  41257. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41258. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41259. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  41260. "sbcs r4, r4, r8\n\t"
  41261. "sbcs r5, r5, r9\n\t"
  41262. "sbcs r6, r6, r10\n\t"
  41263. "sbcs r7, r7, r14\n\t"
  41264. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41265. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41266. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  41267. "sbcs r4, r4, r8\n\t"
  41268. "sbcs r5, r5, r9\n\t"
  41269. "sbcs r6, r6, r10\n\t"
  41270. "sbcs r7, r7, r14\n\t"
  41271. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41272. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41273. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  41274. "sbcs r4, r4, r8\n\t"
  41275. "sbcs r5, r5, r9\n\t"
  41276. "sbcs r6, r6, r10\n\t"
  41277. "sbcs r7, r7, r14\n\t"
  41278. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41279. "ldm %[a]!, {r4, r5, r6, r7}\n\t"
  41280. "ldm %[b]!, {r8, r9, r10, r14}\n\t"
  41281. "sbcs r4, r4, r8\n\t"
  41282. "sbcs r5, r5, r9\n\t"
  41283. "sbcs r6, r6, r10\n\t"
  41284. "sbcs r7, r7, r14\n\t"
  41285. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41286. "sbc r12, r12, r12\n\t"
  41287. "sub %[r], %[r], #128\n\t"
  41288. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41289. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41290. "and r8, r8, r12\n\t"
  41291. "and r9, r9, r12\n\t"
  41292. "and r10, r10, r12\n\t"
  41293. "and r14, r14, r12\n\t"
  41294. "adds r4, r4, r8\n\t"
  41295. "adcs r5, r5, r9\n\t"
  41296. "adcs r6, r6, r10\n\t"
  41297. "adcs r7, r7, r14\n\t"
  41298. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41299. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41300. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41301. "and r8, r8, r12\n\t"
  41302. "and r9, r9, r12\n\t"
  41303. "and r10, r10, r12\n\t"
  41304. "and r14, r14, r12\n\t"
  41305. "adcs r4, r4, r8\n\t"
  41306. "adcs r5, r5, r9\n\t"
  41307. "adcs r6, r6, r10\n\t"
  41308. "adcs r7, r7, r14\n\t"
  41309. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41310. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41311. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41312. "and r8, r8, r12\n\t"
  41313. "and r9, r9, r12\n\t"
  41314. "and r10, r10, r12\n\t"
  41315. "and r14, r14, r12\n\t"
  41316. "adcs r4, r4, r8\n\t"
  41317. "adcs r5, r5, r9\n\t"
  41318. "adcs r6, r6, r10\n\t"
  41319. "adcs r7, r7, r14\n\t"
  41320. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41321. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41322. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41323. "and r8, r8, r12\n\t"
  41324. "and r9, r9, r12\n\t"
  41325. "and r10, r10, r12\n\t"
  41326. "and r14, r14, r12\n\t"
  41327. "adcs r4, r4, r8\n\t"
  41328. "adcs r5, r5, r9\n\t"
  41329. "adcs r6, r6, r10\n\t"
  41330. "adcs r7, r7, r14\n\t"
  41331. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41332. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41333. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41334. "and r8, r8, r12\n\t"
  41335. "and r9, r9, r12\n\t"
  41336. "and r10, r10, r12\n\t"
  41337. "and r14, r14, r12\n\t"
  41338. "adcs r4, r4, r8\n\t"
  41339. "adcs r5, r5, r9\n\t"
  41340. "adcs r6, r6, r10\n\t"
  41341. "adcs r7, r7, r14\n\t"
  41342. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41343. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41344. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41345. "and r8, r8, r12\n\t"
  41346. "and r9, r9, r12\n\t"
  41347. "and r10, r10, r12\n\t"
  41348. "and r14, r14, r12\n\t"
  41349. "adcs r4, r4, r8\n\t"
  41350. "adcs r5, r5, r9\n\t"
  41351. "adcs r6, r6, r10\n\t"
  41352. "adcs r7, r7, r14\n\t"
  41353. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41354. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41355. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41356. "and r8, r8, r12\n\t"
  41357. "and r9, r9, r12\n\t"
  41358. "and r10, r10, r12\n\t"
  41359. "and r14, r14, r12\n\t"
  41360. "adcs r4, r4, r8\n\t"
  41361. "adcs r5, r5, r9\n\t"
  41362. "adcs r6, r6, r10\n\t"
  41363. "adcs r7, r7, r14\n\t"
  41364. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41365. "ldm %[r], {r4, r5, r6, r7}\n\t"
  41366. "ldm %[m]!, {r8, r9, r10, r14}\n\t"
  41367. "and r8, r8, r12\n\t"
  41368. "and r9, r9, r12\n\t"
  41369. "and r10, r10, r12\n\t"
  41370. "and r14, r14, r12\n\t"
  41371. "adcs r4, r4, r8\n\t"
  41372. "adcs r5, r5, r9\n\t"
  41373. "adcs r6, r6, r10\n\t"
  41374. "adc r7, r7, r14\n\t"
  41375. "stm %[r]!, {r4, r5, r6, r7}\n\t"
  41376. "sub %[r], %[r], #128\n\t"
  41377. : [r] "+r" (r), [a] "+r" (a), [b] "+r" (b), [m] "+r" (m)
  41378. :
  41379. : "memory", "r4", "r5", "r6", "r7", "r8", "r9", "r10", "r14", "r12"
  41380. );
  41381. }
  41382. #define sp_1024_mont_sub_lower_32 sp_1024_mont_sub_32
  41383. /* Conditionally add a and b using the mask m.
  41384. * m is -1 to add and 0 when not.
  41385. *
  41386. * r A single precision number representing conditional add result.
  41387. * a A single precision number to add with.
  41388. * b A single precision number to add.
  41389. * m Mask value to apply.
  41390. */
  41391. SP_NOINLINE static sp_digit sp_1024_cond_add_32(sp_digit* r, const sp_digit* a, const sp_digit* b,
  41392. sp_digit m)
  41393. {
  41394. sp_digit c = 0;
  41395. __asm__ __volatile__ (
  41396. "mov r5, #128\n\t"
  41397. "mov r9, r5\n\t"
  41398. "mov r8, #0\n\t"
  41399. "\n1:\n\t"
  41400. "ldr r6, [%[b], r8]\n\t"
  41401. "and r6, r6, %[m]\n\t"
  41402. "adds r5, %[c], #-1\n\t"
  41403. "ldr r5, [%[a], r8]\n\t"
  41404. "adcs r5, r5, r6\n\t"
  41405. "mov %[c], #0\n\t"
  41406. "adcs %[c], %[c], %[c]\n\t"
  41407. "str r5, [%[r], r8]\n\t"
  41408. "add r8, r8, #4\n\t"
  41409. "cmp r8, r9\n\t"
  41410. #ifdef __GNUC__
  41411. "blt 1b\n\t"
  41412. #else
  41413. "blt.n 1b\n\t"
  41414. #endif /* __GNUC__ */
  41415. : [c] "+r" (c)
  41416. : [r] "r" (r), [a] "r" (a), [b] "r" (b), [m] "r" (m)
  41417. : "memory", "r5", "r6", "r8", "r9"
  41418. );
  41419. return c;
  41420. }
/* Shift the 32 word number right by one bit. (r = a >> 1)
 *
 * Bit 0 of each word a[i+1] becomes bit 31 of result word r[i]; the top bit
 * of r[31] is zero. Each word of a is loaded before the result word at the
 * same offset is stored.
 *
 * r   Result of the shift.
 * a   Number to shift.
 */
static void sp_1024_rshift1_32(sp_digit* r, const sp_digit* a)
{
    __asm__ __volatile__ (
        /* r2, r3 and r4 are used in rotation to hold consecutive words. */
        "ldr r2, [%[a]]\n\t"
        "ldr r3, [%[a], #4]\n\t"
        "lsr r2, r2, #1\n\t"
        "orr r2, r2, r3, lsl #31\n\t"
        "lsr r3, r3, #1\n\t"
        "ldr r4, [%[a], #8]\n\t"
        "str r2, [%[r], #0]\n\t"
        "orr r3, r3, r4, lsl #31\n\t"
        "lsr r4, r4, #1\n\t"
        "ldr r2, [%[a], #12]\n\t"
        "str r3, [%[r], #4]\n\t"
        "orr r4, r4, r2, lsl #31\n\t"
        "lsr r2, r2, #1\n\t"
        "ldr r3, [%[a], #16]\n\t"
        "str r4, [%[r], #8]\n\t"
        "orr r2, r2, r3, lsl #31\n\t"
        "lsr r3, r3, #1\n\t"
        "ldr r4, [%[a], #20]\n\t"
        "str r2, [%[r], #12]\n\t"
        "orr r3, r3, r4, lsl #31\n\t"
        "lsr r4, r4, #1\n\t"
        "ldr r2, [%[a], #24]\n\t"
        "str r3, [%[r], #16]\n\t"
        "orr r4, r4, r2, lsl #31\n\t"
        "lsr r2, r2, #1\n\t"
        "ldr r3, [%[a], #28]\n\t"
        "str r4, [%[r], #20]\n\t"
        "orr r2, r2, r3, lsl #31\n\t"
        "lsr r3, r3, #1\n\t"
        "ldr r4, [%[a], #32]\n\t"
        "str r2, [%[r], #24]\n\t"
        "orr r3, r3, r4, lsl #31\n\t"
        "lsr r4, r4, #1\n\t"
        "ldr r2, [%[a], #36]\n\t"
        "str r3, [%[r], #28]\n\t"
        "orr r4, r4, r2, lsl #31\n\t"
        "lsr r2, r2, #1\n\t"
        "ldr r3, [%[a], #40]\n\t"
        "str r4, [%[r], #32]\n\t"
        "orr r2, r2, r3, lsl #31\n\t"
        "lsr r3, r3, #1\n\t"
        "ldr r4, [%[a], #44]\n\t"
        "str r2, [%[r], #36]\n\t"
        "orr r3, r3, r4, lsl #31\n\t"
        "lsr r4, r4, #1\n\t"
        "ldr r2, [%[a], #48]\n\t"
        "str r3, [%[r], #40]\n\t"
        "orr r4, r4, r2, lsl #31\n\t"
        "lsr r2, r2, #1\n\t"
        "ldr r3, [%[a], #52]\n\t"
        "str r4, [%[r], #44]\n\t"
        "orr r2, r2, r3, lsl #31\n\t"
        "lsr r3, r3, #1\n\t"
        "ldr r4, [%[a], #56]\n\t"
        "str r2, [%[r], #48]\n\t"
        "orr r3, r3, r4, lsl #31\n\t"
        "lsr r4, r4, #1\n\t"
        "ldr r2, [%[a], #60]\n\t"
        "str r3, [%[r], #52]\n\t"
        "orr r4, r4, r2, lsl #31\n\t"
        "lsr r2, r2, #1\n\t"
        "ldr r3, [%[a], #64]\n\t"
        "str r4, [%[r], #56]\n\t"
        "orr r2, r2, r3, lsl #31\n\t"
        "lsr r3, r3, #1\n\t"
        "ldr r4, [%[a], #68]\n\t"
        "str r2, [%[r], #60]\n\t"
        "orr r3, r3, r4, lsl #31\n\t"
        "lsr r4, r4, #1\n\t"
        "ldr r2, [%[a], #72]\n\t"
        "str r3, [%[r], #64]\n\t"
        "orr r4, r4, r2, lsl #31\n\t"
        "lsr r2, r2, #1\n\t"
        "ldr r3, [%[a], #76]\n\t"
        "str r4, [%[r], #68]\n\t"
        "orr r2, r2, r3, lsl #31\n\t"
        "lsr r3, r3, #1\n\t"
        "ldr r4, [%[a], #80]\n\t"
        "str r2, [%[r], #72]\n\t"
        "orr r3, r3, r4, lsl #31\n\t"
        "lsr r4, r4, #1\n\t"
        "ldr r2, [%[a], #84]\n\t"
        "str r3, [%[r], #76]\n\t"
        "orr r4, r4, r2, lsl #31\n\t"
        "lsr r2, r2, #1\n\t"
        "ldr r3, [%[a], #88]\n\t"
        "str r4, [%[r], #80]\n\t"
        "orr r2, r2, r3, lsl #31\n\t"
        "lsr r3, r3, #1\n\t"
        "ldr r4, [%[a], #92]\n\t"
        "str r2, [%[r], #84]\n\t"
        "orr r3, r3, r4, lsl #31\n\t"
        "lsr r4, r4, #1\n\t"
        "ldr r2, [%[a], #96]\n\t"
        "str r3, [%[r], #88]\n\t"
        "orr r4, r4, r2, lsl #31\n\t"
        "lsr r2, r2, #1\n\t"
        "ldr r3, [%[a], #100]\n\t"
        "str r4, [%[r], #92]\n\t"
        "orr r2, r2, r3, lsl #31\n\t"
        "lsr r3, r3, #1\n\t"
        "ldr r4, [%[a], #104]\n\t"
        "str r2, [%[r], #96]\n\t"
        "orr r3, r3, r4, lsl #31\n\t"
        "lsr r4, r4, #1\n\t"
        "ldr r2, [%[a], #108]\n\t"
        "str r3, [%[r], #100]\n\t"
        "orr r4, r4, r2, lsl #31\n\t"
        "lsr r2, r2, #1\n\t"
        "ldr r3, [%[a], #112]\n\t"
        "str r4, [%[r], #104]\n\t"
        "orr r2, r2, r3, lsl #31\n\t"
        "lsr r3, r3, #1\n\t"
        "ldr r4, [%[a], #116]\n\t"
        "str r2, [%[r], #108]\n\t"
        "orr r3, r3, r4, lsl #31\n\t"
        "lsr r4, r4, #1\n\t"
        "ldr r2, [%[a], #120]\n\t"
        "str r3, [%[r], #112]\n\t"
        "orr r4, r4, r2, lsl #31\n\t"
        "lsr r2, r2, #1\n\t"
        "ldr r3, [%[a], #124]\n\t"
        "str r4, [%[r], #116]\n\t"
        "orr r2, r2, r3, lsl #31\n\t"
        /* Top word: nothing above it to shift in. */
        "lsr r3, r3, #1\n\t"
        "str r2, [%[r], #120]\n\t"
        "str r3, [%[r], #124]\n\t"
        :
        : [r] "r" (r), [a] "r" (a)
        : "memory", "r2", "r3", "r4"
    );
}
  41556. /* Divide the number by 2 mod the modulus (prime). (r = a / 2 % m)
  41557. *
  41558. * r Result of division by 2.
  41559. * a Number to divide.
  41560. * m Modulus (prime).
  41561. */
  41562. SP_NOINLINE static void sp_1024_div2_32(sp_digit* r, const sp_digit* a, const sp_digit* m)
  41563. {
  41564. sp_digit o;
  41565. o = sp_1024_cond_add_32(r, a, m, 0 - (a[0] & 1));
  41566. sp_1024_rshift1_32(r, r);
  41567. r[31] |= o << 31;
  41568. }
  41569. /* Double the Montgomery form projective point p.
  41570. *
  41571. * r Result of doubling point.
  41572. * p Point to double.
  41573. * t Temporary ordinate data.
  41574. */
  41575. #ifdef WOLFSSL_SP_NONBLOCK
  41576. typedef struct sp_1024_proj_point_dbl_32_ctx {
  41577. int state;
  41578. sp_digit* t1;
  41579. sp_digit* t2;
  41580. sp_digit* x;
  41581. sp_digit* y;
  41582. sp_digit* z;
  41583. } sp_1024_proj_point_dbl_32_ctx;
  41584. static int sp_1024_proj_point_dbl_32_nb(sp_ecc_ctx_t* sp_ctx, sp_point_1024* r, const sp_point_1024* p, sp_digit* t)
  41585. {
  41586. int err = FP_WOULDBLOCK;
  41587. sp_1024_proj_point_dbl_32_ctx* ctx = (sp_1024_proj_point_dbl_32_ctx*)sp_ctx->data;
  41588. typedef char ctx_size_test[sizeof(sp_1024_proj_point_dbl_32_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  41589. (void)sizeof(ctx_size_test);
  41590. switch (ctx->state) {
  41591. case 0:
  41592. ctx->t1 = t;
  41593. ctx->t2 = t + 2*32;
  41594. ctx->x = r->x;
  41595. ctx->y = r->y;
  41596. ctx->z = r->z;
  41597. /* Put infinity into result. */
  41598. if (r != p) {
  41599. r->infinity = p->infinity;
  41600. }
  41601. ctx->state = 1;
  41602. break;
  41603. case 1:
  41604. /* T1 = Z * Z */
  41605. sp_1024_mont_sqr_32(ctx->t1, p->z, p1024_mod, p1024_mp_mod);
  41606. ctx->state = 2;
  41607. break;
  41608. case 2:
  41609. /* Z = Y * Z */
  41610. sp_1024_mont_mul_32(ctx->z, p->y, p->z, p1024_mod, p1024_mp_mod);
  41611. ctx->state = 3;
  41612. break;
  41613. case 3:
  41614. /* Z = 2Z */
  41615. sp_1024_mont_dbl_32(ctx->z, ctx->z, p1024_mod);
  41616. ctx->state = 4;
  41617. break;
  41618. case 4:
  41619. /* T2 = X - T1 */
  41620. sp_1024_mont_sub_32(ctx->t2, p->x, ctx->t1, p1024_mod);
  41621. ctx->state = 5;
  41622. break;
  41623. case 5:
  41624. /* T1 = X + T1 */
  41625. sp_1024_mont_add_32(ctx->t1, p->x, ctx->t1, p1024_mod);
  41626. ctx->state = 6;
  41627. break;
  41628. case 6:
  41629. /* T2 = T1 * T2 */
  41630. sp_1024_mont_mul_32(ctx->t2, ctx->t1, ctx->t2, p1024_mod, p1024_mp_mod);
  41631. ctx->state = 7;
  41632. break;
  41633. case 7:
  41634. /* T1 = 3T2 */
  41635. sp_1024_mont_tpl_32(ctx->t1, ctx->t2, p1024_mod);
  41636. ctx->state = 8;
  41637. break;
  41638. case 8:
  41639. /* Y = 2Y */
  41640. sp_1024_mont_dbl_32(ctx->y, p->y, p1024_mod);
  41641. ctx->state = 9;
  41642. break;
  41643. case 9:
  41644. /* Y = Y * Y */
  41645. sp_1024_mont_sqr_32(ctx->y, ctx->y, p1024_mod, p1024_mp_mod);
  41646. ctx->state = 10;
  41647. break;
  41648. case 10:
  41649. /* T2 = Y * Y */
  41650. sp_1024_mont_sqr_32(ctx->t2, ctx->y, p1024_mod, p1024_mp_mod);
  41651. ctx->state = 11;
  41652. break;
  41653. case 11:
  41654. /* T2 = T2/2 */
  41655. sp_1024_div2_32(ctx->t2, ctx->t2, p1024_mod);
  41656. ctx->state = 12;
  41657. break;
  41658. case 12:
  41659. /* Y = Y * X */
  41660. sp_1024_mont_mul_32(ctx->y, ctx->y, p->x, p1024_mod, p1024_mp_mod);
  41661. ctx->state = 13;
  41662. break;
  41663. case 13:
  41664. /* X = T1 * T1 */
  41665. sp_1024_mont_sqr_32(ctx->x, ctx->t1, p1024_mod, p1024_mp_mod);
  41666. ctx->state = 14;
  41667. break;
  41668. case 14:
  41669. /* X = X - Y */
  41670. sp_1024_mont_sub_32(ctx->x, ctx->x, ctx->y, p1024_mod);
  41671. ctx->state = 15;
  41672. break;
  41673. case 15:
  41674. /* X = X - Y */
  41675. sp_1024_mont_sub_32(ctx->x, ctx->x, ctx->y, p1024_mod);
  41676. ctx->state = 16;
  41677. break;
  41678. case 16:
  41679. /* Y = Y - X */
  41680. sp_1024_mont_sub_lower_32(ctx->y, ctx->y, ctx->x, p1024_mod);
  41681. ctx->state = 17;
  41682. break;
  41683. case 17:
  41684. /* Y = Y * T1 */
  41685. sp_1024_mont_mul_32(ctx->y, ctx->y, ctx->t1, p1024_mod, p1024_mp_mod);
  41686. ctx->state = 18;
  41687. break;
  41688. case 18:
  41689. /* Y = Y - T2 */
  41690. sp_1024_mont_sub_32(ctx->y, ctx->y, ctx->t2, p1024_mod);
  41691. ctx->state = 19;
  41692. /* fall-through */
  41693. case 19:
  41694. err = MP_OKAY;
  41695. break;
  41696. }
  41697. if (err == MP_OKAY && ctx->state != 19) {
  41698. err = FP_WOULDBLOCK;
  41699. }
  41700. return err;
  41701. }
  41702. #endif /* WOLFSSL_SP_NONBLOCK */
  41703. static void sp_1024_proj_point_dbl_32(sp_point_1024* r, const sp_point_1024* p,
  41704. sp_digit* t)
  41705. {
  41706. sp_digit* t1 = t;
  41707. sp_digit* t2 = t + 2*32;
  41708. sp_digit* x;
  41709. sp_digit* y;
  41710. sp_digit* z;
  41711. x = r->x;
  41712. y = r->y;
  41713. z = r->z;
  41714. /* Put infinity into result. */
  41715. if (r != p) {
  41716. r->infinity = p->infinity;
  41717. }
  41718. /* T1 = Z * Z */
  41719. sp_1024_mont_sqr_32(t1, p->z, p1024_mod, p1024_mp_mod);
  41720. /* Z = Y * Z */
  41721. sp_1024_mont_mul_32(z, p->y, p->z, p1024_mod, p1024_mp_mod);
  41722. /* Z = 2Z */
  41723. sp_1024_mont_dbl_32(z, z, p1024_mod);
  41724. /* T2 = X - T1 */
  41725. sp_1024_mont_sub_32(t2, p->x, t1, p1024_mod);
  41726. /* T1 = X + T1 */
  41727. sp_1024_mont_add_32(t1, p->x, t1, p1024_mod);
  41728. /* T2 = T1 * T2 */
  41729. sp_1024_mont_mul_32(t2, t1, t2, p1024_mod, p1024_mp_mod);
  41730. /* T1 = 3T2 */
  41731. sp_1024_mont_tpl_32(t1, t2, p1024_mod);
  41732. /* Y = 2Y */
  41733. sp_1024_mont_dbl_32(y, p->y, p1024_mod);
  41734. /* Y = Y * Y */
  41735. sp_1024_mont_sqr_32(y, y, p1024_mod, p1024_mp_mod);
  41736. /* T2 = Y * Y */
  41737. sp_1024_mont_sqr_32(t2, y, p1024_mod, p1024_mp_mod);
  41738. /* T2 = T2/2 */
  41739. sp_1024_div2_32(t2, t2, p1024_mod);
  41740. /* Y = Y * X */
  41741. sp_1024_mont_mul_32(y, y, p->x, p1024_mod, p1024_mp_mod);
  41742. /* X = T1 * T1 */
  41743. sp_1024_mont_sqr_32(x, t1, p1024_mod, p1024_mp_mod);
  41744. /* X = X - Y */
  41745. sp_1024_mont_sub_32(x, x, y, p1024_mod);
  41746. /* X = X - Y */
  41747. sp_1024_mont_sub_32(x, x, y, p1024_mod);
  41748. /* Y = Y - X */
  41749. sp_1024_mont_sub_lower_32(y, y, x, p1024_mod);
  41750. /* Y = Y * T1 */
  41751. sp_1024_mont_mul_32(y, y, t1, p1024_mod, p1024_mp_mod);
  41752. /* Y = Y - T2 */
  41753. sp_1024_mont_sub_32(y, y, t2, p1024_mod);
  41754. }
  41755. #ifdef WOLFSSL_SP_SMALL
  41756. /* Sub b from a into r. (r = a - b)
  41757. *
  41758. * r A single precision integer.
  41759. * a A single precision integer.
  41760. * b A single precision integer.
  41761. */
  41762. SP_NOINLINE static sp_digit sp_1024_sub_32(sp_digit* r, const sp_digit* a,
  41763. const sp_digit* b)
  41764. {
  41765. sp_digit c = 0;
  41766. __asm__ __volatile__ (
  41767. "mov r6, %[a]\n\t"
  41768. "add r6, r6, #128\n\t"
  41769. "\n1:\n\t"
  41770. "mov r5, #0\n\t"
  41771. "subs r5, r5, %[c]\n\t"
  41772. "ldr r4, [%[a]]\n\t"
  41773. "ldr r5, [%[b]]\n\t"
  41774. "sbcs r4, r4, r5\n\t"
  41775. "str r4, [%[r]]\n\t"
  41776. "sbc %[c], %[c], %[c]\n\t"
  41777. "add %[a], %[a], #4\n\t"
  41778. "add %[b], %[b], #4\n\t"
  41779. "add %[r], %[r], #4\n\t"
  41780. "cmp %[a], r6\n\t"
  41781. #ifdef __GNUC__
  41782. "bne 1b\n\t"
  41783. #else
  41784. "bne.n 1b\n\t"
  41785. #endif /* __GNUC__ */
  41786. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  41787. :
  41788. : "memory", "r4", "r5", "r6"
  41789. );
  41790. return c;
  41791. }
  41792. #else
  41793. /* Sub b from a into r. (r = a - b)
  41794. *
  41795. * r A single precision integer.
  41796. * a A single precision integer.
  41797. * b A single precision integer.
  41798. */
  41799. SP_NOINLINE static sp_digit sp_1024_sub_32(sp_digit* r, const sp_digit* a,
  41800. const sp_digit* b)
  41801. {
  41802. sp_digit c = 0;
  41803. __asm__ __volatile__ (
  41804. "ldm %[a]!, {r4, r5}\n\t"
  41805. "ldm %[b]!, {r6, r8}\n\t"
  41806. "subs r4, r4, r6\n\t"
  41807. "sbcs r5, r5, r8\n\t"
  41808. "stm %[r]!, {r4, r5}\n\t"
  41809. "ldm %[a]!, {r4, r5}\n\t"
  41810. "ldm %[b]!, {r6, r8}\n\t"
  41811. "sbcs r4, r4, r6\n\t"
  41812. "sbcs r5, r5, r8\n\t"
  41813. "stm %[r]!, {r4, r5}\n\t"
  41814. "ldm %[a]!, {r4, r5}\n\t"
  41815. "ldm %[b]!, {r6, r8}\n\t"
  41816. "sbcs r4, r4, r6\n\t"
  41817. "sbcs r5, r5, r8\n\t"
  41818. "stm %[r]!, {r4, r5}\n\t"
  41819. "ldm %[a]!, {r4, r5}\n\t"
  41820. "ldm %[b]!, {r6, r8}\n\t"
  41821. "sbcs r4, r4, r6\n\t"
  41822. "sbcs r5, r5, r8\n\t"
  41823. "stm %[r]!, {r4, r5}\n\t"
  41824. "ldm %[a]!, {r4, r5}\n\t"
  41825. "ldm %[b]!, {r6, r8}\n\t"
  41826. "sbcs r4, r4, r6\n\t"
  41827. "sbcs r5, r5, r8\n\t"
  41828. "stm %[r]!, {r4, r5}\n\t"
  41829. "ldm %[a]!, {r4, r5}\n\t"
  41830. "ldm %[b]!, {r6, r8}\n\t"
  41831. "sbcs r4, r4, r6\n\t"
  41832. "sbcs r5, r5, r8\n\t"
  41833. "stm %[r]!, {r4, r5}\n\t"
  41834. "ldm %[a]!, {r4, r5}\n\t"
  41835. "ldm %[b]!, {r6, r8}\n\t"
  41836. "sbcs r4, r4, r6\n\t"
  41837. "sbcs r5, r5, r8\n\t"
  41838. "stm %[r]!, {r4, r5}\n\t"
  41839. "ldm %[a]!, {r4, r5}\n\t"
  41840. "ldm %[b]!, {r6, r8}\n\t"
  41841. "sbcs r4, r4, r6\n\t"
  41842. "sbcs r5, r5, r8\n\t"
  41843. "stm %[r]!, {r4, r5}\n\t"
  41844. "ldm %[a]!, {r4, r5}\n\t"
  41845. "ldm %[b]!, {r6, r8}\n\t"
  41846. "sbcs r4, r4, r6\n\t"
  41847. "sbcs r5, r5, r8\n\t"
  41848. "stm %[r]!, {r4, r5}\n\t"
  41849. "ldm %[a]!, {r4, r5}\n\t"
  41850. "ldm %[b]!, {r6, r8}\n\t"
  41851. "sbcs r4, r4, r6\n\t"
  41852. "sbcs r5, r5, r8\n\t"
  41853. "stm %[r]!, {r4, r5}\n\t"
  41854. "ldm %[a]!, {r4, r5}\n\t"
  41855. "ldm %[b]!, {r6, r8}\n\t"
  41856. "sbcs r4, r4, r6\n\t"
  41857. "sbcs r5, r5, r8\n\t"
  41858. "stm %[r]!, {r4, r5}\n\t"
  41859. "ldm %[a]!, {r4, r5}\n\t"
  41860. "ldm %[b]!, {r6, r8}\n\t"
  41861. "sbcs r4, r4, r6\n\t"
  41862. "sbcs r5, r5, r8\n\t"
  41863. "stm %[r]!, {r4, r5}\n\t"
  41864. "ldm %[a]!, {r4, r5}\n\t"
  41865. "ldm %[b]!, {r6, r8}\n\t"
  41866. "sbcs r4, r4, r6\n\t"
  41867. "sbcs r5, r5, r8\n\t"
  41868. "stm %[r]!, {r4, r5}\n\t"
  41869. "ldm %[a]!, {r4, r5}\n\t"
  41870. "ldm %[b]!, {r6, r8}\n\t"
  41871. "sbcs r4, r4, r6\n\t"
  41872. "sbcs r5, r5, r8\n\t"
  41873. "stm %[r]!, {r4, r5}\n\t"
  41874. "ldm %[a]!, {r4, r5}\n\t"
  41875. "ldm %[b]!, {r6, r8}\n\t"
  41876. "sbcs r4, r4, r6\n\t"
  41877. "sbcs r5, r5, r8\n\t"
  41878. "stm %[r]!, {r4, r5}\n\t"
  41879. "ldm %[a]!, {r4, r5}\n\t"
  41880. "ldm %[b]!, {r6, r8}\n\t"
  41881. "sbcs r4, r4, r6\n\t"
  41882. "sbcs r5, r5, r8\n\t"
  41883. "stm %[r]!, {r4, r5}\n\t"
  41884. "sbc %[c], %[c], %[c]\n\t"
  41885. : [c] "+r" (c), [r] "+r" (r), [a] "+r" (a), [b] "+r" (b)
  41886. :
  41887. : "memory", "r4", "r5", "r6", "r8"
  41888. );
  41889. return c;
  41890. }
  41891. #endif /* WOLFSSL_SP_SMALL */
  41892. /* Compare two numbers to determine if they are equal.
  41893. * Constant time implementation.
  41894. *
  41895. * a First number to compare.
  41896. * b Second number to compare.
  41897. * returns 1 when equal and 0 otherwise.
  41898. */
  41899. static int sp_1024_cmp_equal_32(const sp_digit* a, const sp_digit* b)
  41900. {
  41901. return ((a[0] ^ b[0]) | (a[1] ^ b[1]) | (a[2] ^ b[2]) |
  41902. (a[3] ^ b[3]) | (a[4] ^ b[4]) | (a[5] ^ b[5]) |
  41903. (a[6] ^ b[6]) | (a[7] ^ b[7]) | (a[8] ^ b[8]) |
  41904. (a[9] ^ b[9]) | (a[10] ^ b[10]) | (a[11] ^ b[11]) |
  41905. (a[12] ^ b[12]) | (a[13] ^ b[13]) | (a[14] ^ b[14]) |
  41906. (a[15] ^ b[15]) | (a[16] ^ b[16]) | (a[17] ^ b[17]) |
  41907. (a[18] ^ b[18]) | (a[19] ^ b[19]) | (a[20] ^ b[20]) |
  41908. (a[21] ^ b[21]) | (a[22] ^ b[22]) | (a[23] ^ b[23]) |
  41909. (a[24] ^ b[24]) | (a[25] ^ b[25]) | (a[26] ^ b[26]) |
  41910. (a[27] ^ b[27]) | (a[28] ^ b[28]) | (a[29] ^ b[29]) |
  41911. (a[30] ^ b[30]) | (a[31] ^ b[31])) == 0;
  41912. }
  41913. /* Returns 1 if the number of zero.
  41914. * Implementation is constant time.
  41915. *
  41916. * a Number to check.
  41917. * returns 1 if the number is zero and 0 otherwise.
  41918. */
  41919. static int sp_1024_iszero_32(const sp_digit* a)
  41920. {
  41921. return (a[0] | a[1] | a[2] | a[3] | a[4] | a[5] | a[6] | a[7] |
  41922. a[8] | a[9] | a[10] | a[11] | a[12] | a[13] | a[14] | a[15] |
  41923. a[16] | a[17] | a[18] | a[19] | a[20] | a[21] | a[22] | a[23] |
  41924. a[24] | a[25] | a[26] | a[27] | a[28] | a[29] | a[30] | a[31]) == 0;
  41925. }
  41926. /* Add two Montgomery form projective points.
  41927. *
  41928. * r Result of addition.
  41929. * p First point to add.
  41930. * q Second point to add.
  41931. * t Temporary ordinate data.
  41932. */
  41933. #ifdef WOLFSSL_SP_NONBLOCK
  41934. typedef struct sp_1024_proj_point_add_32_ctx {
  41935. int state;
  41936. sp_1024_proj_point_dbl_32_ctx dbl_ctx;
  41937. const sp_point_1024* ap[2];
  41938. sp_point_1024* rp[2];
  41939. sp_digit* t1;
  41940. sp_digit* t2;
  41941. sp_digit* t3;
  41942. sp_digit* t4;
  41943. sp_digit* t5;
  41944. sp_digit* t6;
  41945. sp_digit* x;
  41946. sp_digit* y;
  41947. sp_digit* z;
  41948. } sp_1024_proj_point_add_32_ctx;
  41949. static int sp_1024_proj_point_add_32_nb(sp_ecc_ctx_t* sp_ctx, sp_point_1024* r,
  41950. const sp_point_1024* p, const sp_point_1024* q, sp_digit* t)
  41951. {
  41952. int err = FP_WOULDBLOCK;
  41953. sp_1024_proj_point_add_32_ctx* ctx = (sp_1024_proj_point_add_32_ctx*)sp_ctx->data;
  41954. /* Ensure only the first point is the same as the result. */
  41955. if (q == r) {
  41956. const sp_point_1024* a = p;
  41957. p = q;
  41958. q = a;
  41959. }
  41960. typedef char ctx_size_test[sizeof(sp_1024_proj_point_add_32_ctx) >= sizeof(*sp_ctx) ? -1 : 1];
  41961. (void)sizeof(ctx_size_test);
  41962. switch (ctx->state) {
  41963. case 0: /* INIT */
  41964. ctx->t1 = t;
  41965. ctx->t2 = t + 2*32;
  41966. ctx->t3 = t + 4*32;
  41967. ctx->t4 = t + 6*32;
  41968. ctx->t5 = t + 8*32;
  41969. ctx->t6 = t + 10*32;
  41970. ctx->x = ctx->t6;
  41971. ctx->y = ctx->t1;
  41972. ctx->z = ctx->t2;
  41973. ctx->state = 1;
  41974. break;
  41975. case 1:
  41976. /* Check double */
  41977. (void)sp_1024_sub_32(ctx->t1, p1024_mod, q->y);
  41978. sp_1024_norm_32(ctx->t1);
  41979. if ((~p->infinity & ~q->infinity &
  41980. sp_1024_cmp_equal_32(p->x, q->x) & sp_1024_cmp_equal_32(p->z, q->z) &
  41981. (sp_1024_cmp_equal_32(p->y, q->y) | sp_1024_cmp_equal_32(p->y, ctx->t1))) != 0)
  41982. {
  41983. XMEMSET(&ctx->dbl_ctx, 0, sizeof(ctx->dbl_ctx));
  41984. ctx->state = 2;
  41985. }
  41986. else {
  41987. ctx->state = 3;
  41988. }
  41989. break;
  41990. case 2:
  41991. err = sp_1024_proj_point_dbl_32_nb((sp_ecc_ctx_t*)&ctx->dbl_ctx, r, p, t);
  41992. if (err == MP_OKAY)
  41993. ctx->state = 27; /* done */
  41994. break;
  41995. case 3:
  41996. {
  41997. ctx->state = 4;
  41998. break;
  41999. }
  42000. case 4:
  42001. /* U1 = X1*Z2^2 */
  42002. sp_1024_mont_sqr_32(ctx->t1, q->z, p1024_mod, p1024_mp_mod);
  42003. ctx->state = 5;
  42004. break;
  42005. case 5:
  42006. sp_1024_mont_mul_32(ctx->t3, ctx->t1, q->z, p1024_mod, p1024_mp_mod);
  42007. ctx->state = 6;
  42008. break;
  42009. case 6:
  42010. sp_1024_mont_mul_32(ctx->t1, ctx->t1, p->x, p1024_mod, p1024_mp_mod);
  42011. ctx->state = 7;
  42012. break;
  42013. case 7:
  42014. /* U2 = X2*Z1^2 */
  42015. sp_1024_mont_sqr_32(ctx->t2, p->z, p1024_mod, p1024_mp_mod);
  42016. ctx->state = 8;
  42017. break;
  42018. case 8:
  42019. sp_1024_mont_mul_32(ctx->t4, ctx->t2, p->z, p1024_mod, p1024_mp_mod);
  42020. ctx->state = 9;
  42021. break;
  42022. case 9:
  42023. sp_1024_mont_mul_32(ctx->t2, ctx->t2, q->x, p1024_mod, p1024_mp_mod);
  42024. ctx->state = 10;
  42025. break;
  42026. case 10:
  42027. /* S1 = Y1*Z2^3 */
  42028. sp_1024_mont_mul_32(ctx->t3, ctx->t3, p->y, p1024_mod, p1024_mp_mod);
  42029. ctx->state = 11;
  42030. break;
  42031. case 11:
  42032. /* S2 = Y2*Z1^3 */
  42033. sp_1024_mont_mul_32(ctx->t4, ctx->t4, q->y, p1024_mod, p1024_mp_mod);
  42034. ctx->state = 12;
  42035. break;
  42036. case 12:
  42037. /* H = U2 - U1 */
  42038. sp_1024_mont_sub_32(ctx->t2, ctx->t2, ctx->t1, p1024_mod);
  42039. ctx->state = 13;
  42040. break;
  42041. case 13:
  42042. /* R = S2 - S1 */
  42043. sp_1024_mont_sub_32(ctx->t4, ctx->t4, ctx->t3, p1024_mod);
  42044. ctx->state = 14;
  42045. break;
  42046. case 14:
  42047. /* X3 = R^2 - H^3 - 2*U1*H^2 */
  42048. sp_1024_mont_sqr_32(ctx->t5, ctx->t2, p1024_mod, p1024_mp_mod);
  42049. ctx->state = 15;
  42050. break;
  42051. case 15:
  42052. sp_1024_mont_mul_32(ctx->y, ctx->t1, ctx->t5, p1024_mod, p1024_mp_mod);
  42053. ctx->state = 16;
  42054. break;
  42055. case 16:
  42056. sp_1024_mont_mul_32(ctx->t5, ctx->t5, ctx->t2, p1024_mod, p1024_mp_mod);
  42057. ctx->state = 17;
  42058. break;
  42059. case 17:
  42060. /* Z3 = H*Z1*Z2 */
  42061. sp_1024_mont_mul_32(ctx->z, p->z, ctx->t2, p1024_mod, p1024_mp_mod);
  42062. ctx->state = 18;
  42063. break;
  42064. case 18:
  42065. sp_1024_mont_mul_32(ctx->z, ctx->z, q->z, p1024_mod, p1024_mp_mod);
  42066. ctx->state = 19;
  42067. break;
  42068. case 19:
  42069. sp_1024_mont_sqr_32(ctx->x, ctx->t4, p1024_mod, p1024_mp_mod);
  42070. ctx->state = 20;
  42071. break;
  42072. case 20:
  42073. sp_1024_mont_sub_32(ctx->x, ctx->x, ctx->t5, p1024_mod);
  42074. ctx->state = 21;
  42075. break;
  42076. case 21:
  42077. sp_1024_mont_mul_32(ctx->t5, ctx->t5, ctx->t3, p1024_mod, p1024_mp_mod);
  42078. ctx->state = 22;
  42079. break;
  42080. case 22:
  42081. sp_1024_mont_dbl_32(ctx->t3, ctx->y, p1024_mod);
  42082. ctx->state = 23;
  42083. break;
  42084. case 23:
  42085. sp_1024_mont_sub_32(ctx->x, ctx->x, ctx->t3, p1024_mod);
  42086. ctx->state = 24;
  42087. break;
  42088. case 24:
  42089. /* Y3 = R*(U1*H^2 - X3) - S1*H^3 */
  42090. sp_1024_mont_sub_lower_32(ctx->y, ctx->y, ctx->x, p1024_mod);
  42091. ctx->state = 25;
  42092. break;
  42093. case 25:
  42094. sp_1024_mont_mul_32(ctx->y, ctx->y, ctx->t4, p1024_mod, p1024_mp_mod);
  42095. ctx->state = 26;
  42096. break;
  42097. case 26:
  42098. sp_1024_mont_sub_32(ctx->y, ctx->y, ctx->t5, p1024_mod);
  42099. ctx->state = 27;
  42100. /* fall-through */
  42101. case 27:
  42102. {
  42103. int i;
  42104. sp_digit maskp = 0 - (q->infinity & (!p->infinity));
  42105. sp_digit maskq = 0 - (p->infinity & (!q->infinity));
  42106. sp_digit maskt = ~(maskp | maskq);
  42107. for (i = 0; i < 32; i++) {
  42108. r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) |
  42109. (ctx->x[i] & maskt);
  42110. }
  42111. for (i = 0; i < 32; i++) {
  42112. r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) |
  42113. (ctx->y[i] & maskt);
  42114. }
  42115. for (i = 0; i < 32; i++) {
  42116. r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) |
  42117. (ctx->z[i] & maskt);
  42118. }
  42119. r->z[0] |= p->infinity & q->infinity;
  42120. r->infinity = p->infinity & q->infinity;
  42121. err = MP_OKAY;
  42122. break;
  42123. }
  42124. }
  42125. if (err == MP_OKAY && ctx->state != 27) {
  42126. err = FP_WOULDBLOCK;
  42127. }
  42128. return err;
  42129. }
  42130. #endif /* WOLFSSL_SP_NONBLOCK */
  /* Add two Montgomery form projective points.
   *
   * If neither input is flagged as infinity and the inputs are detected to
   * coincide, sp_1024_proj_point_dbl_32() is applied to p instead. Otherwise
   * the sum is computed into temporaries and every result ordinate is chosen
   * with masks: p's value when only q is at infinity, q's value when only p
   * is at infinity, and the computed value in every other case.
   *
   * r Result of addition.
   * p First point to add.
   * q Second point to add.
   * t Temporary ordinate data; carved into six regions at 2*32-digit strides.
   */
  42131. static void sp_1024_proj_point_add_32(sp_point_1024* r,
  42132. const sp_point_1024* p, const sp_point_1024* q, sp_digit* t)
  42133. {
  42134. sp_digit* t1 = t;
  42135. sp_digit* t2 = t + 2*32;
  42136. sp_digit* t3 = t + 4*32;
  42137. sp_digit* t4 = t + 6*32;
  42138. sp_digit* t5 = t + 8*32;
  42139. sp_digit* t6 = t + 10*32;
  42140. /* Check double */
  /* t1 = p1024_mod - q->y (reduced by p1024_mod); compared with p->y below. */
  42141. (void)sp_1024_mont_sub_32(t1, p1024_mod, q->y, p1024_mod);
  42142. sp_1024_norm_32(t1);
  /* Same x and z, with p->y equal to q->y or to t1: hand over to doubling. */
  42143. if ((~p->infinity & ~q->infinity &
  42144. sp_1024_cmp_equal_32(p->x, q->x) & sp_1024_cmp_equal_32(p->z, q->z) &
  42145. (sp_1024_cmp_equal_32(p->y, q->y) | sp_1024_cmp_equal_32(p->y, t1))) != 0) {
  42146. sp_1024_proj_point_dbl_32(r, p, t);
  42147. }
  42148. else {
  42149. sp_digit maskp;
  42150. sp_digit maskq;
  42151. sp_digit maskt;
  /* Result ordinates live in temporaries: x is t6, y shares t1, z shares t2. */
  42152. sp_digit* x = t6;
  42153. sp_digit* y = t1;
  42154. sp_digit* z = t2;
  42155. int i;
  /* maskp is all ones when only q is at infinity (result is p), maskq is all
   * ones when only p is at infinity (result is q), maskt is all ones when
   * neither of those masks is set (result is the computed point). */
  42156. maskp = 0 - (q->infinity & (!p->infinity));
  42157. maskq = 0 - (p->infinity & (!q->infinity));
  42158. maskt = ~(maskp | maskq);
  42159. /* U1 = X1*Z2^2 */
  42160. sp_1024_mont_sqr_32(t1, q->z, p1024_mod, p1024_mp_mod);
  42161. sp_1024_mont_mul_32(t3, t1, q->z, p1024_mod, p1024_mp_mod);
  42162. sp_1024_mont_mul_32(t1, t1, p->x, p1024_mod, p1024_mp_mod);
  42163. /* U2 = X2*Z1^2 */
  42164. sp_1024_mont_sqr_32(t2, p->z, p1024_mod, p1024_mp_mod);
  42165. sp_1024_mont_mul_32(t4, t2, p->z, p1024_mod, p1024_mp_mod);
  42166. sp_1024_mont_mul_32(t2, t2, q->x, p1024_mod, p1024_mp_mod);
  42167. /* S1 = Y1*Z2^3 */
  42168. sp_1024_mont_mul_32(t3, t3, p->y, p1024_mod, p1024_mp_mod);
  42169. /* S2 = Y2*Z1^3 */
  42170. sp_1024_mont_mul_32(t4, t4, q->y, p1024_mod, p1024_mp_mod);
  42171. /* H = U2 - U1 */
  42172. sp_1024_mont_sub_32(t2, t2, t1, p1024_mod);
  42173. /* R = S2 - S1 */
  42174. sp_1024_mont_sub_32(t4, t4, t3, p1024_mod);
  /* H and R both zero with neither point at infinity: double p instead. */
  42175. if (~p->infinity & ~q->infinity &
  42176. sp_1024_iszero_32(t2) & sp_1024_iszero_32(t4) & maskt) {
  42177. sp_1024_proj_point_dbl_32(r, p, t);
  42178. }
  42179. else {
  42180. /* X3 = R^2 - H^3 - 2*U1*H^2 */
  42181. sp_1024_mont_sqr_32(t5, t2, p1024_mod, p1024_mp_mod);
  /* y aliases t1, so U1 is replaced by U1*H^2 here. */
  42182. sp_1024_mont_mul_32(y, t1, t5, p1024_mod, p1024_mp_mod);
  42183. sp_1024_mont_mul_32(t5, t5, t2, p1024_mod, p1024_mp_mod);
  42184. /* Z3 = H*Z1*Z2 */
  /* z aliases t2 (H), which is overwritten in place. */
  42185. sp_1024_mont_mul_32(z, p->z, t2, p1024_mod, p1024_mp_mod);
  42186. sp_1024_mont_mul_32(z, z, q->z, p1024_mod, p1024_mp_mod);
  42187. sp_1024_mont_sqr_32(x, t4, p1024_mod, p1024_mp_mod);
  42188. sp_1024_mont_sub_32(x, x, t5, p1024_mod);
  /* t5 becomes S1*H^3; t3 is then free and reused for 2*U1*H^2. */
  42189. sp_1024_mont_mul_32(t5, t5, t3, p1024_mod, p1024_mp_mod);
  42190. sp_1024_mont_dbl_32(t3, y, p1024_mod);
  42191. sp_1024_mont_sub_32(x, x, t3, p1024_mod);
  42192. /* Y3 = R*(U1*H^2 - X3) - S1*H^3 */
  42193. sp_1024_mont_sub_lower_32(y, y, x, p1024_mod);
  42194. sp_1024_mont_mul_32(y, y, t4, p1024_mod, p1024_mp_mod);
  42195. sp_1024_mont_sub_32(y, y, t5, p1024_mod);
  /* Masked selection of each ordinate: exactly one mask is all ones. */
  42196. for (i = 0; i < 32; i++) {
  42197. r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) |
  42198. (x[i] & maskt);
  42199. }
  42200. for (i = 0; i < 32; i++) {
  42201. r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) |
  42202. (y[i] & maskt);
  42203. }
  42204. for (i = 0; i < 32; i++) {
  42205. r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) |
  42206. (z[i] & maskt);
  42207. }
  /* Both inputs at infinity: set the low bit of z[0] and flag the result. */
  42208. r->z[0] |= p->infinity & q->infinity;
  42209. r->infinity = p->infinity & q->infinity;
  42210. }
  42211. }
  42212. }
  42213. /* Multiply the point by the scalar and return the result.
  42214. * If map is true then convert result to affine coordinates.
  42215. *
  42216. * Fast implementation that generates a pre-computation table.
  42217. * 4 bits of window (no sliding!).
  42218. * Uses add and double for calculating table.
  42219. * 1024 doubles.
  42220. * 268 adds.
  42221. *
  42222. * r Resulting point.
  42223. * g Point to multiply.
  42224. * k Scalar to multiply by.
  42225. * map Indicates whether to convert result to affine.
  42226. * ct Constant time required.
  42227. * heap Heap to use for allocation.
  42228. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  42229. */
  42230. static int sp_1024_ecc_mulmod_fast_32(sp_point_1024* r, const sp_point_1024* g, const sp_digit* k,
  42231. int map, int ct, void* heap)
  42232. {
  42233. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42234. sp_point_1024* t = NULL;
  42235. sp_digit* tmp = NULL;
  42236. #else
  42237. sp_point_1024 t[16 + 1];
  42238. sp_digit tmp[2 * 32 * 6];
  42239. #endif
  42240. sp_point_1024* rt = NULL;
  42241. sp_digit n;
  42242. int i;
  42243. int c;
  42244. int y;
  42245. int err = MP_OKAY;
  42246. /* Constant time used for cache attack resistance implementation. */
  42247. (void)ct;
  42248. (void)heap;
  42249. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42250. t = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024) * (16 + 1),
  42251. heap, DYNAMIC_TYPE_ECC);
  42252. if (t == NULL)
  42253. err = MEMORY_E;
  42254. if (err == MP_OKAY) {
  42255. tmp = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 32 * 6, heap,
  42256. DYNAMIC_TYPE_ECC);
  42257. if (tmp == NULL)
  42258. err = MEMORY_E;
  42259. }
  42260. #endif
  42261. if (err == MP_OKAY) {
  42262. rt = t + 16;
  42263. /* t[0] = {0, 0, 1} * norm */
  42264. XMEMSET(&t[0], 0, sizeof(t[0]));
  42265. t[0].infinity = 1;
  42266. /* t[1] = {g->x, g->y, g->z} * norm */
  42267. (void)sp_1024_mod_mul_norm_32(t[1].x, g->x, p1024_mod);
  42268. (void)sp_1024_mod_mul_norm_32(t[1].y, g->y, p1024_mod);
  42269. (void)sp_1024_mod_mul_norm_32(t[1].z, g->z, p1024_mod);
  42270. t[1].infinity = 0;
  42271. sp_1024_proj_point_dbl_32(&t[ 2], &t[ 1], tmp);
  42272. t[ 2].infinity = 0;
  42273. sp_1024_proj_point_add_32(&t[ 3], &t[ 2], &t[ 1], tmp);
  42274. t[ 3].infinity = 0;
  42275. sp_1024_proj_point_dbl_32(&t[ 4], &t[ 2], tmp);
  42276. t[ 4].infinity = 0;
  42277. sp_1024_proj_point_add_32(&t[ 5], &t[ 3], &t[ 2], tmp);
  42278. t[ 5].infinity = 0;
  42279. sp_1024_proj_point_dbl_32(&t[ 6], &t[ 3], tmp);
  42280. t[ 6].infinity = 0;
  42281. sp_1024_proj_point_add_32(&t[ 7], &t[ 4], &t[ 3], tmp);
  42282. t[ 7].infinity = 0;
  42283. sp_1024_proj_point_dbl_32(&t[ 8], &t[ 4], tmp);
  42284. t[ 8].infinity = 0;
  42285. sp_1024_proj_point_add_32(&t[ 9], &t[ 5], &t[ 4], tmp);
  42286. t[ 9].infinity = 0;
  42287. sp_1024_proj_point_dbl_32(&t[10], &t[ 5], tmp);
  42288. t[10].infinity = 0;
  42289. sp_1024_proj_point_add_32(&t[11], &t[ 6], &t[ 5], tmp);
  42290. t[11].infinity = 0;
  42291. sp_1024_proj_point_dbl_32(&t[12], &t[ 6], tmp);
  42292. t[12].infinity = 0;
  42293. sp_1024_proj_point_add_32(&t[13], &t[ 7], &t[ 6], tmp);
  42294. t[13].infinity = 0;
  42295. sp_1024_proj_point_dbl_32(&t[14], &t[ 7], tmp);
  42296. t[14].infinity = 0;
  42297. sp_1024_proj_point_add_32(&t[15], &t[ 8], &t[ 7], tmp);
  42298. t[15].infinity = 0;
  42299. i = 30;
  42300. n = k[i+1] << 0;
  42301. c = 28;
  42302. y = (int)(n >> 28);
  42303. XMEMCPY(rt, &t[y], sizeof(sp_point_1024));
  42304. n <<= 4;
  42305. for (; i>=0 || c>=4; ) {
  42306. if (c < 4) {
  42307. n |= k[i--];
  42308. c += 32;
  42309. }
  42310. y = (n >> 28) & 0xf;
  42311. n <<= 4;
  42312. c -= 4;
  42313. sp_1024_proj_point_dbl_32(rt, rt, tmp);
  42314. sp_1024_proj_point_dbl_32(rt, rt, tmp);
  42315. sp_1024_proj_point_dbl_32(rt, rt, tmp);
  42316. sp_1024_proj_point_dbl_32(rt, rt, tmp);
  42317. sp_1024_proj_point_add_32(rt, rt, &t[y], tmp);
  42318. }
  42319. if (map != 0) {
  42320. sp_1024_map_32(r, rt, tmp);
  42321. }
  42322. else {
  42323. XMEMCPY(r, rt, sizeof(sp_point_1024));
  42324. }
  42325. }
  42326. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42327. if (tmp != NULL)
  42328. #endif
  42329. {
  42330. ForceZero(tmp, sizeof(sp_digit) * 2 * 32 * 6);
  42331. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42332. XFREE(tmp, heap, DYNAMIC_TYPE_ECC);
  42333. #endif
  42334. }
  42335. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42336. if (t != NULL)
  42337. #endif
  42338. {
  42339. ForceZero(t, sizeof(sp_point_1024) * 17);
  42340. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42341. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  42342. #endif
  42343. }
  42344. return err;
  42345. }
  42346. #if defined(FP_ECC) || !defined(WOLFSSL_SP_SMALL)
  42347. #define sp_1024_mont_dbl_lower_32 sp_1024_mont_dbl_32
  42348. #define sp_1024_mont_tpl_lower_32 sp_1024_mont_tpl_32
  42349. /* Double the Montgomery form projective point p a number of times.
  42350. *
  42351. * The point is updated in place: p->x, p->y and p->z are overwritten.
  42352. * p Point to double; receives the result of the repeated doubling.
  42353. * i Number of times to double.
  42354. * t Temporary ordinate data.
  42355. */
  42356. static void sp_1024_proj_point_dbl_n_32(sp_point_1024* p, int i,
  42357. sp_digit* t)
  42358. {
  42359. sp_digit* w = t;
  42360. sp_digit* a = t + 2*32;
  42361. sp_digit* b = t + 4*32;
  42362. sp_digit* t1 = t + 6*32;
  42363. sp_digit* t2 = t + 8*32;
  42364. sp_digit* x;
  42365. sp_digit* y;
  42366. sp_digit* z;
  /* Loop counter, a copy of i.
   * NOTE(review): the reason for the volatile qualifier is not visible here. */
  42367. volatile int n = i;
  42368. x = p->x;
  42369. y = p->y;
  42370. z = p->z;
  42371. /* Y = 2*Y */
  42372. sp_1024_mont_dbl_32(y, y, p1024_mod);
  42373. /* W = Z^4 */
  42374. sp_1024_mont_sqr_32(w, z, p1024_mod, p1024_mp_mod);
  42375. sp_1024_mont_sqr_32(w, w, p1024_mod, p1024_mp_mod);
  /* Non-small builds run i-1 iterations here and finish with the unrolled
   * final doubling below, which omits the W update. Small builds run all i
   * iterations and skip the W update on the last one (n == 0). */
  42376. #ifndef WOLFSSL_SP_SMALL
  42377. while (--n > 0)
  42378. #else
  42379. while (--n >= 0)
  42380. #endif
  42381. {
  42382. /* A = 3*(X^2 - W) */
  42383. sp_1024_mont_sqr_32(t1, x, p1024_mod, p1024_mp_mod);
  42384. sp_1024_mont_sub_32(t1, t1, w, p1024_mod);
  42385. sp_1024_mont_tpl_lower_32(a, t1, p1024_mod);
  42386. /* B = X*Y^2 */
  42387. sp_1024_mont_sqr_32(t1, y, p1024_mod, p1024_mp_mod);
  42388. sp_1024_mont_mul_32(b, t1, x, p1024_mod, p1024_mp_mod);
  42389. /* X = A^2 - 2B */
  42390. sp_1024_mont_sqr_32(x, a, p1024_mod, p1024_mp_mod);
  42391. sp_1024_mont_dbl_32(t2, b, p1024_mod);
  42392. sp_1024_mont_sub_32(x, x, t2, p1024_mod);
  42393. /* b = 2.(B - X) */
  42394. sp_1024_mont_sub_lower_32(t2, b, x, p1024_mod);
  42395. sp_1024_mont_dbl_lower_32(b, t2, p1024_mod);
  42396. /* Z = Z*Y */
  42397. sp_1024_mont_mul_32(z, z, y, p1024_mod, p1024_mp_mod);
  42398. /* t1 = Y^4 */
  /* t1 still holds Y^2 from the B step, so one squaring gives Y^4. */
  42399. sp_1024_mont_sqr_32(t1, t1, p1024_mod, p1024_mp_mod);
  42400. #ifdef WOLFSSL_SP_SMALL
  42401. if (n != 0)
  42402. #endif
  42403. {
  42404. /* W = W*Y^4 */
  42405. sp_1024_mont_mul_32(w, w, t1, p1024_mod, p1024_mp_mod);
  42406. }
  42407. /* y = 2*A*(B - X) - Y^4 */
  42408. sp_1024_mont_mul_32(y, b, a, p1024_mod, p1024_mp_mod);
  42409. sp_1024_mont_sub_32(y, y, t1, p1024_mod);
  42410. }
  /* Final doubling for non-small builds: same steps as the loop body, minus
   * the W update. */
  42411. #ifndef WOLFSSL_SP_SMALL
  42412. /* A = 3*(X^2 - W) */
  42413. sp_1024_mont_sqr_32(t1, x, p1024_mod, p1024_mp_mod);
  42414. sp_1024_mont_sub_32(t1, t1, w, p1024_mod);
  42415. sp_1024_mont_tpl_lower_32(a, t1, p1024_mod);
  42416. /* B = X*Y^2 */
  42417. sp_1024_mont_sqr_32(t1, y, p1024_mod, p1024_mp_mod);
  42418. sp_1024_mont_mul_32(b, t1, x, p1024_mod, p1024_mp_mod);
  42419. /* X = A^2 - 2B */
  42420. sp_1024_mont_sqr_32(x, a, p1024_mod, p1024_mp_mod);
  42421. sp_1024_mont_dbl_32(t2, b, p1024_mod);
  42422. sp_1024_mont_sub_32(x, x, t2, p1024_mod);
  42423. /* b = 2.(B - X) */
  42424. sp_1024_mont_sub_lower_32(t2, b, x, p1024_mod);
  42425. sp_1024_mont_dbl_lower_32(b, t2, p1024_mod);
  42426. /* Z = Z*Y */
  42427. sp_1024_mont_mul_32(z, z, y, p1024_mod, p1024_mp_mod);
  42428. /* t1 = Y^4 */
  42429. sp_1024_mont_sqr_32(t1, t1, p1024_mod, p1024_mp_mod);
  42430. /* y = 2*A*(B - X) - Y^4 */
  42431. sp_1024_mont_mul_32(y, b, a, p1024_mod, p1024_mp_mod);
  42432. sp_1024_mont_sub_32(y, y, t1, p1024_mod);
  42433. #endif
  42434. /* Y = Y/2 */
  /* Undoes the initial Y = 2*Y scaling applied before the loop. */
  42435. sp_1024_div2_32(y, y, p1024_mod);
  42436. }
  42437. /* Convert the projective point to affine.
  42438. * Ordinates are in Montgomery form.
  42439. *
  42440. * a Point to convert.
  42441. * t Temporary data.
  42442. */
  42443. static void sp_1024_proj_to_affine_32(sp_point_1024* a, sp_digit* t)
  42444. {
  42445. sp_digit* t1 = t;
  42446. sp_digit* t2 = t + 2 * 32;
  42447. sp_digit* tmp = t + 4 * 32;
  42448. sp_1024_mont_inv_32(t1, a->z, tmp);
  42449. sp_1024_mont_sqr_32(t2, t1, p1024_mod, p1024_mp_mod);
  42450. sp_1024_mont_mul_32(t1, t2, t1, p1024_mod, p1024_mp_mod);
  42451. sp_1024_mont_mul_32(a->x, a->x, t2, p1024_mod, p1024_mp_mod);
  42452. sp_1024_mont_mul_32(a->y, a->y, t1, p1024_mod, p1024_mp_mod);
  42453. XMEMCPY(a->z, p1024_norm_mod, sizeof(p1024_norm_mod));
  42454. }
  42455. #endif /* FP_ECC || !WOLFSSL_SP_SMALL */
  42456. /* A table entry for pre-computed points.
   * Only x and y are stored: sp_1024_gen_stripe_table_32() runs
   * sp_1024_proj_to_affine_32() on each point before copying it in. */
  42457. typedef struct sp_table_entry_1024 {
  /* X ordinate (32 digits). */
  42458. sp_digit x[32];
  /* Y ordinate (32 digits). */
  42459. sp_digit y[32];
  42460. } sp_table_entry_1024;
  42461. #ifdef FP_ECC
  42462. #endif /* FP_ECC */
  42463. /* Add two Montgomery form projective points. The second point has a z value of
  42464. * one (callers in this file set q->z to p1024_norm_mod), so Z2 drops out.
  42465. * Only the first point can be the same pointer as the result point.
  42466. *
  42467. * r Result of addition.
  42468. * p First point to add.
  42469. * q Second point to add.
  42470. * t Temporary ordinate data.
  42471. */
  42472. static void sp_1024_proj_point_add_qz1_32(sp_point_1024* r, const sp_point_1024* p,
  42473. const sp_point_1024* q, sp_digit* t)
  42474. {
  42475. sp_digit* t1 = t;
  42476. sp_digit* t2 = t + 2*32;
  42477. sp_digit* t3 = t + 4*32;
  42478. sp_digit* t4 = t + 6*32;
  42479. sp_digit* t5 = t + 8*32;
  42480. sp_digit* t6 = t + 10*32;
  42481. /* Check double */
  /* t1 = p1024_mod - q->y (reduced by p1024_mod); compared with p->y below. */
  42482. (void)sp_1024_mont_sub_32(t1, p1024_mod, q->y, p1024_mod);
  42483. sp_1024_norm_32(t1);
  /* Same x and z, with p->y equal to q->y or to t1: hand over to doubling. */
  42484. if ((~p->infinity & ~q->infinity &
  42485. sp_1024_cmp_equal_32(p->x, q->x) & sp_1024_cmp_equal_32(p->z, q->z) &
  42486. (sp_1024_cmp_equal_32(p->y, q->y) | sp_1024_cmp_equal_32(p->y, t1))) != 0) {
  42487. sp_1024_proj_point_dbl_32(r, p, t);
  42488. }
  42489. else {
  42490. sp_digit maskp;
  42491. sp_digit maskq;
  42492. sp_digit maskt;
  /* Result ordinates live in temporaries: x shares t2, y shares t5, z is t6. */
  42493. sp_digit* x = t2;
  42494. sp_digit* y = t5;
  42495. sp_digit* z = t6;
  42496. int i;
  42497. /* U2 = X2*Z1^2 */
  42498. sp_1024_mont_sqr_32(t2, p->z, p1024_mod, p1024_mp_mod);
  42499. sp_1024_mont_mul_32(t4, t2, p->z, p1024_mod, p1024_mp_mod);
  42500. sp_1024_mont_mul_32(t2, t2, q->x, p1024_mod, p1024_mp_mod);
  42501. /* S2 = Y2*Z1^3 */
  42502. sp_1024_mont_mul_32(t4, t4, q->y, p1024_mod, p1024_mp_mod);
  42503. /* H = U2 - X1 */
  42504. sp_1024_mont_sub_32(t2, t2, p->x, p1024_mod);
  42505. /* R = S2 - Y1 */
  42506. sp_1024_mont_sub_32(t4, t4, p->y, p1024_mod);
  42507. /* Z3 = H*Z1 */
  42508. sp_1024_mont_mul_32(z, p->z, t2, p1024_mod, p1024_mp_mod);
  42509. /* X3 = R^2 - H^3 - 2*X1*H^2 */
  42510. sp_1024_mont_sqr_32(t1, t4, p1024_mod, p1024_mp_mod);
  42511. sp_1024_mont_sqr_32(t5, t2, p1024_mod, p1024_mp_mod);
  42512. sp_1024_mont_mul_32(t3, p->x, t5, p1024_mod, p1024_mp_mod);
  42513. sp_1024_mont_mul_32(t5, t5, t2, p1024_mod, p1024_mp_mod);
  /* x aliases t2; H is overwritten here, after its last use just above. */
  42514. sp_1024_mont_sub_32(x, t1, t5, p1024_mod);
  42515. sp_1024_mont_dbl_32(t1, t3, p1024_mod);
  42516. sp_1024_mont_sub_32(x, x, t1, p1024_mod);
  42517. /* Y3 = R*(X1*H^2 - X3) - Y1*H^3 */
  42518. sp_1024_mont_sub_lower_32(t3, t3, x, p1024_mod);
  42519. sp_1024_mont_mul_32(t3, t3, t4, p1024_mod, p1024_mp_mod);
  42520. sp_1024_mont_mul_32(t5, t5, p->y, p1024_mod, p1024_mp_mod);
  42521. sp_1024_mont_sub_32(y, t3, t5, p1024_mod);
  /* maskp is all ones when only q is at infinity (result is p), maskq is all
   * ones when only p is at infinity (result is q), maskt is all ones when
   * neither of those masks is set (result is the computed point). */
  42522. maskp = 0 - (q->infinity & (!p->infinity));
  42523. maskq = 0 - (p->infinity & (!q->infinity));
  42524. maskt = ~(maskp | maskq);
  42525. for (i = 0; i < 32; i++) {
  42526. r->x[i] = (p->x[i] & maskp) | (q->x[i] & maskq) | (x[i] & maskt);
  42527. }
  42528. for (i = 0; i < 32; i++) {
  42529. r->y[i] = (p->y[i] & maskp) | (q->y[i] & maskq) | (y[i] & maskt);
  42530. }
  42531. for (i = 0; i < 32; i++) {
  42532. r->z[i] = (p->z[i] & maskp) | (q->z[i] & maskq) | (z[i] & maskt);
  42533. }
  /* Both inputs at infinity: set the low bit of z[0] and flag the result. */
  42534. r->z[0] |= p->infinity & q->infinity;
  42535. r->infinity = p->infinity & q->infinity;
  42536. }
  42537. }
  42538. #ifdef WOLFSSL_SP_SMALL
  42539. #if defined(FP_ECC) || !defined(WOLFSSL_SP_SMALL)
  42540. /* Generate the pre-computed table of points for the base point.
  42541. *
  42542. * width = 4
  42543. * 16 entries
  42544. * 256 bits between
  42545. *
  42546. * a The base point.
  42547. * table Place to store generated point data.
  42548. * tmp Temporary data.
  42549. * heap Heap to use for allocation.
  42550. */
  42551. static int sp_1024_gen_stripe_table_32(const sp_point_1024* a,
  42552. sp_table_entry_1024* table, sp_digit* tmp, void* heap)
  42553. {
  42554. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42555. sp_point_1024* t = NULL;
  42556. #else
  42557. sp_point_1024 t[3];
  42558. #endif
  42559. sp_point_1024* s1 = NULL;
  42560. sp_point_1024* s2 = NULL;
  42561. int i;
  42562. int j;
  42563. int err = MP_OKAY;
  42564. (void)heap;
  42565. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42566. t = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024) * 3, heap,
  42567. DYNAMIC_TYPE_ECC);
  42568. if (t == NULL)
  42569. err = MEMORY_E;
  42570. #endif
  42571. if (err == MP_OKAY) {
  42572. s1 = t + 1;
  42573. s2 = t + 2;
  42574. err = sp_1024_mod_mul_norm_32(t->x, a->x, p1024_mod);
  42575. }
  42576. if (err == MP_OKAY) {
  42577. err = sp_1024_mod_mul_norm_32(t->y, a->y, p1024_mod);
  42578. }
  42579. if (err == MP_OKAY) {
  42580. err = sp_1024_mod_mul_norm_32(t->z, a->z, p1024_mod);
  42581. }
  42582. if (err == MP_OKAY) {
  42583. t->infinity = 0;
  42584. sp_1024_proj_to_affine_32(t, tmp);
  42585. XMEMCPY(s1->z, p1024_norm_mod, sizeof(p1024_norm_mod));
  42586. s1->infinity = 0;
  42587. XMEMCPY(s2->z, p1024_norm_mod, sizeof(p1024_norm_mod));
  42588. s2->infinity = 0;
  42589. /* table[0] = {0, 0, infinity} */
  42590. XMEMSET(&table[0], 0, sizeof(sp_table_entry_1024));
  42591. /* table[1] = Affine version of 'a' in Montgomery form */
  42592. XMEMCPY(table[1].x, t->x, sizeof(table->x));
  42593. XMEMCPY(table[1].y, t->y, sizeof(table->y));
  42594. for (i=1; i<4; i++) {
  42595. sp_1024_proj_point_dbl_n_32(t, 256, tmp);
  42596. sp_1024_proj_to_affine_32(t, tmp);
  42597. XMEMCPY(table[1<<i].x, t->x, sizeof(table->x));
  42598. XMEMCPY(table[1<<i].y, t->y, sizeof(table->y));
  42599. }
  42600. for (i=1; i<4; i++) {
  42601. XMEMCPY(s1->x, table[1<<i].x, sizeof(table->x));
  42602. XMEMCPY(s1->y, table[1<<i].y, sizeof(table->y));
  42603. for (j=(1<<i)+1; j<(1<<(i+1)); j++) {
  42604. XMEMCPY(s2->x, table[j-(1<<i)].x, sizeof(table->x));
  42605. XMEMCPY(s2->y, table[j-(1<<i)].y, sizeof(table->y));
  42606. sp_1024_proj_point_add_qz1_32(t, s1, s2, tmp);
  42607. sp_1024_proj_to_affine_32(t, tmp);
  42608. XMEMCPY(table[j].x, t->x, sizeof(table->x));
  42609. XMEMCPY(table[j].y, t->y, sizeof(table->y));
  42610. }
  42611. }
  42612. }
  42613. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42614. if (t != NULL)
  42615. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  42616. #endif
  42617. return err;
  42618. }
  42619. #endif /* FP_ECC || !WOLFSSL_SP_SMALL */
  42620. /* Multiply the point by the scalar and return the result.
  42621. * If map is true then convert result to affine coordinates.
  42622. *
  42623. * Stripe implementation.
  42624. * Pre-generated: 2^0, 2^256, ...
  42625. * Pre-generated: products of all combinations of above.
  42626. * 4 doubles and adds (with qz=1)
  42627. *
  42628. * r Resulting point.
  42629. * k Scalar to multiply by.
  42630. * table Pre-computed table.
  42631. * map Indicates whether to convert result to affine.
  42632. * ct Constant time required.
  42633. * heap Heap to use for allocation.
  42634. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  42635. */
  42636. static int sp_1024_ecc_mulmod_stripe_32(sp_point_1024* r, const sp_point_1024* g,
  42637. const sp_table_entry_1024* table, const sp_digit* k, int map,
  42638. int ct, void* heap)
  42639. {
  42640. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42641. sp_point_1024* rt = NULL;
  42642. sp_digit* t = NULL;
  42643. #else
  42644. sp_point_1024 rt[2];
  42645. sp_digit t[2 * 32 * 6];
  42646. #endif
  42647. sp_point_1024* p = NULL;
  42648. int i;
  42649. int j;
  42650. int y;
  42651. int x;
  42652. int err = MP_OKAY;
  42653. (void)g;
  42654. /* Constant time used for cache attack resistance implementation. */
  42655. (void)ct;
  42656. (void)heap;
  42657. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42658. rt = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024) * 2, heap,
  42659. DYNAMIC_TYPE_ECC);
  42660. if (rt == NULL)
  42661. err = MEMORY_E;
  42662. if (err == MP_OKAY) {
  42663. t = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 32 * 6, heap,
  42664. DYNAMIC_TYPE_ECC);
  42665. if (t == NULL)
  42666. err = MEMORY_E;
  42667. }
  42668. #endif
  42669. if (err == MP_OKAY) {
  42670. p = rt + 1;
  42671. XMEMCPY(p->z, p1024_norm_mod, sizeof(p1024_norm_mod));
  42672. XMEMCPY(rt->z, p1024_norm_mod, sizeof(p1024_norm_mod));
  42673. y = 0;
  42674. x = 255;
  42675. for (j=0; j<4; j++) {
  42676. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  42677. x += 256;
  42678. }
  42679. XMEMCPY(rt->x, table[y].x, sizeof(table[y].x));
  42680. XMEMCPY(rt->y, table[y].y, sizeof(table[y].y));
  42681. rt->infinity = !y;
  42682. for (i=254; i>=0; i--) {
  42683. y = 0;
  42684. x = i;
  42685. for (j=0; j<4; j++) {
  42686. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  42687. x += 256;
  42688. }
  42689. sp_1024_proj_point_dbl_32(rt, rt, t);
  42690. XMEMCPY(p->x, table[y].x, sizeof(table[y].x));
  42691. XMEMCPY(p->y, table[y].y, sizeof(table[y].y));
  42692. p->infinity = !y;
  42693. sp_1024_proj_point_add_qz1_32(rt, rt, p, t);
  42694. }
  42695. if (map != 0) {
  42696. sp_1024_map_32(r, rt, t);
  42697. }
  42698. else {
  42699. XMEMCPY(r, rt, sizeof(sp_point_1024));
  42700. }
  42701. }
  42702. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42703. if (t != NULL)
  42704. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  42705. if (rt != NULL)
  42706. XFREE(rt, heap, DYNAMIC_TYPE_ECC);
  42707. #endif
  42708. return err;
  42709. }
  42710. #ifdef FP_ECC
  /* Number of points whose tables are kept in the cache, unless overridden. */
  42711. #ifndef FP_ENTRIES
  42712. #define FP_ENTRIES 16
  42713. #endif
  42714. /* Cache entry - holds precomputation tables for a point. */
  42715. typedef struct sp_cache_1024_t {
  42716. /* X ordinate of point that table was generated from. */
  42717. sp_digit x[32];
  42718. /* Y ordinate of point that table was generated from. */
  42719. sp_digit y[32];
  42720. /* Precomputation table for point. */
  42721. sp_table_entry_1024 table[16];
  42722. /* Use count of the point: set to 1 when the entry is claimed and
   * incremented on each lookup hit in sp_ecc_get_cache_1024(). */
  42723. uint32_t cnt;
  42724. /* Point and table set in entry. */
  42725. int set;
  42726. } sp_cache_1024_t;
  42727. /* Cache of tables. */
  42728. static THREAD_LS_T sp_cache_1024_t sp_cache_1024[FP_ENTRIES];
  42729. /* Index of the entry returned by the most recent lookup (-1 before any). */
  42730. static THREAD_LS_T int sp_cache_1024_last = -1;
  42731. /* Cache has been initialized. */
  42732. static THREAD_LS_T int sp_cache_1024_inited = 0;
  42733. #ifndef HAVE_THREAD_LS
  /* Non-zero once sp_cache_1024_lock has been initialized; set by
   * sp_1024_ecc_mulmod_32(). */
  42734. static volatile int initCacheMutex_1024 = 0;
  /* Lock taken by sp_1024_ecc_mulmod_32() around cache lookup and table
   * generation. */
  42735. static wolfSSL_Mutex sp_cache_1024_lock;
  42736. #endif
  42737. /* Get the cache entry for the point.
  42738. *
  42739. * g [in] Point scalar multipling.
  42740. * cache [out] Cache table to use.
  42741. */
  42742. static void sp_ecc_get_cache_1024(const sp_point_1024* g, sp_cache_1024_t** cache)
  42743. {
  42744. int i;
  42745. int j;
  42746. uint32_t least;
  42747. if (sp_cache_1024_inited == 0) {
  42748. for (i=0; i<FP_ENTRIES; i++) {
  42749. sp_cache_1024[i].set = 0;
  42750. }
  42751. sp_cache_1024_inited = 1;
  42752. }
  42753. /* Compare point with those in cache. */
  42754. for (i=0; i<FP_ENTRIES; i++) {
  42755. if (!sp_cache_1024[i].set)
  42756. continue;
  42757. if (sp_1024_cmp_equal_32(g->x, sp_cache_1024[i].x) &
  42758. sp_1024_cmp_equal_32(g->y, sp_cache_1024[i].y)) {
  42759. sp_cache_1024[i].cnt++;
  42760. break;
  42761. }
  42762. }
  42763. /* No match. */
  42764. if (i == FP_ENTRIES) {
  42765. /* Find empty entry. */
  42766. i = (sp_cache_1024_last + 1) % FP_ENTRIES;
  42767. for (; i != sp_cache_1024_last; i=(i+1)%FP_ENTRIES) {
  42768. if (!sp_cache_1024[i].set) {
  42769. break;
  42770. }
  42771. }
  42772. /* Evict least used. */
  42773. if (i == sp_cache_1024_last) {
  42774. least = sp_cache_1024[0].cnt;
  42775. for (j=1; j<FP_ENTRIES; j++) {
  42776. if (sp_cache_1024[j].cnt < least) {
  42777. i = j;
  42778. least = sp_cache_1024[i].cnt;
  42779. }
  42780. }
  42781. }
  42782. XMEMCPY(sp_cache_1024[i].x, g->x, sizeof(sp_cache_1024[i].x));
  42783. XMEMCPY(sp_cache_1024[i].y, g->y, sizeof(sp_cache_1024[i].y));
  42784. sp_cache_1024[i].set = 1;
  42785. sp_cache_1024[i].cnt = 1;
  42786. }
  42787. *cache = &sp_cache_1024[i];
  42788. sp_cache_1024_last = i;
  42789. }
  42790. #endif /* FP_ECC */
  42791. /* Multiply the base point of P1024 by the scalar and return the result.
  42792. * If map is true then convert result to affine coordinates.
  42793. *
  42794. * r Resulting point.
  42795. * g Point to multiply.
  42796. * k Scalar to multiply by.
  42797. * map Indicates whether to convert result to affine.
  42798. * ct Constant time required.
  42799. * heap Heap to use for allocation.
  42800. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  42801. */
  42802. static int sp_1024_ecc_mulmod_32(sp_point_1024* r, const sp_point_1024* g, const sp_digit* k,
  42803. int map, int ct, void* heap)
  42804. {
  42805. #ifndef FP_ECC
  42806. return sp_1024_ecc_mulmod_fast_32(r, g, k, map, ct, heap);
  42807. #else
  42808. sp_digit tmp[2 * 32 * 6];
  42809. sp_cache_1024_t* cache;
  42810. int err = MP_OKAY;
  42811. #ifndef HAVE_THREAD_LS
  42812. if (initCacheMutex_1024 == 0) {
  42813. wc_InitMutex(&sp_cache_1024_lock);
  42814. initCacheMutex_1024 = 1;
  42815. }
  42816. if (wc_LockMutex(&sp_cache_1024_lock) != 0)
  42817. err = BAD_MUTEX_E;
  42818. #endif /* HAVE_THREAD_LS */
  42819. if (err == MP_OKAY) {
  42820. sp_ecc_get_cache_1024(g, &cache);
  42821. if (cache->cnt == 2)
  42822. sp_1024_gen_stripe_table_32(g, cache->table, tmp, heap);
  42823. #ifndef HAVE_THREAD_LS
  42824. wc_UnLockMutex(&sp_cache_1024_lock);
  42825. #endif /* HAVE_THREAD_LS */
  42826. if (cache->cnt < 2) {
  42827. err = sp_1024_ecc_mulmod_fast_32(r, g, k, map, ct, heap);
  42828. }
  42829. else {
  42830. err = sp_1024_ecc_mulmod_stripe_32(r, g, cache->table, k,
  42831. map, ct, heap);
  42832. }
  42833. }
  42834. return err;
  42835. #endif
  42836. }
  42837. #else
  42838. #if defined(FP_ECC) || !defined(WOLFSSL_SP_SMALL)
  42839. /* Generate the pre-computed table of points for the base point.
  42840. *
  42841. * width = 8
  42842. * 256 entries
  42843. * 128 bits between
  42844. *
  42845. * a The base point.
  42846. * table Place to store generated point data.
  42847. * tmp Temporary data.
  42848. * heap Heap to use for allocation.
  42849. */
  42850. static int sp_1024_gen_stripe_table_32(const sp_point_1024* a,
  42851. sp_table_entry_1024* table, sp_digit* tmp, void* heap)
  42852. {
  42853. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42854. sp_point_1024* t = NULL;
  42855. #else
  42856. sp_point_1024 t[3];
  42857. #endif
  42858. sp_point_1024* s1 = NULL;
  42859. sp_point_1024* s2 = NULL;
  42860. int i;
  42861. int j;
  42862. int err = MP_OKAY;
  42863. (void)heap;
  42864. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42865. t = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024) * 3, heap,
  42866. DYNAMIC_TYPE_ECC);
  42867. if (t == NULL)
  42868. err = MEMORY_E;
  42869. #endif
  42870. if (err == MP_OKAY) {
  42871. s1 = t + 1;
  42872. s2 = t + 2;
  42873. err = sp_1024_mod_mul_norm_32(t->x, a->x, p1024_mod);
  42874. }
  42875. if (err == MP_OKAY) {
  42876. err = sp_1024_mod_mul_norm_32(t->y, a->y, p1024_mod);
  42877. }
  42878. if (err == MP_OKAY) {
  42879. err = sp_1024_mod_mul_norm_32(t->z, a->z, p1024_mod);
  42880. }
  42881. if (err == MP_OKAY) {
  42882. t->infinity = 0;
  42883. sp_1024_proj_to_affine_32(t, tmp);
  42884. XMEMCPY(s1->z, p1024_norm_mod, sizeof(p1024_norm_mod));
  42885. s1->infinity = 0;
  42886. XMEMCPY(s2->z, p1024_norm_mod, sizeof(p1024_norm_mod));
  42887. s2->infinity = 0;
  42888. /* table[0] = {0, 0, infinity} */
  42889. XMEMSET(&table[0], 0, sizeof(sp_table_entry_1024));
  42890. /* table[1] = Affine version of 'a' in Montgomery form */
  42891. XMEMCPY(table[1].x, t->x, sizeof(table->x));
  42892. XMEMCPY(table[1].y, t->y, sizeof(table->y));
  42893. for (i=1; i<8; i++) {
  42894. sp_1024_proj_point_dbl_n_32(t, 128, tmp);
  42895. sp_1024_proj_to_affine_32(t, tmp);
  42896. XMEMCPY(table[1<<i].x, t->x, sizeof(table->x));
  42897. XMEMCPY(table[1<<i].y, t->y, sizeof(table->y));
  42898. }
  42899. for (i=1; i<8; i++) {
  42900. XMEMCPY(s1->x, table[1<<i].x, sizeof(table->x));
  42901. XMEMCPY(s1->y, table[1<<i].y, sizeof(table->y));
  42902. for (j=(1<<i)+1; j<(1<<(i+1)); j++) {
  42903. XMEMCPY(s2->x, table[j-(1<<i)].x, sizeof(table->x));
  42904. XMEMCPY(s2->y, table[j-(1<<i)].y, sizeof(table->y));
  42905. sp_1024_proj_point_add_qz1_32(t, s1, s2, tmp);
  42906. sp_1024_proj_to_affine_32(t, tmp);
  42907. XMEMCPY(table[j].x, t->x, sizeof(table->x));
  42908. XMEMCPY(table[j].y, t->y, sizeof(table->y));
  42909. }
  42910. }
  42911. }
  42912. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42913. if (t != NULL)
  42914. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  42915. #endif
  42916. return err;
  42917. }
  42918. #endif /* FP_ECC || !WOLFSSL_SP_SMALL */
  42919. /* Multiply the point by the scalar and return the result.
  42920. * If map is true then convert result to affine coordinates.
  42921. *
  42922. * Stripe implementation.
  42923. * Pre-generated: 2^0, 2^128, ...
  42924. * Pre-generated: products of all combinations of above.
  42925. * 8 doubles and adds (with qz=1)
  42926. *
  42927. * r Resulting point.
  42928. * k Scalar to multiply by.
  42929. * table Pre-computed table.
  42930. * map Indicates whether to convert result to affine.
  42931. * ct Constant time required.
  42932. * heap Heap to use for allocation.
  42933. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  42934. */
  42935. static int sp_1024_ecc_mulmod_stripe_32(sp_point_1024* r, const sp_point_1024* g,
  42936. const sp_table_entry_1024* table, const sp_digit* k, int map,
  42937. int ct, void* heap)
  42938. {
  42939. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42940. sp_point_1024* rt = NULL;
  42941. sp_digit* t = NULL;
  42942. #else
  42943. sp_point_1024 rt[2];
  42944. sp_digit t[2 * 32 * 6];
  42945. #endif
  42946. sp_point_1024* p = NULL;
  42947. int i;
  42948. int j;
  42949. int y;
  42950. int x;
  42951. int err = MP_OKAY;
  42952. (void)g;
  42953. /* Constant time used for cache attack resistance implementation. */
  42954. (void)ct;
  42955. (void)heap;
  42956. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  42957. rt = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024) * 2, heap,
  42958. DYNAMIC_TYPE_ECC);
  42959. if (rt == NULL)
  42960. err = MEMORY_E;
  42961. if (err == MP_OKAY) {
  42962. t = (sp_digit*)XMALLOC(sizeof(sp_digit) * 2 * 32 * 6, heap,
  42963. DYNAMIC_TYPE_ECC);
  42964. if (t == NULL)
  42965. err = MEMORY_E;
  42966. }
  42967. #endif
  42968. if (err == MP_OKAY) {
  42969. p = rt + 1;
  42970. XMEMCPY(p->z, p1024_norm_mod, sizeof(p1024_norm_mod));
  42971. XMEMCPY(rt->z, p1024_norm_mod, sizeof(p1024_norm_mod));
  42972. y = 0;
  42973. x = 127;
  42974. for (j=0; j<8; j++) {
  42975. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  42976. x += 128;
  42977. }
  42978. XMEMCPY(rt->x, table[y].x, sizeof(table[y].x));
  42979. XMEMCPY(rt->y, table[y].y, sizeof(table[y].y));
  42980. rt->infinity = !y;
  42981. for (i=126; i>=0; i--) {
  42982. y = 0;
  42983. x = i;
  42984. for (j=0; j<8; j++) {
  42985. y |= (int)(((k[x / 32] >> (x % 32)) & 1) << j);
  42986. x += 128;
  42987. }
  42988. sp_1024_proj_point_dbl_32(rt, rt, t);
  42989. XMEMCPY(p->x, table[y].x, sizeof(table[y].x));
  42990. XMEMCPY(p->y, table[y].y, sizeof(table[y].y));
  42991. p->infinity = !y;
  42992. sp_1024_proj_point_add_qz1_32(rt, rt, p, t);
  42993. }
  42994. if (map != 0) {
  42995. sp_1024_map_32(r, rt, t);
  42996. }
  42997. else {
  42998. XMEMCPY(r, rt, sizeof(sp_point_1024));
  42999. }
  43000. }
  43001. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  43002. if (t != NULL)
  43003. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  43004. if (rt != NULL)
  43005. XFREE(rt, heap, DYNAMIC_TYPE_ECC);
  43006. #endif
  43007. return err;
  43008. }
  43009. #ifdef FP_ECC
  /* Number of points whose tables are kept in the cache, unless overridden. */
  43010. #ifndef FP_ENTRIES
  43011. #define FP_ENTRIES 16
  43012. #endif
  43013. /* Cache entry - holds precomputation tables for a point. */
  43014. typedef struct sp_cache_1024_t {
  43015. /* X ordinate of point that table was generated from. */
  43016. sp_digit x[32];
  43017. /* Y ordinate of point that table was generated from. */
  43018. sp_digit y[32];
  43019. /* Precomputation table for point. */
  43020. sp_table_entry_1024 table[256];
  43021. /* Use count of the point: incremented on each lookup hit in
   * sp_ecc_get_cache_1024(). */
  43022. uint32_t cnt;
  43023. /* Point and table set in entry. */
  43024. int set;
  43025. } sp_cache_1024_t;
  43026. /* Cache of tables. */
  43027. static THREAD_LS_T sp_cache_1024_t sp_cache_1024[FP_ENTRIES];
  43028. /* Index of last entry in cache (-1 until one has been used). */
  43029. static THREAD_LS_T int sp_cache_1024_last = -1;
  43030. /* Cache has been initialized. */
  43031. static THREAD_LS_T int sp_cache_1024_inited = 0;
  43032. #ifndef HAVE_THREAD_LS
  /* Presumably non-zero once sp_cache_1024_lock has been initialized; the
   * code that sets it for this build variant is outside this view. */
  43033. static volatile int initCacheMutex_1024 = 0;
  /* Lock for the cache when thread-local storage is not available. */
  43034. static wolfSSL_Mutex sp_cache_1024_lock;
  43035. #endif
  43036. /* Get the cache entry for the point.
  43037. *
  43038. * g [in] Point scalar multipling.
  43039. * cache [out] Cache table to use.
  43040. */
  43041. static void sp_ecc_get_cache_1024(const sp_point_1024* g, sp_cache_1024_t** cache)
  43042. {
  43043. int i;
  43044. int j;
  43045. uint32_t least;
  43046. if (sp_cache_1024_inited == 0) {
  43047. for (i=0; i<FP_ENTRIES; i++) {
  43048. sp_cache_1024[i].set = 0;
  43049. }
  43050. sp_cache_1024_inited = 1;
  43051. }
  43052. /* Compare point with those in cache. */
  43053. for (i=0; i<FP_ENTRIES; i++) {
  43054. if (!sp_cache_1024[i].set)
  43055. continue;
  43056. if (sp_1024_cmp_equal_32(g->x, sp_cache_1024[i].x) &
  43057. sp_1024_cmp_equal_32(g->y, sp_cache_1024[i].y)) {
  43058. sp_cache_1024[i].cnt++;
  43059. break;
  43060. }
  43061. }
  43062. /* No match. */
  43063. if (i == FP_ENTRIES) {
  43064. /* Find empty entry. */
  43065. i = (sp_cache_1024_last + 1) % FP_ENTRIES;
  43066. for (; i != sp_cache_1024_last; i=(i+1)%FP_ENTRIES) {
  43067. if (!sp_cache_1024[i].set) {
  43068. break;
  43069. }
  43070. }
  43071. /* Evict least used. */
  43072. if (i == sp_cache_1024_last) {
  43073. least = sp_cache_1024[0].cnt;
  43074. for (j=1; j<FP_ENTRIES; j++) {
  43075. if (sp_cache_1024[j].cnt < least) {
  43076. i = j;
  43077. least = sp_cache_1024[i].cnt;
  43078. }
  43079. }
  43080. }
  43081. XMEMCPY(sp_cache_1024[i].x, g->x, sizeof(sp_cache_1024[i].x));
  43082. XMEMCPY(sp_cache_1024[i].y, g->y, sizeof(sp_cache_1024[i].y));
  43083. sp_cache_1024[i].set = 1;
  43084. sp_cache_1024[i].cnt = 1;
  43085. }
  43086. *cache = &sp_cache_1024[i];
  43087. sp_cache_1024_last = i;
  43088. }
  43089. #endif /* FP_ECC */
  43090. /* Multiply the base point of P1024 by the scalar and return the result.
  43091. * If map is true then convert result to affine coordinates.
  43092. *
  43093. * r Resulting point.
  43094. * g Point to multiply.
  43095. * k Scalar to multiply by.
  43096. * map Indicates whether to convert result to affine.
  43097. * ct Constant time required.
  43098. * heap Heap to use for allocation.
  43099. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  43100. */
  43101. static int sp_1024_ecc_mulmod_32(sp_point_1024* r, const sp_point_1024* g, const sp_digit* k,
  43102. int map, int ct, void* heap)
  43103. {
  43104. #ifndef FP_ECC
  43105. return sp_1024_ecc_mulmod_fast_32(r, g, k, map, ct, heap);
  43106. #else
  43107. sp_digit tmp[2 * 32 * 6];
  43108. sp_cache_1024_t* cache;
  43109. int err = MP_OKAY;
  43110. #ifndef HAVE_THREAD_LS
  43111. if (initCacheMutex_1024 == 0) {
  43112. wc_InitMutex(&sp_cache_1024_lock);
  43113. initCacheMutex_1024 = 1;
  43114. }
  43115. if (wc_LockMutex(&sp_cache_1024_lock) != 0)
  43116. err = BAD_MUTEX_E;
  43117. #endif /* HAVE_THREAD_LS */
  43118. if (err == MP_OKAY) {
  43119. sp_ecc_get_cache_1024(g, &cache);
  43120. if (cache->cnt == 2)
  43121. sp_1024_gen_stripe_table_32(g, cache->table, tmp, heap);
  43122. #ifndef HAVE_THREAD_LS
  43123. wc_UnLockMutex(&sp_cache_1024_lock);
  43124. #endif /* HAVE_THREAD_LS */
  43125. if (cache->cnt < 2) {
  43126. err = sp_1024_ecc_mulmod_fast_32(r, g, k, map, ct, heap);
  43127. }
  43128. else {
  43129. err = sp_1024_ecc_mulmod_stripe_32(r, g, cache->table, k,
  43130. map, ct, heap);
  43131. }
  43132. }
  43133. return err;
  43134. #endif
  43135. }
  43136. #endif /* WOLFSSL_SP_SMALL */
  43137. /* Multiply the point by the scalar and return the result.
  43138. * If map is true then convert result to affine coordinates.
  43139. *
  43140. * km Scalar to multiply by.
  43141. * p Point to multiply.
  43142. * r Resulting point.
  43143. * map Indicates whether to convert result to affine.
  43144. * heap Heap to use for allocation.
  43145. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  43146. */
  43147. int sp_ecc_mulmod_1024(const mp_int* km, const ecc_point* gm, ecc_point* r,
  43148. int map, void* heap)
  43149. {
  43150. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  43151. sp_point_1024* point = NULL;
  43152. sp_digit* k = NULL;
  43153. #else
  43154. sp_point_1024 point[1];
  43155. sp_digit k[32];
  43156. #endif
  43157. int err = MP_OKAY;
  43158. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  43159. point = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024), heap,
  43160. DYNAMIC_TYPE_ECC);
  43161. if (point == NULL)
  43162. err = MEMORY_E;
  43163. if (err == MP_OKAY) {
  43164. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 32, heap,
  43165. DYNAMIC_TYPE_ECC);
  43166. if (k == NULL)
  43167. err = MEMORY_E;
  43168. }
  43169. #endif
  43170. if (err == MP_OKAY) {
  43171. sp_1024_from_mp(k, 32, km);
  43172. sp_1024_point_from_ecc_point_32(point, gm);
  43173. err = sp_1024_ecc_mulmod_32(point, point, k, map, 1, heap);
  43174. }
  43175. if (err == MP_OKAY) {
  43176. err = sp_1024_point_to_ecc_point_32(point, r);
  43177. }
  43178. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  43179. if (k != NULL)
  43180. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  43181. if (point != NULL)
  43182. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  43183. #endif
  43184. return err;
  43185. }
  43186. #ifdef WOLFSSL_SP_SMALL
  /* Striping precomputation table.
   * 4 points (multiples by 2^0, 2^256, ...) combined into a table of 16
   * points; entry 0 is all zeros.
   * Distance of 256 scalar bits between points.
   */
  43191. static const sp_table_entry_1024 p1024_table[16] = {
  43192. /* 0 */
  43193. { { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  43194. 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  43195. 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 },
  43196. { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  43197. 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  43198. 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 } },
  43199. /* 1 */
  43200. { { 0xe0162bc2,0xbf9c7ec6,0x10a89289,0xddecc6e3,0x9e499d81,0x5d599df0,
  43201. 0x6d358218,0x9a96ea28,0x70c5f8db,0x01aec7d3,0x8cf5d066,0xe72e4995,
  43202. 0x3e91d7f8,0xc2e7297d,0xda9f2f5a,0x8621db92,0x5a5679ed,0x4b26c867,
  43203. 0x2c56aac1,0x233385df,0xc6a13f99,0xb88e74d4,0xffa8ec11,0x1214b173,
  43204. 0x1f3f9fef,0xa0386a27,0xc0e7b44e,0xbd9b1b4e,0xeecd3496,0xafe528dc,
  43205. 0x1c49f80b,0x8dfff96a },
  43206. { 0xc03c0c83,0xb4a4753a,0xabcdcd75,0x68e69d18,0xf775b649,0xe3839b88,
  43207. 0xbf58f352,0x803f949a,0xbd0bc15c,0x5f702679,0x8ff298c2,0x85bf5d16,
  43208. 0xc6c7976e,0x3f6ebd98,0x45e3e1b4,0x20618af4,0x54e64093,0x67d5598e,
  43209. 0x504fed9e,0xb047283b,0x70d87517,0x450cabfd,0x3f5addbe,0x47d628bf,
  43210. 0x78cb4cca,0x0037ef30,0x6b1c4908,0x4e148d3c,0x4fcfd837,0xe256d329,
  43211. 0xde3c01f3,0x2aa1207b } },
  43212. /* 2 */
  43213. { { 0x755c2a27,0xcf3e0bb2,0x59585c44,0xd38e42f9,0x19285e60,0x46b13e0f,
  43214. 0x76273d0f,0xc3ecd0c0,0x193c569a,0x7800f085,0x4351818a,0xf04e74ab,
  43215. 0x8496363b,0x9258aa38,0xb8c894fe,0x8456617c,0x2af969a0,0x8bc62aaa,
  43216. 0x5a4668d9,0x66c2280b,0xa992f4fa,0xbc9df58e,0x3f401e99,0x5db0b7d9,
  43217. 0xc4c38c0e,0xe0614fe1,0x2ccdf6b3,0xd531151c,0xe143b618,0x1c7575ec,
  43218. 0xdf9398a4,0x40247985 },
  43219. { 0x8f055746,0xfba25178,0x0ab1e6e0,0xc5ba0040,0xac292697,0xe1b194fb,
  43220. 0x5b4f4740,0x77152119,0x9bb7ba54,0x250091d0,0xb9a139a4,0x7a674861,
  43221. 0xf353aa7e,0xba8413b3,0x2443ceee,0xafe77192,0x3847bbd0,0x14468d36,
  43222. 0x3da4942d,0x61f79ff6,0xd425b456,0x1563a1c1,0x75ff4630,0x3c270fcd,
  43223. 0xeb2802c9,0x42072090,0xc85c7004,0x68f0cdcb,0xfa032e74,0xca4372fb,
  43224. 0xc8b79d80,0x1a6fd1e6 } },
  43225. /* 3 */
  43226. { { 0x8d5116a3,0x967a901a,0xb2f5f47f,0x0b844394,0x60ebaf3b,0xe39ad452,
  43227. 0x60ccfc0c,0x1e1be617,0xcc3f53f2,0xac07e3d2,0x1ed11bb6,0xdd838e0e,
  43228. 0x1c15b0c2,0x45475307,0x920fe5b8,0x70dd4748,0xe471896d,0x1a20be2d,
  43229. 0x59276c7c,0x3c3fad8a,0xc886ee07,0x026a1cc3,0x6e831ac4,0x9fdb6f37,
  43230. 0xac501d65,0x26a35d1a,0x40da8574,0x0ae98905,0xabd734e5,0x65dde0a4,
  43231. 0x15614750,0x29b7d4dc },
  43232. { 0xcbf4e20b,0x44b3c2cb,0x58cc44c5,0x1c3f548f,0x5b0cac1f,0x39809b54,
  43233. 0x00f80621,0x0c0f02b5,0x066905e0,0xe612b890,0x8350188c,0x8f158ed7,
  43234. 0x3f5576b2,0xc01dc458,0xa45492e0,0x29803272,0x0ff92443,0x77a5623a,
  43235. 0x29d0dc41,0xd12a2b00,0x2780e87a,0xb4125459,0x0d53f272,0x1ebcf903,
  43236. 0x24301e8d,0xbae6ea40,0xa37d0798,0x1e5f3f2f,0x22b4126c,0x9342c310,
  43237. 0x5382497e,0x5d092802 } },
  43238. /* 4 */
  43239. { { 0x4b59213a,0xf5b495d0,0x8d70200e,0xca672039,0x2b6771c1,0x4bcb09a6,
  43240. 0x2b9eb0cb,0x26adeed4,0x8cdba212,0xeb544754,0xf08890d1,0x0e1abfcd,
  43241. 0x698e46b4,0x52509963,0x82e9c138,0xe1bff0b0,0x51099a71,0xa189e4cd,
  43242. 0xc9b91cc7,0x2360c9bc,0x137ec4be,0x9bd4d7dc,0xd1519f6e,0xd0356521,
  43243. 0xcf832503,0xbf5f6d78,0x8deea2b4,0xe4301031,0xef4c319c,0xc3132494,
  43244. 0x0f1fa7d7,0x2ab3bd47 },
  43245. { 0x922c9fbb,0x5753b680,0x0f16c6d1,0x869e7dc8,0xbac16efc,0x83445135,
  43246. 0x846d1d9b,0x4326a3b4,0xb2d62c21,0xb517fee3,0x0b292ad5,0x6905afa2,
  43247. 0x2cadac13,0x2a57131a,0xebdbca8d,0xcd904d8f,0x3f365fb2,0xdfeda86f,
  43248. 0xdc7eaa1c,0x7097b208,0xa45e77c0,0x89a35a84,0xcf5d118e,0x417a062c,
  43249. 0x1f6e99e8,0x3c0c04a8,0xba7a087d,0xc44704b0,0x3ea22ad2,0x6f8a27d1,
  43250. 0x4c27d229,0x93a4b416 } },
  43251. /* 5 */
  43252. { { 0x1f1efb7a,0xd4271bc1,0x33fccc0d,0xae4e68e6,0xb11f50a8,0x9d9bc8f1,
  43253. 0xaf076089,0x5430398f,0x443d0e03,0x45e242fb,0xf6e3d4c1,0x73ec2519,
  43254. 0xba9bad09,0xab70f790,0xf9add10f,0xde612ad5,0x14e942b4,0xb837e54e,
  43255. 0xddb8b68a,0x175a56d3,0x1ac2a408,0xe85b233c,0xf0c80f94,0xf8ff6c30,
  43256. 0x898db4f9,0x4b7f3fb7,0x45a7dcdd,0xa2c6044f,0xfe3d3895,0xf3abb2f6,
  43257. 0x32ee7763,0x342ce0d7 },
  43258. { 0xcf491b1f,0xeb261394,0x1909e395,0xdcaaeed7,0x9fe4dbea,0xdcc4055a,
  43259. 0x493d604d,0x17a6611d,0x1ce5ebef,0xba445a3a,0xe3989cb5,0xe82e2858,
  43260. 0x83f58406,0xb96f4282,0xa156cf55,0x99877b99,0x4e166a0e,0xaf906a66,
  43261. 0xb2976d13,0xcea1d353,0x36c61a01,0xefc16f27,0xb0f55d86,0xdb04c433,
  43262. 0x8eb34c01,0x3cb4b269,0x2ae60280,0x38d07f78,0x43be3ec5,0x43ac3bcb,
  43263. 0xe156fd20,0x455f4af3 } },
  43264. /* 6 */
  43265. { { 0x95532833,0x2e6fe0a6,0xd626d067,0xabca228e,0x649e73bd,0x22aef3d9,
  43266. 0xf03c4c0c,0x2083a87a,0x35169b45,0xe954e75d,0x74506a89,0x577509ee,
  43267. 0x2aeacf90,0x49cb276e,0xfa409f91,0x08275d77,0xf0bbd6b9,0x61eb6f3d,
  43268. 0xe4132704,0x948202cb,0xb1c498b1,0x35f3fc21,0x361fee59,0x76c68ba8,
  43269. 0x50e051f3,0xa18cbbd9,0x318e7042,0x2384a879,0x80dd1e8b,0x292abead,
  43270. 0x5c37c334,0x65713c29 },
  43271. { 0xceb77b9a,0xdccca8e9,0x23b69469,0x2f97e727,0xa01d6b28,0xc76abee6,
  43272. 0x5abecdfe,0x3925203d,0x29290d70,0x89448082,0xb0314438,0xf9931424,
  43273. 0x7cd447c3,0x04209df1,0xc855c827,0x7c6f2059,0x56c0e069,0xd97d7862,
  43274. 0x412d94c4,0x5a9db6fe,0x994c41dd,0x19a64591,0xc89e21a3,0x12348aa1,
  43275. 0xc6a03f0e,0xd6904b50,0xa616feac,0x55c15156,0x7cc7693b,0x4e36d1b5,
  43276. 0x3bae3c38,0x6b0e996c } },
  43277. /* 7 */
  43278. { { 0xcceced00,0x32789fab,0xe5b7aa66,0x3237e71a,0x2ddebcdf,0x87b2e269,
  43279. 0xb61dad8f,0xb7245120,0xd35f803c,0xe11e5e48,0x98e50f0d,0xfb4df5d7,
  43280. 0xbcd2ab92,0x60ee68b4,0x1ce3363d,0x98ab2f5c,0x7cd42647,0x15ba39da,
  43281. 0x83f4fb3f,0x1a6572eb,0xe56f08db,0x0f77de88,0x172562c2,0x1743761e,
  43282. 0x8a58f0f4,0xbe349ff8,0x84d1d6e2,0xe04da71b,0x9e9ff3b4,0x368f0342,
  43283. 0x678223f8,0x4022a205 },
  43284. { 0x83847375,0x527bbd05,0x3f451af0,0x3ae56b62,0x4b2c7f18,0x6198f24d,
  43285. 0x4525b98d,0xee323f5b,0x0e0884b5,0xa9d8d39a,0xfb12c776,0xd005d7f6,
  43286. 0x708bc154,0xd71c483e,0x742541bc,0x8ca6fd28,0xf8397ddb,0x0af3dccd,
  43287. 0x3eccf243,0xb80d3125,0x58d81b8d,0xc743a108,0x71391f68,0x3f48eb21,
  43288. 0x33bb657f,0x493aff88,0x07e47e31,0x1d15ed66,0xe08279f6,0x10159b11,
  43289. 0x24a6a956,0x312179cb } },
  43290. /* 8 */
  43291. { { 0xfb99cfe6,0x950323d3,0xc9334178,0x7b09bc26,0x7cbdfb6f,0x64111e41,
  43292. 0x89a75760,0x91141744,0x10919cb0,0x4c633df9,0x396bfd2f,0x715fc7c7,
  43293. 0x8cab62db,0x8ca19512,0x4db81aac,0x30672473,0xb4c4c54a,0xe67a246b,
  43294. 0xbf229646,0xd77ea0fa,0xfa5b5d70,0x5bed15f1,0xc2f192f3,0xa5686da5,
  43295. 0x7f6690ad,0xdecac72a,0xcaa50b7d,0x0c4af2a2,0x6049ad2f,0xf44631c1,
  43296. 0x04ecf056,0x325d2796 },
  43297. { 0x4848c144,0xee11fb55,0xb6a7af32,0x4e062925,0x369e0f9a,0x125b68e1,
  43298. 0xca53b21e,0xad9bdae6,0x2e98ea1b,0xf50d605c,0x9f2fa395,0xbdb9e153,
  43299. 0xe91532f5,0x4570e32d,0x46a250d7,0x810698ae,0xad9d9145,0x7fd9546c,
  43300. 0x11e97a5e,0xabf67721,0x249f82e9,0xca29f7d5,0x9851df63,0xa9c539a9,
  43301. 0x71d0e3e5,0xfd84d54b,0x041d2b56,0xd1e0459c,0xfd80096a,0xceb3eb6e,
  43302. 0xe32a79d3,0x19d48546 } },
  43303. /* 9 */
  43304. { { 0xb540f5e5,0xfe19ee8f,0x04e68d17,0x86d2a52f,0xadbdc871,0xd2320db0,
  43305. 0xd03a7fc8,0xa83ad5a8,0x08bcb916,0x54bf83c7,0x2e51e840,0x092133ea,
  43306. 0xcb52dddf,0xbce38424,0x31063583,0xd5c7be40,0x458e3176,0xc1ebb9df,
  43307. 0xbc4dabbf,0xafb19639,0xc05725a8,0x36350fe4,0x84e1cd24,0xac4a0634,
  43308. 0xc145b8de,0xadf73154,0xb3483237,0x0aa6dd9e,0xcbff2720,0xa3345c3d,
  43309. 0xb4e453b0,0x1b3ace6c },
  43310. { 0x90a8bdc5,0x0343e5e9,0x6306a089,0xa203bf9d,0x8e48520e,0x98489a35,
  43311. 0xde7d1d06,0xbd17debe,0x5f795d3f,0x8fafa6d7,0x387b0a3f,0xa4ceb630,
  43312. 0xffddeafa,0xe0166b32,0x7e764e02,0xa2fe2054,0xe871f304,0x55ab9824,
  43313. 0x952ec45e,0xa2bd36bb,0xa90d20ca,0x7b4c1484,0x75bcfb53,0x5319f387,
  43314. 0x6982c4e5,0x34238a4a,0xa102921d,0xa2bb61c7,0xdb3ab17e,0x1e061b64,
  43315. 0x192f0a14,0x538ec33e } },
  43316. /* 10 */
  43317. { { 0x576374c2,0xe53c7785,0x84727040,0xe60526d1,0x228ca044,0x8a066dc8,
  43318. 0xf1ce1313,0x1fe1c1b2,0xcdeb0c5d,0x2aeec832,0x9cbf826f,0xa7596699,
  43319. 0xde77a589,0xcd188e81,0x118d1254,0xe5ce0fe0,0x0790b86a,0xa142a984,
  43320. 0x39ac28ce,0xe28f043f,0x87de5804,0x4eef8290,0xf639a8c5,0x83c31b32,
  43321. 0x5887794f,0xd70454a7,0x18b1b391,0xca635d50,0x31d9c795,0xcefea076,
  43322. 0xb6f8aa25,0x13cbee76 },
  43323. { 0x8d3f34f3,0x79cabe0f,0xa3617fe3,0xbda9c31c,0xdd9426a1,0xb26dee23,
  43324. 0xf29c9104,0xe9dd9627,0xe2c6cd3b,0x033eb169,0xfcba2196,0x8a73f492,
  43325. 0xb858c83c,0x92e37e0b,0x23b3fbb7,0xe4f2aca6,0x64be00a2,0x8101fb1e,
  43326. 0x948f6448,0x91a7826a,0x907260e7,0x414067b4,0xe30bb835,0xf774aa50,
  43327. 0xc999c06e,0xf922ca80,0x0ba08511,0x6b8635b9,0x25fa04f0,0xbf936b5c,
  43328. 0xe02e8967,0x4e0a1ada } },
  43329. /* 11 */
  43330. { { 0x8ba29c4d,0x00ca6670,0x22988094,0xc08240ce,0x16dda752,0x21c5ca67,
  43331. 0xabbbfa34,0x689c0e45,0x3ed28b72,0x1d7545fd,0xd7c56ab4,0x5f221198,
  43332. 0x38759d65,0x4b3d8f74,0x8fe50b89,0x93490dfb,0xe80eba16,0xb641f5d7,
  43333. 0x79acb537,0x7b0da5eb,0x0c1d5e5e,0xab6b1497,0xa5da429a,0x2338e68d,
  43334. 0x2f6d2f25,0xe010c437,0x6530f3a7,0x226f16d2,0xcbef08bc,0xefb0f7b6,
  43335. 0x9f99c999,0x733e30d9 },
  43336. { 0xa42a38f9,0xecfe1582,0x4730b500,0xaec2d58e,0xde976b2c,0x2ee2f2a7,
  43337. 0xa969c1bb,0xf0539db5,0xfcecdb4a,0x31954168,0xe7a8e902,0xf2f7348a,
  43338. 0x3121541f,0x1d58d7cc,0x2202ae52,0x5d25b75c,0xf40835a7,0xdea9965a,
  43339. 0x529b4e46,0x3feb6a41,0xbd27ad9b,0x5c97fb6f,0x261f900b,0xd87554c0,
  43340. 0x04d5b19e,0xb43031d9,0xcb219b9c,0x33d5e9b8,0x3ee00bcf,0x7a43d492,
  43341. 0xb79a5c0c,0x56facb39 } },
  43342. /* 12 */
  43343. { { 0x7c834915,0x667eaed6,0xbc5eb64d,0x9f77aa6a,0x25d62011,0x729ebcb6,
  43344. 0x699fd9c2,0x0aee24f2,0x2b8d4f6c,0xe1eb5874,0x14c976d6,0x7f12710c,
  43345. 0xf6d9ea65,0x91390335,0x06b50064,0x668b7049,0x0876ee4f,0x65969a0e,
  43346. 0x2f9d9360,0xf901bf3f,0xb499e3ce,0xfb1a8651,0xf2dbcaaa,0x80b953fb,
  43347. 0x973b06b6,0x312cc566,0x3af36c64,0x3534d9c3,0x10ffd815,0xe4463a52,
  43348. 0xf18c2b91,0x57ea2b4b },
  43349. { 0x8aa0f2f2,0x00f5e162,0x0e46bcaa,0x8c7e75c5,0xa4a2c42d,0x97ab479a,
  43350. 0x14baa202,0xb4f308ea,0x6943cc2e,0xa901bd14,0xeed58804,0xbb125fee,
  43351. 0x9d180f7c,0x6502c8f9,0x1580c61c,0xe5353919,0x27101ee3,0x7e278069,
  43352. 0xfaa72717,0x7a0a40a1,0x4c75b153,0x32edce02,0x538f1c22,0xda23660b,
  43353. 0xbe307d2e,0x4d511e98,0x9baee0b4,0x24276e40,0x7ff1f307,0xa78c3927,
  43354. 0xea7935c9,0x60480b46 } },
  43355. /* 13 */
  43356. { { 0x3872ece3,0x31087d66,0x955b70f8,0x5f29be7d,0x9cf95bb8,0xb50b4fc7,
  43357. 0xdbffa621,0xbae3b58d,0xe022ba5d,0x0e61d280,0x4181449c,0x78ae5117,
  43358. 0xcf555485,0x0b132840,0xb8ce0b0e,0x800ed1b6,0x78d5de3d,0x35dffdd5,
  43359. 0x69a56b47,0xf7e42374,0x8d910ae7,0xd5e32369,0x6313c7c7,0xb6ff52a0,
  43360. 0xa92de9e5,0x5a2fe20d,0xd12110bb,0x41b347d3,0x40c16f23,0xc5905edb,
  43361. 0x9a8f88cc,0x0774a0d3 },
  43362. { 0xe3b6c106,0x3ae181ab,0x8de150b7,0x4ebe163f,0x6f354836,0xcf75b82f,
  43363. 0x3ac7ac16,0xaa0d2063,0x291722af,0x5c680668,0x11545553,0x73941e61,
  43364. 0xbf5de3f7,0x17127e38,0x1afb41da,0x32cfdf03,0x87bc8663,0xc6893c91,
  43365. 0xa62c9c99,0x75046744,0x962c1947,0x96866e2d,0x378cdf4c,0x489ec8df,
  43366. 0x3407fa32,0x3a60709b,0x551290d1,0xd37d2159,0xbab92273,0x9623d303,
  43367. 0x2432014b,0x08151954 } },
  43368. /* 14 */
  43369. { { 0xb05f2b26,0x569044f3,0x80b9f76c,0xb35a294a,0x4290f6ae,0x8839fe28,
  43370. 0x026a5877,0x761cfb23,0x2e5ff9c3,0x768926b6,0x0b11c576,0xbae6cd20,
  43371. 0x72a03efe,0xdc857756,0xe1bad63a,0x0cae074a,0xd709d99c,0x3fe491a1,
  43372. 0x6501d9c1,0x76c5ded6,0xc32aeff7,0x1da6eca1,0xc57683e8,0x50849d55,
  43373. 0xdf98d847,0x9e392e9c,0x64d9a564,0xfad7982f,0xa37b98b2,0xf7c3bdb7,
  43374. 0xf0860497,0x1fe09f94 },
  43375. { 0x7648cc63,0x49a7eaae,0x67cfa714,0x13ea2511,0x653f4559,0xfc8b923c,
  43376. 0x81a16e86,0xd957619b,0x3c864674,0x0c7e804b,0x1616599a,0xfc88134a,
  43377. 0x0a652328,0x366ea969,0x4bc9029e,0x41532960,0xae2aad2b,0xef9e1994,
  43378. 0x7f10bef5,0x9e2a8c52,0xc67bf860,0x73dcb586,0x844cc25d,0xf61a43fa,
  43379. 0x74eb3653,0xd74e7eea,0xdd240f02,0xf3356706,0xfd83bcb4,0xeec7694c,
  43380. 0xdb62526a,0x4de95786 } },
  43381. /* 15 */
  43382. { { 0x3deac2f7,0x4867d315,0xb61d9a8e,0xa084778a,0x0ab7b2d5,0xf3b76f96,
  43383. 0xcfdf4f79,0x00b30056,0x31ab8f4b,0xd0701e15,0x9c779d01,0x07f948d5,
  43384. 0x82675371,0x7c994ebc,0x48bad4c0,0x1104d4ee,0xbfc9d058,0x798ce0b5,
  43385. 0x309fa80b,0xc7ca898d,0xacb33eaf,0x0244f225,0x5b2f3175,0xd51e8dfc,
  43386. 0xa4d7be34,0x3e49ba6b,0xbda02b43,0x1760f4c7,0x4435275a,0x37e36a7e,
  43387. 0xe636980c,0x1c94418b },
  43388. { 0x09dc1414,0x43a21313,0x43c93537,0x060765fc,0xdf5f79ce,0x6ff3207a,
  43389. 0x85d4cfca,0x6f18b1fa,0x63e995ab,0xf5c4272e,0xa82b3002,0x121a09e4,
  43390. 0x97147f16,0x82b65d1b,0x20a7fe26,0x4993c20c,0xe6716726,0x99c9cb98,
  43391. 0xfeb440a0,0x5a02d673,0x251b4bc5,0x3f3fa9e1,0xa05338ea,0x75dbc474,
  43392. 0x7b09f6cb,0x3cb4044b,0x80434609,0x6767da18,0x098ceac2,0x97851422,
  43393. 0xb55235ba,0x611bfbb2 } },
  43394. };
  43395. /* Multiply the base point of P1024 by the scalar and return the result.
  43396. * If map is true then convert result to affine coordinates.
  43397. *
  43398. * Stripe implementation.
  43399. * Pre-generated: 2^0, 2^256, ...
  43400. * Pre-generated: products of all combinations of above.
  43401. * 4 doubles and adds (with qz=1)
  43402. *
  43403. * r Resulting point.
  43404. * k Scalar to multiply by.
  43405. * map Indicates whether to convert result to affine.
  43406. * ct Constant time required.
  43407. * heap Heap to use for allocation.
  43408. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  43409. */
  43410. static int sp_1024_ecc_mulmod_base_32(sp_point_1024* r, const sp_digit* k,
  43411. int map, int ct, void* heap)
  43412. {
  43413. return sp_1024_ecc_mulmod_stripe_32(r, &p1024_base, p1024_table,
  43414. k, map, ct, heap);
  43415. }
  43416. #else
  /* Striping precomputation table.
   * 8 points combined into a table of 256 points.
   * Distance of 128 scalar bits between points.
   */
  43421. static const sp_table_entry_1024 p1024_table[256] = {
  43422. /* 0 */
  43423. { { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  43424. 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  43425. 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 },
  43426. { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  43427. 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
  43428. 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 } },
  43429. /* 1 */
  43430. { { 0xe0162bc2,0xbf9c7ec6,0x10a89289,0xddecc6e3,0x9e499d81,0x5d599df0,
  43431. 0x6d358218,0x9a96ea28,0x70c5f8db,0x01aec7d3,0x8cf5d066,0xe72e4995,
  43432. 0x3e91d7f8,0xc2e7297d,0xda9f2f5a,0x8621db92,0x5a5679ed,0x4b26c867,
  43433. 0x2c56aac1,0x233385df,0xc6a13f99,0xb88e74d4,0xffa8ec11,0x1214b173,
  43434. 0x1f3f9fef,0xa0386a27,0xc0e7b44e,0xbd9b1b4e,0xeecd3496,0xafe528dc,
  43435. 0x1c49f80b,0x8dfff96a },
  43436. { 0xc03c0c83,0xb4a4753a,0xabcdcd75,0x68e69d18,0xf775b649,0xe3839b88,
  43437. 0xbf58f352,0x803f949a,0xbd0bc15c,0x5f702679,0x8ff298c2,0x85bf5d16,
  43438. 0xc6c7976e,0x3f6ebd98,0x45e3e1b4,0x20618af4,0x54e64093,0x67d5598e,
  43439. 0x504fed9e,0xb047283b,0x70d87517,0x450cabfd,0x3f5addbe,0x47d628bf,
  43440. 0x78cb4cca,0x0037ef30,0x6b1c4908,0x4e148d3c,0x4fcfd837,0xe256d329,
  43441. 0xde3c01f3,0x2aa1207b } },
  43442. /* 2 */
  43443. { { 0x01900955,0xa95b6dae,0xceb4656d,0xa5dc9cc1,0xe72fe95b,0x50c78907,
  43444. 0xa040c334,0xa1ae5447,0x7952ea6e,0x91191370,0x6d097305,0x54ff7343,
  43445. 0xbda4d10f,0xa4db0074,0x91644070,0xfd5306f1,0x8b24522c,0x14b9fe73,
  43446. 0x7849f762,0x1468dad6,0xb0dcd2e4,0x87b29a18,0x5e1ad492,0xadd7f1a1,
  43447. 0xdbba2a1a,0x9ac63a81,0x81223379,0x01379c5b,0xb0e53bc8,0xf402b2f0,
  43448. 0x0bf13b61,0x8c3eb27f },
  43449. { 0xe513696f,0x9a4ad3e1,0x18c81ffa,0x0350ba5c,0x3c033d13,0x1e2fc136,
  43450. 0x17a531bc,0x53da6e71,0x1aed610d,0x42ec6490,0xe99ff567,0xd33e8df7,
  43451. 0x3deed12a,0xe4aad73e,0x180f4deb,0xd983b465,0x502f30b4,0x99365269,
  43452. 0xa8918d7f,0x7e2799ab,0x700fc79a,0x0ffe84b6,0x40bfd8c2,0x7b4400d6,
  43453. 0x5d2641bd,0xc3a21d21,0xc32621cb,0x79839442,0xb1401e83,0xace6500b,
  43454. 0x251c4310,0x7bf4163e } },
  43455. /* 3 */
  43456. { { 0xe3fd589e,0x1c174f88,0xdf974a03,0xdb501790,0x3e70549f,0xd09623e3,
  43457. 0x15924f34,0x8d091eff,0xf9b65ac5,0xeef79cad,0x3f69c2cf,0xd2cc4262,
  43458. 0x52cd82bc,0x817d9032,0xa5f1dddd,0xacf4f4d9,0x5011b6bd,0xd0612635,
  43459. 0x2ed140c9,0x9f74490d,0x4db686d2,0x64092e8c,0x776b0fcc,0x225eef16,
  43460. 0xdf16aeb6,0x0e8c01e9,0x84bbd82a,0x62836741,0x8956e337,0x757574e2,
  43461. 0x705a7f07,0x9871edc6 },
  43462. { 0x776535f7,0xbd0b76d5,0x2635b3b8,0x5214d602,0x9d216f64,0xc0c25ad9,
  43463. 0x5515bf75,0xfd4df3a7,0x5e9f1675,0x24a625bc,0x406873e7,0x3c35efb7,
  43464. 0xbb2e5c4a,0xef5c9a33,0x806b198a,0xa971b35e,0xa3c690ed,0x9f5c0ca5,
  43465. 0x8e1e2341,0xa8d5dd89,0x955ad9e4,0x4cecbcce,0x248d3416,0x2ecf4407,
  43466. 0x45c0af6e,0x1abb3811,0x1c780fff,0x3f4bee82,0xc272ed57,0xd14df768,
  43467. 0x371637ad,0x397ed10a } },
  43468. /* 4 */
  43469. { { 0x755c2a27,0xcf3e0bb2,0x59585c44,0xd38e42f9,0x19285e60,0x46b13e0f,
  43470. 0x76273d0f,0xc3ecd0c0,0x193c569a,0x7800f085,0x4351818a,0xf04e74ab,
  43471. 0x8496363b,0x9258aa38,0xb8c894fe,0x8456617c,0x2af969a0,0x8bc62aaa,
  43472. 0x5a4668d9,0x66c2280b,0xa992f4fa,0xbc9df58e,0x3f401e99,0x5db0b7d9,
  43473. 0xc4c38c0e,0xe0614fe1,0x2ccdf6b3,0xd531151c,0xe143b618,0x1c7575ec,
  43474. 0xdf9398a4,0x40247985 },
  43475. { 0x8f055746,0xfba25178,0x0ab1e6e0,0xc5ba0040,0xac292697,0xe1b194fb,
  43476. 0x5b4f4740,0x77152119,0x9bb7ba54,0x250091d0,0xb9a139a4,0x7a674861,
  43477. 0xf353aa7e,0xba8413b3,0x2443ceee,0xafe77192,0x3847bbd0,0x14468d36,
  43478. 0x3da4942d,0x61f79ff6,0xd425b456,0x1563a1c1,0x75ff4630,0x3c270fcd,
  43479. 0xeb2802c9,0x42072090,0xc85c7004,0x68f0cdcb,0xfa032e74,0xca4372fb,
  43480. 0xc8b79d80,0x1a6fd1e6 } },
  43481. /* 5 */
  43482. { { 0x8d5116a3,0x967a901a,0xb2f5f47f,0x0b844394,0x60ebaf3b,0xe39ad452,
  43483. 0x60ccfc0c,0x1e1be617,0xcc3f53f2,0xac07e3d2,0x1ed11bb6,0xdd838e0e,
  43484. 0x1c15b0c2,0x45475307,0x920fe5b8,0x70dd4748,0xe471896d,0x1a20be2d,
  43485. 0x59276c7c,0x3c3fad8a,0xc886ee07,0x026a1cc3,0x6e831ac4,0x9fdb6f37,
  43486. 0xac501d65,0x26a35d1a,0x40da8574,0x0ae98905,0xabd734e5,0x65dde0a4,
  43487. 0x15614750,0x29b7d4dc },
  43488. { 0xcbf4e20b,0x44b3c2cb,0x58cc44c5,0x1c3f548f,0x5b0cac1f,0x39809b54,
  43489. 0x00f80621,0x0c0f02b5,0x066905e0,0xe612b890,0x8350188c,0x8f158ed7,
  43490. 0x3f5576b2,0xc01dc458,0xa45492e0,0x29803272,0x0ff92443,0x77a5623a,
  43491. 0x29d0dc41,0xd12a2b00,0x2780e87a,0xb4125459,0x0d53f272,0x1ebcf903,
  43492. 0x24301e8d,0xbae6ea40,0xa37d0798,0x1e5f3f2f,0x22b4126c,0x9342c310,
  43493. 0x5382497e,0x5d092802 } },
  43494. /* 6 */
  43495. { { 0xff2f780d,0x583a2b7e,0xd7d76b1d,0x34d26820,0x86f74aec,0xe3c32847,
  43496. 0x10823feb,0x0fd42212,0xfb5e7bf4,0x227e417e,0xa568f8cd,0x510d49b6,
  43497. 0x1781bbec,0x53bce7d6,0x2f3718b7,0x9cfe3f22,0xd9de6c1f,0x7f44e89f,
  43498. 0x3fac9b55,0xf1cc553f,0xe6f300bc,0x9d2d0846,0x9f0ae6b1,0x976c82a2,
  43499. 0x24b8bbe0,0xe63dbf5e,0x973a5aa7,0x4cac7f45,0x84dd33c7,0xc6eb6237,
  43500. 0x142fee5d,0x0a26e434 },
  43501. { 0xacaa9a08,0x8081339f,0x5246ece1,0x40f31105,0x61393747,0x892c8170,
  43502. 0x242f02e1,0x8d8d4103,0x3b5de98a,0x482bfd20,0x5abbe952,0x89ef946b,
  43503. 0x37698249,0xb8d218b9,0x66617c7a,0xd5268e89,0x8b7d2b91,0x962e7551,
  43504. 0xfe8d67c3,0x2c5c7973,0x2b017c51,0x42e3150a,0xc1a29469,0x6f4e5ebc,
  43505. 0x531c7083,0xa39910ce,0xb77b9e50,0xaf4f6eb4,0xda120ad0,0x68cbb175,
  43506. 0xb92636ec,0x19497c61 } },
  43507. /* 7 */
  43508. { { 0x417659a8,0x6920b0c6,0x92cb28ff,0xc77ab9c7,0xb687797f,0x55b67180,
  43509. 0xe7759363,0x4caf58c1,0x5561b186,0x5155bdb6,0x780f4946,0x2e64e355,
  43510. 0x229a8b20,0xeb0ac9b7,0x2571bd60,0x88594d78,0xe3fa78f9,0x5dcc0939,
  43511. 0x2ac2d379,0x7b8b4830,0xb90f1444,0x505fbf60,0x3ce4b3c1,0xac610e81,
  43512. 0xd59b5c18,0x39a4f27a,0x7cea0222,0x5fa33973,0x8dff1c7b,0xe578730b,
  43513. 0x517bf7a6,0x96b91b8b },
  43514. { 0x9aac087c,0xc1a991f4,0x6cfdb28d,0xce62f74e,0x5f7600d6,0x08d6ff9a,
  43515. 0xf917f9c9,0xd781cd04,0x3de52dbf,0x7796f5f6,0x2ed72180,0xe7db64e0,
  43516. 0x6fa4137d,0x0f0876f6,0x3ca1f716,0x3271ee64,0x7c4ab8a3,0xcb9b2058,
  43517. 0x39481047,0xcba17107,0x598c5c37,0xdf9a190d,0x6f20e125,0x0cb6e72a,
  43518. 0xf4f2902d,0xa3142204,0x7ce2dcfb,0x42d28cb9,0xa3d3c351,0xdf261b8a,
  43519. 0xcffc249d,0x73f3d315 } },
  43520. /* 8 */
  43521. { { 0xe6fd3673,0x5d86855b,0x9d214b7b,0x309b70af,0xdcc46cd3,0x8d332f90,
  43522. 0x595510de,0xe553c015,0x38c1251c,0x5746a096,0x85cc1bc9,0xcd7cea5b,
  43523. 0x002eba8f,0x4ffa1468,0x22fcd77c,0x10a3cb70,0xc4ea05e3,0xb6999dfb,
  43524. 0x4efa756e,0x3375a0d0,0xdced5fd8,0x4d90279e,0x251fd56e,0x48192403,
  43525. 0x82a4c5f1,0xe87633a4,0x1b34105b,0x3170d130,0x7247e578,0x93998b0f,
  43526. 0x436ba1fa,0x88934f64 },
  43527. { 0x4713eabc,0xf09f43b0,0xaccdc517,0x4ca7dd91,0xef13ca7c,0x27daa63b,
  43528. 0x2588184b,0x8b2e5a7a,0xd95dc269,0x0a8cb612,0xe1f2f14c,0x346975a2,
  43529. 0xe172935c,0x1f29b8ed,0xd40bc1e3,0xc3cbfd6e,0x132623da,0xd3f46b3f,
  43530. 0xfb0b7681,0xc115be6d,0x56da4344,0x5e31c345,0xa8e43d98,0xa7c63f18,
  43531. 0x4bddb4ea,0x55cb2083,0x4a54f58c,0xb16a0c38,0x46fd69d9,0x74eacca2,
  43532. 0x153548e1,0x0d1898bb } },
  43533. /* 9 */
  43534. { { 0xe35ef043,0x4ea73461,0x3496b564,0x107b67d9,0xd0f83a3c,0xd62c173b,
  43535. 0x51d29c35,0xfad4b038,0x71b1c1a4,0x3f42882a,0x54b43b9e,0x5d2bcf66,
  43536. 0x2abdf543,0xc77b15aa,0xdabe3dc1,0x5cb38a80,0xa481673b,0x15fda0ae,
  43537. 0xe7b90ebe,0x86996b4d,0x2bc8f3d8,0x84f87e25,0x37c4e424,0xaded03d6,
  43538. 0xd7a7afd8,0xe5ede666,0xa1ccb93a,0x80dd95a2,0x46fba391,0xa55cfd25,
  43539. 0x46f82e60,0x2bdab1dc },
  43540. { 0xfa6fed61,0x7a4de22b,0xcc8dd94e,0xca458aa5,0x071222f5,0x3e372df1,
  43541. 0xe5aff377,0x06a4b44f,0x4a738e6d,0xbc2d0ba7,0x5f31f136,0x1a470e1d,
  43542. 0xe102a911,0x77ff933a,0x310c7885,0x8b380a50,0x783fc5ac,0x9f3c0228,
  43543. 0x44725d06,0xec668925,0x5ac84221,0x878f0e16,0xcfda6e8a,0x9a3af1af,
  43544. 0x78cd2aba,0x0183ed37,0x826d0eae,0x32cdbd60,0xcbee6415,0xb3234661,
  43545. 0xb9c10120,0x353eb892 } },
  43546. /* 10 */
  43547. { { 0x10b5521e,0xc8fdcad6,0x52e702f0,0x1a11b440,0x8ffda49c,0x6302680d,
  43548. 0xcbf36bad,0xcdb9654a,0x4c10a2d7,0x7b58ce11,0xe630e7e0,0x1e5d1f7d,
  43549. 0x6760a813,0x8cbe3d7d,0x6480d77f,0xeb35866b,0x7f036219,0x58728cf3,
  43550. 0x42a8a757,0xdd5865ed,0x906a2870,0x283f1f1d,0xa51f906b,0x79e23fa4,
  43551. 0x543b20a8,0xf2ac6e83,0xb81e7754,0x4f0b6379,0x840016ee,0x57fbc0d4,
  43552. 0xe621b67d,0x8da20771 },
  43553. { 0xecce65ec,0x3c855004,0xb748185e,0x76d10d1f,0x78797ad2,0x64be7bca,
  43554. 0x77e54aad,0x43444db0,0xbe0df0ff,0x17b6b0c9,0x055086a4,0x8fc4256c,
  43555. 0xfd74d5a3,0xf952c43b,0x01c4edb8,0x501e005a,0x4a57e328,0xd5172dfc,
  43556. 0x535d6ee3,0xdb40ce4e,0x0c650918,0xbaef1e5c,0x857561fc,0xe85145e7,
  43557. 0x34a224c6,0xe468536a,0x0ec0e0a2,0x69a8e227,0x242b03fc,0xb3f52247,
  43558. 0xc3bebd5f,0x862f55e2 } },
  43559. /* 11 */
  43560. { { 0x226049fe,0x2d6a390f,0xdcbbc9fb,0xcc92a578,0x97634fb7,0xa52feca4,
  43561. 0x3dea5893,0x2b340cb6,0x2a49e916,0xa39f338a,0x949e41f3,0x26b2df3d,
  43562. 0x065a7e40,0xc71c7cdb,0x468281a2,0x4a9b84a0,0x731eeeca,0x63eeb503,
  43563. 0x76cbb725,0xe6d09134,0xb94a678c,0x0cf979a9,0x808fd9f1,0xb44d8c3b,
  43564. 0xe0afc5b9,0xe60da613,0x3ea5be69,0x52dce7de,0xdc1ee74f,0x3a5d6864,
  43565. 0x3bc80790,0x71ab2891 },
  43566. { 0x3b5b60ad,0xcf618fc4,0x4a0c3184,0x0afb5e30,0xbc403302,0xd22381cc,
  43567. 0xdb1c0c66,0x33cf8953,0xa6112a8d,0x9c994e4d,0xd1967a86,0xd7aae2c3,
  43568. 0x5b7acd29,0xc28d5493,0x6c9a57fb,0x8075bd13,0x9c8427f9,0xc9c0373e,
  43569. 0x193225f5,0x2cbca18d,0x442c018c,0x73777d13,0xfbb3a727,0xebe5ed47,
  43570. 0x1962dc18,0x70437d49,0x2dc08806,0xf39c1e09,0x15fff35c,0x03e9c6f7,
  43571. 0x5e360a65,0x8d087bb6 } },
  43572. /* 12 */
  43573. { { 0x3fdc1844,0xbe212302,0x105eac56,0x6eca27ef,0xf168a348,0x2183a606,
  43574. 0xe1d7a4cb,0x295f807d,0x7ef5d43e,0x7246a632,0xc77025c7,0xae143205,
  43575. 0xf3484e3e,0x4bdfc7ca,0xdf52c075,0xec939895,0xd7a9cac0,0x82e655f6,
  43576. 0x8baeddb0,0x985dfe20,0x527de731,0x79c817e4,0x313de1ea,0x30ce0fbc,
  43577. 0xcc4f6cbb,0x9df95b89,0xf5bb20cd,0xf2aedf1e,0x1a8cfb01,0xfc1e0a89,
  43578. 0x63edb7ec,0x225ed34a },
  43579. { 0xbabb1a85,0x3e13154d,0x1e6a565a,0xd3d8dae7,0xab4b100f,0xd3217d56,
  43580. 0xebc78e1a,0xd44d934e,0x48e73d37,0x0215321b,0x201e43cb,0xbbc90bfa,
  43581. 0x27500905,0x3c23f1d0,0xc86691a1,0x2a2e5000,0x6065841c,0x08b2bad2,
  43582. 0x30026b60,0x15d41caf,0x5276ce61,0x1712c2f4,0x15932ffb,0x01c4c3e7,
  43583. 0x6a74caf2,0x7894e13d,0x0c0537a4,0x02d6f5df,0xc2b1c97e,0xa8fb7602,
  43584. 0xd0887c7b,0x612b60e5 } },
  43585. /* 13 */
  43586. { { 0xba245d6b,0xefd495cf,0xa2ce3ff6,0x5cf0cbb7,0xdff5feee,0x24da2ac0,
  43587. 0xcf28c6a3,0x90c914f8,0x4308a56b,0x72fdb50d,0x13d72034,0x03dbf779,
  43588. 0x822ac9e9,0xcfa5ec91,0x3aea3e81,0x0dde73c8,0x66289139,0x545ba962,
  43589. 0xca6acbd3,0xa52f648b,0x98a0683a,0xff6f276e,0xa378ed52,0x2536d3ac,
  43590. 0x885ac1d9,0x353c2c54,0x00bc84a7,0xcaff52da,0x37684167,0x3971f81c,
  43591. 0xd2d7986e,0x0f7334e1 },
  43592. { 0x6596067e,0xafbb5c83,0x38c19806,0x33e54e19,0x39cb0dcc,0x8285d967,
  43593. 0x424035f9,0x2b53f43d,0xdfef9095,0x38c531f8,0xdb0f571a,0x90fbe8e4,
  43594. 0xa39ca787,0x9a0c1ed2,0x606f2620,0x2fecc1d6,0x72b7cb4a,0x9dc890b1,
  43595. 0xccbb7868,0xc33ca6fb,0xfe73ee49,0xd1b11082,0xfcb66c48,0x590b7d17,
  43596. 0x86e14573,0x9356b0a6,0x053ead85,0x75d682c4,0xc54d30fb,0xb2ae55fa,
  43597. 0xf8aee949,0x67636a72 } },
  43598. /* 14 */
  43599. { { 0xb91d6bea,0x638063bc,0x923ecb96,0xae263a2e,0xc627aca6,0x9d7b0992,
  43600. 0x77af9e7e,0xc6ed001a,0x24aafebb,0x9214accf,0x78055a90,0xa3564b96,
  43601. 0xe027499d,0x00999b1c,0xe46a06a5,0xe413a4e1,0x2e51efe7,0xa05d13f6,
  43602. 0x9ba843be,0x35e87d34,0x3183159e,0x0a633825,0x54601923,0x6023e8ba,
  43603. 0xb7fd1cf2,0x9b107721,0xfdf2fd53,0x46b5542b,0x1c18af38,0xb314f4f8,
  43604. 0x60ac8965,0x086f9876 },
  43605. { 0x8cbb9850,0x76701954,0xa20d2c8c,0x6210b730,0x5335670c,0x4084d057,
  43606. 0x0324baea,0x3ecdc595,0xc76ee9b4,0x607fc5f2,0x440ffa64,0xf393d00f,
  43607. 0x2dc1463c,0xe0111796,0x9c7725e7,0xf00b8251,0x5bd1d186,0x35e60736,
  43608. 0x2cf72aac,0xf3d8554c,0xefa3497d,0xb4dd0fde,0xf646ad11,0xd712268c,
  43609. 0x9f7b8ead,0x07c20afb,0xfc06dfe5,0x630969d4,0x7245549a,0x76b7df1c,
  43610. 0xe61ae810,0x681f9403 } },
  43611. /* 15 */
  43612. { { 0xc9a0623b,0x7cad5163,0x67fab8d4,0xdbf82957,0x81af7c7c,0x2ccab0ec,
  43613. 0xe966d5c2,0x469e38c8,0xf0d4e41c,0x34430d52,0xa52b359c,0x426075a2,
  43614. 0x33bd0127,0x242dd3e3,0x9fed2341,0xcda3f635,0xd7d52ffa,0x4df33730,
  43615. 0x7640c3ef,0x5fff56f0,0x1bbde57c,0x4783c21c,0xeb8bb336,0xd8784a2a,
  43616. 0xead08405,0x1ec7c533,0xf9b62bd4,0x4b7f1423,0x7075d4af,0x5543145c,
  43617. 0xba60590a,0x0c9de94a },
  43618. { 0x95d5682b,0x8ed72735,0x2ec276ed,0x711c4283,0x8b36a0d2,0xd1f4aed5,
  43619. 0x8498a88f,0x62ab40c4,0x4480f451,0x58c8fc62,0xb79cffe2,0x8bc8ca4b,
  43620. 0x701a359d,0x90ab583c,0x3fd5d15d,0xaee31a73,0xc912333c,0x02a5597b,
  43621. 0xb6c3e3c2,0x1019cae4,0x29938088,0xe513042c,0xf47c8199,0x0e00283d,
  43622. 0xf2a00e92,0x90d68e58,0xa775ae3b,0x69e2df41,0x871c30b2,0xb8d2eca5,
  43623. 0xbb1de396,0x733dca0e } },
  43624. /* 16 */
  43625. { { 0x4b59213a,0xf5b495d0,0x8d70200e,0xca672039,0x2b6771c1,0x4bcb09a6,
  43626. 0x2b9eb0cb,0x26adeed4,0x8cdba212,0xeb544754,0xf08890d1,0x0e1abfcd,
  43627. 0x698e46b4,0x52509963,0x82e9c138,0xe1bff0b0,0x51099a71,0xa189e4cd,
  43628. 0xc9b91cc7,0x2360c9bc,0x137ec4be,0x9bd4d7dc,0xd1519f6e,0xd0356521,
  43629. 0xcf832503,0xbf5f6d78,0x8deea2b4,0xe4301031,0xef4c319c,0xc3132494,
  43630. 0x0f1fa7d7,0x2ab3bd47 },
  43631. { 0x922c9fbb,0x5753b680,0x0f16c6d1,0x869e7dc8,0xbac16efc,0x83445135,
  43632. 0x846d1d9b,0x4326a3b4,0xb2d62c21,0xb517fee3,0x0b292ad5,0x6905afa2,
  43633. 0x2cadac13,0x2a57131a,0xebdbca8d,0xcd904d8f,0x3f365fb2,0xdfeda86f,
  43634. 0xdc7eaa1c,0x7097b208,0xa45e77c0,0x89a35a84,0xcf5d118e,0x417a062c,
  43635. 0x1f6e99e8,0x3c0c04a8,0xba7a087d,0xc44704b0,0x3ea22ad2,0x6f8a27d1,
  43636. 0x4c27d229,0x93a4b416 } },
  43637. /* 17 */
  43638. { { 0x1f1efb7a,0xd4271bc1,0x33fccc0d,0xae4e68e6,0xb11f50a8,0x9d9bc8f1,
  43639. 0xaf076089,0x5430398f,0x443d0e03,0x45e242fb,0xf6e3d4c1,0x73ec2519,
  43640. 0xba9bad09,0xab70f790,0xf9add10f,0xde612ad5,0x14e942b4,0xb837e54e,
  43641. 0xddb8b68a,0x175a56d3,0x1ac2a408,0xe85b233c,0xf0c80f94,0xf8ff6c30,
  43642. 0x898db4f9,0x4b7f3fb7,0x45a7dcdd,0xa2c6044f,0xfe3d3895,0xf3abb2f6,
  43643. 0x32ee7763,0x342ce0d7 },
  43644. { 0xcf491b1f,0xeb261394,0x1909e395,0xdcaaeed7,0x9fe4dbea,0xdcc4055a,
  43645. 0x493d604d,0x17a6611d,0x1ce5ebef,0xba445a3a,0xe3989cb5,0xe82e2858,
  43646. 0x83f58406,0xb96f4282,0xa156cf55,0x99877b99,0x4e166a0e,0xaf906a66,
  43647. 0xb2976d13,0xcea1d353,0x36c61a01,0xefc16f27,0xb0f55d86,0xdb04c433,
  43648. 0x8eb34c01,0x3cb4b269,0x2ae60280,0x38d07f78,0x43be3ec5,0x43ac3bcb,
  43649. 0xe156fd20,0x455f4af3 } },
  43650. /* 18 */
  43651. { { 0x754ec21c,0xc057f262,0xe3a1ba38,0x3eacd4c9,0x116c1fe9,0x3a0210d1,
  43652. 0xeacc8ab6,0xe4ea4e94,0xea6f32ca,0x31c00c9a,0x86b975ce,0x5cb6239d,
  43653. 0xa14ea1e9,0x654d5d8c,0x5067fc8b,0x230d31f4,0x6355fecb,0x48bb90cb,
  43654. 0xdc172e8e,0x78f81ece,0xcb006737,0x288380a8,0xe162d012,0x19b02e01,
  43655. 0xc5af145c,0x0e087a06,0xb72dc354,0xf04dc8b7,0x8de3c066,0xf70ef214,
  43656. 0x13009fb7,0x4f148243 },
  43657. { 0x6e2055e2,0x5e004fce,0x86c32067,0x89e247ea,0x5f9daaa2,0x4ebcbd95,
  43658. 0xceb7f63b,0xd15f212f,0x863784a0,0x5ecc5c1f,0x75760251,0x53b3800b,
  43659. 0x8a6a2954,0xeb9301c3,0xa13cdd19,0x0f16ba18,0x887c2d24,0x8313d251,
  43660. 0x9a9413f6,0xf9923585,0xfe3fd7c5,0x423405e6,0x16e0ee05,0x678aeb34,
  43661. 0x3fadaab0,0x1f3be7bb,0x82884471,0x7901fa2c,0x4d662ff6,0xc950db30,
  43662. 0x3c01170b,0x74d5d2d4 } },
  43663. /* 19 */
  43664. { { 0x2b5bfe11,0xa3002dc0,0x52d321e7,0x0733410d,0x9679ba89,0x15920f65,
  43665. 0x685b236e,0x0e248c14,0x346f6040,0x8cfab594,0x40c717f0,0x9f57afb7,
  43666. 0x66044576,0x0dbab28c,0x9cdc3247,0x0fa09968,0xc230ed05,0x41e02ae2,
  43667. 0xe45bef74,0x0d961554,0xce4d7b6f,0x9688a982,0x5e62d22e,0xfadefac7,
  43668. 0xbd2cba28,0xaf1512a6,0xbe7c749f,0x78868e62,0xae9f5a6b,0x88048d81,
  43669. 0xc5857a29,0x6b1a5442 },
  43670. { 0x43242066,0x9f5ab9ad,0x2ccca2ae,0x0afef1b5,0x988edc4e,0xb1b43ec7,
  43671. 0x0341b0d5,0x0d0c00f1,0xb50aab37,0x4d68b8f7,0xf3a64a99,0x9a8e4e6f,
  43672. 0x7f1a684e,0x198338fb,0x351a0f5c,0x8bc0e748,0xdac44515,0x2cacf2cd,
  43673. 0x5e9ff76b,0xc14d3999,0x16393055,0x54a01b3f,0x888d8376,0x6ac3eea5,
  43674. 0x723277b1,0xb84d9a9a,0xe11dbbbf,0x99132691,0xabb67178,0x597717ae,
  43675. 0x8bb14ac8,0x4c213526 } },
  43676. /* 20 */
  43677. { { 0x95532833,0x2e6fe0a6,0xd626d067,0xabca228e,0x649e73bd,0x22aef3d9,
  43678. 0xf03c4c0c,0x2083a87a,0x35169b45,0xe954e75d,0x74506a89,0x577509ee,
  43679. 0x2aeacf90,0x49cb276e,0xfa409f91,0x08275d77,0xf0bbd6b9,0x61eb6f3d,
  43680. 0xe4132704,0x948202cb,0xb1c498b1,0x35f3fc21,0x361fee59,0x76c68ba8,
  43681. 0x50e051f3,0xa18cbbd9,0x318e7042,0x2384a879,0x80dd1e8b,0x292abead,
  43682. 0x5c37c334,0x65713c29 },
  43683. { 0xceb77b9a,0xdccca8e9,0x23b69469,0x2f97e727,0xa01d6b28,0xc76abee6,
  43684. 0x5abecdfe,0x3925203d,0x29290d70,0x89448082,0xb0314438,0xf9931424,
  43685. 0x7cd447c3,0x04209df1,0xc855c827,0x7c6f2059,0x56c0e069,0xd97d7862,
  43686. 0x412d94c4,0x5a9db6fe,0x994c41dd,0x19a64591,0xc89e21a3,0x12348aa1,
  43687. 0xc6a03f0e,0xd6904b50,0xa616feac,0x55c15156,0x7cc7693b,0x4e36d1b5,
  43688. 0x3bae3c38,0x6b0e996c } },
  43689. /* 21 */
  43690. { { 0xcceced00,0x32789fab,0xe5b7aa66,0x3237e71a,0x2ddebcdf,0x87b2e269,
  43691. 0xb61dad8f,0xb7245120,0xd35f803c,0xe11e5e48,0x98e50f0d,0xfb4df5d7,
  43692. 0xbcd2ab92,0x60ee68b4,0x1ce3363d,0x98ab2f5c,0x7cd42647,0x15ba39da,
  43693. 0x83f4fb3f,0x1a6572eb,0xe56f08db,0x0f77de88,0x172562c2,0x1743761e,
  43694. 0x8a58f0f4,0xbe349ff8,0x84d1d6e2,0xe04da71b,0x9e9ff3b4,0x368f0342,
  43695. 0x678223f8,0x4022a205 },
  43696. { 0x83847375,0x527bbd05,0x3f451af0,0x3ae56b62,0x4b2c7f18,0x6198f24d,
  43697. 0x4525b98d,0xee323f5b,0x0e0884b5,0xa9d8d39a,0xfb12c776,0xd005d7f6,
  43698. 0x708bc154,0xd71c483e,0x742541bc,0x8ca6fd28,0xf8397ddb,0x0af3dccd,
  43699. 0x3eccf243,0xb80d3125,0x58d81b8d,0xc743a108,0x71391f68,0x3f48eb21,
  43700. 0x33bb657f,0x493aff88,0x07e47e31,0x1d15ed66,0xe08279f6,0x10159b11,
  43701. 0x24a6a956,0x312179cb } },
  43702. /* 22 */
  43703. { { 0x07615ac2,0xa94cc3ca,0x121ad581,0x85865e64,0xa7986b79,0xae47616f,
  43704. 0x9d5e0f1d,0x395a40eb,0x3d9457ea,0xa9143264,0xfa2865d9,0x8de6d6a3,
  43705. 0x1014ae8c,0x0771db96,0x976a87cb,0x77a7cce6,0x143a0f60,0xa7de42e1,
  43706. 0xd993d934,0xe203cc09,0x98ec4c3d,0x92018693,0x3a25df4b,0xd77546d8,
  43707. 0x62b02d6b,0x0ad9eb47,0xd05a7189,0xfaaaf208,0x431221bb,0x5238181f,
  43708. 0x733511ea,0x417d6c78 },
  43709. { 0x0e91e9a8,0x3cbd81b7,0xc370d6b3,0x73340418,0x8eaa2373,0x825db10a,
  43710. 0x6c7d6756,0x8f2b09e4,0x94c33ded,0xe288ee9b,0x1695e3fb,0xcd8426bb,
  43711. 0xdce9e888,0xa6176c86,0x6165e362,0x3f4c8922,0x6063fb09,0x514e411f,
  43712. 0xc8f9e04c,0x6907ac20,0xdfd2ad61,0xcef7469c,0x8452199a,0xba30bae4,
  43713. 0x12ac3462,0x30681293,0xc92d482d,0x011be873,0xe8330995,0xff4cbf89,
  43714. 0xd1470a0a,0x02189d52 } },
  43715. /* 23 */
  43716. { { 0x92599c69,0x73e419dd,0x7fec32ca,0x5b94221b,0x09bbfbfd,0xb2bf9bd2,
  43717. 0x63ed895b,0x61ea97a4,0x3f486f79,0x6609146b,0xfd141a39,0xbd1c7a05,
  43718. 0x83d64135,0xc79ec8cf,0x9883507b,0x7f8fd42f,0x17b3d027,0xafcb53b7,
  43719. 0x67ca5a21,0x86658dcd,0xcd149786,0xa6a6c0ac,0x34b95067,0x16f3d70e,
  43720. 0xdf44958c,0x371208e3,0xec280212,0xd2dd64e6,0x30782c71,0x33b2c4ab,
  43721. 0x521176fa,0x7bbf8abd },
  43722. { 0xa78b981a,0xbe9e4aaf,0x304ec828,0x788b4e36,0x3959dea3,0x0c45cf39,
  43723. 0x240b39c7,0x70a9bdd3,0x28383b7d,0x499cd7dd,0x307a1026,0x30690b2e,
  43724. 0xee92f1b3,0x2262d598,0xb4725a48,0xc62d77de,0x7bc3aa0e,0xa16f25bc,
  43725. 0xd15ef7fa,0x62dd8b65,0x0b96d68f,0xd979221d,0xa00f1906,0xb92885c3,
  43726. 0xeb74c740,0xfa476b9b,0xc7576222,0x217ddbb5,0x5788504f,0xc2782c30,
  43727. 0xf812716b,0x860d096c } },
  43728. /* 24 */
  43729. { { 0x4d79bbf9,0xfebc337d,0x69f74f80,0x5d53eab8,0x33104d53,0xff36a095,
  43730. 0x196f8b97,0x2ab820da,0x75ce6909,0x961d3d1f,0x04683754,0xb197ec04,
  43731. 0x93a6cb9b,0xa68ce1bf,0xc5f021a3,0x503456ff,0x8940ffdb,0xb50a2db1,
  43732. 0xef004209,0x77c50f8f,0x04965875,0xd635d177,0x8bb8770a,0x725766d9,
  43733. 0xa078e53e,0x8e19b028,0xf9fc8378,0x364d4cca,0xf0dd39a0,0x1a3df411,
  43734. 0x03adf920,0x7e80e442 },
  43735. { 0x539a1ddf,0x4b5f8a57,0xee486562,0xd248e7ae,0x816021e1,0x1c7b491d,
  43736. 0xfd36d2c4,0x2e7b871b,0x0aec00d9,0xda38b504,0x6193f1b3,0xf2827612,
  43737. 0xfb1f78d6,0x69c3fe86,0xe827ac33,0x56c8b786,0x3487c8f7,0x1687f6c7,
  43738. 0x19dee5bc,0xab8f2217,0xff399418,0x04e8473f,0xa9027c80,0xf384c014,
  43739. 0xaa1d2e28,0x9967be9a,0xe065eef1,0x869686d3,0xc7bd837c,0x737c6b08,
  43740. 0x9e8bd863,0x5dcab5d1 } },
  43741. /* 25 */
  43742. { { 0x9a7d772b,0x0784283a,0xe540959b,0x6b49e525,0x86414ab5,0x546bb008,
  43743. 0x9d74b2a9,0xd4448162,0x203b0b1b,0x267890ad,0xc8d3f86b,0x1e7a82bc,
  43744. 0xd85a83c7,0x1352bfb5,0xfad07ccf,0xf29f16e3,0x41e0c43f,0xc02a63b8,
  43745. 0x6b379fef,0x904f22c5,0xb1244f26,0x19d8a653,0x3a28bdea,0x6635b6df,
  43746. 0xf6d455ce,0x18b68851,0x9cff3735,0x74ac2818,0x8b2cbdab,0xad40f9df,
  43747. 0xadc9d498,0x08cc2d9e },
  43748. { 0xc170c84b,0x2e6a6866,0x5a49a484,0xbb989e8b,0xd04c8992,0x7b0e00e0,
  43749. 0x61b3a423,0x55ad3478,0xb0d01899,0x3c952450,0xe3100cb3,0xe3922155,
  43750. 0xf03276d0,0x19265b6e,0x76d42b53,0x0fe8595a,0xfc6353b6,0x0a96dee0,
  43751. 0x246f893e,0x761e0dc8,0xf0a74cba,0x4ec902be,0x3fdfad9b,0x61008684,
  43752. 0x4fdb6975,0x5d6a60e4,0x7ef7590a,0x3f53aac8,0x12870a37,0xd29e6be0,
  43753. 0x55aa55b0,0x991fadc1 } },
  43754. /* 26 */
  43755. { { 0xb4844ffe,0x82bc4b0f,0x60f8b871,0x73922714,0x4ce3f1f3,0x8ac000e2,
  43756. 0x163519ec,0xf0d548b4,0x88288b5f,0x7aaf842b,0x2bdc9a70,0x9e8b0c4c,
  43757. 0x4ba5fd67,0xa06d5152,0xf93cdec3,0xd0b1afa0,0xdf89f8f0,0x280955ba,
  43758. 0xeea32c92,0x86cbe92d,0x3fe05be4,0x0cae3f99,0xfa6919aa,0xf2607095,
  43759. 0x6e0f1b8b,0x0f54741e,0x30ecf988,0x2aed1f74,0x734991d7,0x9296f76b,
  43760. 0x259f0fe9,0x66cf8d28 },
  43761. { 0x226f5868,0x9b01905b,0x16909e9e,0xc102e88c,0x4a37eb54,0x2bd08916,
  43762. 0xc9816323,0xf72253e8,0x86bac53c,0x37f84e9d,0xafeaaaf7,0x2e352454,
  43763. 0x2ca0046e,0x67c86f77,0x6663372e,0x86bce50e,0xb6950a04,0xf6a3a960,
  43764. 0xfc1aba93,0x61f994d7,0xc1326e6e,0x1957c12b,0x2e56b005,0x9b658fe4,
  43765. 0x8592740c,0x9cd297fc,0x177f26a5,0x7654ce9b,0xa79d2ebb,0xaaa699db,
  43766. 0x0ecb6448,0x5fca0c5a } },
  43767. /* 27 */
  43768. { { 0x569a6663,0xe26e25f3,0xe6aa4ca7,0x09597ee7,0x8d18b80c,0x25a4cda6,
  43769. 0x22926730,0x450602b5,0x07387209,0x9af5f650,0x26733a53,0xfeeedb34,
  43770. 0x86572951,0x0f5ce768,0x8398ae9a,0x872a360b,0x2b30f6c3,0x60347a80,
  43771. 0x1a162158,0xd2113b23,0xee6c6dec,0x6fd9cf92,0x5cbcf9e6,0x85f0a5a8,
  43772. 0x2ba3fe84,0xd7a5a6e4,0x51ecd727,0xaafe6720,0xa2081a10,0xe09c6bb2,
  43773. 0xb973b0b4,0x657acbf0 },
  43774. { 0xc274c8d4,0x3130466f,0x30a994d1,0x42765176,0x7079435f,0x217258ca,
  43775. 0xeb897a06,0x44850406,0x561ee130,0xf38dfeee,0xaa1778bb,0x11f4facf,
  43776. 0xb9abb9e9,0x765c6617,0xd8f10932,0xb135499b,0xa73b9159,0xc0eb6337,
  43777. 0x6f7e8b6a,0xf2c1ccf1,0x187def53,0x5b32c03a,0x830b9c62,0x89ad1d49,
  43778. 0x2f10e538,0x1735eae3,0x9d5f55bc,0xb1cbd9c2,0xe539db0d,0x42428c47,
  43779. 0xc852b3bb,0x3d2da412 } },
  43780. /* 28 */
  43781. { { 0x871f2865,0x97702b6e,0x142920d6,0x56cb639f,0x45b58611,0x328522a0,
  43782. 0xf3b13812,0xf3943ad1,0x712206e8,0xe6c2200a,0xa34d59ea,0xc2890e5a,
  43783. 0xf6b7f759,0xab52fd40,0x180bf567,0xf522c8de,0xaccee396,0x181e97b2,
  43784. 0xc4ea5cbb,0xe0375819,0xab51d3ef,0x0d9985e8,0xbcb50fd8,0xe26c96ca,
  43785. 0x97e1c80d,0xfb9d6b13,0xf796357d,0x582b1814,0x07f4c7fb,0x89a78221,
  43786. 0xc0357e61,0x02aeef2d },
  43787. { 0x2c7ec9be,0x2ba7926f,0x7258b201,0x292f307e,0xc6fa6b4a,0x74e62a10,
  43788. 0xe2bcc5ab,0x80c08549,0x7bb8c073,0xb4160db8,0x329f194d,0xd5ef0529,
  43789. 0x6dda4a9c,0x0eb8da14,0x15ea23d1,0x0b5d43d2,0xfc34bfae,0x6cebef02,
  43790. 0x848757a7,0xacd364d0,0x2d34cca3,0xc1401368,0x1d2d95e2,0x09ca6742,
  43791. 0x786eaa28,0xc3fd1d6e,0xa2965fec,0x9eb1136d,0xc0779203,0x48871baa,
  43792. 0x4b15aeb0,0x6b446c01 } },
  43793. /* 29 */
  43794. { { 0x25e8fe80,0xc819eb2e,0x98238a17,0x2b5f7906,0x81e41849,0xd6f1e996,
  43795. 0x98ea6d45,0x58ad8ad6,0xbfd02e40,0x5bae5ad4,0xa812416d,0x016dc327,
  43796. 0xa3347ca1,0x8b31a985,0x82a65391,0x0b4da610,0xb48c35fb,0x1cb91b2d,
  43797. 0xd2aaf8c4,0x9e96817c,0xcdfdcdc0,0x1a630483,0x12b69254,0x70559361,
  43798. 0xf8a2a097,0x5fdcd712,0x35cc5281,0x59ab623a,0x932b6095,0x30c8ebe0,
  43799. 0xb08e052f,0x8613424b },
  43800. { 0xb2231d8a,0x28902063,0xd9a61667,0xb0f62329,0x071a9f27,0xaafa0fe7,
  43801. 0x603f047e,0x6bcd8960,0xfd92a1c3,0x118cca76,0x71d483b6,0x3414e62b,
  43802. 0xba705262,0xa123ccdd,0xfd9b5c5a,0x1a576437,0x4c8d0fa3,0xa5301bc2,
  43803. 0x102427cd,0x96f0ad44,0xd3aa6c02,0x0e6fb5e0,0x072a3996,0xcd8c4880,
  43804. 0x840d3fad,0x4dafca12,0xde91d541,0x29f4ca3d,0x8441734d,0x0037c598,
  43805. 0x9ccfe57c,0x86333a99 } },
  43806. /* 30 */
  43807. { { 0xecf53b40,0xd213a751,0x2f78a542,0xcff2c6f2,0xf13ae56d,0x0f59f0e2,
  43808. 0x0e61748e,0x91f8ccbf,0xd72c4145,0x0aadecb9,0x4c9cdcb7,0x6b2ed852,
  43809. 0x1eaffc70,0x8e00b72c,0xaa728102,0x89b24285,0xb679cafa,0xaa7ea7e0,
  43810. 0x4f0a6f6f,0x5d2b8c26,0x0e804397,0x7ed7b173,0xc8573049,0x5a93eb45,
  43811. 0x0986e93e,0xc92bf5d4,0x6a20c0af,0x526b5a9c,0xb99dc3af,0x0adf47c9,
  43812. 0xba202cc9,0x12b25fe2 },
  43813. { 0x33eea395,0x09b8d78a,0xf633fc5c,0xc7a93618,0x270eceef,0x7e821629,
  43814. 0xc628ed0c,0x524779b8,0xa1d68939,0x91db5ca1,0x586edc90,0x8626e18e,
  43815. 0xfeb3f3bf,0xfe023e8b,0x0250171c,0x6279fde1,0x55e172de,0xe52ec7dc,
  43816. 0xc6d4ca45,0x445e8695,0xbdbc10f1,0x42de3878,0x6fc3835e,0x2b114de8,
  43817. 0x7e10b652,0x9faba456,0x390e78fe,0x4111d82a,0xaedf0aca,0x576b61c2,
  43818. 0x74accb74,0x216279a9 } },
  43819. /* 31 */
  43820. { { 0x4047f747,0xc14cdabf,0xc1315a1e,0x03ca233d,0x40e5d0a7,0x59e7cbd3,
  43821. 0xbb413869,0x1fd0c4e9,0x0f01fbd8,0x189d08b1,0xa76b823d,0x50449c42,
  43822. 0x398b00a1,0x81c224a1,0x8e8179e4,0x08084e4f,0x698e41e9,0xfd8af994,
  43823. 0x5610bf2e,0x1e30e37c,0xa7d2790f,0x4e6a043f,0xb3195388,0x9d96e60c,
  43824. 0x03799dfd,0xe75f986d,0xf8ff902f,0x3b4a8f11,0x7588416e,0xfa945378,
  43825. 0x9827535e,0x20683e3f },
  43826. { 0xd0378878,0xcb582e26,0xa7945787,0x9e214c23,0x8f6688b3,0x13d000bf,
  43827. 0x40515270,0x7548d4f5,0x40111f5d,0x7113c15d,0xa8bff902,0x3bf5a526,
  43828. 0x9b4945cc,0xbda6b010,0xbc2f3a05,0x83dcc74e,0x43efdfa1,0x2aef6284,
  43829. 0x565c5bf4,0xd2e60ee9,0x592f243a,0x4f0fa10d,0x1bc3bf51,0x6ae58b32,
  43830. 0x60576a74,0x813b0868,0x4d73081a,0x0bc023f8,0x32dcee59,0x9fd03aa0,
  43831. 0x27d6c795,0x5e416bf5 } },
  43832. /* 32 */
  43833. { { 0x026cc23c,0x24313760,0xb5b29058,0xf819aaee,0xc5d2ee17,0xa92272f8,
  43834. 0xee5cc402,0x8048e7cb,0x77def07d,0xdbc7d6ee,0xf6af821e,0x61d69244,
  43835. 0x996cbb89,0x5f7966ed,0x96a155a4,0xf81b17ea,0x03f3ed56,0xb2d9ef70,
  43836. 0xe882a5b2,0x5e6e5906,0xae947180,0x86fa1072,0x658c76f4,0x34d9fc51,
  43837. 0xcb035aa0,0x9f603dc0,0x75be6481,0xb7b39feb,0xcf04a9ef,0xca87554a,
  43838. 0x87b4fde3,0x4ff682ec },
  43839. { 0xd0a10ad5,0x3125627f,0x968e6f45,0x7fd45c72,0x806a1163,0x2981bd6b,
  43840. 0xde5033e3,0xb92de1cd,0xbf4f8988,0x3b44b45e,0xdae7e1dc,0xca1b9896,
  43841. 0x0778d878,0x52166e5a,0xa5116847,0x82d472be,0xf2895445,0xfbdd382a,
  43842. 0x5d6ec4c9,0x22ed1602,0xb6552b02,0x3614eb1c,0xa1e6210f,0x63c5df73,
  43843. 0x021a74a7,0xe9160285,0xc65cbd4d,0xa44ca400,0x0f15e299,0x48cb187e,
  43844. 0x3402507c,0x51eb818e } },
  43845. /* 33 */
  43846. { { 0xb92100ab,0x1fc1d178,0x9605b839,0xdf2e3d60,0xb71e59d0,0x12a7c255,
  43847. 0x14fcbe04,0x3f8b6675,0x59fd06af,0x0e8a3935,0x12020d07,0x56326502,
  43848. 0x528e7be5,0x6696fcd1,0x0c7b7654,0x6588514b,0x5912a5b5,0x0cd80f8c,
  43849. 0xf324cb7f,0x8bafef04,0xc6da3d75,0x6b53eecf,0x31d1df2f,0xedef48d8,
  43850. 0x73812b6d,0xf336b965,0xee626031,0xc82eae4a,0xd244f09b,0x300abd32,
  43851. 0x31d9647f,0x8b0af955 },
  43852. { 0x2e603544,0xb770180a,0x221acd9e,0x2b573ac3,0x62407032,0x3a17f665,
  43853. 0xb89abc3d,0xad3e74ad,0xd793225a,0x8a3d2e3a,0xef02564b,0x457bba04,
  43854. 0xfc2dd2b5,0x8875652f,0xe67143e8,0xd2905d15,0x02e48d70,0x6d884b42,
  43855. 0xc7636a57,0x06f99219,0x35e378df,0xa8dc3421,0x10c64a02,0x95c1d73d,
  43856. 0xcc157a66,0xcd6a4ece,0x8e24a354,0xbadcc1c8,0x9839329d,0x8024f1b2,
  43857. 0x4da48ad0,0x5363e549 } },
  43858. /* 34 */
  43859. { { 0xe23fc641,0x1f5523b7,0x86667063,0xfe54e72f,0x8e009d2f,0x294a15f5,
  43860. 0x8c57f5e1,0xf203997f,0xb16d64dc,0xa229724c,0x4baa2ffb,0x697be4fd,
  43861. 0x0a6e8ed6,0x3f507e46,0x78508536,0x0afe3a5d,0x95408208,0xeeef6cdd,
  43862. 0xf2c4237c,0x701fd889,0x5c385253,0x496d883a,0x72a212f1,0xe25c67ed,
  43863. 0x1ff78fcd,0x4b416783,0xc16f4146,0xe9967004,0xc45b0697,0xfa45c3a1,
  43864. 0x3fbd30c3,0x63334018 },
  43865. { 0xa2fbbbce,0x39c9a0cc,0xaa0cb744,0x876f6e5c,0x3438ece3,0x9ce6010e,
  43866. 0x13802d82,0x0aad148e,0x9cd45a1b,0x9c3e5c60,0x7bcfc1e0,0x875cb859,
  43867. 0xd8584dd0,0xb19ff790,0xd81c2a2b,0x2598b81e,0x02be07e3,0x118bdf2f,
  43868. 0xb9765ce9,0x074fc8ee,0xb24f95ae,0x125e9d88,0x0c98f09d,0x3bb12cdc,
  43869. 0xa0b74b27,0x4a6aee07,0xc08077ce,0x4723d2f9,0xbea8026f,0x959447d6,
  43870. 0x16280b73,0x93a7075c } },
  43871. /* 35 */
  43872. { { 0x715b27f9,0x26bbefe2,0x2a280923,0xa935a5e2,0xfd58a26a,0x5ddf23af,
  43873. 0x7c138694,0x54c83e16,0x892a2153,0x44799bc9,0x9b8d09f5,0x4e6e4710,
  43874. 0xd588ea68,0xc63af616,0x883ab1b6,0x5e896706,0x3d209336,0x3c1393a0,
  43875. 0x92c23dda,0xd02f2921,0xdcf6ea43,0xab70cb7a,0x791559e1,0x12434ea8,
  43876. 0x6d70ff0b,0x040680db,0x2832ba45,0x1a10fe52,0xe5f0cb8f,0xd69f9c08,
  43877. 0x44b141fd,0x1a7422ac },
  43878. { 0x9f40b675,0xc3a9dd2e,0xfcc71f39,0x2a7c6603,0x1948e342,0x18939a61,
  43879. 0xed0ab484,0x8f3b6158,0xee31ca6b,0xa3aa7d97,0xf7a8db63,0xbc1e865e,
  43880. 0x2c7c62e4,0x315f8c09,0x9f5c6d0f,0xa260788f,0x4b6f3ec5,0xb1833129,
  43881. 0x36b4d849,0x73adbcd6,0xbc699a9b,0x66e14890,0x2a1175e7,0xbf3790d8,
  43882. 0xfc53ca4f,0x7f43605a,0x87ff6091,0x577f6c47,0x600c82b6,0x827c7552,
  43883. 0x9d25599c,0x0944d630 } },
  43884. /* 36 */
  43885. { { 0xe6ab9620,0xcfdeb63e,0x786cd808,0xdff4fa6d,0x456320b3,0x145edd82,
  43886. 0xc4943915,0x2ae5f862,0xb73b3f87,0x9508e813,0xe52f97a9,0x3bd805f3,
  43887. 0xc9829b62,0xf71b5c28,0x86e0cefc,0xb394c70e,0x23bdb36e,0x534fb1a9,
  43888. 0xdbe27e5a,0xd64f5862,0x83ab6169,0xbae23df3,0x27c828cb,0xdd6df1b1,
  43889. 0x3a307a8a,0x1901899f,0x811ddf66,0x36cc8659,0x79943b77,0xa3cb7774,
  43890. 0x6fd86576,0x7d89f383 },
  43891. { 0xc9f92b2b,0xf8564242,0xc46e32bd,0x700c6a75,0x7f99a5c5,0x93e768b7,
  43892. 0x03149568,0xb6efe858,0xc2ce6709,0xbbfe8a19,0xee6ec493,0x721a3b1b,
  43893. 0xc371c28d,0x26eeeea9,0x15177e1d,0xd798115e,0xb068a5a5,0xd7bf3bce,
  43894. 0x46d2b4b2,0xdf8da220,0x59be9dfc,0x3df0995b,0x77640b79,0xc96897bc,
  43895. 0x5a2bd3c5,0xce0cf4c2,0x89afe744,0x16f45d6e,0x3a8509bb,0xb53f3acb,
  43896. 0x63f2a6e6,0x449af81f } },
  43897. /* 37 */
  43898. { { 0xa16d9377,0xc2fcf132,0x7e1a2f9e,0x9ab377b3,0x86d19ae5,0x72e1a12e,
  43899. 0xd013bbb1,0xd2b12e66,0xcb5f66ba,0x0972e055,0x399eab50,0xd11de1c0,
  43900. 0xc65f5ec2,0xc1f314fd,0x8a9ff593,0xfc311841,0xe05246e6,0xdf73c1ec,
  43901. 0x1625056d,0xc28d1363,0x6fb25e19,0x30a9dbd7,0x845cd2d7,0x049ed244,
  43902. 0xd36e852d,0xc779b83f,0xf68c8a83,0x85a35fc7,0xc95e8033,0x299bf1e1,
  43903. 0x20891af5,0x0e8617c3 },
  43904. { 0x67c81b5c,0x53720602,0xe737873c,0x2fa89dcd,0xa8144fd0,0x2a7430b0,
  43905. 0x26208c83,0x3006c5a7,0xd8ea40f5,0x4e066660,0x896413a4,0x9dd025f9,
  43906. 0x46b9149f,0xbdf380cc,0x0a125cc2,0x80156619,0x52793c37,0x04d6a3b7,
  43907. 0x6b7a62f2,0xb6001374,0x585d5978,0xa9cfe268,0x8395fe66,0xdcad0cb8,
  43908. 0x46b261f6,0xbab468fc,0x9d9d9218,0xca0ef5ef,0x5e452402,0xc507d4a8,
  43909. 0x326cf687,0x6f4404f1 } },
  43910. /* 38 */
  43911. { { 0x4febd3ff,0xa3e1920b,0xfdfd2bba,0xca6234d8,0xe19a9829,0xb7d1af2a,
  43912. 0xc6f5bc20,0x23de1610,0xdaa39ca9,0xe204dbf3,0x6d8c70ab,0x2a2de9b8,
  43913. 0x7c9d370b,0x272e0c37,0xe565510e,0x80914c06,0x57cbb6b0,0xb611e7a8,
  43914. 0xd8266a6e,0x076fc6ef,0x3095801c,0xdfac34ee,0xb9e24063,0x69ff40a2,
  43915. 0x787aa5c5,0xa7ba31a9,0x33c70cd2,0x0e4d1fdf,0x6895f074,0x903e3132,
  43916. 0x7fb671e2,0x905771f8 },
  43917. { 0xa4062bee,0x5199ba0d,0x94d7d9f9,0x18e7238c,0x1e0922c0,0xf53f29bc,
  43918. 0xb12d855f,0xde9b2a81,0x6d68ca29,0x649f3eed,0xc50c097f,0x64adfc34,
  43919. 0x9db398a0,0x81964ab9,0x7a587224,0x00d59c47,0x74c5903a,0x09fea396,
  43920. 0x15043dd0,0x6aafd8ee,0x5f1ecc20,0xc5721a6e,0x0db9b7b4,0xb6d6a483,
  43921. 0x66c8d52a,0x06ffc617,0xacc82a27,0x3de241d6,0x27f2f7a8,0x0605f052,
  43922. 0x6404decc,0x6a22953b } },
  43923. /* 39 */
  43924. { { 0x74fce389,0x92452d8f,0x2afa5564,0x059634c0,0xf0ed7825,0x9377ccbb,
  43925. 0x37718e0d,0x89f4045b,0x9fa69a4d,0x11074e7d,0x7295b0ba,0x5d70bb07,
  43926. 0xf107ede6,0xb22d54ad,0xa1a29c7b,0x5c39a3d8,0xd795e3ab,0x37236c02,
  43927. 0x2b589951,0xf7282d00,0x5790bee2,0x5e2265be,0xa8e65ea2,0x91e0ea11,
  43928. 0x6001cebd,0x0e71a708,0x2c1c5402,0x16900f5a,0x357f6981,0xc3b2d5c0,
  43929. 0x619e3427,0x528c9ea0 },
  43930. { 0x5f26c577,0x1edc86b4,0x9438bd45,0xf8074708,0x792582a7,0x2dfe1013,
  43931. 0xde1e569f,0xe08eaca0,0x9a55a356,0x5f952efa,0xe4976216,0xa4d80b53,
  43932. 0xcd5d71f2,0xd2b65855,0x66cea3f0,0x246704bf,0x492323ca,0x193f641f,
  43933. 0x9adb1325,0xa681855c,0x2d19d652,0x86d522ce,0x5b82ed7b,0x53609f10,
  43934. 0x8e150d29,0x3b0f0094,0x0b13e891,0x23ad8bfb,0xf794b449,0xcbb1556c,
  43935. 0x738bcf57,0x200f9093 } },
  43936. /* 40 */
  43937. { { 0x8388387f,0xf9b22fc5,0x28e883c5,0xcf26f170,0xd1b7973c,0x447cab90,
  43938. 0xf6ec9171,0x8d5d4ea2,0xc30cdbc0,0x2e16f498,0x48623c2b,0xdc92910c,
  43939. 0x30dbc545,0xeb1491b0,0x14de21b0,0x631deb2e,0x2fe830f4,0x04a21066,
  43940. 0x379c1f3f,0xa4c6979c,0xfb06a795,0x8a732b68,0x1619dfa9,0x3a44327a,
  43941. 0x8dbe2c9b,0x91a307d3,0x03989fea,0x939bc8d2,0x0f4a331f,0x3daabaf2,
  43942. 0xdd0f55dc,0x5c307e98 },
  43943. { 0x35b233da,0xbbc4e0c4,0x22f6f985,0xe3d29085,0xa8b02468,0x99dd2d21,
  43944. 0xa96916e7,0x978f40e9,0x614bcced,0x0327d86c,0xb290762c,0x95e95502,
  43945. 0xa879f2ed,0x0ffd2197,0x50e0bd33,0xc4365137,0x0827c4c4,0x26c3148a,
  43946. 0x3fcfc0b2,0xc79812a8,0x31928589,0xc3d8d17e,0x8830f42d,0x8b572cfe,
  43947. 0x4b07f83f,0x7cd9ff92,0x0a51148f,0x331ca950,0x4c59f9ac,0xd0c53968,
  43948. 0xc1434785,0x1df16dfa } },
  43949. /* 41 */
  43950. { { 0x68bcacc3,0xcc7bb4ac,0x430f58cf,0x06ded34f,0xd461855a,0xc59f9f4f,
  43951. 0x45c9f0bc,0xf5491994,0x4375c892,0xdc5f7ec6,0x3c85983a,0x1b8708f1,
  43952. 0x82fcd087,0xb32a5cc4,0x2d6b4c0f,0xefdcdc35,0x8ac6fb2d,0x4bb24f04,
  43953. 0x33906471,0x5982d4f5,0xb83a3ac4,0x162eb52f,0x2337a223,0x7130df28,
  43954. 0xcbc3dbd3,0xdce7b802,0x2467ac0e,0x8b395959,0x1b56717e,0x21d3d2e8,
  43955. 0x46512617,0x729a7f50 },
  43956. { 0x8420f90a,0x874ed1aa,0x0fe4c855,0x6368e19e,0xb0be74af,0xb62d4aaa,
  43957. 0x8ca60ca9,0x76fcc480,0x7645a867,0xf310b5a5,0xddb1b24c,0x131bac9b,
  43958. 0x2dea5b44,0xef77d71d,0x72fcc64e,0x4706d210,0x673d77f0,0x29b92691,
  43959. 0xe89e0663,0x22e00bf3,0x74077d40,0x472d0cd3,0x829232e2,0x3e21040d,
  43960. 0x38dc8533,0x2f916dfb,0x14b8f667,0x48bbb59b,0xd44be19d,0x19de9f4a,
  43961. 0x232d9d5c,0x7f6d3649 } },
  43962. /* 42 */
  43963. { { 0x6e794819,0x3bd064de,0xf82ebda1,0x5a6b694e,0xb91e2804,0x1f017fe0,
  43964. 0x07a43cd2,0x190d31f3,0x630433e9,0x6c26f226,0x0abfdcb4,0xba488aa7,
  43965. 0xa46411c0,0x418d9085,0xbffb5880,0x1b934fe6,0xe200f849,0x75d1e237,
  43966. 0xa55413db,0xdf04d63f,0xe23b3f77,0xe216ed75,0x0f91bd30,0xa05866cb,
  43967. 0x7729c509,0x84c395d9,0x452ab2d7,0xec97e188,0x0093d686,0x8cb7c1f9,
  43968. 0x628f086c,0x2d032395 },
  43969. { 0x4a44b4c5,0xa81c9407,0xcc702c98,0xb9846879,0xceb0dc97,0xcb502287,
  43970. 0x6e3aa321,0x30301126,0xe4c256c2,0xc0ac8763,0xe55b4845,0x65034d20,
  43971. 0xf240f35b,0xaa96a040,0x7cf7eedc,0x046d26d3,0x3b810656,0x62a5a8e1,
  43972. 0x83d70c2b,0x86044b97,0x59e4da8f,0x2fbaff88,0x5457f5d1,0x929d901a,
  43973. 0xb531b757,0xd29e1eb2,0x9e4e9739,0x214dabdc,0x4eaa9bd9,0x5bd724fc,
  43974. 0x1ef9bb9b,0x734c12b3 } },
  43975. /* 43 */
  43976. { { 0x92f9b086,0x98fe3c2e,0xb3fd4544,0x4641b93e,0x5c02c65c,0x47ce208b,
  43977. 0xc4f03242,0x8a52dca1,0x679d29f6,0xb5ec17d9,0x9406f5f4,0x11d2fed0,
  43978. 0x0d9ba811,0x260f63dc,0x15472a3f,0xde2b056f,0x007290e6,0x1b170d9f,
  43979. 0xb6b5c8f9,0xa2e23e8d,0xcf34c3ee,0x345a2839,0x1b973ee2,0x9bdc5461,
  43980. 0xbb24d1c5,0x65bda6c2,0x3c6141a1,0x97d52ba3,0x9d2eb201,0x47bb1612,
  43981. 0x21fbe49f,0x7c558a87 },
  43982. { 0x3f350fec,0xb9485a52,0x6a38d4c0,0x016678c5,0x0d5aa64d,0x8ef346a2,
  43983. 0xd96da2e4,0xb85daa02,0x4f647b3c,0x845ec4ea,0x0d5e946c,0xc0d1a6ca,
  43984. 0x4fa9f4ab,0x41d8d1c1,0x9c8b1303,0x43972cc5,0x434ffbfb,0x67e1f48d,
  43985. 0x819d2318,0x350ce93a,0x6ddef23f,0x49f53090,0x200cf12c,0x3c2e6cf9,
  43986. 0x640432fc,0x42691cc1,0x72496b52,0xbfff74b4,0x020a97be,0x44527c9f,
  43987. 0x7b3c4348,0x34cd7dca } },
  43988. /* 44 */
  43989. { { 0x59e7fe87,0xf031761a,0x0047cd72,0xb1eae31a,0xfae30f62,0x27902e68,
  43990. 0xb71db143,0xa666f48d,0x0e0038f4,0x75ee6678,0x02bdd76d,0x3b45ac67,
  43991. 0xa0d6cd5c,0x0d2fb828,0x9d8c5b11,0x27ce7f1d,0x120b5e96,0x141fe0e4,
  43992. 0xb9267c37,0x95a1b984,0xd60312cd,0x5206e589,0xda549356,0x1867342e,
  43993. 0x070c74ac,0x374520b9,0x9557b0b3,0x2703cbb5,0xa6ed8c14,0xf621f59c,
  43994. 0xabf7b887,0x7ceb1cc2 },
  43995. { 0xdb7fd65b,0x0647a5bb,0x36c9457c,0xd8d45cc0,0x9e12718a,0xc6da99db,
  43996. 0xe93a7fb1,0xed1dbbf4,0xbd1566a1,0x4512c95c,0xdbc0c919,0x4861ba00,
  43997. 0x9e7f5269,0x3c6cc298,0x0941aaae,0x67196150,0xc8c538e3,0xbfcf5d0f,
  43998. 0xa25a551f,0xad6e9929,0x17ca0f26,0x90710985,0xfa89ef7e,0x743b78ea,
  43999. 0x71ab4549,0x39d5ea31,0xe6d1c36d,0x7442f3f3,0x059d568d,0x25a683e0,
  44000. 0x227ced5c,0x1f629a99 } },
  44001. /* 45 */
  44002. { { 0xe45a1c3e,0x8925ddac,0x41f7545f,0x72d29365,0x37e7f828,0x45622fcb,
  44003. 0x3e4c79d2,0x88234513,0x9c2645d6,0x5dffaf84,0x994802b9,0x3078f4dd,
  44004. 0x9d339fa0,0x566927f0,0x9fd91dcc,0x9a500a1e,0x0ab0abd7,0xce008180,
  44005. 0x8194e5df,0xd97135a3,0x98adf088,0x9e876307,0x9a45a2a7,0x3baf01b8,
  44006. 0x788b4399,0x6fed6154,0xe77a997d,0x980e5722,0x2a378eed,0xaac90ffa,
  44007. 0x8bd805a2,0x4a75fda2 },
  44008. { 0x55e74cbc,0xd09a8fbb,0xfab18f25,0x737738ce,0x9764ec3a,0x0fc23ad6,
  44009. 0xe7e0ad31,0xc5a7d35b,0xe481cc9b,0xe75e068e,0x3d4aec34,0xf0c2ea99,
  44010. 0x0d4a63c4,0xf1324fe8,0x99b0592c,0x5dbb7c16,0xa7e0f46b,0x442d674d,
  44011. 0xa300faea,0x5a5d66c7,0x3333ac83,0xe83dc821,0x8c408496,0x70ef812e,
  44012. 0x99ef5fc1,0x96e1dcb6,0x1734e862,0x6e2b771b,0x583507d8,0x04629cdc,
  44013. 0x23d8179a,0x5819f9ae } },
  44014. /* 46 */
  44015. { { 0x6aa78811,0xd9969121,0x2103e7c3,0xf64ee8f4,0x22b9e698,0xddf01070,
  44016. 0x4f582cde,0xe6001f9e,0x2ecfac1a,0x24a608af,0x06393009,0x6ef4c784,
  44017. 0xebf72911,0x5262eae6,0x8c4ee5a0,0xddbd0af5,0xecd87bc7,0x875aff90,
  44018. 0x6f24f114,0x2fddb34c,0xe865f172,0x48104281,0x886c1b9a,0x95692426,
  44019. 0x9ef4231f,0x6f5f3208,0xd0a7e82e,0xaf587acf,0x9ac395c8,0xd6571917,
  44020. 0x1364a750,0x7459603c },
  44021. { 0xf41ae519,0x1c2475bf,0x4af8f251,0x34401fb1,0xaefb2c3d,0x70ddfcd2,
  44022. 0x51cdaf08,0x9b2d385b,0x8208bb19,0x8531c256,0x4c33f3f6,0x16c89df6,
  44023. 0x24571769,0xc23cfa99,0x86d010ba,0x2339b51e,0x22638313,0x08db0e8d,
  44024. 0x00fedeb7,0xf769e179,0xa3687ef1,0x3fd96dcb,0x91476475,0xcd046b23,
  44025. 0x0c45c8dd,0xf3ff2064,0xb8343d78,0xefd167bd,0x4b77ee90,0x493ccb6d,
  44026. 0xb3cf7b45,0x33025513 } },
  44027. /* 47 */
  44028. { { 0x35eaaca1,0x36f00469,0x89119102,0x0c384b75,0xe6d2954c,0xcb375665,
  44029. 0xb1e9d6d7,0xcb9199b9,0xc29c2757,0x75852349,0xb8e738d0,0x89cbd1ba,
  44030. 0x5923a427,0x9b8dbe90,0x18fe1889,0xa237793e,0xa742e083,0xa4271757,
  44031. 0x4eebd613,0x8c4979d2,0xd4f2cf77,0x40325054,0x958705de,0xa3b8a091,
  44032. 0x33d999ba,0x1b191bd9,0x3b0fee1e,0xbafefba4,0x3facdf14,0xb3bad184,
  44033. 0x4387561c,0x9328adb0 },
  44034. { 0xf906b872,0xabe84e80,0x78262665,0x705523a0,0x3398ccf7,0xd89c6a7e,
  44035. 0xf55b5323,0x2fab551d,0x0554dea8,0xa0578eca,0x375589cd,0xef26523d,
  44036. 0x864ad750,0xd8fd6242,0x178fe1fe,0x93f27fc5,0x9df87422,0x7b3e6f30,
  44037. 0x3750d054,0x2862e49e,0x5dc038a1,0x7d90c6b2,0x84db682b,0xc1a1ae22,
  44038. 0x9881930a,0x47f3dab7,0xbaf3e0a4,0x30e6bd52,0xf62d25c5,0x0680025b,
  44039. 0xadd0d5e7,0x0aa1f3cf } },
  44040. /* 48 */
  44041. { { 0x22a10453,0xa9822190,0x2a03a10b,0xdd1eb91c,0x96646f3b,0xafbb5d95,
  44042. 0xf38b6fc6,0xa58de344,0xb8cfca1d,0xce47c3e5,0x0f70da04,0xfcd8e16d,
  44043. 0xda262ed6,0xac44349b,0xc56e2f8e,0x9320d87b,0x19138e58,0x9ce3ea08,
  44044. 0xa2b236c0,0xa5862dff,0x8e7efb0d,0x6b0f9a5c,0x16ac78eb,0x4b53432b,
  44045. 0x709b51af,0x6ff43105,0x8f519628,0x08e236f8,0xeed403ad,0x1f93f176,
  44046. 0x9636545e,0x559337e0 },
  44047. { 0xd8fd807a,0x30ddf738,0xab131222,0xf4e0ec9d,0x625afbc3,0x14a2f4db,
  44048. 0x9f12f895,0xd5b70604,0xac3044fd,0xb46f3c23,0xf540148f,0x1b232d1f,
  44049. 0x39b4e554,0x61b458f5,0x0dd70b75,0xf694b24a,0x289581d9,0x0fc64299,
  44050. 0xee5fe22d,0xc05d49be,0x6a18bf63,0x7af3447f,0x7f1929d6,0xe96a1dc2,
  44051. 0xc1551e8c,0x6afe6028,0x2b5d4fa2,0x27dacaf3,0x545c2cb4,0x4a1631bc,
  44052. 0xb0c914d3,0x930070f9 } },
  44053. /* 49 */
  44054. { { 0x69a9bc05,0xd2f32c5e,0x589c4b73,0x0a5c19c6,0x94665f9c,0x095c9e5e,
  44055. 0xbcfb4c39,0x8ab0f293,0x1ddb7c31,0xb9070877,0x66b38048,0x894e9658,
  44056. 0x606bd9bd,0xf19a90cf,0xb6fd2d69,0xcc1d58df,0x461d8a69,0x886dcc4e,
  44057. 0xf9ce4831,0xc455c277,0x765f8a82,0x749a5996,0xc3badc8d,0x2ffc668c,
  44058. 0x9112cdab,0x38018396,0xb243c7cb,0xa98795c3,0x010a2224,0x8775f310,
  44059. 0x587b5e14,0x043a2141 },
  44060. { 0x3a873752,0x7bbe9dbc,0x2f442fee,0xee1493f4,0xc18c2181,0x981ca2c8,
  44061. 0xe29769e7,0x00ce3090,0xde768c5f,0xb4626ac8,0x34d7677e,0x33e9ce46,
  44062. 0xe0fa94e6,0xf89c2cad,0x41f5b5bf,0x04f5cc11,0x2228c12c,0x2565f736,
  44063. 0x0c05cce5,0xf1bf706a,0xbe487c4f,0x5d07ffff,0xa499f1a4,0x3ec43c09,
  44064. 0x98d94800,0x4f4e79bb,0x073f12f8,0x8a335a16,0x0f970d6d,0x4bb5eaf7,
  44065. 0xf24d0ae8,0x18d0747b } },
  44066. /* 50 */
  44067. { { 0x84601faf,0x58d3c77c,0xaf1c1f72,0xc9465be2,0xd116d806,0xff626798,
  44068. 0xd5b0d93c,0x3996c0c6,0x5ec6723a,0x2fa1ad75,0x03ba5349,0x966a8144,
  44069. 0x2ac34d8a,0xdc4c9422,0xed675865,0xddf471de,0x953d528f,0xd8aca597,
  44070. 0x24ebf67d,0xb2e463b5,0x7e25b4d3,0x25824871,0x43159daa,0x23c5adba,
  44071. 0x83357540,0x5458f9c6,0xf938b1a6,0xcf685da7,0xcefed231,0x981a4fda,
  44072. 0x08bb5e59,0x711093ed },
  44073. { 0x401f161a,0x12aa3fc6,0x974c5e87,0xf7358560,0x17b5df82,0x4aa252fb,
  44074. 0xa48e6299,0xb0b82b07,0x29dd847d,0x00234157,0x4529c5a6,0xf1e54d00,
  44075. 0x6d98f538,0xcc1c539e,0x28d3abcb,0x36162b53,0x2a84f0cd,0x75a37938,
  44076. 0x4dee7484,0xf717a81b,0x4c23bf1b,0x16cf35fb,0x787e8b3e,0x7fd1c29f,
  44077. 0x59b79ab0,0xb7da7e68,0x85f6c60b,0x072100a0,0xe7ed48b5,0x31840159,
  44078. 0x4d9c97d4,0x17898bda } },
  44079. /* 51 */
  44080. { { 0xae1b8cf8,0xcd8483d8,0xe9a28856,0x323d4b42,0x204a4bc2,0x7633584f,
  44081. 0xca7a69fa,0x4e0b2228,0xf757bab2,0x8afbda8b,0x6cc5f9ca,0x85b24088,
  44082. 0xd41a95c3,0x47fb4813,0xc2aabe6b,0x3f1bc53c,0x1ad1599d,0xf22cda3f,
  44083. 0xc31ea9b1,0x1b2ec081,0x01614ac1,0x048f304b,0xc6afa7ab,0xce31cee9,
  44084. 0x4140dc3d,0x55af7633,0xdce8abba,0x84b7ab37,0xc7cf3efe,0x50de7648,
  44085. 0x15356ab2,0x73a88dcf },
  44086. { 0x06e83b39,0x3f868288,0x9f44037d,0x477a4413,0x17dbc841,0xf9058b0f,
  44087. 0x54d17549,0x2db64f4f,0xf2307ffe,0xa23cea6a,0x4f126261,0x393efd55,
  44088. 0x10f37f26,0x2f4e658a,0xf4ee1e35,0xa4437ce3,0xa93cde8b,0x64ef42a7,
  44089. 0x939aa901,0x1debc9f4,0x3d7b5cd4,0x44223d6a,0xf88a3acc,0x789a6a11,
  44090. 0x2c608a2d,0x56fb9df8,0xbbf56c06,0xe79db8e3,0x668fa300,0x73c56af2,
  44091. 0xae396a1e,0x52f32b17 } },
  44092. /* 52 */
  44093. { { 0xe714f71a,0x56f524c1,0x9add8519,0xc1be1262,0x65cadbe3,0xad9189d8,
  44094. 0x5a0fb649,0xd88bf5c8,0x21d192d9,0x9efa6a92,0x6f724b6f,0xe3fe8389,
  44095. 0xb250119c,0xec3fae24,0x2ae0d3c0,0x4b6af9f6,0xd619624d,0x8fceba0b,
  44096. 0x2fdb6e3a,0x7dc3092b,0x3263cd29,0xc91da376,0xf95c43bd,0x30c0761e,
  44097. 0xcdeb44d9,0x89136400,0x43c0d31d,0xfd7dce84,0x9871899f,0x78fec3b1,
  44098. 0xefdf58c1,0x79e14d28 },
  44099. { 0x9bb40c55,0xe3822235,0x0ed07a42,0x0a27202d,0x4838c1f4,0x48e6c1a9,
  44100. 0xd864a78e,0x2b5f24a7,0x0c6c55c9,0x7e7f140a,0xce12d508,0xe62c104a,
  44101. 0xc11b1e10,0x9b0a1a7e,0xafbb3dd5,0xfd8a275f,0x9a3b6b30,0xdff354fe,
  44102. 0x46602a01,0x5a105d9e,0x93bb65f7,0x3d371b4d,0x0f82fdeb,0xda5cbf0b,
  44103. 0xde468545,0x4601229b,0xc73d517e,0x505e10b9,0x672ff492,0x77cfa541,
  44104. 0x99566ce2,0x0d8ec28a } },
  44105. /* 53 */
  44106. { { 0xcbeee995,0x014cf73e,0xd491e80c,0xb2eb88bc,0xd9aba5d4,0x615a6cad,
  44107. 0x9304c84d,0x2f7d4633,0x8ab03c9a,0xba0501d2,0x91babb94,0xc8f723de,
  44108. 0x50405772,0xc885f977,0xc7fcb094,0xb5e1d2b3,0xdf96c71a,0x61ee7995,
  44109. 0x3464499e,0xb8c8daab,0x5f607932,0xdb425ddd,0xb1243587,0x70251ca1,
  44110. 0x9fc74340,0x26d7d3be,0xc902ac89,0x8c179310,0x4559a74f,0x72522c15,
  44111. 0xc3734afc,0x86001e27 },
  44112. { 0xe7693947,0x13b00ba5,0x012c062b,0x6478641e,0xe85490a8,0xe1a438e0,
  44113. 0xd9574d5e,0x5173dbbf,0x9bd3ba61,0x9532eb8c,0x5f3ea075,0x1f41bcb8,
  44114. 0x8cbb92b9,0xac1cc247,0x1ef901b4,0x0f34648e,0xd2b3b2ee,0xdd929d1e,
  44115. 0xc3d75bfc,0x470f1eab,0x139cf4d2,0x5cdbc6f7,0xf0424953,0xcd86454d,
  44116. 0x47fcb383,0x1e079812,0x17df930c,0xb9f209b4,0x114ebc00,0x4225fc31,
  44117. 0x347946c1,0x020591cb } },
  44118. /* 54 */
  44119. { { 0x275e0af4,0xe3003721,0xe78a4a4b,0x721141ef,0xd1757485,0x666cfcf6,
  44120. 0x168e659e,0x5fa1d737,0x0e2842ee,0x263e3e54,0x948bd5f6,0xadecc3d4,
  44121. 0x246b104a,0x019de03d,0xf343d818,0xf8a9e903,0x5b0c0d31,0xcb57ba4a,
  44122. 0x51e2765f,0x8246c506,0x6519bf67,0x80c5751f,0xf2119a01,0x5f05c200,
  44123. 0x7821d4f4,0x7e6487b8,0x261c3a06,0x262f94aa,0x72146052,0x56cfe489,
  44124. 0xa1df05ef,0x5119985f },
  44125. { 0xb18586c0,0x5819497d,0xc6eeaa62,0x004415d6,0x97cda28b,0x7c6a46b6,
  44126. 0x7c194594,0x9a149b28,0x4ed3a506,0xb56369fa,0x43c94cb4,0x7092aa66,
  44127. 0xa9e9eee2,0x55bce73a,0x77893509,0x34bb2870,0x06eb5326,0x8af95fb0,
  44128. 0x9638f485,0x87cd0323,0x5ba75bf8,0x29376268,0x9d42d581,0xf32d6f3d,
  44129. 0x65c6d64d,0xa4cad574,0xb2cded41,0x985f50fb,0x9006a067,0xcf34ce0e,
  44130. 0x58a57f9a,0x59eaf265 } },
  44131. /* 55 */
  44132. { { 0x6ec3876f,0x7b407efb,0xf0f48648,0x780c6123,0xbf893039,0x2abb56ff,
  44133. 0x45a91ab0,0x9592eaa0,0x78811b82,0xce5b84d7,0x1f9f3fc9,0x86a71a34,
  44134. 0xf0e7e13b,0xc17fdd86,0x655a0880,0x88ed8297,0x81d5e666,0x75d6dc74,
  44135. 0x1d171797,0xeffc9df6,0xe3f79e1f,0x36ad4c8d,0x2046192e,0xdb15317d,
  44136. 0x274fda62,0x78c9fa7a,0x82dd9914,0x04ec924f,0x3a64971c,0x059d1e38,
  44137. 0x2620bbfb,0x3b4450ea },
  44138. { 0xc776dcdb,0x3db7a955,0x81c8ba47,0x35c4a57c,0x505760fb,0xae285003,
  44139. 0xb3aec353,0xe3e80691,0x47117be5,0x380335be,0x056ccf61,0xe1c47e3a,
  44140. 0x33977916,0x253cfdeb,0xf5cb7ee1,0x3decdfba,0x7cf4b704,0xf3c9794f,
  44141. 0x9ff81462,0x2401680c,0xbe3daa9f,0x4e440e11,0x69f91d8a,0xc5d04377,
  44142. 0xcb5e9c5d,0x4106c7a8,0x33b7d24d,0x191909a1,0x3764b4a2,0xe893c838,
  44143. 0xc429b614,0x4a7fe30c } },
  44144. /* 56 */
  44145. { { 0x2455c7c5,0xe78f3a70,0x70157754,0x5b7636e8,0x7623262c,0xf32c4524,
  44146. 0x1bc780c7,0x2c98b11e,0x915ed877,0xd48eaeac,0x199265f4,0xbb04d3c0,
  44147. 0xcfa5200f,0x6b52b19b,0x93ea3fe8,0xc46a0981,0xba758059,0xd82c733d,
  44148. 0x1896aacc,0xd324bbd6,0xce8ecd51,0xac09a2fc,0x02fc44b3,0x529918fd,
  44149. 0xaaa1784b,0xf0c45e4a,0xfe22085c,0x35626340,0xc50c7d61,0x53cbb676,
  44150. 0x65126b23,0x83fa1ea3 },
  44151. { 0x10ccc646,0x60ac86da,0x7b0451e9,0x2ce0637f,0x8a088610,0xbbbcf630,
  44152. 0x20349982,0x23c19019,0xfc0bcda0,0x707fc39c,0x1bd4fd7d,0x7f4d1f15,
  44153. 0x44713bbb,0xd6a64e74,0xc5ac9e60,0x57bdc676,0x37b61169,0x456c5303,
  44154. 0xdcf40a1d,0xd3451396,0x4997d2c7,0xf3edec25,0xc2c4a739,0x534ae9a4,
  44155. 0x6a6ad2e2,0x1401397e,0x23e95f81,0x20769d4d,0xde98fabf,0xcee007c6,
  44156. 0x931c51e0,0x61409779 } },
  44157. /* 57 */
  44158. { { 0x15156623,0x3ddb32db,0xab7a67c2,0x68137fbc,0x6f19e3c2,0x26011f50,
  44159. 0x89924c61,0x34218b02,0xc6804c1c,0x492a0b0f,0xafaae6a7,0xd65be706,
  44160. 0x0d01be61,0x3b13d23e,0xf87f4c69,0x44545b47,0x04dc1aa3,0xd42236e2,
  44161. 0x3c5161ec,0x6135261d,0xbd88bc07,0x1eb46a63,0x1599d720,0x78c6d836,
  44162. 0x69baf0f3,0xf6955fe1,0x17072820,0x467eebd6,0x3e3a340a,0x2f1b8a2a,
  44163. 0x2d0b5f88,0x636dac76 },
  44164. { 0xb4c80af3,0x94280db9,0x4e3892ab,0x9a189cd1,0xd1477ddc,0x26e702e0,
  44165. 0x68f9f14f,0xe91aee38,0x80baa0b2,0x2864f63a,0x8b714a29,0xacd81f73,
  44166. 0xc5fe7cb6,0x30e1b870,0xb10837fd,0x883ea1c3,0x6b20489f,0x2da27953,
  44167. 0x58a2da5f,0x3aeb2a68,0x03a8fa14,0xe2330bf2,0xdc70b1c4,0xb5c488b5,
  44168. 0x299678f4,0x0a78c4d9,0x25df675c,0x233bd098,0x7b67d368,0x37b5c076,
  44169. 0x4d0bef3f,0x2f6dbdfe } },
  44170. /* 58 */
  44171. { { 0x2e4da7c7,0x2f8472fd,0xae677932,0x708cfc91,0x3dc268e2,0x364af08a,
  44172. 0x799a2424,0x0f10dfe0,0x71d58bff,0xef912d58,0x988962e6,0x6bf35dfc,
  44173. 0x5f47ea0a,0x28b96fa9,0xaad308c1,0x734a79ea,0x9f437bba,0x95730337,
  44174. 0x6cf54f75,0x002cbd8e,0xe7632eec,0x47606dcf,0x53193104,0x404b5ecb,
  44175. 0x0acf729d,0x0ae0897c,0x3bddf1de,0x89628b86,0xf87d7448,0xeced154e,
  44176. 0x458d5d4e,0x5cb6e197 },
  44177. { 0x008c75ed,0x98cef197,0xf6eeaaf8,0x7cf49d3e,0x1875e96d,0x1d6f9e02,
  44178. 0xdd9b0d8a,0xfcec2cfe,0xb9576daa,0x38a61cfe,0x36a7dbb8,0x10003f39,
  44179. 0x23b814f4,0xb37c3868,0xb80e3153,0x9fb66dcb,0x059847a8,0x9e7e2eba,
  44180. 0x35a72770,0xa4ec63fd,0xfc9e0ed0,0x311f3d91,0xd515baa4,0x3c1dc094,
  44181. 0xa08cd4e3,0x75a06ebc,0x2ed5eeaa,0xab617238,0xe1f52c1f,0x2e82bbb0,
  44182. 0x5175d6e5,0x2149d630 } },
  44183. /* 59 */
  44184. { { 0x5f9311f6,0xee1a8e6f,0xbabc1f85,0xc97e3c9f,0xb494209a,0x4fa7c52e,
  44185. 0x19774fe1,0x04c2f51c,0x8555844f,0x5cefd122,0xb5873ab3,0xb53862a3,
  44186. 0xcbed19fc,0x768efdd6,0xee58469a,0xcdc12479,0x3d80c09c,0x11237e31,
  44187. 0xc044c28c,0xdd74a290,0xbd47e287,0x9ee6517a,0xad0ffeef,0xc2421228,
  44188. 0x818d281f,0x4273088f,0x43ec0de1,0xebc744bc,0xb415bd73,0x5b26eccf,
  44189. 0xcb07c26c,0x14e2f350 },
  44190. { 0x4216946b,0x548d2a10,0x7a4bd92d,0x6e801f07,0x43695160,0x5996d0a3,
  44191. 0x63a197c9,0x0f1b5c2f,0x061f77c9,0x79da3c4f,0x93ff7b22,0x1c1cd634,
  44192. 0xa234123f,0x5e61b650,0xf284033c,0x826b34c5,0xc2f34214,0x718b90e8,
  44193. 0xae806ec5,0xa5f35620,0xe324a9b4,0xa2fae345,0x8b53cb51,0x8c0bb95e,
  44194. 0xf9965778,0xc94f6ac2,0x6b9def32,0x07ec607d,0xd0ed8f27,0x63bf1dba,
  44195. 0xdcb61e4f,0x58537e02 } },
  44196. /* 60 */
  44197. { { 0x64f80ba2,0x1f64b064,0x0559a45b,0xe8e055e7,0xf1f4b634,0xc3262b34,
  44198. 0xde8c8482,0xef4f7d5f,0xc30c780a,0x9d55dea0,0xcfa1e693,0x1740afb9,
  44199. 0x7460c34b,0x2cfe6a66,0x1187c1ee,0xf6695941,0x5f974d94,0x1382f277,
  44200. 0x004549eb,0x1ca0ace4,0xbabded02,0xf8244b3f,0x4e3653ea,0xc36f4d06,
  44201. 0xc55c5f83,0xeab9f0dc,0xacebce90,0xd93b9cef,0x19061425,0x16658e72,
  44202. 0x82d7970d,0x4857835f },
  44203. { 0xd2576210,0xdcd525bc,0xd51b5443,0x9f378aa7,0x1bd83994,0xfe97bf17,
  44204. 0xf38ac621,0x930d0f63,0x818408cc,0xaf8f2c17,0x260f53f6,0x2692c87e,
  44205. 0xdb0a75e4,0x0ee45407,0xffdb1b37,0x0ec47ae5,0x7aa6a44b,0x769129dc,
  44206. 0x2e40b75d,0xb6f932b2,0x95ef3b77,0xe06764d0,0x68bc63e8,0x28fd47f5,
  44207. 0x9c0014c0,0xd1810494,0xd7995d8e,0x90e2d3fd,0x6c2a85af,0xeb39a05d,
  44208. 0xa21f3128,0x6c0277bd } },
  44209. /* 61 */
  44210. { { 0xb509e7ef,0xe41b7086,0x3d7f9f91,0x8842ec7b,0x5526b88b,0xcd285f94,
  44211. 0x051dd0ab,0x6e44e064,0x774f1ceb,0x90198c10,0x123e661b,0x6ecabe98,
  44212. 0x32f647d9,0x44811136,0x26c52aee,0x1dd82b45,0x939dc9d5,0xd650907f,
  44213. 0xfcd455bf,0xbd5eeef2,0x8d2e5d7c,0x7815a4dd,0x88bc9f2a,0x5ad4ec92,
  44214. 0x57a3b322,0xc6f10d0b,0x20b9cbdb,0xe8d0c1e7,0x9b774ee8,0x5a0b071a,
  44215. 0xf22fcf8f,0x3067bc9a },
  44216. { 0xb7ca9326,0xe0e589f2,0xb1224f63,0x17a106fd,0x747a57bd,0xb2354521,
  44217. 0x62b0882e,0x2614982d,0x4391ffcf,0x7f3af544,0xa84e440d,0x1aaa337b,
  44218. 0x941bb071,0x28ea37b0,0x2e4a7f54,0xa957dcb4,0x1a6ad5fb,0xe7ab662c,
  44219. 0xf7c36a20,0xd135e381,0x9baa0b6b,0x42e7980c,0x94e4671f,0x4237030c,
  44220. 0x8b0922e3,0x24cc63ff,0x445a589f,0xd10d5279,0xa870ff6c,0xbb99d316,
  44221. 0xa996c195,0x390c83ca } },
  44222. /* 62 */
  44223. { { 0xffc4a73f,0x50d3fa82,0x3bd53303,0x2665d635,0x264bb77d,0x80a06f8a,
  44224. 0x22d73d84,0x81c04a6e,0x0323b8aa,0x2409cff5,0x8c4c4d5a,0x31dce217,
  44225. 0x0c0f9c19,0x374aa80e,0x00186bb8,0x0b25a387,0xaaf1487f,0xd0b77a10,
  44226. 0xab498de1,0x15f39ad5,0x1aa0c116,0x92e32da6,0x96e25ce8,0x228e3dbd,
  44227. 0x5e8646d1,0xb57c88dc,0x267b1c68,0x672b1164,0x600bdec5,0x5d0d807f,
  44228. 0x223e573a,0x3ea4007d },
  44229. { 0xa595d0a3,0xd76debd0,0xaff0b3b4,0xa6bd76cb,0x9b1bdb97,0xbf2c154f,
  44230. 0x4c714c71,0x62b19ab4,0x221af663,0xc9bf33b9,0x8c941ef6,0x23d87c49,
  44231. 0xd79f0f6d,0x255804c3,0x2a7acbc1,0x6f1a1005,0x550528af,0x5dab79d9,
  44232. 0xc8d16213,0xfd77a6f0,0xde5e1029,0x40508b6d,0xf95da12b,0xd95ac0f2,
  44233. 0x758a8ba1,0x8860af71,0x7160c8fb,0x0b194c83,0xce004d34,0xa40e6c80,
  44234. 0x6b14aaa0,0x09f82a17 } },
  44235. /* 63 */
  44236. { { 0xc21366dc,0x60abe588,0xaf75daf9,0x729c0a4f,0xacb93ed4,0x70501fd9,
  44237. 0x87a16d70,0xb97e744e,0x98e7361b,0xa42e0a7a,0x28b54cf3,0x1acdaff2,
  44238. 0xb7bd9078,0xf087ccbb,0x663250e7,0xda6f3983,0xbaf07c09,0x66d693ee,
  44239. 0x8cbaf157,0x79baf4c3,0xdfca99d0,0x5a984e07,0xf26d8dab,0xab4d3247,
  44240. 0x7eba36f9,0x4d0be701,0x0e8dd216,0x37bb9e65,0x531c4f03,0x72aa4e24,
  44241. 0xb753d85a,0x77d1e984 },
  44242. { 0xd8e62367,0xd9373239,0xb9820cf1,0x3361848b,0x5a9c97c4,0x00c7e344,
  44243. 0x14f960fc,0x9a0ec9ae,0x740474b5,0xcf41f0cf,0xece065d5,0xa5eede8f,
  44244. 0x9e808610,0xb1de5a4e,0xae0cf75d,0x17c44ae4,0x6b148d0b,0x2fa56323,
  44245. 0xd29ff2dc,0x64fa740f,0x88cb212e,0xc605eb8a,0x6a863016,0xf2c771ad,
  44246. 0x607b4c17,0x6d6112e7,0x40d49785,0xfe90ec07,0xe256e0e5,0x599be18b,
  44247. 0xca54adb0,0x4e6eabec } },
  44248. /* 64 */
  44249. { { 0xfb99cfe6,0x950323d3,0xc9334178,0x7b09bc26,0x7cbdfb6f,0x64111e41,
  44250. 0x89a75760,0x91141744,0x10919cb0,0x4c633df9,0x396bfd2f,0x715fc7c7,
  44251. 0x8cab62db,0x8ca19512,0x4db81aac,0x30672473,0xb4c4c54a,0xe67a246b,
  44252. 0xbf229646,0xd77ea0fa,0xfa5b5d70,0x5bed15f1,0xc2f192f3,0xa5686da5,
  44253. 0x7f6690ad,0xdecac72a,0xcaa50b7d,0x0c4af2a2,0x6049ad2f,0xf44631c1,
  44254. 0x04ecf056,0x325d2796 },
  44255. { 0x4848c144,0xee11fb55,0xb6a7af32,0x4e062925,0x369e0f9a,0x125b68e1,
  44256. 0xca53b21e,0xad9bdae6,0x2e98ea1b,0xf50d605c,0x9f2fa395,0xbdb9e153,
  44257. 0xe91532f5,0x4570e32d,0x46a250d7,0x810698ae,0xad9d9145,0x7fd9546c,
  44258. 0x11e97a5e,0xabf67721,0x249f82e9,0xca29f7d5,0x9851df63,0xa9c539a9,
  44259. 0x71d0e3e5,0xfd84d54b,0x041d2b56,0xd1e0459c,0xfd80096a,0xceb3eb6e,
  44260. 0xe32a79d3,0x19d48546 } },
  44261. /* 65 */
  44262. { { 0xb540f5e5,0xfe19ee8f,0x04e68d17,0x86d2a52f,0xadbdc871,0xd2320db0,
  44263. 0xd03a7fc8,0xa83ad5a8,0x08bcb916,0x54bf83c7,0x2e51e840,0x092133ea,
  44264. 0xcb52dddf,0xbce38424,0x31063583,0xd5c7be40,0x458e3176,0xc1ebb9df,
  44265. 0xbc4dabbf,0xafb19639,0xc05725a8,0x36350fe4,0x84e1cd24,0xac4a0634,
  44266. 0xc145b8de,0xadf73154,0xb3483237,0x0aa6dd9e,0xcbff2720,0xa3345c3d,
  44267. 0xb4e453b0,0x1b3ace6c },
  44268. { 0x90a8bdc5,0x0343e5e9,0x6306a089,0xa203bf9d,0x8e48520e,0x98489a35,
  44269. 0xde7d1d06,0xbd17debe,0x5f795d3f,0x8fafa6d7,0x387b0a3f,0xa4ceb630,
  44270. 0xffddeafa,0xe0166b32,0x7e764e02,0xa2fe2054,0xe871f304,0x55ab9824,
  44271. 0x952ec45e,0xa2bd36bb,0xa90d20ca,0x7b4c1484,0x75bcfb53,0x5319f387,
  44272. 0x6982c4e5,0x34238a4a,0xa102921d,0xa2bb61c7,0xdb3ab17e,0x1e061b64,
  44273. 0x192f0a14,0x538ec33e } },
  44274. /* 66 */
  44275. { { 0xa19b56cf,0x193496fe,0x7bb99acd,0x663d77f4,0x57d0a881,0x8f04afa8,
  44276. 0x082835fd,0xcced3da2,0x5d82cec7,0x7e21faed,0xf8009c85,0x6e175b99,
  44277. 0x2d05a307,0xd9c6e31b,0x81487d82,0x96948d4a,0xd46f6655,0x86ebd3f2,
  44278. 0x773ccc49,0x86851aa8,0x8b1640a6,0x3e220f22,0x41a20b75,0x9f06e3a8,
  44279. 0x90ac0a6f,0x2cfffe5e,0x8ebeb3fb,0xf5a9b1da,0x6e08e2c9,0x2587d997,
  44280. 0x03e9f401,0x6fd60298 },
  44281. { 0x8eb7516a,0x54709f8d,0xbdc598ab,0x83058a74,0x87e801ce,0xd234dd98,
  44282. 0xd17b8a96,0xfd0f9d90,0x6e90f6ab,0xaa1e549f,0x5a7ed55b,0x2496ff80,
  44283. 0x6c254c19,0x0d9f657a,0xb8962575,0x3cdea49c,0x2dff27de,0xb685a3f0,
  44284. 0xdb8bc04b,0x3c50e7fd,0x987236b0,0x904ff0ff,0xbb0d5055,0x494298fd,
  44285. 0xe14be8d0,0x34b3386d,0x7c3d30d6,0x7ad34e9c,0xe159fdd9,0x1f2b32bd,
  44286. 0xc761e5c0,0x84cfa23c } },
  44287. /* 67 */
  44288. { { 0x8b99b964,0x13bc11eb,0x58e2fc47,0x8e280c0a,0xd4c9a54b,0x870fbc49,
  44289. 0xbf6e20fa,0x37a334a2,0xd7c88cfa,0xee583d0d,0xef4af1da,0x05e029a8,
  44290. 0x0c2ef8a6,0x6d55e234,0x209e9b62,0x61b6fdfe,0xbb8e080f,0x3b1dad26,
  44291. 0x9392fc1a,0x5adbc162,0x0aae3f4e,0x02ac0fe6,0xc2bf4d5b,0x8d99801a,
  44292. 0xc282fed2,0x2333f93f,0xb52db33f,0x16dcb10c,0xc55752e7,0x09f90f84,
  44293. 0xc84a0d8e,0x287d4c51 },
  44294. { 0x0e9867da,0x5fa58201,0x1a874cda,0x614589b3,0xfbdee22e,0x005e27c5,
  44295. 0xe612bda8,0xe357fef5,0x2d3635f9,0x4e0dbedf,0x6f125a86,0x62be70e4,
  44296. 0x0d94a2e5,0xa09b9884,0x28b5e5d1,0x7eb99a15,0x751028b5,0x21b9416e,
  44297. 0xe06d2cc4,0x1b137fd7,0xfea09845,0x6fa1f517,0xffcecbd7,0x3ba1e966,
  44298. 0x832f453e,0xd4c89a4a,0xeca68fa1,0x07b1e2af,0x4bd395a3,0xd0fb4453,
  44299. 0xd8ef9e13,0x0132a3dc } },
  44300. /* 68 */
  44301. { { 0x576374c2,0xe53c7785,0x84727040,0xe60526d1,0x228ca044,0x8a066dc8,
  44302. 0xf1ce1313,0x1fe1c1b2,0xcdeb0c5d,0x2aeec832,0x9cbf826f,0xa7596699,
  44303. 0xde77a589,0xcd188e81,0x118d1254,0xe5ce0fe0,0x0790b86a,0xa142a984,
  44304. 0x39ac28ce,0xe28f043f,0x87de5804,0x4eef8290,0xf639a8c5,0x83c31b32,
  44305. 0x5887794f,0xd70454a7,0x18b1b391,0xca635d50,0x31d9c795,0xcefea076,
  44306. 0xb6f8aa25,0x13cbee76 },
  44307. { 0x8d3f34f3,0x79cabe0f,0xa3617fe3,0xbda9c31c,0xdd9426a1,0xb26dee23,
  44308. 0xf29c9104,0xe9dd9627,0xe2c6cd3b,0x033eb169,0xfcba2196,0x8a73f492,
  44309. 0xb858c83c,0x92e37e0b,0x23b3fbb7,0xe4f2aca6,0x64be00a2,0x8101fb1e,
  44310. 0x948f6448,0x91a7826a,0x907260e7,0x414067b4,0xe30bb835,0xf774aa50,
  44311. 0xc999c06e,0xf922ca80,0x0ba08511,0x6b8635b9,0x25fa04f0,0xbf936b5c,
  44312. 0xe02e8967,0x4e0a1ada } },
  44313. /* 69 */
  44314. { { 0x8ba29c4d,0x00ca6670,0x22988094,0xc08240ce,0x16dda752,0x21c5ca67,
  44315. 0xabbbfa34,0x689c0e45,0x3ed28b72,0x1d7545fd,0xd7c56ab4,0x5f221198,
  44316. 0x38759d65,0x4b3d8f74,0x8fe50b89,0x93490dfb,0xe80eba16,0xb641f5d7,
  44317. 0x79acb537,0x7b0da5eb,0x0c1d5e5e,0xab6b1497,0xa5da429a,0x2338e68d,
  44318. 0x2f6d2f25,0xe010c437,0x6530f3a7,0x226f16d2,0xcbef08bc,0xefb0f7b6,
  44319. 0x9f99c999,0x733e30d9 },
  44320. { 0xa42a38f9,0xecfe1582,0x4730b500,0xaec2d58e,0xde976b2c,0x2ee2f2a7,
  44321. 0xa969c1bb,0xf0539db5,0xfcecdb4a,0x31954168,0xe7a8e902,0xf2f7348a,
  44322. 0x3121541f,0x1d58d7cc,0x2202ae52,0x5d25b75c,0xf40835a7,0xdea9965a,
  44323. 0x529b4e46,0x3feb6a41,0xbd27ad9b,0x5c97fb6f,0x261f900b,0xd87554c0,
  44324. 0x04d5b19e,0xb43031d9,0xcb219b9c,0x33d5e9b8,0x3ee00bcf,0x7a43d492,
  44325. 0xb79a5c0c,0x56facb39 } },
  44326. /* 70 */
  44327. { { 0xa3018bfa,0x019165a2,0x9ffad984,0x100c6b24,0x55341a9b,0xbbf1b1f6,
  44328. 0x25dc4cc9,0xe6bd1d97,0x2bfffe60,0x52850ed5,0x7e5509ab,0x24e992cc,
  44329. 0x4ceb59f1,0xff6c502e,0x1aa7d148,0x2f0b3573,0xe7e3aa46,0xe90c1ddd,
  44330. 0xd1142880,0xbaec9f45,0x65be5dd5,0x475cfd26,0x1febce13,0x83abb14e,
  44331. 0x80942d30,0x6aba4829,0x297e82c8,0x1e1b235d,0x50d8218d,0xb771cdbe,
  44332. 0xd94d6cbb,0x88599266 },
  44333. { 0x155ccaf2,0x08847290,0x7c5b773e,0x8679ebc7,0xb2dd08ed,0xa88b2dd1,
  44334. 0x87d475db,0x960a180e,0x6694d02a,0x80fdb6b7,0x3f3f9e96,0x3e8758c9,
  44335. 0x4ad836c4,0xbda3f6fa,0x32fb387d,0x9400c581,0x2550200f,0x25a78542,
  44336. 0x776ecf18,0x2a97c351,0x566db59a,0x03ebf46e,0x26545eda,0x4743a280,
  44337. 0xcf74ab44,0xed169d84,0x88cb3f69,0xbaab931d,0xd8257196,0x70ae932c,
  44338. 0xa0c09719,0x797224a6 } },
  44339. /* 71 */
  44340. { { 0x441f3567,0x632923f8,0x2e24bf1d,0xc11c3168,0xb7671fff,0x4b97726b,
  44341. 0x7a5e1a22,0x601746a7,0x3addb417,0x53dddea0,0x7f59b846,0x57867a3c,
  44342. 0x56cd7ff7,0xb012a987,0xf19ba9a8,0x1bd5fec9,0xf8306748,0x750379a2,
  44343. 0xab8c05d1,0x7763445d,0x7903f42a,0x5d7f441b,0xa903e46d,0xc011674d,
  44344. 0xadd126c1,0x1b1d3c4d,0x61455b40,0xa2752aac,0x555c356e,0x4da42a68,
  44345. 0xd820852c,0x3ff09c15 },
  44346. { 0xf9cb7784,0x4c0a1bce,0x2422f305,0xaec539bc,0x0c414aa7,0x5f40f9fd,
  44347. 0xffd42bc4,0xd3aa316c,0x2f358e15,0x42f5a4c3,0xd6e27682,0x00bdcd9e,
  44348. 0xf8a5ecee,0x069f789f,0x05e14f5d,0x8078018e,0x8b40c741,0x2bb3e493,
  44349. 0x7917f72d,0x5dbc8c1d,0xcc57150c,0xe0eea664,0xc3fa8920,0xa25ecc5a,
  44350. 0x1c797164,0x3c21b0f5,0x634ad16b,0x8f09a2f2,0x58391d9a,0x8e730fc5,
  44351. 0x4fdfae4c,0x47ef1805 } },
  44352. /* 72 */
  44353. { { 0x3da285e4,0x9965f3d1,0x3a01e3f4,0xba7d4dba,0x61214ad0,0x4738413a,
  44354. 0x22397549,0xd3b7d535,0x5a730b92,0xa53dbdcf,0x332d165d,0x3130d92b,
  44355. 0x82f97ef4,0x44a28541,0x44dce1b6,0xbf62221c,0x7e2a0ec9,0xbba13858,
  44356. 0xcbfad998,0x33f32c8d,0xb5fed44b,0x409e5f3f,0xc66217bb,0x5c328c65,
  44357. 0xfcdf71a9,0xb00db69f,0xb8920788,0xa23c2a21,0x3ae6464b,0xf8ab28e6,
  44358. 0xb8de0861,0x1a6b6e9c },
  44359. { 0x06af77aa,0xaf6ec2b6,0xa887f065,0x2e60f5cd,0x9f498c56,0x87d21400,
  44360. 0xfcbaaf4b,0xdb595b59,0x271ab855,0x0fb592a1,0xd4349b0c,0xa0ce10e5,
  44361. 0x887d8c9c,0x9d6187d8,0x154bd6db,0x03ee95f9,0x5d06c999,0x8fe53213,
  44362. 0xfb6a64d0,0xf4a7bc30,0x66a4cb60,0x3d22af0d,0x5d37367c,0x16952cef,
  44363. 0x997d8e55,0x6f0ea734,0x731732d0,0xb447c70f,0xa9cb3942,0x00ab3034,
  44364. 0x28510fd0,0x79dd0180 } },
  44365. /* 73 */
  44366. { { 0x3ac7424e,0x04e0033a,0x60fda4d0,0xdb06b688,0xbcb772fb,0x236a9766,
  44367. 0xf297cda4,0x294a8e2b,0xdb013c6e,0x4b0aab85,0x8723a3ad,0x3d2aec98,
  44368. 0x13c84a6b,0x0cae32cd,0x70ec169e,0x21888f5e,0x42a88262,0x739633bd,
  44369. 0x7b60d9b8,0x68ac792e,0x10769fe1,0x89f2b722,0xd24bed34,0x8f3fcfe6,
  44370. 0xa3eb24aa,0xd35efb88,0x484c706b,0xddecfa3f,0x929ece0d,0x7cc119a9,
  44371. 0x8d405436,0x87e5ad45 },
  44372. { 0x7d1000a7,0xba99aa9d,0xae823833,0x8b94affc,0xdfb83dc5,0xc8229628,
  44373. 0x845a418d,0x2f59fe11,0x5d417054,0xa8b970f8,0x72b71581,0x8918c265,
  44374. 0xc0d1dd17,0xe4ef477d,0x3afad7c0,0xb50b4cf3,0x01870a5b,0x21baea79,
  44375. 0xbb3a2868,0xc77087f9,0x124a59cd,0x7857531e,0x57f43239,0xed74c26f,
  44376. 0x0164c94a,0xd5f5ae25,0xf094bf74,0x6608b7e2,0xfdceea32,0xf4cdb5ba,
  44377. 0x990cc045,0x0b712519 } },
  44378. /* 74 */
  44379. { { 0x88d5c64d,0x5a290ca1,0xa7492534,0x0596d749,0x2a00e925,0xa04b0d3d,
  44380. 0xcaf7b66b,0x082cd02c,0xecdded83,0x912b50c2,0xff31646e,0x813ce9de,
  44381. 0xc75fff95,0x62ae70c7,0x7e2a4615,0x6f6852e0,0x03804fd1,0x320fd7d0,
  44382. 0x8218e8d9,0xb1a2a4dd,0xafc645d7,0x4918a6fb,0xe8d9fdbe,0xfb080fa1,
  44383. 0x4470b6ee,0x33d4d08a,0x6d974ef7,0xd2ba2077,0x69dae5d2,0x8ecb95a7,
  44384. 0x7d69596d,0x7a3f423a },
  44385. { 0x9a929387,0x362d2ca6,0xcb1c1fff,0xabdb7581,0x7e51b6cb,0xd892ec9f,
  44386. 0x3a4e131f,0xee8d8632,0x5bd87561,0x4680e3f1,0xd4e7e732,0xe3a597e1,
  44387. 0x5581fefe,0x3cc72b7c,0xca8cae0b,0xf3e77f8a,0x5e2fd4af,0xfcc7d7dc,
  44388. 0x21355b79,0xdd3a4552,0xa2c07177,0x546b24f2,0x0689621f,0x415b532d,
  44389. 0x3f78163e,0x2be9af51,0x33d7ed21,0x27d63b9b,0x96802943,0xab019ef2,
  44390. 0x1623faf4,0x2da5fc55 } },
  44391. /* 75 */
  44392. { { 0xc8a5c600,0x62429cf3,0x3fe33e7c,0xa7a80c22,0x0a57ddcb,0x9ffda740,
  44393. 0x925b0c74,0xd1ae156d,0x6b100eb0,0x097a43f9,0xef943c81,0x169e945c,
  44394. 0x1128cf24,0xa1f734e5,0x419f0133,0x04387c4a,0x01044024,0xc007868b,
  44395. 0x90359cf2,0xe5416abf,0x478d54e3,0xf9c76fee,0x42a2173e,0x66219da6,
  44396. 0x9fe30141,0x61e03156,0x93ef247e,0xa0ff5ce3,0x072b6592,0x811792ba,
  44397. 0x70c854d3,0x855f0219 },
  44398. { 0x847314c4,0x61fbfb6c,0xeb45b96a,0x97906155,0x6ba2afac,0x7102e146,
  44399. 0xab949781,0xed51f975,0xc110c4fe,0x9d2f5b17,0xaff57667,0x7ac8ce70,
  44400. 0x6eb244e7,0xe7366a21,0x551c65c7,0xdd1bbcec,0xe1a859de,0xb525060a,
  44401. 0x8ba7d2e7,0x7a048174,0xab8ea8c4,0xe1a2c541,0x6fdff078,0x6e7824c3,
  44402. 0x14874b04,0x79b49fc7,0x06b1f733,0x22ae337f,0x6f8fe6cf,0x1c352192,
  44403. 0x525d0797,0x292236cf } },
  44404. /* 76 */
  44405. { { 0x7d8b29dc,0xcdb8d80a,0x08ea648a,0xd17a2024,0xae92be91,0x7db12c5e,
  44406. 0xfda72fbc,0x1f347d18,0x9e760c6f,0x11374b40,0xd8e38d91,0x7361e8f1,
  44407. 0x739ac1f4,0x7714be9d,0xb4df5c4e,0xc1f9701c,0x6f72cae1,0xd9138ed8,
  44408. 0x6ad180c4,0x1c7fe1f7,0x9e2dbf9c,0xf8c185be,0x7c70c44d,0x835db269,
  44409. 0xb0d15b5f,0xf997cfea,0x61e6545e,0x5101445a,0x25184e5e,0x16b06884,
  44410. 0x7521e7aa,0x7cfac359 },
  44411. { 0x3c0bc53a,0x81182167,0x7e751367,0x84b5ede3,0xa3657a18,0x3ca255fd,
  44412. 0xba1fdd98,0x096abbf4,0xc5da77d8,0x9ce8369f,0xaab342c5,0xf27b9ae7,
  44413. 0x972059f1,0x06c91bd6,0x914ecfe9,0xee0dab30,0x93f53f12,0xbb647fbb,
  44414. 0xffa57e0e,0x30c38a7a,0x9f2ad607,0x517d06ef,0xbb99dcc9,0x49728d87,
  44415. 0x446080a1,0xb0034af1,0x12b9c17d,0xcc810c3f,0x772a22a0,0x7225f14f,
  44416. 0x1ddf82bd,0x6ce3dc7f } },
  44417. /* 77 */
  44418. { { 0xa4397830,0xc07cd835,0xf4733306,0x4dd9290c,0x29989e8c,0xdd35d3a8,
  44419. 0x563d8152,0x79902559,0xe87de61b,0xf278d911,0x1024e35c,0x9c7340c7,
  44420. 0x4a0d0e59,0x2d444461,0xf32626a1,0x63e7608f,0xc4c9baa9,0x627a37e9,
  44421. 0x76fffd25,0x0c56dc51,0xcef2a1cd,0xcb6defc8,0xefc559d9,0xcbcc0d56,
  44422. 0x041cb692,0xe45f3fc5,0xe5161e09,0xcd05c239,0x5c3b559c,0x2a731ee9,
  44423. 0xa3d0a16d,0x85151122 },
  44424. { 0x86ff19e2,0x782d0335,0x1da28603,0xc2c60daa,0x557c7eed,0xb2e78cfe,
  44425. 0x1bc4e8b0,0xa8f6f984,0x3df35c67,0xcc1f9b4b,0x4764462a,0x96e13603,
  44426. 0x7c7ae0b0,0xbf910b97,0x51435956,0x27c7f305,0xf631eae5,0xc14db15c,
  44427. 0x7e69b34c,0xa51d6142,0x5fc12ff2,0xdec82851,0xfb887162,0xfcceae13,
  44428. 0xde1488bd,0xda332ac1,0x2ee3e74c,0xa20374e2,0xf0ae069c,0x597ea1a1,
  44429. 0x77bdec04,0x8b1159f2 } },
  44430. /* 78 */
  44431. { { 0x2f961d30,0x4af71a44,0x7ac7248f,0xbdf968a8,0xb1a906cd,0xd32df87c,
  44432. 0x04abf925,0x00c10e26,0xb9f04d4c,0xb8711759,0x939705da,0x00d54e60,
  44433. 0xc9f80849,0xf7587433,0x6a7a2375,0x2e9abade,0x94ac17ac,0x5676d478,
  44434. 0xc202d99c,0x4ca0525b,0xabfae73d,0x95b8bcad,0x3405991b,0x2371ed38,
  44435. 0x458a99c3,0x2b69e47a,0x2b78c866,0x7cac0b18,0xe0232c7c,0x6ceaa79b,
  44436. 0x588f7459,0x0bd86433 },
  44437. { 0x7e734189,0xdea1a8b4,0xcfe5fa17,0x52c5ac88,0x11437664,0x444a4d4e,
  44438. 0xaf9e9750,0xc2522308,0xd30c6b3b,0x78b1d0c3,0x4c6df477,0x2edae5f0,
  44439. 0x2ee88dd7,0x53131d9a,0xacc93e34,0xc4e380ee,0xa8db0e8e,0xd499b1ac,
  44440. 0x7f5d49d7,0x77348c16,0x1556ccd7,0xc9663257,0x2611d13d,0x65ce0e8c,
  44441. 0xb5a2fdcc,0x2c95fe66,0x8658faa1,0x26698832,0x31c32c98,0xda87d1f4,
  44442. 0xfcd91907,0x46650598 } },
  44443. /* 79 */
  44444. { { 0x6b4a5efa,0x4c6c13cc,0x1d07b265,0xc481989b,0x8bdc69c0,0x10b966ce,
  44445. 0x2c2531d4,0xf54cfaa2,0xcad0a100,0xcb5f1808,0xee5da449,0xbeb52538,
  44446. 0xbedd83cc,0xa6240085,0xd6255c78,0xe792dacf,0x2062058f,0x88371906,
  44447. 0xed1658c1,0x96615e83,0x7d28d542,0x4b549b27,0x83b75df3,0xeaf127db,
  44448. 0x17fbb942,0x4f60df6d,0xf6f7c930,0xd08631db,0x6018789f,0x17c38f98,
  44449. 0xb9a9280c,0x0c43574a },
  44450. { 0x1d20cad0,0x76eb324c,0x8c61108a,0x90decb09,0x6f06d36d,0xa6e9d39c,
  44451. 0xbc0da197,0x6cd978ba,0x507ac5ce,0x5948b1c0,0xc5497eb5,0x2bd47164,
  44452. 0x4d5914e3,0x2a9c4c0f,0xa759f03c,0x772c5046,0x69ac847e,0xe7d7328a,
  44453. 0x3048b330,0xa8d57d0c,0x40f7bace,0xe60034e0,0xa85f1790,0x823d9193,
  44454. 0x5c859736,0xa6e9b66c,0x679e1022,0x22ca2c7a,0x09023fa4,0x00e7a19c,
  44455. 0x2726d5b9,0x324999f1 } },
  44456. /* 80 */
  44457. { { 0x7c834915,0x667eaed6,0xbc5eb64d,0x9f77aa6a,0x25d62011,0x729ebcb6,
  44458. 0x699fd9c2,0x0aee24f2,0x2b8d4f6c,0xe1eb5874,0x14c976d6,0x7f12710c,
  44459. 0xf6d9ea65,0x91390335,0x06b50064,0x668b7049,0x0876ee4f,0x65969a0e,
  44460. 0x2f9d9360,0xf901bf3f,0xb499e3ce,0xfb1a8651,0xf2dbcaaa,0x80b953fb,
  44461. 0x973b06b6,0x312cc566,0x3af36c64,0x3534d9c3,0x10ffd815,0xe4463a52,
  44462. 0xf18c2b91,0x57ea2b4b },
  44463. { 0x8aa0f2f2,0x00f5e162,0x0e46bcaa,0x8c7e75c5,0xa4a2c42d,0x97ab479a,
  44464. 0x14baa202,0xb4f308ea,0x6943cc2e,0xa901bd14,0xeed58804,0xbb125fee,
  44465. 0x9d180f7c,0x6502c8f9,0x1580c61c,0xe5353919,0x27101ee3,0x7e278069,
  44466. 0xfaa72717,0x7a0a40a1,0x4c75b153,0x32edce02,0x538f1c22,0xda23660b,
  44467. 0xbe307d2e,0x4d511e98,0x9baee0b4,0x24276e40,0x7ff1f307,0xa78c3927,
  44468. 0xea7935c9,0x60480b46 } },
  44469. /* 81 */
  44470. { { 0x3872ece3,0x31087d66,0x955b70f8,0x5f29be7d,0x9cf95bb8,0xb50b4fc7,
  44471. 0xdbffa621,0xbae3b58d,0xe022ba5d,0x0e61d280,0x4181449c,0x78ae5117,
  44472. 0xcf555485,0x0b132840,0xb8ce0b0e,0x800ed1b6,0x78d5de3d,0x35dffdd5,
  44473. 0x69a56b47,0xf7e42374,0x8d910ae7,0xd5e32369,0x6313c7c7,0xb6ff52a0,
  44474. 0xa92de9e5,0x5a2fe20d,0xd12110bb,0x41b347d3,0x40c16f23,0xc5905edb,
  44475. 0x9a8f88cc,0x0774a0d3 },
  44476. { 0xe3b6c106,0x3ae181ab,0x8de150b7,0x4ebe163f,0x6f354836,0xcf75b82f,
  44477. 0x3ac7ac16,0xaa0d2063,0x291722af,0x5c680668,0x11545553,0x73941e61,
  44478. 0xbf5de3f7,0x17127e38,0x1afb41da,0x32cfdf03,0x87bc8663,0xc6893c91,
  44479. 0xa62c9c99,0x75046744,0x962c1947,0x96866e2d,0x378cdf4c,0x489ec8df,
  44480. 0x3407fa32,0x3a60709b,0x551290d1,0xd37d2159,0xbab92273,0x9623d303,
  44481. 0x2432014b,0x08151954 } },
  44482. /* 82 */
  44483. { { 0xfb7b2108,0xf9236d89,0xad75f9aa,0x3ecc83cc,0xb4e1da11,0xf7c72b15,
  44484. 0x0315c362,0x552aeaef,0xf272fe3f,0x11e140ed,0x87843ee8,0x99d79bf6,
  44485. 0x1d9bb25b,0xce6b54fd,0x5b1bad74,0xb20b0e21,0x5b84c90d,0x54a0214f,
  44486. 0xfca6cec9,0x459bbf52,0x9e4df76f,0xe363c48d,0xd64cf17e,0x3045f84e,
  44487. 0xf62ada48,0x8402a167,0x6a74ca01,0x2c9e1bf3,0xf691c42d,0xe8cf9d41,
  44488. 0xc2c4b874,0x5abf2178 },
  44489. { 0xf3b3bccd,0x4777966b,0xbe3e0caa,0x0047e0f0,0x8c7d5043,0xcb8383b3,
  44490. 0x946fd5fc,0xe77e3baf,0xe9ec0e87,0x79baa785,0xc8a18d25,0xd83c557c,
  44491. 0x25befcfe,0x9b96e5af,0x98c71b61,0x4f05d15e,0x77e62da1,0x081f991a,
  44492. 0xcbaa3821,0x1c6ec781,0xe54d9bfb,0x7522f65d,0x44ed1430,0xf5d05573,
  44493. 0x95cafdda,0x3035b31f,0x6378f5bf,0x47e67f43,0x5270b9d9,0x029f7cad,
  44494. 0x4d916a48,0x15ad1587 } },
  44495. /* 83 */
  44496. { { 0xaa588ae4,0x00de2ece,0xa371a232,0x552ebc58,0x71230444,0xd00ea934,
  44497. 0xe4b1832d,0xafbfa67d,0xb689e843,0x29216341,0x61f4e2e8,0x1f96bbbd,
  44498. 0x04c29dc5,0x95420684,0x42317fd1,0xc7fe3827,0x63483162,0xe0a0aec6,
  44499. 0x0700184f,0xfc2b94d1,0xfe1fbd85,0x07219973,0xfb074352,0x648b6ab1,
  44500. 0xc46e5392,0x23bbdaad,0x00fa56ff,0x0db8dd1f,0x866725f6,0x104815eb,
  44501. 0x52e81963,0x3f9c4cca },
  44502. { 0x32ce637e,0xff36b297,0xf5d25cdd,0x81a15f2d,0x8b02ad97,0x1a1d052d,
  44503. 0xcfbab3e9,0x2e5f3bbc,0x614eeb75,0x60d2cbd7,0xcd5a793a,0xd4491843,
  44504. 0xcdba2144,0x2242cf75,0x88b99766,0xa20705e7,0xec77e132,0x64e12cc0,
  44505. 0xb61a9b05,0xb1c14df6,0x74825b5a,0x8fd97f04,0x3da31223,0x95604821,
  44506. 0x4d30c70d,0xde486727,0x1c12ee69,0xbcab8f15,0x668d893d,0x5dc638b4,
  44507. 0x223f574b,0x6479dad6 } },
  44508. /* 84 */
  44509. { { 0xb05f2b26,0x569044f3,0x80b9f76c,0xb35a294a,0x4290f6ae,0x8839fe28,
  44510. 0x026a5877,0x761cfb23,0x2e5ff9c3,0x768926b6,0x0b11c576,0xbae6cd20,
  44511. 0x72a03efe,0xdc857756,0xe1bad63a,0x0cae074a,0xd709d99c,0x3fe491a1,
  44512. 0x6501d9c1,0x76c5ded6,0xc32aeff7,0x1da6eca1,0xc57683e8,0x50849d55,
  44513. 0xdf98d847,0x9e392e9c,0x64d9a564,0xfad7982f,0xa37b98b2,0xf7c3bdb7,
  44514. 0xf0860497,0x1fe09f94 },
  44515. { 0x7648cc63,0x49a7eaae,0x67cfa714,0x13ea2511,0x653f4559,0xfc8b923c,
  44516. 0x81a16e86,0xd957619b,0x3c864674,0x0c7e804b,0x1616599a,0xfc88134a,
  44517. 0x0a652328,0x366ea969,0x4bc9029e,0x41532960,0xae2aad2b,0xef9e1994,
  44518. 0x7f10bef5,0x9e2a8c52,0xc67bf860,0x73dcb586,0x844cc25d,0xf61a43fa,
  44519. 0x74eb3653,0xd74e7eea,0xdd240f02,0xf3356706,0xfd83bcb4,0xeec7694c,
  44520. 0xdb62526a,0x4de95786 } },
  44521. /* 85 */
  44522. { { 0x3deac2f7,0x4867d315,0xb61d9a8e,0xa084778a,0x0ab7b2d5,0xf3b76f96,
  44523. 0xcfdf4f79,0x00b30056,0x31ab8f4b,0xd0701e15,0x9c779d01,0x07f948d5,
  44524. 0x82675371,0x7c994ebc,0x48bad4c0,0x1104d4ee,0xbfc9d058,0x798ce0b5,
  44525. 0x309fa80b,0xc7ca898d,0xacb33eaf,0x0244f225,0x5b2f3175,0xd51e8dfc,
  44526. 0xa4d7be34,0x3e49ba6b,0xbda02b43,0x1760f4c7,0x4435275a,0x37e36a7e,
  44527. 0xe636980c,0x1c94418b },
  44528. { 0x09dc1414,0x43a21313,0x43c93537,0x060765fc,0xdf5f79ce,0x6ff3207a,
  44529. 0x85d4cfca,0x6f18b1fa,0x63e995ab,0xf5c4272e,0xa82b3002,0x121a09e4,
  44530. 0x97147f16,0x82b65d1b,0x20a7fe26,0x4993c20c,0xe6716726,0x99c9cb98,
  44531. 0xfeb440a0,0x5a02d673,0x251b4bc5,0x3f3fa9e1,0xa05338ea,0x75dbc474,
  44532. 0x7b09f6cb,0x3cb4044b,0x80434609,0x6767da18,0x098ceac2,0x97851422,
  44533. 0xb55235ba,0x611bfbb2 } },
  44534. /* 86 */
  44535. { { 0xf00ad2a1,0xbdbaa55e,0x14a290d7,0x29efa85e,0xe92b1694,0x3b4a4768,
  44536. 0x11ec8130,0x67111bcd,0x88bd27b2,0x0e425702,0xd9a03c06,0xf28cf2a3,
  44537. 0xf318884a,0xbb7c8d2d,0xe3aaeb20,0xe2ea1462,0x43b85d77,0x33535804,
  44538. 0x554ee9bd,0x81ee4482,0xe6aa198f,0xeb2eee9e,0xc26c5944,0x7a5aa804,
  44539. 0x82ab167c,0xa0ef2da5,0x02fe21a5,0x5a2ab476,0x3370298e,0x169cb3b8,
  44540. 0x0eb3aa8d,0x86e6c544 },
  44541. { 0x0b793d9b,0xede03321,0x1ddb5ece,0xf79fade1,0x68930b64,0xf73fda92,
  44542. 0xfe4fd1b2,0x06aad97d,0x92a4dc88,0x073a5b1d,0xbc976d75,0x8af8cbd8,
  44543. 0x63ce26c0,0x60b4abb1,0xdcb1fb06,0x9c8300a9,0xda95b3d3,0x335a594c,
  44544. 0xb37eac87,0x1f97d7d4,0x20eefaab,0xa3d2eba2,0xf3e828c8,0x3258c906,
  44545. 0x85ab7781,0xc832616f,0x8c28b617,0x72597192,0x3233b82d,0xcd7196bc,
  44546. 0x19fa126d,0x83867eb9 } },
  44547. /* 87 */
  44548. { { 0x22474edb,0x774fe73e,0x1a84e1ae,0x2a766394,0x9c6dd6e3,0x270329ad,
  44549. 0x14f8bf5d,0x00c4a415,0xd2267b90,0x3ce2ea37,0x11d24fae,0x12753015,
  44550. 0x263a1b78,0x7c14d854,0x1ae0b206,0x20c8401b,0x081f49fc,0xf32a011b,
  44551. 0x959c6df8,0x1e8123fb,0x800e1d06,0xa328dc7c,0x24259a9a,0x5876a378,
  44552. 0xb7ef6c37,0x23ada8b5,0xa93d4c9f,0x023f6b6e,0xffb6389f,0x89f5414d,
  44553. 0xe628b39e,0x4b26bba2 },
  44554. { 0x5d318454,0xd30b1cb4,0xd7436cb6,0x123b749f,0x568a7461,0x3110c726,
  44555. 0x1c84fd1e,0xc85de123,0x08403d55,0xa5f8d6e6,0x9b1fabf8,0x395b6e13,
  44556. 0x3cfedce0,0xfe6d68c3,0x94b91110,0x1d90381f,0x2dcc6eb7,0xf0a8ea81,
  44557. 0x7e90ca2b,0x59e80413,0xc8a25c5a,0xbeb5fc07,0x5d84663c,0x009c253a,
  44558. 0x910b6a7c,0x00b15073,0x4108f8d5,0x8607da4c,0xcb901e65,0x02c3d9c3,
  44559. 0x2c9615c6,0x4d697bc5 } },
  44560. /* 88 */
  44561. { { 0xefa8fb40,0xe0db1ef0,0x5ba3989c,0x29021c5b,0x809d19df,0xa8d6fb15,
  44562. 0x4c1219e1,0x6b787b73,0x14ef05e2,0x6417e168,0x8f9796e2,0x449342db,
  44563. 0xbf84421b,0x2f878a5e,0xe94a4536,0xe71916d7,0xae119693,0x9818bba3,
  44564. 0x5768804e,0xec674be9,0xf8424f8a,0x0a26074c,0x466ce6ab,0xdbc93b9d,
  44565. 0xc920078b,0xb3f15a98,0x3870f1a3,0x9d10fd0d,0xe4e785a7,0xa61241d9,
  44566. 0xe6c8cd80,0x76ca87a1 },
  44567. { 0xe02e48b7,0x4357fb56,0xcc09e9c6,0xfbd14b13,0x24069cf0,0xdb5f2435,
  44568. 0x2c3b01a9,0xf878165c,0xe6956dad,0xe549e7c4,0xbbd60b68,0xf2fe9538,
  44569. 0x059dc653,0x952f856b,0xb377fe9b,0xd3f60225,0xbfe908c4,0x6a0c7328,
  44570. 0xbc8f5f2d,0xce6aa2d3,0x24425050,0xf7213443,0x3d3b3ce5,0x17e1266a,
  44571. 0xc1677512,0x75b5e43f,0x37fb894a,0x15927062,0x2be3e375,0x15260753,
  44572. 0x6da3b7be,0x27e7f2c6 } },
  44573. /* 89 */
  44574. { { 0xe6a15883,0x638f65ad,0x66afdb33,0xd4a7e68c,0xd3f12de5,0x6207b6ab,
  44575. 0x37b87810,0x1c6ff950,0x64acf6d3,0xc0d44cb2,0xf2be78c2,0x163ac601,
  44576. 0x1636980e,0x1c63cc5a,0x95c9349b,0x3e92cfe8,0x41ec7220,0x7738e0d8,
  44577. 0x2d5fa961,0x6169d764,0xc3e028e9,0x2aa776c1,0xb16d5409,0x93dc5646,
  44578. 0x706df4d9,0xa0b27fb5,0xce9c6b97,0x9e991170,0x53c85f40,0xea8e42be,
  44579. 0x83246528,0x02e96437 },
  44580. { 0xae78ea1f,0x91540add,0x7b670e96,0x51a1b74d,0xf7006826,0xf9936441,
  44581. 0x7d7520c7,0x8f97d6ea,0x69ce12e1,0x0faa6a02,0x79208342,0x2590aca8,
  44582. 0x75614436,0x7a483863,0xf381408f,0x07c6149e,0xd7853406,0x733bf584,
  44583. 0x9abbb6f7,0x8761b010,0xf528a09a,0xe4eb249f,0x2e00ae3c,0x08781ed8,
  44584. 0x2178effa,0x864c1b25,0x9d513a7e,0xcc1e62a2,0x1919062f,0xedb8b94e,
  44585. 0x4f16527d,0x739f53da } },
  44586. /* 90 */
  44587. { { 0x924adc5f,0x7a5f4a88,0xa818f56d,0x95646c16,0x7795f954,0x0ec49129,
  44588. 0xd19c5400,0x2b48753d,0x205912b4,0x16fa236b,0xe87a4946,0x6b3d65f3,
  44589. 0x045fd066,0xa7174a01,0x12a5e140,0xb6350313,0xa96b8623,0xa79c4b44,
  44590. 0x9ab003d5,0x7a339d65,0x3826f31a,0xc72f30c6,0x6f7090cd,0xb4e7390c,
  44591. 0x906ebe24,0x59ac6c36,0xbba4505a,0x39a7f06d,0xc58c413a,0x839991e1,
  44592. 0xa20e0e84,0x020c23ff },
  44593. { 0xafc74661,0x120e4ada,0x277fc065,0x37bbcf63,0xb6dce799,0x41049cf6,
  44594. 0x7b161ba1,0x5b8d6b53,0xa9610fb2,0x22218431,0xdfdde769,0xde9ec9d1,
  44595. 0x42d80630,0xd32bfa4d,0x6244df4b,0x3885702a,0x45592dfb,0xcdedd1ed,
  44596. 0xfb4e01b8,0x0e1df45b,0x86e215b0,0x8f4bded2,0x6a937e6a,0x80935487,
  44597. 0x8130f723,0x415278ba,0x38a821f8,0xc6dc4692,0xfd8b4f8a,0x2207b119,
  44598. 0xf9269cef,0x76e7bf53 } },
  44599. /* 91 */
  44600. { { 0x27ebd187,0x5f128428,0xb65aadbb,0x8d3320ab,0x72258695,0xb042765a,
  44601. 0x8f0986ab,0xda3f33f9,0xaebff503,0x411807a7,0x825f71a5,0x25c776ca,
  44602. 0xff7df24b,0xc0de7bed,0x165f1fb4,0xda8b0f42,0x731f3ae3,0x5f3ff737,
  44603. 0x193e0a52,0x4cd1d7e7,0xb6b3ba46,0x8df84aa3,0xaa1f3782,0xba84b897,
  44604. 0xe7733ac7,0x6e7960cc,0x50981a21,0x4d46d6ab,0x7cbb80ed,0x1ec12c25,
  44605. 0x2b96ef09,0x79e7ad27 },
  44606. { 0x8f30caae,0x3cd970dc,0x0a6ebef4,0x85cabcf1,0xc714616d,0x63c1863e,
  44607. 0x519e3a98,0x1c50db0b,0x64cb13d6,0xf39b8963,0x22547b69,0xdf67d81f,
  44608. 0xd67db0cc,0x7157abb9,0x889491b7,0xccca25ba,0x7a27e0dc,0xf689207c,
  44609. 0x0fd43281,0x34ae8fbe,0x5720ec09,0xa5d91f73,0xcdfd7bed,0xb2f61909,
  44610. 0x4a039e32,0x1ec10232,0xdb0d8fdc,0xd3c3d65e,0x4fe5005d,0x32c916c8,
  44611. 0x4c0bea94,0x7f8c37ac } },
  44612. /* 92 */
  44613. { { 0x43ac05e5,0x33ec1e54,0xcd8d3825,0xda4a4da4,0x88bf9e2b,0x86d88c0b,
  44614. 0xb53811dc,0x34d71dd0,0xa3c3aba4,0x655040d2,0xb61611be,0x2bc40949,
  44615. 0x279a4fa0,0x1c2d426e,0x3b065ac3,0x535a5aa2,0xc52ea890,0xdaa8a32f,
  44616. 0x9fddad22,0x5a5deca7,0x2ab3b26f,0x911f05fd,0xf37cd81e,0x5dace7db,
  44617. 0x90d16b8c,0x0e0e44e7,0xe4f5894e,0x15e68aed,0xfc92a74f,0xafe04999,
  44618. 0x970e7c2f,0x1d7703aa },
  44619. { 0x3f0062a9,0xa8a4c81d,0xd96a20ba,0xe31eb2b8,0x864bd101,0x66dd98df,
  44620. 0x4413b614,0xba05f592,0xe9a555f8,0x51a67a0d,0x2e4b52d1,0xacc2f097,
  44621. 0x7184ab23,0xab5daaec,0x7c7f691b,0xce08b43e,0x76c427f4,0x520e530b,
  44622. 0xe423ebdc,0x7d352069,0x34df14ce,0x6b5e39e8,0x446305ac,0x3dcbf295,
  44623. 0xfe34cdc1,0x682cb2e1,0x111f5afb,0xd4ac45d1,0x47f296f9,0xc5ef63cd,
  44624. 0x93c20871,0x0a2c40ec } },
  44625. /* 93 */
  44626. { { 0xaf5747db,0x09bc384f,0xc06ab86b,0x3bad6086,0x9e7c1547,0xa406882e,
  44627. 0x55977abf,0x2d5326d1,0xda81deb0,0x063a9a05,0x524b6111,0x9a86e4a7,
  44628. 0x4ab2eb90,0x1402f87a,0xd5c600ba,0x7d0721d4,0xf289fdbf,0x1a2fd9a9,
  44629. 0xecde6f07,0xf5dce66d,0xdab9fa73,0x62171277,0x6c474bab,0x6d2dc49f,
  44630. 0x76eed033,0xdc017e1f,0x4da825d3,0xb97175c0,0x54b05e43,0x6c297e3d,
  44631. 0x56c9c87e,0x2efb4546 },
  44632. { 0x8b21c064,0xa4712b00,0x4a70629e,0xd186fe42,0x9b74f0af,0x6435b340,
  44633. 0x7ec9e629,0x6965aa43,0xc4c60d08,0xdda14673,0xbf3057aa,0x0b656670,
  44634. 0x3ce86f60,0x7f05e840,0x04401a16,0xc05073a9,0x294e607e,0x16b1e638,
  44635. 0x69cf7046,0x20783252,0xe8ce7d3a,0x2941141b,0x7577053d,0xd38ad8d3,
  44636. 0xcaa6630d,0xdba68fb3,0xe9504350,0xecbeaff1,0x1d2d760b,0x9f5166d5,
  44637. 0x462891e4,0x337532ce } },
  44638. /* 94 */
  44639. { { 0x3a00bb9b,0x3f111853,0x45f66685,0x2d2ffbae,0xd4aee24d,0x9ae11a85,
  44640. 0x0341856e,0x18ba1e1b,0x2731349f,0xa9ac8178,0x545715b5,0xc13dfd4a,
  44641. 0x5daad2ea,0xa5f7423c,0x535b76a7,0x30a483b9,0xff873e9b,0x92e9ada4,
  44642. 0x723a1055,0x15662d84,0x8edac4e0,0xb935497b,0x39d8fa70,0x61b6441a,
  44643. 0x40d1589f,0x1541d756,0xf0a05f0a,0x62994237,0x6bb28908,0xfd8b0034,
  44644. 0xd4cd32bf,0x192a2b5d },
  44645. { 0x365ced07,0x63576628,0x05de1d1f,0x029f32fb,0xbf40a7aa,0x6d17b9bc,
  44646. 0x9bb50a47,0x1b1b2a08,0x795a6278,0x9389abbb,0xb34fc19b,0x52cff60f,
  44647. 0x387d8739,0xf3ab9492,0x6920ccd6,0xa8f053e6,0x63a9b4f0,0x3ef2dd4b,
  44648. 0x51e82129,0x9ab0ede1,0x0838bfa1,0xafba0c0b,0x9ffc11be,0x2bd5a7ac,
  44649. 0x95cc0878,0x058bfd95,0xf8c2f0c6,0x686d48a3,0x1d9b31ba,0xc33abaaf,
  44650. 0x3bc0c268,0x632e2289 } },
  44651. /* 95 */
  44652. { { 0x15a1ccca,0x1c851d20,0x7e522bc3,0x4efe290c,0x18eab053,0x0b741d55,
  44653. 0xbc85e217,0xae656197,0x01cf8b29,0xae13141e,0x66948478,0x2e2cb593,
  44654. 0xc31bd8ae,0xeb57bb0f,0xc264e788,0xdecef5d6,0x9cb96d86,0x6fa856cc,
  44655. 0x279183da,0x2db16813,0x383d796a,0xf03f3820,0x1d0c6fed,0x58a456ff,
  44656. 0x8a6abd9b,0x25589805,0x83f96f19,0x339f52c5,0xda7e9ea7,0xcf6ded8f,
  44657. 0x5d1ccd45,0x68c3d9c1 },
  44658. { 0xe6b392b7,0x67e26265,0x775d9509,0xcec1d9bf,0xd76514f7,0xe16abcd4,
  44659. 0x0de72e1c,0xd86f59b2,0x1adfb033,0xa66e43cd,0x05e457cc,0xdb344340,
  44660. 0x5681daa2,0xb67a7916,0xf0114731,0xc32e7bab,0xd3b1e961,0x066fe16e,
  44661. 0xf63d26e6,0x924e298e,0x541add6d,0x9bea0dd8,0x9982f971,0xef9500df,
  44662. 0xc5f076ac,0x5c876e63,0xb23d396b,0x55e12ae5,0x2ec6747a,0x09efbb36,
  44663. 0x233286a5,0x8f2055ee } },
  44664. /* 96 */
  44665. { { 0xb82c1af0,0x4a4ab9e3,0xf2cae264,0xfc65e9e7,0x60187d46,0x4feaac0a,
  44666. 0xe393b363,0x27d3f335,0x819bacce,0x9c9f7c00,0xb8aa6611,0x3f7418b5,
  44667. 0x372aae95,0xffa94557,0x8db38589,0x937d7804,0x6f1fbc1c,0xd10c86df,
  44668. 0xa2f0a0ce,0x48aebd89,0x367439eb,0xae5d5fa2,0x3f17d2d8,0x103a6a0b,
  44669. 0x411d9894,0xf233f68a,0x218b67a2,0x7fece8b3,0x2319bf06,0x0422540f,
  44670. 0x340d322e,0x1292c8c9 },
  44671. { 0x0386463d,0xf5eb5587,0x0371d97f,0xd4bbc2b2,0x0b819c5a,0x1b364571,
  44672. 0xcf04ad41,0x0cbb42d6,0x66939ec1,0x5d819c76,0xa01847e7,0x8745ac13,
  44673. 0x1c7232e4,0x4f704b02,0xacb05780,0x2c9e58a0,0xb561e295,0x9523b8b3,
  44674. 0x79f9ba35,0x3384df00,0x1eaa9628,0x78231fc2,0x8aea2b90,0xa2eac54f,
  44675. 0x30d1c263,0x8075ed77,0xfb339000,0xacb44ed5,0xf011293a,0x92546ac2,
  44676. 0xeb821764,0x7c78762b } },
  44677. /* 97 */
  44678. { { 0x067902b6,0xb8f7d6fb,0xd1735980,0xb2823a43,0x59741ddd,0x062cfb12,
  44679. 0x4033f95c,0x6e391b07,0x68589b8c,0x3831d0a3,0x522290f2,0xe3474d49,
  44680. 0x222e1f3a,0x4dab14d6,0x53f08d39,0x8f00fcde,0x707f28f5,0x559917ae,
  44681. 0x068e607c,0x166aa0ba,0xd7e1f824,0x602713e7,0x4d6a328f,0x7c255540,
  44682. 0x9890cd2a,0x0d2e3264,0xeca0b20a,0xf2207944,0x52f4e09c,0x5c98dc07,
  44683. 0xd84de81d,0x69403504 },
  44684. { 0xe5407206,0xf8b7b366,0x0d88fa8c,0x1ecf54cf,0xf7272e6f,0x6fefe548,
  44685. 0x81ab4468,0xd6531372,0x4e474408,0x52cb5f0e,0x6490737f,0x9e426b3a,
  44686. 0x4980d071,0x2576c19b,0x0f272caf,0x91f34628,0x468f31c9,0x78e60a4f,
  44687. 0x90844d89,0x8776a329,0xb951582b,0x8a55700c,0x14b1adbf,0xab1af365,
  44688. 0xfbd343ef,0x22ebff92,0xb7d81f34,0x32f9fb01,0xba6b30e1,0xad850e06,
  44689. 0xbc5f9546,0x6da9e027 } },
  44690. /* 98 */
  44691. { { 0x5c9490ce,0x21eee4c2,0x0df68381,0xa96ec4a3,0xa4a9368e,0xe6c607e0,
  44692. 0x4bc262f3,0xd8b0492a,0x460c34ff,0x0846a210,0x28df33cd,0xf7ff7a64,
  44693. 0x21827612,0x10c55044,0x149bcd01,0x9d25fce9,0xcfc613dc,0x725611cd,
  44694. 0x97f51ce5,0x159f7e88,0x4e8c08b5,0x3fa3bf31,0x75e7538f,0xea156115,
  44695. 0x91c84020,0xd1e0a951,0xcf02ad0a,0x0d2268ba,0x058b8e5f,0xa04c6ac4,
  44696. 0xb3515912,0x773b40b9 },
  44697. { 0x3631cfd2,0x00ff2cdc,0x807737bc,0x14c4c2d3,0x338a5270,0xd600616a,
  44698. 0xb32cabde,0xd0e3306d,0xa70b17ca,0x336738ea,0x79f353ee,0xf2f4aa8d,
  44699. 0x576f3ad3,0x712f6ad9,0x89b2bce0,0xe4279852,0xda92ca30,0x05d8f94d,
  44700. 0xd8492dd9,0x9891d475,0x4d15e4bd,0x3e06a5ca,0x254eabbd,0x4725d4eb,
  44701. 0xc0ed513c,0x31394ace,0xbbfaae6c,0x7e0f9859,0x833fd137,0xdc125546,
  44702. 0xc56c4f75,0x12b46385 } },
  44703. /* 99 */
  44704. { { 0x932951de,0x810dbebd,0x5aa69c94,0x96959d42,0xecb2f08d,0x5fc49c04,
  44705. 0x2250b82c,0xac74f0cc,0x3aec4e1d,0x96a439a5,0x90499acd,0xc33cab9a,
  44706. 0x54d9b3af,0x2fccde66,0x3863ae8b,0xf4af285c,0x46febf88,0x2373373e,
  44707. 0x3c9ab7ed,0x751d672c,0xfe12020c,0xc1c51130,0x52f3e56e,0xad82402f,
  44708. 0xa4a64a81,0x3489ab7a,0xd9f163f2,0x0a1fb661,0x0e553317,0x17c69be1,
  44709. 0x7d88d417,0x61c1935e },
  44710. { 0x3492ae43,0x2e722d9b,0x0538f05a,0x1ef89d95,0x200aab63,0xae77e588,
  44711. 0xeba4b117,0x2872c120,0x3a461cb8,0x5c2432c8,0xcb938f26,0x315b3434,
  44712. 0x8c4c7dc0,0x05bf2ac5,0x596b378d,0xd2e501dd,0xcb890c30,0xa8506c9f,
  44713. 0x7c361f0c,0x3d0af461,0x5a35cbae,0x21f7b718,0xf3fc0138,0xbd1035f1,
  44714. 0x8b248edf,0x74628af5,0x48c9cae0,0x8d6421d0,0x2ca18773,0x75e3da39,
  44715. 0x71d3db94,0x27ad0df2 } },
  44716. /* 100 */
  44717. { { 0x305b5aed,0x9e3bda79,0x5998d6a7,0x2c67d4a4,0x0f7eb700,0xc855e1d3,
  44718. 0x147d1c44,0xc18a7e9e,0xc89540ed,0x3ea99618,0x7e6bfd20,0xa53be20a,
  44719. 0xecc14437,0xc9487e64,0x34ef85c6,0x72979207,0xd5e1ebd5,0xfa0d4e71,
  44720. 0x4d48d6b6,0xfda2b1e6,0x66e200d4,0x782a1e05,0x5a5366a1,0x2a3c70da,
  44721. 0x1a473738,0xfe3fbd2b,0x7fe020e8,0xd7ef8c06,0xeacfb665,0xec686fde,
  44722. 0x6dd1542f,0x5d9b5e27 },
  44723. { 0xcb3e472e,0x3637c5a5,0x30a1405e,0x2153d927,0xb4498558,0x009992e5,
  44724. 0xf39a0851,0x18f00ccd,0xb5c6c560,0x26237c11,0x1343540e,0x418ed408,
  44725. 0x7e7f3184,0xfef7cbf0,0xbf48576b,0xecd92366,0xbc94c91a,0x1b75be1a,
  44726. 0x4a162276,0x8e1778de,0xc5c6bcb8,0xc52e57d3,0x5ab71858,0x5cc382c7,
  44727. 0x3f6e39f9,0xe12c2c28,0xd62735fc,0x4c7e0ef2,0x835a5996,0xe071deb1,
  44728. 0xcbb8c766,0x24f891cd } },
  44729. /* 101 */
  44730. { { 0x6778c1e2,0x24ef60bf,0x00d5be5c,0xff49c03d,0x2f01a09f,0xec11986e,
  44731. 0xae096e58,0x59a728a4,0x7077984c,0xaabbcedb,0x870ca5a5,0xfb473bd2,
  44732. 0x4de30e3d,0x8c928c61,0x4f67abca,0x3fae7f9a,0xec21a9cf,0x83c2b2eb,
  44733. 0x9cd9b5de,0xafa70d62,0xc60b18df,0xadeaea59,0x4049b54c,0xd5fef7be,
  44734. 0x6dd310e3,0xfceebc76,0x8f6321cc,0x7748efe3,0x18ee8af5,0xfe9c32b1,
  44735. 0xd42df612,0x863ac3cf },
  44736. { 0xb85a2fe2,0x0a36fca7,0xee429dc6,0xf3e70d08,0x141c3944,0x8c9ba209,
  44737. 0x67272a0a,0x306a8106,0xf968bd06,0xe69a1555,0x153c603d,0xb86f7e47,
  44738. 0xef56e4fa,0x9706614a,0x98780b4c,0xc0dc36b8,0x3a1d3263,0x43657fe2,
  44739. 0x435522c9,0x01f97a86,0xedfef679,0xd91897f6,0x6daa17a0,0xebbe31d4,
  44740. 0x85accfbd,0x6f179100,0x8f9fc1de,0xe0da6e32,0xe1e7142c,0x1c9d53db,
  44741. 0x8b86725a,0x3e3f1b1e } },
  44742. /* 102 */
  44743. { { 0x7b7fbf05,0xb7ea15c0,0x1f1a3882,0x992f11b6,0xd1dcd1bc,0xc9ddd95a,
  44744. 0xad0f7e8b,0x31f5b7fa,0xfca7ab79,0x2936e5eb,0x19a55be6,0x30f417dc,
  44745. 0x43cde554,0x1f6f4e43,0x82f044bf,0x971f5e65,0x4288c408,0x73c3b8e4,
  44746. 0xb807f575,0x61aac59f,0x818b58f0,0xa64ee2dd,0x97a3b0d3,0x6f7a0a60,
  44747. 0x0394b058,0x8b85ecc8,0xbfb3517d,0x9a059474,0xa79c3f06,0x89ad5977,
  44748. 0x700a8025,0x81208ed8 },
  44749. { 0x14c4ce37,0x10935099,0xa1aa48a6,0xf34bb843,0x580d58e8,0x86007024,
  44750. 0xb375b8ba,0x6db42c49,0xed3bde83,0xac365524,0x649233b6,0x5521e1b4,
  44751. 0x64dd946f,0xbc7cc5d5,0xbfb5b6ae,0x9c14b035,0x0146c1a3,0x7f22ba18,
  44752. 0x872214f5,0x0b62fbbc,0xb4921764,0x3acfd7f7,0xcb4d6df1,0x5ff10da1,
  44753. 0x62600a91,0x660e2620,0x81d9167f,0x7ac7da9d,0xb6e7a199,0x6e8e260c,
  44754. 0x80deb3c2,0x44383fb8 } },
  44755. /* 103 */
  44756. { { 0xe44f9af6,0xe107f01d,0x8cb1fa1c,0x36381a4d,0xfb7dd493,0xe65be3ec,
  44757. 0x26a8839f,0xd0b8435a,0x3ec789d8,0xee60f915,0x2bcc5e1f,0xe25fea50,
  44758. 0x7e44a81c,0x0477c0c5,0x230ba5b8,0x349e9f83,0xde180dd9,0xdd42f32f,
  44759. 0x64a3d11c,0x8b039eaf,0xbeb7083a,0x80ef884e,0xf12742cb,0x288e60c4,
  44760. 0x720a0262,0x44156cc5,0x7253b77f,0xcd547de6,0xa6013a59,0x9829a6ec,
  44761. 0x0d548445,0x8aee708f },
  44762. { 0x32c54409,0x18f22d9c,0x75ebaac4,0xa9ebfa46,0x86284981,0x90e2e928,
  44763. 0x6b3a8e0c,0xd0201f6f,0xbd77641e,0xc973016c,0x70170575,0xf926f2f0,
  44764. 0xfec0ce01,0x4984048f,0xf319d304,0xbf696211,0xc91a88c4,0x74b5c844,
  44765. 0xe0030a82,0x4c40fbce,0xe4f6d521,0xbed67525,0x29d67d1e,0xaf7e47cc,
  44766. 0xc21d3536,0xfa307db8,0xbbb29405,0x56b6c46a,0x033e805f,0xf059a7e3,
  44767. 0x6096a5a0,0x970f61fe } },
  44768. /* 104 */
  44769. { { 0x1bec8e4a,0x1bc53d23,0x35a6034c,0x8809ac14,0x509e464d,0x4ee081da,
  44770. 0x8a488235,0x496ae1fd,0x325864b6,0xa1ae9863,0x74cd069f,0xbaca13e9,
  44771. 0xb1d8a6b4,0x3738cc58,0xe76b9da4,0x5fa71f58,0xc7eb16fb,0xc919be88,
  44772. 0xad4e429d,0xf5c8f13f,0x2499f9ed,0x4583b671,0xa10d8bd7,0xbce20115,
  44773. 0x5790bb7e,0xf66d7605,0x482b78dd,0x9316aede,0x75f855fa,0xe0d8fb2d,
  44774. 0x5a7dcca7,0x404b5b94 },
  44775. { 0x517a15c7,0xf9ee682a,0xef880202,0xaae4cfbc,0x5106a354,0xcee2c139,
  44776. 0x170febe7,0x5de60192,0x73d0c54b,0x589e39fd,0x8c9092b7,0x195c7135,
  44777. 0x0a7bfe5f,0xcb7ed53f,0xf61cc979,0x2bd9242a,0x5395f7d9,0x8d2ef16c,
  44778. 0x70b32f09,0x0d4ac1ca,0x52d185c1,0xa587526d,0x942d6195,0x2932b04a,
  44779. 0xa500b0ac,0xfe25a979,0x562fd230,0x5fa1f4ae,0x20da253c,0x60f55af2,
  44780. 0x83146002,0x7faa11b5 } },
  44781. /* 105 */
  44782. { { 0x6e402149,0xb0ba4f0c,0x963cc119,0x3584cc1d,0xa6527476,0x7740dc1a,
  44783. 0xc95715f2,0x3f77ff75,0x3f89fb0e,0xb2f234ad,0xef9be3ff,0x55159032,
  44784. 0x04237e82,0xfc9fb21d,0xa153ed93,0xeb2eff38,0x10041d13,0x89d53ae0,
  44785. 0x7f1bd828,0xcf2e545b,0x43953ea5,0xdd4a27ce,0xd85e75c8,0x00d2e5d4,
  44786. 0x241be1c3,0xeb93ed62,0x0242032d,0x1e53f25f,0xc3a4e701,0xb9957636,
  44787. 0xed98febf,0x14b63a52 },
  44788. { 0x71c43336,0x7610b553,0x23a4824b,0x19dfd4a6,0x0286051b,0x7b97a2e0,
  44789. 0x8f5f1edb,0x86abbb9c,0x9b67daad,0x67a57d77,0xcd5ffafb,0x8ace506d,
  44790. 0x89ac3c63,0x85da9f95,0x75a3d150,0x081cbaa8,0xe9346ed2,0x03353d8f,
  44791. 0xa1f9a02d,0xb2ab61f1,0x3a659c71,0xb0cb0937,0x4f5df8a1,0xb7e0e30b,
  44792. 0xeb7d5a1d,0x77c4c741,0x728e5cf0,0x8f046c9c,0xf7c171ac,0x32dd0bc7,
  44793. 0x836d2655,0x02485873 } },
  44794. /* 106 */
  44795. { { 0x75a4cd8d,0xcd40dd23,0x97bcba78,0x132ca433,0x258d61f5,0x30c5cd84,
  44796. 0xda1e8e68,0x0a7ec059,0x1d65d40a,0x07a8f171,0xf4350d76,0x869e655e,
  44797. 0x5983ae42,0xb98ce6f0,0x9d8bebd0,0x7b61391d,0xb1ba5d49,0x3a529e25,
  44798. 0x1f6b2cf6,0x46f732e9,0x3fa3b629,0xbd66ec6a,0xc3ef0ed2,0x397950ec,
  44799. 0x5f08b476,0xee9008cb,0x965a0e2e,0xfd6be425,0x1177bc87,0x78ed513c,
  44800. 0xfe512dae,0x6798cedf },
  44801. { 0x1b97c5c6,0x49e3f8fd,0x78c3b33f,0x39fbab3e,0x40f595ba,0x44274412,
  44802. 0x5d7d4376,0x174225b9,0x79c44777,0x880b3fcc,0x3296b245,0xdc3aca83,
  44803. 0x1734e184,0x55913df7,0x9c934472,0xa4db23d3,0xd1420a11,0xcebb3733,
  44804. 0xf3608bdc,0xb9d20cf9,0x30cfe13f,0xa618acf6,0x5f30874c,0x75f06b31,
  44805. 0x9f0005a5,0x506efe7f,0x01bfc9db,0x8aaea78c,0xf78e7c41,0xf9179255,
  44806. 0x52e96395,0x3ea7aed2 } },
  44807. /* 107 */
  44808. { { 0x5b06ae25,0x98617e04,0xcb5750ef,0xbcac148d,0x604c2ba2,0x91ea2f0e,
  44809. 0x76b78975,0x00c19f6b,0x651da181,0x79b9b6d0,0xc945705b,0xf3225beb,
  44810. 0x5c005bf1,0x30b435f3,0xbc24d86d,0x440b4482,0xd6373777,0x2b8f0996,
  44811. 0x1c44b4dc,0x65fd6c56,0x30906999,0xe9405ee6,0x08aa1ec1,0x19ff0924,
  44812. 0x3d2f2895,0xeef3246a,0xbc746797,0x016c3765,0xd0705f7e,0x62d2569f,
  44813. 0x05250044,0x6a8ad39c },
  44814. { 0x46be7282,0xe45f020d,0x21380f12,0x9405afed,0xd5da6ad0,0x4cdca5bd,
  44815. 0x7f8be61e,0xc2d6f184,0x596b8178,0x20132953,0x7a8df954,0x8d3b1e7b,
  44816. 0x39572b4d,0x757c61bb,0x80cc3b56,0xd749b57b,0x37b3ffec,0x9590ff93,
  44817. 0x145dc94d,0x39bbb653,0x2335e573,0x70c1c606,0xf763feba,0x9c2e72d7,
  44818. 0xcc61b732,0x4768e424,0xaa73f2ca,0x777d2fa6,0xc5cb58cd,0xdee4dbaa,
  44819. 0x9cfae1aa,0x1a181179 } },
  44820. /* 108 */
  44821. { { 0x77575ed0,0x6f6ff62f,0x7d1da99b,0x18f14fa9,0x69efd7f6,0x2e72aefb,
  44822. 0xddc28633,0xc45ab4cb,0x586c5834,0xb0e20d48,0x39775dd8,0xd397011a,
  44823. 0xf4134498,0x0130c808,0xf5115ed8,0x2d408eba,0x0260ded9,0xc506a05c,
  44824. 0x19cab911,0x9e5b7362,0xe8693a86,0x4cf508c6,0xcc773617,0x4e71245f,
  44825. 0x95d89ca3,0x2f71aa1f,0x607bbc98,0x4bba7c6a,0x212b7fd2,0xf3a515e7,
  44826. 0x9230f5a8,0x7d2ddc75 },
  44827. { 0x4ed2cae8,0x3d05816d,0xb9c00377,0x4cf6bc7d,0x646b08d4,0xc23e98e6,
  44828. 0x4b9c0180,0xf9ee6c61,0xef9179c1,0xe11c9a13,0x8ed9688a,0xa5b6147e,
  44829. 0xd06670a7,0x7afeb648,0x17685275,0xd670333c,0x75f9e8f2,0xa89dd969,
  44830. 0x37a68ade,0xbb57228d,0x454cb186,0x21a05d5e,0x063dd550,0x4810158f,
  44831. 0x4cb6caf3,0x92dd4f08,0x7854abe7,0x70c4d852,0x6e729d76,0x845969dc,
  44832. 0xb1bf40ba,0x5a52f87a } },
  44833. /* 109 */
  44834. { { 0x09ecacbd,0xed019e91,0x7b89bdea,0x6544023d,0x5707371e,0x7cc51f0b,
  44835. 0x16c8e217,0x14832b04,0x81259ab5,0xb1aa6682,0x23e361d4,0x6e100f92,
  44836. 0xe3a95c2a,0xe593eee9,0x16c10e26,0x699b6bbd,0x9473a13f,0xad487873,
  44837. 0xb274987c,0xf1c14dc5,0x2559e2e9,0x57dc0075,0xc3d47ad2,0x8449849d,
  44838. 0xdd527793,0x83df278a,0xeefd5b99,0x770e3ec8,0x76bd02a0,0x2ae58446,
  44839. 0x3e705ffe,0x17f02764 },
  44840. { 0x29abea1f,0xdda4010d,0x2407ac4c,0x636b9695,0x0433218b,0x96a60129,
  44841. 0x163d534a,0xf221fc3b,0xccc20565,0x05ba15be,0x96285577,0x1238e54d,
  44842. 0x878804d3,0x1b144257,0xa89a9fe4,0x96fbf304,0x4be642b1,0xc8a7f06c,
  44843. 0x6e2b085e,0xdd1a20e8,0xff4a591d,0x8f7f27c2,0xa4a343b8,0xc17b0753,
  44844. 0xbb173d4d,0x684b1e88,0x3dc07bbe,0x3accea44,0x4c441d77,0xdb15c88d,
  44845. 0x53e5957e,0x0ef0309a } },
  44846. /* 110 */
  44847. { { 0xfa8e5b60,0x4fc25721,0x691c0bb2,0x646938ad,0x0b0a2248,0xe46d4b76,
  44848. 0x7de16877,0x863f9ac2,0x2721c630,0x503bb6ef,0x0b67fb02,0xf8c199df,
  44849. 0xe07abd39,0x78c1ed72,0xb32f0dda,0xcf9deb7b,0x6c3c89f3,0xaff726f0,
  44850. 0x1972225a,0xb7008b2d,0x4f145f5c,0x8f5a6117,0x457c4f37,0x4e0e6f8c,
  44851. 0x1c453c64,0x8bbdaa44,0xa6e92c80,0x57be326d,0x5d773561,0xa9bc3fd9,
  44852. 0xbb37b72a,0x3d3b6cc6 },
  44853. { 0x9722c880,0x6e6f12cc,0x286b6889,0x3a1b6ae7,0xad2fafec,0xba1cc09b,
  44854. 0x43bb8bef,0xad64ad7a,0x97c3f4c3,0xa5af6a00,0xc353a91b,0x2afcb0d9,
  44855. 0x69ccbf6b,0xca13fcab,0xf2abc190,0x699a1391,0x23a247e5,0x2dbd5542,
  44856. 0x95488d9a,0xe206180f,0x1244cc3c,0xba9e7bff,0x87d3a365,0x29297abe,
  44857. 0xfa4ca5e2,0x4054fa38,0x67be1b6c,0xb390623d,0x78f41a44,0x1fa67c57,
  44858. 0xc7b544e7,0x2e946e43 } },
  44859. /* 111 */
  44860. { { 0xc60934ae,0x2980fddf,0x164206d1,0x2c3e7eff,0x416ed75a,0xf75e7f96,
  44861. 0x5cd0b2dc,0xfac60cf3,0x1faad87b,0xddc4bece,0x9849e5dd,0x753fa87c,
  44862. 0x2c1bf1ae,0xc5d516a3,0x14732b4b,0x565dbea8,0xce48696b,0x007ebe3a,
  44863. 0xcdb97694,0x40ca74d6,0x65e4e7be,0x3f5cd270,0x3aac4ebc,0x74847c01,
  44864. 0x43d6c3a1,0x6762e034,0x467a076a,0x690d8c95,0x1eda677d,0x768d78d6,
  44865. 0x0181d8c2,0x0997ce55 },
  44866. { 0x965a0b81,0x9297746c,0xe5e12dfa,0x48b58be6,0x715f437f,0x5573b3c4,
  44867. 0xb565c459,0xe425e907,0x1582797c,0x4f43f512,0x8ea5474f,0xe5dafa6f,
  44868. 0x13de04ac,0x2aeb8fbe,0xe8a07c83,0xed7f95f0,0x662c09fe,0x3e012a6e,
  44869. 0xc742cf17,0xbf96e9b8,0xe28a1c45,0x8ea5759a,0x5cf4e2f3,0x475941b4,
  44870. 0xf901a019,0x7dd3c02d,0x70916b2e,0xe7a4deea,0x2fa9b988,0x50b272b5,
  44871. 0xd0917fe6,0x96f9f09f } },
  44872. /* 112 */
  44873. { { 0x2c310a96,0x78e8aac4,0xf7a2a734,0x32a98303,0x23962207,0xc46ca83d,
  44874. 0xd9541280,0xad131e6e,0x2cabe911,0x5791fc5e,0x841b6c68,0x50cb77eb,
  44875. 0x3d3c8878,0xaff93dea,0xf1007bce,0x06541f1d,0x55cdf1fd,0x4ee729c2,
  44876. 0x323e3972,0xe0f71317,0xad4d08c1,0xa2de7a41,0xa35e22bf,0xa9912abf,
  44877. 0x89b03325,0xa050122b,0x06514d4e,0x8b9e51f4,0x79d3e0ab,0x423c7aad,
  44878. 0x40b8fea5,0x71998e26 },
  44879. { 0xceb6ed78,0x40140fcd,0x18534516,0x653cf377,0xe8d60dcc,0x0450b65a,
  44880. 0x9dac55f8,0xce6c1a76,0xae05686c,0x8a96a92d,0x12712562,0x2fe44762,
  44881. 0xa4f39425,0x747bcb50,0xfc531fc2,0xf0ec6ff2,0x10fe9ff0,0xc97c3447,
  44882. 0x9c792cff,0xfb488783,0x026fb019,0x552c5248,0xd804c290,0x4001a29c,
  44883. 0x35c8ca73,0x742b5ad8,0x6ee5dfa0,0xc3781f17,0x3dfa4ab1,0xca6b85f0,
  44884. 0x0b0d32ac,0x8389941a } },
  44885. /* 113 */
  44886. { { 0xde067dff,0xc0f062a2,0xbcb80162,0xd4f32690,0x0707a2bd,0x98cd990d,
  44887. 0xfae4a391,0x5afc63b8,0xb32ad814,0x684f1b7b,0xf199dfb1,0xb0a2dce2,
  44888. 0x48f25848,0x2260e17f,0xc2d5e862,0x7393db00,0x338cf171,0x9e88f854,
  44889. 0x02acf522,0x00679429,0x6835af3d,0x19157cb8,0xb8a2614c,0x2faa6f92,
  44890. 0x134ec46c,0x04ff95f5,0xfb7a8135,0xcf00626e,0xb37a4704,0x454b3d05,
  44891. 0x2694ec25,0x1fbfda31 },
  44892. { 0xc8f69c77,0xfdebb657,0xa3df88fa,0x92a8278b,0xc1fb78b4,0x463b5571,
  44893. 0x11c71a33,0xd2066a1a,0x089958b0,0x10c88143,0xcf9d67a6,0xb975c7e0,
  44894. 0x73037b8f,0xdaa5d208,0x40bf5861,0x5ee5005d,0x7dba69a9,0x300e6ce7,
  44895. 0xc962cc74,0x893c3cb3,0x4cf84055,0x0ac98629,0x225c9d70,0x0a7ef63a,
  44896. 0xb91e47e8,0xfe184869,0x8c2f84be,0x1b9d7deb,0xc0e278bf,0x67788915,
  44897. 0xc426f19e,0x4f9488ca } },
  44898. /* 114 */
  44899. { { 0xdd51b8ce,0x610dfcd4,0x36230e80,0x08579278,0x36599562,0xedc7ff1c,
  44900. 0xe2cae877,0x905ead4b,0xe7967608,0xa1c325d9,0xbd38926c,0x3e39eddd,
  44901. 0x5f6f0a4e,0xda92c868,0xf47a0fa4,0xe16f800a,0xe5f60aab,0x50b4db5b,
  44902. 0x983853d3,0x3665412f,0x9b79789c,0x64b62250,0x4e0e72b2,0xea560058,
  44903. 0xe555c2bb,0xabbd4901,0x17292e11,0x378419a7,0xe174218f,0x6e0b5aaa,
  44904. 0x8f796b92,0x688e0684 },
  44905. { 0x313b8f64,0xcdfef641,0x942c7462,0xaef11b7b,0x5c0d8abd,0x067cfb77,
  44906. 0xaf4041a9,0x608ea5f0,0x6935210f,0x23d5bd82,0x27917a08,0x5ab904fc,
  44907. 0x45d22d21,0x85dbb1fe,0x4d36159f,0xc3d5e509,0x1d39b8f2,0xaebb528e,
  44908. 0xf44acef0,0xdd5ca828,0x20c57a54,0x24209adf,0x78f95f44,0x5742b433,
  44909. 0xa9337d37,0xd11fa7d9,0xc64cfdb7,0xd66a0c09,0x9bb817ec,0x56e55b8f,
  44910. 0xe4c41265,0x1723c7e3 } },
  44911. /* 115 */
  44912. { { 0xdc8b43f3,0x9a6486d8,0x26409e68,0xfc3e0e61,0xd9b46003,0x1889c437,
  44913. 0x6284ec7b,0x3a850335,0x6a9dbaea,0x5a3665c4,0xe978933c,0x7bf6941d,
  44914. 0x69341490,0x1ed5a510,0x8cb8002d,0x664a7b7a,0x60ed0a59,0x603f76e4,
  44915. 0x1f4ebf27,0xc3e06ba3,0xf2c38a7f,0x296ced41,0xcf1db08a,0x2ac18f79,
  44916. 0xcde7a3b6,0xc919e882,0xdbf68b06,0x15e77d29,0x4e947cb5,0x21978baa,
  44917. 0x7630993a,0x84bf542b },
  44918. { 0xe364f21e,0xc1decda9,0x012e557e,0x0d6cf345,0x588f90e1,0xba246848,
  44919. 0xe3b104b8,0x9f6dda4b,0xe3aef57a,0x6bf7a346,0xe8327ea9,0x210299fe,
  44920. 0xda95e6c7,0xaa99f487,0xd2cdf645,0x24ff813e,0x8bd414b8,0xd1dbb2d2,
  44921. 0xcafa1a61,0x065101af,0x9cdebda4,0x7d9f4b9a,0xe41039e4,0xaf41b395,
  44922. 0xc50adf42,0xe3e9e6ba,0x341e9e49,0x4f2133ae,0xcb157f23,0x4968c0f3,
  44923. 0xda068153,0x383f827b } },
  44924. /* 116 */
  44925. { { 0x6583ff4c,0x2ec46a21,0x4ad709e7,0x4e645a29,0xc04ca12a,0xdc66e9cf,
  44926. 0x9160a7e5,0x82f128f4,0x569c762e,0xbfb227b1,0xc2edb8e7,0xf80c7963,
  44927. 0x49a0f688,0xa7dafe06,0x2d14b8cc,0xb7e41754,0x86de40be,0x3a0c5c53,
  44928. 0x1db79331,0xf0d05286,0xfbfe071b,0xb902ce69,0x210e9903,0x61e46956,
  44929. 0xf703ebb8,0xfaef874e,0xdd5f78b6,0xf668947e,0x5af5ea3a,0x6fe86547,
  44930. 0x43f94625,0x3b121f15 },
  44931. { 0x659275e9,0x5b26e847,0x6d0fce50,0x47581cfd,0x8aa3f1ef,0x55f5cbfd,
  44932. 0xe484e60e,0x1e7be315,0xfe9698e4,0xd8f1a20f,0x7ab04784,0x25d46da9,
  44933. 0x834cdb3e,0xa526db75,0x8d08a009,0x1fd408d9,0x5b5ca816,0xfc004b20,
  44934. 0x65e4bbe8,0x5b3e3bb3,0x759bb6ef,0xf50cc125,0xc2fac737,0xf05fa817,
  44935. 0xd273951a,0x9ee102d2,0xfecb3367,0x2a8e540b,0x2a6a515f,0x673446fb,
  44936. 0x37290c83,0x5505e1d1 } },
  44937. /* 117 */
  44938. { { 0xd15e68a6,0x0c3014a1,0x64dd35e5,0x6f9f0b26,0x03ad67f9,0x18c3742d,
  44939. 0xd2c14484,0x74818c0e,0x0d41a3cb,0xc5181169,0xc49f3e9e,0x65c8c83f,
  44940. 0x2c279386,0x9b260c61,0xced04e9c,0xf6086fae,0xfd7c4758,0xa7b2cceb,
  44941. 0x90297fd8,0x4b3c3133,0x09701ac8,0xca8264e8,0x508b3762,0x9f976a87,
  44942. 0x983a8dfe,0x5d582714,0xd9d598e9,0x350d2669,0x0f6fd348,0x85cb89cb,
  44943. 0xa574317c,0x617d80d4 },
  44944. { 0x70022b67,0x4cef267e,0x3768b94a,0x80536bb5,0xd2784462,0x3153a566,
  44945. 0x38243919,0x49054d44,0x5df78c4a,0x8d11e172,0xd5a1e35a,0x9b252a71,
  44946. 0x8171e31d,0x07866c80,0x1b38a00e,0x0a8501db,0xce770236,0x2ed932b8,
  44947. 0x8edaf7d0,0xa2d77609,0xb93006e9,0x3aee5dab,0xbbfeb036,0xfaffc8c4,
  44948. 0x4e21b38b,0x077b9678,0xdca8e069,0x491fc59f,0x0e938471,0x3f624f55,
  44949. 0x7cd1780b,0x5156f508 } },
  44950. /* 118 */
  44951. { { 0x0206e8d0,0x58234e22,0x7f15af32,0xf5f6f5d4,0xd638950f,0xafab7289,
  44952. 0x7d4495f4,0x66ec4d09,0x68da80a9,0xad890c5d,0x64f8a36b,0xe4aa0920,
  44953. 0x0f4d5c5f,0x799e257e,0x24495e31,0x44c677ae,0xa5b8e352,0x720387b3,
  44954. 0x75a287b9,0x703790f4,0xc3c1f2f7,0x54895cc5,0x41a7fa41,0xb8680f9b,
  44955. 0xb00b008b,0xfcd47458,0xba6473cb,0x149cc838,0xac9be19a,0x78ed5f7a,
  44956. 0xb33765ba,0x5254599c },
  44957. { 0xa21b54c4,0x08739679,0xb6497d9d,0x029ece2a,0xc8488640,0xf14f1a92,
  44958. 0xe9fa79d9,0xae48dcff,0x46c208db,0x14b911c2,0xdae3f69e,0x5ab0fbf2,
  44959. 0xd1edb838,0x180ac87e,0x188586bb,0x146fd718,0x5467cbd0,0x210eb654,
  44960. 0x1667cfee,0xaa239408,0xb73d1a60,0xdb125c1a,0x881c1cbe,0xde685300,
  44961. 0x37c30232,0xfe34c713,0x6f3c8d18,0xc6c6070e,0xb4af4e83,0x07e365ba,
  44962. 0xdcf82b45,0x22f0a7ed } },
  44963. /* 119 */
  44964. { { 0xea7f1b7f,0xe262791f,0xdcff09d4,0x9c3d8c5d,0x39c7dc58,0x86c2a9c3,
  44965. 0x4276e8c0,0x4dad4017,0xe9fe1d56,0x0a918f59,0x2aa810c9,0xb8d79670,
  44966. 0x4aa5cdc4,0xeb7a8836,0xe7afa72e,0xfc4c23bb,0x4ac86908,0x4dbb5c9e,
  44967. 0x6a0c7e6f,0x37e39013,0x49c218d2,0x855d7001,0x94b324a2,0xe475bc67,
  44968. 0x6287a071,0xc98a8dc6,0x5fb4323c,0x395a299b,0x0c0389e9,0xe186c3ee,
  44969. 0x16734c46,0x79f81e6f },
  44970. { 0x364f3c4e,0x83f2c1f3,0x1367e14b,0x536b2ac5,0x5933e43d,0x44a6dcfc,
  44971. 0x10d961fe,0x34e59475,0x7e3f2aae,0x08234ece,0xbdea7f25,0xcb92e00a,
  44972. 0xa791a124,0x1efba4f0,0x1192d53a,0xc2086fd2,0xb51c8af6,0xfec0d0fc,
  44973. 0xdc0f1b5f,0x48d1b2ca,0x812dbe19,0xb07a388f,0xdedbdd45,0x40873a6a,
  44974. 0xd702589a,0xbc2a1268,0x17e27b64,0xbbf6e3a8,0x6d386e85,0x73ee5663,
  44975. 0x9de7c000,0x442ecd37 } },
  44976. /* 120 */
  44977. { { 0x8a2f90a6,0xb4cd1ae6,0x6f5ad0cc,0xf277d41d,0x401d4b8e,0x6a3828c4,
  44978. 0xd8376631,0xe817a134,0xf5e1124b,0x142b758d,0xfd6b95e4,0x25fbc69d,
  44979. 0xd74a9e3e,0xa30c9f5f,0xd89663ce,0x5ac0f163,0x0ce6386d,0x32a9eef7,
  44980. 0xd8ed5544,0x7a690ea5,0x9889427a,0x5de23ff0,0xeaaced58,0x75ad36a5,
  44981. 0xd3e18465,0x3514a6c1,0x7f093910,0x3d9162c3,0xe33d56e8,0x5c10add9,
  44982. 0x06aa691e,0x85176b73 },
  44983. { 0x28a21e38,0xa32110fa,0x5773d538,0x97b6379d,0x2d020dc4,0xd3697bbf,
  44984. 0x961833cd,0x59177593,0xe5fa8516,0x6d7045fa,0x786ab5d2,0x3390f29a,
  44985. 0xdc4f5b70,0xac0bda30,0xdcc615c6,0xcca0240a,0xc5146d91,0x8e1f1702,
  44986. 0xa72cef87,0xceb472d0,0x0b669ba1,0x84840708,0x7e61aa0a,0x79b08f9d,
  44987. 0x4669560b,0x388160be,0x948eb71e,0x23935c2d,0x9431590c,0xd7fd83c0,
  44988. 0x6e5768b3,0x8ab154bb } },
  44989. /* 121 */
  44990. { { 0x353c4a96,0x28686003,0x905cd835,0x4e5c60e8,0x8f66f8cc,0xbd591364,
  44991. 0x9faccf9e,0xb6b80b98,0xe32639e5,0xbc1c1fae,0x278aadeb,0x2f6396d2,
  44992. 0x1898202d,0x00a796d0,0x3a474835,0x18ab548f,0xb31b0e3e,0xacd056c3,
  44993. 0x0164512d,0x15ba68dd,0x4b03f3bc,0x203836d9,0xd8f206c5,0xd64eca6b,
  44994. 0x9f1779b6,0x931a361e,0x52ab34a8,0xd82690fc,0x92922e22,0x342bb8e0,
  44995. 0xe00b02a9,0x1bfcdd84 },
  44996. { 0x75a365d9,0x310b9a43,0x08d8fb03,0xd4ade15e,0xd742df83,0x9c9753d7,
  44997. 0xde318742,0xcf7309d4,0x3360ace0,0x1228e212,0xf7669643,0x1043d238,
  44998. 0xf90f5a53,0xfc2adbed,0x7b5f9397,0x41d64cb7,0xc446d010,0x5200b30a,
  44999. 0x231720fe,0xc3c8642d,0xb9aa2075,0xfcc0122d,0x041eae47,0x856e3b12,
  45000. 0x68c876a4,0x45864455,0x233606b1,0x1a1c7842,0x227757bf,0x9b766d1f,
  45001. 0xf7b9d4f1,0x25b78a3b } },
  45002. /* 122 */
  45003. { { 0x156707ce,0x90835718,0x4314f90a,0x9bdc2398,0x8be57dbd,0x017c885a,
  45004. 0xad63a4b8,0xd4bba225,0x15aacffd,0x5ce71b86,0x72954722,0x5f266475,
  45005. 0x4f0ad3dd,0x0a80f1f7,0xfc352ed7,0x010538a3,0x4203c6ca,0xf8a64045,
  45006. 0x330c73b4,0x2b2c7a88,0x02dcac1b,0xb3433ee6,0xed2b17c7,0x2e0499cf,
  45007. 0xbd6329c7,0x9f8681a4,0x36fadc37,0x38979946,0x92b7895b,0xdc5650c8,
  45008. 0x65a51cf0,0x70ab9570 },
  45009. { 0x7b585d93,0x46778ec4,0xa633fe4e,0xca6d3610,0x4ea0311a,0x21da154e,
  45010. 0xbd64002f,0xaf22190b,0xd91cb7a9,0x9e633ac7,0xee6837d7,0xed13c31f,
  45011. 0x1616ee8a,0xda4a07d7,0x3afcd616,0xd78a2732,0xba14d694,0xc06696e5,
  45012. 0x4df58420,0x733754d7,0x2778e3c9,0xe85e504e,0x55b5a5c2,0x3055aa0c,
  45013. 0x8a3acb5c,0x313df538,0x2a088eda,0x5896acb5,0x84c85dde,0xfc8842a0,
  45014. 0x51dde6be,0x5fec9f79 } },
  45015. /* 123 */
  45016. { { 0xfe519f99,0x5ebc2c7c,0xe5410353,0xe396bd80,0x8a3988f3,0xaded9402,
  45017. 0xd601bda1,0x1c03b735,0x14ce64ac,0xfd302036,0x01240290,0x5837ebe9,
  45018. 0xa554097d,0xcaaea1a3,0xb0b88139,0xdce73d25,0xecb090b9,0x35ed412b,
  45019. 0xd63dab3c,0x99029ff7,0x062db071,0x555437d9,0x42a4c11d,0x277d2f56,
  45020. 0x24fc9109,0x477fa645,0x2799254d,0x7b12e9b7,0xd84c618c,0x7ad2ae22,
  45021. 0xce8ed195,0x0a8d5663 },
  45022. { 0x0a21fde1,0x43ac5163,0x6903d849,0xcfcf5dd6,0x5fdd6281,0x6d2499ee,
  45023. 0x77a49a34,0x4dedc6f0,0x2875c06f,0x46bda2c0,0x347b8046,0xd0e0e0f6,
  45024. 0x5e67836f,0x1058169b,0xde8a8042,0xc961912a,0xa93b3d32,0xdf3fea0a,
  45025. 0x0c576bc5,0x9f138edb,0xd8d37e47,0x7971ad6e,0xcce5e7cb,0xeab85739,
  45026. 0x1d202b40,0x88a4b434,0xe3a1fd26,0x5d842557,0xb3a86f91,0x872fabd5,
  45027. 0x6aa4629f,0x95b93493 } },
  45028. /* 124 */
  45029. { { 0x99f951de,0x9998a701,0xf058db45,0x8fade596,0xf3d03dd3,0x4d479c1e,
  45030. 0x33b141d3,0x6e928d5d,0xacfe8a40,0x9a465800,0xc1cefa3d,0xd108ad2f,
  45031. 0xe013726e,0x64b96921,0x8e83bb9f,0xb9b6a6b6,0x1242e544,0x29f1e6dc,
  45032. 0x2f65966b,0xd3f8f676,0x5e105b41,0xa34dd096,0x16011e1c,0xd4e9139a,
  45033. 0x2515541b,0xeea4dc68,0xc822166d,0x6f8030ac,0x31d16124,0xbdc7ae1d,
  45034. 0x621afa7d,0x2e25ef51 },
  45035. { 0xdd8e7357,0x2533cf8f,0xeaceddb8,0x333ba218,0x0784d2ac,0x68e3e31d,
  45036. 0xf2804ae2,0x1c927f36,0x77e7ad7e,0x01433d22,0x587f78a0,0x0b401cf0,
  45037. 0xaa0027ae,0x9dfcf036,0x1d9a46b5,0xc9e46c8b,0x1f288d32,0xaa6de486,
  45038. 0x1b8a043d,0xdd56da2f,0xf2d0bb56,0x346230e5,0x19defb56,0x19f0b6e4,
  45039. 0x21d2c874,0x55ec37cd,0xb70e45b3,0x3dbf0397,0xac7ce852,0xf0862a8d,
  45040. 0xe141f3d6,0x87979ea7 } },
  45041. /* 125 */
  45042. { { 0x7f1c747f,0x9b7e7b3f,0xc6e63369,0x151a4c1d,0xb372dba0,0x4273ff70,
  45043. 0xd3ee54fe,0xca6d2234,0xd33cae0f,0x12fc8e0c,0x5dd6f10c,0x27328538,
  45044. 0xf01a9cf9,0xc86f3fbd,0xe36cae91,0x5322677f,0x2fefea44,0x39a70033,
  45045. 0xce8af217,0x2c9ca328,0xf6a731f4,0xc0256776,0x66a96813,0xc687b3df,
  45046. 0x8db2eda8,0x194aab12,0xeec4febd,0xde30dc5a,0x979241b2,0xc052236a,
  45047. 0xc23d4c16,0x3ec98802 },
  45048. { 0x4072f74d,0x0f9e760c,0xab594059,0xe78eb0de,0xc9b009c2,0xdb3dea40,
  45049. 0x38b59ae5,0x47e875f0,0x2b4daa06,0xf40eb436,0x090f3788,0x9a6a4f92,
  45050. 0xedbfaf8b,0xefebe9af,0x9867e256,0xf87f96a5,0x75ab6aeb,0x1e6fed23,
  45051. 0x3fdb13cb,0x17f2782a,0x70fa2621,0x5102c71e,0xfd4c0dbe,0x5d2b06ec,
  45052. 0x30347297,0x537cc268,0x2b67e780,0x8dbf5e2b,0xba25da32,0x2f633f3a,
  45053. 0xefaec914,0x3e9315e8 } },
  45054. /* 126 */
  45055. { { 0x239a9ea9,0x9255cfa5,0x0be33a62,0x20f3c690,0x9cb642bd,0x759eeb4b,
  45056. 0x00bae718,0x3316c546,0xf3410f84,0x874a76d5,0x90f129b6,0x123b502e,
  45057. 0x12851f1c,0xadc8f9a8,0x1b62408c,0xf57b764a,0x1a80777b,0x116ec01f,
  45058. 0x1f0ddc5c,0x746ecef2,0xe5a6a5a7,0x3c49d47c,0x06e955ba,0x1e15dbe7,
  45059. 0xb45d79b0,0x629c0c79,0x778d1087,0x11278308,0x8c6a22d7,0x22585dc7,
  45060. 0x0a682791,0x2ed02a0d },
  45061. { 0x4daa2682,0x53043416,0x01359625,0x0e26d32b,0xbd867097,0x449c834a,
  45062. 0xee77ae2e,0x11a19d2b,0x3af6c169,0x39bd529a,0x5cd61054,0x36cca5c0,
  45063. 0xdc6c0fe1,0x6370a59b,0xb93d5135,0xca420d27,0x554c451a,0xd8730d45,
  45064. 0x96cdebf2,0xebd258c9,0xa50f9a05,0x0cb1b990,0x7b0f0151,0x69a8c97a,
  45065. 0x11d217e1,0x2cc36d34,0x752f75e8,0xf117688a,0xa09b2a61,0x1db01394,
  45066. 0xa9efd7dd,0x14627844 } },
  45067. /* 127 */
  45068. { { 0x232803cf,0x6bca3aed,0x9a96ff34,0xc1e4398b,0x74ab788b,0xcaf6757f,
  45069. 0x7e68c04d,0xc3a53e00,0x5cb7cd20,0x5f969c19,0xdc068bca,0xf28b65a6,
  45070. 0x1d863032,0xe3ca01d3,0x87808e14,0x9b733b81,0xefe618be,0xb5d704d9,
  45071. 0xb01b946d,0x276f3542,0xfbedddbf,0xe057e19e,0x903275ce,0x7d182f2b,
  45072. 0x880f7bc6,0x3cdc5f77,0x78476c14,0xd6f03d3f,0xa9ba5072,0x035f5557,
  45073. 0xb4029628,0x7acb57b6 },
  45074. { 0x44e6b07c,0xd2413569,0xe1c7345d,0x451c4cc9,0xe273b9fb,0x407444d8,
  45075. 0xb88e34fc,0xfe496079,0xf152776d,0x77d184cf,0xc742299c,0x6d1033b9,
  45076. 0x77bf2897,0x29a0a684,0xee8f0420,0x59ffdf10,0x44bb56d6,0x4e17146c,
  45077. 0xfb9ae855,0x831d06c2,0xd93e7cd5,0xb2cb82db,0x3c96b607,0x83381c46,
  45078. 0x7549e2a8,0x06aed251,0x774a21d4,0xef97891c,0x8675fbdd,0xae9807c7,
  45079. 0x6363516c,0x6a5a05b9 } },
  45080. /* 128 */
  45081. { { 0x6a8f4f33,0x92e71ea6,0x4dea8f4a,0xf2fc6fc6,0xfee88461,0xd356252c,
  45082. 0x08954d08,0x59b0a83e,0x468ab766,0x5bd68c23,0x900f8d04,0x40281357,
  45083. 0x52b867ae,0x181c19c0,0x18764c41,0x986a5169,0x13575d24,0xcb01dfae,
  45084. 0x593677b7,0x17269ae5,0x46dc9b19,0xf6d17025,0xc40097c8,0x8de68499,
  45085. 0x259c407b,0x76df0032,0x17d29d8b,0x4091aad9,0x4a7ab5f6,0xa7f46d21,
  45086. 0x70ece48c,0x688054b4 },
  45087. { 0x51a5b86c,0xf0d168aa,0x95777247,0x2437e4d8,0xf1720329,0xae844076,
  45088. 0x9647a54e,0x0a7ac87d,0x0405622c,0x1e597a4b,0xf0a79f2f,0xedefe5c6,
  45089. 0x4d55156d,0xaf3ef0c2,0xef047cf6,0x917fb04e,0x54b62137,0x3792799f,
  45090. 0x314be0b8,0x875ea32f,0x0c466b0c,0xe157c65b,0x7e218978,0xd28c90ce,
  45091. 0xcde587af,0xb90fc3ba,0x8b877bed,0xdd32d71c,0xca8e10cd,0x3b432200,
  45092. 0xd94f6e53,0x0021f419 } },
  45093. /* 129 */
  45094. { { 0x43519d26,0x2191122c,0x40a51845,0xbdafac1d,0x548bb89f,0xcc6f71e9,
  45095. 0x16844bf9,0x9ef3375c,0x178e8d55,0xe7789f79,0x1f8be1c5,0x04f599b6,
  45096. 0x2cbbde40,0x8088c99a,0x893206c9,0x8939a260,0xfcd30851,0xa1ae4bff,
  45097. 0xe08feafe,0x664cb3fe,0xff14aabc,0x61f38099,0x2a841ef9,0x0d8394cc,
  45098. 0x17f01db6,0x75fad8ad,0x6debb773,0x6fc34576,0xa4252512,0x1e716b05,
  45099. 0x29e1ed9f,0x79855880 },
  45100. { 0x95106473,0xa2cb3aaa,0x5a61da04,0x95fafa41,0x539563c0,0xfd3c9362,
  45101. 0x95312b87,0xbaa48091,0xbf885c76,0x6c7e7582,0x230c78d5,0x70f6dab6,
  45102. 0x7747440d,0x8ce3051c,0xffdb6186,0x6dbebd14,0x190e4096,0xb0e041fa,
  45103. 0x6ee62e2a,0xba10c466,0x74f333d6,0x93d57e2a,0xfe7b9b66,0x006aadc4,
  45104. 0x06d2837d,0xfaf72f6c,0x910741ea,0x318cc5e6,0x65692477,0x9c502609,
  45105. 0x1d0fb08d,0x95d823c3 } },
  45106. /* 130 */
  45107. { { 0x140528a5,0x6aeebd86,0x53979bc8,0xf268c2ba,0x4ec144ab,0xb1bc9b8a,
  45108. 0x82a7d7ed,0x1efabb0d,0x4e0118d8,0xf12c70d1,0xa1c1558e,0x31607168,
  45109. 0xe4b7e73e,0x33e428b7,0x83aec9dd,0x63176637,0xe12ac35c,0x5172ffbe,
  45110. 0xbc17b2a4,0x37df0bfb,0x741f812a,0x4212f870,0xe2888f9c,0x3dcecbdb,
  45111. 0x756ca55d,0xa9dc15aa,0xb9028e41,0xf31918ec,0x6aeadb03,0x7ede0285,
  45112. 0x78654f54,0x0e2708d5 },
  45113. { 0xcde20f88,0x2270cc53,0x5f5b1039,0x9338272c,0x5dcb1dbf,0x5042e19e,
  45114. 0xb72d74c1,0x4b3de219,0x2aaaaa55,0x16c49a8b,0xbba86ba6,0x008443e5,
  45115. 0x20cf1695,0xee6bcd72,0xa89abd11,0x59ffac6b,0xf115639d,0x2831217b,
  45116. 0xf34cba52,0xe4d28af2,0x0727a906,0xf27f03e7,0x69017766,0x6842c79f,
  45117. 0x7a81123e,0xcb3469bd,0xa42973b8,0x48c0f346,0x23990dbd,0xfc5784a6,
  45118. 0xfb299678,0x0d3dab3b } },
  45119. /* 131 */
  45120. { { 0xce29c3cc,0x8f8376e6,0xf016cbc6,0xcb0507ec,0x5e394ce1,0xdebff996,
  45121. 0x73c50d41,0x24fc526f,0x2d16ce3d,0x4edd5a54,0x91c13141,0xbb37bdd9,
  45122. 0xe33a8606,0xe3442ef2,0xc0629da8,0x2ae90337,0x592ab331,0x57faec64,
  45123. 0xd82b857b,0x1a938997,0xa3373176,0xad6c8cb9,0x9086751f,0x82595de2,
  45124. 0x18c17196,0xa81e97fb,0xbf697357,0xe4f48a13,0x5cb89f69,0xa1387c2e,
  45125. 0x5874b426,0x530b4eeb },
  45126. { 0xbab7b5ae,0xe9f275a1,0x03a57bf4,0xbb69dc4d,0xa45c505b,0xc974dc4a,
  45127. 0x416ac402,0x726369f3,0xaed985dc,0x735e4e78,0xcdd446a1,0x0548d879,
  45128. 0x9e16b02a,0x84ceb069,0x789b11a6,0xf73f6fa4,0xb2a4e784,0x6aa0c41f,
  45129. 0x93a9b697,0xb1f76902,0xf03a8ab2,0x814cce00,0x844d66c1,0x64cb255b,
  45130. 0x30952201,0xb794e7d6,0x3da32271,0xe052d4e4,0x08b6a4d9,0x5278b2e7,
  45131. 0x80c6577f,0x90942552 } },
  45132. /* 132 */
  45133. { { 0x0d5b4c2f,0xd269a14d,0x5c8a649c,0x2b8fc59b,0xb0e37d4a,0x95becb3a,
  45134. 0x9111037e,0xfda1a768,0x94e35322,0x5810e05a,0xa178fafc,0xa24dcc12,
  45135. 0x8e3dce62,0x5c2c63b2,0x9452c444,0x995c3f17,0x42d45161,0x35330ec3,
  45136. 0xb4ef8129,0xa025a60a,0x8bae9c13,0x85493252,0xe2e3caf8,0x25d1a606,
  45137. 0x3649bf47,0xd44091ab,0x704ec5f1,0xc7d0afbf,0xbd8b3333,0x27bd1d62,
  45138. 0xcfe616f5,0x50570111 },
  45139. { 0xf534356b,0xd0084ace,0x4b4b0fbc,0x9df1de05,0xcee04dc1,0x021afe05,
  45140. 0x361b78e1,0x64bde688,0xef78d38b,0xa324fcc7,0xeb0a5e4e,0xfeb372ce,
  45141. 0x65811996,0xef04fcb3,0x5eb0ab4e,0x7dce5d50,0x238c586e,0x1e29b588,
  45142. 0xbcd80037,0xde5e3197,0x4806b9cf,0x8bf5e451,0xd18e67ab,0x4330968b,
  45143. 0xf9f63fad,0x26a7d04e,0xb5c18bb4,0xa1c7f123,0x25dce22c,0x485b8482,
  45144. 0xd540e79f,0x8ff0b36f } },
  45145. /* 133 */
  45146. { { 0x3ff42cff,0x99f2e2f4,0x1c35317c,0xa3c19f9d,0xaba1b545,0xdb749392,
  45147. 0x4afa9a32,0x84232b05,0xd7dcd436,0x0b855d46,0x45cf9915,0x8ac35e20,
  45148. 0xf001a218,0xd7cf22c7,0xed408305,0x057d35ae,0x553ccfcd,0x25a4a519,
  45149. 0x93e2b939,0x5e565793,0x3422ec27,0xa20332b0,0x3ac53958,0x9b09005e,
  45150. 0x79e9b163,0x628051a3,0xfc6618d6,0xb4a0dc09,0x6748e7af,0x9e0e857f,
  45151. 0xc577d63e,0x71b28eee },
  45152. { 0x99726bf8,0x4942b0cd,0x1c208f3c,0x1290a3b9,0xb0598eaa,0xfd7290e7,
  45153. 0xa25a9128,0xc6a7791f,0xc037d7da,0x2d33db24,0x70e2837b,0xc21efeb0,
  45154. 0xe3dae2a0,0xbf70d96e,0x85076027,0x43ed8191,0x4d4ad7e3,0x4aeb0aa8,
  45155. 0xe8c5b74c,0xbc75101f,0xad26ebdd,0xdbfb2a6e,0x6b78aa4e,0xba812068,
  45156. 0xe1159848,0xc94aa8f2,0x3eba5c4e,0x0d10d9db,0x6318295a,0xce7fec47,
  45157. 0x330d925a,0x7294711a } },
  45158. /* 134 */
  45159. { { 0x32bbd495,0xfce45904,0xbe54973f,0x330f4dd1,0x5d9c3f4e,0x006bee1d,
  45160. 0x59ba7204,0x40ee6078,0x42c2c768,0xc194fd3f,0xe9fe88be,0xa0e76b12,
  45161. 0xec2b0210,0x17cddddb,0x00811ec7,0x689d436b,0x284be9e4,0xa6a6ba37,
  45162. 0x007d4114,0xabc395b2,0x0f11e744,0xf8cdf9f3,0xe9396402,0xc5febec8,
  45163. 0xeeb46285,0x8a751743,0xc6e0d137,0x99bf8782,0xbeb292e3,0x3965e170,
  45164. 0x5801fd5f,0x001c39d8 },
  45165. { 0xda4a0912,0xf4805cb9,0x4410bca4,0xd27cb76a,0xec71d65b,0xef3dcb8e,
  45166. 0x4816849a,0x780fbb2b,0xa8b24635,0xef6a7026,0x12c44e68,0x15625c88,
  45167. 0x4d7a74a8,0x624c232c,0x4b1631e4,0x81a77037,0xdb917c2e,0x04e4f7f1,
  45168. 0x1f61ed95,0x1d0465fd,0xcbde6e3d,0xb1048049,0xd7131fcf,0x637ce0c1,
  45169. 0x8ada4715,0x22e4dbc2,0xace99726,0xf7530c5c,0xee287450,0xa0160dcc,
  45170. 0xbb91af13,0x9132e670 } },
  45171. /* 135 */
  45172. { { 0x7996099d,0x8057efe2,0xa06e608c,0xb72344db,0xd0958588,0xeb4a8740,
  45173. 0x79e5aee9,0xe53daf06,0x908a2fad,0xc9560a9a,0x107e706a,0x7f4be131,
  45174. 0x2830246a,0x6d5f3d9b,0x27cca3e6,0xa5f8e8da,0x4c28f292,0xeb51dca6,
  45175. 0xf31dfd78,0x4cfa310e,0x2ca073e5,0x92e0c7c2,0xa40da683,0x102f1694,
  45176. 0x750d38fc,0x16bb07cc,0xbadae035,0x703e83e2,0xb4d3c9dd,0xea93c066,
  45177. 0x79940ed1,0x7d0b03e5 },
  45178. { 0x4dd94c63,0x5fe7ea30,0x738b0b3a,0x57ef01c5,0xa14e6b4b,0x9534a78c,
  45179. 0xa5353276,0x07622cde,0x7c22d006,0xaf696a07,0x7d46b209,0x733c1886,
  45180. 0x626c2b4a,0x9654ccbb,0xa84f3c4c,0xa098d3a1,0x2d734b74,0x3596f9ed,
  45181. 0x5d551c90,0xdfd3021a,0x1ec5123f,0xe2ba7d2f,0xb2c1aa39,0xf9726925,
  45182. 0xf8eb2927,0xd2e75d0e,0x19192a6f,0xfaba712e,0x9b83e50e,0xa606b43a,
  45183. 0xdab5de60,0x31b1782f } },
  45184. /* 136 */
  45185. { { 0x4034db92,0x878dba45,0x8f34dc4d,0xa3977901,0xdf754c33,0x8d004f2e,
  45186. 0xcd563a88,0xeaa5954a,0xbb5ffad1,0xa29d6c89,0xb0d8bdb8,0xa8adf655,
  45187. 0x8cdbdb47,0xf7fb842d,0x80d3205b,0xb72e3a03,0x7cac7ca9,0xc335b0b2,
  45188. 0xd8a5475d,0xffc60bcb,0xeba4d25f,0x736f7719,0x0c50fca6,0x3d901c38,
  45189. 0x80c01900,0x1fdacf7b,0x5681f84d,0x75cf658f,0x5cefbbc1,0x57a7e634,
  45190. 0x3e07ed1f,0x6fc0fbe5 },
  45191. { 0xb81b0e5f,0x496d116b,0x2ac853b8,0xd82dd2a5,0x327387f0,0x357e22d4,
  45192. 0xba912c59,0x3e332a84,0x49d5dcc1,0x8b71c643,0x438d85d3,0x0c982ee9,
  45193. 0xbf7fcd4e,0x90b9553c,0x38fed5e3,0x2cb39bbc,0x5ac42903,0xa2c67c9c,
  45194. 0xbf07da55,0xebf21217,0xa0b9e4ee,0x55ac05ad,0x8ee9e0c6,0x10bb12c2,
  45195. 0x48bb6e3f,0x5cf3aee5,0x8b046e91,0x4ae7269c,0xaa0e553f,0xcb266012,
  45196. 0xa94c8fc8,0x701935a1 } },
  45197. /* 137 */
  45198. { { 0xa4626dea,0xde58d41d,0x15b9039f,0x25ef66ca,0x3164e65b,0x99a810a4,
  45199. 0x748cfccf,0x9fe6daad,0x2f142fa9,0x7ab9a6bd,0x5d471796,0xa4cba168,
  45200. 0x6bc3a39b,0x12d30b36,0x8bf45076,0x1f46a5dc,0x1421ac0e,0xb868e529,
  45201. 0x59bba1c4,0x7a686206,0xda698b90,0x2b4b552e,0xe5453707,0x5039dcd4,
  45202. 0x9e90165f,0x42a07a9e,0xd7d45dfc,0xa838fff3,0x3b5ceb30,0x41991e5a,
  45203. 0x969ca600,0x6c961ec8 },
  45204. { 0xc4e7eb46,0x703bdc1b,0x596c7b48,0xd6bac557,0x66afd74d,0x4f9917cd,
  45205. 0x656ce6f3,0x56355105,0x32497175,0x3d1fb50c,0x63effb2d,0xfda6783e,
  45206. 0xeefaa2bd,0xbd79f1f3,0x17af9ef7,0xa4efbe54,0x5a55b7a4,0x6cef6462,
  45207. 0x1a713304,0x116f3238,0xb95625a3,0xdb2a2a7f,0x0b027e96,0x6a0aa43a,
  45208. 0x4832b3bc,0x458fe5d2,0x5adfaac0,0x523418df,0xc49e7f9a,0xc05a89cb,
  45209. 0x69e24b53,0x830883d8 } },
  45210. /* 138 */
  45211. { { 0x02557389,0x959b1c62,0xadefc0bc,0x5fe5ce97,0x8330f383,0x893bbe7f,
  45212. 0x16cfb81e,0x27e0c6af,0xd04428fd,0x6f64e65b,0xb79e6182,0x53de9245,
  45213. 0x487e11ca,0x08a313c1,0x445bce93,0x65cec3b9,0xd67ed49e,0x33bc0314,
  45214. 0x30782352,0x69f36b24,0x93ad31d2,0xd78e5daf,0xc780890c,0xf2682b70,
  45215. 0x9e45efe9,0x7015c34f,0xe6cbafea,0x135d4ba4,0x7e3fcc6c,0x43a378a4,
  45216. 0x96638f8c,0x2376f97f },
  45217. { 0xae575b99,0x0a6e1ec0,0x81b970dc,0x7e14cb4f,0xd3a73947,0xf00a3824,
  45218. 0xfb235a9d,0x0b4b9c81,0x5bf62944,0x8d15115f,0x1e165d7a,0xcfd35b43,
  45219. 0xb2ee3e3b,0x5d12fea2,0xf5182e7b,0x629984a6,0xc365d08e,0x4e43e2f3,
  45220. 0x30f36e72,0x99327091,0xfd345401,0x698b4a00,0xbaf96dce,0x23c4fd0e,
  45221. 0x23675554,0xa60ba0ae,0xb0325784,0x51bdac2d,0x215464a1,0x8ab4190a,
  45222. 0x6bf10296,0x8c461661 } },
  45223. /* 139 */
  45224. { { 0x2d1f36a5,0xeffca258,0x894c5f2d,0x0eded2b2,0x43ced84f,0x35a5cdb8,
  45225. 0xdb0e3b9b,0x290f8982,0x0719a112,0xcce0eaf0,0x39a362d6,0xd0e657e4,
  45226. 0x62697e47,0x5516a55d,0x8e636514,0x269e1f77,0xd50269bc,0x5e3dedcb,
  45227. 0x441c57c5,0xecec2300,0xc705578d,0xdb83f31c,0x1e489eab,0x1bdefb73,
  45228. 0x395fcdb4,0x20b678cf,0xff9db001,0x908cf91c,0x55f52cc8,0xcbebc6f4,
  45229. 0xb4c61162,0x155ea622 },
  45230. { 0x876fa42e,0x94be2f1f,0x7fadeee7,0xab5e8749,0x38c865af,0x692e70f5,
  45231. 0xdf8059b0,0x16e99b84,0x8b5a7ac9,0x0ceb606e,0x2d463d2b,0xced23357,
  45232. 0x2a9a09a0,0x2d0f2623,0x3861fbdf,0x2529998c,0xc1be310b,0x711888a7,
  45233. 0x0d8aade3,0x9b1229c5,0x3b13533d,0xdbcf9b78,0xff029708,0x3ca746f8,
  45234. 0xda83ef88,0xa5a013a1,0x4ab28444,0x8e904d18,0xbcbd4aba,0x2fe84b3d,
  45235. 0x259058c3,0x8f570f24 } },
  45236. /* 140 */
  45237. { { 0x2ca9c508,0xdeb66c8a,0x69d6b780,0x2dc5bec2,0x88ead600,0x16d61266,
  45238. 0x49d72614,0x61841b97,0xce472e6f,0x41e40e6c,0x1fa7a876,0xada24264,
  45239. 0xcc3997a0,0x45b9fd33,0x7c15dcf4,0xb25e8fa9,0x12e9629d,0x0124ceb2,
  45240. 0x7db3d956,0x3a8c72c6,0x7c1a7844,0x8e2ded2b,0x6dd027ff,0x94ab09c6,
  45241. 0x7e7a2bc6,0xf89a057d,0xcf70c763,0xad8bf226,0xc8a26212,0x4cb268e7,
  45242. 0xb2c44c1d,0x3d171e87 },
  45243. { 0x8ce49820,0x382ac16e,0xc0c44dc9,0x24ee45e2,0x73e858c4,0x0ec67912,
  45244. 0x46327cf9,0x918cb25c,0xc6159c1f,0x43e3876b,0x37545cb3,0xb6b6e0e0,
  45245. 0x5d12347e,0x64b839ab,0xa300d541,0x72e09274,0x881c1169,0x26ab28e6,
  45246. 0xeb75a843,0x4a580fff,0x359120df,0x0a5802ca,0x3209f4a3,0x7fee82d0,
  45247. 0x8e6a9380,0xb518016b,0xc2ee11ca,0xb99c6c70,0xab9d4ec7,0x16105af1,
  45248. 0x34cd9004,0x234e98f8 } },
  45249. /* 141 */
  45250. { { 0x14db9cda,0xff435208,0x96adec90,0x99cfdc47,0xaf458b6d,0x843aaa6f,
  45251. 0x743eaa31,0x3f1f7415,0x61735d81,0x915e192e,0x0ac595d5,0x3441a22d,
  45252. 0xc044bc8d,0x704bbf67,0xbe23a236,0x2f960471,0x15d1d557,0xcc326388,
  45253. 0x76b1dd94,0x9410230b,0x0c1c8a67,0xf2e5439f,0x833c910d,0x56b141ac,
  45254. 0x865b84df,0x467c999f,0x21f02b7b,0x1b0251fa,0x96216950,0xde5b5260,
  45255. 0xce3a1e93,0x6a2130e3 },
  45256. { 0x4b3ca1a7,0xd21b67a0,0x00c0ce80,0xaf42ed53,0x932cf07a,0x22ccd368,
  45257. 0x5c25c35a,0x36523a81,0x8dd04d06,0xecdd3958,0xb2f93a3b,0x73da3502,
  45258. 0xd5e5b530,0x4c5e0c3c,0x13268777,0xef9f5486,0x1e742292,0xed87fefc,
  45259. 0xa24e5ede,0x6d9ac29e,0x33849f1a,0x08abc9f0,0x40f23905,0xb09b2292,
  45260. 0x7f934353,0x6791072c,0xe6aeb550,0x102a6381,0x96feb870,0x3ee07409,
  45261. 0x9c4d2830,0x34f06faa } },
  45262. /* 142 */
  45263. { { 0x2348f005,0x869dc79f,0xdf4920b1,0x9b5c5d71,0x6dee64a4,0xfd1b57ca,
  45264. 0xe82a4fb4,0x21b7f734,0xb9578366,0x637cb834,0x7d287d96,0xc934101b,
  45265. 0x0392ecab,0x1590f8ac,0x7f75f4e3,0x280dc373,0x6a61ac62,0x8b36f50f,
  45266. 0xa65568da,0x74f58304,0xd930870a,0x80d792a9,0xfc8895cc,0x6d17b192,
  45267. 0x4914939f,0x498392fa,0xd41d5b9e,0xaf36027d,0x5caa82b5,0x452d79e2,
  45268. 0xf4115d1a,0x764d47b1 },
  45269. { 0xa2ee8b9c,0x5df22303,0x85dfcd48,0x1b9f72d3,0x10813a37,0x6b42b983,
  45270. 0x3de741f5,0xe28c523b,0xf303bb5b,0x0857625a,0xac9bf9af,0x926f299a,
  45271. 0x0d445b34,0x21beac08,0xd6ba2c0e,0x6a523a02,0x7fce2864,0xe302a1b1,
  45272. 0xe300c1ea,0x4516a235,0x7b4a9311,0x4543736a,0xc0cc89f7,0xd3c0b9e8,
  45273. 0x40ed88de,0x0481904f,0x3cb7fc70,0x4f269b56,0x321b9738,0x09a1d53a,
  45274. 0x230a3810,0x1c0dd9c3 } },
  45275. /* 143 */
  45276. { { 0xc46a7d9a,0xffaa1f67,0xbedf91cc,0x64743334,0x47a42f2e,0x45833a74,
  45277. 0x241ffaa9,0x67980051,0x335efe6b,0x70979a84,0xf08b2403,0x5f0613f5,
  45278. 0x64f211dc,0x6bb22fcd,0xa0572cfc,0xe1b8b2a3,0x7950a14a,0x19e0eb41,
  45279. 0x3eb6cd4c,0xe634bb29,0x470a25ff,0x31a04b25,0xa3d15a0a,0xa41f7ac9,
  45280. 0xbf2fede9,0xefed85ec,0x81b94a00,0x1f581f5f,0x9ef4a15c,0xaa3996b0,
  45281. 0xb06041bc,0x52d8be39 },
  45282. { 0xfd631a2f,0xbd1536f6,0xb351a8dc,0x91fae7f0,0x9b126212,0xd1a590c7,
  45283. 0x2bd0f435,0x52d4875f,0x92b0ea70,0x9aedb6d3,0xb83ab89e,0x0bd0abdc,
  45284. 0x89fe192c,0x827a1062,0x102a0bda,0x6566a960,0xce036814,0xda083037,
  45285. 0x58639405,0x30bed79f,0xdbca8df9,0x972019b6,0xefdaa3f5,0x89201286,
  45286. 0x5236b892,0xb337b996,0x28fc2e73,0x11d3e38e,0x880e8da3,0x70787f41,
  45287. 0xdae4a45d,0x6cff6367 } },
  45288. /* 144 */
  45289. { { 0xf89a8bb4,0xbd3d0433,0x93b98f71,0x42144c33,0x03470a2d,0x82b616c8,
  45290. 0xe5da089e,0x98fcc757,0x7bf5fda6,0x542354ef,0x9ebd34cc,0x1885c253,
  45291. 0xbec5dd0d,0x2e20b285,0x782a1bca,0xe71bbbe1,0x9b854ef0,0x959ded30,
  45292. 0x8997fa6a,0x17249979,0xd81f3c45,0x50cf8fa8,0x60c11152,0xa9a3b517,
  45293. 0xecf845ea,0xc9b0ef7d,0xb9fed11b,0xc9339e23,0x28256080,0xc93e9c5c,
  45294. 0x613ec1e7,0x1d2c8217 },
  45295. { 0x987cfc93,0x7381347d,0xf187f810,0x047603bb,0x1250ca31,0x3fa6bc9d,
  45296. 0xbb055bf3,0x480091e0,0x3a3af87c,0xbdf95f1a,0x140540ab,0xe2687770,
  45297. 0xd7fe045b,0x998df730,0xb723bc2d,0xb398135f,0x15ebec46,0xac230f8c,
  45298. 0x5f5561c0,0xe08e1830,0xda60a47f,0x7c0fbf4c,0xe16d4bfc,0x06e95c24,
  45299. 0x74617e92,0x74163495,0x4ae0c20e,0x39719869,0x2131e2b6,0xfe269312,
  45300. 0x0a537722,0x25486e36 } },
  45301. /* 145 */
  45302. { { 0x53572806,0x618795ca,0x656968e1,0xb2c89449,0x3fb323ae,0x149c2c97,
  45303. 0x409bc7d6,0xfb15de26,0xc79121b3,0xa90cda72,0x204cabbb,0x6d2fa14e,
  45304. 0x91604125,0xcbcda6f7,0xb435f947,0x25086261,0xc282eb10,0xdb686c38,
  45305. 0xf1a791cb,0x51016d62,0x61a2266c,0x6b1c7ed1,0x271d74a6,0x26780666,
  45306. 0x824287a4,0xb5ffeda1,0xbbe4f0f3,0xcbe503ff,0xb9482a74,0xd7f7f0be,
  45307. 0x088493f1,0x751b2358 },
  45308. { 0xe9c9be68,0xd597b9d6,0x67d10c6c,0x1794b5c4,0x7762b2f4,0xa88cdc3d,
  45309. 0xa1b44e11,0x6d94a63a,0xaaa8eca8,0xfb0bbbb9,0xc963d87f,0xf4b0f2d0,
  45310. 0x5dc7075d,0xb753062c,0x49933989,0xfed726ac,0x57f9ccde,0x5da60638,
  45311. 0x75f8c766,0x221c392a,0x5dc672ca,0xcd264d95,0xb66ecc8d,0x7004ff22,
  45312. 0x18a458ba,0xfb1aa9ae,0x8babd653,0xea9644df,0x2ba0de7c,0xa9378e80,
  45313. 0xca2c6c75,0x144cc12d } },
  45314. /* 146 */
  45315. { { 0x2989aa3a,0x593a0a1d,0x59e6e64d,0xd83f2283,0xd32e732e,0xe938b0cb,
  45316. 0x3c3cb249,0xf4c464c5,0xf89ea6ac,0x9750a5f8,0x346cfc32,0x467e5bbf,
  45317. 0x37b2b809,0xc9bfab9d,0x3b339c6d,0xf8eb7453,0x3b766dee,0x3fe01fbe,
  45318. 0xef6aea27,0xb3154254,0x7be61b10,0x555c3df2,0xdd818488,0x70fb6d81,
  45319. 0xbbe714f9,0xda1af3a4,0x9d18f693,0x575f2017,0x2465b839,0xdc08fc6b,
  45320. 0x6b84a951,0x874ecf33 },
  45321. { 0xbbb3f6be,0x624af83e,0x08bb423d,0xf578fbb9,0xd7873527,0x5623b0ba,
  45322. 0xa62e0442,0xc3659bd8,0xfe236f79,0x2903b167,0xe53f26a6,0x55a430c6,
  45323. 0x3ad712cf,0x222547ae,0x76eb272b,0xb73890d7,0x3d628df9,0x95b4f70b,
  45324. 0x53eae4ac,0x9f0e13b0,0xe7f2174e,0x5b4f5138,0x98dbae17,0x75482cf9,
  45325. 0x44518480,0x2b69bbde,0xcafef15c,0x4f279652,0xb6bcaf19,0xa0a3ef2b,
  45326. 0xce4c634f,0x31fb8581 } },
  45327. /* 147 */
  45328. { { 0x615cd607,0x398306d1,0xaa32c3a6,0x680c9faa,0x7779131d,0xe87a705b,
  45329. 0x36708b00,0x1031013a,0x9445297f,0x814fa0e1,0xa6a79b56,0x70c5583a,
  45330. 0x4b16bed4,0x03039cbf,0xaaaaf8d3,0x18a7ca8d,0x5cdb68a5,0xf33159e7,
  45331. 0xd23814fa,0xdea0e738,0x8d0f4f9f,0xeb352718,0xdcdff032,0xb0b76609,
  45332. 0x3d48338b,0x65ba8ea9,0x55dd507a,0x18044d82,0x4a4a50b4,0x844a223e,
  45333. 0x18e19e54,0x98323000 },
  45334. { 0x57f3d5a6,0x28a21027,0x6e8cadcd,0xffce5648,0x02551f3b,0x9590381b,
  45335. 0x935ebdf1,0xb26cc64f,0xc083aa6e,0x60611291,0x88e4cf41,0xcd988a66,
  45336. 0xdd53b1b5,0x581c3f73,0x77fc621d,0x78c804a9,0xfadca2fa,0x31874330,
  45337. 0xc83ccf02,0xf7008da4,0xa79a4707,0xc4122a1d,0x4a915eb5,0x9a8e0d3f,
  45338. 0xd0123660,0xa2de157d,0x65ead2a0,0x45ef43b2,0x188db285,0xd0a22ade,
  45339. 0x922e0caa,0x8abbe39e } },
  45340. /* 148 */
  45341. { { 0x3a2d2f01,0xb4446905,0x5dc6685c,0xd27c3193,0x1d74a027,0x6a908bbf,
  45342. 0x5b50ec1d,0x01da350f,0x3f3c2e26,0x1d3dd45e,0xb836ee92,0xf66e11d0,
  45343. 0x474b979c,0x7e03908f,0x98b87834,0x19e7c5b9,0xbd3d1de9,0xa741d3fe,
  45344. 0x1ef6059b,0x63c68e8d,0x3674e247,0x9b9ff939,0x3e7e67f6,0x1d7d53e7,
  45345. 0xaee9e248,0x698dc326,0xb3bd984c,0x52f23eda,0x6f8fe8a7,0xf95e31b0,
  45346. 0xc3d0ba95,0x0f15b4d0 },
  45347. { 0x790a8d85,0x8f2f6635,0xe2595af1,0x51bffbae,0x24b51287,0xd15b7ec6,
  45348. 0x3234715d,0x7639b6ab,0x2bc5441d,0x0cdd5299,0xf6d05833,0x54800ea4,
  45349. 0xf6d6e360,0x21efd752,0x19290613,0xc0b7ffe5,0xeea898cd,0xb68a5825,
  45350. 0x22982266,0xecedba92,0xbbd06bb2,0x678a91b0,0x4bb6b0cb,0xb2436dc0,
  45351. 0xcaf8ea98,0xcf7a99e7,0x71aa05bb,0xb92d0e6e,0xf5993eb1,0xbf8d0471,
  45352. 0x20385ddb,0x515db378 } },
  45353. /* 149 */
  45354. { { 0x6f5bef22,0xee43eaaa,0x20348712,0x952d2698,0x7a3af6c6,0x1e4c484e,
  45355. 0x9a8c9403,0x18d434c6,0x5001899a,0x63e5d741,0xfe8ea40c,0x5238dbbc,
  45356. 0x96798721,0xca6cc8d2,0x04acbde8,0x73db6aee,0xb7f993ce,0xbf69328d,
  45357. 0xad45e334,0xa3f79bbf,0x7c1f1630,0x8c51ec93,0x9b00a6de,0x4907325f,
  45358. 0x12d82bc3,0x49e6acb4,0x0ec59fc9,0x5901b36d,0x9cf34e3b,0xcb09b710,
  45359. 0x1abf4c02,0x2de0487e },
  45360. { 0x8dd9d484,0x18b722f3,0x7c77bacc,0x83349393,0x93d92b8a,0x58dbb8f1,
  45361. 0x8e3fac25,0x80d78d50,0x745f4a7d,0xf0500981,0x877cc29d,0xd072bfed,
  45362. 0xc30a89f8,0x67abf8f2,0x9a0820d7,0x92c567ea,0x8a3a5738,0x425ab12e,
  45363. 0xf055521b,0xc162faeb,0xb94ea5e9,0xee1c4f26,0x3d71e546,0x1e414994,
  45364. 0x43e8be1d,0x258183b8,0xef9eae0b,0x44917c82,0x73874a30,0x6813a457,
  45365. 0xcc42f86e,0x6f6ac071 } },
  45366. /* 150 */
  45367. { { 0x4dd6e3b1,0xd38822ad,0xad620869,0xfc78e1cc,0x2cacde80,0xe7843845,
  45368. 0xa8469fe3,0x121cc14a,0xe67e8ef2,0x8e8f3da7,0x4d347448,0xdb83d16e,
  45369. 0x798631f4,0x3ba1dd98,0x0a4c4c17,0xdfab5977,0x3edc701f,0x1f0a1306,
  45370. 0x6cd8ff28,0x4649d601,0xbcc55bc9,0x2267230b,0x5760412a,0x02a19c60,
  45371. 0x328faef6,0xc719d5f1,0xf67eaad9,0x27cb969e,0x719bafb5,0xf342530e,
  45372. 0xff5a82cb,0x6e2c24cc },
  45373. { 0xadaf8793,0x6313024b,0x035c948e,0x944bccf1,0x953500bf,0xe9a066b7,
  45374. 0x1d116765,0x7991a946,0x9fd93c78,0x95addb2e,0xe92e5495,0x05d2c037,
  45375. 0x9f03e5cf,0xcb145b18,0x95aa1f72,0x81ae48ca,0x135a6e4f,0x203f2702,
  45376. 0x49b2a7d5,0x2bcef5a2,0x02d7f2a3,0x0687a900,0x6c6745b0,0x2f7d3228,
  45377. 0x86507305,0x3da8a875,0x2e8dc58f,0xbe38b884,0xdbf11185,0x6b48bf34,
  45378. 0x97c08f91,0x5af7fd0d } },
  45379. /* 151 */
  45380. { { 0xf4a224a5,0x55f9b950,0xcc50273a,0x41904574,0x643f1fd5,0x34f81330,
  45381. 0x0e50f783,0x996801bb,0x89581712,0x866d7403,0xa4091d36,0xdb9a405d,
  45382. 0x16a46fe7,0xf1e379df,0x83bf9168,0x8d04a93f,0x32b20bca,0xae4c8335,
  45383. 0xf72a1c10,0x99d334b1,0xd8195db4,0x8fbc9977,0xfba14b5d,0xcaeb3dff,
  45384. 0x76daf476,0x60fef022,0xdb5b72f4,0x4b948dfe,0xb6dfb062,0x5185c925,
  45385. 0x9609d4ae,0x27a9c381 },
  45386. { 0xf12a93af,0x73c37346,0x5536634d,0x028b707c,0x498193d1,0x8efa58d5,
  45387. 0xef21b69d,0x4f83a5cc,0xa788a0e2,0x05cbb0a3,0x65b13c98,0x01031781,
  45388. 0x2b73784c,0xfea20e58,0xe50361f2,0xdf9713a0,0xd0cc22d9,0x31449a0f,
  45389. 0x7c5e2e1b,0x183752e7,0xb67044cf,0x6e44d6bd,0x733e177a,0x012dde95,
  45390. 0x08ee2c23,0x68b49669,0x1f5f1949,0xd9bb0541,0x6acd886f,0x95182c71,
  45391. 0xfbde9244,0x1c690694 } },
  45392. /* 152 */
  45393. { { 0x3a880026,0x5db67d17,0x125d95f2,0x89c4f0a0,0x3f6cb7a4,0x29050551,
  45394. 0x5cbbdca5,0x3eb231d1,0x972bcbd3,0xf8cffc99,0xad55a03a,0xcb4ef4d4,
  45395. 0x22867c2f,0x944d47ca,0x0ead1aa5,0x96d88548,0xcbc8b045,0x76a57cf8,
  45396. 0x005e55a0,0xdfe5844b,0x1d18a097,0x5e9e7e19,0x52923c74,0x957a26e8,
  45397. 0x7f5db339,0xd0867b79,0x63bed0c8,0x2553408e,0x689ad23c,0x1596e5d5,
  45398. 0xa504c339,0x7b8c13d6 },
  45399. { 0x52fb6901,0x2fc43aad,0x16ca253b,0x1c0313f9,0x515aadc6,0x1475830a,
  45400. 0x7f577dc2,0xc93d1926,0xf723c0dd,0x26e52e8e,0x3eb9f6da,0x2f1e0eb8,
  45401. 0xf180376d,0x9979de82,0xb0834939,0x43e28ecb,0xa39c38e7,0x9a2d51dc,
  45402. 0xa8e3f6b5,0x6e6063a9,0x4b9b3270,0x4cf1da3a,0xd2f8915d,0x6e5348a2,
  45403. 0x50507912,0x5e75e3e0,0x20d383fa,0xaeffce57,0x8fd2fb29,0x1d6d53cc,
  45404. 0x696f4cd0,0x0e3c3ef6 } },
  45405. /* 153 */
  45406. { { 0x21ee1d83,0x3bc337c1,0x787b7788,0x97e08f6d,0x138fa4ce,0xbf709fcc,
  45407. 0xa0348e58,0xbaf77647,0xa55e672d,0x04f8babc,0x7d5ec5dd,0x0ed2919d,
  45408. 0x33e99218,0x8ce64bff,0x24b059af,0xac09fc57,0xdc5e32ba,0x506831f9,
  45409. 0x465af6a9,0x26a22677,0xc97f1ff8,0x3c5efe66,0xbc6087fd,0x1515e0d6,
  45410. 0xaa8edc6b,0xb1a39c5e,0x0e79ed29,0x3dd816bb,0xbc3788b8,0x6cc13769,
  45411. 0xc092a51c,0x463098e3 },
  45412. { 0xc8bd0fa7,0x3a6408c7,0xce6bde49,0xd1764311,0x283ef7be,0xe315e108,
  45413. 0x99b5d938,0x8213cc77,0x45a49a6b,0xaf7f1581,0xe529e4d1,0xd00fdb0f,
  45414. 0xce66c9d6,0x55d38f77,0x1bd4b952,0xb4f7ccc0,0xaf71f986,0x8d975b49,
  45415. 0xcd64d00a,0x12b59fcb,0xa5a3bad7,0x1860e504,0x2b5c89f1,0x6d976044,
  45416. 0x7a3e231f,0xfed0c659,0x178cba92,0x58114c33,0x6698e11e,0xe2e74c06,
  45417. 0xa348b85a,0x7f8fd093 } },
  45418. /* 154 */
  45419. { { 0xc19428af,0xf24592ca,0x3a308665,0x192a1c81,0xe30bbd7f,0x42589812,
  45420. 0x836c6bb9,0x10db0723,0x598e4987,0x9c7a41e9,0x6ead6f4b,0x8aff179e,
  45421. 0x75862c44,0x70f8f9b9,0x6f21983e,0x6b3b0237,0x98e65152,0x25d83e9b,
  45422. 0xd751218a,0x3b2d26a8,0x9d6f1da6,0x9508281a,0xa5a81f74,0x8df78d05,
  45423. 0xe4687471,0xd79ee559,0x6787d8cc,0x2060ca57,0xa8476c95,0x427a84ff,
  45424. 0xe6435131,0x87b64c51 },
  45425. { 0x4b30d3c4,0x87f46f65,0x23b4ef14,0xcdec4c5c,0x63ca4d68,0xb3b74766,
  45426. 0xcf3fb56d,0x1df34269,0x0fd7d46a,0xd4f139c4,0x6a69a8bd,0xa3b7c7c7,
  45427. 0xcbadd7d2,0xee56b4c9,0xac942334,0xb28ff342,0x786f1da3,0x0046fdfa,
  45428. 0xb700c82e,0xce5d149c,0x50966597,0xca30ef81,0xfcff4bdd,0x44a20609,
  45429. 0x44925268,0x0f2f65e7,0xd4021f38,0xe5b6552c,0x042dbbd0,0x77ea9c2a,
  45430. 0xd9c062f5,0x8c95267c } },
  45431. /* 155 */
  45432. { { 0x5fc1abb1,0x6655032e,0x12fe4743,0x2215af54,0x29f05ef5,0xfd657560,
  45433. 0xdc191be9,0xb0e73325,0xc08639b0,0x7ab3c65e,0x1c3e6673,0x67507f51,
  45434. 0xc8615555,0x638befc3,0x42f0c4ad,0x5d0188cf,0xd896186d,0x843a301c,
  45435. 0xb2c6741e,0x045603f7,0xfa3cd1d0,0xf7545c0c,0x4a40672e,0xf612affd,
  45436. 0x45b9e8dd,0x56197c9f,0x87922d74,0xb453237d,0x4b2d59bf,0xbf132e3a,
  45437. 0xb84a6a16,0x8afa1b73 },
  45438. { 0xe793ac70,0x6b3596ea,0xeef6dd10,0x4c94ef8e,0x70422e40,0x926b4fa2,
  45439. 0xe9e5d763,0xc8c71dce,0xf512aadf,0x352fcb70,0xa883975f,0x1b7ba138,
  45440. 0x058c3b13,0x57991390,0x97740fd1,0x9692092a,0x160b0697,0x19ad945b,
  45441. 0x10837ab2,0xbc634388,0xf174bb71,0x76ee11c4,0xab1b80eb,0x6111bfc1,
  45442. 0x70ec458a,0xbc82bac8,0x312d3325,0xeee60127,0xb240adc8,0xb4118b1a,
  45443. 0x2b5a093c,0x67211191 } },
  45444. /* 156 */
  45445. { { 0xf55cf9bf,0x91e99306,0xa46b96d9,0x9b045308,0x9e7a65df,0xae3c1e1d,
  45446. 0xc731bcbb,0x453cb151,0xa4d58a61,0x14be5227,0x97c74cc2,0x39dac922,
  45447. 0x822e00d6,0x4d0f7a45,0xc62b03df,0xafeb1d51,0xbaa18b2d,0xbb1dc3a4,
  45448. 0xdf2b74f0,0x7f3c7178,0x896b6a33,0xfcd328a6,0x1dce055f,0xe95ed454,
  45449. 0x6a4e2b87,0x97fbc76b,0xfa59dce9,0xe5ec67f1,0xcc0367c1,0x052368ac,
  45450. 0x54e4a3fe,0x7c863916 },
  45451. { 0xca7388cf,0x55e94b5e,0xc0335d38,0x17cc0a60,0x616f85ba,0x9b69b78b,
  45452. 0x10122980,0x705d02ef,0x1cfd0a79,0x565a6e80,0x7d1ee352,0xeb74a96d,
  45453. 0x427b9dad,0x5c8832ed,0xe6d5330f,0x96ea8528,0x18d24ee8,0x30d8862b,
  45454. 0x9ff939f7,0x9cd38ed5,0x01060252,0x690fc9a2,0x2303b3ff,0xc62d88b8,
  45455. 0xdd52b469,0xfc42d7a4,0x8cad2d93,0x06f8dfa2,0x60920438,0x50236090,
  45456. 0xfce855ad,0x32582758 } },
  45457. /* 157 */
  45458. { { 0x359e8c60,0xeb20e45f,0x364ca186,0xc71bb8a5,0xdff8e110,0x02b15071,
  45459. 0x4c93e578,0x074e91d3,0xb829d0d8,0xc0326e00,0x626a83fa,0x3c192258,
  45460. 0xfb29a09e,0x387a64d5,0xe5ac5c82,0xcaaa3d34,0xada2da29,0x8ed685e5,
  45461. 0xeb29650e,0x92720267,0x763802f3,0xf7184b19,0xdf6b1aea,0x23f5dd0e,
  45462. 0x25e6125d,0xbe1fa347,0x0c872a1a,0xd6287f9d,0xac57c3af,0x49aa93d2,
  45463. 0x5bda7656,0x1a4e6a71 },
  45464. { 0x554d1267,0x1a126ede,0x1cd02b48,0x37f94533,0xce31fb1d,0xd70af04c,
  45465. 0x097dc012,0xcf410b0b,0x36c7b6c5,0x930e1d17,0xc6891085,0x902fee41,
  45466. 0x79fb638f,0x349ba4a7,0xacd6f8df,0xa16c5821,0x2e076ace,0xfb3b83c1,
  45467. 0xe501d14d,0x6b8d033b,0x20f2d2da,0x0593d452,0x99df1880,0x3752526d,
  45468. 0x9feb33a6,0xca32351c,0x1f6ef456,0xd91343bc,0x35b9dc8a,0xc74857db,
  45469. 0x85b4e832,0x856a7c93 } },
  45470. /* 158 */
  45471. { { 0x0d0a5583,0xa007d002,0xeda4658a,0x2f1301dd,0x34d939be,0x91c07964,
  45472. 0xa70c0836,0xa0cb6780,0xbe81e540,0xc0b4df95,0x5d4ac8b8,0x6cbbcd34,
  45473. 0x54756239,0x57c52ed0,0x1805ceb6,0xcac2dca4,0x79344255,0x915ee6ab,
  45474. 0x24c9a2a6,0x366def31,0x8c12c674,0xbd3b962f,0x7dbb7c3b,0xaab64f1b,
  45475. 0xe22bb95b,0x3c0e4553,0xc4c63b74,0x2408feba,0x2a4da631,0x3ca77312,
  45476. 0xc636da40,0x62889084 },
  45477. { 0x8cb8d208,0xa457fd53,0x543f06d4,0x7a8f8009,0xf2eff2ab,0xb66de154,
  45478. 0xf72517e7,0xfddb28eb,0xf9389d2c,0x0149fe66,0xd85b88ce,0x79e8773f,
  45479. 0x0ba543f7,0x452e090b,0xb0b03fc0,0xdeb9b5cf,0x6c5ed77b,0x3113448a,
  45480. 0x8ffc0372,0x3609f3cf,0x5c1b4c4a,0x2bc9c46d,0x8fa59be9,0xe66f3bf3,
  45481. 0xcdb02691,0x1396bf5f,0x009f88f9,0xf1ec59d4,0x2ad9dfe3,0xc2903456,
  45482. 0x5ada4d58,0x79d8122c } },
  45483. /* 159 */
  45484. { { 0xaa529507,0x14d4e4ce,0x74655d00,0x056a0814,0x4f0fc474,0xc0d30a38,
  45485. 0x3443cb8e,0x8a8203ea,0x97f1728d,0x33c62fb0,0xb520ef52,0x8a38dcfd,
  45486. 0x7cac9d3e,0xa0f90d5d,0x873cea50,0x28a7b0bf,0x6c6c41cb,0xd115ae3a,
  45487. 0xa13812c1,0xa35171da,0x624d507e,0x25d4bba5,0x7e98f42f,0x91dad289,
  45488. 0x96a41371,0xffd6b1e9,0xb69e5b77,0xd46c2125,0x20c4f707,0xc7d2b424,
  45489. 0x8142557a,0x2ab3af95 },
  45490. { 0x6a5372a6,0x86ca074c,0x56292ba7,0x728fb83e,0x77741cf5,0x745596dc,
  45491. 0x520ef49d,0x70b4cea1,0x61e46472,0x1472fe34,0x3fb8ac5d,0xf4d6bd66,
  45492. 0xc10bc071,0x46e52cc9,0x371a3461,0x28794efe,0x276fe877,0xa4850718,
  45493. 0x9bef5ab4,0xedad5773,0x3f15c815,0x24c2d9ff,0x8f8395c3,0x188950e5,
  45494. 0x80b6a855,0xbae40996,0x8a8803e1,0x4f53e22c,0x039d25ee,0xaf233f61,
  45495. 0x250409ca,0x07db2c35 } },
  45496. /* 160 */
  45497. { { 0x037d4703,0xc7f3b8db,0xc5f488b9,0xe83708df,0x8471d402,0x1fba830f,
  45498. 0x5a2faae9,0xa55ee8d2,0x5404fc1e,0xc2e5bf10,0xaa2d5651,0x647d5027,
  45499. 0x7ebaf5f9,0x37a53c0c,0x95b30abf,0x7adf0bb2,0xd64c93ba,0x5a62e1fe,
  45500. 0xe2ef4a78,0x7ffc18c0,0x4d2cd04f,0x139dd9d9,0x5ea0af02,0x253fbab7,
  45501. 0x0fef9acf,0x7c8100ea,0xc8615aa7,0x74c5384d,0x9fe52069,0xcb28682d,
  45502. 0xcf7dd759,0x08b6ca8f },
  45503. { 0x036c3b5a,0xe04e5bea,0x7f9f2b4b,0x38726102,0x29797c0f,0xa9fca570,
  45504. 0x82879ea3,0x1656180b,0x607f0ddf,0x153389bb,0x67b0e087,0x99a1223c,
  45505. 0x9d897fc7,0x0d1808ec,0x916edf19,0x9470711a,0x07217118,0xf8f52f2b,
  45506. 0xd18888b6,0x5d8b29ff,0x4cc6f900,0xef1e22c5,0xeb24877f,0xc4036165,
  45507. 0x35479525,0xfda95233,0x6861468a,0xd622a421,0x74faba08,0x5d043b07,
  45508. 0x0d31a7d2,0x2c337b02 } },
  45509. /* 161 */
  45510. { { 0xea22fa65,0x7b2305bc,0xd159f63a,0xbe183ef4,0x3f35923f,0x3473d87d,
  45511. 0xc11d7753,0xb27fb306,0x2a054cff,0x702e7e6b,0xaf185619,0x3ce9f97c,
  45512. 0x4e7d51c5,0x83550243,0xf356ac5b,0xa63e3d82,0xd7645131,0x867b7caa,
  45513. 0xa671fc9d,0xee85e6af,0x2b07cd77,0x3b985ede,0xffda5193,0x07d598b0,
  45514. 0xa942dc36,0xb10eca39,0x506218a9,0x17f3dcee,0x06b7d5ca,0x3d94e8d1,
  45515. 0xed8831c9,0x509b2634 },
  45516. { 0x48caed54,0xb1b9414e,0xcbf51e97,0x77a78c6c,0x4de9b258,0xa4688c8d,
  45517. 0x91ee3d78,0x0024137c,0xe30ee64c,0xa68f9234,0x88190d78,0x573255bc,
  45518. 0xba80690b,0x41e8e05f,0xec354f4c,0x50038d84,0xdfa52816,0xb18f02d6,
  45519. 0xccb63fda,0xc47f9007,0xe98ae455,0x29d480fb,0x5d0e319d,0x4ac45d22,
  45520. 0x026db719,0xd06f3575,0x2c3587b9,0x733b9e20,0x2c317727,0x22483992,
  45521. 0x54bb8752,0x1592d5a7 } },
  45522. /* 162 */
  45523. { { 0xcf7453f0,0x5778d9a2,0xed83c1f0,0xaffb899a,0xe0a82ba7,0xae6506d3,
  45524. 0xea3d5081,0x32c84e1a,0x810aa38b,0x9ad528c0,0xbd37d041,0xb1fdb020,
  45525. 0xd06ce41f,0x78d6cbe1,0x2e74b7f6,0xd287f0f0,0xc43bb022,0xf5cd2575,
  45526. 0xf81a71b3,0x6d28f2f3,0xc633e7f4,0xe65bb1f5,0xc4fc580e,0x32e5fc1c,
  45527. 0xbb7b07a5,0xcd55539f,0xc3caaf3a,0xb5a94471,0x4cc22d2d,0xb958bdf4,
  45528. 0x77a2777c,0x1614bdbd },
  45529. { 0xed0ab04d,0x4c1f0230,0x6e2082ea,0xae347b00,0xc42c5b5f,0x9f10bc63,
  45530. 0xde019935,0xb0539e6f,0x65dd0825,0xd89bd4e7,0xbbceda16,0x92260fef,
  45531. 0xe62aca32,0x8aaa755c,0x5ec82c5f,0xed762fa9,0x18650768,0x99e64c01,
  45532. 0xc92e348c,0x57dd6245,0x31ea6d68,0x0db88a77,0x07b44736,0xef0012ab,
  45533. 0x171d70fe,0xb9356b94,0x03f891b0,0xe68b0628,0xb79c20a2,0x3a54a53a,
  45534. 0xb00b0728,0x489656c7 } },
  45535. /* 163 */
  45536. { { 0x71353c25,0xe43649ba,0x13f67e24,0x517f27a1,0x1c1eb9e3,0x10bd333a,
  45537. 0x78e29bf9,0x94e1c05c,0x4743f15d,0x84fe7d97,0x90da2df0,0x9c874908,
  45538. 0x53673be1,0x82403fa7,0x1baea1b1,0x7ebf5db4,0x24180ead,0xcfe0ae35,
  45539. 0xc2f50c3f,0x1d15873f,0x70661cd9,0x16851ad6,0xa51e8c2c,0x802968d9,
  45540. 0xe0161099,0xe7d1a9cd,0xa8a7ea56,0x2b153c89,0x06e3c498,0x6d41b789,
  45541. 0xd6769dcb,0x082bb2e9 },
  45542. { 0xc4d6615f,0x6180ef46,0x01b9829c,0xfc629dc1,0x0fb264ca,0xde222ec0,
  45543. 0x10ecc2c4,0xc5457e06,0x1eea2c4d,0x95ce599f,0x8f9c5b2c,0x0433fa72,
  45544. 0xcd6310f9,0xee035462,0xce2e2253,0x84c57c3b,0x96d87e44,0x6c8ec31a,
  45545. 0xa452c5a7,0x30bfe393,0xa047b235,0xc592b140,0xc018545e,0x7bd8be18,
  45546. 0x5c178c46,0x794e0107,0x2e23005b,0x48471946,0x622a54f3,0x2665e237,
  45547. 0x901c9042,0x36451a46 } },
  45548. /* 164 */
  45549. { { 0x19893e71,0x17802d18,0x539a2082,0xa1765d8b,0x2302ecfc,0xfc6aea01,
  45550. 0x365bf59d,0x8d4cf51b,0x0d232a80,0x87741d72,0x18e80427,0xac343eb3,
  45551. 0xe74739ec,0x553ecb2f,0x1a8b07ca,0xaeca79a8,0x56f4ab3a,0x089ff322,
  45552. 0x3fa1d1f7,0x5e95d729,0xf62a9a16,0x260569ae,0xaa08ddc2,0x5e776232,
  45553. 0x1b7bb54a,0x93fabec3,0x743d56e7,0x48a20956,0xeb0ebeff,0x749cdb12,
  45554. 0x69b8fcf1,0x705307a4 },
  45555. { 0xe488310b,0x7a8e4c04,0x5325cd7b,0x12726e32,0x4983efac,0x5d0fd8b0,
  45556. 0x02ddb913,0x796e552c,0x77b9685c,0x0eeca3f7,0xb15f24a3,0x9b766e89,
  45557. 0x48efc979,0x7c2736d6,0xa8021c6c,0x3d619685,0xa0b2f1ea,0xfe33e278,
  45558. 0xb676d6b0,0x95c69879,0x1af4e0be,0xa0747319,0x36c4ee55,0xa2fab5f1,
  45559. 0x59e5f3b9,0x6938b8ff,0x39cafe6e,0x1e114da4,0x6a6ad120,0xc9595ec3,
  45560. 0x57e62aec,0x80f79bd0 } },
  45561. /* 165 */
  45562. { { 0x60af09b3,0x3cef42a7,0x933dfe14,0x3c016ebd,0xed85eaa8,0x720cf1e0,
  45563. 0xceaa3bc9,0xd4f5e99f,0xb7106f97,0x7216b9d2,0xc9668ad2,0x65f34c36,
  45564. 0x5b0c651f,0xa8fb82bc,0xf2fda4de,0x20f42f1c,0xd21f659e,0xeb31ab2c,
  45565. 0xa13d1618,0xb7a776c7,0x38662be5,0xec441022,0xcad08e0b,0xc825da70,
  45566. 0x022c0180,0x99299079,0x2aef9ffd,0x7623bda0,0xf5c58b50,0xde84f4f3,
  45567. 0xd824ff19,0x5f5a5da4 },
  45568. { 0x7e8311dc,0x5737257e,0x466cf136,0xdef94f51,0xb05ca21a,0xa73e1645,
  45569. 0x02e4ab37,0x38ea9b3c,0x8579165b,0x7760eac9,0xc24b01a4,0xdffdd047,
  45570. 0x3fb95584,0x188d4fd1,0x25548bda,0xfaac38b8,0x59e9dcac,0x1a79a6f0,
  45571. 0x09a2700f,0x983f720f,0xfb8a7e48,0x8cbba554,0x47a1fad5,0x38a19968,
  45572. 0x5abd6b5e,0x11856547,0xf3716ec2,0x75113d31,0x4212907b,0x1391e781,
  45573. 0x0dc15889,0x5319c801 } },
  45574. /* 166 */
  45575. { { 0x6b61c3af,0x2320136e,0x07b4bb68,0x1d40f2de,0x380c97f0,0x651dee7f,
  45576. 0x6a8c313a,0xa978ba70,0x2011ca10,0x22c587d6,0xab1f445b,0x48bba218,
  45577. 0xe50444e6,0x8c5eaf07,0x442fccf9,0x5549f02a,0x3d80493d,0x2564746f,
  45578. 0x79c04591,0x42d24f61,0xabdc8887,0x1600fa18,0xded38f8f,0x5cb8600a,
  45579. 0x923aeb46,0xa4bf9b90,0x1e1c578a,0xd63fee35,0xebb9ea14,0xf3c9c5ac,
  45580. 0xf11a4ff0,0x3d13314d },
  45581. { 0xb4513d1e,0xe5cc662d,0xd55952bd,0xde78a8c5,0xe7f86d0a,0xe8a37a3f,
  45582. 0x7a04f0c5,0xca2d12a4,0x2e25d06c,0x4c6696e4,0xb2136071,0x52614698,
  45583. 0x89f6e1cb,0xf4d2701b,0x80efd95e,0xaafd6177,0xc5bb6907,0xe6d73ac4,
  45584. 0x420db35a,0x49e874ac,0xf2751fa0,0x11631de4,0xa1fa2edd,0xb29f7336,
  45585. 0xb7fd794d,0x4c406864,0xe22f92a6,0x73cb21d3,0x2043cc76,0xeae904e6,
  45586. 0xb322c6ad,0x67f28a9f } },
  45587. /* 167 */
  45588. { { 0xca148ab5,0x7c17b258,0xb3c60051,0xb9a1976f,0xc8f28df9,0xea260698,
  45589. 0xe8d45017,0x87b2cc74,0x0578a422,0x37257329,0x17bec732,0x81d5ee25,
  45590. 0x1d48bbc4,0xd7411fcf,0x487f5cfe,0x46217e6b,0x41eb8e1b,0xcb007ac5,
  45591. 0xe05a00c8,0xc41c57a6,0xd2f9fa99,0x1f954d2b,0x40941cad,0x370bd5db,
  45592. 0x3829509d,0xe487879c,0x5ceca5ee,0x4c137552,0xfd3efb9e,0xe8ef7fa4,
  45593. 0x1bd1bdb2,0x5ff09174 },
  45594. { 0x579c6632,0x791912a4,0xb8a20815,0xbb19a44f,0x535639d3,0xf4f97b84,
  45595. 0xbc3c9bce,0xe57e2bcb,0xf19e6410,0x122b3f2b,0x1357d9ad,0x1f0189da,
  45596. 0x79e5ff66,0x675573bb,0xef2f3c4c,0x444e5c98,0x04d10731,0xd6f61e20,
  45597. 0xac75d635,0x0dfa366f,0x2c854f23,0x9fc47c86,0x0ad0850b,0xc04ae43e,
  45598. 0x2f720c32,0x5ce94f64,0xa753bc9d,0x67efae65,0xb0373a63,0xc27d30d3,
  45599. 0x29721646,0x6681013a } },
  45600. /* 168 */
  45601. { { 0xe84509df,0x1385d913,0xcf339376,0xe978bedd,0x3423a148,0x2df425d3,
  45602. 0xee8cb579,0x43fa0ae3,0x31c4553c,0xf015369d,0xdfbf1d48,0x05cf08bb,
  45603. 0x9444244a,0xadff4be6,0xa35dda33,0x01635f81,0xe76fab7c,0x085c8949,
  45604. 0x16737783,0x4bd7fcde,0xa254f8d2,0xfd8cb52c,0x413ec985,0x62168a66,
  45605. 0x7a9026cc,0xf2db9741,0x50e1e1b7,0x3962ee56,0xd3beffde,0xbee0a346,
  45606. 0x0bdfab1f,0x3b35b72f },
  45607. { 0x535c3749,0xbff8de9f,0x8add9c48,0x23c1f20f,0xc8f8f663,0xa975b37b,
  45608. 0xe8f3ae49,0x2529e475,0x1d5e2628,0xc32f10d5,0x67862f1d,0x5ac0d297,
  45609. 0x854cbe36,0x13c79338,0x4b67e462,0x48f004ef,0xe5d10ee1,0xfa37a150,
  45610. 0xd28288a0,0x4974778d,0xcfb73f4d,0x96830a66,0x07804952,0x9f444013,
  45611. 0x9760b694,0x8233c709,0x25b75c99,0x8340cca5,0xc771f99c,0x3f62e40b,
  45612. 0xcd95c685,0x47d0a1eb } },
  45613. /* 169 */
  45614. { { 0x652811f1,0x266f4fff,0x62ef3002,0xeaacaa93,0x50cba0ca,0x6c387a55,
  45615. 0x007f5467,0xa350142a,0x202f2673,0xc7fd102a,0x33dc6e65,0x5daee570,
  45616. 0x064a63d9,0x60682ec3,0x462b251e,0x46cf0bb0,0x5da936e7,0x0e030ca5,
  45617. 0x434265b5,0xc87a60f2,0x69b4e8f5,0x9637b2bb,0x7ad7770a,0x601fb58c,
  45618. 0xed3a15a6,0x1f2147f6,0x2995e961,0x05b47d5e,0x83213a16,0xcb0ca9b3,
  45619. 0x4995a85c,0x8f4b614a },
  45620. { 0x4b4eb3c1,0x5aa8ec19,0x20323a70,0x8c549ac4,0x4f6cc6aa,0x00d49322,
  45621. 0x45f9a5a3,0x0e53b9bb,0x0897abbb,0xe46ef110,0xd7acd7d0,0xfe873e57,
  45622. 0x0f7cb588,0x7cfccfe5,0xc85557d1,0x0ea53d65,0x7288f2e2,0xfdd9eb44,
  45623. 0xc0eb68a8,0xab2dedfa,0x08603a0c,0x58221470,0x00feb06c,0x69464689,
  45624. 0x25e5caac,0x804cf5bf,0x9fc91ae9,0xd8559858,0x73c45eae,0xed9378b1,
  45625. 0x524c9801,0x8f942d02 } },
  45626. /* 170 */
  45627. { { 0x8e845808,0x1f1ec302,0xb77abfc5,0xc302bffa,0xf8d97dc7,0x26afd4b9,
  45628. 0x3aac594b,0x3d3a83c4,0x674d94dc,0xe3b74bd1,0xcaa5911c,0x4464b737,
  45629. 0x871c2cd2,0x62925773,0x3b4440fe,0x419f2485,0xe052ad7d,0xdda6a0f3,
  45630. 0x846c86c0,0x645280d6,0xf8324f42,0xa25689fa,0x07cf117a,0xc74ad1e8,
  45631. 0x8ddc9db7,0x5626dea0,0x966fc85d,0x52620373,0xf3b1eb53,0xe0ad57c3,
  45632. 0x949c1acb,0x38300252 },
  45633. { 0x5e744723,0xa0ef5a40,0x1ae08481,0xdb5bcf75,0xfec1f76f,0xabfad8cc,
  45634. 0xfab37fc6,0xfba5d831,0xc8fedb78,0xbe39e248,0xad93f310,0xa5cfad5f,
  45635. 0x913d5c24,0x747fdb1e,0x4518b7f5,0x052a47c9,0x7cfb4327,0x9e208d6c,
  45636. 0x70e538be,0xb135cb9c,0x5bb17916,0x36352759,0x5b3106c7,0xa2c07880,
  45637. 0xc209bb06,0xd2d42a06,0xd3c504ad,0xb525b471,0x822ce034,0xc9f4b368,
  45638. 0xeb4185a5,0x15f18796 } },
  45639. /* 171 */
  45640. { { 0x0aee4684,0x094dea06,0x7cdbdbc8,0x42b21f06,0xb1931319,0xa439e149,
  45641. 0x81a7dba6,0xea4bdd41,0x3c2ae80f,0xc6213706,0x12823dc2,0xb58b0967,
  45642. 0x832611b1,0x7443d515,0x13c20384,0x2e16f831,0x2bd992d2,0x0ce204d6,
  45643. 0xf419388b,0x499dbcd6,0x1d3778c7,0x492ded1d,0xc5ddae73,0x9d5bd74f,
  45644. 0x994b6259,0xd4813d52,0x0e86ca68,0x191d9cf6,0xf3e9c2ac,0x562179ea,
  45645. 0x9fee1238,0x6146f1f3 },
  45646. { 0x078e2aa6,0xbd06d33e,0x9dee9265,0x693af7f7,0xdaa40e84,0xd56e0f81,
  45647. 0x9b9a407e,0x05fbbb88,0xede99519,0xdcf44adc,0x092dba39,0x7f71f8d3,
  45648. 0x4231774b,0x675b5da5,0xa5f605eb,0x7456a251,0x87a39a9e,0x9031d4af,
  45649. 0x05b474bd,0xdb430006,0xb665aa91,0xbda5dbf2,0x6631eeb4,0x5d1a3df5,
  45650. 0x62377c58,0x028149ef,0x685d0bff,0x2e1af4e9,0x82a465de,0xe0ea0875,
  45651. 0x06bd0050,0x95543f9e } },
  45652. /* 172 */
  45653. { { 0x85d7c6ef,0xf7cbc6f4,0x63b1bc24,0xcad8084d,0xbf8cba62,0xdf90ce88,
  45654. 0xb455c192,0x98e4b686,0x774fc6ed,0x6146b8d5,0x7ae20077,0x70e2389e,
  45655. 0x61c22529,0x5241c479,0x3884e5f5,0x7d221510,0x17e28273,0xd6d20ce2,
  45656. 0x4f2674f8,0xe3119f51,0x70c011db,0x85459055,0xfcfb760e,0xdfab75d9,
  45657. 0x9e8c2a19,0x9546362a,0x4a7d4b27,0x4b6d3f8a,0xee5d698c,0xa5c87104,
  45658. 0x2ba296ff,0x6db43478 },
  45659. { 0x5c3f0d95,0x06486493,0x4e748895,0x8917db82,0x6b2f3e44,0xf73fdf62,
  45660. 0x2b7f574b,0xc60edc54,0xaf732723,0xbe1c09a2,0x7cad114c,0x7d34669d,
  45661. 0x321aaff9,0x9646600a,0xed0cd61c,0xb94e2bba,0xdec4750e,0x866e1a41,
  45662. 0xb1a89f58,0xa1be990d,0xf2759693,0xc39e4d6c,0xc0e0dddf,0x11cfb780,
  45663. 0xd99c8a41,0xf0afcd7f,0x6e1c3050,0xcebffadb,0x96d2c6e4,0x4f3981b0,
  45664. 0x2ae27a94,0x07a791e7 } },
  45665. /* 173 */
  45666. { { 0x1e9f0300,0xe70e9047,0xbccdf904,0xe0253ad9,0xff053078,0x51c0289d,
  45667. 0xae893462,0xf1ef092e,0xa4846845,0x2c90a91a,0xf1dad4b4,0x1946eda0,
  45668. 0x33df67b2,0xf07650f3,0x0b15a014,0xc6e988db,0xb542f0f9,0x72e0c66e,
  45669. 0xe0c0378f,0x5d4b6311,0xae86950d,0x548badaa,0xb35f1c8f,0x6801638d,
  45670. 0x944d1ad4,0x129e3216,0x40471d32,0x9951bac8,0x85e94dde,0x03cc29f3,
  45671. 0x4543ecac,0x6d6acc2e },
  45672. { 0x57b2d299,0xeb999e95,0xe3d721cd,0x3a2bcd9b,0xbb4cb444,0x2e60384f,
  45673. 0xdc060faa,0xae177709,0x8c987cde,0x74f0e6d3,0x1076fbed,0x9a237cf8,
  45674. 0x7983fbff,0x69af1513,0x323f9584,0x6c3f7a1d,0x6db64398,0x3e21cacf,
  45675. 0x96703d92,0x7cd8134f,0xb8393f76,0x0755898f,0x2e825222,0x1b5b28bc,
  45676. 0x7924aa7c,0xb78799c1,0x81427a8a,0x1db378f2,0xff289492,0xd5a451b1,
  45677. 0x3d3c46ee,0x79d18212 } },
  45678. /* 174 */
  45679. { { 0x109d5589,0x1a3edff9,0x029b4499,0xded52eb4,0xb4b54adf,0x13eb9d30,
  45680. 0xa27bff67,0x4f9214c1,0x67f0f460,0x4c817ee7,0xc3a50e28,0xbadf8d83,
  45681. 0x94026237,0xc5dc03c9,0x966647c1,0x5f29581b,0x8a0687f3,0x10b6a089,
  45682. 0x31634517,0xae787cec,0x62e75188,0x2001dba5,0x45e2c3fb,0x55d4e1a7,
  45683. 0xb67d3395,0xbfcacdeb,0xbc6842ee,0xa1a0af9c,0x3e88580b,0x50590a2b,
  45684. 0xa784cdc8,0x73104491 },
  45685. { 0x2648d676,0x44ca2cdf,0x4f1b12b1,0x9a85eca5,0x2980e1eb,0x1b9dac94,
  45686. 0x1ac8aa89,0xf30d3709,0xc719e195,0x73072ab7,0x2f703797,0xba518c82,
  45687. 0xac0067f6,0xac090e14,0x8dcd2927,0x0e6cfc70,0x21e7da63,0x4f5889e2,
  45688. 0x8371c7c6,0xb4aaa40b,0x8f7878c9,0x1f9dabe2,0xd84caf3f,0xf78aed6b,
  45689. 0x9e0e1d92,0x3c39dd07,0x122424dc,0x680be5fb,0x0bdc0099,0xf41b214d,
  45690. 0x5180c54f,0x6a8f8fc9 } },
  45691. /* 175 */
  45692. { { 0x53235132,0x62a1ed63,0x59dba88b,0x1db233f1,0x291efdd8,0x85625452,
  45693. 0xb25111ae,0xc7505297,0x1d701bd8,0xb5921af9,0x9774f45d,0xb4d05d72,
  45694. 0xf18e73ff,0x6e3d4c5e,0x899b3038,0x897d985f,0xc89b1558,0x8a9c30fb,
  45695. 0x4d13181c,0x3c92d1a3,0x2223320e,0x292e86ba,0x01ceed02,0xcf2454c2,
  45696. 0x583f309f,0x27a45f74,0xad0fd1a3,0x75a6102c,0xcb9c7538,0xdb4f45d2,
  45697. 0xdb283fd7,0x4752d8c1 },
  45698. { 0xd5dff4d5,0x514d6cea,0x45a827f4,0x74cd5fdb,0x4fc7135e,0x1070a60c,
  45699. 0x1be5778e,0xdec0bb78,0x58dc6b08,0x271e12cd,0x54bc2496,0xb765089b,
  45700. 0x619098ac,0x6ddf2c63,0x67528832,0xfd6ebac6,0xc2508af1,0xeaa2d025,
  45701. 0x4dcfc1f0,0x13c2cda8,0x45510be0,0x1c7836a8,0x1a886801,0x3904688d,
  45702. 0xafaf2545,0x643132aa,0x2830a88d,0x49685577,0x8744b470,0x569491ca,
  45703. 0x75fb8552,0x3a6518f3 } },
  45704. /* 176 */
  45705. { { 0x224042a0,0xaaa8ed50,0x2452f1e6,0x6cb4e3b0,0x768211d8,0xedca5f4c,
  45706. 0xef4d5d3f,0x4e0fe3f9,0x522d46e5,0x33a8e2a4,0xf1446775,0x5998e21f,
  45707. 0xf592d01b,0x1496c50e,0x83a67739,0x69104c2f,0x472bbf00,0x28670bcb,
  45708. 0x503177bd,0x8ea883b2,0x7d2712a2,0xc5d8bc05,0xb439c994,0x41ef9317,
  45709. 0xdcda1aff,0x9801d3a8,0x7038f6fb,0xd686eeb5,0xfbfbf820,0xe80c5cd0,
  45710. 0xedc25817,0x540ac363 },
  45711. { 0xfe7f43df,0xa71969a9,0x2c1b9e4c,0xe6653808,0x859c2917,0xad9677d8,
  45712. 0x96aa4404,0xbaca9545,0xff1297da,0x0e9d855f,0x22aea7de,0x1f61897b,
  45713. 0x36f13f8e,0x96edccfd,0x16e200df,0x627d3070,0xc98988a4,0x729f0736,
  45714. 0x97f231d2,0x95e25e60,0xf6048752,0xaf7f221b,0x4019b299,0xd6682609,
  45715. 0x26b4b1d9,0x1d99de09,0x1acdd7a3,0xec47cf66,0x6ebe15e9,0x4de9f2b3,
  45716. 0xfa16974f,0x17db32ec } },
  45717. /* 177 */
  45718. { { 0x6cf40599,0x75ef6919,0x00c020ea,0x7ea10dfb,0xfcaaf679,0x3da5ae7b,
  45719. 0x88ddd678,0x0d663ca3,0x255bcfcd,0x5a21f8fe,0xe344bc7e,0xe9c3f538,
  45720. 0x548e0632,0x35f62b1d,0x43c6e64d,0x654f2425,0x26993627,0xc755a7a6,
  45721. 0xb0f41324,0xa3b7c5f7,0x3a2180f3,0x05697f79,0x1e81675b,0x6cf85fb1,
  45722. 0xe53428f5,0x6d3cdb35,0x52d28b02,0xe3aa1591,0xf7a3fb78,0xa8470255,
  45723. 0xa194445d,0x460bd01b },
  45724. { 0xc24d8077,0xbc34dc23,0x4c720d2c,0x82f4b580,0x6f5d1ffe,0xa29da911,
  45725. 0x92783ce2,0x578af520,0xb5904af3,0xe29f51ab,0xf7aa1190,0x46c570d7,
  45726. 0x571bddf0,0x4a522fba,0xae89bb51,0xbf4e2a06,0x59f3444d,0x799b35cc,
  45727. 0x26cc2557,0xc3028367,0xafcec177,0x94a4e985,0x7c36cbd0,0xadaf7dcb,
  45728. 0x75d39077,0xed31b787,0x2d3e24bc,0x52d6904f,0x1f95421b,0xc5ca2669,
  45729. 0x1734878d,0x7d342c3c } },
  45730. /* 178 */
  45731. { { 0x11fd127f,0xe5cf2c0a,0x119e4c5e,0x66d36bb8,0x6ef56ac3,0x621ab252,
  45732. 0xe5430675,0x30cfeaee,0xac3e9619,0x2ede27d2,0xf8fce671,0x6413513a,
  45733. 0x075f4c3d,0x6159c61b,0x59069d98,0xd447efe9,0xea76aea9,0xaf8d6f68,
  45734. 0x0f5bd164,0xac5dc61b,0x1e88bb98,0xdbab446e,0x1ba92320,0x618b8b16,
  45735. 0x78989865,0xa0eafb3c,0xc08b7e82,0x0c7abcc2,0x20d160bb,0x10f09b6e,
  45736. 0x8e4c63a7,0x5be0afa6 },
  45737. { 0x1bbbf49c,0x82ab6d38,0x8c0703fe,0x3e09ce49,0xe10f4263,0xeca58b5d,
  45738. 0xda5a4532,0xd9cc6581,0xf618f7b7,0x07e18876,0x250f7fe7,0x0419a5e3,
  45739. 0xde6b86be,0xbb1a9e90,0x37359169,0x584a7deb,0x5149db2c,0x38eb3489,
  45740. 0xb0ebabb8,0x14546a33,0xc2f88a92,0x0067f0b0,0x0a2db019,0xbde0dfe7,
  45741. 0xc63e6f3e,0xba51b06c,0xe9206fad,0xa19127b9,0xfe80dc0a,0xe4eb5e87,
  45742. 0xd4de30ae,0x1e6fccf5 } },
  45743. /* 179 */
  45744. { { 0xaa8ac924,0xb57dff66,0xc298b3e8,0x06e9ad31,0x65fb080c,0xd140e329,
  45745. 0x1d95c93f,0x7dab211d,0x8a180caa,0x6d68d842,0xa20ded69,0x1a929408,
  45746. 0x38df461f,0xa8151753,0x60eae932,0xff5604ae,0x7dae4c0b,0x901b9e49,
  45747. 0xde262e89,0x4573a97f,0xf1084983,0xed69d9a4,0x64724f1d,0x8ffa022f,
  45748. 0xea85a15f,0xd5f1c2e4,0x01453794,0x4c626ce9,0xbf0907dd,0x80440cd6,
  45749. 0x5ddaa837,0x4522d461 },
  45750. { 0xebfbe7c5,0x8895f079,0x84ef3446,0x30ea1ded,0xd4a1ab96,0x716a9eb6,
  45751. 0x50a30c68,0x1a4a5d22,0x0043bbaa,0x5a16631c,0x5010e5f5,0xbd107502,
  45752. 0x3d8c0556,0xbffe3e9d,0x07772419,0x31b30b18,0x84b82297,0x90ff7ef0,
  45753. 0xf21a18c3,0x00c37d75,0x565bb8f8,0x18d0a635,0x45e3bceb,0xbac1da2a,
  45754. 0x23f0b08d,0x1c38e90c,0x5fbc5ac5,0xf1ba1aa2,0xdda71fc6,0x09d5256b,
  45755. 0x6d7e40ba,0x346501a9 } },
  45756. /* 180 */
  45757. { { 0xcc2b0f1d,0x86be448c,0xac4c3703,0xe3eb45c9,0x9fc96bbf,0x5387f65d,
  45758. 0x5ae27fda,0xcef3c4e9,0x1bc18089,0xa008f776,0x22ca18a1,0xf374a084,
  45759. 0x53b73371,0xee882842,0x7cc09354,0xcb6fc6d8,0x61496d6b,0x8489ec1b,
  45760. 0x49e325c4,0xa92c29b9,0x7bdec166,0x15c6ca52,0xdcea2813,0x95444eee,
  45761. 0x3a21154f,0x34683eb3,0xd39061cf,0x8fb26f98,0x06c940bb,0xc3b08aa8,
  45762. 0xe554c96d,0x7c1d42cf },
  45763. { 0xdc110aa7,0x766e703f,0xf362e378,0xab7b79d7,0x5aadca3c,0xd259c75d,
  45764. 0x60be3373,0x2a6eca79,0x06c4e8ff,0xf4744a4b,0xf3b705bf,0xb2842cce,
  45765. 0xae304b53,0x1a3af5aa,0x1b2d31b8,0x7bbfa201,0x4bee88d9,0xc4ba6eba,
  45766. 0x565cb839,0x2d3565ce,0xdaf7ece8,0x24808696,0xe6959745,0x2c7ccce7,
  45767. 0xe94f9837,0xefd6eb3c,0x3811a326,0x0a33b4cf,0xfffa93a6,0x14203f43,
  45768. 0x73c31d90,0x031e9828 } },
  45769. /* 181 */
  45770. { { 0x765a17ff,0x4fefecfc,0xd1290a65,0xa09f3888,0x938da038,0xbf265c46,
  45771. 0xa169ad46,0x4bb6145d,0x23a62fe8,0x33cf8214,0xabc860a5,0x562df571,
  45772. 0x815c38c4,0xbf2a90fa,0x17eda875,0x45ba1d6e,0x946fa5e1,0x799d881a,
  45773. 0xb90f5a3b,0x6c1be784,0xb10ff52a,0x0910a37c,0xa4f4fd36,0xc38c1fe4,
  45774. 0x8e2d3ba0,0xc3180fc5,0xb17a6187,0x3e2ff050,0x943a35c2,0x3a00059b,
  45775. 0xa28cc51c,0x494d3645 },
  45776. { 0x4ba021f8,0x398426b6,0x796deb6c,0xd14c9083,0x7e36c762,0x6d2e5395,
  45777. 0x751cf216,0x8f556eca,0x19b24a19,0xdaca1e00,0x4b20c2ae,0x47887da4,
  45778. 0xff41a733,0x93ed4ccd,0x5c7c0cd7,0x8d717c44,0x91bf7009,0xcc48634a,
  45779. 0x3b59bbaf,0xa1f146f9,0xe5624f15,0xdd38bb39,0x303f8443,0x96d41aad,
  45780. 0x4bf104fc,0x6b670f03,0x29706582,0x0503f9ed,0xb34200f5,0x768e1f47,
  45781. 0xbbd4c6f3,0x3cfdcc5e } },
  45782. /* 182 */
  45783. { { 0xb523e13d,0x536c2a86,0x2920d0a0,0x1014a458,0xe7571296,0x3d52b478,
  45784. 0x7eb51bea,0x05746066,0x87b0e919,0x709f7861,0x686888e8,0x028aed88,
  45785. 0xd94afcd4,0x79a809d7,0xe2129af3,0x50c6032f,0x983c4082,0x75e4be72,
  45786. 0x7ab3be8e,0x98331bbb,0xb618c728,0xd31a032c,0x3f59c4a4,0x36dd85a1,
  45787. 0xed4f61e2,0xdbece345,0x1e571715,0xba7aaccd,0x64a1ebd7,0x138c58da,
  45788. 0x3d1aeea1,0x89296d0f },
  45789. { 0xcca82c97,0xb165288f,0x1427e8dc,0x26c6c12d,0x4c3edda9,0x66a94f07,
  45790. 0xeaa01ebe,0x94600e1e,0x30f5e86d,0x14abce7c,0xcb456a31,0x741d7020,
  45791. 0x279f42c2,0xab05aa13,0xd4238468,0x70b60faf,0x318d39e6,0xa18efec1,
  45792. 0x8920b318,0xeb07f1ac,0xd8399e03,0x01e3cba8,0x3c81a301,0x65f8932e,
  45793. 0xccc667d8,0xae8bca7d,0xa268607c,0xcee1ae79,0xcac0a12c,0x3182e64c,
  45794. 0x2b1a4c54,0x9233a2f7 } },
  45795. /* 183 */
  45796. { { 0x0acbee17,0x717e8df6,0x5c24fcdc,0x0f0959c2,0xe54ffcb0,0x46f09887,
  45797. 0xd285116b,0xb993deca,0xbba1fa51,0x0bfaa4f8,0xd0f2183e,0x9c9249ef,
  45798. 0x96847779,0xf93cb358,0x2322d421,0x284bfb7f,0xd42af009,0x40cc709a,
  45799. 0x9bb1d615,0xc69f2274,0x717c3c6a,0x76f50b3a,0xbb9c5eeb,0x8b21e985,
  45800. 0xa4783b5f,0x58fb19ae,0x52e1c3e7,0x04c86b9b,0xf2971ac8,0xaca59092,
  45801. 0x21ed8291,0x2bb26a69 },
  45802. { 0x15f81416,0x98a34435,0xaaff5bb4,0x086e72e7,0x0317261c,0x3d1f64de,
  45803. 0x5c0a1cfe,0x31c0786c,0xb3683401,0x542ea4d8,0x1a39b4cd,0x2f77273a,
  45804. 0xcbef27f1,0x14fe7ee1,0x16bb27dc,0xee7fc09e,0x410e5dc7,0xc0dccc17,
  45805. 0x1943b3dd,0xa3466742,0x3f31c1b7,0x92934b60,0xc22c1070,0x0186ded9,
  45806. 0x799f966b,0xa37ee8ba,0x249b0893,0x0f3bfcb4,0x2e92d4de,0xbae61447,
  45807. 0xe196eb08,0x937cb3f8 } },
  45808. /* 184 */
  45809. { { 0x16fbfdce,0x57c0e77c,0xc98d4cc0,0xea034cc9,0x42572d20,0xe7606d72,
  45810. 0x0019a83c,0x9861b55c,0xf1597162,0x80ba2803,0x05a0fd7b,0x0f4141dd,
  45811. 0x4b0daaa2,0x8865913b,0xaa3848ec,0xe6685746,0x3e0485d2,0x16d15a5a,
  45812. 0x3b6905dd,0x81c0c774,0x818af2ba,0xcec31b7d,0xd2b74b78,0x80d8f194,
  45813. 0x543e2f28,0xca659db2,0x9fb07c1c,0x31b83a7d,0x1f1048c0,0x86537fdc,
  45814. 0x78586a11,0x4d57bb07 },
  45815. { 0x53b396b6,0xbc4b768a,0x93b51dac,0xbc8b24c4,0xa30ae1b3,0x33e511eb,
  45816. 0x945147c5,0x893bbd95,0x179fe3ce,0x6cc86031,0x3f920bd4,0x34b0a167,
  45817. 0x6b256160,0xb32912eb,0x9d168d83,0xbc69a2a4,0xef0dd128,0xb4949e7a,
  45818. 0x872699e1,0x2613419a,0xbf21376b,0x06c58477,0xa4f97147,0xe55b1909,
  45819. 0x7b9b745f,0x63d6eb75,0x08df3c85,0xb5365b29,0x55fcfae3,0x0e257e43,
  45820. 0x979f2aa8,0x1067c118 } },
  45821. /* 185 */
  45822. { { 0x32bf8883,0xc8455084,0x6fd06667,0x4755286a,0x77c2335d,0xd70b0f8f,
  45823. 0x2f4a2c94,0x678e60da,0xd118acf5,0xa468d8ac,0xbf5b90d9,0xce93830b,
  45824. 0xed4e9104,0xea4b1c74,0x27776ea4,0xac67316d,0x361bab12,0xb98ad75c,
  45825. 0x99122451,0xc323d482,0x530a43ae,0x26440220,0x3292d5a5,0x3a44532e,
  45826. 0x5fecf1bc,0xdb48694b,0xc667b8b8,0xe4e0516e,0xa4306ade,0xb3aa595f,
  45827. 0xf34e9725,0x7e4f7091 },
  45828. { 0xb7f70919,0x3f3816e9,0x16b003f5,0x765216ed,0x778c99e5,0x46c6cff4,
  45829. 0x30a51810,0xe6a5abe8,0x45e728db,0xef6f49e6,0xcaccefd6,0x6fdd73ea,
  45830. 0x8c37f3f7,0xec394e6f,0xb6407fc3,0x73320802,0x96625cbd,0x988e8f7a,
  45831. 0x7cabfb00,0x83292363,0x407f359a,0x258ba9df,0xccbfae50,0xff01aee5,
  45832. 0xfe251813,0xfbeaeace,0x83f1cba1,0x9c69f161,0x9eadcdb5,0x512c58ad,
  45833. 0x6ccce8bd,0x2ae49cd4 } },
  45834. /* 186 */
  45835. { { 0xc40849f2,0x1239b0e3,0xa441098c,0x5136a4cd,0xe547f649,0x61535a99,
  45836. 0x7a9bbac6,0x92e4bdc4,0x53547af6,0x195a1646,0x8b47a74a,0x85ecb319,
  45837. 0x9de6a2b2,0x278553fc,0x0e2ba52d,0x471c038a,0x35bcba93,0x12ba1b88,
  45838. 0x6f31eca2,0xd4bf50da,0x802b32c6,0xd146e3f6,0x3c64c8c4,0x0c9c0131,
  45839. 0xeed21297,0xad30f12d,0x9c68530f,0x9b75bffb,0x8918de51,0x23c0ad3e,
  45840. 0xa73771b7,0x180e9d52 },
  45841. { 0x29ab77b0,0xc316542f,0xf7aee628,0xdd411d9c,0x353c2f40,0x044c0685,
  45842. 0x4b0ae4cf,0x638dc7e4,0x95fc266f,0xa0924185,0xfd2feb7d,0x639da671,
  45843. 0x5ea39798,0x56858ed5,0x58f3832a,0x7a694f31,0xd316d831,0xa94233c6,
  45844. 0x30a35a7b,0x2fcacb26,0xf1ff713b,0xfef8f7dd,0x59eee2f3,0x8b9b4525,
  45845. 0x156d064a,0xd1b4f91b,0x2f5cfcfc,0x177866c2,0x3777eb41,0x12bc2566,
  45846. 0xd8ab85b4,0x21ca6f3c } },
  45847. /* 187 */
  45848. { { 0xa3e66635,0x0e162b13,0x2a9f76af,0x1ef20a2b,0x46db3356,0xab473a30,
  45849. 0x7802bb8d,0x0840bd77,0xa699b44c,0x5b6baf5e,0x1b2207f1,0xc6e11900,
  45850. 0x790b0105,0xe5de16a9,0xdb67f004,0x22b12f15,0x8a025d25,0x185fad45,
  45851. 0xdf0a1142,0xbccf6953,0xf45034c0,0x4c42129b,0x1c277bff,0x0f740400,
  45852. 0x280a9e18,0x6e440b4c,0x842aa2b4,0x767de8f5,0x05e8d94f,0x3de20ab8,
  45853. 0x20227635,0x5aff5859 },
  45854. { 0xa8458e40,0x805acd20,0x149732bd,0x5a5557d8,0x5f1ca72d,0xc7074131,
  45855. 0x952b5323,0x7f2e269c,0x6494fadf,0x5c592556,0x1a7d2666,0x153b7acd,
  45856. 0x86fe2865,0xa6df063d,0x57d53b6b,0x1e91db13,0xe93ead01,0x9195bb89,
  45857. 0x2963bfe6,0x3d71e1af,0x88278886,0xfab2b9c2,0x3b859b6f,0x77836692,
  45858. 0xf7029dd1,0x6e695174,0x7b984561,0xc7987876,0x5907d849,0x64fb4f1d,
  45859. 0x88d8a977,0x3eab7e1c } },
  45860. /* 188 */
  45861. { { 0x52e5718b,0xc73a94b6,0xf4cee1e9,0xe3aefa54,0x553eedea,0x654e9e63,
  45862. 0x5f3aca1a,0xf2541e1b,0x0d083316,0xd7129489,0xfb7f950e,0x7965af63,
  45863. 0xc74e3e4a,0xd8fc9e0d,0xeaf79ebc,0xb4ee48d2,0x8b7787e6,0xa458a86a,
  45864. 0xf7cceaf0,0xd8c7621f,0xdf67980d,0x8228eeff,0xf9106727,0x210d4742,
  45865. 0xb07e3629,0x91f63501,0x7971e29d,0x441761c6,0x03a3b8a5,0xc0ccc65f,
  45866. 0x38e09544,0x3491da4f },
  45867. { 0xcb062eae,0x6706d046,0x5d08776d,0xee7db735,0x292315d2,0x80de8052,
  45868. 0xc402bbdb,0x40785662,0x26ed3337,0x5f93525c,0x7d568ed3,0x6cea14d6,
  45869. 0x66888b1e,0x916a1189,0x5dc71675,0x0fbd5205,0xe4575df2,0x833d1077,
  45870. 0xec092335,0x4e93100a,0x6cd85389,0x2f9e1d01,0x43226368,0xeebd3725,
  45871. 0x1ba4cfd7,0x401d172b,0x574c5838,0x377dab9d,0x80d517de,0xaeaa6958,
  45872. 0x6ad15a18,0x0c843dfd } },
  45873. /* 189 */
  45874. { { 0xc9373300,0x455811ff,0x99fdc300,0x1c39332a,0x353cb655,0xe19bb81c,
  45875. 0x96a83d27,0x774b924a,0xb2ee3f1a,0xcbfc8fcb,0x010d56c7,0xaf278ec4,
  45876. 0xe0abaf79,0x6fde682f,0x7339aebf,0x7566d072,0x71205db6,0xbd35ad5d,
  45877. 0x7051c9d0,0xb5bbe694,0xd3a3067c,0x577db480,0x572d7530,0x2c70ff54,
  45878. 0xe06d853d,0xe8615aec,0x05abfb5d,0x71999ccb,0xea0a8ed7,0xeeefc96b,
  45879. 0x35f6df69,0x2dcc469d },
  45880. { 0xc65f0e77,0xcca6cd06,0xbd71b14a,0xddcc7980,0x3c93cc00,0xb6221f8b,
  45881. 0xae8cbf57,0xddfcd5b3,0x76f8e63f,0xbc92973f,0x06e132b7,0xe9848a34,
  45882. 0xd51ec9e2,0x4cc59a03,0x3a33081a,0x9c9d32bb,0x80e8466b,0x00121052,
  45883. 0x1bbe7295,0xc2b0032a,0x24938448,0xdbfc6572,0xb6bba0ff,0xe972a0ce,
  45884. 0xc0a94802,0xf60c0a4f,0x599d8bc7,0xf62c41cc,0x312da0b8,0x820c96ee,
  45885. 0xcdbdf9fc,0x5a1a65db } },
  45886. /* 190 */
  45887. { { 0x42485684,0xbfba691a,0x29c470c9,0x613116b9,0xe62a0519,0xb4b01971,
  45888. 0x5ff499da,0xf3245aa6,0xa5238eff,0xc2ef87f4,0xcc9d5515,0xc16dc6ba,
  45889. 0x2dbdacac,0x5a7f227e,0xa9bbaecb,0x8dedaac4,0x2e7c9885,0xff308a6d,
  45890. 0xe6895593,0x4c6f2fc2,0x177e0611,0x3655f285,0x300b1bee,0xa63e8d06,
  45891. 0x13c17b54,0xbed0ce79,0xc4974262,0xca4abe35,0xbc4e4037,0xf4b44a17,
  45892. 0xefe5fbd9,0x5ae95099 },
  45893. { 0x804f7455,0x122e5ee7,0x22066682,0x341a4997,0x7795e333,0x97d24c31,
  45894. 0xe48efced,0x12f4123c,0x19fbc21c,0xe8738d92,0x0663a3ae,0xbb3bdc61,
  45895. 0x8593a6db,0x3603d8c2,0xe3c1ac75,0x926227f2,0x5eaae519,0xfea92ac0,
  45896. 0xfd6812ac,0x5b596f0b,0xfc2a82dc,0x3ce7e844,0x63522b27,0x3840481a,
  45897. 0x52867895,0x836088b1,0x26588688,0x21ffb7cc,0x2f4a7cac,0x0ca33161,
  45898. 0xa3edd298,0x4110667e } },
  45899. /* 191 */
  45900. { { 0xc2d04b63,0x81830357,0xf4929a18,0x3fc5a34d,0x22d195df,0xc73bf6da,
  45901. 0xcb432473,0x14df2f89,0xe997f138,0x345afe5c,0x8b9604f4,0xd8e3f5f9,
  45902. 0x50c10ae5,0xad7942e9,0xeed25ff3,0xcefd5447,0x0e73c0cc,0xbf68e51e,
  45903. 0xab54fa4c,0x5b1ad591,0x12b61c8c,0x8bbc1105,0xb5abf760,0xbb932913,
  45904. 0x01e79649,0xdb1231be,0x040ccbe7,0xd0a83e91,0x90a96db9,0x3dde426f,
  45905. 0x34df11ea,0x1cceb645 },
  45906. { 0x0c6d0f55,0x2d210c4f,0x9c673c9d,0x6cadf61b,0xa9ce3fbb,0xdd7f9919,
  45907. 0x93b063e4,0x135f494c,0x145a93be,0x580bdb3c,0x0f52ef7c,0x4d872332,
  45908. 0x8814bb6a,0x74d876e8,0xc7a97dee,0x4f6f723a,0x3e3cd833,0x7de2b8f0,
  45909. 0xae720270,0x6162f082,0xddfa486e,0xe88ec2d4,0x8d3a17c6,0xd965c859,
  45910. 0x3980171a,0x62e59e54,0xbbef6b22,0x0ab6285d,0x4d48b203,0x3cf45195,
  45911. 0x4ea25ea3,0x1f175233 } },
  45912. /* 192 */
  45913. { { 0x3467ea91,0x808a765b,0xfd2d9c45,0x3f4632ee,0x9cf2bc6f,0x7b75dc6d,
  45914. 0x359813ae,0xefc8d240,0xe44cbd8d,0x23ecb209,0x21525622,0x59ba10e3,
  45915. 0x3f1ee19a,0xfa14d934,0xfb0c48f7,0xdf97c21b,0xea30d437,0xc4e62890,
  45916. 0x651475c2,0xb286e2a4,0x126672a5,0x291f01e4,0x31aab3b8,0x9c6fda5c,
  45917. 0xe17d22ec,0xb7277a5a,0x914f0bad,0xbd88ed83,0x6a2392e1,0xd0b05d1b,
  45918. 0x65893c2b,0x4cb8af90 },
  45919. { 0xbb4b1953,0xa2b02057,0xf597f6ee,0x4ce08b44,0x5e6412c8,0x854f5d9b,
  45920. 0xb3cd4919,0x1913262d,0x6e42bb5d,0x902762e4,0xd78e7f60,0x8355c8e6,
  45921. 0x38b6c16c,0x8efaa824,0xe550f618,0xd0173790,0xe57d778e,0x118af462,
  45922. 0x715b4714,0xa16ad5e8,0x41dea4f9,0x900596c3,0x280ca610,0x2a957c32,
  45923. 0x374c65a1,0x2faee800,0x50080414,0xdb105127,0xff080fa1,0x8c1db931,
  45924. 0xd79878fc,0x486a5c25 } },
  45925. /* 193 */
  45926. { { 0x941b4f36,0x0521e213,0xf803b4f9,0xbaacfb14,0x52a54ba8,0xfdf1e22e,
  45927. 0x8fe4796c,0xacfabbba,0x58dbacb6,0xae0788db,0xc19dfa51,0xdf98d736,
  45928. 0x35a716ee,0x155c286a,0x9c86461b,0xbe7d4676,0x63a64a5e,0x50b6380f,
  45929. 0x9f609262,0x14b41914,0xa2dfc5b3,0x0919a7d0,0xcef466ac,0xc454da55,
  45930. 0x6986aaec,0x93fa4a24,0x71a49ced,0x5090b171,0xc1fa75ad,0x602f1d6c,
  45931. 0x78e4c054,0x5d269f89 },
  45932. { 0x14920419,0x3a74030c,0x90968739,0x0845d868,0xeeb70fa6,0x81b994c4,
  45933. 0xd9fc5bcb,0xabcaa06d,0xf58f8f2d,0x06539427,0xb1dc52aa,0x35c85f67,
  45934. 0x2c911baa,0x5a7d8d72,0xaec2d834,0x4041005c,0x7a8e5347,0xb5868a44,
  45935. 0x8de512c3,0x04ee180b,0x211168eb,0x4daa66e5,0x2317cd8a,0xc0bd5dab,
  45936. 0x61164df6,0xa1d4185d,0x1dbad7c9,0xacedca26,0x09b02683,0x0fe4b5ac,
  45937. 0x26d9550f,0x8ac9995a } },
  45938. /* 194 */
  45939. { { 0x2640a39d,0xb2c8dc9b,0xede0c9f9,0x21ff0b38,0xa1ecba0a,0x74f469bd,
  45940. 0x080d0417,0x8a902ccd,0xf4994604,0xe956fa32,0x9776ab15,0x348f85cf,
  45941. 0x0066f492,0xc21fc6ee,0xfeeef367,0x35b1ebfe,0x4613e5ed,0x7804581c,
  45942. 0xea6ba071,0xcbdfe8e6,0x950d73ed,0xddfcaa32,0x1da48889,0xc9747936,
  45943. 0xdbaffbd1,0xce867c8c,0x1cbaeae7,0xd267431f,0x897912c8,0x68255045,
  45944. 0xd7ea1e4d,0x0c7c1ddc },
  45945. { 0x1ce963a7,0x53aa30cc,0xc4c5fade,0x7352f64c,0x2828afbf,0x2b9aa2f8,
  45946. 0xca212107,0x64273c56,0x85a576dc,0xaadd7654,0x90b5c77c,0x6196ac3e,
  45947. 0xd1aaf39b,0x20d43e9f,0xcd05cbc4,0xfc392062,0x4c0ff2fd,0x14163872,
  45948. 0x2ae821e6,0xcf32b8d8,0x3fa7a3f0,0x5f58f943,0xf644ca92,0xaebf1d2d,
  45949. 0x1918a75f,0x0c061563,0x6b876118,0x7989b5ed,0xad412441,0xbf342445,
  45950. 0x1df633ab,0x24ffc9ae } },
  45951. /* 195 */
  45952. { { 0x93c7cb2b,0x89fcdc05,0x590053fb,0xc1243b95,0x6182343c,0x601debcf,
  45953. 0x66c18a63,0x364546ef,0xec913287,0xa5290701,0xf9788c31,0xc35b8026,
  45954. 0x92d1f7d7,0x852b862a,0x0aa79728,0x1809cb05,0xa3cb2005,0x897d467c,
  45955. 0x9ef5b946,0xf20c77c0,0xf2241984,0xc3372c42,0xf35bb206,0xda053e0d,
  45956. 0xa9c140b5,0xbc26c6d0,0xcb56fb33,0x61cfcc0c,0x299b3968,0x1c3cf9ef,
  45957. 0x40621ba4,0x89e4d3d1 },
  45958. { 0xa45a9be3,0xd35e80e7,0x07356fbd,0xc4daa578,0xb967bc2f,0x0186d62e,
  45959. 0x47cd16e3,0xa702679e,0x5f30ce9b,0xca2f1c02,0x1f864f50,0xf1205b46,
  45960. 0x85061d66,0x7fd6d797,0x8a08809e,0x47edc4f6,0x9a4d3ae2,0x5dac0449,
  45961. 0x6d1f9da8,0xf844664a,0xd7a83a71,0x9f30ce84,0xeaac33f1,0xe9382bac,
  45962. 0x948622ab,0x1f033831,0xf7681eb2,0xb037a4ba,0x99a1b5c7,0xd156a908,
  45963. 0xe6f1d0fb,0x675d3e6f } },
  45964. /* 196 */
  45965. { { 0x707193e5,0xd9767ffd,0x810358e5,0xe478aa91,0x328d8ef7,0x5634f9ff,
  45966. 0x6dbbd9a7,0x913a0ee8,0x7e215686,0x379b2968,0x89d9da38,0x903f410a,
  45967. 0x1b1334d2,0xd9f8d7b9,0xbd82efb5,0x9fe74229,0x3803c778,0xdb568b62,
  45968. 0xd3d25344,0x93e9a350,0x724497e8,0x559c35b0,0xa169e23b,0xc472d436,
  45969. 0xcc5b4c69,0x09864632,0x83c7f531,0x9f6d759d,0x1e497888,0xa91cf1db,
  45970. 0x60af1a4b,0x5f7f92fe },
  45971. { 0x0545167e,0xf18a1cc6,0xaffa88e0,0x55ee2e02,0x432a7bcf,0x24cdff51,
  45972. 0xa7510866,0x7382da42,0x40511af7,0xe894c11f,0x2aaf1423,0xaa4e4e31,
  45973. 0xf63dd2ae,0x8c3d36f0,0xd7660635,0xfc5c9550,0x37ea7eab,0x01253731,
  45974. 0x39b950f6,0x2a5cd598,0x40e63442,0x95a0f601,0xf2ac7045,0x905e238e,
  45975. 0x446b0f73,0x44bacc0e,0xc448578a,0x4cd4206e,0xa5bd7803,0x367b1aaa,
  45976. 0x0a2b458d,0x25beced9 } },
  45977. /* 197 */
  45978. { { 0x0c33a8fb,0x079a7382,0x0f25dc1d,0xcfbf6cd1,0xc6d482b6,0x4ffc73f8,
  45979. 0x07bf844a,0x3e51f18c,0x599162f0,0xa7651236,0x14013811,0xac59a74e,
  45980. 0xe55018a0,0x957a6865,0xe3ca09b1,0xe1ec51bd,0xa960253f,0xbc0c7eb3,
  45981. 0x7de03f84,0xe83bfd14,0x52fbdb09,0xc0540ed1,0xcea15ec1,0x6ba52edd,
  45982. 0x4b261307,0xf3d30ed5,0xe8397206,0x9bd7bae8,0x096373aa,0xf20d8692,
  45983. 0xc3b0bf63,0x0a616a4b },
  45984. { 0x6e1339c9,0x2075f3ed,0xbf8b00a6,0x7afaa072,0xbccd9b47,0xdfafec82,
  45985. 0x00ca54c7,0x4713158f,0x38bc31ae,0x449102f1,0x310dfc8a,0xaf98f158,
  45986. 0x59e954d4,0xc9ef2075,0xc527a0c4,0xe8021af9,0x7a192023,0x6e801277,
  45987. 0x7fb02377,0x635f538c,0xe8c9e951,0x5df1974f,0x15cc9097,0x0287faed,
  45988. 0xf7a5115c,0xfa0728f0,0x0fac623d,0x90dbfbe6,0x0311ba09,0xa8d40fd4,
  45989. 0x07c6464c,0x876d154e } },
  45990. /* 198 */
  45991. { { 0xc2d3ea8a,0xd3a4d6d2,0xa842600e,0x36be681b,0xe4070672,0xc53f100d,
  45992. 0x6a7d7a7b,0xe3e5b6fe,0x5d5e1a83,0x6e6994f9,0x76097c2a,0x07cacd22,
  45993. 0xa6791011,0x12d98dba,0x102e0e24,0xddfc4461,0xd493272a,0x4815dbc2,
  45994. 0xa9436696,0x7e38e64b,0x32b2bf90,0x4960eb1a,0xd928e28b,0xda457525,
  45995. 0x2a077c9e,0x72f75b39,0x7fd61d00,0x27760cbb,0x0f4b1456,0xaf235d1b,
  45996. 0xe76d1700,0x3040c23b },
  45997. { 0x4efa9a70,0xb10dc55b,0x53e86610,0xd4de414f,0x09f8a27f,0x3d95c113,
  45998. 0x06661d3c,0x505109a5,0x60eb513e,0xcaa2994a,0x1e7d338b,0x3ee41537,
  45999. 0x4651e71f,0x4fd145fc,0xcbc313b4,0x51bbf838,0x1eb92150,0xb039e078,
  46000. 0x14bf5ac7,0xe8696b44,0x8be0d48c,0x2d667188,0xdd8f2b6f,0xbe93b2f5,
  46001. 0xeb8a7f8a,0xc1dfd1e7,0x90f751c5,0x862b3dd9,0xa32a74be,0x1eb1ad58,
  46002. 0x1ebbc9a2,0x5486d79a } },
  46003. /* 199 */
  46004. { { 0xa1359e13,0xcb2e34ff,0x28196051,0x202d8dbf,0x23564b5e,0xe95e023d,
  46005. 0x42f6ac12,0xfb1340b6,0xb653725d,0x543ba852,0x8d2466ad,0x81aedcd6,
  46006. 0x547c728b,0xbf780224,0x9569fb65,0x559f8a11,0xdfb22ec9,0x505b7a62,
  46007. 0x9eed5e52,0x07107540,0x299f6f11,0x9c899288,0x3db6f8c7,0xa7d69261,
  46008. 0xb3ca79a9,0x30eb7fb3,0xfb2160b0,0xcab99bb8,0xd28b409a,0xd2012568,
  46009. 0x5ac45f8b,0x380f1b0f },
  46010. { 0xe6a0068f,0xc0b99e6b,0xc8a73753,0x4b67cf2a,0xb2faeb7c,0xa6c9a548,
  46011. 0x340260c3,0x7f417f99,0xcc0f739e,0x8ee56855,0x780949da,0xf08b510f,
  46012. 0x8d5c6eff,0xb1770fc2,0xfd96a7bb,0xb4f5abee,0xf2665a2a,0xa07b1136,
  46013. 0xb601dcf9,0x2fb380a4,0x162becc6,0xcc803614,0xee6b83b3,0x3498fb96,
  46014. 0xa8c17eeb,0xea9b0fd6,0xa177efc2,0x5834b5ba,0x5b110b3e,0x929044f5,
  46015. 0xebd7285e,0x4abedded } },
  46016. /* 200 */
  46017. { { 0x700ef376,0x3355e1b9,0x66cdabff,0xd56e5d9a,0x47e87646,0xb3dc2575,
  46018. 0x00f79369,0x28f44b8a,0xa0c52e29,0x08c32b1e,0x3729b392,0x5a78de12,
  46019. 0xb26d239d,0x4184519a,0xe0ce4a6b,0x23f6b4b7,0xacb2a9f9,0x235f6f8a,
  46020. 0xe2064a59,0xbb8bc454,0x1bf3062e,0x37efd034,0x94dff6f9,0x6bac683b,
  46021. 0x8aa7fa06,0xc3364b1e,0xce0b3745,0x0616772a,0xd1e3fb0f,0x46f08d08,
  46022. 0x18e132d3,0x6a20abb3 },
  46023. { 0x6a85cbc7,0xea831016,0x934f9aa7,0xd0990946,0xe778f1b3,0xc2211088,
  46024. 0x2247b799,0x7ea4ff8f,0x454484ce,0xb3171d71,0x4f98c364,0x29403949,
  46025. 0x97df1458,0x5da911f3,0x09439116,0xa6b58093,0x174238bc,0x75f9509a,
  46026. 0x8209758d,0xfeb51821,0xa47925d0,0xae0c6021,0xaf8a315e,0x0e946694,
  46027. 0x6bad04b7,0xae7af8a3,0xf072447d,0x44c15e7f,0xa5456ffe,0x5184668a,
  46028. 0xbf36b977,0x45e353a7 } },
  46029. /* 201 */
  46030. { { 0x93092f71,0x76056764,0xf5b92d71,0xeb66b6c2,0xe2c8b6c5,0x9db3149b,
  46031. 0x20c0363e,0xf62f583a,0x03cd7097,0x688acd33,0xebb916ac,0x85d0c0f8,
  46032. 0x84c19b0e,0x1bf7462c,0x7c4a6ad1,0xc76ed5f9,0xd119f369,0xec8b88ba,
  46033. 0xebe50b83,0x59b8371b,0x866706a6,0x0cc69508,0xf8373d2c,0x531c75a3,
  46034. 0x2a5a02fb,0x4e1cd3a3,0xda39a1d0,0xe8274778,0x75da333e,0xedfc5bbb,
  46035. 0xca79bd36,0x15941f24 },
  46036. { 0xa77dd512,0x42e8c0f8,0x1dc365f6,0xa91b59a7,0x08753862,0xe80d14cd,
  46037. 0xd272faca,0x1624230d,0x4027cb5a,0xeea3ec16,0xc1ef9f03,0xc1700b59,
  46038. 0x0da3148d,0xd411c127,0xc4181af1,0x801ee448,0x9e3a900b,0xedf28559,
  46039. 0x0d09affd,0x5d67b0bd,0x8b370024,0xd839df96,0xe6f836b8,0x3b6307e0,
  46040. 0xbd3201c9,0x5382e588,0x7a1d02bb,0x636d8a6b,0x968641e9,0x70b7db76,
  46041. 0x118fad03,0x6d17c34a } },
  46042. /* 202 */
  46043. { { 0xc181c99b,0xcf608841,0xc87bdcaf,0xb65dc901,0x3720dabe,0xb460b447,
  46044. 0x5377515b,0x4c79c396,0x0a96c277,0xd447f22e,0x2ac0f440,0x0d952130,
  46045. 0xc90583ad,0x8330b26b,0x928904a0,0xe25e977a,0x85c50b18,0x1deaffd9,
  46046. 0xa5ad5f6a,0xcf4dbcb7,0xc8a37ed5,0xcbcd0019,0x1e9850b6,0x7846dd90,
  46047. 0xb0b8e605,0x1ac8194a,0x34132f90,0xb9728571,0xf56ee28b,0x4ce9f149,
  46048. 0x3e9e1d4e,0x1ab9b5a4 },
  46049. { 0x314fa7a3,0x206dab92,0x478ff963,0xcc4af0f0,0x904d9fdb,0x4cce1713,
  46050. 0x12c045fe,0xac20a2eb,0xfd8f6d7d,0x44fc5478,0xca7b6ffa,0x886e72c5,
  46051. 0x6fd6f758,0x7fa4529b,0x92a820d5,0x4df1d1b1,0x2789f149,0x3d812f9f,
  46052. 0xaabb53d2,0x9842f083,0x2a03ab32,0x2648539b,0xb1512502,0x631ce090,
  46053. 0x731f6bd5,0xe1294d15,0x9436e634,0xb229361d,0x3ca966af,0x8c4281c4,
  46054. 0xc21ab3ed,0x24b34956 } },
  46055. /* 203 */
  46056. { { 0x659824e2,0x49bdcb86,0x4e13e74c,0x6dc4ce48,0x6bbe1eea,0xa4c01a26,
  46057. 0x1e3ec457,0x47b2b8e7,0x2f5a8e4b,0x7e8b15e0,0xe333530d,0xe81eb6e6,
  46058. 0x17a45202,0xacba369e,0xd70e4c9f,0x81241431,0x3e12beb8,0xc190af4b,
  46059. 0x11f486fd,0x53270523,0x29fb2bce,0x9f6c41e1,0xb70f6c08,0xbe6287eb,
  46060. 0x3feb4477,0x1479850a,0x9bcf18bb,0xfcfdfb11,0xda80d040,0x925c292f,
  46061. 0x7e3c5bf9,0x212d65e5 },
  46062. { 0xca15cf08,0x23adb386,0x81e172eb,0x4dfa4ac4,0x4d42d0c0,0x9d1dbf93,
  46063. 0x74404dc7,0xd9cf6073,0xe932bfcd,0x60508441,0x1c682a98,0x9ae910ca,
  46064. 0x41ac1cc0,0x9528fc18,0xdbbed630,0xe6a120ae,0x30ccf250,0x94e0e1ec,
  46065. 0xe58bbf2f,0xfe84ba54,0x9faa4415,0xc66d0b4f,0xecee7ce5,0x0c58f1e7,
  46066. 0x6fa6873a,0x7a1d43eb,0x399f1348,0x96c6c5a0,0xe6727ab7,0xe6ef9aaa,
  46067. 0x9a5c2447,0x66afa554 } },
  46068. /* 204 */
  46069. { { 0xc980e91d,0xda5aaba8,0x6ac98efa,0xa93cf509,0x8da32662,0xb0990e0a,
  46070. 0x0081453e,0x01d21530,0x3d71de84,0x2bb0d33e,0x3e19a012,0x465f6d80,
  46071. 0x78a838e7,0x5902ff4c,0x1931348c,0x74e2afb7,0x9cfb057b,0xa4932757,
  46072. 0x3ad03f8f,0x761ea642,0x58ffa40a,0xb7d4c245,0x77a87e30,0xb5e9c0d9,
  46073. 0xc9c84d26,0xd1c5edba,0x3d1963a0,0xeca8839a,0xebf6bf0d,0xbc6f2f35,
  46074. 0x0d58abdf,0x01ef0631 },
  46075. { 0x3ecdcbb0,0x2bf90316,0x27c1c955,0x19e2d728,0x9575c930,0x9e527030,
  46076. 0x96983930,0x0dc1c5a9,0x7cd082df,0xef9f80ff,0xdf97e051,0xcd915075,
  46077. 0x9cc61b55,0xf286fffe,0x80f24cc4,0x352db38f,0x36523ae3,0xed9b99ec,
  46078. 0x10b104a9,0x109a8ca8,0x305203ad,0xc2700fe7,0x769400f5,0x2a2ee24e,
  46079. 0xee0c452c,0xd595d399,0xf7f02a41,0x0ab75d6a,0x0db730b7,0x34108099,
  46080. 0x5e8d1202,0x0e4f5ffd } },
  46081. /* 205 */
  46082. { { 0x0ff14c38,0xbd1c6444,0xaece11f2,0x9a5b59fa,0x22af6330,0xaa4605a7,
  46083. 0x82af24ee,0xddc9f65a,0xeb9a1159,0xf4ee4bfe,0x74e84eaf,0x2463d076,
  46084. 0x0e0baace,0x88cbe1e0,0xd5fabdcb,0x7ca568ea,0xc57eb99d,0xbd80d524,
  46085. 0xe9be9873,0x9c46572c,0x7300b85e,0x918a1dcd,0x40f54176,0x49221312,
  46086. 0xb5b14236,0xf7e324ff,0x2434f16a,0x40dda501,0xa133d97c,0x08833421,
  46087. 0x0876f020,0x33d41161 },
  46088. { 0x9878e5ec,0x7531a36b,0x46918232,0x5de3e321,0xd0a30464,0xd15f9a33,
  46089. 0xaa173659,0x734c1b87,0xf925d4fe,0xac2094a2,0xc262b0f4,0x43c965a1,
  46090. 0x447d5cbc,0x759c903e,0x05239300,0x92af215e,0x1f593f34,0xfffb6d5f,
  46091. 0xc3cddb5f,0x65943b4b,0xbfdd5408,0x9d03a29c,0x198d76c0,0x8f7cda6b,
  46092. 0xc0f27b59,0xc0790a22,0x8cb58ccf,0xba557a84,0x76c54fdc,0x5922052d,
  46093. 0x47b6b466,0x2d3de7aa } },
  46094. /* 206 */
  46095. { { 0x65add3b7,0xaade7462,0xabf24c2a,0xe5888f35,0xe1a57d93,0xd41549ca,
  46096. 0x2c76f7bf,0x0e22e18e,0xbe3202b3,0x67f288ea,0x1d1d0f0a,0xb79a66ba,
  46097. 0x2881ad18,0x0e0ab749,0xc7adb0e9,0x7d424086,0x2842132f,0x870c32c5,
  46098. 0x58f9a09e,0x858477f1,0xec025589,0x422a9372,0xa5098777,0xbe428c5c,
  46099. 0x57660058,0x45b79564,0x957f37cf,0x6c7fc631,0xd6316289,0x8b7023dd,
  46100. 0x5b1c12a6,0x47003bb6 },
  46101. { 0xc91c1c96,0xd99401c1,0x27a12970,0xaa5dcdf9,0xc3c29107,0x3ab92e17,
  46102. 0xa3fe4710,0x26fce8f7,0x4ee998ee,0xb0d09d5e,0x8e3a41f8,0xafa62204,
  46103. 0xa26ca506,0xb1c012a5,0x99b57252,0x2c6f734c,0x512f7fe1,0x1093d79f,
  46104. 0xacee19a6,0x2f30906e,0x056d1ea6,0x6bff8381,0xeff35f21,0x61c75856,
  46105. 0xc1ad2224,0x6e07e978,0x6b20fde8,0x2cca6ca1,0x633fe81b,0xab4d6d2d,
  46106. 0xb06a2ce6,0x73dff504 } },
  46107. /* 207 */
  46108. { { 0xd8e20fb8,0x8b615805,0x82b533f0,0x7c6873e4,0x56a854ca,0x5205f001,
  46109. 0xcb369211,0x87fec6ac,0xc7f092b7,0x1fa3c0ec,0xe845fe4c,0x5b36647e,
  46110. 0xf8b1f112,0xd4781e85,0x8b0f1a6f,0xc6526839,0xdcb8eb92,0xceeb8c6c,
  46111. 0x8e5f6d52,0x133f0ead,0xc8d934dc,0x31883e23,0x428ac45a,0x214ed5bd,
  46112. 0xdbbfca85,0xf77ca492,0x07e5ae13,0xdf4113fe,0x72ab05fb,0x63e4a0d2,
  46113. 0x7148f535,0x7544d0b7 },
  46114. { 0x80797ace,0x4fe8d134,0xaf86d97e,0x216d6aa0,0xef5a68fc,0xdbf0a688,
  46115. 0x9f9b2684,0x18b26f45,0x8999d2fc,0x52fefcfa,0x62423955,0xd5af8d82,
  46116. 0xf63a3780,0x8f123469,0xdcd4feaf,0x2933454f,0xa73b5d09,0xba8018b7,
  46117. 0xe5552c18,0x9af1f276,0xff26bb1c,0xc5d4773d,0x06dd4f44,0x9ef49410,
  46118. 0x5f39ba49,0xad8f12f9,0xf66ca4f2,0x5767f6dc,0x7922f59a,0xba8773f1,
  46119. 0xc1e42d49,0x220081ea } },
  46120. /* 208 */
  46121. { { 0xba37a0ba,0x3043d573,0xdd176df6,0x05a431bc,0xc42070f7,0x03322cfc,
  46122. 0x67c2d109,0x5cabd30e,0xcbf8bcfa,0x362c95de,0x7787b10b,0xd767d277,
  46123. 0x6ec05e64,0x612c915e,0xce69c30e,0x9e669631,0x682e2635,0x27c9dd8f,
  46124. 0x95ffcc38,0x79021f12,0x8a2adca2,0x06a8ee79,0x4b5d500a,0x8e00e784,
  46125. 0x8d80d6c5,0x87746fc7,0x915f10cc,0x246053be,0x219f6fd8,0x844e328b,
  46126. 0x11bd3733,0x620541ac },
  46127. { 0x509e5a29,0x0f7fd382,0xb432531e,0x8748d7d0,0xcd3883b9,0x8f749354,
  46128. 0x8bfbb17a,0xc6b8ac74,0x05f2d2c5,0xa4616a66,0x1bcb1b83,0xb3d96625,
  46129. 0x2fee265a,0xcf753104,0xdb225058,0xc70d73fb,0xf0c2d556,0x1211d434,
  46130. 0x54b259b3,0x862061d8,0xc42b3f7d,0xffe4606d,0xe86a4949,0x4c5c8585,
  46131. 0x160eedac,0x04ddcc8b,0x568e2420,0x1804ce67,0x42141656,0x91f3855a,
  46132. 0xf932be97,0x7f378198 } },
  46133. /* 209 */
  46134. { { 0xdfa6639a,0x9a374bda,0x02ab7391,0x0cbd48d4,0x47031e2d,0x5c5ef236,
  46135. 0xd0599d1f,0xb49ee2bc,0xe0d38443,0xd285eb60,0x269392e8,0xdbbea92f,
  46136. 0xb8bc538f,0x91455fbf,0xe469b768,0xae259ff1,0x41de5682,0xc1cecb1f,
  46137. 0x9952d1ae,0xc876f071,0xe7bf7446,0x1ce25181,0x282ad2f1,0xcb93ad86,
  46138. 0x6ba4ef67,0x8fa3cd31,0xe507aa3e,0xfce68a04,0xa61bb608,0xced74170,
  46139. 0xf6ac10d0,0x6de716b3 },
  46140. { 0x172d6dc5,0xd4e58d04,0x6397c65c,0xbed2cde6,0x0c9eb4e8,0x7ae77e18,
  46141. 0x75fa2edb,0x56275468,0xa91e6738,0x4b30324e,0x235c8b2e,0x6023a856,
  46142. 0xa8f92887,0x9df6d6c2,0xf6f5e8b5,0xec2c185f,0x3ad5748a,0x7892e12b,
  46143. 0xd54aefbc,0x7aebb4f2,0xee868821,0x14915448,0xb1d9bd5b,0xa26c5f71,
  46144. 0x2ff00df7,0xe5ccd166,0xb95b1dee,0xebc99f17,0x3fe1f774,0x90983616,
  46145. 0xbb3d25b0,0x51f90830 } },
  46146. /* 210 */
  46147. { { 0xf2922461,0x49376fa1,0x1650d0d1,0xdbb1b1c3,0x0dd8608d,0x92b91c33,
  46148. 0x36b89906,0x3e612c4b,0xdf560052,0xe1977b0b,0x636a2545,0xf8afff70,
  46149. 0x11723d8e,0xcda7d278,0x81bde7ba,0x0b0bc4bb,0xed2a578e,0x3cb080b2,
  46150. 0x171b2e02,0x5bda0d0d,0x941bb9ae,0xf6df38cf,0xc14a65c5,0x85dd81db,
  46151. 0xc19dd98e,0x7f98c82d,0x52206f93,0xc613747f,0x5f5bbe78,0x9e13a2c2,
  46152. 0x0aa34be7,0x5eed218e },
  46153. { 0x01d4dc0b,0xe1565754,0xf566bb07,0xa1ae5f27,0xb82225d5,0xe985ebeb,
  46154. 0x1189ec6b,0x5f3ad21c,0xecce4d9d,0x17da518c,0xd6b65b59,0xc84a2d3e,
  46155. 0x8ffa771c,0x7f988175,0x2ac69a7a,0x50d6ae12,0xc6e6846d,0xcb7f30b1,
  46156. 0x5bd0bb13,0x8c023a60,0xd73f2407,0x9a10fecd,0xe5f0a996,0x8c5158cc,
  46157. 0xbd8f5806,0xd26bf615,0x915a46e1,0xaf32ea87,0x0287d308,0xeaf74e81,
  46158. 0xa6264254,0x8c14ba06 } },
  46159. /* 211 */
  46160. { { 0xb17ee201,0x0c877895,0x88e57a77,0xc05aa471,0x97822456,0x19c3e763,
  46161. 0xc9c3ba1d,0x0be6f8c0,0xb4389ebe,0xfe85f4ff,0x0ce7fbb6,0x538bccce,
  46162. 0x65266c64,0x876eab2a,0xcf9a3842,0x5c9ac690,0xccc8f981,0x9f5cf3b1,
  46163. 0x9cf687de,0xfa17be6a,0x83835c15,0xfcfc10fc,0x150ef2eb,0x086b0fdb,
  46164. 0x884a52e6,0x9f97ecd9,0xb0cd1eb8,0x416e6fa2,0x3ecc03ba,0xe2bd1599,
  46165. 0xeabb165e,0x645c0a5d },
  46166. { 0x50aa7e31,0xd94c4205,0x2f851da5,0xaec8df0c,0x3c726e6a,0x99646909,
  46167. 0x2619bf9a,0x72dbdc36,0xe253fbd5,0x1b4260e0,0x8c709e06,0x97c259fb,
  46168. 0xcddaec5b,0xfabf7cbb,0xe4b703e9,0xb4d5e8b1,0x0734efdd,0x1b06e56e,
  46169. 0x1f55f8a5,0x02d4a4f9,0x3f565c8d,0x7f8608ba,0x816d1d94,0x822f47d2,
  46170. 0x5ce7b136,0x0cc36156,0x31d04242,0xe46ee5ef,0x683567f6,0xb2a65f70,
  46171. 0xd2fa6c91,0x27e9ff40 } },
  46172. /* 212 */
  46173. { { 0xd7e952e7,0x75251893,0xc735bf18,0x15b30583,0x96fe0491,0x732b5992,
  46174. 0x806d2fca,0x27451858,0x1b885ed9,0x71ab76a0,0x6d9f55ec,0xbdce9d97,
  46175. 0x48f2ba9c,0x3da60b20,0x592b132b,0x6977c086,0x099051d7,0xb6dca9cb,
  46176. 0xd188ae25,0xd9c2ab23,0xe20aaf3d,0x9f469f3f,0x5aad74d0,0xdbd1f7cf,
  46177. 0x22a9eb3b,0x3d5efe5c,0x137010c4,0x8c5edfa2,0x57870260,0xada2217b,
  46178. 0x3dac9776,0x4feee567 },
  46179. { 0xb5d3d780,0x30e18d52,0x07166744,0x4dadb5d3,0x5a742156,0x320d386e,
  46180. 0x8d6bbb86,0x5d8c290e,0x2d263dd1,0x981a4323,0x98984636,0x33d0e7ca,
  46181. 0xa519acb1,0x5138784d,0xdddc81ff,0x832e3fab,0x3199a43a,0xfc278594,
  46182. 0x32743163,0x5b4cabcf,0x74f94fa7,0x9fa010bd,0x5694a627,0xc28a743d,
  46183. 0xcb657a24,0xc1d2a888,0xe86a25ea,0x7eef2503,0x04c561ff,0xed11a5d3,
  46184. 0x9c9ede0e,0x4fe818e7 } },
  46185. /* 213 */
  46186. { { 0x7fc1c7ff,0x00252c9d,0x9fa89ad1,0xa9bd419d,0x4064e9cc,0xc93a124a,
  46187. 0x43942ecc,0x384cbcb8,0x8749695b,0x004c21fd,0x421165bf,0x69c81d9f,
  46188. 0xdde01102,0xe2325628,0x5a9b004d,0xec937457,0xf6dcfc21,0xfb3346bf,
  46189. 0x4d372c7d,0xac4da64b,0xf20494e2,0xcecb7ad3,0xe867c150,0x562c41b5,
  46190. 0xc2b723d8,0x299395ce,0x7ee53231,0xc91adfc5,0xf10b6597,0xe06f1161,
  46191. 0xb74d3ffc,0x81915529 },
  46192. { 0x6ed9d4ee,0x8ec12431,0x689aff01,0x3dffa154,0x2a89a3f4,0x4aba349f,
  46193. 0xd467efb2,0x2db1e8e2,0x039102e2,0x18dea354,0xe52f082b,0x422ab853,
  46194. 0xed36dd47,0x7130a2c1,0x0295d1ee,0xca60e86d,0x7c7f5ad3,0xe6ac6808,
  46195. 0xde864658,0x0f83cecf,0x461d1265,0x72e66c21,0xbd385099,0xfeef4150,
  46196. 0xa6632289,0x0f183f3a,0x792dc795,0x275454be,0x11367702,0x2744c11b,
  46197. 0xe8ea6ef3,0x7d06bcc7 } },
  46198. /* 214 */
  46199. { { 0x7090212f,0x89285942,0x5521e844,0x691b7d4c,0xbe2dbb92,0x4c038422,
  46200. 0xbd81f880,0x317721ed,0xac89bc36,0xc136cbee,0x7b8f004d,0x4f71b60b,
  46201. 0x4e218ab8,0x269132d0,0xe6cc814d,0xb0e2496e,0x75fadc15,0x0b2ce317,
  46202. 0x66d223c5,0x82e3c084,0x4c612f8b,0x9721caa6,0xa4b65355,0x59a751eb,
  46203. 0xc7d3d9d1,0x3433aad5,0xe80d4246,0x1e61b9d2,0xfc673caa,0x149f655f,
  46204. 0xd0f9cb92,0x48b52b99 },
  46205. { 0xefdc05be,0xa3915399,0x13e095e9,0xde70db18,0xcddb3fda,0x447862e9,
  46206. 0x1a009451,0xa2b03162,0x23920ea3,0x4b27980c,0xa23b8feb,0xac5394f1,
  46207. 0x3e5616d4,0x163f7256,0xb714219a,0xaa0ff93f,0x93d62474,0xd26f96d2,
  46208. 0x7dcfe276,0xdd212ea8,0x47038d15,0xab27bf2f,0xf418168e,0xe58c8325,
  46209. 0xb32a989a,0xe3704222,0xbfc9f13b,0xa3694390,0x0d0684ad,0xf16e2606,
  46210. 0x9d8c76ec,0x17c0de87 } },
  46211. /* 215 */
  46212. { { 0xdcc01958,0xbca5f453,0x1ce88393,0x7d945954,0x561f5b6d,0x5e6350a1,
  46213. 0x7e2d36bc,0x291c3c86,0xa5ac3a6c,0xf6c7ed84,0xd98006cd,0x7913c40b,
  46214. 0x5671ec3b,0xf78bb087,0xb43e89a9,0x1c928f6e,0xae1ea1ed,0xfdf28df3,
  46215. 0xb924b2b5,0x62bba5b1,0x1a116e05,0x491d2705,0x167ed3e3,0x08ec02b7,
  46216. 0x5bc0b046,0xe291cf7b,0x8c5d7f59,0x30e50169,0xf5c799b7,0x0c7c350d,
  46217. 0x0ac6e1d7,0x6862b9e2 },
  46218. { 0x9ffa1f64,0x56c6f4e7,0xa1e24349,0xfed6a91a,0xcdb75232,0xe9a0ee0c,
  46219. 0x0322d607,0xbfc90b37,0x462fef87,0x29480ad2,0xc2bfcf34,0xfc214969,
  46220. 0xa539e38f,0x6e5211e0,0x12a5149c,0x2a59ec26,0xd706b532,0x195fe212,
  46221. 0xe99c8429,0xf77fb108,0x5dc80482,0x74ceaea3,0xbd92d298,0xa5a6030b,
  46222. 0xaaea15ee,0xad42dca5,0x4987109c,0xd6ac3bc7,0x290af649,0xc64e1c40,
  46223. 0x51f8de6c,0x5093fa2d } },
  46224. /* 216 */
  46225. { { 0x4c2d553b,0xc4cf3280,0x3b966c29,0xdc1abe22,0x2296914a,0x556a549c,
  46226. 0x999976c9,0xd8c9f8b5,0x776e83f3,0xc22c57bd,0x7c85ec57,0x4f2942ab,
  46227. 0x6e2c61f5,0xef3407e5,0xf213db48,0xf005e8ca,0xf32698c7,0x470c853d,
  46228. 0xcac0a54b,0xe6f488d7,0x60b7501e,0xb6bd6bed,0x714a4bd9,0xf0103106,
  46229. 0x6e098894,0x5285bc3b,0xf5f92a00,0xec06741a,0xef7ef24a,0x32f16426,
  46230. 0x6c77a438,0x12f9c44d },
  46231. { 0x83313a1c,0x1951e964,0x33c58b37,0x98edd3da,0xc7ac4044,0x4edbbf52,
  46232. 0x0dcb5ee8,0x866ca6f7,0x6dd422f8,0xec0ae8f5,0x0661ec2e,0x1077bc54,
  46233. 0xd422523c,0x6d39913a,0x58e7cb3e,0xd105e1e8,0xc979bb45,0x47c9397f,
  46234. 0x0997b592,0x3221d4a9,0xe8952fe7,0x0ef628a3,0x4e946241,0xd08d5827,
  46235. 0x59780f40,0x64cbed0f,0x08e110ec,0x13d7c227,0x7679b1a3,0xd186d866,
  46236. 0x26ae1d18,0x02f75e4e } },
  46237. /* 217 */
  46238. { { 0x47f307d7,0x1b637ebf,0xd0141477,0x6b644a6a,0x2e05a80c,0x82a33d65,
  46239. 0xfed07b31,0xc8f1a0f3,0x3696e597,0xc09ee7f9,0xc7ffc01e,0xcdaa7ec3,
  46240. 0xf8f373b9,0x549f88fe,0xc3bb8989,0xc88d1961,0xdfcaa7b7,0xd92a4fe9,
  46241. 0x3ae4ab20,0x12ff9ee2,0xf5ecb1a5,0xf5aea641,0xe32fb47d,0xe769237f,
  46242. 0x25d085c0,0x96a5c420,0x26c755a2,0xdc912558,0x9bce9723,0x580b985f,
  46243. 0x63961941,0x72b1b566 },
  46244. { 0x790e5558,0x9d708a08,0x0689af80,0x98536041,0x42313b5f,0xe85e7b8a,
  46245. 0x55a49d1a,0xe6ba1292,0xac371b0b,0x5e76c4b0,0x938e6e19,0x58504f39,
  46246. 0x60ae9a21,0x8dd41422,0x968485ce,0xd8b04e9b,0x887efe43,0xf94c4ba5,
  46247. 0xf11c5e73,0x11268e67,0xcf6b99c4,0x92623e28,0x7a0a9662,0xf2d0aaa8,
  46248. 0x4ca02ed3,0xb266772a,0x2d63b551,0x68ee8e4e,0x2e78b5b5,0xcdebb299,
  46249. 0xe17225ad,0x5df19216 } },
  46250. /* 218 */
  46251. { { 0x8df2e7e3,0x20027e1e,0xd8da07de,0xb183cc68,0x4b4ae694,0xce35ba69,
  46252. 0x3ca62e88,0x896d97df,0x52efed2c,0x3de4713b,0x26bd084f,0xd006c40e,
  46253. 0xfc81923b,0x1e9b71bb,0x1aacc6b0,0x9991c7b6,0x8f656840,0x650c9364,
  46254. 0x87f47524,0x138561d1,0xbffd3ca2,0x610f2b11,0xfa191418,0x96915faf,
  46255. 0x955e5309,0x8f1236de,0xa1872d79,0x613cbeea,0x66a2a48b,0x7f7b44ea,
  46256. 0xe0a89c32,0x452265c2 },
  46257. { 0x25430010,0x4ad5ec79,0xebd090c0,0xcac786ff,0x20a9d3f5,0xa5f9f4ff,
  46258. 0xa3edc65f,0xfcbf4112,0x0cf3eb11,0x8824839c,0x8aa5b700,0xb8dd6d4e,
  46259. 0xb7568ab8,0xe2271dfd,0xb744560e,0xe43ec373,0x1cf75296,0x78eaf926,
  46260. 0x3fa96d9b,0x1809ae0e,0xdc25dfd5,0x0b312d2d,0x6bab7711,0x6b8f78b4,
  46261. 0xb5ecf1e4,0x069efc8d,0x609fecaa,0xc1952bae,0x5f4dbde1,0x43e302ed,
  46262. 0x1e078555,0x14b02bf9 } },
  46263. /* 219 */
  46264. { { 0xb87e5b57,0x2c71c768,0xf531a557,0x0bcc78f7,0xf7597dc8,0x4ff93f8b,
  46265. 0x139e175f,0xb28e026d,0xcb94ca6c,0x6b83b727,0x0079f7fc,0x2eafe3b2,
  46266. 0xcf3bd170,0x2aca54de,0x6af0dc6c,0x17c4133c,0xccf5e35e,0xbea1e665,
  46267. 0x345505c6,0xa6691a48,0xe6100b89,0x2633abd0,0xc17d0388,0x966c6706,
  46268. 0x1a0cf90c,0x7aefffbe,0xd0add64c,0x4d847be7,0xaea2aa46,0xd49bcdfb,
  46269. 0x2cc7d0a5,0x85e07e74 },
  46270. { 0x0bc25bca,0x23aae0a6,0xe44f64ec,0x6e8e55f1,0xb607b773,0xe1e696d8,
  46271. 0xd3005909,0xaa90a746,0x2cbc4990,0x072b1ccd,0xc68e2f5d,0x0d0fe6c6,
  46272. 0x53e28ec9,0x920ec5f0,0xf0040cc1,0x79b21fb4,0xfcc4a2c7,0xa7375bd3,
  46273. 0xe1bac7dd,0xf5f5def9,0x35c0f8d3,0xdc315d79,0x2cacd318,0x7117c170,
  46274. 0xe926f71c,0x6f2823c4,0xed02f39a,0x38db58bb,0x7db69323,0xe5b49231,
  46275. 0x8d49f430,0x0964039f } },
  46276. /* 220 */
  46277. { { 0x56999eba,0x21774f16,0xb1de6305,0x3d8ee287,0xde0b2669,0xd81af726,
  46278. 0x3f8942a1,0x37446939,0xea03e13c,0xbcf6b615,0x94e273cf,0xd30c0c35,
  46279. 0xc6725c56,0x4fd33a56,0xa8be97a2,0xa57534ad,0x7c22a251,0x799242a6,
  46280. 0x9d0c5c49,0x4e51bdb5,0xc6a42768,0xd7cd76cc,0xd426bf59,0x914097ac,
  46281. 0x66e9beb2,0x59404a2c,0x5c96e3e9,0x4738fe98,0xaad666d0,0xbcbb3e0e,
  46282. 0x63bc5e56,0x626b0fd2 },
  46283. { 0xe1a1ec42,0x47217dba,0xab5acc50,0xaa6ae7db,0x865331d1,0xb7e1ab1e,
  46284. 0x3d30126f,0xb8453070,0xdee61851,0x280649e0,0xea689544,0x8806f4a3,
  46285. 0xcb56f632,0x4bbe43ad,0xbcaff94f,0x036b9bda,0xbd0637be,0x0d941e65,
  46286. 0x686f3abb,0x82179d44,0xaad6afd6,0x1486912c,0xff7e1534,0x9a3b891e,
  46287. 0xeb86fd96,0x88c426ce,0x117928c3,0xb56e6a81,0x96399e00,0x933e7135,
  46288. 0xa17b6ac1,0x09bbddd9 } },
  46289. /* 221 */
  46290. { { 0xe4fd3673,0x75e39c1d,0xa65c8e07,0xf880d9d1,0x7289c7fe,0x4725c1dc,
  46291. 0x3529d200,0x5b6735ee,0x3c747af3,0xc1f8f2ed,0x912efdf5,0x5cf3998f,
  46292. 0x49859c39,0xed722618,0x0e69795d,0x23793a2f,0x86b1d2a7,0x8a6ab8d6,
  46293. 0x22a882e4,0x00c815de,0xf9db8d7e,0xbe77d6fc,0x02267547,0x0886fb32,
  46294. 0x49c10edc,0xb62687d4,0x7c83ed4c,0x9f1c3e17,0x5af366ea,0xe6d5d7f0,
  46295. 0xd1efad24,0x2eaa01b8 },
  46296. { 0x1f357c74,0x5e47fb70,0xa9e3b794,0x93085c4a,0x6e85a905,0x4f098733,
  46297. 0xbe0244c9,0xf53808ff,0xa3b5660d,0x91dddf93,0xf3b95ed6,0x8b76377b,
  46298. 0xbb3920d4,0x91b911b7,0x86a13cf3,0x7ccf08bf,0xea018e58,0x53ed8f97,
  46299. 0x78c55194,0xb1ea4343,0xe0d2d5a6,0x8e6adde9,0x9b96259a,0xfc2b248f,
  46300. 0xeef17ddd,0x96ebceae,0x557f9c85,0xf694b443,0x07d5bba8,0x48cd150f,
  46301. 0xb4c1986b,0x02d31de9 } },
  46302. /* 222 */
  46303. { { 0xde79499d,0xa6bb9e1e,0xfd0fc2ad,0xf6ca8ff8,0x1a7d9356,0xbec0f8e8,
  46304. 0xe8f06327,0xbc3d1c9f,0x3b300beb,0x805c7217,0x413c181b,0x00420a08,
  46305. 0xf0ca9d01,0x9e9a167e,0x1aeeddd6,0x076c909d,0x8e3a8a72,0x64a1997f,
  46306. 0xa77b429e,0x3ce7f7a7,0x5c94d3e9,0xaac0fbf4,0xe6d48407,0xf37694a7,
  46307. 0xa91921e7,0xf56679e2,0xee1dbbd6,0xf23fe0f3,0xcbf9fa99,0xc7917566,
  46308. 0xe0f4d765,0x965860f2 },
  46309. { 0x7fa5f79c,0xe734702b,0x5af2d26d,0x930bd426,0x6c73e0ce,0x45bd8b98,
  46310. 0x4ee44a2d,0x7dbe7bed,0x956c8a1a,0xc129e024,0x77cdf80e,0x6fdc05ac,
  46311. 0x589ca59b,0x70a6ba2b,0x999825af,0xfc484021,0x7a23f0b6,0x1d284b54,
  46312. 0x28a0a8af,0xb1da10a4,0x2b2af6d8,0xb1eb1b31,0x33935ee3,0xf051443a,
  46313. 0x8effa6ec,0x7a07eb26,0xd662654c,0x16ee4086,0x4549ee4c,0x7a7bc501,
  46314. 0x1fa98a52,0x65081032 } },
  46315. /* 223 */
  46316. { { 0xb67ed9b2,0x49f0e460,0xc36d93d2,0x0cda0fd0,0x88c75e1c,0xbb5963e9,
  46317. 0x614bc0c9,0x757bbe93,0x9a768605,0x9a9b8801,0x48edc544,0xa8b7e2af,
  46318. 0xb51a5985,0x9e77ed9e,0xebbf024c,0xdd025274,0x1545c636,0x598b6288,
  46319. 0x4800dba0,0x39bdaed0,0x81e2a23a,0x7fc20139,0x550cb4f2,0xdc66fd5c,
  46320. 0xb52068c7,0xad27032f,0x8169fa15,0xc9a0bcae,0x3a7ca8a2,0x60606f21,
  46321. 0x9862652f,0x98295046 },
  46322. { 0x2e11c128,0x3e374600,0x0e6dca7e,0x80dfae5d,0xd9552264,0xe44016e2,
  46323. 0x880b7143,0xf65f88f2,0x526b881c,0xca3d28d4,0xdfb86afe,0xf9c59dd1,
  46324. 0x4c74f958,0x548860c2,0x9cb69f4f,0xd06ea43c,0x7334ecec,0x5343c9ae,
  46325. 0x35329713,0x5cc2ccd6,0x5f3a6c0c,0xa95ff403,0xb372653b,0x2e01a1cc,
  46326. 0xa250523d,0x31510fdf,0xa6227eb2,0xeee538e2,0xca23cd10,0xeadfc8a0,
  46327. 0x3e78f54b,0x4b7e6e1b } },
  46328. /* 224 */
  46329. { { 0xdb5f928b,0x79c9076f,0xb7347cec,0xe6250bb6,0xac00ec41,0x54b67798,
  46330. 0x9d9619c7,0x900d20ba,0x59e4343f,0xed42c0d0,0x451935d7,0x3df39e85,
  46331. 0x64f701ce,0x26391182,0xe1f87aac,0xce8f2554,0x65f91aaa,0xfddd6789,
  46332. 0xa324539f,0x96cd163f,0x4bace995,0x5c815f2c,0xa94f9ea5,0xd78c8c2a,
  46333. 0xef24e455,0x7ab2aff4,0x1cddc26a,0xf0ed6409,0x00ca2822,0x954a420b,
  46334. 0xd3297658,0x0611c4c5 },
  46335. { 0xa9e81829,0xf192001c,0x08a282cc,0xded33320,0x8f9ded9b,0x0bfd7de1,
  46336. 0xb7889003,0x6793ac0d,0x3577a5dd,0xbb00d91d,0x802d3c2b,0xe17a23a7,
  46337. 0xfb549014,0xff95f88c,0xc71b6e07,0x7cd1bf4b,0x23588c8b,0x2e3b24a0,
  46338. 0xa4112076,0x9b5335b8,0xc4056d30,0x2481c05e,0xe916a1b5,0x55c7410c,
  46339. 0x850179f4,0xbbe03271,0xb3cd1208,0x15e6c177,0x90cbfe50,0x509a24c0,
  46340. 0x1c108566,0x82079529 } },
  46341. /* 225 */
  46342. { { 0x1c7d353e,0x5d2d3cff,0x7de0ce3b,0xd5e7eccd,0x6ca87635,0xb4b1075f,
  46343. 0x25f9ad3e,0xda8404e0,0x205cb5ae,0x6b963e89,0x09f221a1,0x9e5ee0d8,
  46344. 0xea41aca4,0xd64c85d9,0x34442a34,0x6a46c4e9,0x3cf655a4,0xac6ff97e,
  46345. 0xe5417d7c,0x76565c1e,0xeebf9c4c,0x681009a9,0x88da6388,0x95b61d39,
  46346. 0xf6b472c6,0x6402b46a,0x0b7f1171,0x1fde5165,0xbe0c05e3,0x94f8f273,
  46347. 0xa88344a7,0x7487b036 },
  46348. { 0x9c3e2370,0xa860e575,0xf8048719,0x19d58193,0xa6e2f9aa,0x3a0dbf3c,
  46349. 0x6144719b,0xb6c7e959,0xdeffec21,0xa9049c74,0x3f50cebf,0x8ba064b2,
  46350. 0x49a1de15,0xb12822c0,0xb1d527f2,0xb654b7d9,0x0ffd0430,0xc470859d,
  46351. 0x4f05446b,0x37c74a67,0xa3add995,0xe553251b,0xe33533b5,0x4a3ed6cb,
  46352. 0x27e419ce,0x2f2f44d0,0xa5d1b979,0x2d84ee82,0xdb6fa69f,0xcc76b123,
  46353. 0x21fa3bdd,0x834f85c5 } },
  46354. /* 226 */
  46355. { { 0x2ce9b31a,0x329347c1,0xfe3fb3b7,0x1d88522a,0x52ff90fd,0x4bcefb4d,
  46356. 0x2b1a081d,0x53b17386,0x2a411f08,0x538c11ba,0x141b603a,0x7895b93c,
  46357. 0xb10bd741,0x2993b9aa,0x09912986,0xccbbd046,0xeea0aba5,0x669fafb0,
  46358. 0x35661897,0xd4844622,0x367ffa54,0x4a63b89c,0x1c3478da,0xcbad5d1d,
  46359. 0xaa6034f7,0xc5339227,0xe61b1391,0x0e6d705f,0xf74ff515,0xdd14b660,
  46360. 0x5332b54c,0x639d8b0a },
  46361. { 0x162217cd,0xfa423162,0x811c28e6,0x2e0e4a2a,0x21766dc0,0x68d9ce18,
  46362. 0x046a06ef,0x51263739,0xdde92101,0x44eea231,0x114298d3,0x0607c8f2,
  46363. 0x63d957e9,0x27f272ba,0xa5e8cae1,0xe7ce80cc,0x24f7a63f,0x5816ebe2,
  46364. 0x89673e34,0x4dece5a7,0x536babd4,0x13756a22,0xe3bf77af,0x644d61ae,
  46365. 0x2bcf98bc,0x60b2bf6e,0x29fa962c,0x3b0b59f3,0xabb50023,0xb0769a1a,
  46366. 0x0c75402c,0x40903136 } },
  46367. /* 227 */
  46368. { { 0x1670433f,0x84d2873a,0x25493dfc,0xc9394df6,0x80fcf89e,0xeb05a19a,
  46369. 0xdb297616,0xe39e4310,0xd9e63046,0x50742dc9,0x1de9ca9e,0xf31ad8c8,
  46370. 0xfb7b1d0d,0x86aabf94,0x1b3c82d1,0x36cda27a,0x39702d84,0xfb1a2ef4,
  46371. 0x46081299,0x280bfddc,0xd2396238,0xe4b2b48d,0x7b3c9353,0x2db2c2f3,
  46372. 0x12fb8a69,0xd5b5b317,0x08180474,0xf9b87a3b,0x1e952578,0xd8590986,
  46373. 0xf37a2bc8,0x80668eed },
  46374. { 0xb39a0249,0xe2edcd35,0xb2f8aeae,0xaf230cd4,0x7223df05,0x295b15e4,
  46375. 0xe0e937f4,0xbb66982a,0x8cbc9162,0x019d2b72,0xcf49dca1,0x5c512ae9,
  46376. 0x630f07b4,0x11b491a7,0xa03874e9,0x48d4f34c,0x44cb7433,0xc1fd0ea6,
  46377. 0xf95b30c3,0x13f79ae1,0xed8b60ac,0x40362d4d,0x61ead81c,0x9e8314ff,
  46378. 0x498c3d28,0xed600dd4,0xc2521702,0x5fcb1c19,0x3a9c1f33,0x592329fc,
  46379. 0x1bde6ce9,0x04677548 } },
  46380. /* 228 */
  46381. { { 0x39233c96,0xee3de56e,0x80737eaf,0x868c409c,0x201abc68,0xacae11bd,
  46382. 0x2b486205,0x0f2cea9b,0x6f19056c,0xe32387e1,0xa5dc2a41,0xea75365a,
  46383. 0x12b4be86,0x76c29acc,0x8d63294d,0xa01fcab7,0x0cab9f24,0x81dbe88b,
  46384. 0xf414c054,0x76646e5b,0xcb96b7aa,0xfe111893,0x7664e097,0xb649f5b1,
  46385. 0x53fcf5a9,0xa196422e,0x0b7ff634,0x5978c9bd,0x3c229895,0xb5feb38e,
  46386. 0x0833c456,0x038a49fb },
  46387. { 0x13e93257,0x35e3818c,0xa612741b,0x14cebc9d,0x7caac06b,0x4f6e9249,
  46388. 0x3daa1116,0x82278e33,0x4de2034a,0xe7cc565e,0x0a1ba630,0xbb7dc95f,
  46389. 0x66956fbd,0x81dd9f23,0xbb132dd6,0xc63e6319,0xfc241337,0x6e22b022,
  46390. 0x7e8beb1c,0x23848193,0xd8c938ac,0x83b1994d,0xa6bb5644,0xb54cfaca,
  46391. 0x06f91807,0x1a7cd44e,0xa8f8d9f3,0x1dd439bb,0x7f74a8e6,0x660c2a78,
  46392. 0x121b5660,0x4bb76e22 } },
  46393. /* 229 */
  46394. { { 0xe6354817,0x7a151e8a,0xf038b438,0x33d494ea,0x85958986,0x4c86c688,
  46395. 0x1dcbac12,0x72153827,0xc0edad06,0xf487af8c,0xe500e5d6,0xad33051f,
  46396. 0xd6e47f55,0x0a711b1b,0x8c746ad5,0xa68709a7,0x6402f35e,0x27f17262,
  46397. 0xfb30c130,0xc6d08efa,0xc06c7497,0x9ef1c041,0xdcc3e2da,0xd0c74ece,
  46398. 0x092e1073,0x30c5f96e,0x2aa12b74,0x0f1393cf,0x2107eb02,0x24584016,
  46399. 0x7b76f98b,0x8843d25f },
  46400. { 0xedb2a83e,0x4e1501dc,0x2bb8d724,0xbcfe8fb0,0xd925df62,0x09020659,
  46401. 0x42ab6fc3,0x3c715dcf,0xa0f09dfd,0x73c05055,0xe3590aea,0x126745d8,
  46402. 0x76ff749e,0x5382f4d8,0xa920c663,0xfc69feef,0x9fd711ca,0xde160211,
  46403. 0x9075c4d5,0x4219c3bd,0x3ded6bf2,0x3800cbd1,0x6263a116,0x8c7ea0eb,
  46404. 0x7d264c37,0x35bd7958,0x7159c98c,0x56e22e45,0xfa7373b5,0x71bf2a2d,
  46405. 0x8935c949,0x0503f939 } },
  46406. /* 230 */
  46407. { { 0x71dad4f6,0x65addc66,0x024bea1b,0x238e4889,0xf605d3dd,0xfb76c8e2,
  46408. 0xb0d96b89,0x13d5f5de,0x6601b2cb,0xe0b5ba35,0x83e3d254,0xe37d491d,
  46409. 0x240c8ea7,0xe8860423,0xe91c99ba,0x374182f3,0xa87ad919,0x26c2caf9,
  46410. 0xf574f295,0x4b13040a,0x944000a3,0x5b9bced1,0x06df42e7,0x4ccc57be,
  46411. 0x4bd1089d,0x22e8ec50,0xdddbb500,0x0c53177a,0x9ecfeadb,0x690d31d2,
  46412. 0x176668f9,0x735778fe },
  46413. { 0x843c1137,0x0f86ee3e,0x3f0b73cd,0x3c1c42fa,0x8ab20e3a,0x0e75679d,
  46414. 0x16242fae,0x6f95f1f4,0x39b092e4,0x7b88e11c,0x4c236ac0,0x1629403e,
  46415. 0x2dac02e6,0x66105f41,0x862e0632,0x74dc28a7,0xf3b23c8d,0x2118ffb2,
  46416. 0x0745ffbf,0x1182417c,0x4c05711e,0x49b55a04,0xcefbe4de,0x2c665b74,
  46417. 0x97bf7107,0x1cc4c01d,0xc54f0676,0xb2ca06da,0x7450d0f8,0xfc599daa,
  46418. 0x1a3182a1,0x52e637a6 } },
  46419. /* 231 */
  46420. { { 0x6bebc6db,0x481700f1,0xf9503d92,0x4a6b45db,0x5d153919,0xc715cd3c,
  46421. 0xe5ad2abc,0x942a1c05,0xab7b466f,0x36a82433,0xba13918b,0xba413bed,
  46422. 0x90f4e6ce,0x698a5624,0xf3f1f3ca,0xbb720da6,0x63471ab3,0x2116d41d,
  46423. 0x303d3609,0xe00d2227,0x463ba69e,0x7fd4cc00,0x62845fd1,0xac609e4d,
  46424. 0x80adc9c7,0x63603b2c,0x45fafbca,0xbf16fc9a,0xc4bc94ab,0x41007f7f,
  46425. 0xa74b1698,0x7c916b4f },
  46426. { 0x78bac2d4,0xc1026f91,0x2601a875,0x8a2e8098,0x0073d640,0xad2f276e,
  46427. 0xfcc1fb88,0x443610c4,0xca6b291f,0x5727b822,0x88ec60fc,0x0645532c,
  46428. 0xed9ad48b,0x51e48899,0xf543f103,0x841b48b5,0xd591ceeb,0xa6ccb1be,
  46429. 0x9dcf5a8b,0xfc4adf0f,0xb347ddb4,0x3a7ca020,0xcb44c521,0xaa1accc2,
  46430. 0x0527c0c4,0x773b6828,0x7023cf50,0xaa374c10,0x6b74c926,0x733d1000,
  46431. 0x77a8d07c,0x1ff3916f } },
  46432. /* 232 */
  46433. { { 0xf997939d,0xaa218fe4,0x791583b3,0x3d4dfbbb,0x87f7560b,0xb3a7b5da,
  46434. 0x5da92c98,0xa9c02801,0x46666f4a,0xe1eb4aad,0x14ce9dd7,0x2eb17a51,
  46435. 0xef8f3076,0xf46a66a4,0x810e546e,0x900b45c6,0x4baf04dd,0xf7af2258,
  46436. 0x5c84d42f,0x3cc1c872,0x8e4c83de,0x3093f225,0x170d88b2,0x62fade41,
  46437. 0xac076e44,0xe19612e4,0x32dd141b,0xf48d7346,0x925e34da,0xc1b1f759,
  46438. 0x072b90c9,0x19ed1a56 },
  46439. { 0x6c735473,0x9cf7fcde,0x6003bc3e,0xaab88e67,0xfb199bb8,0x12187cbc,
  46440. 0x9accccbd,0xbb730441,0xb0f65459,0x214aff3c,0x6f926282,0x6aec81a3,
  46441. 0x9f9d20b8,0xaa82cb32,0x5773cc90,0x82f3f90f,0xf62257e1,0x4af60e6b,
  46442. 0xbd4762df,0xf18b44bf,0xdb970753,0x3948b129,0x7c22c18e,0xc6e920e9,
  46443. 0x57be97ad,0x393d6208,0x46b637f9,0xe8d7382c,0xf1fed1d5,0xf6625ccb,
  46444. 0x68681599,0x6f31e0f9 } },
  46445. /* 233 */
  46446. { { 0x82b8f204,0xc45afe55,0xd358b54a,0xac0441b6,0xacd5f5ed,0x7213e7bf,
  46447. 0x139bcd93,0x1914c70b,0x96dbcbb0,0x714b4581,0x1ed35d21,0xe9297d35,
  46448. 0x6a3e1f20,0x8f640837,0x2f3cd705,0x150a8a9d,0xdcdd9f6d,0xfb36e801,
  46449. 0x5cf56d82,0x5a54eb65,0x92aa5a21,0x7610500c,0x3b089f03,0xd10d0ae2,
  46450. 0xc42b66e8,0x491b2079,0x0eee8d48,0x4af1ae3d,0x41556f45,0x137e4c28,
  46451. 0x63d8a7e6,0x875e3308 },
  46452. { 0xaf6c0acc,0xdc80fddc,0xbb1e7c08,0xd5ad1e66,0x828585ad,0xdc717ae1,
  46453. 0x275c7da6,0xbdc54340,0xd26b9e15,0xf4b4c852,0x6a05fa50,0x5f0a1fbf,
  46454. 0x817bcb32,0xc6f81e47,0x70ff2e1d,0x2cbd4328,0x67c7f7fc,0x8a249016,
  46455. 0xb585a6c4,0xd045acb7,0x4666c057,0x2e972ad4,0xe6d7d63d,0xc74d87cf,
  46456. 0x0e274144,0xf7067d87,0x8b2584ae,0xb2ca157a,0x75f0fdeb,0x495c5bfb,
  46457. 0xf386e009,0x5abb0581 } },
  46458. /* 234 */
  46459. { { 0xf0c97f57,0x8be62d2b,0x962f28c7,0x0fe04871,0x47b50abb,0xc548a467,
  46460. 0x44fa09ed,0xf6b26e03,0xab05a96e,0xfd44c6e3,0x70e6ae82,0xedb0032c,
  46461. 0xd7e4899d,0x28bd402b,0x9b7c11c2,0x43f2e963,0xce913716,0x0ec3fc0e,
  46462. 0x02fd0f8c,0x769b8bc9,0x7cabc3ac,0x9d9cb3aa,0x06924cc9,0xe88a8892,
  46463. 0x42609014,0xa51461aa,0x962e79e0,0xc7f4aa8b,0x8b1b3e80,0x4ef0210a,
  46464. 0x1bfee4bc,0x70544680 },
  46465. { 0x121901c1,0xfab3d713,0xfead54aa,0xe90a2627,0xbc08ba23,0x64f6d285,
  46466. 0x36ec227e,0x8d993015,0x06c191ab,0x99a16ab9,0xf649ce2c,0x86b1cf5b,
  46467. 0x66be3a80,0x59206759,0xccba2cf0,0x18836279,0xeff53486,0x2c157b87,
  46468. 0x4b223af2,0xbfac9896,0x0aae7a57,0xcd0fd4f0,0x63218a80,0xdaddb940,
  46469. 0xdf88f14e,0x3844bb79,0xb71ed9fd,0xc1b3e3d4,0xd6205036,0x6c634a13,
  46470. 0xb8680a6b,0x6f56aecf } },
  46471. /* 235 */
  46472. { { 0xd9205c5d,0xb01dc803,0x67123929,0x68955f7d,0x9d9b6565,0x3debbffd,
  46473. 0xd3b1acfe,0xb844395e,0x6094eeff,0x04328b21,0x22991feb,0x6631ffa8,
  46474. 0x190dd075,0x0dde66e6,0xe8577c05,0x75b03c55,0x91722407,0x6c91ce5f,
  46475. 0x8ebb3a3f,0x9a288a40,0x058a1396,0x1d376f8a,0x9a6e0676,0xf3a59457,
  46476. 0x7b71d288,0x103029c5,0xb44c30c0,0x0843f428,0x730e0b9c,0xd8e6aff8,
  46477. 0x4ed644ad,0x7b6be811 },
  46478. { 0x3d3aa54e,0x3ec38e4a,0xd83d509a,0x10233943,0x243955e2,0xf84aa621,
  46479. 0xf51d3d44,0x29104717,0x7eca4e37,0x62d2442c,0x85fa55de,0x8c5a523d,
  46480. 0x851da1b5,0xc6f5ccda,0x20001468,0x044bcaa8,0xe01702e0,0xf7501e68,
  46481. 0xe6a0acec,0xf0819359,0xac0ef0b2,0x33dda6ad,0xfd964f01,0x97aeedc8,
  46482. 0x530b90d8,0x48dacd0e,0xb84122eb,0x4c5fad6f,0xd700a1de,0x2284ec1e,
  46483. 0xdbca5474,0x86f9a835 } },
  46484. /* 236 */
  46485. { { 0x450cc69f,0x0e1d9055,0xc9edf98f,0x50eb14bc,0xee7eba01,0x1bb94e77,
  46486. 0x998f8e53,0x5f7a6737,0x1b16eef0,0x588384e3,0xd85c5e15,0xbb928723,
  46487. 0xcbd952aa,0xfe51e345,0x7e241674,0xc5d0ee28,0x100182f0,0xfdc146ef,
  46488. 0xe7f5be2c,0x0f739e92,0xb656bd3e,0x501ab3af,0x5168e289,0xb1552dde,
  46489. 0xb8ee104a,0x940dfe31,0xc4304475,0x42923603,0xc460a913,0x9306f114,
  46490. 0x03b51f86,0x5bfa9faf },
  46491. { 0x107b258e,0x2a23f52c,0xd66341dc,0x989e82bb,0x823cff1a,0x54a3ced8,
  46492. 0x719b491f,0xf45b7794,0x2433dfb8,0x898c2218,0xc49250ee,0x0f9dd91c,
  46493. 0x4fa17655,0x50c2a2ae,0x2c327f45,0xf7aa1ce4,0x583b1e41,0x13a15ad6,
  46494. 0xa1bfad9e,0x9aa0d5a5,0x8e1fbdcd,0x9b1caa28,0x915f7f87,0xaf9283b6,
  46495. 0x87e81a1e,0xc10e4e0c,0x1080d296,0x04fdca56,0x12755bd8,0x6acc9616,
  46496. 0x828feeda,0x1b1266aa } },
  46497. /* 237 */
  46498. { { 0x774ee49c,0x4ebc0a00,0xcb6237d7,0x776f6852,0x5df938a3,0xfc0544ac,
  46499. 0xb6fbfbbd,0xc3388ec8,0x745f2eae,0x84ac8bcd,0xb1ece937,0xa9c56609,
  46500. 0x7de8fa13,0x656fb6ac,0xa532b871,0x5f8ded74,0xaa889f09,0xab0d428b,
  46501. 0x10b7aec2,0x43b27f28,0xfeecb34c,0x26426e1e,0x9e89c2db,0x44431b6b,
  46502. 0x39211090,0xaac4bc5d,0x4fd81058,0x926f7368,0x471ef60e,0x452fa691,
  46503. 0x218d7a23,0x33517fdb },
  46504. { 0x593c4a36,0xa9c33f46,0x36b1a9ee,0xac69d718,0x4277beec,0x55a20c1d,
  46505. 0x7e4f179c,0x3e8ca24e,0xd46d88a2,0x57373369,0x730702f8,0x71ceb1cc,
  46506. 0x35eed574,0x8b184d97,0x0704cec2,0x7f4517a2,0xd7062a53,0x7f129d18,
  46507. 0xb1d77e1c,0x07a4571b,0x8350d8b2,0x774ac309,0x61fab8ef,0x27b2919f,
  46508. 0xb5dd801b,0xa7c4cc13,0x1434591f,0xe7e6255b,0x5a3592b3,0x349937b8,
  46509. 0x30c77549,0x31fac63d } },
  46510. /* 238 */
  46511. { { 0x04913fb6,0x2ee8cf1b,0x1769a6b3,0x7e401350,0x783e61f0,0x790ebb71,
  46512. 0xe27f2ffe,0x1e5107f9,0xedaf89bf,0x124ba67f,0xe58de68d,0x189200e1,
  46513. 0x6df5abee,0x962732a3,0xacbeb4aa,0x72cc37cf,0xe93c5a76,0xb0c5fa96,
  46514. 0xde63393b,0x4c2a317c,0x830b2d6c,0x97f65e67,0x1be5b96a,0x4afc3504,
  46515. 0x730ce66d,0x0bf40a60,0x9340d84f,0x96a1ba79,0x07626b08,0x3ee18254,
  46516. 0x7ab0cbf5,0x01db35db },
  46517. { 0xac0efee2,0x6e0fbc2d,0xd71dbb45,0x8406ebcd,0x19b69abe,0xe72bde3e,
  46518. 0x37e01822,0x49cb7e61,0x11458b4c,0xcbb8c01c,0x687c5d63,0x420b4847,
  46519. 0x454c6776,0x1847dfa1,0xd1839d18,0xbede911d,0x278df046,0x1b9dc9c9,
  46520. 0x881a336c,0x294bd62b,0x93e77adc,0x7f096879,0x43ce3ba7,0x7ac90665,
  46521. 0x7764eefc,0x148695fd,0x9ac465cf,0xe0c20f0b,0xa6e2cdb1,0x636e8d28,
  46522. 0xd755341d,0x7b6ba98c } },
  46523. /* 239 */
  46524. { { 0xc1881ab4,0xcb1d9e03,0xb3168c88,0x19c25d55,0x282364ce,0xa82d3d47,
  46525. 0xf161aa24,0x95994390,0xe1ebb2c9,0x7838bc00,0xbdec7a75,0x8fd5dfcc,
  46526. 0x4ff7220a,0x4dd203c2,0x0efeff48,0x5ec173b3,0x16428b35,0x99f1d2b3,
  46527. 0x056e813f,0xc06bd9e5,0xc0b319f1,0x929172ba,0xfd223b15,0x6ae0e384,
  46528. 0x98d091ed,0xbd01059e,0xa654648e,0x6b3168e4,0x3375e798,0x2211447f,
  46529. 0x71eb4508,0x47e81019 },
  46530. { 0xbc8c290d,0x7045d45a,0x810fb33a,0xa33d1355,0x46fbbf2f,0x2baf0092,
  46531. 0x385c7cd9,0xacff3f1b,0xe161985c,0xc5b150ec,0x2a888748,0xc6ee0a7f,
  46532. 0x5e88dcc8,0x9d888c8e,0xccb86443,0x4dd735f2,0x3c40f6f2,0xcc1e13b7,
  46533. 0xf3fed691,0xfc3a25ff,0x257ee5c7,0x4cb43b17,0xf32db135,0xaa654f93,
  46534. 0x02dff2d3,0x44f58d0a,0xa8ca6394,0x78e3f188,0xf3e86697,0x39646cce,
  46535. 0xe0dce87b,0x785b1902 } },
  46536. /* 240 */
  46537. { { 0xa92f9a20,0xfcce2361,0x9d64540e,0xb7bdca87,0x1d00d7c5,0xd4739a85,
  46538. 0x2e97c926,0x067ac8dc,0x78da6a8b,0x2aea3ffe,0x63c51b69,0x6828bf54,
  46539. 0x7155141a,0x76f1c479,0x3977d810,0xf4bcbef6,0x541bce7a,0x75bc4949,
  46540. 0xd17041a5,0xe01f4066,0x87755eaf,0xd282d5bd,0x59e7ae80,0x6e2107dd,
  46541. 0x382ab36f,0xaa56e166,0xb9d1d634,0x65ee8ef6,0xce4ed844,0x99a2160a,
  46542. 0xb7712c27,0x6557c367 },
  46543. { 0xd75b6e52,0x561b0268,0x118d0e89,0xb0813640,0x6a2eb1ae,0xcff53330,
  46544. 0x6d090894,0x4e462226,0xb5fc1d48,0xbb351227,0x57a3062d,0x9365ea07,
  46545. 0xd66e2dc5,0x4caca37b,0xb9095887,0x220d7d23,0x8c4473bf,0x9c0fd393,
  46546. 0x6787da4f,0xadff370a,0xd057f4b8,0xef0aebcc,0x1173f33a,0x205e744c,
  46547. 0x925a26b4,0xb8d1f0a5,0x722fbbfd,0xa9364f49,0x8227d284,0xc891ae77,
  46548. 0xa0e08ab4,0x15c40d04 } },
  46549. /* 241 */
  46550. { { 0x2a0e18d1,0x9baf169a,0x4c0327c2,0x9971c017,0x7bc262ce,0xd81a323f,
  46551. 0x818ff379,0x2099db8d,0x4cd3c330,0x663f663d,0x011a0553,0xef5325c3,
  46552. 0xf980a470,0x9cd70bdc,0x1c9ed070,0xe64452d1,0xac676e13,0xafbf43f4,
  46553. 0xae85c2a5,0x97bec0a6,0x470490c4,0x2faae550,0x491e6ba9,0x0ab97a87,
  46554. 0xaafa9914,0x4055f537,0x36726557,0xfc95adbb,0xd119d6bf,0x646343b9,
  46555. 0x9d341e37,0x788e94a0 },
  46556. { 0x9c53461a,0x053a6fe5,0x08e3b6ed,0x75ec897e,0x0768d939,0xa8f5d2f3,
  46557. 0xcc213d4f,0x9bd6bff6,0x05b0147c,0x590c7b41,0x7c7b8169,0x20a3628b,
  46558. 0x5bce78e9,0xc66a086e,0x4dec1d8f,0x3dd4d282,0xc19dcce9,0x890acf44,
  46559. 0xd8435a7e,0x6632d875,0xea6381b2,0x590167c1,0xf0dcc128,0xb2259797,
  46560. 0x46f8d463,0x91a612b4,0xc15efa39,0x42185d78,0x119f6788,0xdf55ec37,
  46561. 0x780dea93,0x91b19cc6 } },
  46562. /* 242 */
  46563. { { 0xcb5d8b80,0xebf2709d,0xfc35660e,0x03b96182,0x055ef969,0xb873d991,
  46564. 0xe47c4342,0xd1ea4b4d,0xd54f8867,0xcc4b9244,0xfd8d77ef,0x93b1a2ca,
  46565. 0xe8c1f563,0x068d24e7,0x49973056,0x5f5fabb6,0x0542374f,0x83248c50,
  46566. 0x3f38e913,0xc36de2b5,0x7bb680be,0xed07e8eb,0xd8f313b5,0x964813d7,
  46567. 0xafd2d392,0x7bb6a069,0x0848a31a,0xc06d848e,0xe4f0c325,0x6867fb2f,
  46568. 0x067343af,0x3c2ba834 },
  46569. { 0x9d3ad63b,0xab62d775,0x59e0eb1f,0x3f9cab97,0x3885e117,0x70332a63,
  46570. 0xe20b2f9e,0xf22cafce,0x49eca947,0xb529ba7e,0x6228d88d,0x24954216,
  46571. 0x39239561,0x80ea23ec,0xd4370644,0x1b8907e7,0x563e4e44,0x4b7fa455,
  46572. 0xb2a4b0fa,0xcca9829e,0x48060792,0xd0a720a4,0x246991ce,0x8ccdda0c,
  46573. 0x348d086b,0x37a2325b,0xf60aee13,0x566ed509,0x147f253f,0x3d30e091,
  46574. 0xc1073bd8,0x1fa627a5 } },
  46575. /* 243 */
  46576. { { 0x42478fd4,0xa11222a2,0x670b2000,0xacf4c6f1,0x8359c6de,0xf71bb04f,
  46577. 0x7b93cdbc,0x618e2829,0x230db60b,0x96e1bae3,0x965b3b29,0xf17fd3b4,
  46578. 0xbc7055dd,0xa58639c6,0x4b817d7f,0xc3ea92ed,0xd23b08a4,0x9082b2a6,
  46579. 0xdc17010e,0x8471228a,0x20e89d97,0x753b9e46,0x03ff77c9,0xcf7e4f97,
  46580. 0x2bbe60e5,0x6c3f8245,0xb80e017d,0x9e432cbc,0xc0a45edb,0x150a5acd,
  46581. 0x4798743e,0x67b8bd05 },
  46582. { 0xf4797cf7,0xe66079b4,0xd03fde02,0xe31c998a,0x54caaef1,0x5aa3763a,
  46583. 0xf7649711,0x64d9a1fe,0xaf29b1a7,0x7ce0dc73,0xfb66ca93,0x6661b083,
  46584. 0x32fb6a78,0xbf4d74fe,0xdf00a561,0x25f6ef09,0x831d1159,0x2bc4383f,
  46585. 0x536bde37,0x6d5cc10c,0x882cc65b,0xd4945f9f,0x451a99b8,0x81f48f13,
  46586. 0x6bac11a4,0x140161cd,0xf18a4a0a,0x9d94d4ed,0xa467a824,0x65363165,
  46587. 0xa4c9aedf,0x74297aa9 } },
  46588. /* 244 */
  46589. { { 0xe21124ba,0xc49758a4,0xa87ffbd2,0x99bd8198,0x3d6638a8,0x45fbcdd1,
  46590. 0x15f7bf76,0x94645ff8,0xc4e6d57e,0x5fa6736f,0x92e61db9,0x1eae6475,
  46591. 0xcbdf944a,0x79575c0c,0x25b31d74,0xa3d13047,0x4cab5ae6,0x7881df22,
  46592. 0x1a2887f2,0x8dbfd299,0xa26ac459,0x23d07590,0xd8661d4a,0x2e589852,
  46593. 0x8a0140f7,0x37b5c13b,0x3fb3782a,0x0f94199e,0x1bc14e90,0x722aa059,
  46594. 0xd55bbb12,0x89aab7ba },
  46595. { 0xd656bdc7,0x8b345a96,0xe176cd3b,0x43bdc8af,0x32d64c43,0xd69518b6,
  46596. 0x79b82b41,0xfcf364a7,0xffb0cf82,0x907b344e,0x5101287b,0xf3d0c83c,
  46597. 0x34cd90ef,0xe9f26a59,0x07082b5c,0xe5f5aaf2,0xece7c165,0x4eb72c75,
  46598. 0xbe986cd6,0xe9590a81,0xff1536aa,0xfeef498f,0xa8263d5e,0x04560243,
  46599. 0x54ae872b,0x940be14f,0xe3207686,0xbee7bcc9,0xc1bc4d7a,0xd496a27d,
  46600. 0x5940ab46,0x002dc297 } },
  46601. /* 245 */
  46602. { { 0xb69d60c3,0xee533937,0xfe972755,0x260be552,0xc0c725a6,0xb11fb78d,
  46603. 0xcab2e7c2,0x6982c27e,0xee2322cb,0x4bceedd9,0x122704f7,0x952b19ed,
  46604. 0x854a6165,0x2df4c285,0x7b192485,0xba40b5bf,0x0119f52a,0xfcbca950,
  46605. 0xe5add86f,0x7467d1cb,0xd9d0f2c1,0x9bf536fb,0xb8d4ebc9,0x3c296e34,
  46606. 0x05a81317,0x0495f8f4,0x73335f76,0x8c59e8d6,0xe0542122,0x0b53d324,
  46607. 0x3c3bda73,0x4d564535 },
  46608. { 0x7e5c0877,0x7322f800,0x0ca9a764,0x481b43e6,0xa2c12716,0x231f4f4b,
  46609. 0xed3136c2,0x09596857,0x38db30de,0xae826322,0x99908ebc,0x652fad40,
  46610. 0xaf0d231e,0x0b8d1814,0x09cbc349,0x2680c54b,0x4bf3bf8e,0xfd4562f3,
  46611. 0x092b595f,0x2985090b,0x5e15fc34,0xe6f39ca4,0xbc378168,0x70175191,
  46612. 0x845a4a87,0x906944b3,0x82a1541a,0xacc6d74a,0xb155c8b4,0xadc9bab3,
  46613. 0x77306c62,0x1f2f89ce } },
  46614. /* 246 */
  46615. { { 0x9affefdf,0x8253ef41,0x4cf9256b,0x05d7ece5,0xb444e483,0x377002f2,
  46616. 0xcba5471f,0xb189755f,0xd5cbe015,0xc88483cb,0x6a0b8429,0x254f7c69,
  46617. 0x61f3f61d,0x18850bd4,0x0a247157,0x7ba21089,0xd92eeb0d,0x35abbc2e,
  46618. 0x965dec89,0xfb56cabe,0xbc55684a,0x9da23724,0x6a7a7492,0xd8ba396f,
  46619. 0x2ef4ba46,0xfcb90db7,0x9909b27a,0xdd234fe0,0x76f4366e,0xbdf3c164,
  46620. 0x17e50d47,0x09c8097f },
  46621. { 0x60050c07,0x6a04b140,0x43a8e37e,0xc29e8318,0xbb55e41f,0xcb9429b2,
  46622. 0x2ce60e3a,0xed2fea5a,0xdb9d82f4,0xdc7b1ff3,0x687d37fa,0x48ebecc3,
  46623. 0xecb07539,0x79153e32,0x57075692,0x6a60054f,0x800759ba,0x3871cd0c,
  46624. 0x30922df1,0x17a7386f,0x83357b7c,0x4e9fc59e,0x39415186,0x1d26b3a9,
  46625. 0xd34db889,0x912a0222,0x59fcdb71,0x6672fcf4,0x44ff3036,0x5a3f268d,
  46626. 0x6911e16c,0x6f113ed3 } },
  46627. /* 247 */
  46628. { { 0x1836f1c9,0x52a9df59,0x4232307d,0xfa6519f5,0x5ded285a,0x8406c701,
  46629. 0xaf627f75,0x0a1545ca,0xace0417d,0xae1111ee,0xa6113443,0xfb28bdf6,
  46630. 0x52dbcbcb,0xde9ef0ab,0x7813e658,0xe9dc181b,0x99127225,0x0b1dabdb,
  46631. 0x22814c59,0x5f0598e3,0xd934ee7e,0x5c3b966e,0xb99ba4bf,0x4eb84eda,
  46632. 0x3c1b55e7,0xb2919a34,0x94aa860f,0xa9addb49,0xf6811ff6,0x1b7220df,
  46633. 0xd1a183e2,0x6636a23b },
  46634. { 0x20587283,0xdf5d5a2d,0xef07fc5d,0x0b3822c9,0x0ef6de38,0x1786bd55,
  46635. 0x25d1671d,0x163cf907,0x1cdb1def,0x74bf971f,0x0842fc4a,0x5749e830,
  46636. 0x27f854f7,0x0e2edbc7,0xbce24acb,0xbb27bbda,0x05bed08d,0xc1b19cec,
  46637. 0xf7c904bc,0xaada123e,0xd89982db,0x02429f1b,0x65f6e632,0x49d3616e,
  46638. 0xee59fd32,0xa3789fa8,0xfe9f29f5,0x160ba3ba,0xaf5378a0,0x0f2d3b61,
  46639. 0x73c2a6f8,0x7aeecc76 } },
  46640. /* 248 */
  46641. { { 0xdc43b0db,0xf3a4757c,0x98119cad,0x3d8a4e85,0x4616c156,0xf8095bf6,
  46642. 0x4f533e97,0x3e2a07bc,0x39cfc5ad,0xa9824367,0xcd68052c,0x18a6ba3a,
  46643. 0x8a1cec66,0xbd60e590,0x02b1b695,0xae3841a5,0x190a195b,0x986dff12,
  46644. 0xad31fd9b,0x2df2beac,0xcc728f7b,0x7d893224,0x0cf0a992,0xc38ea738,
  46645. 0x586a44ea,0xa8439a80,0x1615f03c,0xede7f7f0,0x27a1f885,0x48249908,
  46646. 0xb78a7645,0x28ec4006 },
  46647. { 0xa2fe0009,0xe1820c2e,0xf13874e9,0xe11ba5d2,0xc524db52,0x97522454,
  46648. 0x7fede529,0x4d477426,0x9b2500d4,0x01d3419a,0x1869244b,0xce08a492,
  46649. 0xdd1be1b9,0xba169023,0x32a301e0,0x242c3e54,0x70906788,0x9b56f7ba,
  46650. 0xc74a8cc4,0xf0ad2a09,0xd76f9439,0x99cd1841,0x621fb60e,0xeddafe0b,
  46651. 0xbc397634,0x056bee54,0xff7f0a84,0x4653f860,0x2011c0af,0x6bd4876f,
  46652. 0x0c9525c3,0x134f4cc7 } },
  46653. /* 249 */
  46654. { { 0xe938dff4,0x9621a3ec,0x486a79a3,0x7d101a7b,0xde950537,0xf2c4ef97,
  46655. 0xe65d87db,0xf3184099,0x373b8cfa,0xb89c7ffb,0xe842916e,0x68baa505,
  46656. 0x4ebea764,0xa790fd09,0xe592892b,0x679df6d4,0xfcfed741,0x2023331c,
  46657. 0x9880ff21,0x0bf4efd2,0xd0344501,0x7ca78ddd,0x342858c8,0x2cb09ecb,
  46658. 0x2575487a,0x9e5eb6dc,0xebcb0491,0x50675a15,0x7381d471,0x09d2e74f,
  46659. 0x83d3d6f4,0x6ea37829 },
  46660. { 0x4e5cc40a,0xc65c094b,0x1af37dfb,0x7a2e3f6a,0xf9026e44,0xef677e9d,
  46661. 0x93880f53,0xb7878c95,0x7f644aa9,0x4aa30b07,0x2f208c3c,0xa0c51683,
  46662. 0x658d663b,0x7c0277ae,0xae1d9130,0xef0b3c38,0x695c3ea4,0x302f37a7,
  46663. 0x6a0c5e0d,0xe004c1c5,0x20cbcf9f,0x9fd495c4,0x568a0e7c,0x706d5b9d,
  46664. 0x59286454,0x8b225dff,0x8d9a709c,0x527d4465,0x87c08d68,0x47c558da,
  46665. 0xbb4ef07d,0x606ee6e6 } },
  46666. /* 250 */
  46667. { { 0x57c621f6,0x02d99fc7,0x7fe83d48,0x292e40c1,0x9ef199b0,0x1bdfc7a1,
  46668. 0xe62c7666,0x78a04102,0xe6738753,0x16cda370,0x1e3a65af,0xbc81974d,
  46669. 0xf78fe209,0x19742048,0xbf5981c6,0xc83a058a,0x9c89702d,0xf26b2434,
  46670. 0x9d1a678a,0x988b2f1e,0xff29ae29,0x472bf9b0,0x1d7cf5ec,0xa143e398,
  46671. 0xb268ddd8,0x9c9d7e45,0x5fc4ff76,0x166cda55,0xa4aa7673,0x6044cdf0,
  46672. 0xe9148707,0x49dba6f7 },
  46673. { 0xa758e37a,0x20e47fb2,0x2d8eaf66,0xaf6b31d7,0x6f9c2210,0x352ad5f9,
  46674. 0x90efc32b,0x0093f727,0x41e4b264,0x435c99dc,0x05b15795,0xbfa878e0,
  46675. 0x0e673575,0x99c520a4,0x87eea759,0xca682594,0xf12a348b,0x029f7b81,
  46676. 0x2aa2ce35,0xa547cc18,0xead5e2c5,0xa11d874b,0x55682cdf,0x9af0349b,
  46677. 0x8bbe8e66,0xf86ebfea,0xf55394ab,0x3dab8782,0xebc8eb8f,0x458bf797,
  46678. 0x9b7de78c,0x4890a7a4 } },
  46679. /* 251 */
  46680. { { 0x8da995f6,0xd7299689,0xec6156ef,0xd39eaae7,0x356a82d5,0x6959040c,
  46681. 0xc135bcfe,0xb2046b21,0x0f595c78,0xea720b64,0xe7c5fb40,0x02824efa,
  46682. 0x0edb3bfc,0x97d8fd4c,0x79f24ebe,0x12f02905,0x187ea6b9,0x16fc47cf,
  46683. 0x789d5c23,0xc219fd27,0x89263ecc,0x233a6b6c,0x8b6d30a6,0x823634b2,
  46684. 0xc9b33680,0xca352e25,0x40c77456,0x9388d6ca,0x3c92065b,0xf8e55b0b,
  46685. 0x02439a76,0x5c17474b },
  46686. { 0x8aaccab5,0xd888e7c2,0xaaced05b,0x18027836,0xccec0f65,0x185b877d,
  46687. 0x125c2882,0x93cadc1c,0x67fdc54c,0x45df540a,0xc2788a33,0x4f3c86e2,
  46688. 0xe3a0fa2c,0x3e874469,0x273983cf,0xc59daa47,0x4a96d8a5,0x3063c48b,
  46689. 0xc2e58915,0xc38d2bcf,0x84e428c3,0x90e78b87,0xf0c4fd53,0x900a292c,
  46690. 0x941e6005,0xb7f92db7,0x6ca53a1c,0x95679241,0xb1ab0fa7,0x35f6f31d,
  46691. 0x7b58408c,0x5d675eb4 } },
  46692. /* 252 */
  46693. { { 0x870c6025,0xaeee1a77,0x91a2dfca,0xfc4a23b7,0x386b64c4,0x7b0e60c4,
  46694. 0xe5ae72b1,0xd5d5b17d,0x9eefa212,0x6dfc88ac,0xd4038b96,0x4feaefbe,
  46695. 0x8e2d2ecc,0x099ac356,0x012af207,0x548ea612,0x89c31218,0x4ffed9db,
  46696. 0xe0e67331,0x1c1e91c4,0xaf8300e0,0x009bb64f,0x6773c3be,0x8780501c,
  46697. 0xc08219fa,0xe0cd6ede,0xf81b06ff,0x7c055e07,0xe080b36f,0x82b63f9c,
  46698. 0x0a9feca3,0x02fccbaf },
  46699. { 0xb47cac61,0x9991d4d1,0xab86e12c,0x2e9d1687,0x2b94f042,0x8c6855ec,
  46700. 0x48e648e5,0xca400519,0xef89ac57,0x9ba91fb2,0x1be792cd,0x4f419206,
  46701. 0xbd0f1e15,0x82d221cb,0xfc444019,0x062eb13b,0x99790fdc,0xf3a97c32,
  46702. 0x6067a64b,0x4e796d94,0x6d23775a,0xc46dd300,0xed7f0f23,0x8672c4d5,
  46703. 0x3b4f63d7,0x821851dc,0xd26273f2,0x50a3ae0c,0xeac60f6f,0x800e58fc,
  46704. 0x13845545,0x56f1e456 } },
  46705. /* 253 */
  46706. { { 0x32c24f3b,0x01ccb3f6,0x06d817e6,0x99eb1c7f,0x6aa26776,0x8dc640bb,
  46707. 0x0845d5e0,0x7838affe,0xf81a79a8,0xf34fecb1,0x3e6819b0,0x6a2e282d,
  46708. 0x8237a4b8,0xc4b977ce,0x87636439,0x0f46b3db,0x97970497,0xa465f540,
  46709. 0x8791be43,0xd7e08762,0x34198ec6,0x00220b6c,0x093d94bb,0x57b38637,
  46710. 0x29d690b2,0x84012e16,0x20aad1a4,0x02ec9db5,0x85dc34e3,0xafee2fc6,
  46711. 0x25500cf8,0x911d1936 },
  46712. { 0xf5e5af5b,0x13b1bd58,0x7b6a22a7,0xa7ca263b,0xf3af2adc,0xab6bec4d,
  46713. 0xa04420bd,0x16651e59,0x4ba36c11,0x3b448b3b,0xff424310,0x3c62bfcd,
  46714. 0xf1a96cbb,0xde15c4a5,0xe4d1f980,0xbe0ad8a1,0x36673a3a,0x812bd14e,
  46715. 0x9212acdd,0x40303af6,0x576095ce,0x8f6dab9c,0x107f5ca5,0x7df1882a,
  46716. 0x8896a3b0,0xb903e63c,0xd863b3f0,0xf5048544,0xc09887de,0x5e5019b9,
  46717. 0xa0f53865,0x2be744fe } },
  46718. /* 254 */
  46719. { { 0x5b50f324,0x054cd05f,0x1ea3c7a2,0xb9b1eb24,0x7ff8e6b7,0x4a858a5c,
  46720. 0xec040882,0xd83902fe,0xd0cba9bd,0x72b26494,0xb29c9e1e,0xd0176f90,
  46721. 0xcebadb81,0x05d4eb02,0x372b8bfc,0x874405b1,0x79ead190,0x5c412881,
  46722. 0xec2b48cd,0xd44a3dd3,0x3f4d5033,0x84499a77,0x564c3a09,0xb37b38cd,
  46723. 0xf42e803b,0x80e99497,0xb8f518b2,0xc07b47a0,0x3568fde4,0xc710e3c5,
  46724. 0xcead0e7a,0x735f542f },
  46725. { 0x38380039,0xcaa9a171,0xf74d19c8,0xadfafe17,0xccbc1a8b,0x92d4393e,
  46726. 0xfe029705,0x3c5dbf39,0x930e9b36,0x4552b5ab,0x2afd494a,0x7ee63032,
  46727. 0x3f02ac43,0x826a9ad7,0x99356298,0x98c53562,0x7342bb39,0x0c869f87,
  46728. 0xe4f9b79a,0xd7510020,0xd34789a9,0x6361d1a4,0xcfa85637,0xf0ded5ba,
  46729. 0x88ac07e4,0x407ee73f,0x09ef1cbd,0xfac7d03f,0x4d475bad,0x25d697cb,
  46730. 0x14bd399e,0x1e984c9d } },
  46731. /* 255 */
  46732. { { 0x4850c817,0xc76d0561,0x3489812d,0xb08a5b19,0x5e58cbbe,0x7273d154,
  46733. 0x4be61e5a,0x8900b5fa,0xd7aeb8e1,0xaa088691,0xd35a3d4b,0xe66666af,
  46734. 0x57ec7d3d,0x38a2c199,0x668d6f5c,0xa0648e8f,0x7adc1746,0x1f9fc92c,
  46735. 0x843065c3,0x23a116c0,0x61e6ae69,0x36370a20,0x2aa47e73,0x626c3736,
  46736. 0xdeff6d84,0x540c25f2,0xcdbed2d4,0x9804824c,0x039a9492,0x4b5bfce0,
  46737. 0x76942e01,0x6c474a56 },
  46738. { 0x7d88e3a1,0x3aeb9a41,0xc484742a,0x105d3c88,0x3fe61131,0xe59de8d1,
  46739. 0x1a869e8b,0x148f5b6b,0xaa75d90a,0x7a8abc59,0x62146013,0x2f0c9bc7,
  46740. 0xc3824cd9,0x43faa747,0x6a5d0b92,0x81763a18,0x9bcbaebc,0xbbc341bc,
  46741. 0xf745d1dd,0xe1813160,0xb75ce5f4,0xa53ce52d,0xd50de4c2,0x15eae66c,
  46742. 0x75d7656d,0x5ed8996c,0xc4ca552a,0xe4ff5711,0x3c5305b4,0x215e985a,
  46743. 0xfa1ba2ce,0x6b258954 } },
  46744. };
  46745. /* Multiply the base point of P1024 by the scalar and return the result.
  46746. * If map is true then convert result to affine coordinates.
  46747. *
  46748. * Stripe implementation.
  46749. * Pre-generated: 2^0, 2^128, ...
  46750. * Pre-generated: products of all combinations of above.
  46751. * 8 doubles and adds (with qz=1)
  46752. *
  46753. * r Resulting point.
  46754. * k Scalar to multiply by.
  46755. * map Indicates whether to convert result to affine.
  46756. * ct Constant time required.
  46757. * heap Heap to use for allocation.
  46758. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  46759. */
  46760. static int sp_1024_ecc_mulmod_base_32(sp_point_1024* r, const sp_digit* k,
  46761. int map, int ct, void* heap)
  46762. {
  46763. return sp_1024_ecc_mulmod_stripe_32(r, &p1024_base, p1024_table,
  46764. k, map, ct, heap);
  46765. }
  46766. #endif
  46767. /* Multiply the base point of P1024 by the scalar and return the result.
  46768. * If map is true then convert result to affine coordinates.
  46769. *
  46770. * km Scalar to multiply by.
  46771. * r Resulting point.
  46772. * map Indicates whether to convert result to affine.
  46773. * heap Heap to use for allocation.
  46774. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  46775. */
  46776. int sp_ecc_mulmod_base_1024(const mp_int* km, ecc_point* r, int map, void* heap)
  46777. {
  46778. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  46779. sp_point_1024* point = NULL;
  46780. sp_digit* k = NULL;
  46781. #else
  46782. sp_point_1024 point[1];
  46783. sp_digit k[32];
  46784. #endif
  46785. int err = MP_OKAY;
  46786. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  46787. point = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024), heap,
  46788. DYNAMIC_TYPE_ECC);
  46789. if (point == NULL)
  46790. err = MEMORY_E;
  46791. if (err == MP_OKAY) {
  46792. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 32, heap,
  46793. DYNAMIC_TYPE_ECC);
  46794. if (k == NULL)
  46795. err = MEMORY_E;
  46796. }
  46797. #endif
  46798. if (err == MP_OKAY) {
  46799. sp_1024_from_mp(k, 32, km);
  46800. err = sp_1024_ecc_mulmod_base_32(point, k, map, 1, heap);
  46801. }
  46802. if (err == MP_OKAY) {
  46803. err = sp_1024_point_to_ecc_point_32(point, r);
  46804. }
  46805. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  46806. if (k != NULL)
  46807. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  46808. if (point != NULL)
  46809. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  46810. #endif
  46811. return err;
  46812. }
  46813. /* Multiply the base point of P1024 by the scalar, add point a and return
  46814. * the result. If map is true then convert result to affine coordinates.
  46815. *
  46816. * km Scalar to multiply by.
  46817. * am Point to add to scalar mulitply result.
  46818. * inMont Point to add is in montgomery form.
  46819. * r Resulting point.
  46820. * map Indicates whether to convert result to affine.
  46821. * heap Heap to use for allocation.
  46822. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  46823. */
  46824. int sp_ecc_mulmod_base_add_1024(const mp_int* km, const ecc_point* am,
  46825. int inMont, ecc_point* r, int map, void* heap)
  46826. {
  46827. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  46828. sp_point_1024* point = NULL;
  46829. sp_digit* k = NULL;
  46830. #else
  46831. sp_point_1024 point[2];
  46832. sp_digit k[32 + 32 * 2 * 6];
  46833. #endif
  46834. sp_point_1024* addP = NULL;
  46835. sp_digit* tmp = NULL;
  46836. int err = MP_OKAY;
  46837. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  46838. point = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024) * 2, heap,
  46839. DYNAMIC_TYPE_ECC);
  46840. if (point == NULL)
  46841. err = MEMORY_E;
  46842. if (err == MP_OKAY) {
  46843. k = (sp_digit*)XMALLOC(
  46844. sizeof(sp_digit) * (32 + 32 * 2 * 6),
  46845. heap, DYNAMIC_TYPE_ECC);
  46846. if (k == NULL)
  46847. err = MEMORY_E;
  46848. }
  46849. #endif
  46850. if (err == MP_OKAY) {
  46851. addP = point + 1;
  46852. tmp = k + 32;
  46853. sp_1024_from_mp(k, 32, km);
  46854. sp_1024_point_from_ecc_point_32(addP, am);
  46855. }
  46856. if ((err == MP_OKAY) && (!inMont)) {
  46857. err = sp_1024_mod_mul_norm_32(addP->x, addP->x, p1024_mod);
  46858. }
  46859. if ((err == MP_OKAY) && (!inMont)) {
  46860. err = sp_1024_mod_mul_norm_32(addP->y, addP->y, p1024_mod);
  46861. }
  46862. if ((err == MP_OKAY) && (!inMont)) {
  46863. err = sp_1024_mod_mul_norm_32(addP->z, addP->z, p1024_mod);
  46864. }
  46865. if (err == MP_OKAY) {
  46866. err = sp_1024_ecc_mulmod_base_32(point, k, 0, 0, heap);
  46867. }
  46868. if (err == MP_OKAY) {
  46869. sp_1024_proj_point_add_32(point, point, addP, tmp);
  46870. if (map) {
  46871. sp_1024_map_32(point, point, tmp);
  46872. }
  46873. err = sp_1024_point_to_ecc_point_32(point, r);
  46874. }
  46875. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  46876. if (k != NULL)
  46877. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  46878. if (point)
  46879. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  46880. #endif
  46881. return err;
  46882. }
  46883. #ifndef WOLFSSL_SP_SMALL
  46884. /* Generate a pre-computation table for the point.
  46885. *
  46886. * gm Point to generate table for.
  46887. * table Buffer to hold pre-computed points table.
  46888. * len Length of table.
  46889. * heap Heap to use for allocation.
  46890. * returns BAD_FUNC_ARG when gm or len is NULL, LENGTH_ONLY_E when table is
  46891. * NULL and length is returned, BUFFER_E if length is too small and 0 otherwise.
  46892. */
  46893. int sp_ecc_gen_table_1024(const ecc_point* gm, byte* table, word32* len,
  46894. void* heap)
  46895. {
  46896. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  46897. sp_point_1024* point = NULL;
  46898. sp_digit* t = NULL;
  46899. #else
  46900. sp_point_1024 point[1];
  46901. sp_digit t[6 * 2 * 32];
  46902. #endif
  46903. int err = MP_OKAY;
  46904. if ((gm == NULL) || (len == NULL)) {
  46905. err = BAD_FUNC_ARG;
  46906. }
  46907. if ((err == MP_OKAY) && (table == NULL)) {
  46908. *len = sizeof(sp_table_entry_1024) * 256;
  46909. err = LENGTH_ONLY_E;
  46910. }
  46911. if ((err == MP_OKAY) && (*len < (int)(sizeof(sp_table_entry_1024) * 256))) {
  46912. err = BUFFER_E;
  46913. }
  46914. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  46915. if (err == MP_OKAY) {
  46916. point = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024), heap,
  46917. DYNAMIC_TYPE_ECC);
  46918. if (point == NULL)
  46919. err = MEMORY_E;
  46920. }
  46921. if (err == MP_OKAY) {
  46922. t = (sp_digit*)XMALLOC(sizeof(sp_digit) * 6 * 2 * 32, heap,
  46923. DYNAMIC_TYPE_ECC);
  46924. if (t == NULL)
  46925. err = MEMORY_E;
  46926. }
  46927. #endif
  46928. if (err == MP_OKAY) {
  46929. sp_1024_point_from_ecc_point_32(point, gm);
  46930. err = sp_1024_gen_stripe_table_32(point,
  46931. (sp_table_entry_1024*)table, t, heap);
  46932. }
  46933. if (err == 0) {
  46934. *len = sizeof(sp_table_entry_1024) * 256;
  46935. }
  46936. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  46937. if (t != NULL)
  46938. XFREE(t, heap, DYNAMIC_TYPE_ECC);
  46939. if (point != NULL)
  46940. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  46941. #endif
  46942. return err;
  46943. }
  46944. #else
  46945. /* Generate a pre-computation table for the point.
  46946. *
  46947. * gm Point to generate table for.
  46948. * table Buffer to hold pre-computed points table.
  46949. * len Length of table.
  46950. * heap Heap to use for allocation.
  46951. * returns BAD_FUNC_ARG when gm or len is NULL, LENGTH_ONLY_E when table is
  46952. * NULL and length is returned, BUFFER_E if length is too small and 0 otherwise.
  46953. */
  46954. int sp_ecc_gen_table_1024(const ecc_point* gm, byte* table, word32* len,
  46955. void* heap)
  46956. {
  46957. int err = 0;
  46958. if ((gm == NULL) || (len == NULL)) {
  46959. err = BAD_FUNC_ARG;
  46960. }
  46961. if ((err == 0) && (table == NULL)) {
  46962. *len = 0;
  46963. err = LENGTH_ONLY_E;
  46964. }
  46965. if ((err == 0) && (*len != 0)) {
  46966. err = BUFFER_E;
  46967. }
  46968. if (err == 0) {
  46969. *len = 0;
  46970. }
  46971. (void)heap;
  46972. return err;
  46973. }
  46974. #endif
  46975. /* Multiply the point by the scalar and return the result.
  46976. * If map is true then convert result to affine coordinates.
  46977. *
  46978. * km Scalar to multiply by.
  46979. * gm Point to multiply.
  46980. * table Pre-computed points.
  46981. * r Resulting point.
  46982. * map Indicates whether to convert result to affine.
  46983. * heap Heap to use for allocation.
  46984. * returns MEMORY_E when memory allocation fails and MP_OKAY on success.
  46985. */
  46986. int sp_ecc_mulmod_table_1024(const mp_int* km, const ecc_point* gm, byte* table,
  46987. ecc_point* r, int map, void* heap)
  46988. {
  46989. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  46990. sp_point_1024* point = NULL;
  46991. sp_digit* k = NULL;
  46992. #else
  46993. sp_point_1024 point[1];
  46994. sp_digit k[32];
  46995. #endif
  46996. int err = MP_OKAY;
  46997. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  46998. point = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024), heap,
  46999. DYNAMIC_TYPE_ECC);
  47000. if (point == NULL) {
  47001. err = MEMORY_E;
  47002. }
  47003. if (err == MP_OKAY) {
  47004. k = (sp_digit*)XMALLOC(sizeof(sp_digit) * 32, heap, DYNAMIC_TYPE_ECC);
  47005. if (k == NULL)
  47006. err = MEMORY_E;
  47007. }
  47008. #endif
  47009. if (err == MP_OKAY) {
  47010. sp_1024_from_mp(k, 32, km);
  47011. sp_1024_point_from_ecc_point_32(point, gm);
  47012. #ifndef WOLFSSL_SP_SMALL
  47013. err = sp_1024_ecc_mulmod_stripe_32(point, point,
  47014. (const sp_table_entry_1024*)table, k, map, 0, heap);
  47015. #else
  47016. (void)table;
  47017. err = sp_1024_ecc_mulmod_32(point, point, k, map, 0, heap);
  47018. #endif
  47019. }
  47020. if (err == MP_OKAY) {
  47021. err = sp_1024_point_to_ecc_point_32(point, r);
  47022. }
  47023. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  47024. if (k != NULL)
  47025. XFREE(k, heap, DYNAMIC_TYPE_ECC);
  47026. if (point != NULL)
  47027. XFREE(point, heap, DYNAMIC_TYPE_ECC);
  47028. #endif
  47029. return err;
  47030. }
  47031. /* Multiply p* in projective co-ordinates by q*.
  47032. *
  47033. * r.x = p.x - (p.y * q.y)
  47034. * r.y = (p.x * q.y) + p.y
  47035. *
  47036. * px [in,out] A single precision integer - X ordinate of number to multiply.
  47037. * py [in,out] A single precision integer - Y ordinate of number to multiply.
  47038. * q [in] A single precision integer - multiplier.
  47039. * t [in] Two single precision integers - temps.
  47040. */
  47041. static void sp_1024_proj_mul_qx1_32(sp_digit* px, sp_digit* py,
  47042. const sp_digit* q, sp_digit* t)
  47043. {
  47044. sp_digit* t1 = t;
  47045. sp_digit* t2 = t + 2 * 32;
  47046. /* t1 = p.x * q.y */
  47047. sp_1024_mont_mul_32(t1, px, q, p1024_mod, p1024_mp_mod);
  47048. /* t2 = p.y * q.y */
  47049. sp_1024_mont_mul_32(t2, py, q, p1024_mod, p1024_mp_mod);
  47050. /* r.x = p.x - (p.y * q.y) */
  47051. sp_1024_mont_sub_32(px, px, t2, p1024_mod);
  47052. /* r.y = (p.x * q.y) + p.y */
  47053. sp_1024_mont_add_32(py, t1, py, p1024_mod);
  47054. }
  47055. /* Square p* in projective co-ordinates.
  47056. *
  47057. * px' = (p.x + p.y) * (p.x - p.y) = p.x^2 - p.y^2
  47058. * py' = 2 * p.x * p.y
  47059. *
  47060. * px [in,out] A single precision integer - X ordinate of number to square.
  47061. * py [in,out] A single precision integer - Y ordinate of number to square.
  47062. * t [in] Two single precision integers - temps.
  47063. */
  47064. static void sp_1024_proj_sqr_32(sp_digit* px, sp_digit* py, sp_digit* t)
  47065. {
  47066. sp_digit* t1 = t;
  47067. sp_digit* t2 = t + 2 * 32;
  47068. /* t1 = p.x + p.y */
  47069. sp_1024_mont_add_32(t1, px, py, p1024_mod);
  47070. /* t2 = p.x - p.y */
  47071. sp_1024_mont_sub_32(t2, px, py, p1024_mod);
  47072. /* r.y = p.x * p.y */
  47073. sp_1024_mont_mul_32(py, px, py, p1024_mod, p1024_mp_mod);
  47074. /* r.x = (p.x + p.y) * (p.x - p.y) */
  47075. sp_1024_mont_mul_32(px, t1, t2, p1024_mod, p1024_mp_mod);
  47076. /* r.y = (p.x * p.y) * 2 */
  47077. sp_1024_mont_dbl_32(py, py, p1024_mod);
  47078. }
  47079. #ifdef WOLFSSL_SP_SMALL
  47080. /* Perform the modular exponentiation in Fp* for SAKKE.
  47081. *
  47082. * Simple square and multiply when expontent bit is one algorithm.
  47083. * Square and multiply performed in Fp*.
  47084. *
  47085. * base [in] Base. MP integer.
  47086. * exp [in] Exponent. MP integer.
  47087. * res [out] Result. MP integer.
  47088. * returns 0 on success and MEMORY_E if memory allocation fails.
  47089. */
  47090. int sp_ModExp_Fp_star_1024(const mp_int* base, mp_int* exp, mp_int* res)
  47091. {
  47092. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  47093. !defined(WOLFSSL_SP_NO_MALLOC)
  47094. sp_digit* td;
  47095. sp_digit* t;
  47096. sp_digit* tx;
  47097. sp_digit* ty;
  47098. sp_digit* b;
  47099. sp_digit* e;
  47100. #else
  47101. sp_digit t[4 * 2 * 32];
  47102. sp_digit tx[2 * 32];
  47103. sp_digit ty[2 * 32];
  47104. sp_digit b[2 * 32];
  47105. sp_digit e[2 * 32];
  47106. #endif
  47107. sp_digit* r;
  47108. int err = MP_OKAY;
  47109. int bits;
  47110. int i;
  47111. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  47112. !defined(WOLFSSL_SP_NO_MALLOC)
  47113. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * 8 * 32 * 2, NULL,
  47114. DYNAMIC_TYPE_TMP_BUFFER);
  47115. if (td == NULL) {
  47116. err = MEMORY_E;
  47117. }
  47118. #endif
  47119. if (err == MP_OKAY) {
  47120. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  47121. !defined(WOLFSSL_SP_NO_MALLOC)
  47122. t = td;
  47123. tx = td + 4 * 32 * 2;
  47124. ty = td + 5 * 32 * 2;
  47125. b = td + 6 * 32 * 2;
  47126. e = td + 7 * 32 * 2;
  47127. #endif
  47128. r = ty;
  47129. bits = mp_count_bits(exp);
  47130. sp_1024_from_mp(b, 32, base);
  47131. sp_1024_from_mp(e, 32, exp);
  47132. XMEMCPY(tx, p1024_norm_mod, sizeof(sp_digit) * 32);
  47133. sp_1024_mul_32(b, b, p1024_norm_mod);
  47134. err = sp_1024_mod_32(b, b, p1024_mod);
  47135. }
  47136. if (err == MP_OKAY) {
  47137. XMEMCPY(ty, b, sizeof(sp_digit) * 32);
  47138. for (i = bits - 2; i >= 0; i--) {
  47139. sp_1024_proj_sqr_32(tx, ty, t);
  47140. if ((e[i / 32] >> (i % 32)) & 1) {
  47141. sp_1024_proj_mul_qx1_32(tx, ty, b, t);
  47142. }
  47143. }
  47144. }
  47145. if (err == MP_OKAY) {
  47146. sp_1024_mont_inv_32(tx, tx, t);
  47147. XMEMSET(tx + 32, 0, sizeof(sp_digit) * 32);
  47148. sp_1024_mont_reduce_32(tx, p1024_mod, p1024_mp_mod);
  47149. XMEMSET(ty + 32, 0, sizeof(sp_digit) * 32);
  47150. sp_1024_mont_reduce_32(ty, p1024_mod, p1024_mp_mod);
  47151. sp_1024_mul_32(r, tx, ty);
  47152. err = sp_1024_mod_32(r, r, p1024_mod);
  47153. }
  47154. if (err == MP_OKAY) {
  47155. err = sp_1024_to_mp(r, res);
  47156. }
  47157. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  47158. !defined(WOLFSSL_SP_NO_MALLOC)
  47159. if (td != NULL) {
  47160. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  47161. }
  47162. #endif
  47163. return err;
  47164. }
  47165. #else
  /* Pre-computed table for exponentiating g.
   * Striping: 8 points at a distance of 128, combined for
   * a total of 256 points.
   */
  47170. static const sp_digit sp_1024_g_table[256][32] = {
  47171. { 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
  47172. 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
  47173. 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
  47174. 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
  47175. 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
  47176. 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
  47177. 0x00000000, 0x00000000 },
  47178. { 0x335c1685, 0x170a46d2, 0xe1007a58, 0xeac9e971, 0x43ca4a73,
  47179. 0x40e8f3df, 0x82642475, 0x2646f815, 0xb36576d1, 0x3af49bb4,
  47180. 0x72bf1afb, 0xd89e2d14, 0x2fd151e6, 0x27be882c, 0x8f88717c,
  47181. 0xaddedc85, 0x16ac6c6f, 0xd6d859bf, 0x2d8eae58, 0x0e741a1b,
  47182. 0x61c1f30d, 0x6faf7a00, 0x9b67e096, 0x66dbd09a, 0x7d3b4f7d,
  47183. 0x21f11c06, 0xc727c98e, 0x6152ba02, 0xe86cb221, 0xafd58891,
  47184. 0x6bd3baf4, 0x59e93c6a },
  47185. { 0x71dd4594, 0xe54dd36f, 0x00aef1e6, 0xbbc9cc9f, 0xa19f6530,
  47186. 0x9ea5a44e, 0x3f520928, 0x8588aa99, 0x8f5c1418, 0x9753794c,
  47187. 0xc11399fa, 0x118bd792, 0xf5cb6ab5, 0xb9bd3afd, 0x2ecb9652,
  47188. 0x813d1cb2, 0x40389813, 0xfd456267, 0x4ac8431c, 0x51f7119b,
  47189. 0x0a180eb6, 0xdd9f6a91, 0x9f7bfa2e, 0x13946d17, 0x50a9d0d9,
  47190. 0x16f18631, 0x6f8373d3, 0x5f19c20d, 0x9b6a52b9, 0xbe85ac6a,
  47191. 0x74f62e03, 0x63ef187b },
  47192. { 0x016f45e7, 0x7c376b7f, 0x2bec82f8, 0x1c1bdb57, 0xce429b60,
  47193. 0x7392f741, 0xc7afd81d, 0x6fdbf0a2, 0x7241098b, 0xbda41b1f,
  47194. 0xbb60f8cf, 0x5b407474, 0xb330bc4d, 0x933e0d41, 0x733fa3be,
  47195. 0xae182830, 0x0f5c6cd1, 0xa0ed299b, 0x3f9860c8, 0x7ff3354e,
  47196. 0x15559c41, 0xb1360986, 0x129f85cb, 0xab0cb63c, 0x47685fbe,
  47197. 0x682ecc49, 0xeb199633, 0x505e8ec2, 0xddac2cda, 0x90dcc794,
  47198. 0xf192da23, 0x4fe6791c },
  47199. { 0x05e8733c, 0x94a423d5, 0x1d5717c1, 0xcc845e65, 0xe961b322,
  47200. 0x237c7e88, 0xdb4181cc, 0x0c4471c6, 0x713bd721, 0x00c875e2,
  47201. 0xb2c17b09, 0x9dfde9ed, 0xe88ceaf6, 0x430a6de5, 0x7b81cea6,
  47202. 0xaaa7a61a, 0x233f98d5, 0xea52d026, 0x60689a9a, 0xb55efdd0,
  47203. 0x5cac4aab, 0x30cfa7ce, 0x8e950761, 0xfa4db114, 0x4e9a1e52,
  47204. 0x309570c4, 0x1a040170, 0x18c21f61, 0xbe78d9d2, 0x555d1ffe,
  47205. 0x561db297, 0x04482a18 },
  47206. { 0x73d486d8, 0xe7758ac2, 0x61cdc1e7, 0x8169f946, 0x2188ab4f,
  47207. 0x723c99fc, 0xf3373630, 0xa0e54f02, 0xbd8c2260, 0x560bee25,
  47208. 0x4531bc60, 0x28fc307c, 0x7e44feb5, 0xd6f21f1a, 0x57128d37,
  47209. 0xc8e4499c, 0xd7b2ea45, 0x963b053e, 0x32a3d222, 0x40c27a04,
  47210. 0x35459668, 0x5b51854d, 0xd73557e9, 0x66e1a49f, 0x8692077a,
  47211. 0x0d267fd9, 0xe7342702, 0xfa1350d3, 0x68ccdb44, 0x1a9c3f25,
  47212. 0xdedbf89f, 0x833a0ff8 },
  47213. { 0xab376b76, 0xa8c419c7, 0x27d0f0cc, 0x3b7294f3, 0xa90c514d,
  47214. 0xe56bb9e2, 0xa62575a6, 0x931ba51e, 0x098c0a88, 0x56fee07b,
  47215. 0xb4c16a2a, 0x04be5aee, 0xe6eb260b, 0xe513350b, 0xa1d5c270,
  47216. 0x339edad6, 0xe9dbadd1, 0xf366ed59, 0x2dd06ec0, 0x4213be88,
  47217. 0xcb1187db, 0x22d639c8, 0xd8a1058a, 0x1fec95e1, 0xa2b744f1,
  47218. 0x03f73ea6, 0xf4f05c0c, 0x741fd51a, 0x85f811a0, 0x2e2df95a,
  47219. 0xeb24965f, 0x692b3ce3 },
  47220. { 0xd2a127b4, 0x0ce6cb72, 0x8f92816f, 0x66a46ea5, 0x47a37616,
  47221. 0x43ecf463, 0xe0ab96ee, 0x163d9a01, 0xb2edbe8c, 0xc8145c6d,
  47222. 0x4de4e665, 0x2f426cae, 0x74e252f9, 0x174d0b40, 0x7d2af831,
  47223. 0x54c240d7, 0x3d652936, 0x581fa397, 0xa09d4695, 0x05b9491c,
  47224. 0x5452643c, 0x8c4e8533, 0xd4128327, 0x32d64331, 0x70361f25,
  47225. 0x64479038, 0x89ef09f2, 0x774191b1, 0x81de5fe0, 0xc0cf0aaf,
  47226. 0xf40042d6, 0x333e430a },
  47227. { 0xcf26d3b7, 0x5df04de4, 0xb53f79be, 0x57a77306, 0x1808b664,
  47228. 0xa4013c5f, 0x85037360, 0xef291ea4, 0x0b061037, 0x1ffc9d7d,
  47229. 0x65c913bb, 0xd9d04dd9, 0xf13b8587, 0x948a37af, 0xfe3ee755,
  47230. 0xb5443483, 0x04631386, 0x3fc21e74, 0xcddeb58c, 0xb3a104e5,
  47231. 0x6572cd52, 0x94fe1862, 0x15aaa408, 0xeb9a71a1, 0x459ea462,
  47232. 0x8adc6fe5, 0x4aeb02a3, 0xbb18d175, 0x2f7791d1, 0xae127636,
  47233. 0xd6bbd708, 0x10e8b31d },
  47234. { 0x3ed9f1af, 0xb87f03e5, 0x56676166, 0x03ad2477, 0x74ce15b8,
  47235. 0x38dcd630, 0x26b1e85b, 0x1877e2b0, 0x1af99c15, 0xb1654d17,
  47236. 0x9382547a, 0x9782e9e4, 0x26d55ef5, 0x6dc7fc7c, 0x2fbeb54c,
  47237. 0x9038f95d, 0x036c0357, 0xfe590dfe, 0x4fdc3f7f, 0xcfcb6eae,
  47238. 0xf35e1a88, 0xcb1fbc54, 0xda0a5568, 0x3c8e1db2, 0x5b6f5557,
  47239. 0x9a87393f, 0xe7ac0a06, 0x38646b32, 0x2a8495ab, 0xfd261c83,
  47240. 0x0cdcc4bc, 0x6485524c },
  47241. { 0xc4a6ff2a, 0x1abfb3e2, 0x35a6428a, 0x2aa03fba, 0x89aff742,
  47242. 0x884227f0, 0xba5dbd93, 0x2337883a, 0xd2a182cb, 0x38186ae9,
  47243. 0x49a01f05, 0xb9f0764d, 0x917b1e7a, 0x92411feb, 0x570cbb5b,
  47244. 0x700b1903, 0xb914be7c, 0x5d5181d5, 0x1981182d, 0x135c4437,
  47245. 0x574b9997, 0x32758d24, 0x632d28b2, 0xa650a8f5, 0xfa383f09,
  47246. 0x24078bac, 0x00a33d80, 0x6546a60c, 0x2df8b449, 0xa4061c7a,
  47247. 0xf234563c, 0x1f76f3f2 },
  47248. { 0x44c436b0, 0x9aa2c143, 0x1f69c87a, 0x79070556, 0x5f6db2df,
  47249. 0x35f3117b, 0xed56ba82, 0x85761f41, 0x7d0afa48, 0xf831464f,
  47250. 0x3adce71e, 0xa99f2915, 0x116b7488, 0xb27bf693, 0x9bb9443a,
  47251. 0xa98a5a8c, 0x2ee5fde8, 0x7f878026, 0x1812acb7, 0x3a6f93dd,
  47252. 0xdc84bc92, 0xaf92a4cc, 0xf1d4995a, 0x3c2562af, 0x04ed899d,
  47253. 0xfd9fc33c, 0x4ed2a538, 0xc028ca94, 0x049ea726, 0xd0f367bb,
  47254. 0x3d108e05, 0x04924ffb },
  47255. { 0xc673562f, 0x06548e3d, 0xe2eae48c, 0xd3b33025, 0x5e1c6977,
  47256. 0xe61fd32b, 0x6ebe557b, 0x424e2064, 0x41d6e18e, 0x767391c0,
  47257. 0x14d7e95b, 0x4b8ebb8e, 0x20991b8c, 0x4ae8b7d4, 0xe01290d3,
  47258. 0xf8a0df66, 0x925e5f4e, 0xc97e24a3, 0x1508272a, 0x79a7b2cb,
  47259. 0x25072661, 0xb40b072e, 0x9062fa49, 0xdad9e182, 0xf3c53bce,
  47260. 0x8780a784, 0x9f142799, 0x58a82b76, 0xc1468426, 0x08cd849c,
  47261. 0xc380ae35, 0x4dfce809 },
  47262. { 0xd527b780, 0x45069cb2, 0x977930dd, 0xd52da015, 0xe27d0263,
  47263. 0x10cc600b, 0xbb2d1b2b, 0x34102c26, 0x554adf3c, 0x4c652623,
  47264. 0x45f0ff47, 0xd6891382, 0xca916e7c, 0x83fa8cc5, 0xd15c8d8a,
  47265. 0x1e10f139, 0x81dc56b3, 0xf173dc2e, 0x5c4ed9ba, 0x7fcecb04,
  47266. 0x47d01228, 0x307fd7d8, 0x9f3a532f, 0x24a57153, 0xe2153c22,
  47267. 0x59e9e81d, 0xe428a408, 0xc562595d, 0x9339bd23, 0xdc7daff8,
  47268. 0xb8a06802, 0x0d075908 },
  47269. { 0xde085f2a, 0x870af2a7, 0xbe99b2e5, 0x88fcd24f, 0x59ca413b,
  47270. 0x88c0d261, 0x8559f851, 0x1f02a2e4, 0xf622da0d, 0x83b96021,
  47271. 0x6dca3615, 0x5c05c2f5, 0x7910c682, 0x0148cf1c, 0x272695be,
  47272. 0x392f2896, 0xa8d64ef6, 0x883d0bb5, 0x1cfcbc52, 0xef0d2244,
  47273. 0x526117e5, 0xf5dafcec, 0xf04928e9, 0xb68612b9, 0x393f2e2a,
  47274. 0x283f744d, 0x700c1151, 0xfbeed7ed, 0xa4360dfe, 0xf2cde215,
  47275. 0x2f08535a, 0x24fa961c },
  47276. { 0x616df7f6, 0x0767db3f, 0xfbd90326, 0x643057d8, 0x6e82d544,
  47277. 0x174daa90, 0x689643db, 0x2284f345, 0xcc89a060, 0x18b191df,
  47278. 0xd6c27d12, 0xbab46af4, 0xc9895145, 0x5a57f486, 0xcc942f9e,
  47279. 0xc03214e9, 0x41950158, 0x273e1c8f, 0x39ad43ab, 0x8ceb759f,
  47280. 0xe50ee173, 0x5e1b8b7f, 0x8f4d7d4e, 0xf635b1fc, 0x755603f3,
  47281. 0x8eff77e3, 0x7752fa60, 0x201f61d1, 0x4a6fb6e1, 0x94d7a03d,
  47282. 0xfc4f0114, 0x371cc23d },
  47283. { 0xda90c351, 0x289b115d, 0x364d9c06, 0x6d196ebf, 0xf650b31b,
  47284. 0x77a89202, 0x6f57642f, 0xcc28c164, 0x08100127, 0xdc4f7e36,
  47285. 0xdc4c807b, 0x8836cd08, 0xe00240f2, 0x1280f156, 0x99cb3953,
  47286. 0x3f9a6d78, 0x3a802038, 0x40a494d3, 0xe87d3474, 0x45697e91,
  47287. 0x26dde24a, 0x70d97d07, 0x7640c30e, 0x06f6a58d, 0x5ba6e6c6,
  47288. 0x03c2c0e8, 0xf1bc13e8, 0x330f6a7a, 0xc9f4d78f, 0x3e602e4f,
  47289. 0x0c80fb7f, 0x92b6bca0 },
  47290. { 0x5f00822e, 0x2e3d5c83, 0xb8b16f12, 0x0e825712, 0x92b0a330,
  47291. 0x81c329c4, 0xa7cc1954, 0x6b4e32ad, 0x1bb1413f, 0x0bee9cee,
  47292. 0x4a92ca27, 0xedfb7baa, 0xea3b9153, 0xcd472afa, 0x00f0c0f9,
  47293. 0xe8f09e7e, 0x5cdebb70, 0xa4e1d872, 0x4a9b63b6, 0xfe2bae08,
  47294. 0x3fd58f65, 0xf40141b8, 0xa3b62759, 0xd7ec5eda, 0x790e3088,
  47295. 0x9aaf6e67, 0x1f277e31, 0x215ad830, 0xcf33871c, 0xe7db4b98,
  47296. 0x4f02f89d, 0x71ff62c9 },
  47297. { 0x2a4a84d9, 0xaa4c7102, 0x5ebc71e6, 0xe2ee4acd, 0xf1cd6578,
  47298. 0x3b11a8a5, 0xfff120a5, 0x83f5ef9f, 0x09e65033, 0xa4c598e1,
  47299. 0xca044180, 0xe1e9f990, 0xf59828c1, 0x8b832d46, 0x33af536b,
  47300. 0x753f28a0, 0xb6d4f68a, 0x92edc4b1, 0x72ccd1f0, 0xedde692a,
  47301. 0xd2226432, 0xd3aa0f7d, 0xa3d2661c, 0x38dbb63e, 0xfdc37dda,
  47302. 0xf1e19fc6, 0x84ef6b4c, 0x6c18b350, 0xdf1bba69, 0xe6a83fe9,
  47303. 0x5f958273, 0x40fd47e7 },
  47304. { 0x267140a4, 0x5b88b746, 0xeab6f2fb, 0x6dbbfc1e, 0x69862548,
  47305. 0xdd9ec88e, 0x2eb6efc2, 0x69beeba1, 0x8ac8ff88, 0xcfc2214a,
  47306. 0xb5a21950, 0x95d5c96e, 0x4171fb69, 0x93389c05, 0x1b468337,
  47307. 0x2d85d452, 0x4113425c, 0x14d68a08, 0xec6c2174, 0xe52c0139,
  47308. 0xf730084d, 0x20cf0b97, 0x1f578aa3, 0x1ac16a26, 0xf9b6ae43,
  47309. 0x18b9fab3, 0xd854a695, 0x68d82111, 0xdffbe286, 0x0b334d98,
  47310. 0xe639338c, 0x5b1c1157 },
  47311. { 0x72b6bb8f, 0x90edaab1, 0x02fc92c2, 0x8dc64ed2, 0xfe694c73,
  47312. 0xf42ba3c5, 0xcb54dce4, 0x316dc65f, 0x632420dc, 0xcb2d66a3,
  47313. 0x056dcf94, 0x16e706e7, 0xa4f32c9d, 0x2809c764, 0xea6edca8,
  47314. 0xab18d830, 0x81c65f57, 0x4fd1ace6, 0x7da12c10, 0x1f91651c,
  47315. 0xc7791a48, 0x0ac3bd66, 0x785e67a3, 0xb6ad1cf4, 0xda0fd591,
  47316. 0xe4d3fc44, 0x6e1c6344, 0xce164801, 0x33e50ab3, 0x84de9cb8,
  47317. 0xa756eef4, 0x963ab83a },
  47318. { 0xdf4ea5a3, 0x944b47d8, 0x5cfe45fe, 0x96568815, 0x8a3c3564,
  47319. 0xd16e7d58, 0xe7c99e15, 0x84e55b3e, 0xf55071bc, 0x3fee204d,
  47320. 0x04057dce, 0x71006f29, 0xbba75570, 0xfe8c390d, 0x3319adac,
  47321. 0x3645bcb6, 0x7c20bfd8, 0x8189e8b0, 0x7d7d9578, 0x8e550969,
  47322. 0xb99f4e3b, 0x037d1321, 0xa60cfb6a, 0x011b2521, 0x837382da,
  47323. 0x66594aaa, 0x83c1dc07, 0xc89b91fd, 0x076b9884, 0x6b82b899,
  47324. 0xbe45c558, 0x443480fc },
  47325. { 0x9114221a, 0xf8ffffb4, 0x3e857a7a, 0x4aec4f2e, 0x0fa54787,
  47326. 0x42e2d0e4, 0xd6f96152, 0xef3e6b31, 0xfbfe9b77, 0xb2296537,
  47327. 0xfb43a86a, 0xc2a9d0f2, 0x24572ac6, 0x241284ed, 0xe721ba7b,
  47328. 0xa3868917, 0xc117a78d, 0xdbef7c00, 0xd31605ac, 0x38149071,
  47329. 0x065a8ee9, 0xc2dada9e, 0xc442be82, 0xd5b138d8, 0xf6d72b58,
  47330. 0x9b6c224b, 0x8eb03e6d, 0xb9d355cf, 0xa1700371, 0xab6d1eb0,
  47331. 0xcffaa7eb, 0x97118a88 },
  47332. { 0xcdecb5d8, 0xbf9c59a2, 0xa93a6866, 0x8083c81b, 0x04774fbf,
  47333. 0x24e0dd81, 0xa02070b4, 0xe779a3ca, 0x0fbfb781, 0x9d352fbb,
  47334. 0x3ef2a1c4, 0xa8b0d820, 0x14b3e501, 0xb858637b, 0x8a882ff2,
  47335. 0x5ba70a49, 0x3b06efa5, 0xa2730083, 0x102fee2a, 0xa42c02f4,
  47336. 0x8a0223a5, 0xe4e76299, 0x85c3fc72, 0xdba2ba26, 0xfe52eae7,
  47337. 0x554fe763, 0x270f45f6, 0x30b5405a, 0xa573387c, 0xd56a177a,
  47338. 0x4b71fa82, 0x17c0778d },
  47339. { 0x2735e37b, 0x0e6dff1d, 0x656ec572, 0xc9884e56, 0x9ebba978,
  47340. 0xa2f5ac9d, 0xba09f3c4, 0x40fa4518, 0xf5b04377, 0x8c3fa177,
  47341. 0x967a2eca, 0xa1a1decd, 0x0528bd40, 0x768bca70, 0x18691c4a,
  47342. 0xf224952b, 0xe86d5fd5, 0x16e12c45, 0x37859a6a, 0x7a0d9157,
  47343. 0xa0ffce0e, 0x723f4309, 0xa96cc9a3, 0x5a8db79b, 0x1ad23a38,
  47344. 0x6dd12ae0, 0xe2bf5d84, 0x9ffec3a1, 0xa452ed66, 0xd6ce84e1,
  47345. 0x571fe4c6, 0x1219d5c8 },
  47346. { 0x262969eb, 0x43eaa67f, 0x2f03e773, 0x3a3ab39d, 0x57bb0909,
  47347. 0xe6127e51, 0x8d150274, 0x0f82b0ed, 0xe580bdbd, 0xffffcad8,
  47348. 0xa9743e6b, 0x51d3d075, 0x8bac11d6, 0x1484bdb1, 0xeb24c388,
  47349. 0x95cd9990, 0x7fac67c6, 0x216a61d0, 0xa04e6b87, 0x4308f762,
  47350. 0xcba57cc8, 0x2865dd61, 0xd234a07a, 0x3c296b0d, 0x3a0793f9,
  47351. 0x76f92839, 0x0be29ece, 0x70b57e1f, 0x7e626f42, 0x1314a82f,
  47352. 0xd657f230, 0x2c8d7ab2 },
  47353. { 0x0825e4d6, 0x67cf5892, 0x6ef83b44, 0xdf51eaa5, 0x1310108d,
  47354. 0x63e665d8, 0x8dd0963f, 0x229f89f5, 0x9df6436a, 0x8c4b14dd,
  47355. 0xd45ebba7, 0x99dae469, 0x5a4df381, 0x118aab77, 0x29e37feb,
  47356. 0xda8978bd, 0xaca2d7ef, 0x69ced5aa, 0xc67d6a8a, 0x6c98d05d,
  47357. 0x77f84a34, 0x7474bf0d, 0xed8cd59a, 0xd4428b2e, 0xd1d398fb,
  47358. 0xb0fd1cd5, 0x94a20b11, 0x596013db, 0x1b404c44, 0x96eb705a,
  47359. 0x4b09d958, 0x2299d277 },
  47360. { 0xc64397e6, 0x5b9cd58d, 0xbf6dd31e, 0xac198f1e, 0x3e9f1db2,
  47361. 0x5866d8e1, 0x8fcdc68c, 0x405ae287, 0xe53c01fd, 0xa4b280cd,
  47362. 0x411db5f6, 0xdc963f2d, 0xbec4f8a0, 0xed5d5189, 0x916ee98b,
  47363. 0x336fd13d, 0x042df48e, 0x6925b1b3, 0xace0074e, 0x0cf56291,
  47364. 0x25317e95, 0xe8d38b48, 0x821c446b, 0xc7ad1d2b, 0xf0b65934,
  47365. 0x71c44135, 0x52ca0d50, 0x971b736f, 0x27b46c26, 0xaf9ffa57,
  47366. 0x1936618e, 0x21ac6779 },
  47367. { 0x2d7fbcd2, 0xab420e3f, 0x97bdfc18, 0x12722473, 0x4df5d4b4,
  47368. 0x492033f8, 0x3807b7d3, 0x6fcd4236, 0xb33c3625, 0xdfc19b09,
  47369. 0xa0f22814, 0x13d6f375, 0x037c19b8, 0x70978a59, 0x0ff27b9c,
  47370. 0x4f398997, 0x615a4389, 0xfc0e1a45, 0x3e602f74, 0xffa3496a,
  47371. 0xb261ca1c, 0xc3f1c431, 0xee0164cd, 0x612211db, 0xe7f7be9f,
  47372. 0x30463ee4, 0x92c2e1bb, 0x015f7e78, 0x24483a56, 0x663d88d6,
  47373. 0x0e62d9d8, 0x0e8ec1e7 },
  47374. { 0x8a0878dd, 0xa88ccc29, 0x6640071a, 0x99ac175d, 0xa5173617,
  47375. 0x90344820, 0xdd58a315, 0x316d023e, 0x88d221a1, 0x30785bd4,
  47376. 0x959c48e3, 0xb74b3de7, 0x4c67a771, 0x42ee0382, 0xe0b91453,
  47377. 0x59ef6cdd, 0x9b237e91, 0x7830ae28, 0x495d8325, 0xe1847a4c,
  47378. 0xd0773666, 0x67b1217e, 0xa294a325, 0x58192c86, 0x864d8326,
  47379. 0x76aa0f56, 0xf4b13e5b, 0xe2a2bd12, 0x1b6b73fd, 0xd850c1c0,
  47380. 0x5d103635, 0x653a795f },
  47381. { 0x50dcb199, 0xcfe28985, 0x7fa02b60, 0xb35b8e5e, 0xc97603d0,
  47382. 0xbca7d7c3, 0x27f131b5, 0xb0e5288d, 0xe2b12d52, 0x3aa704de,
  47383. 0x1db725c7, 0xe206b1d8, 0xc5d1b113, 0x0b12839a, 0xdb45d763,
  47384. 0x14f970cb, 0xb2125e8e, 0xc997f93e, 0xee7daa26, 0xbd75739c,
  47385. 0x1fef20e9, 0x46ecbd3f, 0x7c6a42b1, 0xf994a114, 0x27fb0fd1,
  47386. 0xd289eb4f, 0x9a40da4b, 0x11186d31, 0xfb9d7976, 0x083f65a5,
  47387. 0xd444675e, 0x30dfc47b },
  47388. { 0x9eaadfe8, 0xbcfc5ae2, 0xb4d4e812, 0x25027e54, 0x8b533561,
  47389. 0xab0702df, 0x56a6a214, 0xa2b9c204, 0x3059068e, 0xb1a3df7a,
  47390. 0x9883110f, 0xa3514b21, 0xc4b78e1c, 0xb7be2336, 0x3e2f6984,
  47391. 0x17073ce6, 0x2ddf7ac6, 0x86e114a6, 0x07d7c3c8, 0x276192bf,
  47392. 0xeb1ae289, 0x5da69e0b, 0x25184939, 0x983af175, 0x407a3aa0,
  47393. 0x9ac52a4d, 0xae0fe218, 0x1535c7da, 0x397f2501, 0xe16fe872,
  47394. 0x54c212cf, 0x572a591f },
  47395. { 0x09a5553a, 0x49668419, 0x327733bc, 0x3f054318, 0x3eefd690,
  47396. 0xf9ceb4b2, 0xf22126d4, 0xbd3cbf9b, 0x2fed9578, 0x6d9671c0,
  47397. 0xca0306d8, 0xbba597ce, 0x3d674fe5, 0xb705ed61, 0x67f33f76,
  47398. 0xf1d3622b, 0x11cb8c31, 0x15bcf3c6, 0xe53d1aa9, 0xa38467dc,
  47399. 0xf908ab43, 0x902fe929, 0x8d15767a, 0x6e3e499d, 0x90afd07b,
  47400. 0x8142db5c, 0x6c8b190e, 0x120c6fbc, 0x24919a4e, 0x80c86553,
  47401. 0xd8c82c3c, 0x65c2cbe1 },
  47402. { 0xa660bb63, 0x684cda20, 0x86e86245, 0x27dc3b0a, 0x6ba0eed7,
  47403. 0x76472cf6, 0x679dd158, 0x79c162e5, 0x08452d44, 0xb6884277,
  47404. 0x413f579e, 0x829bc6b3, 0x95011770, 0x92ea15ec, 0x47738183,
  47405. 0x5e34e300, 0x73e1d2f1, 0x8c3ca349, 0x229bd3de, 0xa5c4f1dc,
  47406. 0x94ef7ed3, 0x783eff1b, 0xdfae7a1a, 0x46db738d, 0x1a099852,
  47407. 0x4353d72e, 0xa0dcf4ab, 0x2533ad58, 0x0e7888b9, 0xd8055016,
  47408. 0x3ba77f66, 0x831440d5 },
  47409. { 0xf611b2da, 0xf43e2e32, 0xd0fa46ac, 0x5d066e29, 0x820b3c0d,
  47410. 0xe897f3e8, 0x1d3e44f0, 0xc45c28e6, 0xdfd27a66, 0x929d7f66,
  47411. 0x101e8517, 0x735b860a, 0x3de078dd, 0xea3fce98, 0x638ce11a,
  47412. 0xc9977db5, 0x48536b3b, 0x0488382f, 0x64cadfc6, 0x7e0c7a3c,
  47413. 0x82147b71, 0x3cd17f7f, 0x1b411e3e, 0xe95663cc, 0x985fb46d,
  47414. 0x5739ac8f, 0xbcf119ca, 0x385399cd, 0xe15a2815, 0x4a985a70,
  47415. 0x6d5f4566, 0x504c3a8a },
  47416. { 0xb8fa53c7, 0x00b55283, 0x509474e3, 0x985cff38, 0x437ce25f,
  47417. 0x234d241c, 0xe5a129ed, 0x29832430, 0xaabcc674, 0x6ad38956,
  47418. 0x7ee81ee1, 0xa2dc001d, 0x670b2702, 0x4c23c6b6, 0xa6e8a3bb,
  47419. 0xb35e567e, 0xa69673ea, 0xbc70b3ce, 0xe6e28eac, 0x85a7a9c3,
  47420. 0x5537b7da, 0x2ae684de, 0x6de937dc, 0x5ecac3e5, 0xf8430422,
  47421. 0xbf2ea6c9, 0x77fdc520, 0x38caf7d0, 0x69f56add, 0xc27af0b1,
  47422. 0xc71d21d2, 0x496e4699 },
  47423. { 0x9fa93467, 0xba14fc82, 0x0eb2a614, 0xc2e37684, 0x4833e09b,
  47424. 0x659bcfaf, 0x3686bdcc, 0xbc859752, 0x81f3216a, 0x40bfd080,
  47425. 0x17c081b8, 0xc463bda6, 0xbb04793b, 0xbd01fa86, 0x2cd640c5,
  47426. 0x5a21ece6, 0x2203d5c4, 0x97bf6a54, 0x951167b7, 0xceb40edc,
  47427. 0x765ba268, 0xd67aacaf, 0xaeab51f9, 0x8ba0d9e9, 0xb0d6863a,
  47428. 0xc14b215e, 0xe5f06952, 0x354cdcdb, 0xcb3744b5, 0x4f2b5ccf,
  47429. 0x13037fe8, 0x13389173 },
  47430. { 0x45003cd1, 0xee680640, 0x44ae2ac6, 0xfdac17bc, 0xde8e5314,
  47431. 0x4bcd419f, 0xc7cea95c, 0x81e34eb9, 0x38f37e01, 0xbb57762d,
  47432. 0x260990c8, 0xecc4cfb0, 0x50a34a7b, 0x0bc493f9, 0x543304ef,
  47433. 0x68074172, 0x6bc8aa2a, 0xaec0fcb2, 0x3b45fea5, 0x9e7a9b46,
  47434. 0x55fbdbac, 0x4bb2952e, 0x0485dff4, 0x50f0c0a6, 0x4dea4796,
  47435. 0x02c5104d, 0x695e3a02, 0xd2cefa09, 0x6da1f345, 0x4c8102b4,
  47436. 0xf3833fbd, 0x422eb573 },
  47437. { 0xa6ad3f47, 0xac592eb6, 0x9714ba0e, 0xb0861f6d, 0x07281459,
  47438. 0x57c1e919, 0x64ea5803, 0xcf7c94e2, 0x54b12723, 0x725376ac,
  47439. 0xdafb736a, 0xf2a6ba41, 0xcba03cdc, 0xc89e8920, 0x5b0fd3ad,
  47440. 0xf2e20cb4, 0xd66059fe, 0x26ea5a54, 0x889df8bc, 0xee63fa8b,
  47441. 0x66a3f2bf, 0x40f1c7e1, 0x747312e1, 0x09febc9c, 0x727999ff,
  47442. 0x7d19b9c2, 0xb7fd2b05, 0xa9fbbb4c, 0xa0da2dc6, 0xcfba27d7,
  47443. 0x2c252582, 0x368541cf },
  47444. { 0x22799d37, 0x510d3c9e, 0xacfa333a, 0x1b677de5, 0x080f795b,
  47445. 0x4e6ae18f, 0xafc8dfc2, 0x69b53c2a, 0x0e842dc2, 0x797541b6,
  47446. 0xac067fe8, 0xd5a6f2af, 0xbd07d877, 0xd0208a03, 0x654be2f2,
  47447. 0x34b473f0, 0xf515e23e, 0xe67c102a, 0x2ac1af48, 0xb00dbf9d,
  47448. 0xb6a13d00, 0xe264fa41, 0x97e94c11, 0x1669786a, 0x86a586f4,
  47449. 0x09d8cf2d, 0xc7f927e9, 0x073bf869, 0x2241a566, 0xb8977880,
  47450. 0x22261334, 0x59a5bf59 },
  47451. { 0x81347191, 0xe9d1c91e, 0xeb969972, 0x186c1abc, 0xa9d46a7f,
  47452. 0x07888767, 0xdaa7d397, 0xda93cfcc, 0xd91b9aa0, 0x08bee9f1,
  47453. 0xf8dd3c6c, 0x8267fd78, 0x94228100, 0xf93860d0, 0xdadb47fb,
  47454. 0x6a6a71aa, 0xa6156f8a, 0x9caa06b7, 0x39848bc9, 0xaa1b05e0,
  47455. 0x2aaa9135, 0x36ddc237, 0xb13f3bd1, 0x77e7e079, 0x4acc5f4d,
  47456. 0x8d0b5cbe, 0x984cfd36, 0x04da45f8, 0xd3d3e0f8, 0xf14ef618,
  47457. 0x43eb799c, 0x467564c1 },
  47458. { 0xb6fff5d7, 0x8d725904, 0x92dc4752, 0x037f33af, 0x6d20b8aa,
  47459. 0x9095d575, 0x43baec39, 0x32235fc1, 0x68a2b9b0, 0xa2feb4af,
  47460. 0x94d35c61, 0x61c50318, 0xea877486, 0xac92b6a2, 0x011bc6f3,
  47461. 0x8eb48b15, 0xc79edcb2, 0xa28fe128, 0xa5d2a006, 0x9f71bc0c,
  47462. 0x2f15b850, 0xf3167732, 0x7a036218, 0xfe8d728c, 0x4f81e09e,
  47463. 0x068f39cb, 0x7b7c50d9, 0x1773f016, 0xed6a1e03, 0x0d0f7adb,
  47464. 0x4ee984d5, 0x8a0dee16 },
  47465. { 0x47366e6f, 0x504991bf, 0xe86c3005, 0xb8084d9f, 0xa40cce36,
  47466. 0x14c4c751, 0x3f1961e2, 0xbbb46aa6, 0x40445e43, 0x56a785f9,
  47467. 0xc91e215f, 0xdb8d1b57, 0xc7ee808d, 0x6a8e453e, 0xbbaa1e8c,
  47468. 0xc0367ef8, 0xe3e18109, 0x310d91f1, 0x7e20a2c3, 0xf97cfd0e,
  47469. 0x554cc277, 0xf1e80c84, 0x7b628403, 0xe89bbc1d, 0x3fe0a17c,
  47470. 0x7778a966, 0xc1f00073, 0x9e9db19f, 0xb6f6bed2, 0x2ce7fe7d,
  47471. 0xee97ce23, 0x7b04b5d2 },
  47472. { 0x82c5faf8, 0x5b546bc7, 0x8eb81097, 0x1a734c5e, 0xe77851e0,
  47473. 0x3d566861, 0xe956d51f, 0x833a1013, 0xc3c3c37c, 0xc7351731,
  47474. 0xe0c148ec, 0x607738fb, 0xe1bbef41, 0x2ec6f0bb, 0xcfa51857,
  47475. 0x0aa2ac6e, 0x66e3adf0, 0x072902d7, 0xc622d6e3, 0xcd4d5089,
  47476. 0xa6dd802f, 0x3ae21b23, 0x33886372, 0xe5465a55, 0xa8d81822,
  47477. 0xd85119a0, 0x3786977a, 0x4f14d032, 0x9c7b272c, 0x515b081c,
  47478. 0xc99be31c, 0x1c6a95a4 },
  47479. { 0xc2821363, 0xa6b14ad5, 0x4d17de1c, 0x829c1823, 0xccade848,
  47480. 0xaef5d2c4, 0x82489e27, 0xf412ab39, 0xf081d927, 0x92c9c098,
  47481. 0x75cbad1f, 0x6f87bdf4, 0x1a1d9fb1, 0xf4aadab8, 0xb75f3b76,
  47482. 0x475a7923, 0xdbbba8fe, 0x99dd0ad6, 0x4b70ab45, 0x836f6164,
  47483. 0x34bd9af1, 0x2a464881, 0xba9abda3, 0x5c91226e, 0xe65625fb,
  47484. 0x4cec8709, 0x0818e4be, 0xd4b3919e, 0x14f6879c, 0xa5c09c84,
  47485. 0x30a864c9, 0x72708a02 },
  47486. { 0xf34a466c, 0x4f33c0b1, 0x7f9d45ba, 0xa1bae09c, 0x0e28785c,
  47487. 0xd70f0fee, 0x90880881, 0x824c7146, 0xbb043da3, 0xe2416c2a,
  47488. 0xcec6f432, 0x733da713, 0xc9793e1c, 0x2b590649, 0xb35c9365,
  47489. 0xdb62d5b0, 0x3e5c1b2a, 0x355eb6e2, 0xbb16b515, 0xcfe8b5ce,
  47490. 0xf709691c, 0x9e081869, 0x61a85bd5, 0xc865f9fb, 0xfae103f7,
  47491. 0xf169d3cc, 0x73467e9d, 0x9525c473, 0x43695113, 0x7db55c0b,
  47492. 0x73265d21, 0x7491c74c },
  47493. { 0x80d2b94d, 0x312ed5bf, 0xba4b260b, 0x1b8ac633, 0xd62219a1,
  47494. 0xac86c58c, 0xaeb82c8e, 0x317ccf6b, 0x59ef9ced, 0x2dfb29ee,
  47495. 0xe42bcd5a, 0xdaa7d898, 0x5974b201, 0x93e295c8, 0xd9fc5adc,
  47496. 0x69e75784, 0x012aa3ba, 0xd6c4709f, 0xc85d3cb9, 0x1fda9f37,
  47497. 0xd3dd4abd, 0xe5487e25, 0x0b3ba22e, 0x00fd4b01, 0xc6e8dcbb,
  47498. 0xcb591493, 0xbce68664, 0xb7329fab, 0x68906b76, 0x6829d1c2,
  47499. 0x74176841, 0x8bcfd3e5 },
  47500. { 0xd3c8c314, 0x06882734, 0x11870833, 0x95f0b2f1, 0xc068ba16,
  47501. 0xb937f7c3, 0x77924787, 0x5365e0d8, 0x1f992227, 0x15527e5e,
  47502. 0x27dffd4f, 0x0a069648, 0x2f586389, 0xd58b3df2, 0x6af20ead,
  47503. 0x83446b89, 0x50746257, 0x09d7970b, 0x4022a691, 0xd9e8d206,
  47504. 0x671ec379, 0xd1e5f8af, 0x057fe91e, 0x6f542509, 0x52890418,
  47505. 0xf14dda81, 0x1db932ad, 0xbd78010e, 0x905a9378, 0x3e18d1e4,
  47506. 0xbd37ab49, 0x53cadcf7 },
  47507. { 0x5e53d0ff, 0x1bb5edf7, 0x888abf67, 0xd886606c, 0x12206d15,
  47508. 0x6491b0f8, 0xe22b6a33, 0xb3018345, 0xb173b317, 0xaba6794b,
  47509. 0x7dc9e595, 0x8c1e5867, 0x239624d1, 0x4e106482, 0xda55dd53,
  47510. 0x61752e59, 0x9e42879c, 0x018b4eab, 0x491f2bed, 0xcaf6784b,
  47511. 0x1e79429e, 0x3dcdb9d2, 0x10f26224, 0x36941485, 0xa650ec5c,
  47512. 0x106f190a, 0xb69a9760, 0x7542a5ae, 0xc32d1046, 0x69bd75e9,
  47513. 0xbf8c62b1, 0x90849964 },
  47514. { 0x5a93c661, 0xb1390cf6, 0x9db5f056, 0x18486264, 0xa51a1788,
  47515. 0x92a93a9d, 0x6772de9a, 0x1b0cbb8f, 0x7c71487c, 0x6e67febd,
  47516. 0x4e62423e, 0xf9b4382d, 0xbb5a42f8, 0x96fda50e, 0x6089a4f2,
  47517. 0xc921b337, 0x875ec516, 0x49d32d7b, 0xc410124b, 0xbd86d2ca,
  47518. 0xc421fb7a, 0xf6862209, 0xf6b7de33, 0x3e1949ab, 0xe93c9268,
  47519. 0xcdee18f0, 0x08dc4cc0, 0xd4edbd5e, 0x73580d22, 0xc2b75be4,
  47520. 0x468cd7e8, 0x3d7f6ffa },
  47521. { 0xdffbd5d1, 0xea7b290c, 0x970338df, 0x9d759da6, 0x90feedc9,
  47522. 0x56680b08, 0x42dce68e, 0xbc690af5, 0xb2ae4d82, 0x8519df2b,
  47523. 0x7f195b60, 0x5612467f, 0xd83c21f4, 0x659a342c, 0x55651633,
  47524. 0x55771bf5, 0x548ba562, 0x5fc68935, 0x9492f23a, 0xb5419203,
  47525. 0x9c9c6017, 0x567528e3, 0x511e6019, 0x3f064ed4, 0x1d16a555,
  47526. 0x303f9eb9, 0x2254abee, 0x3e18c4fd, 0xfd434e7c, 0x40994d6f,
  47527. 0x6dde74e6, 0x8fb12d3f },
  47528. { 0x293cb7a4, 0x6c6381a2, 0xb87b7e4d, 0x453e09f0, 0x078ac3ef,
  47529. 0x4f212823, 0x578cae91, 0xe89ffad0, 0x716ba4dd, 0x4a2b696a,
  47530. 0xf6f580a0, 0x14681a14, 0x4c2f1307, 0x1358f97b, 0x2932fb89,
  47531. 0x87896996, 0x268a5af7, 0x29dd850a, 0xfe239f83, 0xaf771f6d,
  47532. 0x4f47499d, 0x5f20fd2e, 0x867ca0e9, 0x9b643e77, 0x375981ec,
  47533. 0xe7858ecd, 0x19ab1c97, 0xbe946a59, 0x06ff3453, 0x4f9303a2,
  47534. 0x75d237b1, 0x3fcc6731 },
  47535. { 0xdf21f920, 0x509debd5, 0xc1401b90, 0xfaf70e1f, 0x95a64aaf,
  47536. 0x2429cbfd, 0x2c37a122, 0xf2120855, 0x7deb926b, 0x1d4c93f4,
  47537. 0x9fb3f1dc, 0x12f3e4c0, 0x5b51bc46, 0x56085a59, 0xf10fdbd2,
  47538. 0x2a2f5d62, 0xdf0cb3c2, 0x60dd62cf, 0x6b0f254b, 0x154424a3,
  47539. 0x564612b7, 0xc3a5a05d, 0xa1f5249c, 0xbebe30cf, 0x7e62a188,
  47540. 0x24ec6903, 0xaf429939, 0x75f0fbac, 0xb3fa8685, 0xd41345dc,
  47541. 0xc7151c34, 0x645146fd },
  47542. { 0xba1924f9, 0xecec633a, 0x006326e1, 0xbba6f136, 0x7e50fc17,
  47543. 0x203757ac, 0xef3d8e00, 0xca531919, 0x51dc5a74, 0x9545a6aa,
  47544. 0xd31412b8, 0x6e21d58f, 0x7bb1d000, 0x01bc3005, 0x6ed1a9c3,
  47545. 0xf1789c69, 0x9858fa48, 0x7af2d35f, 0x8197be85, 0x434d09b9,
  47546. 0x29aa265d, 0x1dc07755, 0xc058fa80, 0xcad03be7, 0x54ba14ce,
  47547. 0x92d70a9f, 0x6c050a74, 0x6dc78505, 0x4d005dda, 0x2a7ca4a9,
  47548. 0xabfb9f2e, 0x448d3d72 },
  47549. { 0x29b33989, 0xdc56f145, 0xa9ae815a, 0x868351bc, 0x4b074414,
  47550. 0xb3f45613, 0x3cd9f33b, 0x955ce42a, 0x5ff6e4a3, 0x13ade4ec,
  47551. 0xa50eaa91, 0xd3aac715, 0x5666efdf, 0x0c61ec99, 0xf6a4470a,
  47552. 0x108a28b8, 0xe54844c9, 0x402ef584, 0xd0e2f337, 0xb825b162,
  47553. 0xb46f7cbc, 0x3dcd131f, 0x96f2fd89, 0x208178ec, 0x25928c78,
  47554. 0x4d8c5d67, 0x9963c459, 0x285a33df, 0xd92a309f, 0x72497175,
  47555. 0xcb7019a5, 0x76881479 },
  47556. { 0x91767eed, 0xba43a114, 0x92bf65db, 0x5e11b9ad, 0x03a5e21a,
  47557. 0xe8a22ce0, 0x2a335415, 0x63604421, 0x4a9ead62, 0xc2c563b4,
  47558. 0xa0b2aee5, 0x4bc06264, 0x8bf2e1d7, 0x75b8d575, 0xd08a265d,
  47559. 0x1cff0ee7, 0xb0b712a7, 0x17914e1d, 0x4b18692d, 0xc35925d0,
  47560. 0x56cce815, 0xde253f4c, 0x9fff0e3a, 0xa479241c, 0xddabed19,
  47561. 0x50b9d06e, 0x59fae506, 0x67135260, 0x532ce180, 0xf37600fb,
  47562. 0x5e5a8626, 0x670eb01c },
  47563. { 0x73cdbb43, 0xdf73c0af, 0x7f2431ad, 0xcf08ecc5, 0x2a1a3845,
  47564. 0x91780541, 0x9224ddf1, 0x69a104f2, 0xbeac7eff, 0x4352f38d,
  47565. 0x7c2d1322, 0xfc3b3b4e, 0xb5e4b476, 0xa69e9430, 0x975a46f0,
  47566. 0x7d932340, 0x5d64eece, 0x8093899e, 0xdb2345e9, 0x7b821250,
  47567. 0x7f4b796b, 0x23552932, 0x4bb90b1f, 0x2ee9cc15, 0x9112f7d6,
  47568. 0x1fa9c8f5, 0x1cbaae32, 0x2d0f2f98, 0x0075166a, 0xb77f0366,
  47569. 0x635dff27, 0x504852e7 },
  47570. { 0xa2f392fa, 0x2f0f3ce5, 0xec6c9078, 0x326c076a, 0x84baaaf6,
  47571. 0xad01de92, 0xcbe8e993, 0xb01b16d3, 0x2d950908, 0x71305c24,
  47572. 0x3853af38, 0xc66fd617, 0xd3c429a0, 0x7735140e, 0x1fabf027,
  47573. 0x8a31b12a, 0x058b3177, 0xa0530002, 0xa9c7deb9, 0xabffd9fc,
  47574. 0xe8667d30, 0xd05ef69b, 0xe9a9e13f, 0x2f3a7308, 0xb91eae9c,
  47575. 0x3f4c9a19, 0x618ce6c4, 0x50d0cee7, 0x5240f8b0, 0xfb24dc40,
  47576. 0xf7e90cc4, 0x992fe151 },
  47577. { 0x38f197aa, 0x4454db31, 0x87872f98, 0xa4ded69d, 0x44f0a828,
  47578. 0x97b427b0, 0xa31e48c6, 0x9821e1ae, 0xdd98efec, 0xe38cb09f,
  47579. 0x480cb3ae, 0x20b84fa8, 0x47475573, 0xba5bb4a8, 0xcd50e96b,
  47580. 0xa9be080a, 0xef103550, 0xc4451e9c, 0xc441325c, 0x626ee75f,
  47581. 0x38a5e33d, 0x6eea5e98, 0xa2b0abd2, 0x7321beb9, 0x9b6082a9,
  47582. 0xca92e484, 0x992bcc2a, 0x1dc8168a, 0x9c8eb9fb, 0x134ecf4b,
  47583. 0x4c5b71e0, 0x5a68bfa8 },
  47584. { 0xff0a2bfb, 0xb4ff3b45, 0x5502f8b0, 0xd105fff9, 0x5b1c0c26,
  47585. 0x14de5885, 0x0d3b9d04, 0xed16865b, 0x026d3917, 0x2f5a2453,
  47586. 0xf4db3c0e, 0x6a22f493, 0xe2418f2e, 0x4871548a, 0x509bef61,
  47587. 0x6ab363a8, 0xb8cbbbec, 0x91ca1e3a, 0x4011a396, 0x71e0dc98,
  47588. 0x0d5ca577, 0xff982e0a, 0x81897bc1, 0xeb40b045, 0x085ad5e7,
  47589. 0x4bc24a46, 0xa6337b7c, 0xd15c8fa0, 0xbef1628f, 0x56ce6ef7,
  47590. 0x9f5ef439, 0x78acfdf9 },
  47591. { 0xf8520189, 0x45bf7f15, 0xc77f61c4, 0x954202a0, 0xdfa22e1b,
  47592. 0x39edc6b9, 0x1f4a3487, 0xd2d60267, 0x4814cc52, 0xcd933929,
  47593. 0x05e9f123, 0xde76a124, 0xae36b6f7, 0xe2306ea0, 0xb83a58e0,
  47594. 0x53815218, 0xa041231a, 0x9862bb76, 0xbf31be71, 0xe8da253c,
  47595. 0x37de861f, 0x2dfc5332, 0x90ae4890, 0xf25c93f6, 0x8baa6ed2,
  47596. 0x66bcb8f0, 0x908b4a29, 0x6f10ae0f, 0xb061c949, 0x8cb4b48c,
  47597. 0xd075a366, 0x0ad92d73 },
  47598. { 0xc2ca548a, 0xbfb95fed, 0x80cd89ab, 0x4778c620, 0x3466c280,
  47599. 0xbe99154b, 0xd4be8902, 0xea3be093, 0x13e681ed, 0x847b7995,
  47600. 0x02f40161, 0xf22a8f4b, 0x4aeb7fe8, 0x3ef2cb4d, 0xb3aed5f6,
  47601. 0x9adc5151, 0x98c31163, 0xec1ccfd1, 0xa3d7d88f, 0xdc2ac17b,
  47602. 0x46421097, 0x08fa64d3, 0x94b90bcf, 0x5ebf80b7, 0x0b50a9eb,
  47603. 0x1b78b4ba, 0x279aa66b, 0x1a4fe934, 0x075b3ced, 0x8ef4dcaf,
  47604. 0x70a6e9ae, 0x95bbd8a0 },
  47605. { 0xe614bbd0, 0x59f92495, 0xb823e363, 0x7567a887, 0xfc1bd6a7,
  47606. 0xe247c9ec, 0x8e835c42, 0x2bfaaf47, 0xaade066a, 0x314ef4e0,
  47607. 0x5c16d336, 0x072baa63, 0xe2f0e389, 0xfa429c71, 0xbd07d90f,
  47608. 0xcac1e5d0, 0x514f5c04, 0x69ff35ea, 0xc0554ec1, 0x893053fc,
  47609. 0x2a35947f, 0xab1d86b7, 0x2aebe487, 0xe29fb060, 0xdfb9cf21,
  47610. 0xa0a10d6d, 0xf20dfcf5, 0xad147059, 0xb8867a2a, 0x480dc66f,
  47611. 0xc125a919, 0x375a884f },
  47612. { 0x1217f7ea, 0x178cbe2e, 0x875c6dab, 0x1a161e2a, 0x1bdb1a54,
  47613. 0xf7707ec0, 0xe4fd73ca, 0x678864a0, 0xd13a0d86, 0xbaebc664,
  47614. 0xc8d30668, 0x40325f99, 0x2f1c5950, 0xb93ed9c9, 0x541e0667,
  47615. 0xfdf36763, 0xb91a6763, 0xfd97fbb0, 0x6079c9a0, 0x26aa69ea,
  47616. 0x1eaa8c47, 0xc7303c80, 0xafa63c55, 0xdec75c81, 0x4fd12adb,
  47617. 0x01cdcde2, 0x1968838a, 0x9fe0dda7, 0x38415379, 0x66bb093b,
  47618. 0x08cb84ec, 0x268d818b },
  47619. { 0x41580555, 0x73dae358, 0x473d103b, 0x4fc32e67, 0xbeccc1ab,
  47620. 0x240c1013, 0xb24ee9de, 0xda4099f2, 0x9fa8e066, 0x37b0cb5b,
  47621. 0x6438d7ee, 0xb5ae04e4, 0x2b720140, 0x7f7d3164, 0x339e4a78,
  47622. 0x86ef4edb, 0x3a7d8375, 0xa5e77eed, 0xbd707c2e, 0x883fad37,
  47623. 0x0f979189, 0x816b633a, 0x2e7a208e, 0xe24c028a, 0x4435516a,
  47624. 0x1171fe3c, 0x4f5f2bf5, 0x3eb93b33, 0x01b53a56, 0x8419ed4b,
  47625. 0x056ca44b, 0x8b02735c },
  47626. { 0xe1019195, 0xb89bb464, 0xf3fc28c1, 0x1de4c026, 0x2bfc3b21,
  47627. 0xac120e6e, 0x91bdf92f, 0xec71bc5a, 0x0d995bc9, 0x485d7ab4,
  47628. 0xe6491ffe, 0x97c6768e, 0xafbce265, 0xd9552d19, 0x8e1b76c2,
  47629. 0xbae6c7fe, 0xd7e3ad1b, 0x167d8281, 0x5e989734, 0x3e149af9,
  47630. 0x8a0c8182, 0xd1f0024c, 0xc3006c0d, 0xf571ffdb, 0x58773d4c,
  47631. 0xb32ecf7e, 0xfd3540d8, 0x5822a782, 0x04365042, 0x5ab45c3f,
  47632. 0x4b4d85fe, 0x400e3aa0 },
  47633. { 0x5e46e4a2, 0x47321649, 0x24136074, 0x37a2ed64, 0xc60ec77d,
  47634. 0x659223b1, 0xe5e0ac2e, 0x5e13aac3, 0xc5107ab7, 0xda17c41b,
  47635. 0x73c253db, 0x65b22ec9, 0xa5012296, 0xff3867b8, 0x0621a99b,
  47636. 0xfed660d5, 0xc89fc3f5, 0xa3c28506, 0xf16451a7, 0x3ed350b9,
  47637. 0x67cb586f, 0x27c3e032, 0x967185b1, 0xc807c779, 0x4a13009b,
  47638. 0x09c157d4, 0xadaf1f4d, 0x362f7647, 0xf3a6a198, 0x4a42b9ac,
  47639. 0x8da6e039, 0x131c3da2 },
  47640. { 0xa7da83ba, 0x4a785ff1, 0xd04f4436, 0xf415b425, 0xec03f812,
  47641. 0x7c0899bd, 0x80f5f4a2, 0xc58d411a, 0xfda251b9, 0x3d32d610,
  47642. 0xcd3b2f32, 0x99bb4504, 0xf4c2083c, 0x198c444b, 0x730e83fd,
  47643. 0x60c261af, 0xcb02db90, 0x060ca4df, 0x9df1e7c8, 0x0ff7838b,
  47644. 0xc4c690c9, 0x6b79cf97, 0x5d75f154, 0x131514d7, 0x1cb0e8ff,
  47645. 0xa7c074f1, 0xb2c17615, 0xb920aac1, 0x44aa0ff0, 0xde8098ad,
  47646. 0x34545ce9, 0x71d1a46a },
  47647. { 0xfa1b382e, 0x76178f76, 0x772dda0d, 0xa0d8ecc3, 0xc5d4d130,
  47648. 0xaa5aab2a, 0x8d72622c, 0x27d38ba4, 0xca3bed06, 0xc5410db6,
  47649. 0x793ceccf, 0xf637a588, 0x6e65e3d7, 0x1f65dafd, 0x60a45641,
  47650. 0xc3b44a85, 0x4f78540b, 0x0f47b3a8, 0x5e4d60f6, 0x824fdadd,
  47651. 0x17d3b6d5, 0xd8ccf90c, 0x325fc13a, 0x008eabdf, 0x3648fab9,
  47652. 0x3e90d716, 0x24c52d4b, 0x3964ff3a, 0x533d0acb, 0xb95cc416,
  47653. 0x1167f521, 0x6cd2699f },
  47654. { 0x12f4f3ac, 0x2d8c0b3b, 0x99d1bdfb, 0xb03dcfe2, 0x30f37326,
  47655. 0x540034f8, 0x7c5a8c82, 0x22dd6893, 0xcd8f1442, 0xeb7093d0,
  47656. 0x585742f2, 0x892795a7, 0x087adadd, 0xe15f282c, 0x16ab7b5e,
  47657. 0x7bbdc749, 0xa58acbb4, 0xd30fe40b, 0xe2bac39b, 0x0de417eb,
  47658. 0xc61a04bc, 0x4b4b19a6, 0xf2735569, 0x9338c34d, 0x30ab196f,
  47659. 0xe8f03742, 0x6c88c965, 0xfa2efcb8, 0xc7eeb826, 0x19eee274,
  47660. 0xda345dc2, 0x327c063f },
  47661. { 0x5b47cd53, 0xab399eff, 0x1943aefe, 0xbbe9869d, 0x1402a866,
  47662. 0xe64ecc7b, 0xb1c25a16, 0xc3e7c2aa, 0x022de271, 0xc4216b79,
  47663. 0x366d6a5f, 0xe58dfcc8, 0xda813336, 0xd159509e, 0x130bfb7c,
  47664. 0x370400f2, 0x93b48780, 0x1be4e059, 0x39f3cd22, 0x0623a1fe,
  47665. 0xeecb4f87, 0x72aa22b2, 0x6c27b83b, 0x1af4c496, 0xda5fa5bf,
  47666. 0x7a42a94b, 0x48b01af2, 0x9afba822, 0x3670112c, 0xeb6b9d2a,
  47667. 0xc0df6856, 0x020f19d1 },
  47668. { 0xa4dbba20, 0x37051a86, 0xdb1de5c5, 0xb618ebc6, 0xe6525840,
  47669. 0x9a780a19, 0xd2bccc4d, 0x9440302d, 0x10285a24, 0xe9ff023d,
  47670. 0x3a486268, 0x3b937ee3, 0x4cd61147, 0xe37ee2f2, 0xa3d057cf,
  47671. 0x79fbbfd3, 0xccddefce, 0x5fba16d3, 0x5b231727, 0x916058ec,
  47672. 0x720c3adb, 0x47699ebe, 0x8b4f6bba, 0x26274386, 0xf18a0770,
  47673. 0x54b0092a, 0xacca1160, 0x99d090eb, 0x0c888f60, 0xf757e1ff,
  47674. 0xb0050544, 0x79e72720 },
  47675. { 0x2820a239, 0x632acf25, 0xaae6b310, 0xb1a3974e, 0x48c0a1df,
  47676. 0xd61fd6ba, 0x5a3ee7aa, 0xd2453c39, 0xb980446d, 0x548455a0,
  47677. 0xde16676f, 0x9f29d97b, 0x789375a1, 0xf252ca0c, 0x7743a985,
  47678. 0xe961af3e, 0x66cdbd8d, 0x70c79c56, 0xcbc538f9, 0x14a3854e,
  47679. 0xa126851c, 0x58daa73a, 0x2a9f558c, 0xe9b5bb45, 0xfbd15e05,
  47680. 0x37af7f83, 0x38a1939d, 0xa4487927, 0x9511a056, 0xe428b2b5,
  47681. 0x7015846d, 0x001d3ce3 },
  47682. { 0xe145b1d7, 0xd6be36b9, 0x009c5664, 0xf3e3938a, 0xe7c0f6db,
  47683. 0x2e562e7d, 0xc343f539, 0x951044e6, 0xd90897b1, 0xa5ab62b8,
  47684. 0x512f797c, 0xb1a1f70b, 0x750f28e4, 0x91cdd754, 0xffb8165d,
  47685. 0xb4c80e2f, 0x594d02b3, 0x65ed39c7, 0x56833edc, 0xcc12a49d,
  47686. 0xf3693a18, 0xe73694bc, 0xfcd2c404, 0x34cc134a, 0x11d40194,
  47687. 0x071bd5fc, 0xfc585e46, 0x05759047, 0x790b7a04, 0xb3280360,
  47688. 0x40afc684, 0x4bb8c6fc },
  47689. { 0xfd0f8796, 0x3120e2dd, 0xb133c9de, 0x6968a40d, 0xa9369c6e,
  47690. 0xfea366c0, 0x6007273b, 0x37e5b6d6, 0x8cb81439, 0x39e4ecf0,
  47691. 0x9febc005, 0x487fe9cd, 0x0199b53c, 0xeb8af444, 0x293519eb,
  47692. 0x2f124e3b, 0xc82c9c16, 0x860c218a, 0x709dc590, 0xacd1d6f2,
  47693. 0x36d50529, 0x5696d545, 0x59120bfc, 0xc03f5df9, 0x10ffa690,
  47694. 0x99a3e88d, 0x6c432827, 0xd4f9cfa5, 0x9a135d89, 0x2e8fea9e,
  47695. 0xb6a77e78, 0x3699a881 },
  47696. { 0x1eb1c64d, 0x5bca3372, 0xf1d28154, 0xe9cf3a2d, 0x6537106f,
  47697. 0xb7e2e9b3, 0x4f7cbf4d, 0x06c17151, 0x2058b37f, 0xcbde416e,
  47698. 0x8834e9c5, 0x82c53a7e, 0xe9ac3a75, 0x94dbdfe2, 0xc5e67c02,
  47699. 0x795ec6cb, 0x1426a80d, 0x8c23c25f, 0x6a8d4f9f, 0xee2cd20d,
  47700. 0xd3b7c235, 0x838daa54, 0x3d7a4d52, 0xb9e08ec0, 0x781cb473,
  47701. 0xca9475e9, 0x5ec31caa, 0x7271f39e, 0x82535187, 0x1df08e9f,
  47702. 0x208aff8b, 0x4f3a4b03 },
  47703. { 0x1ed095f8, 0x0f7b8107, 0xda226d4e, 0x23e37fa6, 0xafb36d1d,
  47704. 0x8b0f9852, 0x07d8e311, 0xb114634e, 0xe3e0f16e, 0xb9634a97,
  47705. 0x421eec37, 0x2454bb9c, 0xd72b21c1, 0xb4ecd5db, 0x6df20d7c,
  47706. 0xf9603868, 0xdf86e0a2, 0x9f5359fd, 0x5ac488aa, 0xc43d54fa,
  47707. 0xd1049df4, 0x56d714ab, 0xb020607a, 0x13152b3e, 0x7a02325e,
  47708. 0x49be1c18, 0x52ae84db, 0x44f24f4a, 0x0b5a7b80, 0x9e525c03,
  47709. 0xa6d179fd, 0x6d874446 },
  47710. { 0xbe9a42f5, 0xd29d07aa, 0x3781ccc8, 0x1fd5316c, 0x9dc69ea1,
  47711. 0x71a75a6d, 0x88fee91a, 0x4e19e0df, 0xf8d44f12, 0x99c2b4dc,
  47712. 0x31ae94e4, 0x05f6df92, 0xcf28ccc2, 0x27fba876, 0xf57f7ceb,
  47713. 0x6e1a0f01, 0xf3fd3b74, 0xe03f1f34, 0x42c1d213, 0xa0edc4a7,
  47714. 0x7deb8580, 0x5caac270, 0xaf0848bc, 0x0f5d791f, 0x07ac759d,
  47715. 0x17f514ad, 0x904fc531, 0x95a39734, 0x7bb70f3d, 0x95a4aca9,
  47716. 0xff9c5609, 0x3cf384c9 },
  47717. { 0xce1fc9e3, 0x700506ba, 0x676b0399, 0x49721742, 0xe72bf7b3,
  47718. 0x2b4a1b8d, 0x79b209f7, 0xca8602a8, 0xce26a8e1, 0x90580b90,
  47719. 0xfe24f39a, 0x1ef339b7, 0x629362e1, 0xb6c5d991, 0x577b24f4,
  47720. 0x51174e1a, 0x05e451e9, 0xf380fcb5, 0x148321bd, 0xf4d97afb,
  47721. 0x747e5d2a, 0x099806bb, 0xbe99a608, 0x85525d65, 0xd455e820,
  47722. 0x264828d9, 0xd8560a65, 0x8c8c5405, 0x71030770, 0x3c67e73c,
  47723. 0xee73df26, 0x2b248850 },
  47724. { 0x8541159f, 0x2173cde6, 0x4fb410b2, 0x78224c18, 0x1f2ca1c7,
  47725. 0x07a28619, 0xa8b23e40, 0x52c207d6, 0xa6b2344a, 0x071a0210,
  47726. 0xb5ed2945, 0xdb0e587c, 0x810fcc6c, 0x6c56b8ef, 0x62d843b9,
  47727. 0x1248c58f, 0x74c66975, 0x4b90363d, 0xe66c66f6, 0x6348f7f2,
  47728. 0xc126bcbe, 0xb2f9d441, 0x73ce49e8, 0xac07f2a3, 0xe81b0df0,
  47729. 0x52486758, 0x1d4621d1, 0xa108b54d, 0x74414a1c, 0x17261ece,
  47730. 0x6a3ac215, 0x938b3bcc },
  47731. { 0xe4ded340, 0xa9e4a16b, 0x80e88036, 0x8e65fb2a, 0xdcd73acb,
  47732. 0x97089606, 0xaaa657a9, 0x1c3a0434, 0x49101b06, 0xf304fc58,
  47733. 0xda0bb64c, 0xe60fb61a, 0xf5542df5, 0x818c2aec, 0x56f76d5f,
  47734. 0x74020576, 0x92533d97, 0xb566b790, 0x74d6eb5f, 0xae4655e5,
  47735. 0xa55b44b7, 0x60f7a1b5, 0x93747ea5, 0x7970179b, 0xf2dace56,
  47736. 0x8ae7e0e8, 0x84e83c06, 0x98474607, 0x15307341, 0x24e8c9ed,
  47737. 0xd9e89d6b, 0x6cff58a5 },
  47738. { 0x03e51f68, 0x508c01b0, 0x1d2fe7d6, 0xe1d1f225, 0x09bd8805,
  47739. 0xf7998d0b, 0x03e415b7, 0x255e907a, 0x607d9798, 0xd148467d,
  47740. 0x9b453896, 0x055c3b1e, 0x809f50f4, 0x35001013, 0xd0233fdc,
  47741. 0xfbbb2fa6, 0xff1820b8, 0x0b680b0a, 0x38d317e0, 0xb1d404dc,
  47742. 0xccc8c7df, 0x133d5444, 0x6ec13f84, 0x7fa847e6, 0x046e2e48,
  47743. 0xc33f83d8, 0x4863b3ac, 0x3c627fc5, 0xeb936af7, 0x5f67f8aa,
  47744. 0x31b79327, 0x5fe4ac8f },
  47745. { 0x8b6f401e, 0x581aa4bf, 0xad5c7ed4, 0x05db12a3, 0x6fb07b4a,
  47746. 0x7b018726, 0x9c22bcd4, 0xfdd11f04, 0x69371c95, 0x5454a7d4,
  47747. 0x99a46eaf, 0x066c55fb, 0x7fef96d0, 0x18637c7c, 0x6b83e95c,
  47748. 0xbafc1d34, 0x00bb42dc, 0x55c38593, 0x34e7e712, 0xdd8dec2b,
  47749. 0xb184cee8, 0x69c9cfb0, 0x49a27864, 0x8dcc0c42, 0x2010f2e7,
  47750. 0x290d95f2, 0x6977a420, 0x86e254c9, 0xeb2abdad, 0x20931c89,
  47751. 0x121c0548, 0x81377164 },
  47752. { 0x9c5a8edf, 0x6266b25e, 0x1078a7ad, 0x6e1388c2, 0x4876eedf,
  47753. 0x5f02737d, 0x62744617, 0x242fa7f9, 0xb385382a, 0x3e2cfbd9,
  47754. 0x02f71bef, 0xbadad7b1, 0x677d0a92, 0x562abcfa, 0x51fdff34,
  47755. 0x573ebd17, 0x7c250c78, 0xd7f65852, 0xc47ca896, 0xe0cf16ee,
  47756. 0x67622c9e, 0x8ccd79b0, 0xf8f2c075, 0x31fc5882, 0xa6008515,
  47757. 0x9232b37e, 0x82e8c5ba, 0x4d7bb361, 0xd2f146fe, 0xbf24735c,
  47758. 0x9cd2db98, 0x79c280ee },
  47759. { 0xf2b48122, 0xbdcc8203, 0xb04ac48e, 0xa8c04916, 0x9fc4885e,
  47760. 0xacf064dc, 0x82c1001c, 0xab838997, 0x676de250, 0x7339e721,
  47761. 0x8e1ab820, 0x17aa5aea, 0x6bc14b2e, 0x24d28ca0, 0x816b6230,
  47762. 0x570c5bb7, 0xcee6b606, 0x6c51235c, 0x183eae42, 0x1b2bf89f,
  47763. 0x9c66274b, 0x3e3af3c6, 0xb51e38bc, 0xe0b04426, 0x73e40e3b,
  47764. 0x26dbc58e, 0xb5be5be4, 0x3f9dd578, 0x52c8f408, 0x9fd9f791,
  47765. 0xa9e3ff4f, 0x758073a4 },
  47766. { 0x8691ca22, 0x7d27b057, 0x13a2a1b6, 0xf206bfd6, 0xac795413,
  47767. 0xe84bd385, 0x75536607, 0xc5d18a2a, 0xc8a0e24c, 0x2e166de7,
  47768. 0x3c474dbd, 0x56d5750c, 0x1366843a, 0xdef444c1, 0xcf4b8432,
  47769. 0x14646e53, 0xa9fd9783, 0x4bc0d030, 0x297ee203, 0xbda4c824,
  47770. 0xfd7be6c7, 0x3d0b10bf, 0x08c7f3ff, 0x2d216476, 0xb4fd4c45,
  47771. 0x06e52599, 0x49e9e104, 0xfbab9fa1, 0x8661d32d, 0x9342a7fa,
  47772. 0xfaf66aa8, 0x3f3e3458 },
  47773. { 0x951597aa, 0x51ec35af, 0x49df64eb, 0xb677d4ac, 0x9bf4eff5,
  47774. 0x0276cd9c, 0x515a2935, 0x423eca49, 0xfd9bb9c3, 0x8a696553,
  47775. 0xede1f09c, 0xf99ee9df, 0x199e5f98, 0xb8fa2956, 0x35292c32,
  47776. 0xb7638758, 0xfc40e81b, 0x8734eddc, 0x65457d95, 0xd82d5e9f,
  47777. 0x30c78d2b, 0xc8ee323e, 0xc1433d67, 0xe77b2e4c, 0x3c8314ae,
  47778. 0x56d9f807, 0x2a0e2f63, 0x441eede2, 0x6c48295e, 0x1e9e17ed,
  47779. 0x34c294ef, 0x640d20c4 },
  47780. { 0x3284d513, 0x4e9a0b8e, 0xf315053a, 0x074c3545, 0x45acd52a,
  47781. 0xb36e7407, 0x1de50db7, 0xd80bdcfc, 0x2549fc46, 0x8d9d47dc,
  47782. 0x303f07a8, 0x29b6ef13, 0x6d4ad4c2, 0x4e461aca, 0xfc9f1b73,
  47783. 0xca8e351d, 0x57460e65, 0x8bc4094d, 0x0f32d367, 0xb6302b33,
  47784. 0x285742e8, 0x69a074b6, 0x876c29c3, 0xdfe52b11, 0x912bd17a,
  47785. 0xf39e4609, 0x349aa639, 0x8ee40d66, 0xc72e05c1, 0xb968902a,
  47786. 0xc0d92816, 0x0f9c1ca8 },
  47787. { 0x67433df3, 0x1ebbaab3, 0x15d3628c, 0xb6aa5347, 0x97f0c5cc,
  47788. 0x13a320d8, 0x65e408f9, 0x72c918cb, 0xd5373451, 0x4b638854,
  47789. 0x0b4dca09, 0x731399a3, 0x0a3b1326, 0xcf256730, 0x6608b388,
  47790. 0x5ea60dfa, 0x7b290dfd, 0x58ad74b0, 0xd7694f9b, 0x83202789,
  47791. 0xb6630fb1, 0x48593db8, 0xc65e3eaf, 0x3db47f70, 0x3e7263f8,
  47792. 0x63949c91, 0xe6e6ff33, 0x9b9acec6, 0x098a8240, 0x34bd9ba7,
  47793. 0x45d36ec5, 0x7e31c12f },
  47794. { 0x0dfd2dd7, 0xbe281d68, 0x24ab61d8, 0x1efacb00, 0x94431f97,
  47795. 0xb9c3005f, 0x959cb3bc, 0x660c8dfa, 0xcffbb406, 0xfdd5fc30,
  47796. 0x7969a10d, 0x7a4631be, 0xde13fd1b, 0x336e309e, 0xfc947076,
  47797. 0x76b3bfad, 0xdcc72223, 0xfa91925d, 0x156c4ee1, 0x741f0d73,
  47798. 0x0e2b3747, 0x4f64ee41, 0xefc4d93c, 0x86be92d3, 0xfc4fbb2e,
  47799. 0xc53b7e03, 0x337ca1bb, 0xac196cf5, 0x7e23ba60, 0x4de41a30,
  47800. 0x326d5357, 0x1a219c45 },
  47801. { 0xaa4db0bc, 0xfdcf7ef8, 0x7b6c9963, 0x2e231806, 0x3d8a192f,
  47802. 0xc2639067, 0xffdc7771, 0xc0cec2e2, 0xa2fc0edb, 0x997c8e35,
  47803. 0x82cc6043, 0x78e10ec1, 0x2b0c8120, 0xfd0de2cb, 0x69e57f8e,
  47804. 0x4d6c457f, 0x5b53f1c3, 0x953e69b2, 0xc4f89cb8, 0x422a330a,
  47805. 0x95566be6, 0x92ff2329, 0x437442d1, 0x73cd502d, 0xbea69403,
  47806. 0xf04ce590, 0xf8030662, 0x6ac1537e, 0xb6d0bf93, 0xe02bcf77,
  47807. 0xbc90192f, 0x17aaa999 },
  47808. { 0x8e55db2e, 0x0d3d5643, 0x3b946851, 0x835dee43, 0x5b88462f,
  47809. 0x1a1440e5, 0xea17e27c, 0xa6ff3b35, 0xdd95f7a9, 0x23f99c36,
  47810. 0xbdd672cf, 0x7217fdd9, 0xdd2045c0, 0xf400ac1e, 0x4ff06b25,
  47811. 0x94b55c87, 0x0e4a49be, 0x0a44a0e5, 0xb43b6813, 0xe8925e91,
  47812. 0x214f96c5, 0x78bedde1, 0x0f97fa97, 0x0f456a4c, 0xa5bfd267,
  47813. 0xa28fd86b, 0xbe7608ef, 0x3b4b2d8f, 0x226474bc, 0xfbd5ff8c,
  47814. 0xa5f3b24a, 0x6b282af0 },
  47815. { 0x6341a595, 0x78fc025f, 0xa445e28c, 0x591c38d6, 0xeb446842,
  47816. 0x72bd6e3d, 0x75547833, 0x3f9466d3, 0x083e16c4, 0x911414d3,
  47817. 0x95a7acb4, 0x145d9466, 0x8fd2fb64, 0x102ddf09, 0x0bfd87b1,
  47818. 0x2a2b2d2d, 0x59455088, 0x69e9be5c, 0xa80245de, 0xee378bf4,
  47819. 0xb2306b0e, 0x80b0bd68, 0xc2be9f3d, 0x76a545c6, 0x4802c245,
  47820. 0x429d167b, 0x2b412dfb, 0x13e64427, 0xee8d9762, 0xb664f529,
  47821. 0x54706ebf, 0x6d4f5d23 },
  47822. { 0x00ba9f88, 0x35c8f2b6, 0x7bb6d0bf, 0xfdc807e0, 0xb3b81e5b,
  47823. 0x0a126d42, 0xa7ac781e, 0x335ce6ce, 0xf37dcba6, 0x3e308e6f,
  47824. 0x63c96487, 0x028dca62, 0x8818434d, 0x72eba57e, 0x79b78a26,
  47825. 0xa9e3d59f, 0x2f07aea3, 0xd2f0a7dd, 0x24d05f74, 0xe0fe4678,
  47826. 0x0116deb6, 0xb2085170, 0x58f37580, 0x9c2a5e92, 0x74070bb3,
  47827. 0xe78bd7a5, 0xb9977d90, 0x551fc872, 0x40db81b4, 0x6eda93c4,
  47828. 0xd65d34ad, 0x4aaf0b4f },
  47829. { 0x3514c7af, 0x9bef2506, 0xbc181ead, 0xb09e7dad, 0x8fa3ec58,
  47830. 0xef3cae87, 0x173b8685, 0xd8dbfab5, 0x921d32dd, 0xb2490fc0,
  47831. 0x8bd9c466, 0x4eef386b, 0xa061dbdb, 0xc1cdd52f, 0x25bc04db,
  47832. 0x64de989a, 0x85728636, 0x06f9836b, 0x8be44aa0, 0x11a5a804,
  47833. 0x097018c7, 0x16dede4e, 0xb2c11fb1, 0x72aec577, 0xa721ecd9,
  47834. 0x144dade1, 0xd6ebf3a9, 0xf99c526b, 0x1c2e14d7, 0xa1d4165b,
  47835. 0x82bc6337, 0x8b2cbd39 },
  47836. { 0x8a52e991, 0x28ec1bf2, 0xcf9d42ec, 0x0ba202f6, 0xc634ea45,
  47837. 0x8307d130, 0xc5762b9c, 0x3fc257b3, 0x487c2a2d, 0xbd3298d1,
  47838. 0xa319488a, 0xca14f1a7, 0x06ba06d2, 0xc70ca93b, 0xee405e89,
  47839. 0x9aa3f4b3, 0x35deeae7, 0xcc64eeb3, 0x03bf1d4c, 0xd155f578,
  47840. 0x45616bfd, 0x041ec0b5, 0x086e33f6, 0x23df80e6, 0xf0243cf5,
  47841. 0x399a79c8, 0x874ccd58, 0x86c2824e, 0x8fc5c831, 0x220eeaec,
  47842. 0x7dbe3670, 0x57e28304 },
  47843. { 0xfbcdf666, 0x6e60b698, 0x8bebb1d2, 0xbdd06a99, 0x80498436,
  47844. 0x4044adba, 0x522bc88d, 0xd76bf75e, 0x28423b20, 0x655c4b9b,
  47845. 0x53398a72, 0x65c0f492, 0x0ca37601, 0x76d4f2b7, 0x2030fa5a,
  47846. 0x46989925, 0xb6054705, 0x96b37e87, 0x53de1b2f, 0xef96f731,
  47847. 0xad54ef05, 0x5ecbbc8c, 0xa93617b0, 0xeb289d0a, 0x7cba217d,
  47848. 0x3ac0fbd5, 0x19d4a2d7, 0xd0d3cb56, 0xc91d6063, 0xe8bee9d4,
  47849. 0x696ffda6, 0x4f12e037 },
  47850. { 0x15f1a610, 0x4ccfa422, 0x3786519a, 0x804a5c55, 0x73838134,
  47851. 0x1246a454, 0x4b284e2a, 0xfa15b484, 0x146d1320, 0x36464c65,
  47852. 0x70a8a0fa, 0xfb6ba88c, 0x93c4804e, 0x74e7cee7, 0xb95ae16a,
  47853. 0x8c34d22c, 0xf9c1d4dd, 0x9d9ed89f, 0x32025371, 0x61a0866d,
  47854. 0x9bd6444a, 0x45b232b2, 0xf277bab1, 0xf888e92c, 0xa9448b02,
  47855. 0x73e69c6e, 0x5b521ecb, 0x1a496ea9, 0x5858afb2, 0xa8f78ea7,
  47856. 0xb1266f91, 0x83d2333e },
  47857. { 0x67b478d7, 0x1c633288, 0x50a2fc9c, 0xa1ee1ae1, 0x18d2241b,
  47858. 0x05b6ab30, 0x893cd696, 0x69f1f288, 0xa8117a87, 0x159d6660,
  47859. 0x70e73d77, 0xe8120119, 0x93f55f0a, 0x528fef00, 0xd854dfb2,
  47860. 0xb3978db8, 0xf45d9fbb, 0xd6b43ef6, 0xd5bee397, 0x17de4bfe,
  47861. 0x6bf76dad, 0xa01e0f59, 0x3d40754c, 0x28b2280e, 0xf8e86ef3,
  47862. 0x8edb6122, 0xb7d1e586, 0x8226b6af, 0x2f40a55b, 0x46353215,
  47863. 0xc5a31621, 0x7362f13e },
  47864. { 0x73c0c430, 0x792eb27c, 0xa51c3657, 0x8cc0a65f, 0xd2194f1b,
  47865. 0x50a5cece, 0x814b4947, 0x18945688, 0x4b6fbbf4, 0xbbf0a81a,
  47866. 0xf0aa8608, 0x376f4f58, 0x3987795e, 0xd9361d68, 0xe3a8d0d5,
  47867. 0xb6510cd8, 0xb6c1a455, 0x63e2fdbf, 0xaec891f9, 0x2c91154e,
  47868. 0xff568f64, 0x0eb1e715, 0x2f2b399e, 0xe7af9cd7, 0x89f0bf0b,
  47869. 0x1fc39bac, 0x90983695, 0xf0861d92, 0xda0a20a8, 0xd9b16f02,
  47870. 0xa38c0ead, 0x2f10693f },
  47871. { 0x0c06ded2, 0x07a6ce91, 0x2fd9087b, 0xf974842f, 0xa9f635a6,
  47872. 0xe468bfd6, 0x1ed60626, 0x04b61891, 0x369ee548, 0x1fb2f89f,
  47873. 0xdc96a201, 0x9cbd1113, 0x10d633ac, 0x6759acfe, 0x8faa629e,
  47874. 0x64ba66fc, 0x47f38283, 0xa686ae49, 0xd59cda99, 0x828c3a05,
  47875. 0x08ea2f6e, 0x7c7afb14, 0xaf3953c8, 0x2551c8e4, 0x9daa9e4f,
  47876. 0x5b53d279, 0xad6f1940, 0x1eff68d4, 0x96437cdb, 0x2775dbdd,
  47877. 0x4fe7a043, 0x985f83e4 },
  47878. { 0xeaf45294, 0x89603c16, 0xc24b5751, 0x70131160, 0x39d6b52d,
  47879. 0x4c112018, 0xed943340, 0x7079cf02, 0x74f41b68, 0x0c5b028b,
  47880. 0x9c8ac1e1, 0x3dc3f076, 0xf8b24f0e, 0x5ac5eea3, 0xe34c5c22,
  47881. 0xee6684ba, 0x9abc452a, 0xa5259e63, 0xe9df45cc, 0xb07d2cd1,
  47882. 0x1a443cfa, 0x07019c93, 0x92c003b3, 0x68fddaa9, 0x0d8cbc2e,
  47883. 0x2d9f179c, 0x1e781ca7, 0xbbf15a6f, 0x50dcc799, 0x54d779d5,
  47884. 0x0fe962f1, 0x0c88e540 },
  47885. { 0xe8f44357, 0x84f71a6a, 0x3a3cab6a, 0xf75b4bf6, 0x5aebc680,
  47886. 0x334c9d9e, 0x8a753ef2, 0xcecaf084, 0x075e3c8e, 0xe28014c1,
  47887. 0xf74f8d3a, 0xbb9d5a38, 0xb80e32ae, 0x75988464, 0xf2bc3792,
  47888. 0x7b328e6f, 0xeed0e197, 0xebbb1faf, 0x5a33065a, 0x674eac95,
  47889. 0x922dbce8, 0x8c19fd8f, 0x987b907a, 0x8c17ae85, 0x3b3a2cd7,
  47890. 0x89f33627, 0xfa87772f, 0xebaea019, 0x3a25ced6, 0x4e5de499,
  47891. 0xaf110715, 0x8e2560b8 },
  47892. { 0x3141aba6, 0x56d3746c, 0xbab2cf9e, 0x45a1079f, 0x9cdd27c7,
  47893. 0xb6382831, 0x9dfd950e, 0x22237632, 0x3a9408ff, 0x1e0b15cd,
  47894. 0xb1160118, 0x49a80200, 0xa383bba7, 0x2719db5d, 0x651046d5,
  47895. 0x6078340a, 0x97523b1f, 0x8929d4de, 0x8e0a28ab, 0x4040345c,
  47896. 0x0adf09c7, 0x61275ac2, 0x2331d611, 0xb41ab265, 0x5391ca50,
  47897. 0x230cc77c, 0x8f922315, 0x88be0c92, 0x92fd9a29, 0xfef3d92b,
  47898. 0x8324f2e5, 0x59005f22 },
  47899. { 0x3c4c1c74, 0x6bb1750c, 0xe966fb79, 0xbe73aac0, 0x66c5973f,
  47900. 0x85a75d92, 0x3a8656b6, 0x8c97f932, 0x50446cde, 0x2b7043b1,
  47901. 0x3ff3897f, 0x548916f7, 0xb18b72b2, 0x913dd01c, 0x488c0de6,
  47902. 0xd0a751f1, 0x8558ca58, 0x19175714, 0x44a663da, 0x97714301,
  47903. 0xb0e08618, 0x2df190ac, 0xf39ead9c, 0x0080fc0c, 0x17382da1,
  47904. 0x0085ac6e, 0x3262a338, 0xe9791851, 0xb43bae8d, 0xe4495936,
  47905. 0xd783df6e, 0x57a78e26 },
  47906. { 0x40dbddd8, 0x161b346f, 0x9410c3ac, 0x2b49a927, 0x1886cf3b,
  47907. 0x8c542783, 0x33b93deb, 0x72df3232, 0x40df579d, 0x9c8d59f5,
  47908. 0xc20ef500, 0xe5d7a67d, 0x67f08643, 0xc46b3918, 0xad96adc3,
  47909. 0xecfa2445, 0x0c4544d0, 0x658f589b, 0xe08417d7, 0xe6ec9301,
  47910. 0xc454e288, 0x6ca5ef6a, 0xac0f462d, 0x4191048f, 0x08d8a036,
  47911. 0x852407d8, 0xf6d35b7e, 0xb4c533a7, 0x8f6ada87, 0x3251e412,
  47912. 0x81c472e8, 0x1ca370c5 },
  47913. { 0xa801b68a, 0x94bd5171, 0xfd1998b3, 0x7312879c, 0x41163202,
  47914. 0x4905aabf, 0xf5b01fdb, 0xb5fe87f4, 0x9cda128b, 0x78de523a,
  47915. 0xc7bd31f7, 0x0bf161a1, 0x23904c35, 0xb5decfd0, 0xe188f12d,
  47916. 0x224b2882, 0xf99dae74, 0x0dd2801d, 0x08cd1cd2, 0xcad467b5,
  47917. 0xc0867e39, 0x6c311c3d, 0x2b425072, 0x71a11720, 0x2efd9003,
  47918. 0x83bf464e, 0x1dbd3b03, 0x53d0448a, 0xe6265baa, 0x32db52f4,
  47919. 0x4c33ac79, 0x2584b34c },
  47920. { 0x2aeec688, 0x3cb86389, 0x45fbe523, 0xa5e740ba, 0xfd60b5f8,
  47921. 0x422e71f7, 0x4874913d, 0x455d185c, 0xfa17d80d, 0x04c2bb36,
  47922. 0xac054524, 0x3f271854, 0xa8b9a657, 0x76dd3045, 0x62ee7cc8,
  47923. 0x2e42c3e1, 0x4df6c7d0, 0x00266706, 0xdc7cb488, 0x5927dd51,
  47924. 0x187897e0, 0x6b3faabe, 0xf2d5737c, 0xfe6ad22e, 0xff51a9ff,
  47925. 0xafb60269, 0x69807baa, 0xe1c83545, 0x951ca49a, 0xacddb6ff,
  47926. 0x3f9ab085, 0x7e811374 },
  47927. { 0x830a88b1, 0xad722a8b, 0xce1117e1, 0x91918ea8, 0x0409b47d,
  47928. 0x3e02d0b8, 0x6c46d1d3, 0xb53812d3, 0xe589669c, 0x2fd09db0,
  47929. 0x15b0cd5e, 0x9845cd06, 0x2386c453, 0x0c1c155a, 0xf5ff43cb,
  47930. 0xda774de5, 0xe391c0cd, 0xbb076b98, 0x5004f286, 0x97d71eff,
  47931. 0xaeec0bfe, 0x23e0b46c, 0x32a1ad94, 0xe4538667, 0x396da422,
  47932. 0xfe0c9f81, 0x63db2bfe, 0x6376c1a2, 0xba56fa91, 0x001c7918,
  47933. 0xdf8485a6, 0x436b8c64 },
  47934. { 0x8ab764bc, 0x88117e9d, 0xa077df84, 0xdfa61e94, 0x0c18eebd,
  47935. 0x5a7765d3, 0xfc9451dc, 0x548916af, 0x071a347a, 0x01a52e33,
  47936. 0xb23b41df, 0x633b95de, 0x43c8c286, 0xdd7d68c9, 0x18d97068,
  47937. 0xe4f9d41e, 0x8c92799d, 0x79908b90, 0xd47394a3, 0xe614148e,
  47938. 0xcd51e53f, 0xe5018517, 0x0243dcb6, 0x5060075e, 0x17954405,
  47939. 0xe5dcde62, 0x537da5ff, 0x6f7c90e1, 0x0768cb66, 0x1df7aae4,
  47940. 0x6dbe95e1, 0x5266ca9e },
  47941. { 0x1386b3db, 0x84ddee6d, 0x7c38e540, 0xf9e4af5a, 0xeb04f49d,
  47942. 0xb3418440, 0xfde5a4fd, 0x2138a1e8, 0x30257cfc, 0x3e6e6924,
  47943. 0x19fd70c1, 0x3519c6e3, 0x86c31ff0, 0x8f34e174, 0x940ce1e8,
  47944. 0xf1e298fd, 0x14960d7c, 0x6fb8cb1d, 0x2b2f3bff, 0x207c1347,
  47945. 0x146ef8ff, 0x899a20b4, 0x7bd3e220, 0x7dec362b, 0x626bea27,
  47946. 0xa975044e, 0x4fb4cb67, 0x0f32b449, 0x1fc6703a, 0xc17a0920,
  47947. 0x9cd84a2b, 0x41f325b9 },
  47948. { 0xce2843a4, 0x312ed513, 0x00728afc, 0xe748498e, 0x4d864ce5,
  47949. 0xa8ef2822, 0xa620083b, 0x34064704, 0x4bed338d, 0x5905e1d9,
  47950. 0x063e7b38, 0x2a578cb5, 0x289e7bb9, 0x98276d96, 0xf17b7341,
  47951. 0xdfe2dc47, 0x1dac8944, 0x5923521f, 0x23400aa7, 0x3db6d28d,
  47952. 0xa761ba43, 0xc647705e, 0x9bfd07dd, 0x8947ba6d, 0x242ca8fd,
  47953. 0x00f2e3ac, 0xeb8c3468, 0x49ef4670, 0xd9aa18fd, 0x7db3d37b,
  47954. 0xe58cea9e, 0x56b30fb6 },
  47955. { 0xcd80a428, 0x07ecdcaa, 0x8732c891, 0x7af922dc, 0x3ada441f,
  47956. 0x20d88798, 0x924b008a, 0x3bed9a44, 0xb2e81c3a, 0x2123533c,
  47957. 0x65f807d3, 0xc34e4075, 0x1f2faecb, 0x0bfaefa5, 0xade8a88d,
  47958. 0x78b634a5, 0x94392a91, 0xc4e0b7f8, 0x90bb1cd8, 0x30922377,
  47959. 0xf87204ae, 0xdea9b4fa, 0x85d3cd83, 0x3edf81f5, 0xc6523a79,
  47960. 0x58f88c51, 0x17c0d969, 0xe472fb8b, 0xdccf7f07, 0x899081e5,
  47961. 0x58bdd146, 0x1353cc57 },
  47962. { 0x39bf6e18, 0x28a56497, 0x649b89c7, 0x59e8b5a2, 0xdce8b8e7,
  47963. 0x8d9434a0, 0x2047040c, 0xd935bf51, 0x6a7b8e82, 0x2ab3a164,
  47964. 0x27f81294, 0xf1583ed6, 0x72d67297, 0x8416a7e0, 0xcd39e42b,
  47965. 0x49685d86, 0x958ddbad, 0x8a797fc7, 0x155ce6de, 0xa558f928,
  47966. 0xf8a36235, 0x75f4e570, 0x52877ae5, 0xbc69cfc0, 0xa6b16ebd,
  47967. 0x8f4193a9, 0xbb1cc1f1, 0x8d1df43c, 0x5a21e789, 0x723a830e,
  47968. 0xf451df58, 0x3ec2185d },
  47969. { 0x1f0bc2d7, 0xb9d4c7d7, 0x6e51d412, 0x6982c6cc, 0xa09f80f6,
  47970. 0x92e02d93, 0x047ae09c, 0xb7dd2d25, 0x37f351f9, 0x3503149f,
  47971. 0xc77850be, 0x69d49ce1, 0x12f0d2c8, 0x60242acb, 0x7bc28b9d,
  47972. 0xba188c56, 0x06bc0550, 0x8e406121, 0x8d7d4329, 0xb0d84b1f,
  47973. 0xd38951e0, 0xb4a67ae7, 0x8bc97607, 0xb527c57b, 0x5497aa72,
  47974. 0xbc93c5f3, 0x39bdd666, 0x5f1de8cc, 0xe9d447a3, 0x3087dc5c,
  47975. 0xa211abe5, 0x89b356b6 },
  47976. { 0xdfdcc837, 0xed6db0af, 0xa871b7a9, 0x0fb80baa, 0x1c1d4b72,
  47977. 0x413abfc9, 0xadac9e5c, 0xf5b56bf7, 0x8b8657a3, 0x5664a2da,
  47978. 0x0e41d94e, 0x11b04f72, 0x37433658, 0x63e11d26, 0xf426daea,
  47979. 0xee628ece, 0xcb162dc2, 0x011619c9, 0x87648643, 0x9cf5817f,
  47980. 0x5584bc86, 0xe1bb9702, 0x00bf7928, 0x2cc27cef, 0xdc60eee5,
  47981. 0x4ef3a80e, 0x87adc2f9, 0x7e1202be, 0x8a0d4f52, 0x656f18e0,
  47982. 0x57c5d126, 0x39c4f10d },
  47983. { 0xe88aecd3, 0xb3a9b68c, 0xa518aa9d, 0x555b0918, 0x4bd4ee54,
  47984. 0xedc1cdad, 0x02068d84, 0x79b68b67, 0x811ac72d, 0x7dac80d0,
  47985. 0xa81a0a78, 0x6d1e6d35, 0x3bd16283, 0xc841e9ea, 0x894c4444,
  47986. 0xa7bc1775, 0xf1aa1202, 0xf2b63725, 0xc7d4c556, 0xbec7767e,
  47987. 0xd46ff51b, 0x2817ebb3, 0x73f7e339, 0xfde5be8d, 0x5aed24c4,
  47988. 0x44c6c977, 0xb6e579cf, 0x0b9a1707, 0x9069fbcc, 0xcff16478,
  47989. 0x49152b00, 0x414b542d },
  47990. { 0x606e173b, 0x33c31e58, 0x90e6713a, 0x5b7f4e1b, 0xdebb20af,
  47991. 0x425fb512, 0x05120e70, 0xc788c617, 0x9013e4ec, 0x3ef05602,
  47992. 0x81c6e6d7, 0x9f9d35ac, 0x9450690a, 0xe131e88f, 0x44af082e,
  47993. 0x708f9b32, 0x1ba2aea9, 0xb2e4d66c, 0x740db29c, 0xaf1f4a6e,
  47994. 0xd1843007, 0x74ab9248, 0xed556a6c, 0x13338ef8, 0x270d17a6,
  47995. 0xf48e623e, 0x9608f5bf, 0x3c7362fa, 0x444e8515, 0x43977874,
  47996. 0xe00b8b2a, 0x52678d6a },
  47997. { 0xdf36aeb4, 0x5dff1c59, 0xa92bc0ab, 0x52d6653c, 0x927a5f81,
  47998. 0x0e03f496, 0x2dfd491f, 0x8509d414, 0xa571f89b, 0x258c2c52,
  47999. 0x93334485, 0x2bd61804, 0x3f7d9e09, 0x1a33e94f, 0x2c1bf906,
  48000. 0xfab418d3, 0x5aa5695c, 0xf39c490e, 0xf6d2d7ff, 0x0e41196e,
  48001. 0x0f7948a9, 0x3ecd4075, 0xd3053b4f, 0x4b58f9b2, 0x5d9974c9,
  48002. 0xb8ee842a, 0xbf22f682, 0x23a59c1d, 0xc8efcea6, 0x045ac614,
  48003. 0xc10ceedd, 0x7040ba5b },
  48004. { 0x515a1a96, 0x2c364f81, 0x184327e0, 0x31a63503, 0x1ad93d4f,
  48005. 0x0a096650, 0x273b6173, 0x9d7694f1, 0xd2cda9d2, 0x8886d876,
  48006. 0x2814c177, 0x1e01a742, 0x8667696b, 0x3492276b, 0x5b25f006,
  48007. 0x2fd4f0c6, 0xfb294c4a, 0x6527349f, 0xde1d336f, 0xc1fe0d8a,
  48008. 0xe7e3860e, 0xaf9a23e8, 0xb774c31e, 0x97d2b721, 0x4365784a,
  48009. 0xfac3e582, 0x70f4eaa3, 0xff2dff4e, 0xfe873248, 0x3d281e1a,
  48010. 0x0bd1c9c1, 0x9043a6d6 },
  48011. { 0x766c7937, 0x1511a0fe, 0xabbc3be3, 0x1b2ded5c, 0xe00888ac,
  48012. 0x2ac160cc, 0x616200f3, 0x928754bd, 0x34a2ea06, 0xb801c83d,
  48013. 0x9cbe106f, 0x8ad7a03a, 0xcedfcd94, 0x996b0822, 0xe4069880,
  48014. 0xc3c3463a, 0xf597f663, 0xfb12ea4d, 0x40c92af9, 0x2c8d3834,
  48015. 0x4e8da154, 0x79bc85c6, 0xdb4e801a, 0x95771fa2, 0x1e3579b2,
  48016. 0x7bd2c138, 0xffaad078, 0xe45c75df, 0xb73eac46, 0xb0760a3c,
  48017. 0x3a125f35, 0x26362b48 },
  48018. { 0xeefc3e89, 0x25c68d28, 0x69e9ee71, 0x2d0ee877, 0xaf5e4b75,
  48019. 0x8b07bb86, 0xcb86b333, 0xdb709072, 0xff552bac, 0xfd3d20ea,
  48020. 0x4c0da1e9, 0xa5eeb2b1, 0x44f97145, 0x391f688a, 0x1e06d485,
  48021. 0x21fbd310, 0xbea9cd49, 0x45e4f2a5, 0xa7bf21da, 0x7b60d464,
  48022. 0x054d5471, 0x193f88c8, 0xbee0f2e9, 0x5ace53d1, 0xc1439273,
  48023. 0x92c26563, 0x96c6b5ee, 0x9c86e0b2, 0x09ff59ba, 0x452fe231,
  48024. 0x555c935e, 0x2e952b20 },
  48025. { 0xd75f886e, 0x2a846bca, 0xd43dfc58, 0xe68a5dbe, 0x007b1b86,
  48026. 0x103e45b6, 0x355ff2b5, 0x580e2ec9, 0xa263ecc9, 0xbc702f26,
  48027. 0x181e5e33, 0x2835b386, 0x6c122076, 0x025113ec, 0x7fbd856d,
  48028. 0xa5c26e3a, 0x9d6ebcb1, 0x8ef83fb3, 0xa44d2fa8, 0x7aaa53f2,
  48029. 0x53b1fa97, 0x7c14ef33, 0x17559a30, 0xff604a11, 0xb09377e0,
  48030. 0x2bcd96b0, 0xdb2f0273, 0xa5c14896, 0xeb53ef06, 0x1c0a84c9,
  48031. 0x30378e4b, 0x1236d017 },
  48032. { 0xc084373b, 0xd7481c8f, 0x646097ae, 0x29ae4768, 0x613bc34b,
  48033. 0x1300dfa0, 0x934bc2b0, 0x3712714c, 0x0e2be7e2, 0x86524629,
  48034. 0xed010800, 0x554fbb9f, 0x42314576, 0xf0ec0b38, 0x330a3282,
  48035. 0x65baf594, 0x706ef817, 0x3bdde1a8, 0xba7530e9, 0x7d2c727d,
  48036. 0x74cc95cb, 0xbb0c5d66, 0x2438906d, 0xb3fcd365, 0xd14658f3,
  48037. 0x19881941, 0x6c97f0e9, 0xe616f555, 0x4b9ec7ea, 0x353c2d85,
  48038. 0x620cb56e, 0x02a48014 },
  48039. { 0x506ccd38, 0x11d6d23d, 0x9059baa6, 0x229a1c54, 0x69d011c5,
  48040. 0x717c9c27, 0xd828937d, 0xe87e1b46, 0x83835083, 0xf5d63bbb,
  48041. 0xaadac258, 0xf0a7b427, 0x9f154d1f, 0x99ab26bd, 0x8ec955fd,
  48042. 0xdec0ffbf, 0x49fcb880, 0xee957c67, 0x1e0114de, 0x32395dee,
  48043. 0x369f46c7, 0x192a64b7, 0x91eb2599, 0x43044660, 0xa2e8c3da,
  48044. 0xbe2da887, 0xc3556d18, 0xa44e2c25, 0xb55f75f3, 0x31390414,
  48045. 0x8f217fe0, 0x1d8bde6f },
  48046. { 0xa2028924, 0x03cd39f8, 0xb06ecb9f, 0x6e54f19c, 0xd6f05846,
  48047. 0x862bbcb7, 0x5a060776, 0xdbe06716, 0xb10fec10, 0x9397c97a,
  48048. 0x6f1bb65c, 0xf4213826, 0xa672ba38, 0x414deccb, 0xf88b05e6,
  48049. 0x594d4d43, 0xac94d4d1, 0x7993f57a, 0xbfb17638, 0x74fc2a6a,
  48050. 0xb6fc655a, 0xd8196b5b, 0xee8d2139, 0xdc375c84, 0x360d3a26,
  48051. 0xb9b00a02, 0xdeb93b87, 0xb36ed35c, 0xcc83209e, 0xf565b28b,
  48052. 0xc61013c1, 0x349c6943 },
  48053. { 0x4de6c88a, 0xd1b39444, 0x4700207e, 0xd5c2c471, 0x21c2b780,
  48054. 0xb6f458a2, 0x0850993e, 0x749f7564, 0xbaef0c18, 0x400ba579,
  48055. 0x737c70f0, 0x2d742938, 0x21467ebf, 0xc5a8e2ec, 0x5337f453,
  48056. 0x243a666e, 0xed0bd50a, 0xc991f1c7, 0xf4bd1f91, 0x3a7f3e90,
  48057. 0x5f0e129b, 0x96089e8a, 0x07389635, 0xd0d3a177, 0x27182ac9,
  48058. 0x9cf842d5, 0x0817c5c2, 0x21195299, 0x87255769, 0xa32f327e,
  48059. 0x89c2d8fa, 0x056587ab },
  48060. { 0x1ce4733d, 0x008562ed, 0x98e51444, 0x5faff7cb, 0xa9ab46b9,
  48061. 0x5f03021f, 0xb61a8c13, 0x89494c5e, 0x36b35976, 0x57c95036,
  48062. 0x2ac2d2f6, 0x6be84c8f, 0x9bd2703e, 0x0e5b34d8, 0x7e872abb,
  48063. 0xc4ad918f, 0xc4052ee1, 0xc2a89e9f, 0x3190b51e, 0xc2caee3f,
  48064. 0x6fff254f, 0x58fd1437, 0x883e0972, 0x6f3c0d68, 0x0fb15438,
  48065. 0x63d0a0e9, 0xf6caae00, 0xc438764b, 0x3f1d0f6c, 0x815f1565,
  48066. 0xb86cdbde, 0x1b87f2ed },
  48067. { 0x2b0b15b1, 0x35792bbb, 0xce6ba779, 0xa3e4b5a7, 0xdd8f3779,
  48068. 0xfbacffd9, 0xc298d1ef, 0x005450bd, 0xc47031c6, 0x0e3f5556,
  48069. 0x95d68066, 0x0770f07a, 0x2d1052c2, 0xce3e84e0, 0x7aa8cc54,
  48070. 0xb050791e, 0xba3223a3, 0x4d621e73, 0x39632990, 0x87b9b94d,
  48071. 0x7eb8056d, 0x8df9cb47, 0xedfca0cc, 0xe2430de8, 0x9712a0ca,
  48072. 0x374bf416, 0x88848a99, 0xbe3f3c77, 0xc4a3e59e, 0xb22b87b1,
  48073. 0x3e95bc23, 0x8e0227c4 },
  48074. { 0x3210964d, 0x000e22a8, 0xff056eeb, 0xdccd5df5, 0xdaf1ead7,
  48075. 0x02173a1f, 0x67cdcae3, 0xd02833e0, 0x8bdcc90c, 0x1cc574cb,
  48076. 0x3224b4f5, 0x86eca714, 0xbb3f8298, 0xd00e603a, 0x0c1a8deb,
  48077. 0xb98ece1b, 0x378c261d, 0x228a46e4, 0xa6165e5d, 0xc6f9dd0d,
  48078. 0x4b7ef0e2, 0xb3ae3899, 0xbda9f306, 0x3a3c16b3, 0x38a084db,
  48079. 0x5e9a26d3, 0x5394e950, 0x528e5993, 0x4ea206bc, 0x848ecb11,
  48080. 0x40545d6e, 0x14b15ab5 },
  48081. { 0x664c59a2, 0x0f6d86c9, 0x60fd7aa5, 0x3dfe2be1, 0x9072cb8e,
  48082. 0x33f9b569, 0x8176a7e0, 0x5f2325d9, 0x4587080b, 0x79a0d4e7,
  48083. 0x0d5d4e05, 0xa4ee0def, 0xc87b28e1, 0xc0ad9ffa, 0x3f09b4ee,
  48084. 0xd6f18d2f, 0x292e9d87, 0xcc896ae7, 0x6094763c, 0xca88953d,
  48085. 0x18fbf9fa, 0xdbee97a8, 0x4b63d701, 0xdf20e0e9, 0x47ea722f,
  48086. 0xcbba6e30, 0x612b571f, 0xce57e1ca, 0x009a55f5, 0x1e16ac76,
  48087. 0xc4389e2e, 0x742bbed8 },
  48088. { 0xc1dc2c73, 0x23ea86dc, 0xc1643abf, 0x4bbbfd5b, 0x24d8ca1f,
  48089. 0x07f8fa1f, 0x8cb5cac7, 0xde68a6e0, 0x54e66a7d, 0x7d54c64b,
  48090. 0xa9b7ad78, 0x789dba22, 0xe364ab94, 0x4d88d540, 0x1f72e011,
  48091. 0xc8c2e02d, 0x46e2a278, 0x4c826057, 0x4b187c7d, 0xe6c35bb3,
  48092. 0xeb8fe0c9, 0xed8b3dfe, 0x7d11e415, 0xb6bc34e8, 0xb865c7f9,
  48093. 0xb3908bbf, 0xe1ecc17c, 0x717d1ce6, 0xf7cdd69b, 0x151e3308,
  48094. 0xb5c94124, 0x97bd5a14 },
  48095. { 0x81e82861, 0xe01c62fe, 0xdd42c40e, 0x703d4b6d, 0xe65e91e5,
  48096. 0x7e52e55b, 0x5abbbfdd, 0xb8b49374, 0xc72a45f4, 0xb4f15f52,
  48097. 0x550f29d8, 0xce8435a8, 0x582de75f, 0x9df76b9b, 0xa20c8b96,
  48098. 0x52e84c5f, 0x0a8a0af4, 0xaf77d2d1, 0xca6013c3, 0x0389bbd8,
  48099. 0x26f8305f, 0xb0d9b9ba, 0x0cec8b9a, 0xf053e848, 0xffabda18,
  48100. 0x4d63367a, 0xa6424c2a, 0x50f53be4, 0x864fba2e, 0xf892c58c,
  48101. 0x48cc5469, 0x317c6d31 },
  48102. { 0x2cb7d42b, 0x0c3525b0, 0x310facae, 0x55240bc9, 0xff20408f,
  48103. 0x8d5d2022, 0xe0c10ea0, 0x6b01402f, 0x718eb23d, 0x7fbef68a,
  48104. 0x41252a19, 0xa0146b5a, 0x110e0d6e, 0x59afce48, 0x022de181,
  48105. 0xe9a1d27f, 0xdc3f49da, 0x6db96d16, 0xefbe4008, 0xfc1ae3f5,
  48106. 0xeccbc11c, 0xf9d70641, 0x525f8636, 0x49022279, 0xc2763c30,
  48107. 0x3769796a, 0x1d90630b, 0x9cc3483c, 0xee3d3f17, 0x451651f0,
  48108. 0x9da0b8fd, 0x6ae59739 },
  48109. { 0xbff4d2ee, 0x57b13bc7, 0x30b173d8, 0x20754229, 0x0794936c,
  48110. 0xb6254bd5, 0x5efd55be, 0x1d5f232a, 0x4e0c3389, 0xc06f4a85,
  48111. 0x8e61f944, 0xcf2c5b59, 0xfd5f87b7, 0xc564861f, 0x5a2afa4c,
  48112. 0xee261fb1, 0x2d97a774, 0xb0ff7226, 0xd6cf007a, 0x1a89ae22,
  48113. 0xd346f214, 0x28880534, 0x97b6497e, 0x8fe73bff, 0xfa2afffc,
  48114. 0x8a8595b2, 0xf151a726, 0x9ef9cf3e, 0xe744b82b, 0xa84ee5f1,
  48115. 0xbc63fe72, 0x6649048d },
  48116. { 0x1e8b760d, 0x91b7bb78, 0x25aadaa0, 0xd47b0bd8, 0xfab5226f,
  48117. 0x81493d9f, 0xbffc148e, 0x4a6dd226, 0xa29be3db, 0x5a032f8a,
  48118. 0x34b0ab0b, 0x318dbc70, 0x7d654868, 0xdcccbfb5, 0x9c581e46,
  48119. 0x8506ab37, 0x2830ece2, 0x09136a6e, 0xcf6c80c7, 0x48b79356,
  48120. 0xef6b1e86, 0xfa176377, 0x83f0f1c9, 0x2c9c1cc1, 0x16abeddd,
  48121. 0x96f0526d, 0xa93b0de4, 0x3e0e98e2, 0x0f13873a, 0x6f2d7ada,
  48122. 0xf3fa49ec, 0x4eb93b5c },
  48123. { 0xe11fae32, 0xbd89f7e5, 0xc4023f51, 0xd13d74f5, 0x491c3f6f,
  48124. 0x1b0014df, 0x555279b7, 0x1d849a57, 0x05ba0068, 0xbb9e8897,
  48125. 0xc13ca2ca, 0x82222419, 0xfd33676f, 0xafbbb685, 0x75878a2a,
  48126. 0x931c3f52, 0xef3d5173, 0x12aeefef, 0xbd8a6878, 0x189a5cc8,
  48127. 0xd99f0c16, 0x82cffdb3, 0xa19d48b6, 0xbf565406, 0xe9c6c4e0,
  48128. 0x5605e223, 0x86804172, 0x53e781de, 0xc7001cc8, 0xcdf5c90b,
  48129. 0x7c043f68, 0x2b582d93 },
  48130. { 0x81abc2ae, 0xa1165c82, 0xe2b69eca, 0xa73380f5, 0x07fff66f,
  48131. 0xc097b3d2, 0x54776506, 0x5d603826, 0xb57fa21c, 0xdcbac9f3,
  48132. 0xc98dbdd5, 0x78750db4, 0xd9eff32a, 0x85e21103, 0x2f11c41c,
  48133. 0xceed172c, 0x9e348c09, 0xa8e39264, 0x831eddfb, 0x71cb936b,
  48134. 0xf50864a3, 0x915c3d06, 0xe93acfcd, 0xfe8e33cd, 0xb3f2f7aa,
  48135. 0x4bee10d7, 0xeb7cee9a, 0xc1d8eb48, 0xfa574afd, 0x4fa49ce3,
  48136. 0x862db4c0, 0x78615109 },
  48137. { 0x7ae72c21, 0x3fe3f480, 0xfd0f0da5, 0x631aa144, 0xf8c3a454,
  48138. 0xc76ee1e8, 0x51b4f1ab, 0x379ae094, 0xd7cdbb24, 0x2a3a4397,
  48139. 0x82bd5fcd, 0x7a14cffe, 0xf427ef5a, 0xbbe4ed12, 0x284d3ccf,
  48140. 0x9b0a43ee, 0x8eec6e1e, 0x57b78b93, 0x67b8e87b, 0x18d404e4,
  48141. 0x34374c20, 0x0c8adc05, 0x5428deb5, 0x64373605, 0xc3afa2cf,
  48142. 0xb4d80ec0, 0x3aa956f9, 0x6d51f93c, 0x84161c68, 0x9f9a28ab,
  48143. 0x6bc9c025, 0x540b6bb7 },
  48144. { 0x321d315d, 0x04e1734c, 0xd86e05d0, 0x4ef56612, 0xbba8cd81,
  48145. 0xeafae145, 0xacdc789a, 0x1fb07a49, 0x5877570f, 0x6a21e9ad,
  48146. 0xb9bc53de, 0x2e4a837e, 0x1d6298eb, 0x436db293, 0xea362f45,
  48147. 0x43afbc78, 0xaabf6585, 0x2a973d97, 0x0c924d60, 0xdce7dabe,
  48148. 0x7cadf0e9, 0xf69d98f0, 0x75020538, 0xe0b505a1, 0x4461cd29,
  48149. 0x3db7d1a3, 0x5e20e818, 0xe1c28776, 0x52dd50f6, 0x2ca25867,
  48150. 0x92e0388c, 0x897cab14 },
  48151. { 0x0d8bab8a, 0x59ed3813, 0xa438200a, 0xc11d364c, 0x40581415,
  48152. 0x0687bf2c, 0x7ac89674, 0x86ad0d3a, 0xb97411a0, 0x44928105,
  48153. 0xf383371c, 0x74984b11, 0x0d1a831e, 0x70d2ed84, 0x6c912fe0,
  48154. 0xd883628b, 0x14fa88d2, 0x44f8f7fb, 0xcf0ac93e, 0x564f2a4d,
  48155. 0xa6c24fa6, 0x82f629aa, 0xbf6cd949, 0xab906ba3, 0x20a5182d,
  48156. 0x2c822e67, 0x30eb93a5, 0x2ff47dac, 0xfff673aa, 0xdc62c4a4,
  48157. 0x476b0ec5, 0x64b00763 },
  48158. { 0xb3c9a404, 0x1e3f533e, 0xb7ef9952, 0xb1db7f73, 0x6c253693,
  48159. 0xc7f13e29, 0x0738eed4, 0x7ce7f4c4, 0xce26cad0, 0xccfd3b33,
  48160. 0x01ec5cf1, 0xd8784935, 0xdc084e01, 0x3f8fc09d, 0xc39b5acf,
  48161. 0x217cab32, 0x9ef5551c, 0x42daf0bb, 0xe1217a95, 0xfbc76f56,
  48162. 0xc237002a, 0x80178b12, 0xb070a293, 0x0b52c39f, 0x576ca964,
  48163. 0xe3925153, 0x19d68e36, 0x25559424, 0x09e50e84, 0x291fb82c,
  48164. 0x6618ed8c, 0x7dd22ea6 },
  48165. { 0x49cbb3bf, 0x7ffe844b, 0x5562fb25, 0xde0cc704, 0x9f5a845a,
  48166. 0x1e6ee537, 0xe51277fc, 0x956d7f26, 0x30635718, 0x2c75d4b9,
  48167. 0x96957f34, 0x39a14892, 0x82e5742b, 0x8cf4eb32, 0x83247b72,
  48168. 0x6b0d3ddd, 0x201a4237, 0x67a9f633, 0x1414a485, 0x416403c1,
  48169. 0xb6f6a916, 0x60afd447, 0xdac6f790, 0x95f94930, 0xbd3b9d82,
  48170. 0x685ff94b, 0x51cadf0f, 0x5c8f98fc, 0xb13b7489, 0x9559c88a,
  48171. 0x5f18fcc8, 0x31377c66 },
  48172. { 0x7dcfb35f, 0x35c5de09, 0x01cc36f8, 0x2dccca9f, 0x7576cb63,
  48173. 0x7e93e85d, 0xf7b4b375, 0x0c2dd48a, 0xb09a19b5, 0x9d95cd4f,
  48174. 0x71bfe607, 0x752ed159, 0x2596dad2, 0x439880cf, 0x69e90a6f,
  48175. 0xe52efb53, 0x03d3e60a, 0x44097663, 0xa95070e0, 0xfcf364fa,
  48176. 0x05624dd2, 0xd8f993b6, 0x00d5e467, 0xb35a9824, 0x0c8f4524,
  48177. 0xe289d024, 0x648a0179, 0xef45423c, 0x587edabd, 0x3a5fd695,
  48178. 0xa11e5271, 0x3dacc50c },
  48179. { 0x6499ae4c, 0xcb3e4f94, 0x7053c527, 0xa46dcbe1, 0xbe782e8a,
  48180. 0x807f5ce9, 0xd8481e45, 0xb6c64d28, 0xaa286fd0, 0xf35e4518,
  48181. 0xdf1cdb49, 0xf7b7b9ba, 0xaec23eaf, 0xf3fb6210, 0xb9bfd2fb,
  48182. 0x0a9ba385, 0x8807f3a0, 0xe51a0d53, 0xb17b2842, 0x7ab24404,
  48183. 0xf9dd9f0a, 0x6fd57687, 0xf3e9df64, 0xcd1efdb4, 0x60df194d,
  48184. 0x5dd2df7a, 0xe069df05, 0xbed3f2c3, 0x23248a31, 0x469b7561,
  48185. 0x694744f7, 0x866949e1 },
  48186. { 0x3f4ab07a, 0x3a9a0da5, 0xf54a6fbf, 0x2cd6f333, 0xb23cf290,
  48187. 0x0c92e921, 0x848e3d58, 0xc9581c3e, 0xd3b218ab, 0x93af1fbd,
  48188. 0x066cb4d7, 0x38598ea1, 0x990c03a0, 0x5001394e, 0x7d0877b5,
  48189. 0x3b664b1e, 0xd74c7091, 0xd79db1bb, 0x4e2d5dd0, 0x852d4435,
  48190. 0x3329db82, 0x0d2b841b, 0x7b96d480, 0xfa844eb0, 0xc295dc46,
  48191. 0x37a50569, 0x94f7ec4e, 0xc2d38373, 0x5b083177, 0xdc3884ff,
  48192. 0x8b1fa598, 0x574352b8 },
  48193. { 0x0d5d7ce9, 0xed2193f7, 0x0b487eaf, 0x3c19fd26, 0x7be65fd0,
  48194. 0x7c44ab59, 0x78270d56, 0xdd9da860, 0xbaa70198, 0x8a84ec00,
  48195. 0x285985df, 0x2ec27e49, 0xde2028d8, 0x996ccaf0, 0x61c2201d,
  48196. 0x4e7648c7, 0x091c19eb, 0xa96335bc, 0xf0d6782b, 0x253a3a69,
  48197. 0xd2946493, 0x3f204340, 0x099f6873, 0x444521a1, 0x6996011a,
  48198. 0x5fcbcc09, 0xf853a94e, 0x3884d5d8, 0xd3b6a3a1, 0x2418c624,
  48199. 0x06ae3c4f, 0x3e431af2 },
  48200. { 0x83d381f1, 0xf967d939, 0xd0c033c3, 0x36501aae, 0x54410768,
  48201. 0xbf3af4d0, 0x5093a6d3, 0xa86d1598, 0xd92f2900, 0x43ae0741,
  48202. 0x36f0b755, 0xfeb2afa6, 0xaa456d6f, 0xd090a6a3, 0xaefdb646,
  48203. 0x336a4fda, 0x1a942f7d, 0xfd1bfe44, 0x851ee41e, 0x7fc2a3ed,
  48204. 0x11e935c5, 0x4f1c9686, 0x53bbb343, 0xcd577666, 0xad896c2a,
  48205. 0xf26931ba, 0x86bbfa41, 0x8a0fbbd1, 0xa203cef1, 0x1c3d7d82,
  48206. 0xe2664d35, 0x6dad3f15 },
  48207. { 0x12ec35a1, 0xd1940b7d, 0xe7dfb128, 0x6219c5b6, 0xf13321d5,
  48208. 0x2cc278c6, 0x33c58eb6, 0x5e76904a, 0xd9903c43, 0x15090f55,
  48209. 0xc3d96a19, 0x061bc926, 0x8c0acba7, 0x974a9f03, 0x7198b21b,
  48210. 0x7a414021, 0xf8958c6f, 0xb069599d, 0xbebd0129, 0x517f2f1d,
  48211. 0xdf3a8dc3, 0x1109a613, 0x672375c5, 0x08e58448, 0x9383d2d3,
  48212. 0x56590ba4, 0x0bff837c, 0xfc3ee7c6, 0x27d2d55f, 0xc87a5390,
  48213. 0x5f517a3f, 0x2438e9d4 },
  48214. { 0x8815af3c, 0xc4a45308, 0xf3c9bed5, 0xe55f1a32, 0x97b65ddf,
  48215. 0xaef1cdc9, 0x12e51eb5, 0x61c61d94, 0xe63f2490, 0xbd0dac54,
  48216. 0xd0b3e231, 0x6f14429c, 0xf1da6010, 0xf737c3c2, 0x6bbc4fb1,
  48217. 0x7150e04b, 0x1be281cb, 0x205b4c89, 0xd7701f5b, 0xf1b4633c,
  48218. 0x2a513490, 0x8b33ef46, 0x68f1f7f2, 0xddb47c73, 0xbd416b67,
  48219. 0xf4ada511, 0xff795bb3, 0x9d2a97cd, 0x96200e67, 0x00a8b7b2,
  48220. 0xafe30e01, 0x13f39011 },
  48221. { 0x7bd0c827, 0x3dd296ef, 0x4a29ff46, 0x506110f3, 0x1c9a515a,
  48222. 0xf8793068, 0x268bca77, 0xde8d8045, 0x998045df, 0xcbb83024,
  48223. 0x68c0e584, 0x3f90d710, 0x263b6062, 0x2a838ca8, 0x535c5d0b,
  48224. 0x293bb5e7, 0x56415110, 0xceea99d5, 0x1bbda005, 0xfe311ad0,
  48225. 0xa4d8d018, 0x2497e0bf, 0x1cf2b866, 0x33dd77a0, 0xd8c4ba8b,
  48226. 0xbc075b73, 0x722b7bc9, 0x298466d4, 0xcbda1b0b, 0x17a7ce24,
  48227. 0x680703b6, 0x458d4b6b },
  48228. { 0x4d54d8b2, 0x8a26a20e, 0x4d320a0d, 0x05a5696e, 0xf994f700,
  48229. 0x698b5858, 0x2f6549a8, 0x7a4adc3c, 0x3694d00d, 0x1812e819,
  48230. 0x730402bd, 0x46b9b000, 0xa1b36410, 0xe10a1449, 0x99230220,
  48231. 0xeae95ea5, 0x1b4820c3, 0x3efc2e9b, 0x85c9eb8a, 0xfe5b5cb5,
  48232. 0x97847064, 0x21ae0319, 0x8f27d49f, 0x68ef0b70, 0x2f72556b,
  48233. 0x3259ef18, 0x624db01a, 0x00ae0457, 0x5668f95c, 0x628e3b06,
  48234. 0xb6fbbf91, 0x5f13f5fa },
  48235. { 0x3a9b0dc6, 0x7c6ed9ae, 0x6f883ec8, 0xaea1bde9, 0xea8b3677,
  48236. 0xea66bf88, 0x9a66e3ab, 0xdefa6abc, 0x68217ffd, 0xc4d3317b,
  48237. 0x290df05c, 0xf741c8f2, 0x7d11674e, 0x1f0fdf17, 0xc35989ca,
  48238. 0xfdf0ece7, 0x6b9c482d, 0x0eed92df, 0x55bf1ca7, 0x73713e66,
  48239. 0x25cec99c, 0x90acb290, 0xe803e69c, 0x37c9e3a2, 0x17713a1a,
  48240. 0x7c0a3c53, 0x6f5a174d, 0x350dc565, 0x05f802f6, 0x11625a44,
  48241. 0xa37ba4a2, 0x2196495d },
  48242. { 0x13142680, 0x00cb2fd3, 0x65d14cf4, 0xab9e91d7, 0xdfe2669e,
  48243. 0xc6a0ceab, 0x0ae22bc5, 0xbeefce58, 0xcb6ec250, 0x3c2b7986,
  48244. 0xd738f1ff, 0x84adb1a2, 0x516ec8ec, 0x9709bc28, 0x8e8f7db5,
  48245. 0xf3693129, 0x95b197f9, 0xc48efc6b, 0x9aaaa404, 0x9ff10952,
  48246. 0x144154b0, 0x2c3c8cbd, 0x427f3435, 0x33ef7bc3, 0xd21897c1,
  48247. 0x04a17940, 0x6ce548a0, 0x5aa0c47d, 0x3d56fa62, 0x2971cea7,
  48248. 0x04475f08, 0x93ad0eb0 },
  48249. { 0x988a9963, 0x7a0b6967, 0x6515e8dd, 0x61e477f7, 0x3b6b50f2,
  48250. 0x6274e386, 0xd33922de, 0x63a9b8d5, 0x687a5b3d, 0x3c38d3fb,
  48251. 0x1302e323, 0x18f6f09c, 0xe02fcccf, 0x254c05c3, 0x26e662f7,
  48252. 0xc04ed0b7, 0x143fe079, 0x1d5646b8, 0xc9016c8c, 0xef8a9448,
  48253. 0xf823d797, 0xe5674c4b, 0xbccde451, 0x0586f72f, 0x4417eade,
  48254. 0xc5fc88d5, 0x576e588d, 0x2b952209, 0x5844d1f9, 0x4408dd42,
  48255. 0xea41c034, 0x73f8c3f0 },
  48256. { 0x5df763dd, 0x89534fc8, 0x3ac71836, 0x3b1427f3, 0x6e8f15a0,
  48257. 0x0db5be17, 0xcb20888e, 0x1d390944, 0x857caea6, 0x7804c9ad,
  48258. 0x519f7bf3, 0xaa584428, 0x293aa8cf, 0x626eecf1, 0xea36a015,
  48259. 0x749e0d98, 0x3321edcd, 0xefff6dae, 0x28b791cc, 0x963deea6,
  48260. 0x2d16e361, 0xa14e0552, 0xb15ae206, 0xa2e058fc, 0xfca325e4,
  48261. 0x0f268745, 0x21341a8a, 0x7cf9d407, 0x7caa51b8, 0xdfed25d9,
  48262. 0xadbedd75, 0x0108ae39 },
  48263. { 0xa9e88f63, 0x54d178f3, 0xab0c7325, 0xaa05b11e, 0xe261d8a6,
  48264. 0x773a53e6, 0x8d0b91c8, 0x24db7dae, 0xe9bb004d, 0xde10b073,
  48265. 0x54e3090b, 0xfc8befe7, 0x0cc69c89, 0x16af0599, 0x9d59511a,
  48266. 0xddc83803, 0x46c5dafc, 0xc3f65b99, 0x1ee0a599, 0xfbbe4be8,
  48267. 0xfb3a9b17, 0x88891e36, 0x445dad00, 0x0c9aad75, 0xd5097e1f,
  48268. 0xdffc46ab, 0xac85a4e1, 0x8848089b, 0xa0c45233, 0x348bb42f,
  48269. 0xeb13c1df, 0x807c06d8 },
  48270. { 0x98ee0ef6, 0x00a969ec, 0x8bb7b7af, 0xba9d5483, 0xa02f8fdb,
  48271. 0x24484c92, 0x8b70557c, 0x7bdb201a, 0x60ad1af2, 0xe59343e4,
  48272. 0x998c95fb, 0x53a9a942, 0xda861d3b, 0x974db3de, 0xed399c0e,
  48273. 0xce1525c9, 0xf72109bd, 0x89b56881, 0x998211a4, 0x08ff7d15,
  48274. 0xef0f275a, 0x5df76b3a, 0xfa2f358b, 0x93f180f7, 0xc39b0634,
  48275. 0xaac4ffcf, 0x17583b53, 0x2692c626, 0xb55399fc, 0xb2fdfa36,
  48276. 0x99607a61, 0x16424c6c },
  48277. { 0xdd2744a9, 0x5dd65c55, 0xfe3af418, 0x2544c1c2, 0xefe8b089,
  48278. 0x32c82e99, 0xa9df691a, 0x30b7ab25, 0x9be99674, 0x98384550,
  48279. 0xcaf2d122, 0xbcecd258, 0xbcc77272, 0x88ae4098, 0x4b8efa0c,
  48280. 0xd4396141, 0xed64d12c, 0x44ff67b9, 0x2e7f3404, 0xa9e655e4,
  48281. 0x45b0e9eb, 0x3d16fc45, 0xf03ded28, 0x474a3e14, 0xacccb85c,
  48282. 0xa3c9adff, 0x7253a51b, 0x3dfe6bc1, 0xfb5831b1, 0xdddaf4b9,
  48283. 0xa4f4478a, 0x5544e602 },
  48284. { 0xbaa80b4f, 0x897c5313, 0x63bdc8ef, 0x0122716f, 0x7b42c5a8,
  48285. 0xae2742db, 0x0883308c, 0xe9d9e1e9, 0x2d341ab1, 0x352c8c3f,
  48286. 0xed945870, 0x163d0500, 0xc290d9d8, 0x8349dd73, 0x1f6c7d29,
  48287. 0x2053c5e0, 0xcb42033c, 0x83107446, 0x09d09af1, 0x76c88bd2,
  48288. 0xb2794681, 0xd0f70e6e, 0x19b1b540, 0x720b59de, 0x22994b43,
  48289. 0x80b7ecdc, 0x2dec53cf, 0xc1a4cdce, 0x1ed60f42, 0xdd7d3edd,
  48290. 0xe241d261, 0x5735995c },
  48291. { 0xa0237056, 0xdc4ba3fb, 0x33ab3388, 0x6856c164, 0x271ec612,
  48292. 0xc01eebbd, 0xe3031bec, 0xabdeb033, 0x6118a1f5, 0x4eee4419,
  48293. 0x5b600f33, 0xec497421, 0x08868773, 0x1b7185cf, 0x7c1b7dfd,
  48294. 0x7b0c46cd, 0x4a4c5e89, 0xd143b2da, 0xbb1ff94d, 0xdb9a5984,
  48295. 0xc9cf3465, 0xac3904e4, 0xeace64c9, 0xf8729bc0, 0x768ad99a,
  48296. 0x5cc22821, 0x8a9540c2, 0xbbd3b081, 0x049a6917, 0xe468ed5f,
  48297. 0x3ec45ef0, 0x885486df },
  48298. { 0x4bdff464, 0x6a942c93, 0x25a7b451, 0x3db2719f, 0x325be324,
  48299. 0xccb0070b, 0x19fe3339, 0x2055a31b, 0x241ee8ff, 0xaca69ae8,
  48300. 0x55ef8def, 0x7607dd08, 0x1a1b73c6, 0x9e24960f, 0x71d36810,
  48301. 0xbcb0e8a2, 0x6885e6b9, 0x29e11aa2, 0x185eae19, 0x98b5d0ab,
  48302. 0x0f81f91c, 0x1a0b96e4, 0x994fc503, 0x4d0e8bcf, 0xf119d6e0,
  48303. 0x33d81697, 0xaaa4ce0c, 0x29083287, 0xc91ff9d7, 0xc5dd4d3e,
  48304. 0xd4ab962d, 0x31cecfe8 },
  48305. { 0xfc8b21e8, 0x437bfd9a, 0xb19436df, 0xe5dd32b3, 0x921c36a0,
  48306. 0xfe5902d4, 0xa3d0fa90, 0x8e9de84d, 0x5bb523bd, 0x9663e6ad,
  48307. 0xaecd6975, 0x9800a23f, 0xb4fbb59c, 0x1009c0d9, 0xc9d20ff1,
  48308. 0x839aa7bd, 0xecd6fa3d, 0xf502f66d, 0xc5516ca9, 0x480ed4fb,
  48309. 0x6c742ac4, 0x65ffa5f6, 0xff3252f8, 0x2b7c7945, 0x75d9cb3d,
  48310. 0x72fefc05, 0xd6d6f1d2, 0x11b0863b, 0x9a6a4ec3, 0x5d8f3cf0,
  48311. 0xda2547b3, 0x6961b46a },
  48312. { 0xcb35e2ac, 0xd07b587e, 0x57af14d9, 0x1ed5546b, 0xdb28a04c,
  48313. 0xeca17a5b, 0x709d54f0, 0xa1f91d44, 0x9c6f400e, 0xa6e719fd,
  48314. 0xfb8ce190, 0x4e4b88ed, 0x246e3fd2, 0xf9781edd, 0xb655af5d,
  48315. 0xd67120e6, 0x93413ca7, 0xda782d1d, 0x9707fa21, 0x697e20a2,
  48316. 0x54e84123, 0x1eb51f32, 0x36051f9f, 0x2e254d9e, 0x73ce5be9,
  48317. 0xddaec42b, 0xcd3f794f, 0x89a9a32e, 0x0781aad9, 0x1964e22f,
  48318. 0x53755212, 0x6a63a90c },
  48319. { 0x3d7acbbb, 0x76554e00, 0xb74f6108, 0x2c01668a, 0x388c519b,
  48320. 0xe4a29672, 0x3eb94d4f, 0x01667714, 0x0cd6d2f6, 0x086a3cdf,
  48321. 0x7b370f7f, 0xf8658021, 0x5a4d3e7c, 0x658880c1, 0x5ba3f4a1,
  48322. 0xd6ed5816, 0x5ca471dd, 0xabcc7813, 0xe844a576, 0x809bf074,
  48323. 0x6ea502ea, 0xa53a81b3, 0x0e021ed3, 0xc20b9307, 0x8617f165,
  48324. 0x8c27f892, 0x8235cd0b, 0xa5476446, 0x82552961, 0xffc89ffd,
  48325. 0xd151d90e, 0x51ed4a22 },
  48326. { 0x449701b4, 0x37d6963a, 0xbb27caf2, 0xea8d91a3, 0xb572965f,
  48327. 0x3ef9be15, 0xdb50bf7d, 0x75a7a055, 0xce643b9b, 0xfd67480e,
  48328. 0x6ceb5d5e, 0xf2a60d2d, 0x5ed7c897, 0x68fc320c, 0x28ce685f,
  48329. 0x41c53cf6, 0x7106615e, 0x0e29711f, 0x23500ecc, 0x7a872138,
  48330. 0x6c29fe48, 0xaf0a9260, 0xe1ef9712, 0x93df3f2a, 0xd2d169bf,
  48331. 0x0d5f6fb1, 0x74a9793c, 0xeb7afe26, 0xe9f49256, 0x4173d94a,
  48332. 0x2b8b5ce5, 0x2d6951bc },
  48333. { 0x904e222e, 0xdd007d9f, 0x86f4e109, 0x333f248f, 0x8f429eee,
  48334. 0xd4994e8b, 0xcfc77518, 0x29573415, 0x0b0f42f1, 0x6e7fea3a,
  48335. 0xc2743519, 0xc795cb7d, 0x711e71a0, 0x820a8f66, 0x2b874f55,
  48336. 0x83d95d9c, 0xe70e1627, 0xd4b64d78, 0x8b92a742, 0x924353f5,
  48337. 0x447b5e6d, 0x322048b1, 0xbcf931a0, 0x0bad730c, 0xa7af2268,
  48338. 0x75c4d089, 0xb83b93f9, 0x464904c1, 0x165b3aee, 0xa24eba02,
  48339. 0xe08cc5f0, 0x65c48e78 },
  48340. { 0xde222c22, 0x1a1c73ce, 0xfcea23b4, 0x5683d8cd, 0xb2143b06,
  48341. 0x0301cb14, 0x59fcec77, 0x284adf8f, 0x31204cef, 0xfb1c581c,
  48342. 0x94735107, 0xf54d3eee, 0x4d3188c0, 0xdbf67f0b, 0x10f18d12,
  48343. 0x76a3f2d1, 0x07d3e013, 0x3809fa28, 0x25e7ece0, 0xf06f0a46,
  48344. 0xb2895d2e, 0xd82867ed, 0x08b0553a, 0xe106f489, 0xef245445,
  48345. 0xe2280fa6, 0xa8d9a3cb, 0x402d5785, 0xd438ba2d, 0xf63dd9ff,
  48346. 0x7a6b226f, 0x36b5cd2c },
  48347. { 0x545679a7, 0x87ff4e20, 0x4520c750, 0x64d80b41, 0x9b459cd8,
  48348. 0x90a357fa, 0xc85af1a3, 0xa19eaf39, 0x8d935a5e, 0x0d475d79,
  48349. 0x781a678a, 0x74501983, 0x0cc2e810, 0x74839779, 0x2f412244,
  48350. 0xc6a21d11, 0x36a51a37, 0x8d0e85f9, 0xeaa74df8, 0xff50151e,
  48351. 0x93cf99c4, 0x14e182a7, 0x376a9ab6, 0x45593df1, 0x522389ff,
  48352. 0x18f73caf, 0xf7445e8a, 0xd27cc960, 0x39a51dc8, 0x0692f4c5,
  48353. 0xdb39bfd8, 0x08d7c144 },
  48354. { 0x3ecca773, 0x809c0d96, 0xd48c2156, 0x87ea9192, 0xdb6bd641,
  48355. 0xf0eccd74, 0x2a678cdf, 0x77312374, 0xd1587b7e, 0x7a966d8b,
  48356. 0x6130a4c6, 0xf3c1a101, 0x5fce17bd, 0x7cc6e838, 0xa8de7aa4,
  48357. 0x95e95bb8, 0x898308e3, 0x3fe1e8b5, 0xe347694a, 0x0197243e,
  48358. 0xbb0cd2bf, 0xf3fe9c42, 0x0f9b2b49, 0xb5905264, 0xc7367d1f,
  48359. 0x4c385e8b, 0xb5ee147b, 0x1d3050ae, 0x04004ad9, 0x8e2c3879,
  48360. 0xbab70202, 0x5f2aa8ee },
  48361. { 0x1266524b, 0xe208d464, 0xd0a19f66, 0xb7bf3880, 0xda106ebf,
  48362. 0xa5aa685e, 0xe642dd46, 0x0a69e8d3, 0xc682e4d6, 0xef349c61,
  48363. 0x0fcb534c, 0x26f6ee3b, 0x05eb67b8, 0x7daba127, 0x18be05f6,
  48364. 0x2babb27e, 0x8e2d85d1, 0x959afcba, 0xe2d9d386, 0xedcf2d1a,
  48365. 0x1ea6f06e, 0x59dc52e6, 0x866e5ae8, 0xc28278b4, 0x02bcd3c7,
  48366. 0xd9ff0340, 0x784be82f, 0xe884ac76, 0x83c9f224, 0xa3164980,
  48367. 0xb46ff949, 0x62501a98 },
  48368. { 0xad264086, 0x563f7d9a, 0xa5e0e4bd, 0xca6a33db, 0x8c8d3d67,
  48369. 0xe8253002, 0x46e64b19, 0xa288dac8, 0x20aa4536, 0xfa3c9197,
  48370. 0xed553eac, 0x8130c9b0, 0x2ea8abd3, 0x622806e0, 0xceccfe77,
  48371. 0x52fbf54d, 0x4f0d1b70, 0xbd9a8e31, 0xd59b1741, 0x519d2133,
  48372. 0x9a6fea8a, 0xfd74101c, 0xb5c4eb10, 0xd1acf7a0, 0x91f9da5e,
  48373. 0x78499b73, 0xc0dea586, 0xabaa4c49, 0xa1f3531a, 0xcc9c5f73,
  48374. 0xfd3fc665, 0x497b15fe },
  48375. { 0xf45568e9, 0x8a56cbaa, 0xc7192a6f, 0xf491a0fe, 0x9ab2539a,
  48376. 0xdbb03dd3, 0x4ac37da9, 0xc86522f8, 0x02a0f5b4, 0x8c8cdba2,
  48377. 0xa29c539f, 0x8109fc75, 0xca90f02e, 0x9cd06d31, 0x3e216dbf,
  48378. 0x8f31f044, 0xba3ebd91, 0x99aa68ac, 0x42c007f4, 0x2a80d0d2,
  48379. 0x86a9b7ce, 0xdd8dffbf, 0xd6308edc, 0x405d3e84, 0x068012ca,
  48380. 0xdafa33fe, 0xedea1071, 0xc2eebd13, 0x2ff637e6, 0xb7ae7e5c,
  48381. 0x9e514cb7, 0x18d46a6c },
  48382. { 0xa78b7802, 0x868cbb22, 0x497cbaf4, 0x0745ddb2, 0x42ae8add,
  48383. 0xc4eb2f3e, 0xb4ceb4e4, 0xac0abcda, 0xa325fd40, 0x2e0d8325,
  48384. 0x13ac7345, 0x6cfe0571, 0xb14171b9, 0x7407a788, 0x6da7a52b,
  48385. 0x70eb0603, 0xd85176ac, 0xab0b36f9, 0x7c2954f3, 0x14109d29,
  48386. 0xdcd705ad, 0x370de9c8, 0x7bb5e751, 0x3f0db5cd, 0xa06e708c,
  48387. 0x45f93d41, 0x7e93050d, 0x10d54f8a, 0x5a38fef9, 0x69e6f8e4,
  48388. 0xd3f62e40, 0x55044601 },
  48389. { 0x06cb9cc9, 0xd1c5c910, 0x41d00014, 0x542074d7, 0x11236fb8,
  48390. 0x7cd8663e, 0x29ad5f82, 0x39721ffe, 0x2951fc83, 0x1d21fbfa,
  48391. 0x400d144f, 0x1cde06e7, 0x91792e6b, 0x9042596b, 0x29ad5166,
  48392. 0x3365c8e5, 0x9aeefe98, 0xe2220e85, 0x70c2aee3, 0xbcb53189,
  48393. 0x9ff100bc, 0x477ca3db, 0xf532973f, 0x27074176, 0x9a2bd01b,
  48394. 0xa12118ac, 0x3dd79f93, 0xf3425209, 0xc6f5d7db, 0x563a8ff7,
  48395. 0xd7b0ec4f, 0x0da313fc },
  48396. { 0x15aa2557, 0x37125a8c, 0x00893e9c, 0xca21d70c, 0x67b8a823,
  48397. 0x48713994, 0x7cb0042a, 0x0d3e9a74, 0xc9e2ce18, 0x2d2bf4ff,
  48398. 0x049aeac2, 0xd5531a0d, 0xf03d0660, 0x4d29a616, 0x1f1b7f00,
  48399. 0x473d50d6, 0xca3de50c, 0x3af0ecbb, 0x09c28f27, 0xe2959bea,
  48400. 0xf8704664, 0x6d7c2ea0, 0x731083ef, 0xadfae4e1, 0x941c2554,
  48401. 0x50940c26, 0xa1162d03, 0x44167410, 0x1e82290e, 0x620230d8,
  48402. 0xdb414acc, 0x63630be8 },
  48403. { 0x8a7d2e41, 0xbf8d5222, 0xeb62f879, 0x49e75823, 0x6c402d89,
  48404. 0x1b4d33dd, 0xde2c59ad, 0x883e04d6, 0x49b9dc38, 0xbf3f38f4,
  48405. 0xb4b70c4c, 0x9d997d18, 0x13cea045, 0x1f69b20c, 0x58e2606d,
  48406. 0xca3d7025, 0x261d1b79, 0x3d4fd977, 0x5a1436fa, 0x56aeafa8,
  48407. 0xbb443c07, 0x369b3e98, 0xe558f6be, 0xfce5186c, 0xf8ac8f89,
  48408. 0xeb0cd478, 0xd5e5aa72, 0x68074f37, 0x68544eb0, 0x295845c0,
  48409. 0xf16688ed, 0x306a9871 },
  48410. { 0x634ec136, 0xbc451e9d, 0x0e6f658f, 0x1edf27ca, 0xc0db4120,
  48411. 0xa9be0152, 0xc5bfee67, 0x87b6ef20, 0x9a2d6023, 0x35283238,
  48412. 0xc7afb899, 0x60e564d8, 0x0ac9c2de, 0x4af22bc0, 0x82a9d22b,
  48413. 0x28e6f631, 0xf532701b, 0xc075c701, 0x82075f91, 0xf6d418f8,
  48414. 0x1beaa511, 0xf9fa628d, 0x6e72a13d, 0x551e7a17, 0x77f4c01c,
  48415. 0x9306215b, 0x93c9d588, 0x71aba731, 0x58e57cd4, 0x6443ebe0,
  48416. 0xe8103e37, 0x2833ac41 },
  48417. { 0x8da5ec5c, 0x7e564b86, 0x1c08db24, 0xac3d9da8, 0x8c57a728,
  48418. 0x9d7c1f0b, 0x9d343dc2, 0x3512afe7, 0xfdc60339, 0xb438e4cf,
  48419. 0xdcfa1941, 0x7d5a2700, 0x27320449, 0xd5f323f8, 0x1393c6e6,
  48420. 0x1b87a58e, 0x04baa431, 0xecb68bd1, 0x4722b4d7, 0xc09c1c5a,
  48421. 0x206b5faa, 0xf42faa97, 0x9976327e, 0xe1dcbcd6, 0x087787d9,
  48422. 0x655ba9e4, 0xde5c0191, 0xbd59c757, 0x0bcf3538, 0x673020ed,
  48423. 0xa49d6303, 0x120cd454 },
  48424. { 0xcab0f9ee, 0xebfdb8f4, 0x2cce58ee, 0xbc003ef0, 0x5a8d0665,
  48425. 0x9b6a6841, 0x9b957774, 0x642ed3a6, 0x4721ab5c, 0x3de487f0,
  48426. 0x21a4f0d3, 0xef2ff380, 0x29dbddcd, 0xbd16f558, 0x0e93dff2,
  48427. 0x2ef05b4b, 0x0bc9aec1, 0xde1faa12, 0xd467fa92, 0x66dae2c2,
  48428. 0x5eb33e34, 0x758daf64, 0x8f0103cb, 0xa67ad9f6, 0x9be02430,
  48429. 0x151f693a, 0xeb4054bc, 0xd5698496, 0x7019336e, 0x8ef1677e,
  48430. 0x7fdeea3e, 0x021cfd16 },
  48431. { 0xdf5c36f3, 0x5c73715f, 0xd64ad254, 0x703bde37, 0xf2cf7713,
  48432. 0x55368d10, 0x0f3993c8, 0x1e5ec7b7, 0x304ae4ca, 0xfdb16776,
  48433. 0x3d3bb18b, 0x0d8f717e, 0x66343d5a, 0x5267073f, 0x156008b5,
  48434. 0xfaeb52ef, 0x224a470f, 0xb97ad5f9, 0xed2ab51a, 0xaf86e391,
  48435. 0x9974302c, 0xdc0c7e57, 0xfd0ae28a, 0xc88fa817, 0xbf8ed59c,
  48436. 0x807c22df, 0xeb128bb6, 0x5dedc231, 0xa20595a3, 0x71edcd9c,
  48437. 0xc73cf78e, 0x07265b46 },
  48438. { 0xbd66232f, 0x73dd99f0, 0xc4027716, 0xc59aaf89, 0x5b860fc4,
  48439. 0xaf826dfa, 0x7a943f3b, 0x239ea8aa, 0x523c428d, 0x0e0e1b1a,
  48440. 0x6973b95a, 0x55ea0e3a, 0x2557753b, 0xea399caa, 0x06957b1f,
  48441. 0xf8adf72f, 0x3bd34302, 0x0389f341, 0xf8a43a97, 0x333f27d0,
  48442. 0xadaf796f, 0xcd9c0c08, 0x49c12aa2, 0x6dcca49b, 0x7a0ac6e9,
  48443. 0xdd88deee, 0x0644080e, 0x8f47575d, 0x0cc2f4bd, 0x6e9d667d,
  48444. 0x31d1496c, 0x36c5754b },
  48445. { 0xf323d84b, 0x9120046e, 0x7e789c4f, 0xa6991122, 0x921b8055,
  48446. 0x4b0eaf4e, 0x8079974e, 0x6339844a, 0x740f8c79, 0xc905466a,
  48447. 0xcd6def49, 0x1c18d0f7, 0x4b23e4ba, 0x5297da6b, 0xc41800c5,
  48448. 0x1c09dff3, 0x37ef6777, 0x6c49075b, 0x50513ded, 0xa94c3a40,
  48449. 0x6b0b1705, 0x3d6742e9, 0xc48af5ae, 0xc0784494, 0xc95822de,
  48450. 0x40c01532, 0xc164d94f, 0xa2ddade5, 0xa2975eb5, 0xfc8a8ac9,
  48451. 0x1946944e, 0x06fbf861 },
  48452. { 0x3f45aa97, 0x2d65338e, 0x1d040feb, 0xd83b58c8, 0x0fdef8b9,
  48453. 0x05fef59b, 0xe4d7417c, 0x7beb071a, 0xb30a1a23, 0x982b61f5,
  48454. 0xfb65bd03, 0x4c5f2a2a, 0x5cbf6bf3, 0xe40abc9d, 0xf06612a5,
  48455. 0x422c326d, 0x9571ae28, 0xc921e69d, 0x23d3434e, 0x7c88b10b,
  48456. 0x9da07933, 0x96d2e957, 0x3619cf4d, 0x833d46a1, 0xd95eefa1,
  48457. 0xd9d19653, 0xa03e8f0e, 0x2a7d8411, 0x04bb5ab1, 0x5e642953,
  48458. 0x1f0fa9ea, 0x5e9ca0fd },
  48459. { 0x197c5dc4, 0x5bd54571, 0xe78a95a2, 0xe2da40bf, 0xffdb0eb2,
  48460. 0x65fb9efc, 0x0d17467c, 0xe952dc2c, 0xc758c6a3, 0xc1fc9c7b,
  48461. 0xd4034a9a, 0xfc79562c, 0x61f64b56, 0x26e36fbe, 0x1e84728b,
  48462. 0x6adc4b9e, 0xa8f9ac8a, 0x7f165fd3, 0x03e3e013, 0x7bc93a45,
  48463. 0x656478e3, 0xeacc5513, 0x064ddc77, 0xd3391717, 0x76936914,
  48464. 0x75b318dc, 0x362424a6, 0x69b1f1c7, 0x49955f34, 0x8cc2045b,
  48465. 0xc6836af8, 0x940622b3 },
  48466. { 0x0d997973, 0x4710ccb7, 0xd3f8f115, 0x3b29625d, 0x5b97abd5,
  48467. 0x8cf0c4d5, 0x673e14a5, 0xc6321e0a, 0x3d262246, 0x0541af9d,
  48468. 0x6fc83b11, 0xde6d8754, 0xf01652a4, 0x47e97da8, 0xad9802b6,
  48469. 0x0f82b3a6, 0xae9c44b2, 0x69aa4075, 0xced2bf77, 0xaf3f5de2,
  48470. 0x497a40da, 0x1ef1ea8a, 0x3c23ba9c, 0x2e0f8608, 0xf190a2c8,
  48471. 0xd8a998a4, 0xcfde3368, 0xe2b49c8c, 0xbde6bd71, 0xb9f49824,
  48472. 0x785bedb6, 0x80bb1664 },
  48473. { 0xfd145cb5, 0x05e575fe, 0xac5e6883, 0x155ee561, 0x8793b273,
  48474. 0x461e70cf, 0x133b2338, 0x9f1553de, 0xa2a7ba07, 0x2fb9e0c3,
  48475. 0x3e7086fa, 0xc3bfd6a8, 0x8bb4cb93, 0xb6ba8500, 0x76f82dbd,
  48476. 0x0b66d789, 0x54eb49ff, 0x7d5a6ff6, 0x1f20b322, 0xcd65d237,
  48477. 0x54e29cdc, 0x79ea49c2, 0xcb118ff9, 0x64975963, 0xcc58000b,
  48478. 0x969598dd, 0x110c779c, 0x95107918, 0x63b85a35, 0xedfc1548,
  48479. 0x41212350, 0x077ba5ea },
  48480. { 0xcdd86f61, 0x0b3a38d3, 0x0502a0ab, 0x43121445, 0x806d0272,
  48481. 0x1912edc5, 0x8a32f10f, 0x01dc1f98, 0x0e80c760, 0xbb1d31d1,
  48482. 0xf464e8b3, 0xd46ec7e5, 0x9abf49ee, 0xd569af36, 0x2cdade77,
  48483. 0x9d286ea7, 0x45ad5920, 0x2be7020d, 0x6299ae7f, 0xabe5236e,
  48484. 0xd3f55c07, 0xc93179bd, 0x52350e80, 0x8138995a, 0xaff07586,
  48485. 0x0901265c, 0xf4739653, 0x5b3c81b2, 0x9bc77d21, 0xbaf7581d,
  48486. 0x4591a2e2, 0x6b2006df },
  48487. { 0x965b1bc1, 0xb2fe50a8, 0x962bb4fd, 0x931f536a, 0x000e7f99,
  48488. 0xd5718d33, 0x53d5125e, 0x84728f25, 0xd2125caf, 0x4f8a6184,
  48489. 0x357f679e, 0x54f1a701, 0x1531c05a, 0x70a9f40c, 0x6fa8b775,
  48490. 0x10d0cb97, 0x9dc12ce9, 0xb476f41e, 0x2755f894, 0x5c8d7a75,
  48491. 0x625741a4, 0xd6c12e10, 0xc917b16c, 0x262a6fb8, 0x38d6b0a0,
  48492. 0x24d116e6, 0x32c38e83, 0x849540c0, 0x66868afc, 0x855b911c,
  48493. 0xbd26b550, 0x53217ea6 },
  48494. { 0x259f52b4, 0xfc840473, 0xe621146c, 0x968da9cb, 0xcacbd26e,
  48495. 0x964eb85e, 0xe4a54344, 0xab7daa2d, 0x381a4ff7, 0x6dc3b848,
  48496. 0x41c815ef, 0xa07a96b3, 0xc3d4b1e1, 0xc4fae9e8, 0x42ce9ea8,
  48497. 0x0f938d1e, 0x35cc052f, 0xa727dacc, 0xe9a06f07, 0xc81e01c9,
  48498. 0x4a6d65a1, 0xa9e08dcb, 0x6044a9a6, 0xf8e2d173, 0xf2bd295b,
  48499. 0x99893dd0, 0xf9781b12, 0xa08d3379, 0x61830ac2, 0x64bd6001,
  48500. 0xd9adbeef, 0x0386931e },
  48501. { 0xd09885a5, 0xd0d7abb3, 0xe355bb07, 0xed9d2b67, 0x536ebaed,
  48502. 0x3bc238cf, 0x699ce4d6, 0x61ca2e78, 0x111594cd, 0x354ff447,
  48503. 0x03316ad2, 0x55cbe709, 0x49fff5c4, 0x418679fd, 0x0f9c6c40,
  48504. 0x75bacd75, 0x2972721a, 0x677edc88, 0xe5ef502f, 0x82596887,
  48505. 0xbf320e0e, 0x459e9367, 0x8bbdccb2, 0x81ce36ef, 0xb766863d,
  48506. 0x1ba097fc, 0xd58c6db8, 0xcd3a21d6, 0xb4a8748b, 0x0e4967cd,
  48507. 0x15041c20, 0x2caaf749 },
  48508. { 0x6ed20424, 0x44f98006, 0x22471545, 0xb3e4ea23, 0x781a8c86,
  48509. 0x268ed1a5, 0x7ae5b70b, 0x48d0ab75, 0x356d3982, 0x6ca8b320,
  48510. 0x2df31fa4, 0x9ce8e681, 0xd925dcf2, 0xb909d232, 0xf56723de,
  48511. 0x302c8f78, 0xabac96f9, 0x11725d69, 0x57d1a170, 0x656a47ca,
  48512. 0xc18a2be7, 0x6bb5d511, 0xad50d9d9, 0xb56e45f1, 0x70b05518,
  48513. 0x36e886e2, 0x09d8ff91, 0xc7c71f3d, 0x9350361e, 0x65a1bbe2,
  48514. 0x45fe3bd8, 0x86d7f532 },
  48515. { 0xb0bf719a, 0x99f16eb6, 0x8bc3d913, 0xb6975098, 0x26cd01b4,
  48516. 0xfae50e52, 0x90898d1c, 0xd3e3ac54, 0x887ec666, 0x4da3b9db,
  48517. 0xfbea45b8, 0x58300644, 0x8355b058, 0x369f3bd9, 0x579bcc13,
  48518. 0x0fb239a8, 0x6e2bd811, 0x4f5b4539, 0x24198fd2, 0x007f3baf,
  48519. 0x8837d51d, 0x68a676db, 0xeae75b16, 0x68eeea62, 0x3db6083c,
  48520. 0x5ffe5f94, 0x7d836c5a, 0x52c94d0f, 0xcbc1ff85, 0x5a4c3c6f,
  48521. 0x86c0b4dd, 0x682a55e3 },
  48522. { 0x587495aa, 0xc8f235a4, 0x34c7245d, 0x2276026c, 0xb75a46e3,
  48523. 0xd6ae0cc5, 0xecc3e5e7, 0x890d3965, 0x14296629, 0x1b13342f,
  48524. 0x8a877227, 0xc89927e6, 0x2324a68b, 0x1543f27e, 0x49cdc21a,
  48525. 0x6c447684, 0x1452d0ac, 0x9bc7fd4f, 0xff4b045c, 0x2cc30a31,
  48526. 0x852f7611, 0x415d46a0, 0xc6fdd7a6, 0xad737052, 0x7b4c7c91,
  48527. 0xdcecc3ab, 0x7688d70c, 0xd2cdf01b, 0xe40d3905, 0x054f2542,
  48528. 0xfefe4dcd, 0x02227fa6 },
  48529. { 0xb751948b, 0x1805efd9, 0xfdfd225d, 0x8efeed46, 0x4f2c8b22,
  48530. 0xcb128e09, 0x96f7c5e5, 0x9d1090bf, 0xb4cbeca0, 0x0959d044,
  48531. 0x8e08cb04, 0x21c955f9, 0x68fa4fce, 0xbc1f279d, 0x0710ae9a,
  48532. 0xb021e14e, 0x881167f4, 0x64d16e9f, 0xbbc9f1a5, 0xf5a5c22e,
  48533. 0xe3420eea, 0x5f3716df, 0xd5c4e843, 0x971eb915, 0x28ffba81,
  48534. 0x64fc55fc, 0x7dd37578, 0x3427e54d, 0x15ebc7d0, 0x446e6a62,
  48535. 0x29269778, 0x547e249a },
  48536. { 0xa1ffda27, 0x4706868a, 0x7955cf50, 0xb4e6cdcc, 0x0a63f3d8,
  48537. 0xf65151e1, 0x9de5e70a, 0x5b4127ea, 0xf9342823, 0x3d2c09ba,
  48538. 0xaa2f7d51, 0x18c99d83, 0xddeec025, 0xa0c5bb1d, 0x03dcf1ce,
  48539. 0x7ffddf84, 0x616fdeda, 0xe57e4d29, 0x7932a1f0, 0xd2456569,
  48540. 0x3191d4e3, 0x7475e0e8, 0xc220218b, 0x3479bea1, 0x8bcb2505,
  48541. 0xfceb5c90, 0x3c6132e6, 0x1c685cea, 0xbfe6c1eb, 0xc42dc745,
  48542. 0xd2b08eea, 0x45a41cc0 },
  48543. { 0x4dbbf0e1, 0x3ea9b2c7, 0xa17cf70e, 0x41ff962f, 0x5eeb4c66,
  48544. 0xdc1ea758, 0xa9beb17e, 0x4f5412d2, 0xa285741a, 0x2c9e4f52,
  48545. 0x984fd11f, 0x93df7da4, 0x0df3184e, 0xb2afbddc, 0x2421e375,
  48546. 0x96323d25, 0x49df781e, 0xc87be1e4, 0x3d589bea, 0x145601ed,
  48547. 0x28fff6dd, 0x0f0bd9bd, 0x8a0f298c, 0x2d3259d4, 0xd88e6944,
  48548. 0x362d7a77, 0xb6ac2af6, 0xa84c06b6, 0xd087da02, 0xba850ac9,
  48549. 0x42ee40c8, 0x128763c9 },
  48550. { 0xacbac178, 0x29a80f07, 0x34b08f6e, 0x7cc20044, 0x70feded2,
  48551. 0xe9631d14, 0x86615767, 0xb2115da3, 0xcb088548, 0x7c75f5c4,
  48552. 0x9a2e8e03, 0x5b29d213, 0x8b881752, 0xfe9fda66, 0xc1de7ebc,
  48553. 0x3f1d8d88, 0x03218123, 0xb476565e, 0xb1c995f3, 0x07365561,
  48554. 0xb13eb71b, 0x2160cb18, 0x99b3a0eb, 0x7e8da513, 0xb20fcd74,
  48555. 0x5e8ca1f9, 0xb4126d72, 0x6a7e0067, 0x68bb637f, 0x1e8204b7,
  48556. 0xfc4f74d2, 0x75e96bcc },
  48557. { 0x0d19716e, 0x189d1fdc, 0x7c384525, 0xdf585058, 0xea987d2a,
  48558. 0x64a846d1, 0x6c07150f, 0x12b6bf83, 0x4d6fd5b7, 0x91d85d46,
  48559. 0x4f53f55f, 0xa9788836, 0x81509129, 0x60083bd8, 0xea876f48,
  48560. 0xa7672683, 0xc15b2489, 0xe80b2e7a, 0x42d1d992, 0x985ef8d2,
  48561. 0xcf3de492, 0x9c57b029, 0xb1487627, 0xfe02f83c, 0x8ae5b687,
  48562. 0xaeba4fe4, 0x5d6b8196, 0x8a86f09b, 0xa16e523d, 0xd88f566b,
  48563. 0xba268949, 0x309a6e9a },
  48564. { 0xbdfbe97a, 0xef27ee50, 0xb8c50c4d, 0x1a5fe70f, 0x7fe09f5c,
  48565. 0xcc7beb01, 0xbed36cc5, 0x8fa15a85, 0x7550ed3a, 0xc0c3acdb,
  48566. 0xeb908681, 0xc581ef87, 0xc49d5ccb, 0xa15b3362, 0x1fa264e8,
  48567. 0x0fbb1714, 0x8e1eee88, 0x267f8d8f, 0x21c2b63d, 0xd31ccfd6,
  48568. 0x53be7efd, 0x924dbe7d, 0xdb2a358a, 0xd42e877f, 0x75d68ac1,
  48569. 0xcf9673c7, 0x714fea55, 0xe35978fd, 0x5769b202, 0xeeb36653,
  48570. 0xd7593789, 0x0458258a },
  48571. { 0xa042dbdf, 0x5df71a74, 0x5779dfa2, 0x2d405857, 0x0d2e6657,
  48572. 0x0e66cba7, 0xca2e892e, 0x285d6745, 0x0f0e6b5f, 0xf56a8def,
  48573. 0xa30767c3, 0xe0ee851d, 0x43346b9c, 0x98c05658, 0xd6b3c742,
  48574. 0xb35fce26, 0x39777e00, 0xc0895bff, 0xe7b6d886, 0x83c8f6a6,
  48575. 0x4f02904b, 0xbee14843, 0x2e84ec34, 0x7f74915b, 0x96d10991,
  48576. 0xbaaf663c, 0xe41facc0, 0x004b8757, 0x6f86c029, 0xa2b880e5,
  48577. 0x95b77358, 0x53f4a3e0 },
  48578. { 0x89fc48e7, 0x11bb08ce, 0xafab5aeb, 0xba60c577, 0xa0c1cb5a,
  48579. 0xf06bcbf8, 0x79757cb6, 0x7d2efaea, 0x76319160, 0xe26d90b1,
  48580. 0x2b77b7a9, 0x42aa1ab6, 0x285df2bf, 0x38eec0cd, 0xf3a8f7f0,
  48581. 0xd35947f5, 0xfc1cb5b5, 0x97c8dc0e, 0xc45845cf, 0xfeb8cca0,
  48582. 0x249e26f2, 0x16e8d989, 0x483ed89a, 0x7c264e6d, 0x51d91073,
  48583. 0x13a3f145, 0x305e99f0, 0x8501562e, 0x6908d563, 0xaaf98d74,
  48584. 0xd723d236, 0x0a99e653 },
  48585. { 0xabbc0559, 0x23536f46, 0x9aa1a160, 0xc163067b, 0x0c1681b5,
  48586. 0x229fd229, 0x1378e907, 0x61254be1, 0xab793a2d, 0xc60ff57a,
  48587. 0x466552db, 0xa6f2df8b, 0x8c170a36, 0x9ad31893, 0x29b74d9a,
  48588. 0xc5cd9abe, 0xf7848523, 0xcf747273, 0x0d0e3063, 0xc126a93a,
  48589. 0x4248e3d8, 0xfe2021e3, 0x8323ddfa, 0xd97343ee, 0x332639e7,
  48590. 0x9f768775, 0x75325548, 0x9650fc31, 0x3eebf7ea, 0xb595dbd1,
  48591. 0x010fcbc0, 0x3a95cb45 },
  48592. { 0x39d7ff2e, 0x954e68cb, 0xc1d5c48f, 0x8dd1cb4b, 0x7169438a,
  48593. 0x02a92c77, 0x91cad8ce, 0x7965c0b0, 0x32cd08d2, 0x0c5798ab,
  48594. 0xa6902bda, 0x1a5bc3c3, 0x5186d218, 0x545d0925, 0xd27e64db,
  48595. 0xf0077cdb, 0x8cd092da, 0x0157caa4, 0x24532ab3, 0x2a2fa3a0,
  48596. 0x41ccaba3, 0xa5fb639b, 0x4744aee6, 0x01702dc1, 0xcdba93da,
  48597. 0x485bb436, 0x329784f1, 0x93597f66, 0xdad672c3, 0x5d713c1d,
  48598. 0x030b7245, 0x366d222e },
  48599. { 0x573ea5b2, 0xd50b4875, 0xa90da44d, 0x0fce401b, 0x7a1a0310,
  48600. 0x7b53fa65, 0xcf114460, 0x722a80a5, 0xa538bf49, 0x0b8ebf05,
  48601. 0xd32acd21, 0xae141147, 0x7b5ad07d, 0x6692712c, 0x3f48ca07,
  48602. 0x6dc5fee7, 0x2b8a78d8, 0x98ed1499, 0xdd2f1759, 0x4e8b3145,
  48603. 0x5f971b8e, 0x43408de1, 0xadf1b368, 0x055ea6dd, 0xe5932b7e,
  48604. 0x4bb76e73, 0xd30893fd, 0x44287153, 0x0661bfda, 0x173dccd2,
  48605. 0x79defd25, 0x9072ba99 },
  48606. { 0x9620ea39, 0x474de4dd, 0xc831cee8, 0xfbf1649f, 0xcd3a9c43,
  48607. 0x0b0e8bb1, 0x3f3df1d5, 0x6a38286f, 0x8f0ec9b3, 0x4ed072b3,
  48608. 0x729c09e3, 0xa6e4c987, 0x8ad12242, 0xea3e8ac6, 0xfbdfa5ba,
  48609. 0x6ae0e22b, 0xb0a0f592, 0x56171ecf, 0x6b871f8d, 0x33b2886d,
  48610. 0x35e11bda, 0x6b19bea9, 0x7f0f153f, 0x4d815a40, 0x7d6c02ee,
  48611. 0x7e608d97, 0xb6a88f46, 0x7e8f23d9, 0x439d1654, 0x26ac9652,
  48612. 0x35546c29, 0x8d92c6bd },
  48613. { 0xabeb0ff7, 0xb3e0d7ce, 0x3e0e42f8, 0xfbe35254, 0xde808499,
  48614. 0x57d1b226, 0x1cd44bc3, 0x9ece2e1f, 0x435cfee1, 0x1245adbc,
  48615. 0xf93f581c, 0x874ee840, 0xbda0b947, 0x916a779c, 0xfa57ae0a,
  48616. 0xabcc815a, 0xf0a621b0, 0x97adec2d, 0x81f90bdc, 0xbe6a502b,
  48617. 0x53bde63d, 0x54bf9de1, 0x78884c25, 0xa88fdabf, 0xcbbb5470,
  48618. 0x30aa52b1, 0x29053ef5, 0xf805396c, 0x8dd827ea, 0x8d43d898,
  48619. 0x5c1ae5c0, 0x4e4bec17 },
  48620. { 0xfcc09676, 0xbf8483a2, 0x19ea9a94, 0x457c4a3f, 0xd702a5dd,
  48621. 0xa6852ef3, 0x843fe7d8, 0xe7915fd2, 0x16e35158, 0x644bba98,
  48622. 0x9ed746f0, 0x8d1b95d0, 0xb90af0b5, 0x47704581, 0xd4fd135e,
  48623. 0x0bd4bc6b, 0xb4e833a5, 0xa6dce067, 0xff56a9a1, 0x2c0e8f30,
  48624. 0xec2c63fe, 0xa9c80800, 0x98f508a8, 0x449c20a5, 0x3292813a,
  48625. 0x02b94cb3, 0xec7e81a2, 0x647e3d28, 0xb4877677, 0x72e67d1a,
  48626. 0x6f9ded24, 0x7a4aa3f5 },
  48627. { 0xe27a0045, 0x559ef1ba, 0xb242cb50, 0xdc812d4f, 0x39cf8d24,
  48628. 0x23a478e4, 0x9b3f9c54, 0x97544fc5, 0xaffa1fcf, 0x5ac68132,
  48629. 0x34a2c83b, 0x74f8fee0, 0xcd3f4bb7, 0x96cc640f, 0xb0512ea6,
  48630. 0x775dce9d, 0xcdce381e, 0x67dca19d, 0xa9d3fe55, 0xc1eeb3f3,
  48631. 0x1a19274f, 0x38e0bf42, 0x28d69b12, 0x15992fb4, 0x9fd09df8,
  48632. 0x48fcebde, 0xb41ab5df, 0xdc9dfa4f, 0xc0a269c5, 0x0cbd7dc8,
  48633. 0xf7f0ade1, 0x60282a7b },
  48634. { 0xdceea2e7, 0x7c07e538, 0x3c42061d, 0x38a322c8, 0x4f1f6516,
  48635. 0x676828f9, 0xc7776a10, 0xf21b69fb, 0xb5e6b405, 0xc63a3417,
  48636. 0x91a7b642, 0x4c99f258, 0x2cad1440, 0x38692ca8, 0x00869bcd,
  48637. 0xf1e82ffe, 0x16fe466a, 0xc30b714e, 0x19019138, 0x5fb742f9,
  48638. 0x0fa516ae, 0xe90166d0, 0xd8c73a43, 0x5550f7ac, 0xfbc5c372,
  48639. 0x2d6a407d, 0x68cc39ed, 0xe47a7539, 0x4a5fbe70, 0x3fd286d9,
  48640. 0x23c6b942, 0x5f4ae9c7 },
  48641. { 0x53f4d561, 0xd96a2dda, 0x16da1992, 0x286d45d0, 0xfdd4b051,
  48642. 0x449a01fb, 0x9f2195ea, 0x25488a0d, 0xa37661b3, 0xc4151b0a,
  48643. 0xf9e5ee02, 0xb98c471e, 0xa8658817, 0xa4bca86e, 0x7a68fc0a,
  48644. 0xbbcadb87, 0x6b7366a9, 0x88b34649, 0x15661c2d, 0x32ee98d4,
  48645. 0xc901420c, 0xf5b3b4c6, 0x2f2752af, 0xa2352735, 0x510e4d9c,
  48646. 0x2f64ce73, 0xaca4aa80, 0x939a7f26, 0x401aa503, 0x9cd3e291,
  48647. 0xdc46afd2, 0x92a01423 },
  48648. { 0x1c2f7dbd, 0xe9f24be1, 0xb7d527fa, 0xda8c900f, 0x8648f128,
  48649. 0x963e25bb, 0x48141941, 0x9ab713e2, 0x7a6756fb, 0xe87f7d01,
  48650. 0x058d90bd, 0x274dd85e, 0x82566abd, 0x823fee7a, 0x74240195,
  48651. 0x9f6230d7, 0xacb5e46e, 0x04579f2c, 0x16a4c87e, 0x2a226263,
  48652. 0xd99b0857, 0x9ca19a43, 0xe488789e, 0x86dc2ba3, 0x9406c3bd,
  48653. 0xf960b5b9, 0x8960957e, 0x6f2c428b, 0x161c515b, 0x90748706,
  48654. 0xaa88cb9b, 0x0fc8fe1e },
  48655. { 0xfeb90f2d, 0x68ae1bed, 0xa48b1559, 0xf393bb3c, 0xf64e9635,
  48656. 0x2be62f9c, 0xf8be75c2, 0x354c2410, 0x5e6f7529, 0xbd7ea703,
  48657. 0x162cab31, 0xc264868e, 0xc860f3ff, 0xb1391e70, 0x1d89837e,
  48658. 0xdf367c75, 0x2bf32941, 0xe150b6b4, 0x78c1318f, 0x95e8f46e,
  48659. 0xa2c4b160, 0x2b3f1dab, 0x701afbf3, 0xc6ccf5ce, 0x5e8874c5,
  48660. 0x3ad27530, 0x5dc6dcbe, 0x39285e51, 0xd99892dd, 0x3c954d86,
  48661. 0xdfd3789f, 0x2d0ba862 },
  48662. { 0xb472e1af, 0xeacd8ee8, 0xb76abbcc, 0xeb354eae, 0xd0d93fbd,
  48663. 0x9b520bf8, 0xfe6fc706, 0xfccd60d7, 0xa4ee2f39, 0xa9353dde,
  48664. 0x9a81e51e, 0x5eb0925e, 0xd1366777, 0xee334da1, 0xd5354d69,
  48665. 0xc1d28c9f, 0x92a5ed54, 0xb9771755, 0xb7f70d81, 0x5d3e367f,
  48666. 0xa933ae7a, 0x7be7eeca, 0xe23cfbb7, 0x264cf1f9, 0x89497681,
  48667. 0x0d129f4a, 0x09b6235b, 0x705375a4, 0x48a376da, 0xccf64c75,
  48668. 0x4d41dbfc, 0x963c8712 },
  48669. { 0xde36a814, 0xbae290cb, 0x733b12b5, 0x9bdb0195, 0xf77fe0e1,
  48670. 0x0ebad867, 0x29720cea, 0x0a7d19fd, 0x9029ec72, 0x434d7651,
  48671. 0xbb51911e, 0x856aff17, 0xd80a7f60, 0xd0a25d9a, 0xf848c106,
  48672. 0xffca86af, 0x43ad749c, 0x53e8bdf9, 0xe3e696bb, 0xfb9e0284,
  48673. 0xeeee4215, 0x3eb6630a, 0x2ecf3c63, 0x9d8fbb9e, 0x4e00c0c0,
  48674. 0x71da4ffa, 0x5d57beac, 0xb296be59, 0xa8cec7ef, 0x1751fbad,
  48675. 0xff55d7bd, 0x2d03eb3c },
  48676. { 0x04f2ec1d, 0xeb16925f, 0x0d147ee2, 0xa878f276, 0xaad9d9e0,
  48677. 0x442df604, 0x3f71035b, 0x891df44b, 0x8cb95d5b, 0xc28272b3,
  48678. 0x5ee8ed23, 0x6f14efb5, 0x13b0f3e3, 0xf3c4460f, 0x6bd7335e,
  48679. 0x889f9bd7, 0xf755ba6e, 0x889ee771, 0xed219b6c, 0x626984fe,
  48680. 0xec2ee411, 0x2d44c737, 0x63efcd37, 0xb94385a2, 0x6637826b,
  48681. 0xd909321b, 0x3ee6b7a7, 0xc24f8a79, 0xa7cf61b7, 0xa3ca8d24,
  48682. 0xc54bacd9, 0x842e40c1 },
  48683. { 0xa661d843, 0x5a268ed6, 0x4f5b30cd, 0x02328cca, 0x1311e177,
  48684. 0x16e6fed1, 0xc6695967, 0x690decb4, 0x57b2e280, 0xbdac5bf6,
  48685. 0x1efe42d0, 0x827f82ca, 0xca5fca2f, 0xc554ec0a, 0xdde45506,
  48686. 0xac5276c1, 0xe3077513, 0xb7f4cb08, 0xcc8797cc, 0x8caf6d9a,
  48687. 0x0d9332d2, 0xd5964814, 0x285a409f, 0xcc6ae297, 0x6223d093,
  48688. 0x7773c2a5, 0x5128fc09, 0x2d5266ac, 0xbc31fe6c, 0xa596b7cb,
  48689. 0xcac91328, 0x0e63319a },
  48690. { 0xf0360ac2, 0xb5cd2fad, 0x285e605a, 0x86b660de, 0xe25b9b14,
  48691. 0x82c6cf10, 0xaa9ac554, 0x9d5fa38d, 0x526c070e, 0x3dfcf1b8,
  48692. 0x3fccc52d, 0x0379a96b, 0x0bfcc7f5, 0xe3659c29, 0x69d3e6a1,
  48693. 0x5b1a3db5, 0x9b7b42d5, 0xb41528b5, 0x9c22a006, 0x934defa4,
  48694. 0x9b4ce3b6, 0x90f38018, 0xb3abaf32, 0xb073bc04, 0xff8389e2,
  48695. 0x27a5a222, 0xffa5a35b, 0x0b7a9d51, 0x28e1a7c2, 0x4939ecef,
  48696. 0x1872705a, 0x88839da2 },
  48697. { 0x701ce29a, 0x56b66c30, 0x58981d50, 0x3acaf126, 0x105f9f21,
  48698. 0xd4dafc0c, 0x373e3d13, 0xfee571e6, 0xfa2ee3ca, 0xe7269c86,
  48699. 0xdd20385a, 0xf5cca64a, 0x3000e9ac, 0x217f2757, 0x0e7273ef,
  48700. 0xc934db47, 0x355b6776, 0x4294f4f7, 0x6fc05180, 0x1faa36b9,
  48701. 0xb052190b, 0x8f88b1db, 0xe9eaef52, 0x35791b90, 0xdb681b90,
  48702. 0xf37fb2eb, 0x4415c369, 0x39d0a51d, 0x1d2e21c9, 0xfc59cca7,
  48703. 0xa1f50c26, 0x64128cfe },
  48704. { 0xe8f5b0b5, 0xf03678a2, 0xd340f059, 0x5c7e249c, 0x93ca7cec,
  48705. 0x41440441, 0xbc83af98, 0x075ca346, 0xfaa8bbb0, 0xf39f0033,
  48706. 0xf38230f7, 0x3d18f0ed, 0xd448f345, 0x78dff00c, 0xd51aa475,
  48707. 0x849228c0, 0x30c928d1, 0xdd4e2708, 0x8f12cfd3, 0xc66ba686,
  48708. 0x88b3a206, 0x091049db, 0x016dae01, 0xd865d059, 0xe253e37d,
  48709. 0x4599e905, 0x7ce9871b, 0x322cf0c2, 0x174a132e, 0x014f54da,
  48710. 0xbdabcbda, 0x93634a09 },
  48711. { 0xa9a2e304, 0x62826b27, 0xc1a4c124, 0xc57e1866, 0x22381710,
  48712. 0x913ab832, 0xa9847cfe, 0x7e9b6b85, 0x2b5f46fd, 0x29655cf1,
  48713. 0x8038e66d, 0x7295572b, 0x6fa95eab, 0xe4cba601, 0xb9deda81,
  48714. 0xbbc11071, 0x3f1cf61e, 0x97f0009a, 0x373e0cfb, 0x5372777b,
  48715. 0xd139d63b, 0x302f909c, 0x4f87d78e, 0x1ed672da, 0xb4048763,
  48716. 0x362077a3, 0x9dcc22b2, 0xc408c32d, 0x26deeee7, 0x4b4c5bf2,
  48717. 0xbc06357e, 0x266cb467 },
  48718. { 0xb56363e8, 0x6faa4154, 0x3c1aa4db, 0x4b4fd078, 0x2b9e6597,
  48719. 0x14358dde, 0xfa004b84, 0x5b34ae3e, 0xf19911a6, 0xcf44b2ec,
  48720. 0xa536bf78, 0x55caa833, 0x8870dc95, 0x606e1eb9, 0x09f3511d,
  48721. 0xe3c3287d, 0x9d5cf364, 0x68b2f4eb, 0x63ab8c9e, 0xc154e892,
  48722. 0xc36ab611, 0x1548828e, 0xa1b7d120, 0x0932bfcb, 0x5315b8d7,
  48723. 0x7ee7b5bc, 0xf7473ac1, 0x782fd0d1, 0x3c8f2af3, 0xbcb029a8,
  48724. 0x52454ee1, 0x4b1d5a1b },
  48725. { 0x63d52c0c, 0x12fe5174, 0x188c099d, 0x3735525e, 0x360e3956,
  48726. 0x5c621563, 0xacfa5a43, 0x88b3f1ca, 0x797e8107, 0x90123a0a,
  48727. 0xb15e080a, 0xba31f6b5, 0xfca3dada, 0xd7de5e12, 0x0df511c8,
  48728. 0x3287361b, 0x65757d4e, 0x7cc800d4, 0x5207ec91, 0x10810f3d,
  48729. 0x30eea0e3, 0x0d4e56f1, 0x3ea5a2ec, 0xbbf7ee13, 0xbe6abbd0,
  48730. 0x6fc07762, 0x120bf619, 0xc831fdce, 0xb622d42a, 0xe07439fa,
  48731. 0x508e4b27, 0x8186b93f },
  48732. { 0x09312867, 0xc619d154, 0xbfaf7db4, 0x7e042c05, 0x1f5f5dda,
  48733. 0xc1cf1668, 0xa4fc3d82, 0x50aa5057, 0xce68b8fe, 0xed30ed65,
  48734. 0xbeb4d644, 0xecb01c0b, 0x831c0497, 0x7b5dc444, 0x9b7d9b1c,
  48735. 0x351e6a00, 0xd9477c91, 0x4bb863b9, 0x05d4110a, 0xaba65891,
  48736. 0x43580b7a, 0x30086cf4, 0x90be357e, 0xb139c076, 0x27b5214e,
  48737. 0x12bfff1a, 0x22c3ab57, 0x79cfc6d7, 0xf34a9bfa, 0x4743de57,
  48738. 0xc9ee2b2a, 0x0bf97e97 },
  48739. { 0xdda19e96, 0x96ec4ec8, 0x6c306e8b, 0x54ce18ea, 0x65f6918a,
  48740. 0x7e83612b, 0x0d9a0d99, 0x1ac6f68b, 0x62fdcc09, 0x98a697a4,
  48741. 0x95bc3e13, 0x65ce25f1, 0xb3939730, 0x1896ecda, 0x32f12806,
  48742. 0x9eb81a0f, 0x1d2dc7df, 0xd3d7416e, 0xad473599, 0xe22c7976,
  48743. 0x9f5ef439, 0x3de37a9a, 0x9e69d94e, 0x6b7ac0ab, 0x0a9d0bc8,
  48744. 0xe6bfa9e0, 0x5676f120, 0x576a870d, 0xfeaac23f, 0x3bd91bb4,
  48745. 0x3e40aabb, 0x8fe5482c },
  48746. { 0xce9a4d1e, 0x85ae67c2, 0x4f1d2038, 0x4c3eb803, 0x25d06192,
  48747. 0x5c6c8f3a, 0x308fb41c, 0x803de0ad, 0xe71c294e, 0x9961f5bc,
  48748. 0xf02eb0da, 0xdc62078d, 0xb64ae8b6, 0xc87ef515, 0x50b4d18f,
  48749. 0x69679f1e, 0x52199f43, 0xc5c009a1, 0x0f640a5f, 0xa7d484be,
  48750. 0x23dab566, 0x4c918bb1, 0x64275d2c, 0xa67c114c, 0xcad2ded6,
  48751. 0x95a913b9, 0x6b4b5c8d, 0x189ed18b, 0xb42d3bf6, 0x4aeb6206,
  48752. 0xbbc8bc3f, 0x3928c669 },
  48753. { 0xdacb4b64, 0xde4bea4a, 0xf26179a1, 0x03f62a44, 0x7a9112a4,
  48754. 0xf3aac94e, 0xd36f331e, 0x90448fbd, 0x407b85c4, 0x426042bc,
  48755. 0x2121b77b, 0x5ad8a596, 0x67cee984, 0x31674a4f, 0x4e3b2f0d,
  48756. 0x7fae8bbe, 0xa7c930eb, 0x681df6dd, 0xc259d0d4, 0xadeefa98,
  48757. 0xbea1c1fd, 0x1b14d9e6, 0x21d405d1, 0x3baadc8b, 0x73892754,
  48758. 0xf01dff93, 0xf071cde4, 0x81c35b3e, 0x9150d0d9, 0x1704d2e1,
  48759. 0x355134f6, 0x6ccc888f },
  48760. { 0x7ad7504c, 0xf8d36f0e, 0xf7959ddd, 0xbca3265f, 0xfede67aa,
  48761. 0x0dcd1ede, 0xbaebf32f, 0x1276f4ce, 0x014edcfc, 0x6825a6e6,
  48762. 0x99ad8eb7, 0x0b8c1a82, 0x09b8ce1e, 0x312024a9, 0x9cbd351a,
  48763. 0xcb8fd98b, 0xfab1e8be, 0xa4841378, 0x3973cacf, 0x17ed0f5d,
  48764. 0x259d5254, 0xa17e1484, 0x74b91393, 0x53d5b843, 0x1aca3ce9,
  48765. 0x8f792b21, 0xc8c0f815, 0x035ff110, 0xad4ed7bd, 0x6afa6357,
  48766. 0xb26faef9, 0x2f151980 },
  48767. { 0x29d2d439, 0x0c8631da, 0xbc039955, 0x121fbbc2, 0x6c05b75b,
  48768. 0x3e5a9792, 0xb6ce47ec, 0x6d6cf4c0, 0x9d88c658, 0xbaaa1767,
  48769. 0xf3355a17, 0x031db9e7, 0x0aef5a85, 0x8381e3d8, 0x15a31bdf,
  48770. 0xc71db290, 0x9498fd7d, 0x638f6b74, 0x13beeef6, 0x44edf3f9,
  48771. 0xf4ab67b3, 0xe6173271, 0xfd22df11, 0x3a202c70, 0x205c4e92,
  48772. 0xf7be0389, 0xa8eb9920, 0x1c219085, 0xbeb54aaa, 0x6c805ce8,
  48773. 0x0ac58d65, 0x354b05b7 },
  48774. { 0x7a9170e9, 0x7171e236, 0x4cad50cd, 0x01eec42d, 0x3cddccfb,
  48775. 0xffbe824f, 0xa66cae1a, 0xa73e8ce3, 0x965c7d01, 0xb7138a7f,
  48776. 0x5c3d971e, 0x00058e3f, 0x2ff0a72b, 0x52591ac3, 0xbbbce76f,
  48777. 0xa32fb5bc, 0xa9f81a18, 0xf3241ab8, 0xeca68630, 0xf31d3332,
  48778. 0x4482f13b, 0x847af9fc, 0xa4681be2, 0x6196e217, 0xe55efcf9,
  48779. 0x9938f932, 0x70acc705, 0x3e7dacb8, 0xcf09fac2, 0xd41be893,
  48780. 0xae3523a1, 0x48dc55c4 },
  48781. { 0xa5092193, 0x8e623826, 0x6898970c, 0xe46ec362, 0x25c9eb41,
  48782. 0x2f1356af, 0x83c7d245, 0x41780640, 0x97d00e38, 0x982def67,
  48783. 0xa512151c, 0x382eb6e7, 0x8af58869, 0x154e1077, 0x8a51cf02,
  48784. 0x18707075, 0x71313c58, 0xcdeba9f7, 0xba155904, 0x5d67b973,
  48785. 0x1d0d7b3a, 0x851c9f4b, 0x8b8af2cd, 0x19f29d71, 0x986b8d62,
  48786. 0xcb94ccff, 0xb93b9c33, 0x8725e24b, 0x66e38c68, 0x405ce4c5,
  48787. 0x0b6dc021, 0x5f6a8edd },
  48788. { 0x8f9a8690, 0x83704ca5, 0x2f76a407, 0x3f369766, 0x69201028,
  48789. 0xfbc12d8c, 0xbce3a4cf, 0x4cd58f16, 0x04aab26d, 0x7804664a,
  48790. 0x4ea457a8, 0x005cfbba, 0xb8a59794, 0x537951b3, 0x4fe1f739,
  48791. 0x4ca2b9e4, 0xdf325797, 0xe4428acd, 0x0ea243db, 0x648da342,
  48792. 0xf43ce01e, 0xcce6562b, 0xf27db490, 0x840f0421, 0x8bfb7cf0,
  48793. 0x156ccb70, 0x5a8797d3, 0x9b33480d, 0x9eb814bb, 0x2e12e07a,
  48794. 0xca7f87ac, 0x1ca65072 },
  48795. { 0x2b9d25a0, 0xfbb321cf, 0x40a746db, 0x66affdca, 0x59e368b5,
  48796. 0xc1c1530e, 0x7d80068f, 0x56ed1ea4, 0x5647dd68, 0x9b74d8fe,
  48797. 0x89b78da8, 0x1d96b507, 0x8bbe3391, 0x39b75243, 0x0d858c5f,
  48798. 0xef8d443e, 0x9646aa34, 0x4dd2db49, 0xe667543c, 0x7fad3bd1,
  48799. 0x68980985, 0xd0d710c0, 0x49facaba, 0x9f7aff32, 0x14f9a192,
  48800. 0x055dec1c, 0x1fb307a1, 0xaca66399, 0x35ffff64, 0xac44fd91,
  48801. 0xcbad3cee, 0x462cafb6 },
  48802. { 0xde3237dd, 0x1660a647, 0x82b87404, 0x95f735cc, 0xddfa55f8,
  48803. 0xf7879f59, 0x726b914a, 0x15ef043e, 0x1c93e298, 0x1875393d,
  48804. 0x6ef18331, 0xa1a2be74, 0x25a9a12b, 0x4e7e8dfc, 0xa9c3917f,
  48805. 0xdfefc97d, 0x0a2ebe41, 0xbc875d03, 0xa732d1cc, 0x0f75d235,
  48806. 0xd9baa6d3, 0x06fee7fe, 0x65f48576, 0xaa784fab, 0x513f83c0,
  48807. 0x23155e22, 0x3e8f9d13, 0xd2fb7718, 0xb546eafd, 0x2a291503,
  48808. 0x6cd93608, 0x1293c98c },
  48809. { 0x49d53b77, 0x72781251, 0x96eafac7, 0xa6ab403d, 0x4a36b711,
  48810. 0xb7d7c7db, 0x87e771c1, 0x8238c708, 0x33b37522, 0x495f6abf,
  48811. 0x8c87530d, 0xb0b0289c, 0xe77b111a, 0xca83cb86, 0xa1bd189e,
  48812. 0xbe1c0fb8, 0x1ae9d7c7, 0x58cfb2fb, 0x4940c3e8, 0xd05c23c5,
  48813. 0x74ad9107, 0x16e79e41, 0x064e7142, 0xa0a47f05, 0xfdfd614f,
  48814. 0xc6929cd4, 0x3946988b, 0xedb2584c, 0xe46f8fb1, 0x73e4b5f3,
  48815. 0x68ea94ba, 0x53b79aa1 },
  48816. { 0x44bbb6a1, 0x216fafce, 0x67821728, 0xd3a5bba0, 0xa9dd939a,
  48817. 0xef1e4b30, 0xf19efafe, 0x022eaf3d, 0x7b4ec014, 0xfed5abce,
  48818. 0x512c6738, 0x64968ee6, 0x29fe89a2, 0x23119869, 0x47397c05,
  48819. 0x0d539d8d, 0x234596c4, 0x6400bc54, 0x5346611d, 0xb9287f58,
  48820. 0xc9d5da0f, 0x04099903, 0xc83af2a8, 0xe5ef4997, 0x328151e1,
  48821. 0xc89dc01b, 0x58401104, 0x150fb4a9, 0xf3872c9d, 0x40a6f7d5,
  48822. 0x56c2e833, 0x8290d6d1 },
  48823. { 0xd8546946, 0xf84637c6, 0x69ec57fa, 0xda134a39, 0xd789007e,
  48824. 0xd42359a4, 0x0dc7b809, 0xb42557fe, 0x2d6784a9, 0xe62ae52d,
  48825. 0x0bcadb5f, 0xa2714ca6, 0x33aafca5, 0xcc208de6, 0xed967811,
  48826. 0x2380ed5c, 0xdb321660, 0x6e6b55e9, 0xa675235a, 0x1bead02c,
  48827. 0xb33fa0e1, 0x51cc6ef9, 0xf06a2a08, 0xfd223e26, 0xec47b3cf,
  48828. 0x00f332e1, 0xa0aa984e, 0x459f297b, 0xee952e14, 0x6fa1d969,
  48829. 0x304fabb0, 0x506ef1ab },
  48830. { 0x35bff163, 0x11b4eb27, 0xea9fa984, 0x7130b96f, 0x9deb27ce,
  48831. 0x66aceb3f, 0x9dd1c3d5, 0xa2daf1a5, 0xa73075aa, 0xf5090a7e,
  48832. 0xe3071b58, 0x36a6af39, 0xdf73ad9c, 0xa28d633d, 0xbdc89a16,
  48833. 0xdd354cac, 0xd4dcbc3c, 0xdfea3423, 0x379d92d1, 0x6eec74d2,
  48834. 0x8eed6765, 0xe14a456f, 0xfa8feb1f, 0xfabe7743, 0xb98fcbc7,
  48835. 0x1404ccf8, 0xf71a706e, 0x6ccd2fbf, 0x4d85c678, 0xdaaf3fdb,
  48836. 0x15200344, 0x415b7dbf },
  48837. { 0x7d8377a7, 0x97010586, 0xcb803272, 0x068a3d68, 0xf03a4c32,
  48838. 0xfd67d289, 0x93c8f290, 0x4bc7095d, 0xe9e5a2b8, 0x712fa13c,
  48839. 0x0feb9f3b, 0xfc6ac6c6, 0x6e0e54c2, 0x0cda36d9, 0x86320a01,
  48840. 0x45499751, 0x97f00f11, 0xf9318c91, 0xe6936508, 0x01dc4c3f,
  48841. 0x85f068aa, 0x769a2ef9, 0xa2b5511c, 0x3522cef0, 0xb4122e05,
  48842. 0x006965ed, 0xc175d43f, 0xfce0fafc, 0xec831d59, 0x525dc9bd,
  48843. 0xaf58879d, 0x1ec314f1 },
  48844. { 0x2c8310c2, 0x0663feef, 0x457e3f74, 0xaa7e14da, 0xe5346887,
  48845. 0x392b10fc, 0x637ec2c5, 0xcde4a38f, 0xb542f8df, 0x50773320,
  48846. 0xf7de1711, 0x341302f9, 0xae4b9bc6, 0x018b1c63, 0xdd2f9e6f,
  48847. 0xf001c46e, 0x26eccfa0, 0xd3bb0a97, 0x7746e0c7, 0xa931b99d,
  48848. 0xf5875aec, 0xe0c8b6f7, 0x96939c82, 0xbb32f17c, 0x3de5a664,
  48849. 0x765135d2, 0x52abfa6b, 0x71936cb4, 0x2dc105de, 0xad5cc08f,
  48850. 0x7fff5788, 0x17e91d12 },
  48851. { 0xb7e051ca, 0xbe92ced3, 0x19c776d4, 0xc644d4fd, 0x0086784b,
  48852. 0xc8ab4b52, 0xce9d6b31, 0x3ea66227, 0xd289e9c7, 0x395249a3,
  48853. 0xd12a19ee, 0x54509e65, 0x8c365aec, 0xa7bd4692, 0x77963e0e,
  48854. 0x354997e4, 0xb599732d, 0x0d765957, 0x91d4a3b6, 0x99584aeb,
  48855. 0x1deb3e28, 0x6e653ea4, 0x572571df, 0xca7c98ed, 0xb18ae1f9,
  48856. 0xf301a38f, 0x63f7b97e, 0x1629f7c2, 0xafc4a0d5, 0xdf242282,
  48857. 0x3ddd0c01, 0x118f3b4b },
  48858. { 0x7ad4762b, 0x74a0a0a8, 0x8c58d175, 0x1aef84da, 0x4cf76d86,
  48859. 0x16ff4960, 0x7e60d98b, 0xc0be8786, 0x3ecc1dba, 0x83637ffb,
  48860. 0x5dd6147a, 0xc244a609, 0x5b0846e5, 0xa3e17834, 0xe77a4c05,
  48861. 0x735eb686, 0xdf758695, 0x5bc18b4f, 0x1bdfe52f, 0x15618d0b,
  48862. 0x00715ba1, 0x878ecc0d, 0xc2dd617f, 0x1dbdbd1a, 0x21b61710,
  48863. 0x21d2b631, 0x44f593c2, 0x22ce8a79, 0x44f17024, 0x3b9b536a,
  48864. 0x8d03e727, 0x01d0a67c },
  48865. { 0x1e46533c, 0x7b964236, 0xfb88c2ae, 0xe9477990, 0xa42c4a18,
  48866. 0x019b5d16, 0xd83c7a45, 0x7135e81d, 0x4cb663e3, 0x74a69bdd,
  48867. 0xe76c0d63, 0x7b67ecdb, 0x11e68da6, 0x03d54521, 0xd2e8650a,
  48868. 0x596cceb5, 0x2af03b37, 0xcd572dfd, 0xfabd5952, 0x52364ba1,
  48869. 0xb4ed8569, 0x7f47d456, 0xc950d5d4, 0x5ad8b572, 0x486e2f84,
  48870. 0xcadd2dfa, 0xc56bb044, 0xdd527b43, 0x997c08e6, 0xc9adba24,
  48871. 0x7da6320f, 0x1b625b06 },
  48872. { 0x4fd8446d, 0x44dfaa7b, 0xaf6febeb, 0xc01b2f01, 0xfe8838b5,
  48873. 0xbf444388, 0xbba9758b, 0xf33c434f, 0x87156bc9, 0x2b971cba,
  48874. 0x1f49098b, 0x6b245e5c, 0x2b41c5dd, 0x87dcb534, 0x34d852d7,
  48875. 0xdb1f80c6, 0x2433da34, 0x6d6e3258, 0x3f7df0c2, 0xf6682065,
  48876. 0x360cb365, 0xc4ca567c, 0x9826656a, 0x321faac2, 0xbf069768,
  48877. 0x13f5ca6f, 0xa7076639, 0x15397921, 0x8400736e, 0xbdf14328,
  48878. 0x19fc948d, 0x333eca96 },
  48879. { 0xac775d81, 0x23337948, 0xd41dbbca, 0x38c2518f, 0xbcfce948,
  48880. 0x623c7a4f, 0x54703fe7, 0xaad36236, 0x13fb3b5b, 0x2b3a13a4,
  48881. 0x7f5c01f0, 0x5db3565a, 0x52359661, 0xd72408dc, 0x1d616e91,
  48882. 0x5a17f8e5, 0xcb25b999, 0x90c16eeb, 0x3393743e, 0xf35e8cf1,
  48883. 0xe54b64a7, 0x987da74a, 0x65cd449d, 0x557b322a, 0x37e7b15d,
  48884. 0x765082a5, 0xf2cd134f, 0x4d25c742, 0x4ccf0746, 0xae9d9c07,
  48885. 0x8728d135, 0x72fc2110 },
  48886. { 0xf96004c8, 0xa906b203, 0x458055ff, 0xd83f95cf, 0x55f35909,
  48887. 0xd77d5867, 0xe550c8ee, 0x4a9ea6fb, 0x55a06081, 0x91c8cca9,
  48888. 0xbce82062, 0x4a1fee78, 0x9a3df85e, 0xeb9ade06, 0x7d3de666,
  48889. 0xfbbdcf0c, 0x5d336d51, 0x228a391b, 0x5c2ffc3c, 0x760f8d28,
  48890. 0x2f7b165b, 0x1ee48de3, 0x56177040, 0x03803d84, 0x9deff9a0,
  48891. 0xe573f648, 0xa17e35a4, 0xe1a2738e, 0x8840a6c6, 0x238ef17c,
  48892. 0xb11ed92d, 0x480946f8 },
  48893. { 0xfd71f119, 0x84c747a8, 0x53eb3695, 0x19e65c5e, 0x6298587a,
  48894. 0x0e2f6786, 0xab18d6f4, 0x48a48899, 0xc630b8c0, 0xa1a99024,
  48895. 0x2caaf892, 0x84975096, 0xe20fd624, 0xc8869aba, 0x6c2b7dd4,
  48896. 0x3b72b04d, 0x0992f7d0, 0xe2775eb6, 0x7d06e684, 0x0089c06e,
  48897. 0xe4bbd007, 0xcb3b4361, 0x4ba846e4, 0xa1ae666b, 0x46464d9e,
  48898. 0xc01c2eb2, 0xc1f8539f, 0xf86f2be6, 0xcf68afc7, 0x16e8e8ae,
  48899. 0xc7386902, 0x8dab61fd },
  48900. { 0xd54d1d45, 0x42a5c903, 0xff4f9ba2, 0xacd4297e, 0x34d478b4,
  48901. 0x2d88b520, 0x08c4621a, 0x35b2ba2b, 0x34865402, 0xd3d239bb,
  48902. 0x911f32e6, 0x1de76aed, 0x3f06fdc2, 0x877f8bcf, 0x9ec51502,
  48903. 0x802714c1, 0xa590700d, 0xa10444eb, 0x31dcc957, 0x8694229f,
  48904. 0xb8169fed, 0x5ece77ab, 0x2caf080e, 0x55be8a15, 0xcbd7cef1,
  48905. 0x3eb21b14, 0x67b97ee1, 0x9def7ad1, 0x118f690c, 0xe03ca879,
  48906. 0xf99b29e7, 0x6f77e62d },
  48907. { 0xe40bbf59, 0xa271bded, 0x6401aad6, 0x177ba453, 0x73541cd1,
  48908. 0x1755e035, 0x4b71b02f, 0x3465b466, 0xa813359f, 0x22eb7113,
  48909. 0x6f38eac7, 0x9792a8fd, 0xff3bf3b5, 0x11aa012f, 0xf85c3fbf,
  48910. 0x99aafabf, 0x06c0cc42, 0x91e0a2ef, 0x773b7b3a, 0x314d5d57,
  48911. 0xd669840a, 0xae5e2e76, 0x2e5a8be6, 0x86136073, 0xc1cf5580,
  48912. 0xee6d7578, 0x68bed102, 0x2344e00f, 0x8184f0eb, 0x799d7886,
  48913. 0xc3d2cf80, 0x63819c91 },
  48914. { 0x7884b073, 0xca5392e1, 0xeb1267ea, 0x9ec3a1fc, 0x907038a7,
  48915. 0x3d07f5f0, 0xe4c47b70, 0xcb2ac07c, 0x1bf96b91, 0xf96664ee,
  48916. 0x2aea4fbf, 0xebf57589, 0xfade6500, 0x5aabf391, 0x171d1204,
  48917. 0xc5b3376f, 0xa0d3d81a, 0x1ff60c51, 0x976a844b, 0x10b2cfe7,
  48918. 0xbda6125a, 0xe131cc9a, 0x4ebd453e, 0xe0fc16d3, 0x504b6bc1,
  48919. 0xc0d0319a, 0x0a2f8cab, 0xe43a0be7, 0x55e49b47, 0xc80afeec,
  48920. 0x8265d7ee, 0x67d48d12 },
  48921. { 0xea2d56d6, 0x068d59a7, 0x27480a63, 0xd71abd0e, 0xae7366cd,
  48922. 0x6bd11db0, 0x07204ebc, 0xfbb639ca, 0xf77e6293, 0x89a242e7,
  48923. 0x75ba8c3d, 0xdee7ca2b, 0x64a2f9a8, 0x472ddc3d, 0x7561a010,
  48924. 0x84229df4, 0xc5b649d4, 0x95f62c85, 0x4dc927cd, 0xfdd56b1b,
  48925. 0x5ee60596, 0xfe8bb120, 0xabf29401, 0x3efcaa50, 0x10d1c184,
  48926. 0xd4900d0f, 0x28b01df5, 0x2cf113a9, 0x1f0e43f5, 0xa3d7ebc3,
  48927. 0xe8384dc7, 0x27950e38 },
  48928. { 0xe1d0fa79, 0xeab21ff0, 0x048b5de9, 0x4b9fd033, 0x2fe374cb,
  48929. 0x4c934689, 0x4eb21f6b, 0xbb4827fa, 0xa925e7e7, 0x46716f79,
  48930. 0x7dd4c531, 0x1442bf36, 0xd2e96ddf, 0x2073954c, 0x8502aa89,
  48931. 0x4e0141ae, 0x8eef6cc9, 0x8ee00e1a, 0x5880cdaf, 0x55ce8491,
  48932. 0x69628046, 0xff3aba5c, 0x5d15dfbf, 0x335cc4f8, 0x9f684f25,
  48933. 0xa7f0440c, 0xbb1e5bd8, 0xae80453f, 0xff2225ab, 0xa1c99813,
  48934. 0x79b25d71, 0x54ff7884 },
  48935. { 0xde40b068, 0x27c6ee30, 0xe6f3a51e, 0x9226465b, 0xfa3b21f6,
  48936. 0xe24a4604, 0xc0418115, 0x50a5a5ad, 0x8df90d2b, 0xe3285441,
  48937. 0xdcb0c00f, 0xbb74e58f, 0x4a2c08e3, 0xc68f1b3b, 0x0ccd9ec9,
  48938. 0x339df081, 0xb786ea9f, 0x915362dc, 0xc955aead, 0x28945e31,
  48939. 0x8b6a6c6b, 0xd6a2c01d, 0x3678a427, 0x069e82dc, 0x28c9302c,
  48940. 0x17875500, 0x9fa101e6, 0x8acda965, 0xee30b286, 0x4e4e4573,
  48941. 0x3f1830fe, 0x8adbad85 },
  48942. { 0x0969d524, 0x060ae11f, 0xf39bcc79, 0xf42fdaf7, 0x7cc1fcc2,
  48943. 0x3cec6766, 0xe2336d4f, 0x456b9cf2, 0x8e1c0f7f, 0x6aa1f5de,
  48944. 0x0984fb0e, 0xcdbc2ad2, 0x1b464b28, 0x4090cfa6, 0x1243f3ef,
  48945. 0x40d86f30, 0xcd5e87e7, 0x95b16ccc, 0x3026cd41, 0x403f168c,
  48946. 0x816c0730, 0xdbe386cb, 0x58407a1d, 0x14eb86f3, 0x1717e1af,
  48947. 0xf588b4f8, 0x66cbc96c, 0xb75c41a6, 0x027e71c1, 0xf342c1aa,
  48948. 0xc0945e5f, 0x73930036 },
  48949. { 0x22cdaf42, 0x954f757d, 0xf4181aab, 0x788b591d, 0xf5514f25,
  48950. 0x8b986819, 0xf18fd5bc, 0x69642e08, 0x022ceb91, 0x92b305d1,
  48951. 0x6a4f6985, 0x1715903e, 0x61179cae, 0x4bd7d69d, 0xd29c01aa,
  48952. 0xdacdfd5d, 0xd91108cc, 0x705ddd5a, 0x64ac8f15, 0x434ac7b1,
  48953. 0xb524632f, 0x61a514e1, 0x731fc447, 0x45b9e61b, 0xe0961b31,
  48954. 0xcf561348, 0x73eaf223, 0x9c28a967, 0xaa7c99d3, 0x5bd10182,
  48955. 0xe42965e2, 0x8bc6ec4a },
  48956. { 0xe7f2a32b, 0xd096e5c0, 0x09388a30, 0xff54800c, 0x401e360c,
  48957. 0x06fe437c, 0xbb6054a6, 0x6655fc9c, 0x8457aa6e, 0x510e1860,
  48958. 0x2b29b2b7, 0xa0acfca2, 0x51b7da61, 0x732483e3, 0x6be6c8ca,
  48959. 0xe31471ee, 0x8b65c9a1, 0xe565431c, 0x48d65cbb, 0xfc9ac3b9,
  48960. 0xae9b2aa8, 0xd308fc21, 0xaa60aa6a, 0xd6a7df0d, 0x982fc0d4,
  48961. 0x2844d96a, 0x5847a4d7, 0xab012c2c, 0xdceb8955, 0x2b3c8f71,
  48962. 0xbe9c7e15, 0x8e85437d },
  48963. };
  48964. /* Perform the modular exponentiation in Fp* for SAKKE.
  48965. *
  48966. * Base is fixed to be the g parameter - a precomputed table is used.
  48967. *
  48968. * Striping: 128 points at a distance of 8 combined.
  48969. * Total of 256 points in table.
  48970. * Square and multiply performed in Fp*.
  48971. *
  48972. * base [in] Base. MP integer.
  48973. * exp [in] Exponent. MP integer.
  48974. * res [out] Result. MP integer.
  48975. * returns 0 on success, MP_READ_E if there are too many bytes in an array
  48976. * and MEMORY_E if memory allocation fails.
  48977. */
  48978. int sp_ModExp_Fp_star_1024(const mp_int* base, mp_int* exp, mp_int* res)
  48979. {
  48980. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  48981. !defined(WOLFSSL_SP_NO_MALLOC)
  48982. sp_digit* td;
  48983. sp_digit* t;
  48984. sp_digit* tx;
  48985. sp_digit* ty;
  48986. #else
  48987. sp_digit t[4 * 2 * 32];
  48988. sp_digit tx[2 * 32];
  48989. sp_digit ty[2 * 32];
  48990. #endif
  48991. sp_digit* r = NULL;
  48992. unsigned char e[128];
  48993. int err = MP_OKAY;
  48994. int i;
  48995. int y;
  48996. (void)base;
  48997. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  48998. !defined(WOLFSSL_SP_NO_MALLOC)
  48999. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * 6 * 32 * 2, NULL,
  49000. DYNAMIC_TYPE_TMP_BUFFER);
  49001. if (td == NULL) {
  49002. err = MEMORY_E;
  49003. }
  49004. #endif
  49005. if (err == MP_OKAY) {
  49006. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  49007. !defined(WOLFSSL_SP_NO_MALLOC)
  49008. t = td;
  49009. tx = td + 4 * 32 * 2;
  49010. ty = td + 5 * 32 * 2;
  49011. #endif
  49012. r = ty;
  49013. (void)mp_to_unsigned_bin_len(exp, e, 128);
  49014. XMEMCPY(tx, p1024_norm_mod, sizeof(sp_digit) * 32);
  49015. y = e[112] >> 7;
  49016. y |= (e[96] >> 7) << 1;
  49017. y |= (e[80] >> 7) << 2;
  49018. y |= (e[64] >> 7) << 3;
  49019. y |= (e[48] >> 7) << 4;
  49020. y |= (e[32] >> 7) << 5;
  49021. y |= (e[16] >> 7) << 6;
  49022. y |= (e[0] >> 7) << 7;
  49023. XMEMCPY(ty, sp_1024_g_table[y], sizeof(sp_digit) * 32);
  49024. for (i = 126; i >= 0; i--) {
  49025. y = (e[127 - (i / 8)] >> (i & 0x7)) & 1;
  49026. y |= ((e[111 - (i / 8)] >> (i & 0x7)) & 1) << 1;
  49027. y |= ((e[95 - (i / 8)] >> (i & 0x7)) & 1) << 2;
  49028. y |= ((e[79 - (i / 8)] >> (i & 0x7)) & 1) << 3;
  49029. y |= ((e[63 - (i / 8)] >> (i & 0x7)) & 1) << 4;
  49030. y |= ((e[47 - (i / 8)] >> (i & 0x7)) & 1) << 5;
  49031. y |= ((e[31 - (i / 8)] >> (i & 0x7)) & 1) << 6;
  49032. y |= ((e[15 - (i / 8)] >> (i & 0x7)) & 1) << 7;
  49033. sp_1024_proj_sqr_32(tx, ty, t);
  49034. sp_1024_proj_mul_qx1_32(tx, ty, sp_1024_g_table[y], t);
  49035. }
  49036. }
  49037. if (err == MP_OKAY) {
  49038. sp_1024_mont_inv_32(tx, tx, t);
  49039. sp_1024_mont_mul_32(r, tx, ty, p1024_mod, p1024_mp_mod);
  49040. XMEMSET(r + 32, 0, sizeof(sp_digit) * 32);
  49041. sp_1024_mont_reduce_32(r, p1024_mod, p1024_mp_mod);
  49042. err = sp_1024_to_mp(r, res);
  49043. }
  49044. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  49045. !defined(WOLFSSL_SP_NO_MALLOC)
  49046. if (td != NULL) {
  49047. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  49048. }
  49049. #endif
  49050. return err;
  49051. }
  49052. #endif /* WOLFSSL_SP_SMALL */
  49053. /* Multiply p* by q* in projective co-ordinates.
  49054. *
  49055. * p.x' = (p.x * q.x) - (p.y * q.y)
  49056. * p.y' = (p.x * q.y) + (p.y * q.x)
  49057. * But applying Karatsuba:
  49058. * v0 = p.x * q.x
  49059. * v1 = p.y * q.y
  49060. * p.x' = v0 - v1
  49061. * p.y' = (px + py) * (qx + qy) - v0 - v1
  49062. *
  49063. * px [in,out] A single precision integer - X ordinate of number to multiply.
  49064. * py [in,out] A single precision integer - Y ordinate of number to multiply.
  49065. * qx [in] A single precision integer - X ordinate of number of
  49066. * multiplier.
  49067. * qy [in] A single precision integer - Y ordinate of number of
  49068. * multiplier.
  49069. * t [in] Two single precision integers - temps.
  49070. */
  49071. static void sp_1024_proj_mul_32(sp_digit* px, sp_digit* py,
  49072. const sp_digit* qx, const sp_digit* qy, sp_digit* t)
  49073. {
  49074. sp_digit* t1 = t;
  49075. sp_digit* t2 = t + 2 * 32;
  49076. /* t1 = px + py */
  49077. sp_1024_mont_add_32(t1, px, py, p1024_mod);
  49078. /* t2 = qx + qy */
  49079. sp_1024_mont_add_32(t2, qx, qy, p1024_mod);
  49080. /* t2 = (px + py) * (qx + qy) */
  49081. sp_1024_mont_mul_32(t2, t1, t2, p1024_mod, p1024_mp_mod);
  49082. /* t1 = py * qy */
  49083. sp_1024_mont_mul_32(t1, py, qy, p1024_mod, p1024_mp_mod);
  49084. /* t2 = (px + py) * (qx + qy) - (py * qy) */
  49085. sp_1024_mont_sub_32(t2, t2, t1, p1024_mod);
  49086. /* px = px * qx */
  49087. sp_1024_mont_mul_32(px, px, qx, p1024_mod, p1024_mp_mod);
  49088. /* py = (px + py) * (qx + qy) - (py * qy) - (px * qx) */
  49089. sp_1024_mont_sub_32(py, t2, px, p1024_mod);
  49090. /* px = (px * qx) - (py * qy)*/
  49091. sp_1024_mont_sub_32(px, px, t1, p1024_mod);
  49092. }
  49093. #ifndef WOLFSSL_SP_SMALL
  49094. /*
  49095. * Convert point from projective to affine but keep in Montgomery form.
  49096. *
  49097. * p [in,out] Point to convert.
  49098. * t [in] Temporary numbers: 2.
  49099. */
  49100. static void sp_1024_mont_map_32(sp_point_1024* p, sp_digit* t)
  49101. {
  49102. sp_digit* t1 = t;
  49103. sp_digit* t2 = t + 2 * 32;
  49104. sp_1024_mont_inv_32(t1, p->z, t2);
  49105. sp_1024_mont_sqr_32(t2, t1, p1024_mod, p1024_mp_mod);
  49106. sp_1024_mont_mul_32(t1, t2, t1, p1024_mod, p1024_mp_mod);
  49107. sp_1024_mont_mul_32(p->x, p->x, t2, p1024_mod, p1024_mp_mod);
  49108. sp_1024_mont_mul_32(p->y, p->y, t1, p1024_mod, p1024_mp_mod);
  49109. XMEMCPY(p->z, p1024_norm_mod, sizeof(sp_digit) * 32);
  49110. }
  49111. #endif /* WOLFSSL_SP_SMALL */
  49112. /*
  49113. * Calculate gradient of line through P, P and [-2]P, accumulate line and
  49114. * double P.
  49115. *
  49116. * Calculations:
  49117. * l = 3 * (p.x^2 - p.z^4) = 3 * (p.x - p.z^2) * (p.x + p.z^2)
  49118. * r.x = l * (p.x + q.x * p.z^2) - 2 * p.y^2
  49119. * r.y = 2 * p.y * p.z^3 * q.y (= p'.z * p.z^2 * q.y)
  49120. * v* = v*^2 * r*
  49121. * p'.x = l^2 - 8 * p.y^2 * p.x
  49122. * p'.y = (4 * p.y^2 * p.x - p'.x) * l - 8 * p.y^4
  49123. * p'.z = 2 * p.y * p.z
  49124. *
  49125. * @param [in,out] vx X-ordinate of projective value in F*.
  49126. * @param [in,out] vy Y-ordinate of projective value in F*.
  49127. * @param [in,out] p ECC point - point on E(F_p^2) to double.
  49128. * @param [in] q ECC point - second point on E(F_P^2).
  49129. * @param [in] t SP temporaries (6 used).
  49130. */
  49131. static void sp_1024_accumulate_line_dbl_32(sp_digit* vx, sp_digit* vy,
  49132. sp_point_1024* p, const sp_point_1024* q, sp_digit* t)
  49133. {
  49134. sp_digit* t1 = t + 0 * 32;
  49135. sp_digit* pz2 = t + 2 * 32;
  49136. sp_digit* rx = t + 4 * 32;
  49137. sp_digit* ry = t + 6 * 32;
  49138. sp_digit* l = t + 8 * 32;
  49139. sp_digit* ty = t + 10 * 32;
  49140. /* v = v^2 */
  49141. sp_1024_proj_sqr_32(vx, vy, t);
  49142. /* pz2 = p.z^2 */
  49143. sp_1024_mont_sqr_32(pz2, p->z, p1024_mod, p1024_mp_mod);
  49144. /* t1 = p.x + p.z^2 */
  49145. sp_1024_mont_add_32(ty, p->x, pz2, p1024_mod);
  49146. /* l = p.x - p.z^2 */
  49147. sp_1024_mont_sub_32(l, p->x, pz2, p1024_mod);
  49148. /* t1 = (p.x + p.z^2) * (p.x - p.z^2) = p.x^2 - p.z^4 */
  49149. sp_1024_mont_mul_32(t1, l, ty, p1024_mod, p1024_mp_mod);
  49150. /* l = 3 * (p.x^2 - p.z^4) */
  49151. sp_1024_mont_tpl_32(l, t1, p1024_mod);
  49152. /* t1 = q.x * p.z^2 */
  49153. sp_1024_mont_mul_32(t1, q->x, pz2, p1024_mod, p1024_mp_mod);
  49154. /* t1 = p.x + q.x * p.z^2 */
  49155. sp_1024_mont_add_32(t1, p->x, t1, p1024_mod);
  49156. /* r.x = l * (p.x + q.x * p.z^2) */
  49157. sp_1024_mont_mul_32(rx, l, t1, p1024_mod, p1024_mp_mod);
  49158. /* r.y = 2 * p.y */
  49159. sp_1024_mont_dbl_32(ry, p->y, p1024_mod);
  49160. /* ty = 4 * p.y ^ 2 */
  49161. sp_1024_mont_sqr_32(ty, ry, p1024_mod, p1024_mp_mod);
  49162. /* t1 = 2 * p.y ^ 2 */
  49163. sp_1024_div2_32(t1, ty, p1024_mod);
  49164. /* r.x -= 2 * (p.y ^ 2) */
  49165. sp_1024_mont_sub_32(rx, rx, t1, p1024_mod);
  49166. /* p'.z = p.y * 2 * p.z */
  49167. sp_1024_mont_mul_32(p->z, p->z, ry, p1024_mod, p1024_mp_mod);
  49168. /* r.y = p'.z * p.z^2 */
  49169. sp_1024_mont_mul_32(t1, p->z, pz2, p1024_mod, p1024_mp_mod);
  49170. /* r.y = p'.z * p.z^2 * q.y */
  49171. sp_1024_mont_mul_32(ry, t1, q->y, p1024_mod, p1024_mp_mod);
  49172. /* v = v^2 * r */
  49173. sp_1024_proj_mul_32(vx, vy, rx, ry, t);
  49174. /* Double point using previously calculated values
  49175. * l = 3 * (p.x - p.z^2).(p.x + p.z^2)
  49176. * ty = 4 * p.y^2
  49177. * p'.z = 2 * p.y * p.z
  49178. */
  49179. /* t1 = (4 * p.y^2) ^ 2 = 16 * p.y^4 */
  49180. sp_1024_mont_sqr_32(t1, ty, p1024_mod, p1024_mp_mod);
  49181. /* t1 = 16 * p.y^4 / 2 = 8 * p.y^4 */
  49182. sp_1024_div2_32(t1, t1, p1024_mod);
  49183. /* p'.y = 4 * p.y^2 * p.x */
  49184. sp_1024_mont_mul_32(p->y, ty, p->x, p1024_mod, p1024_mp_mod);
  49185. /* p'.x = l^2 */
  49186. sp_1024_mont_sqr_32(p->x, l, p1024_mod, p1024_mp_mod);
  49187. /* p'.x = l^2 - 4 * p.y^2 * p.x */
  49188. sp_1024_mont_sub_32(p->x, p->x, p->y, p1024_mod);
  49189. /* p'.x = l^2 - 8 * p.y^2 * p.x */
  49190. sp_1024_mont_sub_32(p->x, p->x, p->y, p1024_mod);
  49191. /* p'.y = 4 * p.y^2 * p.x - p.x' */
  49192. sp_1024_mont_sub_32(ty, p->y, p->x, p1024_mod);
  49193. /* p'.y = (4 * p.y^2 * p.x - p'.x) * l */
  49194. sp_1024_mont_mul_32(p->y, ty, l, p1024_mod, p1024_mp_mod);
  49195. /* p'.y = (4 * p.y^2 * p.x - p'.x) * l - 8 * p.y^4 */
  49196. sp_1024_mont_sub_32(p->y, p->y, t1, p1024_mod);
  49197. }
  49198. #ifdef WOLFSSL_SP_SMALL
  49199. /*
  49200. * Calculate gradient of line through C, P and -C-P, accumulate line and
  49201. * add P to C.
  49202. *
  49203. * Calculations:
  49204. * r.x = (q.x + p.x) * c.y - (q.x * c.z^2 + c.x) * p.y * c.z
  49205. * r.y = (c.x - p.x * c.z^2) * q.y * c.z
  49206. * v* = v* * r*
  49207. * r = p.y * c.z^3 - c.y
  49208. * c'.x = r^2 + h^3 - 2 * c.x * h^2
  49209. * c'.y = r * (c'.x - c.x * h^2) - c.y * h^3
  49210. * c'.z = (c.x - p.x * c.z^2) * c.z
  49211. *
  49212. * @param [in,out] vx X-ordinate of projective value in F*.
  49213. * @param [in,out] vy Y-ordinate of projective value in F*.
  49214. * @param [in,out] c ECC point - current point on E(F_p^2) to be added
  49215. * to.
  49216. * @param [in] p ECC point - point on E(F_p^2) to add.
  49217. * @param [in] q ECC point - second point on E(F_P^2).
  49218. * @param [in] qx_px SP that is a constant value across adds.
  49219. * @param [in] t SP temporaries (6 used).
  49220. */
  49221. static void sp_1024_accumulate_line_add_one_32(sp_digit* vx, sp_digit* vy,
  49222. sp_point_1024* c, sp_point_1024* p, sp_point_1024* q, sp_digit* qx_px,
  49223. sp_digit* t)
  49224. {
  49225. sp_digit* t1 = t;
  49226. sp_digit* t2 = t + 2 * 32;
  49227. sp_digit* rx = t + 4 * 32;
  49228. sp_digit* ry = t + 6 * 32;
  49229. sp_digit* h = t + 8 * 32;
  49230. sp_digit* r = t + 10 * 32;
  49231. /* r.x = (q.x + p.x) * c.y */
  49232. sp_1024_mont_mul_32(rx, qx_px, c->y, p1024_mod, p1024_mp_mod);
  49233. /* t2 = c.z^2 */
  49234. sp_1024_mont_sqr_32(t2, c->z, p1024_mod, p1024_mp_mod);
  49235. /* t1 = q.x * c.z^2 */
  49236. sp_1024_mont_mul_32(t1, q->x, t2, p1024_mod, p1024_mp_mod);
  49237. /* t1 = q.x * c.z^2 + c.x */
  49238. sp_1024_mont_add_32(h, t1, c->x, p1024_mod);
  49239. /* r = p.y * c.z */
  49240. sp_1024_mont_mul_32(ry, p->y, c->z, p1024_mod, p1024_mp_mod);
  49241. /* t1 = (q.x * c.z^2 + c.x) * p.y * c.z */
  49242. sp_1024_mont_mul_32(t1, h, ry, p1024_mod, p1024_mp_mod);
  49243. /* r = p.y * c.z * c.z^2 = p.y * c.z^3 */
  49244. sp_1024_mont_mul_32(r, ry, t2, p1024_mod, p1024_mp_mod);
  49245. /* r.x -= (q.x * c.z^2 + c.x) * p.y * c.z */
  49246. sp_1024_mont_sub_32(rx, rx, t1, p1024_mod);
  49247. /* t1 = p.x * c.z^2 */
  49248. sp_1024_mont_mul_32(t1, p->x, t2, p1024_mod, p1024_mp_mod);
  49249. /* h = c.x - p.x * c.z^2 */
  49250. sp_1024_mont_sub_32(h, c->x, t1, p1024_mod);
  49251. /* c'.z = (c.x - p.x * c.z^2) * c.z */
  49252. sp_1024_mont_mul_32(c->z, h, c->z, p1024_mod, p1024_mp_mod);
  49253. /* r.y = (c.x - p.x * c.z^2) * c.z * q.y */
  49254. sp_1024_mont_mul_32(ry, c->z, q->y, p1024_mod, p1024_mp_mod);
  49255. /* v = v * r */
  49256. sp_1024_proj_mul_32(vx, vy, rx, ry, t);
  49257. /* Add p to c using previously calculated values.
  49258. * h = c.x - p.x * c.z^2
  49259. * r = p.y * c.z^3
  49260. * c'.z = (c.x - p.x * c.z^2) * c.z
  49261. */
  49262. /* r = p.y * c.z^3 - c.y */
  49263. sp_1024_mont_sub_32(r, r, c->y, p1024_mod);
  49264. /* t1 = r^2 */
  49265. sp_1024_mont_sqr_32(t1, r, p1024_mod, p1024_mp_mod);
  49266. /* t2 = h^2 */
  49267. sp_1024_mont_sqr_32(rx, h, p1024_mod, p1024_mp_mod);
  49268. /* ry = c.x * h^2 */
  49269. sp_1024_mont_mul_32(ry, c->x, rx, p1024_mod, p1024_mp_mod);
  49270. /* t2 = h^3 */
  49271. sp_1024_mont_mul_32(t2, rx, h, p1024_mod, p1024_mp_mod);
  49272. /* c->x = r^2 + h^3 */
  49273. sp_1024_mont_add_32(c->x, t1, t2, p1024_mod);
  49274. /* t1 = 2 * c.x * h^2 */
  49275. sp_1024_mont_dbl_32(t1, ry, p1024_mod);
  49276. /* c'.x = r^2 + h^3 - 2 * c.x * h^2 */
  49277. sp_1024_mont_sub_32(c->x, c->x, t1, p1024_mod);
  49278. /* ry = c'.x - c.x * h^2 */
  49279. sp_1024_mont_sub_32(t1, c->x, ry, p1024_mod);
  49280. /* ry = r * (c'.x - c.x * h^2) */
  49281. sp_1024_mont_mul_32(ry, t1, r, p1024_mod, p1024_mp_mod);
  49282. /* t2 = c.y * h^3 */
  49283. sp_1024_mont_mul_32(t1, t2, c->y, p1024_mod, p1024_mp_mod);
  49284. /* c'.y = r * (c'.x - c.x * h^2) - c.y * h^3 */
  49285. sp_1024_mont_sub_32(c->y, ry, t1, p1024_mod);
  49286. }
  49287. /*
  49288. * Calculate r = pairing <P, Q>.
  49289. *
  49290. * That is, multiply base in PF_p[q] by the scalar s, such that s.P = Q.
  49291. *
  49292. * @param [in] key SAKKE key.
  49293. * @param [in] p First point on E(F_p)[q].
  49294. * @param [in] q Second point on E(F_p)[q].
  49295. * @param [in] r Result of calculation.
  49296. * @return 0 on success.
  49297. * @return MEMORY_E when dynamic memory allocation fails.
  49298. * @return Other -ve value on internal failure.
  49299. */
  49300. int sp_Pairing_1024(const ecc_point* pm, const ecc_point* qm, mp_int* res)
  49301. {
  49302. int err = MP_OKAY;
  49303. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  49304. !defined(WOLFSSL_SP_NO_MALLOC)
  49305. sp_digit* td = NULL;
  49306. sp_digit* t;
  49307. sp_digit* vx;
  49308. sp_digit* vy;
  49309. sp_digit* qx_px;
  49310. #else
  49311. sp_digit t[6 * 2 * 32];
  49312. sp_digit vx[2 * 32];
  49313. sp_digit vy[2 * 32];
  49314. sp_digit qx_px[2 * 32];
  49315. sp_point_1024 pd;
  49316. sp_point_1024 qd;
  49317. sp_point_1024 cd;
  49318. #endif
  49319. sp_point_1024* p = NULL;
  49320. sp_point_1024* q = NULL;
  49321. sp_point_1024* c = NULL;
  49322. sp_digit* r = NULL;
  49323. int i;
  49324. err = sp_1024_point_new_32(NULL, pd, p);
  49325. if (err == MP_OKAY) {
  49326. err = sp_1024_point_new_32(NULL, qd, q);
  49327. }
  49328. if (err == MP_OKAY) {
  49329. err = sp_1024_point_new_32(NULL, cd, c);
  49330. }
  49331. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  49332. !defined(WOLFSSL_SP_NO_MALLOC)
  49333. if (err == MP_OKAY) {
  49334. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * 9 * 32 * 2, NULL,
  49335. DYNAMIC_TYPE_TMP_BUFFER);
  49336. if (td == NULL) {
  49337. err = MEMORY_E;
  49338. }
  49339. }
  49340. #endif
  49341. if (err == MP_OKAY) {
  49342. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  49343. !defined(WOLFSSL_SP_NO_MALLOC)
  49344. t = td;
  49345. vx = td + 6 * 32 * 2;
  49346. vy = td + 7 * 32 * 2;
  49347. qx_px = td + 8 * 32 * 2;
  49348. #endif
  49349. r = vy;
  49350. sp_1024_point_from_ecc_point_32(p, pm);
  49351. sp_1024_point_from_ecc_point_32(q, qm);
  49352. err = sp_1024_mod_mul_norm_32(p->x, p->x, p1024_mod);
  49353. }
  49354. if (err == MP_OKAY) {
  49355. err = sp_1024_mod_mul_norm_32(p->y, p->y, p1024_mod);
  49356. }
  49357. if (err == MP_OKAY) {
  49358. err = sp_1024_mod_mul_norm_32(p->z, p->z, p1024_mod);
  49359. }
  49360. if (err == MP_OKAY) {
  49361. err = sp_1024_mod_mul_norm_32(q->x, q->x, p1024_mod);
  49362. }
  49363. if (err == MP_OKAY) {
  49364. err = sp_1024_mod_mul_norm_32(q->y, q->y, p1024_mod);
  49365. }
  49366. if (err == MP_OKAY) {
  49367. XMEMCPY(c, p, sizeof(sp_point_1024));
  49368. XMEMSET(vx, 0, sizeof(sp_digit) * 2 * 32);
  49369. vx[0] = 1;
  49370. XMEMSET(vy, 0, sizeof(sp_digit) * 2 * 32);
  49371. sp_1024_mont_add_32(qx_px, q->x, p->x, p1024_mod);
  49372. for (i = 1020; i >= 0; i--) {
  49373. /* Accumulate line into v and double point. */
  49374. sp_1024_accumulate_line_dbl_32(vx, vy, c, q, t);
  49375. if ((i > 0) && ((p1024_order[i / 32] >> (i % 32)) & 1)) {
  49376. /* Accumulate line into v and add P into C. */
  49377. sp_1024_accumulate_line_add_one_32(vx, vy, c, p, q, qx_px, t);
  49378. }
  49379. }
  49380. /* Final exponentiation */
  49381. sp_1024_proj_sqr_32(vx, vy, t);
  49382. sp_1024_proj_sqr_32(vx, vy, t);
  49383. /* Convert from PF_p[q] to F_p */
  49384. sp_1024_mont_inv_32(vx, vx, t);
  49385. sp_1024_mont_mul_32(r, vx, vy, p1024_mod, p1024_mp_mod);
  49386. XMEMSET(r + 32, 0, sizeof(sp_digit) * 32);
  49387. sp_1024_mont_reduce_32(r, p1024_mod, p1024_mp_mod);
  49388. err = sp_1024_to_mp(r, res);
  49389. }
  49390. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  49391. !defined(WOLFSSL_SP_NO_MALLOC)
  49392. if (td != NULL) {
  49393. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  49394. }
  49395. #endif
  49396. sp_1024_point_free_32(c, 1, NULL);
  49397. sp_1024_point_free_32(q, 1, NULL);
  49398. sp_1024_point_free_32(p, 1, NULL);
  49399. return err;
  49400. }
  49401. #else
  49402. /*
  49403. * Calculate gradient of line through C, P and -C-P, accumulate line and
  49404. * add P to C.
  49405. *
  49406. * Both C and P have z ordinates to use in the calculation.
  49407. *
  49408. * Calculations:
  49409. * r.x = (q.x * c.z^2 + c.x) * p.y * c.z - (q.x * p.z^2 + p.x) * c.y * p.z
  49410. * r.y = (p.x * c.z^2 - c.x * p.z^2) * q.y * p.z * c.z
  49411. * v* = v* * r*
  49412. * h = p.x * c.z^2 - c.x * p.z^2
  49413. * r = p.y * c.z^3 - c.y * p.z^3
  49414. * c'.x = r^2 - h^3 - 2 * c.x * p.z^2 * h^2
  49415. * c'.y = r * (c.x * p.z^2 * h^2 - c'.x) - c.y * p.z^3 * h^3
  49416. * c'.z = (p.x * c.z^2 - c.x * p.z^2) * c.z
  49417. *
  49418. * @param [in,out] vx X-ordinate of projective value in F*.
  49419. * @param [in,out] vy Y-ordinate of projective value in F*.
  49420. * @param [in,out] c ECC point - current point on E(F_p^2) to be added
  49421. * to.
  49422. * @param [in,out] p ECC point - point on E(F_p^2) to add.
  49423. * @param [in,out] q ECC point - second point on E(F_P^2).
  49424. * @param [in,out] t SP temporaries (6 used).
  49425. * @param [in,out] neg Indicates to use negative P.
  49426. * @return 0 on success.
  49427. * @return MEMORY_E when dynamic memory allocation fails.
  49428. * @return Other -ve value on internal failure.
  49429. */
  49430. static void sp_1024_accumulate_line_add_n_32(sp_digit* vx, sp_digit* vy,
  49431. const sp_point_1024* p, const sp_point_1024* q,
  49432. sp_point_1024* c, sp_digit* t, int neg)
  49433. {
  49434. sp_digit* t1 = t;
  49435. sp_digit* t2 = t + 2 * 32;
  49436. sp_digit* rx = t + 4 * 32;
  49437. sp_digit* ry = t + 6 * 32;
  49438. sp_digit* h = t + 8 * 32;
  49439. sp_digit* r = t + 10 * 32;
  49440. /* h = p.z^2 */
  49441. sp_1024_mont_sqr_32(h, p->z, p1024_mod, p1024_mp_mod);
  49442. /* rx = q.x * p.z^2 */
  49443. sp_1024_mont_mul_32(rx, q->x, h, p1024_mod, p1024_mp_mod);
  49444. /* rx = q.x * p.z^2 + p.x */
  49445. sp_1024_mont_add_32(t2, rx, p->x, p1024_mod);
  49446. /* c.y = c.y * p.z */
  49447. sp_1024_mont_mul_32(t1, c->y, p->z, p1024_mod, p1024_mp_mod);
  49448. /* r.x = (q.x * p.z^2 + p.x) * c.y * p.z */
  49449. sp_1024_mont_mul_32(rx, t2, t1, p1024_mod, p1024_mp_mod);
  49450. /* c.y = c.y * p.z^3 */
  49451. sp_1024_mont_mul_32(c->y, t1, h, p1024_mod, p1024_mp_mod);
  49452. /* t2 = c.z^2 */
  49453. sp_1024_mont_sqr_32(t2, c->z, p1024_mod, p1024_mp_mod);
  49454. /* t1 = q.x * c.z^2 */
  49455. sp_1024_mont_mul_32(t1, q->x, t2, p1024_mod, p1024_mp_mod);
  49456. /* t1 = q.x * c.z^2 + c.x */
  49457. sp_1024_mont_add_32(t1, t1, c->x, p1024_mod);
  49458. /* c.x = c.x * p.z^2 */
  49459. sp_1024_mont_mul_32(c->x, c->x, h, p1024_mod, p1024_mp_mod);
  49460. /* r = p.y * c.z */
  49461. sp_1024_mont_mul_32(r, p->y, c->z, p1024_mod, p1024_mp_mod);
  49462. if (neg) {
  49463. /* r = -p.y * c.z */
  49464. sp_1024_mont_sub_32(r, p1024_mod, r, p1024_mod);
  49465. }
  49466. /* t1 = (q.x * c.z^2 + c.x) * p.y * c.z */
  49467. sp_1024_mont_mul_32(ry, t1, r, p1024_mod, p1024_mp_mod);
  49468. /* r.x -= (q.x * c.z^2 + c.x) * p.y * c.z */
  49469. sp_1024_mont_sub_32(rx, ry, rx, p1024_mod);
  49470. /* t1 = p.x * c.z^2 */
  49471. sp_1024_mont_mul_32(t1, p->x, t2, p1024_mod, p1024_mp_mod);
  49472. /* h = p.x * c.z^2 - c.x * p.z^2 */
  49473. sp_1024_mont_sub_32(h, t1, c->x, p1024_mod);
  49474. /* c'.z = (p.x * c.z^2 - c.x * p.z^2) * c.z */
  49475. sp_1024_mont_mul_32(t1, h, c->z, p1024_mod, p1024_mp_mod);
  49476. /* c'.z = (p.x * c.z^2 - c.x * p.z^2) * c.z * p.z */
  49477. sp_1024_mont_mul_32(c->z, t1, p->z, p1024_mod, p1024_mp_mod);
  49478. /* r.y = (p.x * c.z^2 - c.x * p.z^2) * c.z * p.z * q.y */
  49479. sp_1024_mont_mul_32(ry, c->z, q->y, p1024_mod, p1024_mp_mod);
  49480. /* r = p.y * c.z^3 */
  49481. sp_1024_mont_mul_32(t1, r, t2, p1024_mod, p1024_mp_mod);
  49482. /* r = p.y * c.z^3 - c.y * p.z^3 */
  49483. sp_1024_mont_sub_32(r, t1, c->y, p1024_mod);
  49484. /* v = v * r */
  49485. sp_1024_proj_mul_32(vx, vy, rx, ry, t);
  49486. /* Add p to c using previously calculated values.
  49487. * h = p.x * c.z^2 - c.x * p.z^2
  49488. * r = p.y * c.z^3 - c.y * p.z^3
  49489. * c'.z = (p.x * c.z^2 - c.x * p.z^2) * c.z
  49490. */
  49491. /* t1 = r^2 */
  49492. sp_1024_mont_sqr_32(t1, r, p1024_mod, p1024_mp_mod);
  49493. /* t2 = h^2 */
  49494. sp_1024_mont_sqr_32(rx, h, p1024_mod, p1024_mp_mod);
  49495. /* ry = c.x * p.z^2 * h^2 */
  49496. sp_1024_mont_mul_32(ry, rx, c->x, p1024_mod, p1024_mp_mod);
  49497. /* t2 = h^3 */
  49498. sp_1024_mont_mul_32(t2, rx, h, p1024_mod, p1024_mp_mod);
  49499. /* c'.x = r^2 - h^3 */
  49500. sp_1024_mont_sub_32(c->x, t1, t2, p1024_mod);
  49501. /* t1 = 2 * c.x * p.z^2 * h^2 */
  49502. sp_1024_mont_dbl_32(t1, ry, p1024_mod);
  49503. /* c'.x = r^2 - h^3 - 2 * c.x * p.z^2 * h^2 */
  49504. sp_1024_mont_sub_32(c->x, c->x, t1, p1024_mod);
  49505. /* ry = c.x * p.z^2 * h^2 - c'.x */
  49506. sp_1024_mont_sub_32(t1, ry, c->x, p1024_mod);
  49507. /* ry = r * (c.x * p.z^2 * h^2 - c'.x) */
  49508. sp_1024_mont_mul_32(ry, t1, r, p1024_mod, p1024_mp_mod);
  49509. /* t2 = c.y * p.z^3 * h^3 */
  49510. sp_1024_mont_mul_32(t1, t2, c->y, p1024_mod, p1024_mp_mod);
  49511. /* c'.y = r * (c.x * p.z^2 * h^2 - c'.x) - c.y * p.z^3 * h^3 */
  49512. sp_1024_mont_sub_32(c->y, ry, t1, p1024_mod);
  49513. }
  49514. /*
  49515. * Perform n accumulate doubles and doubles of P.
  49516. *
  49517. * py = 2 * p.y
  49518. *
  49519. * For each double:
  49520. * Calculate gradient of line through P, P and [-2]P, accumulate line and
  49521. * double P.
  49522. *
  49523. * Calculations:
  49524. * l = 3 * (p.x^2 - p.z^4) = 3 * (p.x - p.z^2) * (p.x + p.z^2)
  49525. * r.x = l * (p.x + q.x * p.z^2) - py^2 / 2
  49526. * r.y = py * p.z^3 * q.y (= p'.z * p.z^2 * q.y)
  49527. * v* = v*^2 * r*
  49528. * p'.x = l^2 - 2 * py^2 * p.x
  49529. * py' = (py^2 * p.x - p'.x) * l - py^4 (= 2 * p'.y)
  49530. * p'.z = py * p.z
  49531. *
  49532. * Finally:
  49533. * p'.y = py' / 2
  49534. *
  49535. * @param [in,out] vx X-ordinate of projective value in F*.
  49536. * @param [in,out] vy Y-ordinate of projective value in F*.
  49537. * @param [in,out] p ECC point - point on E(F_p^2) to double.
  49538. * @param [in] q ECC point - second point on E(F_P^2).
  49539. * @param [in] n Number of times to double.
  49540. * @param [in] t SP temporaries (6 used).
  49541. */
  49542. static void sp_1024_accumulate_line_dbl_n_32(sp_digit* vx, sp_digit* vy,
  49543. sp_point_1024* p, const sp_point_1024* q, int n, sp_digit* t)
  49544. {
  49545. sp_digit* t1 = t + 0 * 32;
  49546. sp_digit* pz2 = t + 2 * 32;
  49547. sp_digit* rx = t + 4 * 32;
  49548. sp_digit* ry = t + 6 * 32;
  49549. sp_digit* l = t + 8 * 32;
  49550. sp_digit* ty = t + 10 * 32;
  49551. int i;
  49552. /* py = 2 * p.y */
  49553. sp_1024_mont_dbl_32(p->y, p->y, p1024_mod);
  49554. for (i = 0; i < n; i++) {
  49555. /* v = v^2 */
  49556. sp_1024_proj_sqr_32(vx, vy, t);
  49557. /* pz2 = p.z^2 */
  49558. sp_1024_mont_sqr_32(pz2, p->z, p1024_mod, p1024_mp_mod);
  49559. /* t1 = p.x + p.z^2 */
  49560. sp_1024_mont_add_32(t1, p->x, pz2, p1024_mod);
  49561. /* l = p.x - p.z^2 */
  49562. sp_1024_mont_sub_32(l, p->x, pz2, p1024_mod);
  49563. /* t1 = (p.x + p.z^2) * (p.x - p.z^2) = p.x^2 - p.z^4 */
  49564. sp_1024_mont_mul_32(ty, l, t1, p1024_mod, p1024_mp_mod);
  49565. /* l = 3 * (p.x^2 - p.z^4) */
  49566. sp_1024_mont_tpl_32(l, ty, p1024_mod);
  49567. /* t1 = q.x * p.z^2 */
  49568. sp_1024_mont_mul_32(t1, q->x, pz2, p1024_mod, p1024_mp_mod);
  49569. /* t1 = p.x + q.x * p.z^2 */
  49570. sp_1024_mont_add_32(t1, p->x, t1, p1024_mod);
  49571. /* r.x = l * (p.x + q.x * p.z^2) */
  49572. sp_1024_mont_mul_32(rx, l, t1, p1024_mod, p1024_mp_mod);
  49573. /* ty = py ^ 2 */
  49574. sp_1024_mont_sqr_32(ty, p->y, p1024_mod, p1024_mp_mod);
  49575. /* t1 = py ^ 2 / 2 */
  49576. sp_1024_div2_32(t1, ty, p1024_mod);
  49577. /* r.x -= py ^ 2 / 2 */
  49578. sp_1024_mont_sub_32(rx, rx, t1, p1024_mod);
  49579. /* p'.z = py * pz */
  49580. sp_1024_mont_mul_32(p->z, p->z, p->y, p1024_mod, p1024_mp_mod);
  49581. /* r.y = p'.z * p.z^2 */
  49582. sp_1024_mont_mul_32(t1, p->z, pz2, p1024_mod, p1024_mp_mod);
  49583. /* r.y = p'.z * p.z^2 * q.y */
  49584. sp_1024_mont_mul_32(ry, t1, q->y, p1024_mod, p1024_mp_mod);
  49585. /* v = v^2 * r */
  49586. sp_1024_proj_mul_32(vx, vy, rx, ry, t);
  49587. /* Double point using previously calculated values
  49588. * l = 3 * (p.x - p.z^2).(p.x + p.z^2)
  49589. * ty = py^2
  49590. * p'.z = py * p.z
  49591. */
  49592. /* t1 = py^2 ^ 2 = py^4 */
  49593. sp_1024_mont_sqr_32(t1, ty, p1024_mod, p1024_mp_mod);
  49594. /* py' = py^2 * p. x */
  49595. sp_1024_mont_mul_32(p->y, ty, p->x, p1024_mod, p1024_mp_mod);
  49596. /* p'.x = l^2 */
  49597. sp_1024_mont_sqr_32(p->x, l, p1024_mod, p1024_mp_mod);
  49598. /* p'.x = l^2 - py^2 * p.x */
  49599. sp_1024_mont_sub_32(p->x, p->x, p->y, p1024_mod);
  49600. /* p'.x = l^2 - 2 * p.y^2 * p.x */
  49601. sp_1024_mont_sub_32(p->x, p->x, p->y, p1024_mod);
  49602. /* py' = py^2 * p.x - p.x' */
  49603. sp_1024_mont_sub_32(ty, p->y, p->x, p1024_mod);
  49604. /* py' = (p.y^2 * p.x - p'.x) * l */
  49605. sp_1024_mont_mul_32(p->y, ty, l, p1024_mod, p1024_mp_mod);
  49606. /* py' = (p.y^2 * p.x - p'.x) * l * 2 */
  49607. sp_1024_mont_dbl_32(p->y, p->y, p1024_mod);
  49608. /* py' = (p.y^2 * p.x - p'.x) * l * 2 - p.y^4 */
  49609. sp_1024_mont_sub_32(p->y, p->y, t1, p1024_mod);
  49610. }
  49611. /* p'.y = py' / 2 */
  49612. sp_1024_div2_32(p->y, p->y, p1024_mod);
  49613. }
  /* Operations to perform for the pairing, based on order - 1.
   *
   * Sliding window of width 6 bits. A negative value means the window value
   * is subtracted rather than added.
   *
   * The entries are pairs, four pairs per line:
   *   even index - signed, odd window value (-31..31) to add/subtract
   *   odd index  - number of doublings to perform after that value
   * The first pair supplies the starting value and its doublings.
   */
  static const signed char sp_1024_order_op[] = {
        5,  6,  -13,  9,  -21,  6,   -5,  8,
       31,  6,    3,  6,  -27,  6,   25,  9,
       -1,  6,  -11,  6,  -13,  6,   -7,  6,
      -15,  6,  -29,  7,   25,  6,   -9,  6,
      -19,  7,    3,  6,   11,  9,  -23,  6,
        1,  6,   27,  6,    1,  7,  -25,  8,
       13,  7,  -13,  7,  -23, 10,   19,  7,
        7,  7,   -3,  7,   27,  6,   -7,  7,
      -21,  7,   11,  7,   31,  8,    1,  7,
      -23,  6,  -17,  6,   -3, 10,   11,  6,
      -21,  7,  -27, 11,  -29,  6,   -1, 10,
       15,  8,   27,  7,   17,  6,   17,  7,
      -13,  8,   13,  6,   21,  7,  -29,  6,
       19,  7,  -25,  6,   11,  9,   29,  7,
       -7,  8,   27,  7,   29, 10,   -1,  8,
       -7,  8,   17,  6,   17,  7,  -27,  7,
      -21,  6,   -9,  6,  -27, 12,  -23,  6,
       19,  6,   13,  6,  -11,  7,   27,  6,
       17,  6,   -7,  6,  -25,  7,  -29,  6,
        9,  7,    7,  6,   13,  6,  -25,  6,
      -19,  6,   13,  6,  -11,  6,    5,  8,
       19,  6,  -21,  8,   23,  7,   27,  6,
      -13,  6,  -19, 11,   29,  7,  -15,  6,
       -9,  7,  -21, 10,   -3,  7,   21, 10,
       25,  6,  -15,  6,  -23,  6,   21,  6,
        1,  6,   21,  7,   -3,  6,   -3,  7,
       -7,  6,  -23,  7,    7,  8,   15,  9,
        5,  6,  -11,  6,   21, 11,  -27,  7,
       27,  6,  -11,  6,   31,  6,  -21,  6,
       19,  6,   -7,  8,   -7, 13,   -3,  6,
       -7,  7,   -3,  6,    1,  6,    7,  8,
       19,  8,   11,  9,   -9,  7,  -31, 12,
       25,  6,  -17,  9,  -15,  7,    5,  6,
       25,  7,   -5,  7,  -25,  6,   17,  8,
      -19,  6,  -13,  6,   27,  8,    1,  7,
       -5,  7,   -1,  6,   21,  6,    3, 10,
       -3,  1,
  };
  49641. /*
  49642. * Calculate r = pairing <P, Q>.
  49643. *
  49644. * That is, multiply base in PF_p[q] by the scalar s, such that s.P = Q.
  49645. *
  49646. * Sliding window. Start at bottom and stop when bottom bit is one.
  49647. * Subtract if top bit in window is one.
  49648. * Width of 6 bits.
  49649. *
  49650. * @param [in] pm First point on E(F_p)[q].
  49651. * @param [in] qm Second point on E(F_p)[q].
  49652. * @param [in] res Result of calculation.
  49653. * @return 0 on success.
  49654. * @return MEMORY_E when dynamic memory allocation fails.
  49655. */
  49656. int sp_Pairing_1024(const ecc_point* pm, const ecc_point* qm, mp_int* res)
  49657. {
  49658. int err;
  49659. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  49660. !defined(WOLFSSL_SP_NO_MALLOC)
  49661. sp_digit* td = NULL;
  49662. sp_digit* t;
  49663. sp_digit* vx;
  49664. sp_digit* vy;
  49665. sp_digit (*pre_vx)[64];
  49666. sp_digit (*pre_vy)[64];
  49667. sp_digit (*pre_nvy)[64];
  49668. sp_point_1024* pre_p;
  49669. #else
  49670. sp_digit t[6 * 2 * 32];
  49671. sp_digit vx[2 * 32];
  49672. sp_digit vy[2 * 32];
  49673. sp_digit pre_vx[16][64];
  49674. sp_digit pre_vy[16][64];
  49675. sp_digit pre_nvy[16][64];
  49676. sp_point_1024 pre_p[16];
  49677. sp_point_1024 pd;
  49678. sp_point_1024 qd;
  49679. sp_point_1024 cd;
  49680. #endif
  49681. sp_point_1024* p = NULL;
  49682. sp_point_1024* q = NULL;
  49683. sp_point_1024* c = NULL;
  49684. sp_digit* r = NULL;
  49685. int i;
  49686. int j;
  49687. err = sp_1024_point_new_32(NULL, pd, p);
  49688. if (err == MP_OKAY) {
  49689. err = sp_1024_point_new_32(NULL, qd, q);
  49690. }
  49691. if (err == MP_OKAY) {
  49692. err = sp_1024_point_new_32(NULL, cd, c);
  49693. }
  49694. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  49695. !defined(WOLFSSL_SP_NO_MALLOC)
  49696. if (err == MP_OKAY) {
  49697. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * 56 * 32 * 2 + 16 * sizeof(sp_point_1024), NULL,
  49698. DYNAMIC_TYPE_TMP_BUFFER);
  49699. if (td == NULL) {
  49700. err = MEMORY_E;
  49701. }
  49702. }
  49703. #endif
  49704. if (err == MP_OKAY) {
  49705. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  49706. !defined(WOLFSSL_SP_NO_MALLOC)
  49707. t = td;
  49708. vx = td + 6 * 32 * 2;
  49709. vy = td + 7 * 32 * 2;
  49710. pre_vx = (sp_digit(*)[64])(td + 8 * 32 * 2);
  49711. pre_vy = (sp_digit(*)[64])(td + 24 * 32 * 2);
  49712. pre_nvy = (sp_digit(*)[64])(td + 40 * 32 * 2);
  49713. pre_p = (sp_point_1024*)(td + 56 * 32 * 2);
  49714. #endif
  49715. r = vy;
  49716. sp_1024_point_from_ecc_point_32(p, pm);
  49717. sp_1024_point_from_ecc_point_32(q, qm);
  49718. err = sp_1024_mod_mul_norm_32(p->x, p->x, p1024_mod);
  49719. }
  49720. if (err == MP_OKAY) {
  49721. err = sp_1024_mod_mul_norm_32(p->y, p->y, p1024_mod);
  49722. }
  49723. if (err == MP_OKAY) {
  49724. err = sp_1024_mod_mul_norm_32(p->z, p->z, p1024_mod);
  49725. }
  49726. if (err == MP_OKAY) {
  49727. err = sp_1024_mod_mul_norm_32(q->x, q->x, p1024_mod);
  49728. }
  49729. if (err == MP_OKAY) {
  49730. err = sp_1024_mod_mul_norm_32(q->y, q->y, p1024_mod);
  49731. }
  49732. if (err == MP_OKAY) {
  49733. /* Generate pre-computation table: 1, 3, ... , 31 */
  49734. XMEMCPY(&pre_p[0], p, sizeof(sp_point_1024));
  49735. XMEMSET(pre_vx[0], 0, sizeof(sp_digit) * 2 * 32);
  49736. pre_vx[0][0] = 1;
  49737. XMEMSET(pre_vy[0], 0, sizeof(sp_digit) * 2 * 32);
  49738. sp_1024_mont_sub_32(pre_nvy[0], p1024_mod, pre_vy[0], p1024_mod);
  49739. /* [2]P for adding */
  49740. XMEMCPY(c, p, sizeof(sp_point_1024));
  49741. XMEMSET(vx, 0, sizeof(sp_digit) * 2 * 32);
  49742. vx[0] = 1;
  49743. XMEMSET(vy, 0, sizeof(sp_digit) * 2 * 32);
  49744. sp_1024_accumulate_line_dbl_32(vx, vy, c, q, t);
  49745. /* 3, 5, ... */
  49746. for (i = 1; i < 16; i++) {
  49747. XMEMCPY(&pre_p[i], &pre_p[i-1], sizeof(sp_point_1024));
  49748. XMEMCPY(pre_vx[i], pre_vx[i-1], sizeof(sp_digit) * 2 * 32);
  49749. XMEMCPY(pre_vy[i], pre_vy[i-1], sizeof(sp_digit) * 2 * 32);
  49750. sp_1024_proj_mul_32(pre_vx[i], pre_vy[i], vx, vy, t);
  49751. sp_1024_accumulate_line_add_n_32(pre_vx[i], pre_vy[i], c,
  49752. q, &pre_p[i], t, 0);
  49753. sp_1024_mont_sub_32(pre_nvy[i], p1024_mod, pre_vy[i], p1024_mod);
  49754. }
  49755. j = sp_1024_order_op[0] / 2;
  49756. XMEMCPY(c, &pre_p[j], sizeof(sp_point_1024));
  49757. XMEMCPY(vx, pre_vx[j], sizeof(sp_digit) * 2 * 32);
  49758. XMEMCPY(vy, pre_vy[j], sizeof(sp_digit) * 2 * 32);
  49759. /* Accumulate line into v and double point n times. */
  49760. sp_1024_accumulate_line_dbl_n_32(vx, vy, c, q,
  49761. sp_1024_order_op[1], t);
  49762. for (i = 2; i < 290; i += 2) {
  49763. j = sp_1024_order_op[i];
  49764. if (j > 0) {
  49765. j /= 2;
  49766. /* Accumulate line into v and add P into C. */
  49767. sp_1024_proj_mul_32(vx, vy, pre_vx[j], pre_vy[j], t);
  49768. sp_1024_accumulate_line_add_n_32(vx, vy, &pre_p[j], q, c,
  49769. t, 0);
  49770. }
  49771. else {
  49772. j = -j / 2;
  49773. /* Accumulate line into v and add P into C. */
  49774. sp_1024_proj_mul_32(vx, vy, pre_vx[j], pre_nvy[j], t);
  49775. sp_1024_accumulate_line_add_n_32(vx, vy, &pre_p[j], q, c,
  49776. t, 1);
  49777. }
  49778. /* Accumulate line into v and double point n times. */
  49779. sp_1024_accumulate_line_dbl_n_32(vx, vy, c, q,
  49780. sp_1024_order_op[i + 1], t);
  49781. }
  49782. /* Final exponentiation */
  49783. sp_1024_proj_sqr_32(vx, vy, t);
  49784. sp_1024_proj_sqr_32(vx, vy, t);
  49785. /* Convert from PF_p[q] to F_p */
  49786. sp_1024_mont_inv_32(vx, vx, t);
  49787. sp_1024_mont_mul_32(r, vx, vy, p1024_mod, p1024_mp_mod);
  49788. XMEMSET(r + 32, 0, sizeof(sp_digit) * 32);
  49789. sp_1024_mont_reduce_32(r, p1024_mod, p1024_mp_mod);
  49790. err = sp_1024_to_mp(r, res);
  49791. }
  49792. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  49793. !defined(WOLFSSL_SP_NO_MALLOC)
  49794. if (td != NULL) {
  49795. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  49796. }
  49797. #endif
  49798. sp_1024_point_free_32(c, 1, NULL);
  49799. sp_1024_point_free_32(q, 1, NULL);
  49800. sp_1024_point_free_32(p, 1, NULL);
  49801. return err;
  49802. }
  49803. #endif /* WOLFSSL_SP_SMALL */
  49804. #ifdef WOLFSSL_SP_SMALL
  49805. /*
  49806. * Generate table for pairing.
  49807. *
  49808. * Small implementation does not use a table - returns 0 length.
  49809. *
  49810. * pm [in] Point to generate table for.
  49811. * table [in] Generated table.
  49812. * len [in,out] On in, the size of the buffer.
  49813. * On out, length of table generated.
  49814. * @return 0 on success.
  49815. * LENGTH_ONLY_E when table is NULL and only length returned.
  49816. * BUFFER_E when len is too small.
  49817. */
  49818. int sp_Pairing_gen_precomp_1024(const ecc_point* pm, byte* table,
  49819. word32* len)
  49820. {
  49821. int err = 0;
  49822. if (table == NULL) {
  49823. *len = 0;
  49824. err = LENGTH_ONLY_E;
  49825. }
  49826. else if (*len != 0) {
  49827. err = BUFFER_E;
  49828. }
  49829. (void)*pm;
  49830. return err;
  49831. }
  49832. /*
  49833. * Calculate r = pairing <P, Q>.
  49834. *
  49835. * That is, multiply base in PF_p[q] by the scalar s, such that s.P = Q.
  49836. *
  49837. * Small implementation does not use a table - use the normal implementation.
  49838. *
  49839. * @param [in] pm First point on E(F_p)[q].
  49840. * @param [in] qm Second point on E(F_p)[q].
  49841. * @param [in] res Result of calculation.
  49842. * @param [in] table Precomputed table of values.
  49843. * @param [in] len Length of precomputed table of values in bytes.
  49844. * @return 0 on success.
  49845. * @return MEMORY_E when dynamic memory allocation fails.
  49846. */
  49847. int sp_Pairing_precomp_1024(const ecc_point* pm, const ecc_point* qm,
  49848. mp_int* res, const byte* table, word32 len)
  49849. {
  49850. (void)table;
  49851. (void)len;
  49852. return sp_Pairing_1024(pm, qm, res);
  49853. }
  49854. #else
  49855. /*
  49856. * Calc l and c for the point when doubling p.
  49857. *
  49858. * l = 3 * (p.x^2 - 1) / (2 * p.y)
  49859. * c = l * p.x - p.y
  49860. *
  49861. * @param [out] lr Gradient result - table entry.
  49862. * @param [out] cr Constant result - table entry.
  49863. * @param [in] px X-ordinate of point to double.
  49864. * @param [in] py Y-ordinate of point to double.
  49865. * @param [in] t SP temporaries (3 used).
  49866. */
  49867. static void sp_1024_accum_dbl_calc_lc_32(sp_digit* lr, sp_digit* cr,
  49868. const sp_digit* px, const sp_digit* py, sp_digit* t)
  49869. {
  49870. sp_digit* t1 = t + 0 * 2 * 32;
  49871. sp_digit* t2 = t + 2 * 2 * 32;
  49872. sp_digit* l = t + 4 * 2 * 32;
  49873. /* l = 1 / 2 * p.y */
  49874. sp_1024_mont_dbl_32(l, py, p1024_mod);
  49875. sp_1024_mont_inv_32(l, l, t);
  49876. /* t1 = p.x^2 */
  49877. sp_1024_mont_sqr_32(t1, px, p1024_mod, p1024_mp_mod);
  49878. /* t1 = p.x - 1 */
  49879. sp_1024_mont_sub_32(t1, t1, p1024_norm_mod, p1024_mod);
  49880. /* t1 = 3 * (p.x^2 - 1) */
  49881. sp_1024_mont_dbl_32(t2, t1, p1024_mod);
  49882. sp_1024_mont_add_32(t1, t1, t2, p1024_mod);
  49883. /* t1 = 3 * (p.x^2 - 1) / (2 * p.y) */
  49884. sp_1024_mont_mul_32(l, l, t1, p1024_mod, p1024_mp_mod);
  49885. /* t2 = l * p.x */
  49886. sp_1024_mont_mul_32(t2, l, px, p1024_mod, p1024_mp_mod);
  49887. /* c = t2 = l * p.x - p.y */
  49888. sp_1024_mont_sub_32(t2, t2, py, p1024_mod);
  49889. XMEMCPY(lr, l, sizeof(sp_digit) * 32);
  49890. XMEMCPY(cr, t2, sizeof(sp_digit) * 32);
  49891. }
  49892. /*
  49893. * Calc l and c when adding p and c.
  49894. *
  49895. * l = (c.y - p.y) / (c.x - p.x)
  49896. * c = (p.x * c.y - cx * p.y) / (cx - p.x)
  49897. *
  49898. * @param [out] lr Gradient result - table entry.
  49899. * @param [out] cr Constant result - table entry.
  49900. * @param [in] px X-ordinate of point to add.
  49901. * @param [in] py Y-ordinate of point to add.
  49902. * @param [in] cx X-ordinate of current point.
  49903. * @param [in] cy Y-ordinate of current point.
  49904. * @param [in] t SP temporaries (3 used).
  49905. */
  49906. static void sp_1024_accum_add_calc_lc_32(sp_digit* lr, sp_digit* cr,
  49907. const sp_digit* px, const sp_digit* py, const sp_digit* cx,
  49908. const sp_digit* cy, sp_digit* t)
  49909. {
  49910. sp_digit* t1 = t + 0 * 2 * 32;
  49911. sp_digit* c = t + 2 * 2 * 32;
  49912. sp_digit* l = t + 4 * 2 * 32;
  49913. /* l = 1 / (c.x - p.x) */
  49914. sp_1024_mont_sub_32(l, cx, px, p1024_mod);
  49915. sp_1024_mont_inv_32(l, l, t);
  49916. /* c = p.x * c.y */
  49917. sp_1024_mont_mul_32(c, px, cy, p1024_mod, p1024_mp_mod);
  49918. /* t1 = c.x * p.y */
  49919. sp_1024_mont_mul_32(t1, cx, py, p1024_mod, p1024_mp_mod);
  49920. /* c = (p.x * c.y) - (c.x * p.y) */
  49921. sp_1024_mont_sub_32(c, c, t1, p1024_mod);
  49922. /* c = ((p.x * c.y) - (c.x * p.y)) / (c.x - p.x) */
  49923. sp_1024_mont_mul_32(c, c, l, p1024_mod, p1024_mp_mod);
  49924. /* t1 = c.y - p.y */
  49925. sp_1024_mont_sub_32(t1, cy, py, p1024_mod);
  49926. /* l = (c.y - p.y) / (c.x - p.x) */
  49927. sp_1024_mont_mul_32(l, t1, l, p1024_mod, p1024_mp_mod);
  49928. XMEMCPY(lr, l, sizeof(sp_digit) * 32);
  49929. XMEMCPY(cr, c, sizeof(sp_digit) * 32);
  49930. }
  49931. /*
  49932. * Calculate vx and vy given gradient l and constant c and point q.
  49933. *
  49934. * l is a the gradient and is multiplied by q->x.
  49935. * c is a the constant that is added to the multiplicative result.
  49936. * q->y is the y-ordinate in result to multiply.
  49937. *
  49938. * if dbl
  49939. * v* = v*^2
  49940. * r.x = l * q.x + c
  49941. * r.y = q->y
  49942. * v* = v* * r*
  49943. *
  49944. * @param [in,out] vx X-ordinate of projective value in F*.
  49945. * @param [in,out] vy Y-ordinate of projective value in F*.
  49946. * @param [in] l Gradient to multiply with.
  49947. * @param [in] c Constant to add with.
  49948. * @param [in] q ECC point - second point on E(F_P^2).
  49949. * @param [in] t SP temporaries (3 used).
  49950. * @param [in] dbl Indicates whether this is for doubling. Otherwise
  49951. * adding.
  49952. */
  49953. static void sp_1024_accumulate_line_lc_32(sp_digit* vx, sp_digit* vy,
  49954. const sp_digit* l, const sp_digit* c, const sp_point_1024* q,
  49955. sp_digit* t, int dbl)
  49956. {
  49957. sp_digit* rx = t + 4 * 2 * 32;
  49958. /* v = v^2 */
  49959. if (dbl) {
  49960. sp_1024_proj_sqr_32(vx, vy, t);
  49961. }
  49962. /* rx = l * q.x + c */
  49963. sp_1024_mont_mul_32(rx, l, q->x, p1024_mod, p1024_mp_mod);
  49964. sp_1024_mont_add_32(rx, rx, c, p1024_mod);
  49965. /* v = v^2 * r */
  49966. sp_1024_proj_mul_32(vx, vy, rx, q->y, t);
  49967. }
  /* Operations to perform for the pairing with a precomputed table, based on
   * order - 1.
   *
   * Sliding window of width 6 bits. A negative value means the window value
   * is subtracted rather than added.
   *
   * The entries are pairs, four pairs per line:
   *   even index - signed, odd window value (-31..31) to add/subtract
   *   odd index  - number of doublings to perform after that value
   * The first pair supplies the starting value and its doublings.
   */
  static const signed char sp_1024_order_op_pre[] = {
        5,  6,  -13,  9,  -21,  6,   -5,  8,
       31,  6,    3,  6,  -27,  6,   25,  9,
       -1,  6,  -11,  6,  -13,  6,   -7,  6,
      -15,  6,  -29,  7,   25,  6,   -9,  6,
      -19,  7,    3,  6,   11,  9,  -23,  6,
        1,  6,   27,  6,    1,  7,  -25,  8,
       13,  7,  -13,  7,  -23, 10,   19,  7,
        7,  7,   -3,  7,   27,  6,   -7,  7,
      -21,  7,   11,  7,   31,  8,    1,  7,
      -23,  6,  -17,  6,   -3, 10,   11,  6,
      -21,  7,  -27, 11,  -29,  6,   -1, 10,
       15,  8,   27,  7,   17,  6,   17,  7,
      -13,  8,   13,  6,   21,  7,  -29,  6,
       19,  7,  -25,  6,   11,  9,   29,  7,
       -7,  8,   27,  7,   29, 10,   -1,  8,
       -7,  8,   17,  6,   17,  7,  -27,  7,
      -21,  6,   -9,  6,  -27, 12,  -23,  6,
       19,  6,   13,  6,  -11,  7,   27,  6,
       17,  6,   -7,  6,  -25,  7,  -29,  6,
        9,  7,    7,  6,   13,  6,  -25,  6,
      -19,  6,   13,  6,  -11,  6,    5,  8,
       19,  6,  -21,  8,   23,  7,   27,  6,
      -13,  6,  -19, 11,   29,  7,  -15,  6,
       -9,  7,  -21, 10,   -3,  7,   21, 10,
       25,  6,  -15,  6,  -23,  6,   21,  6,
        1,  6,   21,  7,   -3,  6,   -3,  7,
       -7,  6,  -23,  7,    7,  8,   15,  9,
        5,  6,  -11,  6,   21, 11,  -27,  7,
       27,  6,  -11,  6,   31,  6,  -21,  6,
       19,  6,   -7,  8,   -7, 13,   -3,  6,
       -7,  7,   -3,  6,    1,  6,    7,  8,
       19,  8,   11,  9,   -9,  7,  -31, 12,
       25,  6,  -17,  9,  -15,  7,    5,  6,
       25,  7,   -5,  7,  -25,  6,   17,  8,
      -19,  6,  -13,  6,   27,  8,    1,  7,
       -5,  7,   -1,  6,   21,  6,    3, 10,
       -3,  1,
  };
  49995. /*
  49996. * Generate table for pairing.
  49997. *
  49998. * Calculate the gradient (l) and constant (c) at each step of the way.
  49999. * Sliding window. Start at bottom and stop when bottom bit is one.
  50000. * Subtract if top bit in window is one.
  50001. * Width of 6 bits.
  50002. *
  50003. * pm [in] Point to generate table for.
  50004. * table [in] Generated table.
  50005. * len [in,out] On in, the size of the buffer.
  50006. * On out, length of table generated.
  50007. * @return 0 on success.
  50008. * LENGTH_ONLY_E when table is NULL and only length returned.
  50009. * BUFFER_E when len is too small.
  50010. * MEMORY_E when dynamic memory allocation fails.
  50011. */
  50012. int sp_Pairing_gen_precomp_1024(const ecc_point* pm, byte* table,
  50013. word32* len)
  50014. {
  50015. int err = 0;
  50016. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  50017. !defined(WOLFSSL_SP_NO_MALLOC)
  50018. sp_digit* td = NULL;
  50019. sp_digit* t;
  50020. sp_point_1024* pre_p;
  50021. #else
  50022. sp_digit t[6 * 2 * 32];
  50023. sp_point_1024 pre_p[16];
  50024. sp_point_1024 pd;
  50025. sp_point_1024 cd;
  50026. sp_point_1024 negd;
  50027. #endif
  50028. sp_point_1024* p = NULL;
  50029. sp_point_1024* c = NULL;
  50030. sp_point_1024* neg = NULL;
  50031. int i;
  50032. int j;
  50033. int k;
  50034. sp_table_entry_1024* precomp = (sp_table_entry_1024*)table;
  50035. if (table == NULL) {
  50036. *len = sizeof(sp_table_entry_1024) * 1167;
  50037. err = LENGTH_ONLY_E;
  50038. }
  50039. if ((err == MP_OKAY) &&
  50040. (*len < (int)(sizeof(sp_table_entry_1024) * 1167))) {
  50041. err = BUFFER_E;
  50042. }
  50043. if (err == MP_OKAY) {
  50044. err = sp_1024_point_new_32(NULL, pd, p);
  50045. }
  50046. if (err == MP_OKAY) {
  50047. err = sp_1024_point_new_32(NULL, cd, c);
  50048. }
  50049. if (err == MP_OKAY) {
  50050. err = sp_1024_point_new_32(NULL, negd, neg);
  50051. }
  50052. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  50053. !defined(WOLFSSL_SP_NO_MALLOC)
  50054. if (err == MP_OKAY) {
  50055. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * 6 * 32 * 2 + 16 * sizeof(sp_point_1024), NULL,
  50056. DYNAMIC_TYPE_TMP_BUFFER);
  50057. if (td == NULL) {
  50058. err = MEMORY_E;
  50059. }
  50060. }
  50061. #endif
  50062. if (err == MP_OKAY) {
  50063. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  50064. !defined(WOLFSSL_SP_NO_MALLOC)
  50065. t = td;
  50066. pre_p = (sp_point_1024*)(td + 6 * 32 * 2);
  50067. #endif
  50068. sp_1024_point_from_ecc_point_32(p, pm);
  50069. err = sp_1024_mod_mul_norm_32(p->x, p->x, p1024_mod);
  50070. }
  50071. if (err == MP_OKAY) {
  50072. err = sp_1024_mod_mul_norm_32(p->y, p->y, p1024_mod);
  50073. }
  50074. if (err == MP_OKAY) {
  50075. XMEMCPY(p->z, p1024_norm_mod, sizeof(p1024_norm_mod));
  50076. neg->infinity = 0;
  50077. c->infinity = 0;
  50078. /* Generate pre-computation table: 1, 3, ... , 31 */
  50079. XMEMCPY(&pre_p[0], p, sizeof(sp_point_1024));
  50080. /* [2]P for adding */
  50081. sp_1024_proj_point_dbl_32(c, p, t);
  50082. /* 1, 3, ... */
  50083. for (i = 1; i < 16; i++) {
  50084. sp_1024_proj_point_add_32(&pre_p[i], &pre_p[i-1], c, t);
  50085. sp_1024_mont_map_32(&pre_p[i], t);
  50086. }
  50087. k = 0;
  50088. j = sp_1024_order_op_pre[0] / 2;
  50089. XMEMCPY(c, &pre_p[j], sizeof(sp_point_1024));
  50090. for (j = 0; j < sp_1024_order_op_pre[1]; j++) {
  50091. sp_1024_accum_dbl_calc_lc_32(precomp[k].x, precomp[k].y, c->x, c->y, t);
  50092. k++;
  50093. sp_1024_proj_point_dbl_32(c, c, t);
  50094. sp_1024_mont_map_32(c, t);
  50095. }
  50096. for (i = 2; i < 290; i += 2) {
  50097. j = sp_1024_order_op_pre[i];
  50098. if (j > 0) {
  50099. sp_1024_accum_add_calc_lc_32(precomp[k].x, precomp[k].y,
  50100. pre_p[j/2].x, pre_p[j/2].y, c->x, c->y, t);
  50101. k++;
  50102. sp_1024_proj_point_add_32(c, c, &pre_p[j/2], t);
  50103. sp_1024_mont_map_32(c, t);
  50104. }
  50105. else {
  50106. XMEMCPY(neg->x, pre_p[-j / 2].x, sizeof(pre_p->x));
  50107. sp_1024_mont_sub_32(neg->y, p1024_mod, pre_p[-j / 2].y,
  50108. p1024_mod);
  50109. XMEMCPY(neg->z, pre_p[-j / 2].z, sizeof(pre_p->z));
  50110. sp_1024_accum_add_calc_lc_32(precomp[k].x, precomp[k].y,
  50111. neg->x, neg->y, c->x, c->y, t);
  50112. k++;
  50113. sp_1024_proj_point_add_32(c, c, neg, t);
  50114. sp_1024_mont_map_32(c, t);
  50115. }
  50116. for (j = 0; j < sp_1024_order_op_pre[i + 1]; j++) {
  50117. sp_1024_accum_dbl_calc_lc_32(precomp[k].x, precomp[k].y, c->x, c->y, t);
  50118. k++;
  50119. sp_1024_proj_point_dbl_32(c, c, t);
  50120. sp_1024_mont_map_32(c, t);
  50121. }
  50122. }
  50123. *len = sizeof(sp_table_entry_1024) * 1167;
  50124. }
  50125. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  50126. !defined(WOLFSSL_SP_NO_MALLOC)
  50127. if (td != NULL) {
  50128. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  50129. }
  50130. #endif
  50131. sp_1024_point_free_32(neg, 1, NULL);
  50132. sp_1024_point_free_32(c, 1, NULL);
  50133. sp_1024_point_free_32(p, 1, NULL);
  50134. return err;
  50135. }
  50136. /*
  50137. * Calculate r = pairing <P, Q>.
  50138. *
  50139. * That is, multiply base in PF_p[q] by the scalar s, such that s.P = Q.
  50140. *
  50141. * Sliding window. Start at bottom and stop when bottom bit is one.
  50142. * Subtract if top bit in window is one.
  50143. * Width of 6 bits.
  50144. * Pre-generate values in window (1, 3, ...) - only V.
  50145. * Table contains all gradient l and a constant for each point on the path.
  50146. *
  50147. * @param [in] pm First point on E(F_p)[q].
  50148. * @param [in] qm Second point on E(F_p)[q].
  50149. * @param [in] res Result of calculation.
  50150. * @param [in] table Precomputed table of values.
  50151. * @param [in] len Length of precomputed table of values in bytes.
  50152. * @return 0 on success.
  50153. * @return MEMORY_E when dynamic memory allocation fails.
  50154. */
  50155. int sp_Pairing_precomp_1024(const ecc_point* pm, const ecc_point* qm,
  50156. mp_int* res, const byte* table, word32 len)
  50157. {
  50158. int err = 0;
  50159. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  50160. !defined(WOLFSSL_SP_NO_MALLOC)
  50161. sp_digit* td = NULL;
  50162. sp_digit* t;
  50163. sp_digit* vx;
  50164. sp_digit* vy;
  50165. sp_digit (*pre_vx)[64];
  50166. sp_digit (*pre_vy)[64];
  50167. sp_digit (*pre_nvy)[64];
  50168. #else
  50169. sp_digit t[6 * 2 * 32];
  50170. sp_digit vx[2 * 32];
  50171. sp_digit vy[2 * 32];
  50172. sp_digit pre_vx[16][64];
  50173. sp_digit pre_vy[16][64];
  50174. sp_digit pre_nvy[16][64];
  50175. sp_point_1024 pd;
  50176. sp_point_1024 qd;
  50177. sp_point_1024 cd;
  50178. #endif
  50179. sp_point_1024* p = NULL;
  50180. sp_point_1024* q = NULL;
  50181. sp_point_1024* c = NULL;
  50182. sp_digit* r = NULL;
  50183. int i;
  50184. int j;
  50185. int k;
  50186. const sp_table_entry_1024* precomp = (const sp_table_entry_1024*)table;
  50187. if (len < (int)(sizeof(sp_table_entry_1024) * 1167)) {
  50188. err = BUFFER_E;
  50189. }
  50190. if (err == MP_OKAY) {
  50191. err = sp_1024_point_new_32(NULL, pd, p);
  50192. }
  50193. if (err == MP_OKAY) {
  50194. err = sp_1024_point_new_32(NULL, qd, q);
  50195. }
  50196. if (err == MP_OKAY) {
  50197. err = sp_1024_point_new_32(NULL, cd, c);
  50198. }
  50199. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  50200. !defined(WOLFSSL_SP_NO_MALLOC)
  50201. if (err == MP_OKAY) {
  50202. td = (sp_digit*)XMALLOC(sizeof(sp_digit) * 56 * 32 * 2, NULL,
  50203. DYNAMIC_TYPE_TMP_BUFFER);
  50204. if (td == NULL) {
  50205. err = MEMORY_E;
  50206. }
  50207. }
  50208. #endif
  50209. if (err == MP_OKAY) {
  50210. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  50211. !defined(WOLFSSL_SP_NO_MALLOC)
  50212. t = td;
  50213. vx = td + 6 * 32 * 2;
  50214. vy = td + 7 * 32 * 2;
  50215. pre_vx = (sp_digit(*)[64])(td + 8 * 32 * 2);
  50216. pre_vy = (sp_digit(*)[64])(td + 24 * 32 * 2);
  50217. pre_nvy = (sp_digit(*)[64])(td + 40 * 32 * 2);
  50218. #endif
  50219. r = vy;
  50220. sp_1024_point_from_ecc_point_32(p, pm);
  50221. sp_1024_point_from_ecc_point_32(q, qm);
  50222. err = sp_1024_mod_mul_norm_32(p->x, p->x, p1024_mod);
  50223. }
  50224. if (err == MP_OKAY) {
  50225. err = sp_1024_mod_mul_norm_32(p->y, p->y, p1024_mod);
  50226. }
  50227. if (err == MP_OKAY) {
  50228. err = sp_1024_mod_mul_norm_32(p->z, p->z, p1024_mod);
  50229. }
  50230. if (err == MP_OKAY) {
  50231. err = sp_1024_mod_mul_norm_32(q->x, q->x, p1024_mod);
  50232. }
  50233. if (err == MP_OKAY) {
  50234. err = sp_1024_mod_mul_norm_32(q->y, q->y, p1024_mod);
  50235. }
  50236. if (err == MP_OKAY) {
  50237. /* Generate pre-computation table: 1, 3, ... , 31 */
  50238. XMEMSET(pre_vx[0], 0, sizeof(sp_digit) * 2 * 32);
  50239. pre_vx[0][0] = 1;
  50240. XMEMSET(pre_vy[0], 0, sizeof(sp_digit) * 2 * 32);
  50241. sp_1024_mont_sub_32(pre_nvy[0], p1024_mod, pre_vy[0], p1024_mod);
  50242. /* [2]P for adding */
  50243. XMEMCPY(c, p, sizeof(sp_point_1024));
  50244. XMEMSET(vx, 0, sizeof(sp_digit) * 2 * 32);
  50245. vx[0] = 1;
  50246. XMEMSET(vy, 0, sizeof(sp_digit) * 2 * 32);
  50247. sp_1024_accumulate_line_dbl_32(vx, vy, c, q, t);
  50248. /* 3, 5, ... */
  50249. for (i = 1; i < 16; i++) {
  50250. XMEMCPY(pre_vx[i], pre_vx[i-1], sizeof(sp_digit) * 2 * 32);
  50251. XMEMCPY(pre_vy[i], pre_vy[i-1], sizeof(sp_digit) * 2 * 32);
  50252. sp_1024_proj_mul_32(pre_vx[i], pre_vy[i], vx, vy, t);
  50253. sp_1024_accumulate_line_add_n_32(pre_vx[i], pre_vy[i], c,
  50254. q, p, t, 0);
  50255. sp_1024_mont_sub_32(pre_nvy[i], p1024_mod, pre_vy[i],
  50256. p1024_mod);
  50257. }
  50258. XMEMCPY(c->z, p1024_norm_mod, sizeof(sp_digit) * 32);
  50259. c->infinity = 0;
  50260. j = sp_1024_order_op_pre[0] / 2;
  50261. XMEMCPY(vx, pre_vx[j], sizeof(sp_digit) * 2 * 32);
  50262. XMEMCPY(vy, pre_vy[j], sizeof(sp_digit) * 2 * 32);
  50263. k = 0;
  50264. for (j = 0; j < sp_1024_order_op_pre[1]; j++) {
  50265. /* Accumulate line into v and double point. */
  50266. sp_1024_accumulate_line_lc_32(vx, vy, precomp[k].x,
  50267. precomp[k].y, q, t, 1);
  50268. k++;
  50269. }
  50270. for (i = 2; i < 290; i += 2) {
  50271. sp_1024_accumulate_line_lc_32(vx, vy, precomp[k].x,
  50272. precomp[k].y, q, t, 0);
  50273. k++;
  50274. j = sp_1024_order_op_pre[i];
  50275. if (j > 0) {
  50276. j /= 2;
  50277. /* Accumulate line into v. */
  50278. sp_1024_proj_mul_32(vx, vy, pre_vx[j], pre_vy[j], t);
  50279. }
  50280. else {
  50281. j = -j / 2;
  50282. /* Accumulate line into v. */
  50283. sp_1024_proj_mul_32(vx, vy, pre_vx[j], pre_nvy[j], t);
  50284. }
  50285. for (j = 0; j < sp_1024_order_op_pre[i + 1]; j++) {
  50286. /* Accumulate line into v and double point. */
  50287. sp_1024_accumulate_line_lc_32(vx, vy, precomp[k].x,
  50288. precomp[k].y, q, t, 1);
  50289. k++;
  50290. }
  50291. }
  50292. /* Final exponentiation */
  50293. sp_1024_proj_sqr_32(vx, vy, t);
  50294. sp_1024_proj_sqr_32(vx, vy, t);
  50295. /* Convert from PF_p[q] to F_p */
  50296. sp_1024_mont_inv_32(vx, vx, t);
  50297. sp_1024_mont_mul_32(r, vx, vy, p1024_mod, p1024_mp_mod);
  50298. XMEMSET(r + 32, 0, sizeof(sp_digit) * 32);
  50299. sp_1024_mont_reduce_32(r, p1024_mod, p1024_mp_mod);
  50300. err = sp_1024_to_mp(r, res);
  50301. }
  50302. #if (defined(WOLFSSL_SP_SMALL) || defined(WOLFSSL_SMALL_STACK)) && \
  50303. !defined(WOLFSSL_SP_NO_MALLOC)
  50304. if (td != NULL) {
  50305. XFREE(td, NULL, DYNAMIC_TYPE_TMP_BUFFER);
  50306. }
  50307. #endif
  50308. sp_1024_point_free_32(c, 1, NULL);
  50309. sp_1024_point_free_32(q, 1, NULL);
  50310. sp_1024_point_free_32(p, 1, NULL);
  50311. return err;
  50312. }
  50313. #endif /* WOLFSSL_SP_SMALL */
  50314. #ifdef HAVE_ECC_CHECK_KEY
  50315. /* Read big endian unsigned byte array into r.
  50316. *
  50317. * r A single precision integer.
  50318. * size Maximum number of bytes to convert
  50319. * a Byte array.
  50320. * n Number of bytes in array to read.
  50321. */
  50322. static void sp_1024_from_bin(sp_digit* r, int size, const byte* a, int n)
  50323. {
  50324. int i;
  50325. int j;
  50326. byte* d;
  50327. for (i = n - 1,j = 0; i >= 3; i -= 4) {
  50328. r[j] = ((sp_digit)a[i - 0] << 0) |
  50329. ((sp_digit)a[i - 1] << 8) |
  50330. ((sp_digit)a[i - 2] << 16) |
  50331. ((sp_digit)a[i - 3] << 24);
  50332. j++;
  50333. }
  50334. if (i >= 0) {
  50335. r[j] = 0;
  50336. d = (byte*)r;
  50337. switch (i) {
  50338. case 2: d[n - 1 - 2] = a[2]; //fallthrough
  50339. case 1: d[n - 1 - 1] = a[1]; //fallthrough
  50340. case 0: d[n - 1 - 0] = a[0]; //fallthrough
  50341. }
  50342. j++;
  50343. }
  50344. for (; j < size; j++) {
  50345. r[j] = 0;
  50346. }
  50347. }
  50348. /* Check that the x and y oridinates are a valid point on the curve.
  50349. *
  50350. * point EC point.
  50351. * heap Heap to use if dynamically allocating.
  50352. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  50353. * not on the curve and MP_OKAY otherwise.
  50354. */
  50355. static int sp_1024_ecc_is_point_32(const sp_point_1024* point,
  50356. void* heap)
  50357. {
  50358. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  50359. sp_digit* t1 = NULL;
  50360. #else
  50361. sp_digit t1[32 * 4];
  50362. #endif
  50363. sp_digit* t2 = NULL;
  50364. sp_int32 n;
  50365. int err = MP_OKAY;
  50366. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  50367. t1 = (sp_digit*)XMALLOC(sizeof(sp_digit) * 32 * 4, heap, DYNAMIC_TYPE_ECC);
  50368. if (t1 == NULL)
  50369. err = MEMORY_E;
  50370. #endif
  50371. (void)heap;
  50372. if (err == MP_OKAY) {
  50373. t2 = t1 + 2 * 32;
  50374. sp_1024_sqr_32(t1, point->y);
  50375. (void)sp_1024_mod_32(t1, t1, p1024_mod);
  50376. sp_1024_sqr_32(t2, point->x);
  50377. (void)sp_1024_mod_32(t2, t2, p1024_mod);
  50378. sp_1024_mul_32(t2, t2, point->x);
  50379. (void)sp_1024_mod_32(t2, t2, p1024_mod);
  50380. (void)sp_1024_sub_32(t2, p1024_mod, t2);
  50381. sp_1024_mont_add_32(t1, t1, t2, p1024_mod);
  50382. sp_1024_mont_add_32(t1, t1, point->x, p1024_mod);
  50383. sp_1024_mont_add_32(t1, t1, point->x, p1024_mod);
  50384. sp_1024_mont_add_32(t1, t1, point->x, p1024_mod);
  50385. n = sp_1024_cmp_32(t1, p1024_mod);
  50386. sp_1024_cond_sub_32(t1, t1, p1024_mod, ~(n >> 31));
  50387. sp_1024_norm_32(t1);
  50388. if (!sp_1024_iszero_32(t1)) {
  50389. err = MP_VAL;
  50390. }
  50391. }
  50392. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  50393. if (t1 != NULL)
  50394. XFREE(t1, heap, DYNAMIC_TYPE_ECC);
  50395. #endif
  50396. return err;
  50397. }
  50398. /* Check that the x and y oridinates are a valid point on the curve.
  50399. *
  50400. * pX X ordinate of EC point.
  50401. * pY Y ordinate of EC point.
  50402. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  50403. * not on the curve and MP_OKAY otherwise.
  50404. */
  50405. int sp_ecc_is_point_1024(const mp_int* pX, const mp_int* pY)
  50406. {
  50407. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  50408. sp_point_1024* pub = NULL;
  50409. #else
  50410. sp_point_1024 pub[1];
  50411. #endif
  50412. const byte one[1] = { 1 };
  50413. int err = MP_OKAY;
  50414. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  50415. pub = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024), NULL,
  50416. DYNAMIC_TYPE_ECC);
  50417. if (pub == NULL)
  50418. err = MEMORY_E;
  50419. #endif
  50420. if (err == MP_OKAY) {
  50421. sp_1024_from_mp(pub->x, 32, pX);
  50422. sp_1024_from_mp(pub->y, 32, pY);
  50423. sp_1024_from_bin(pub->z, 32, one, (int)sizeof(one));
  50424. err = sp_1024_ecc_is_point_32(pub, NULL);
  50425. }
  50426. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  50427. if (pub != NULL)
  50428. XFREE(pub, NULL, DYNAMIC_TYPE_ECC);
  50429. #endif
  50430. return err;
  50431. }
  50432. /* Check that the private scalar generates the EC point (px, py), the point is
  50433. * on the curve and the point has the correct order.
  50434. *
  50435. * pX X ordinate of EC point.
  50436. * pY Y ordinate of EC point.
  50437. * privm Private scalar that generates EC point.
  50438. * returns MEMORY_E if dynamic memory allocation fails, MP_VAL if the point is
  50439. * not on the curve, ECC_INF_E if the point does not have the correct order,
  50440. * ECC_PRIV_KEY_E when the private scalar doesn't generate the EC point and
  50441. * MP_OKAY otherwise.
  50442. */
  50443. int sp_ecc_check_key_1024(const mp_int* pX, const mp_int* pY,
  50444. const mp_int* privm, void* heap)
  50445. {
  50446. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  50447. sp_digit* priv = NULL;
  50448. sp_point_1024* pub = NULL;
  50449. #else
  50450. sp_digit priv[32];
  50451. sp_point_1024 pub[2];
  50452. #endif
  50453. sp_point_1024* p = NULL;
  50454. const byte one[1] = { 1 };
  50455. int err = MP_OKAY;
  50456. /* Quick check the lengs of public key ordinates and private key are in
  50457. * range. Proper check later.
  50458. */
  50459. if (((mp_count_bits(pX) > 1024) ||
  50460. (mp_count_bits(pY) > 1024) ||
  50461. ((privm != NULL) && (mp_count_bits(privm) > 1024)))) {
  50462. err = ECC_OUT_OF_RANGE_E;
  50463. }
  50464. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  50465. if (err == MP_OKAY) {
  50466. pub = (sp_point_1024*)XMALLOC(sizeof(sp_point_1024) * 2, heap,
  50467. DYNAMIC_TYPE_ECC);
  50468. if (pub == NULL)
  50469. err = MEMORY_E;
  50470. }
  50471. if (err == MP_OKAY && privm) {
  50472. priv = (sp_digit*)XMALLOC(sizeof(sp_digit) * 32, heap,
  50473. DYNAMIC_TYPE_ECC);
  50474. if (priv == NULL)
  50475. err = MEMORY_E;
  50476. }
  50477. #endif
  50478. if (err == MP_OKAY) {
  50479. p = pub + 1;
  50480. sp_1024_from_mp(pub->x, 32, pX);
  50481. sp_1024_from_mp(pub->y, 32, pY);
  50482. sp_1024_from_bin(pub->z, 32, one, (int)sizeof(one));
  50483. if (privm)
  50484. sp_1024_from_mp(priv, 32, privm);
  50485. /* Check point at infinitiy. */
  50486. if ((sp_1024_iszero_32(pub->x) != 0) &&
  50487. (sp_1024_iszero_32(pub->y) != 0)) {
  50488. err = ECC_INF_E;
  50489. }
  50490. }
  50491. /* Check range of X and Y */
  50492. if ((err == MP_OKAY) &&
  50493. ((sp_1024_cmp_32(pub->x, p1024_mod) >= 0) ||
  50494. (sp_1024_cmp_32(pub->y, p1024_mod) >= 0))) {
  50495. err = ECC_OUT_OF_RANGE_E;
  50496. }
  50497. if (err == MP_OKAY) {
  50498. /* Check point is on curve */
  50499. err = sp_1024_ecc_is_point_32(pub, heap);
  50500. }
  50501. if (err == MP_OKAY) {
  50502. /* Point * order = infinity */
  50503. err = sp_1024_ecc_mulmod_32(p, pub, p1024_order, 1, 1, heap);
  50504. }
  50505. /* Check result is infinity */
  50506. if ((err == MP_OKAY) && ((sp_1024_iszero_32(p->x) == 0) ||
  50507. (sp_1024_iszero_32(p->y) == 0))) {
  50508. err = ECC_INF_E;
  50509. }
  50510. if (privm) {
  50511. if (err == MP_OKAY) {
  50512. /* Base * private = point */
  50513. err = sp_1024_ecc_mulmod_base_32(p, priv, 1, 1, heap);
  50514. }
  50515. /* Check result is public key */
  50516. if ((err == MP_OKAY) &&
  50517. ((sp_1024_cmp_32(p->x, pub->x) != 0) ||
  50518. (sp_1024_cmp_32(p->y, pub->y) != 0))) {
  50519. err = ECC_PRIV_KEY_E;
  50520. }
  50521. }
  50522. #if defined(WOLFSSL_SMALL_STACK) && !defined(WOLFSSL_SP_NO_MALLOC)
  50523. if (pub != NULL)
  50524. XFREE(pub, heap, DYNAMIC_TYPE_ECC);
  50525. if (priv != NULL)
  50526. XFREE(priv, heap, DYNAMIC_TYPE_ECC);
  50527. #endif
  50528. return err;
  50529. }
  50530. #endif
  50531. #endif /* WOLFSSL_SP_1024 */
  50532. #endif /* WOLFSSL_HAVE_SP_ECC */
  50533. #endif /* WOLFSSL_SP_ARM_CORTEX_M_ASM */
  50534. #endif /* WOLFSSL_HAVE_SP_RSA | WOLFSSL_HAVE_SP_DH | WOLFSSL_HAVE_SP_ECC */