ecp_nistp224.c 60 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759
  1. /*
  2. * Copyright 2010-2018 The OpenSSL Project Authors. All Rights Reserved.
  3. *
  4. * Licensed under the Apache License 2.0 (the "License"). You may not use
  5. * this file except in compliance with the License. You can obtain a copy
  6. * in the file LICENSE in the source distribution or at
  7. * https://www.openssl.org/source/license.html
  8. */
  9. /* Copyright 2011 Google Inc.
  10. *
  11. * Licensed under the Apache License, Version 2.0 (the "License");
  12. *
  13. * you may not use this file except in compliance with the License.
  14. * You may obtain a copy of the License at
  15. *
  16. * http://www.apache.org/licenses/LICENSE-2.0
  17. *
  18. * Unless required by applicable law or agreed to in writing, software
  19. * distributed under the License is distributed on an "AS IS" BASIS,
  20. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  21. * See the License for the specific language governing permissions and
  22. * limitations under the License.
  23. */
  24. /*
  25. * ECDSA low level APIs are deprecated for public use, but still ok for
  26. * internal use.
  27. */
  28. #include "internal/deprecated.h"
  29. /*
  30. * A 64-bit implementation of the NIST P-224 elliptic curve point multiplication
  31. *
  32. * Inspired by Daniel J. Bernstein's public domain nistp224 implementation
  33. * and Adam Langley's public domain 64-bit C implementation of curve25519
  34. */
  35. #include <openssl/opensslconf.h>
  36. #ifdef OPENSSL_NO_EC_NISTP_64_GCC_128
  37. NON_EMPTY_TRANSLATION_UNIT
  38. #else
  39. # include <stdint.h>
  40. # include <string.h>
  41. # include <openssl/err.h>
  42. # include "ec_local.h"
  43. # if defined(__SIZEOF_INT128__) && __SIZEOF_INT128__==16
  44. /* even with gcc, the typedef won't work for 32-bit platforms */
  45. typedef __uint128_t uint128_t; /* nonstandard; implemented by gcc on 64-bit
  46. * platforms */
  47. # else
  48. # error "Your compiler doesn't appear to support 128-bit integer types"
  49. # endif
  50. typedef uint8_t u8;
  51. typedef uint64_t u64;
  52. /******************************************************************************/
  53. /*-
  54. * INTERNAL REPRESENTATION OF FIELD ELEMENTS
  55. *
  56. * Field elements are represented as a_0 + 2^56*a_1 + 2^112*a_2 + 2^168*a_3
  57. * using 64-bit coefficients called 'limbs',
  58. * and sometimes (for multiplication results) as
  59. * b_0 + 2^56*b_1 + 2^112*b_2 + 2^168*b_3 + 2^224*b_4 + 2^280*b_5 + 2^336*b_6
  60. * using 128-bit coefficients called 'widelimbs'.
  61. * A 4-limb representation is an 'felem';
  62. * a 7-widelimb representation is a 'widefelem'.
  63. * Even within felems, bits of adjacent limbs overlap, and we don't always
  64. * reduce the representations: we ensure that inputs to each felem
  65. * multiplication satisfy a_i < 2^60, so outputs satisfy b_i < 4*2^60*2^60,
  66. * and fit into a 128-bit word without overflow. The coefficients are then
  67. * again partially reduced to obtain an felem satisfying a_i < 2^57.
  68. * We only reduce to the unique minimal representation at the end of the
  69. * computation.
  70. */
  71. typedef uint64_t limb;
  72. typedef uint128_t widelimb;
  73. typedef limb felem[4];
  74. typedef widelimb widefelem[7];
  75. /*
  76. * Field element represented as a byte array. 28*8 = 224 bits is also the
  77. * group order size for the elliptic curve, and we also use this type for
  78. * scalars for point multiplication.
  79. */
  80. typedef u8 felem_bytearray[28];
  81. static const felem_bytearray nistp224_curve_params[5] = {
  82. {0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, /* p */
  83. 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0x00, 0x00, 0x00, 0x00,
  84. 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x01},
  85. {0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, /* a */
  86. 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFE, 0xFF, 0xFF, 0xFF, 0xFF,
  87. 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFE},
  88. {0xB4, 0x05, 0x0A, 0x85, 0x0C, 0x04, 0xB3, 0xAB, 0xF5, 0x41, /* b */
  89. 0x32, 0x56, 0x50, 0x44, 0xB0, 0xB7, 0xD7, 0xBF, 0xD8, 0xBA,
  90. 0x27, 0x0B, 0x39, 0x43, 0x23, 0x55, 0xFF, 0xB4},
  91. {0xB7, 0x0E, 0x0C, 0xBD, 0x6B, 0xB4, 0xBF, 0x7F, 0x32, 0x13, /* x */
  92. 0x90, 0xB9, 0x4A, 0x03, 0xC1, 0xD3, 0x56, 0xC2, 0x11, 0x22,
  93. 0x34, 0x32, 0x80, 0xD6, 0x11, 0x5C, 0x1D, 0x21},
  94. {0xbd, 0x37, 0x63, 0x88, 0xb5, 0xf7, 0x23, 0xfb, 0x4c, 0x22, /* y */
  95. 0xdf, 0xe6, 0xcd, 0x43, 0x75, 0xa0, 0x5a, 0x07, 0x47, 0x64,
  96. 0x44, 0xd5, 0x81, 0x99, 0x85, 0x00, 0x7e, 0x34}
  97. };
  98. /*-
  99. * Precomputed multiples of the standard generator
  100. * Points are given in coordinates (X, Y, Z) where Z normally is 1
  101. * (0 for the point at infinity).
  102. * For each field element, slice a_0 is word 0, etc.
  103. *
  104. * The table has 2 * 16 elements, starting with the following:
  105. * index | bits | point
  106. * ------+---------+------------------------------
  107. * 0 | 0 0 0 0 | 0G
  108. * 1 | 0 0 0 1 | 1G
  109. * 2 | 0 0 1 0 | 2^56G
  110. * 3 | 0 0 1 1 | (2^56 + 1)G
  111. * 4 | 0 1 0 0 | 2^112G
  112. * 5 | 0 1 0 1 | (2^112 + 1)G
  113. * 6 | 0 1 1 0 | (2^112 + 2^56)G
  114. * 7 | 0 1 1 1 | (2^112 + 2^56 + 1)G
  115. * 8 | 1 0 0 0 | 2^168G
  116. * 9 | 1 0 0 1 | (2^168 + 1)G
  117. * 10 | 1 0 1 0 | (2^168 + 2^56)G
  118. * 11 | 1 0 1 1 | (2^168 + 2^56 + 1)G
  119. * 12 | 1 1 0 0 | (2^168 + 2^112)G
  120. * 13 | 1 1 0 1 | (2^168 + 2^112 + 1)G
  121. * 14 | 1 1 1 0 | (2^168 + 2^112 + 2^56)G
  122. * 15 | 1 1 1 1 | (2^168 + 2^112 + 2^56 + 1)G
  123. * followed by a copy of this with each element multiplied by 2^28.
  124. *
  125. * The reason for this is so that we can clock bits into four different
  126. * locations when doing simple scalar multiplies against the base point,
  127. * and then another four locations using the second 16 elements.
  128. */
  129. static const felem gmul[2][16][3] = {
  130. {{{0, 0, 0, 0},
  131. {0, 0, 0, 0},
  132. {0, 0, 0, 0}},
  133. {{0x3280d6115c1d21, 0xc1d356c2112234, 0x7f321390b94a03, 0xb70e0cbd6bb4bf},
  134. {0xd5819985007e34, 0x75a05a07476444, 0xfb4c22dfe6cd43, 0xbd376388b5f723},
  135. {1, 0, 0, 0}},
  136. {{0xfd9675666ebbe9, 0xbca7664d40ce5e, 0x2242df8d8a2a43, 0x1f49bbb0f99bc5},
  137. {0x29e0b892dc9c43, 0xece8608436e662, 0xdc858f185310d0, 0x9812dd4eb8d321},
  138. {1, 0, 0, 0}},
  139. {{0x6d3e678d5d8eb8, 0x559eed1cb362f1, 0x16e9a3bbce8a3f, 0xeedcccd8c2a748},
  140. {0xf19f90ed50266d, 0xabf2b4bf65f9df, 0x313865468fafec, 0x5cb379ba910a17},
  141. {1, 0, 0, 0}},
  142. {{0x0641966cab26e3, 0x91fb2991fab0a0, 0xefec27a4e13a0b, 0x0499aa8a5f8ebe},
  143. {0x7510407766af5d, 0x84d929610d5450, 0x81d77aae82f706, 0x6916f6d4338c5b},
  144. {1, 0, 0, 0}},
  145. {{0xea95ac3b1f15c6, 0x086000905e82d4, 0xdd323ae4d1c8b1, 0x932b56be7685a3},
  146. {0x9ef93dea25dbbf, 0x41665960f390f0, 0xfdec76dbe2a8a7, 0x523e80f019062a},
  147. {1, 0, 0, 0}},
  148. {{0x822fdd26732c73, 0xa01c83531b5d0f, 0x363f37347c1ba4, 0xc391b45c84725c},
  149. {0xbbd5e1b2d6ad24, 0xddfbcde19dfaec, 0xc393da7e222a7f, 0x1efb7890ede244},
  150. {1, 0, 0, 0}},
  151. {{0x4c9e90ca217da1, 0xd11beca79159bb, 0xff8d33c2c98b7c, 0x2610b39409f849},
  152. {0x44d1352ac64da0, 0xcdbb7b2c46b4fb, 0x966c079b753c89, 0xfe67e4e820b112},
  153. {1, 0, 0, 0}},
  154. {{0xe28cae2df5312d, 0xc71b61d16f5c6e, 0x79b7619a3e7c4c, 0x05c73240899b47},
  155. {0x9f7f6382c73e3a, 0x18615165c56bda, 0x641fab2116fd56, 0x72855882b08394},
  156. {1, 0, 0, 0}},
  157. {{0x0469182f161c09, 0x74a98ca8d00fb5, 0xb89da93489a3e0, 0x41c98768fb0c1d},
  158. {0xe5ea05fb32da81, 0x3dce9ffbca6855, 0x1cfe2d3fbf59e6, 0x0e5e03408738a7},
  159. {1, 0, 0, 0}},
  160. {{0xdab22b2333e87f, 0x4430137a5dd2f6, 0xe03ab9f738beb8, 0xcb0c5d0dc34f24},
  161. {0x764a7df0c8fda5, 0x185ba5c3fa2044, 0x9281d688bcbe50, 0xc40331df893881},
  162. {1, 0, 0, 0}},
  163. {{0xb89530796f0f60, 0xade92bd26909a3, 0x1a0c83fb4884da, 0x1765bf22a5a984},
  164. {0x772a9ee75db09e, 0x23bc6c67cec16f, 0x4c1edba8b14e2f, 0xe2a215d9611369},
  165. {1, 0, 0, 0}},
  166. {{0x571e509fb5efb3, 0xade88696410552, 0xc8ae85fada74fe, 0x6c7e4be83bbde3},
  167. {0xff9f51160f4652, 0xb47ce2495a6539, 0xa2946c53b582f4, 0x286d2db3ee9a60},
  168. {1, 0, 0, 0}},
  169. {{0x40bbd5081a44af, 0x0995183b13926c, 0xbcefba6f47f6d0, 0x215619e9cc0057},
  170. {0x8bc94d3b0df45e, 0xf11c54a3694f6f, 0x8631b93cdfe8b5, 0xe7e3f4b0982db9},
  171. {1, 0, 0, 0}},
  172. {{0xb17048ab3e1c7b, 0xac38f36ff8a1d8, 0x1c29819435d2c6, 0xc813132f4c07e9},
  173. {0x2891425503b11f, 0x08781030579fea, 0xf5426ba5cc9674, 0x1e28ebf18562bc},
  174. {1, 0, 0, 0}},
  175. {{0x9f31997cc864eb, 0x06cd91d28b5e4c, 0xff17036691a973, 0xf1aef351497c58},
  176. {0xdd1f2d600564ff, 0xdead073b1402db, 0x74a684435bd693, 0xeea7471f962558},
  177. {1, 0, 0, 0}}},
  178. {{{0, 0, 0, 0},
  179. {0, 0, 0, 0},
  180. {0, 0, 0, 0}},
  181. {{0x9665266dddf554, 0x9613d78b60ef2d, 0xce27a34cdba417, 0xd35ab74d6afc31},
  182. {0x85ccdd22deb15e, 0x2137e5783a6aab, 0xa141cffd8c93c6, 0x355a1830e90f2d},
  183. {1, 0, 0, 0}},
  184. {{0x1a494eadaade65, 0xd6da4da77fe53c, 0xe7992996abec86, 0x65c3553c6090e3},
  185. {0xfa610b1fb09346, 0xf1c6540b8a4aaf, 0xc51a13ccd3cbab, 0x02995b1b18c28a},
  186. {1, 0, 0, 0}},
  187. {{0x7874568e7295ef, 0x86b419fbe38d04, 0xdc0690a7550d9a, 0xd3966a44beac33},
  188. {0x2b7280ec29132f, 0xbeaa3b6a032df3, 0xdc7dd88ae41200, 0xd25e2513e3a100},
  189. {1, 0, 0, 0}},
  190. {{0x924857eb2efafd, 0xac2bce41223190, 0x8edaa1445553fc, 0x825800fd3562d5},
  191. {0x8d79148ea96621, 0x23a01c3dd9ed8d, 0xaf8b219f9416b5, 0xd8db0cc277daea},
  192. {1, 0, 0, 0}},
  193. {{0x76a9c3b1a700f0, 0xe9acd29bc7e691, 0x69212d1a6b0327, 0x6322e97fe154be},
  194. {0x469fc5465d62aa, 0x8d41ed18883b05, 0x1f8eae66c52b88, 0xe4fcbe9325be51},
  195. {1, 0, 0, 0}},
  196. {{0x825fdf583cac16, 0x020b857c7b023a, 0x683c17744b0165, 0x14ffd0a2daf2f1},
  197. {0x323b36184218f9, 0x4944ec4e3b47d4, 0xc15b3080841acf, 0x0bced4b01a28bb},
  198. {1, 0, 0, 0}},
  199. {{0x92ac22230df5c4, 0x52f33b4063eda8, 0xcb3f19870c0c93, 0x40064f2ba65233},
  200. {0xfe16f0924f8992, 0x012da25af5b517, 0x1a57bb24f723a6, 0x06f8bc76760def},
  201. {1, 0, 0, 0}},
  202. {{0x4a7084f7817cb9, 0xbcab0738ee9a78, 0x3ec11e11d9c326, 0xdc0fe90e0f1aae},
  203. {0xcf639ea5f98390, 0x5c350aa22ffb74, 0x9afae98a4047b7, 0x956ec2d617fc45},
  204. {1, 0, 0, 0}},
  205. {{0x4306d648c1be6a, 0x9247cd8bc9a462, 0xf5595e377d2f2e, 0xbd1c3caff1a52e},
  206. {0x045e14472409d0, 0x29f3e17078f773, 0x745a602b2d4f7d, 0x191837685cdfbb},
  207. {1, 0, 0, 0}},
  208. {{0x5b6ee254a8cb79, 0x4953433f5e7026, 0xe21faeb1d1def4, 0xc4c225785c09de},
  209. {0x307ce7bba1e518, 0x31b125b1036db8, 0x47e91868839e8f, 0xc765866e33b9f3},
  210. {1, 0, 0, 0}},
  211. {{0x3bfece24f96906, 0x4794da641e5093, 0xde5df64f95db26, 0x297ecd89714b05},
  212. {0x701bd3ebb2c3aa, 0x7073b4f53cb1d5, 0x13c5665658af16, 0x9895089d66fe58},
  213. {1, 0, 0, 0}},
  214. {{0x0fef05f78c4790, 0x2d773633b05d2e, 0x94229c3a951c94, 0xbbbd70df4911bb},
  215. {0xb2c6963d2c1168, 0x105f47a72b0d73, 0x9fdf6111614080, 0x7b7e94b39e67b0},
  216. {1, 0, 0, 0}},
  217. {{0xad1a7d6efbe2b3, 0xf012482c0da69d, 0x6b3bdf12438345, 0x40d7558d7aa4d9},
  218. {0x8a09fffb5c6d3d, 0x9a356e5d9ffd38, 0x5973f15f4f9b1c, 0xdcd5f59f63c3ea},
  219. {1, 0, 0, 0}},
  220. {{0xacf39f4c5ca7ab, 0x4c8071cc5fd737, 0xc64e3602cd1184, 0x0acd4644c9abba},
  221. {0x6c011a36d8bf6e, 0xfecd87ba24e32a, 0x19f6f56574fad8, 0x050b204ced9405},
  222. {1, 0, 0, 0}},
  223. {{0xed4f1cae7d9a96, 0x5ceef7ad94c40a, 0x778e4a3bf3ef9b, 0x7405783dc3b55e},
  224. {0x32477c61b6e8c6, 0xb46a97570f018b, 0x91176d0a7e95d1, 0x3df90fbc4c7d0e},
  225. {1, 0, 0, 0}}}
  226. };
  227. /* Precomputation for the group generator. */
  228. struct nistp224_pre_comp_st {
  229. felem g_pre_comp[2][16][3];
  230. CRYPTO_REF_COUNT references;
  231. CRYPTO_RWLOCK *lock;
  232. };
  233. const EC_METHOD *EC_GFp_nistp224_method(void)
  234. {
  235. static const EC_METHOD ret = {
  236. EC_FLAGS_DEFAULT_OCT,
  237. NID_X9_62_prime_field,
  238. ec_GFp_nistp224_group_init,
  239. ec_GFp_simple_group_finish,
  240. ec_GFp_simple_group_clear_finish,
  241. ec_GFp_nist_group_copy,
  242. ec_GFp_nistp224_group_set_curve,
  243. ec_GFp_simple_group_get_curve,
  244. ec_GFp_simple_group_get_degree,
  245. ec_group_simple_order_bits,
  246. ec_GFp_simple_group_check_discriminant,
  247. ec_GFp_simple_point_init,
  248. ec_GFp_simple_point_finish,
  249. ec_GFp_simple_point_clear_finish,
  250. ec_GFp_simple_point_copy,
  251. ec_GFp_simple_point_set_to_infinity,
  252. ec_GFp_simple_set_Jprojective_coordinates_GFp,
  253. ec_GFp_simple_get_Jprojective_coordinates_GFp,
  254. ec_GFp_simple_point_set_affine_coordinates,
  255. ec_GFp_nistp224_point_get_affine_coordinates,
  256. 0 /* point_set_compressed_coordinates */ ,
  257. 0 /* point2oct */ ,
  258. 0 /* oct2point */ ,
  259. ec_GFp_simple_add,
  260. ec_GFp_simple_dbl,
  261. ec_GFp_simple_invert,
  262. ec_GFp_simple_is_at_infinity,
  263. ec_GFp_simple_is_on_curve,
  264. ec_GFp_simple_cmp,
  265. ec_GFp_simple_make_affine,
  266. ec_GFp_simple_points_make_affine,
  267. ec_GFp_nistp224_points_mul,
  268. ec_GFp_nistp224_precompute_mult,
  269. ec_GFp_nistp224_have_precompute_mult,
  270. ec_GFp_nist_field_mul,
  271. ec_GFp_nist_field_sqr,
  272. 0 /* field_div */ ,
  273. ec_GFp_simple_field_inv,
  274. 0 /* field_encode */ ,
  275. 0 /* field_decode */ ,
  276. 0, /* field_set_to_one */
  277. ec_key_simple_priv2oct,
  278. ec_key_simple_oct2priv,
  279. 0, /* set private */
  280. ec_key_simple_generate_key,
  281. ec_key_simple_check_key,
  282. ec_key_simple_generate_public_key,
  283. 0, /* keycopy */
  284. 0, /* keyfinish */
  285. ecdh_simple_compute_key,
  286. ecdsa_simple_sign_setup,
  287. ecdsa_simple_sign_sig,
  288. ecdsa_simple_verify_sig,
  289. 0, /* field_inverse_mod_ord */
  290. 0, /* blind_coordinates */
  291. 0, /* ladder_pre */
  292. 0, /* ladder_step */
  293. 0 /* ladder_post */
  294. };
  295. return &ret;
  296. }
  297. /*
  298. * Helper functions to convert field elements to/from internal representation
  299. */
  300. static void bin28_to_felem(felem out, const u8 in[28])
  301. {
  302. out[0] = *((const uint64_t *)(in)) & 0x00ffffffffffffff;
  303. out[1] = (*((const uint64_t *)(in + 7))) & 0x00ffffffffffffff;
  304. out[2] = (*((const uint64_t *)(in + 14))) & 0x00ffffffffffffff;
  305. out[3] = (*((const uint64_t *)(in+20))) >> 8;
  306. }
  307. static void felem_to_bin28(u8 out[28], const felem in)
  308. {
  309. unsigned i;
  310. for (i = 0; i < 7; ++i) {
  311. out[i] = in[0] >> (8 * i);
  312. out[i + 7] = in[1] >> (8 * i);
  313. out[i + 14] = in[2] >> (8 * i);
  314. out[i + 21] = in[3] >> (8 * i);
  315. }
  316. }
  317. /* From OpenSSL BIGNUM to internal representation */
  318. static int BN_to_felem(felem out, const BIGNUM *bn)
  319. {
  320. felem_bytearray b_out;
  321. int num_bytes;
  322. if (BN_is_negative(bn)) {
  323. ECerr(EC_F_BN_TO_FELEM, EC_R_BIGNUM_OUT_OF_RANGE);
  324. return 0;
  325. }
  326. num_bytes = BN_bn2lebinpad(bn, b_out, sizeof(b_out));
  327. if (num_bytes < 0) {
  328. ECerr(EC_F_BN_TO_FELEM, EC_R_BIGNUM_OUT_OF_RANGE);
  329. return 0;
  330. }
  331. bin28_to_felem(out, b_out);
  332. return 1;
  333. }
  334. /* From internal representation to OpenSSL BIGNUM */
  335. static BIGNUM *felem_to_BN(BIGNUM *out, const felem in)
  336. {
  337. felem_bytearray b_out;
  338. felem_to_bin28(b_out, in);
  339. return BN_lebin2bn(b_out, sizeof(b_out), out);
  340. }
  341. /******************************************************************************/
  342. /*-
  343. * FIELD OPERATIONS
  344. *
  345. * Field operations, using the internal representation of field elements.
  346. * NB! These operations are specific to our point multiplication and cannot be
  347. * expected to be correct in general - e.g., multiplication with a large scalar
  348. * will cause an overflow.
  349. *
  350. */
  351. static void felem_one(felem out)
  352. {
  353. out[0] = 1;
  354. out[1] = 0;
  355. out[2] = 0;
  356. out[3] = 0;
  357. }
  358. static void felem_assign(felem out, const felem in)
  359. {
  360. out[0] = in[0];
  361. out[1] = in[1];
  362. out[2] = in[2];
  363. out[3] = in[3];
  364. }
  365. /* Sum two field elements: out += in */
  366. static void felem_sum(felem out, const felem in)
  367. {
  368. out[0] += in[0];
  369. out[1] += in[1];
  370. out[2] += in[2];
  371. out[3] += in[3];
  372. }
  373. /* Subtract field elements: out -= in */
  374. /* Assumes in[i] < 2^57 */
  375. static void felem_diff(felem out, const felem in)
  376. {
  377. static const limb two58p2 = (((limb) 1) << 58) + (((limb) 1) << 2);
  378. static const limb two58m2 = (((limb) 1) << 58) - (((limb) 1) << 2);
  379. static const limb two58m42m2 = (((limb) 1) << 58) -
  380. (((limb) 1) << 42) - (((limb) 1) << 2);
  381. /* Add 0 mod 2^224-2^96+1 to ensure out > in */
  382. out[0] += two58p2;
  383. out[1] += two58m42m2;
  384. out[2] += two58m2;
  385. out[3] += two58m2;
  386. out[0] -= in[0];
  387. out[1] -= in[1];
  388. out[2] -= in[2];
  389. out[3] -= in[3];
  390. }
  391. /* Subtract in unreduced 128-bit mode: out -= in */
  392. /* Assumes in[i] < 2^119 */
  393. static void widefelem_diff(widefelem out, const widefelem in)
  394. {
  395. static const widelimb two120 = ((widelimb) 1) << 120;
  396. static const widelimb two120m64 = (((widelimb) 1) << 120) -
  397. (((widelimb) 1) << 64);
  398. static const widelimb two120m104m64 = (((widelimb) 1) << 120) -
  399. (((widelimb) 1) << 104) - (((widelimb) 1) << 64);
  400. /* Add 0 mod 2^224-2^96+1 to ensure out > in */
  401. out[0] += two120;
  402. out[1] += two120m64;
  403. out[2] += two120m64;
  404. out[3] += two120;
  405. out[4] += two120m104m64;
  406. out[5] += two120m64;
  407. out[6] += two120m64;
  408. out[0] -= in[0];
  409. out[1] -= in[1];
  410. out[2] -= in[2];
  411. out[3] -= in[3];
  412. out[4] -= in[4];
  413. out[5] -= in[5];
  414. out[6] -= in[6];
  415. }
  416. /* Subtract in mixed mode: out128 -= in64 */
  417. /* in[i] < 2^63 */
  418. static void felem_diff_128_64(widefelem out, const felem in)
  419. {
  420. static const widelimb two64p8 = (((widelimb) 1) << 64) +
  421. (((widelimb) 1) << 8);
  422. static const widelimb two64m8 = (((widelimb) 1) << 64) -
  423. (((widelimb) 1) << 8);
  424. static const widelimb two64m48m8 = (((widelimb) 1) << 64) -
  425. (((widelimb) 1) << 48) - (((widelimb) 1) << 8);
  426. /* Add 0 mod 2^224-2^96+1 to ensure out > in */
  427. out[0] += two64p8;
  428. out[1] += two64m48m8;
  429. out[2] += two64m8;
  430. out[3] += two64m8;
  431. out[0] -= in[0];
  432. out[1] -= in[1];
  433. out[2] -= in[2];
  434. out[3] -= in[3];
  435. }
  436. /*
  437. * Multiply a field element by a scalar: out = out * scalar The scalars we
  438. * actually use are small, so results fit without overflow
  439. */
  440. static void felem_scalar(felem out, const limb scalar)
  441. {
  442. out[0] *= scalar;
  443. out[1] *= scalar;
  444. out[2] *= scalar;
  445. out[3] *= scalar;
  446. }
  447. /*
  448. * Multiply an unreduced field element by a scalar: out = out * scalar The
  449. * scalars we actually use are small, so results fit without overflow
  450. */
  451. static void widefelem_scalar(widefelem out, const widelimb scalar)
  452. {
  453. out[0] *= scalar;
  454. out[1] *= scalar;
  455. out[2] *= scalar;
  456. out[3] *= scalar;
  457. out[4] *= scalar;
  458. out[5] *= scalar;
  459. out[6] *= scalar;
  460. }
  461. /* Square a field element: out = in^2 */
  462. static void felem_square(widefelem out, const felem in)
  463. {
  464. limb tmp0, tmp1, tmp2;
  465. tmp0 = 2 * in[0];
  466. tmp1 = 2 * in[1];
  467. tmp2 = 2 * in[2];
  468. out[0] = ((widelimb) in[0]) * in[0];
  469. out[1] = ((widelimb) in[0]) * tmp1;
  470. out[2] = ((widelimb) in[0]) * tmp2 + ((widelimb) in[1]) * in[1];
  471. out[3] = ((widelimb) in[3]) * tmp0 + ((widelimb) in[1]) * tmp2;
  472. out[4] = ((widelimb) in[3]) * tmp1 + ((widelimb) in[2]) * in[2];
  473. out[5] = ((widelimb) in[3]) * tmp2;
  474. out[6] = ((widelimb) in[3]) * in[3];
  475. }
  476. /* Multiply two field elements: out = in1 * in2 */
  477. static void felem_mul(widefelem out, const felem in1, const felem in2)
  478. {
  479. out[0] = ((widelimb) in1[0]) * in2[0];
  480. out[1] = ((widelimb) in1[0]) * in2[1] + ((widelimb) in1[1]) * in2[0];
  481. out[2] = ((widelimb) in1[0]) * in2[2] + ((widelimb) in1[1]) * in2[1] +
  482. ((widelimb) in1[2]) * in2[0];
  483. out[3] = ((widelimb) in1[0]) * in2[3] + ((widelimb) in1[1]) * in2[2] +
  484. ((widelimb) in1[2]) * in2[1] + ((widelimb) in1[3]) * in2[0];
  485. out[4] = ((widelimb) in1[1]) * in2[3] + ((widelimb) in1[2]) * in2[2] +
  486. ((widelimb) in1[3]) * in2[1];
  487. out[5] = ((widelimb) in1[2]) * in2[3] + ((widelimb) in1[3]) * in2[2];
  488. out[6] = ((widelimb) in1[3]) * in2[3];
  489. }
  490. /*-
  491. * Reduce seven 128-bit coefficients to four 64-bit coefficients.
  492. * Requires in[i] < 2^126,
  493. * ensures out[0] < 2^56, out[1] < 2^56, out[2] < 2^56, out[3] <= 2^56 + 2^16 */
  494. static void felem_reduce(felem out, const widefelem in)
  495. {
  496. static const widelimb two127p15 = (((widelimb) 1) << 127) +
  497. (((widelimb) 1) << 15);
  498. static const widelimb two127m71 = (((widelimb) 1) << 127) -
  499. (((widelimb) 1) << 71);
  500. static const widelimb two127m71m55 = (((widelimb) 1) << 127) -
  501. (((widelimb) 1) << 71) - (((widelimb) 1) << 55);
  502. widelimb output[5];
  503. /* Add 0 mod 2^224-2^96+1 to ensure all differences are positive */
  504. output[0] = in[0] + two127p15;
  505. output[1] = in[1] + two127m71m55;
  506. output[2] = in[2] + two127m71;
  507. output[3] = in[3];
  508. output[4] = in[4];
  509. /* Eliminate in[4], in[5], in[6] */
  510. output[4] += in[6] >> 16;
  511. output[3] += (in[6] & 0xffff) << 40;
  512. output[2] -= in[6];
  513. output[3] += in[5] >> 16;
  514. output[2] += (in[5] & 0xffff) << 40;
  515. output[1] -= in[5];
  516. output[2] += output[4] >> 16;
  517. output[1] += (output[4] & 0xffff) << 40;
  518. output[0] -= output[4];
  519. /* Carry 2 -> 3 -> 4 */
  520. output[3] += output[2] >> 56;
  521. output[2] &= 0x00ffffffffffffff;
  522. output[4] = output[3] >> 56;
  523. output[3] &= 0x00ffffffffffffff;
  524. /* Now output[2] < 2^56, output[3] < 2^56, output[4] < 2^72 */
  525. /* Eliminate output[4] */
  526. output[2] += output[4] >> 16;
  527. /* output[2] < 2^56 + 2^56 = 2^57 */
  528. output[1] += (output[4] & 0xffff) << 40;
  529. output[0] -= output[4];
  530. /* Carry 0 -> 1 -> 2 -> 3 */
  531. output[1] += output[0] >> 56;
  532. out[0] = output[0] & 0x00ffffffffffffff;
  533. output[2] += output[1] >> 56;
  534. /* output[2] < 2^57 + 2^72 */
  535. out[1] = output[1] & 0x00ffffffffffffff;
  536. output[3] += output[2] >> 56;
  537. /* output[3] <= 2^56 + 2^16 */
  538. out[2] = output[2] & 0x00ffffffffffffff;
  539. /*-
  540. * out[0] < 2^56, out[1] < 2^56, out[2] < 2^56,
  541. * out[3] <= 2^56 + 2^16 (due to final carry),
  542. * so out < 2*p
  543. */
  544. out[3] = output[3];
  545. }
  546. static void felem_square_reduce(felem out, const felem in)
  547. {
  548. widefelem tmp;
  549. felem_square(tmp, in);
  550. felem_reduce(out, tmp);
  551. }
  552. static void felem_mul_reduce(felem out, const felem in1, const felem in2)
  553. {
  554. widefelem tmp;
  555. felem_mul(tmp, in1, in2);
  556. felem_reduce(out, tmp);
  557. }
  558. /*
  559. * Reduce to unique minimal representation. Requires 0 <= in < 2*p (always
  560. * call felem_reduce first)
  561. */
  562. static void felem_contract(felem out, const felem in)
  563. {
  564. static const int64_t two56 = ((limb) 1) << 56;
  565. /* 0 <= in < 2*p, p = 2^224 - 2^96 + 1 */
  566. /* if in > p , reduce in = in - 2^224 + 2^96 - 1 */
  567. int64_t tmp[4], a;
  568. tmp[0] = in[0];
  569. tmp[1] = in[1];
  570. tmp[2] = in[2];
  571. tmp[3] = in[3];
  572. /* Case 1: a = 1 iff in >= 2^224 */
  573. a = (in[3] >> 56);
  574. tmp[0] -= a;
  575. tmp[1] += a << 40;
  576. tmp[3] &= 0x00ffffffffffffff;
  577. /*
  578. * Case 2: a = 0 iff p <= in < 2^224, i.e., the high 128 bits are all 1
  579. * and the lower part is non-zero
  580. */
  581. a = ((in[3] & in[2] & (in[1] | 0x000000ffffffffff)) + 1) |
  582. (((int64_t) (in[0] + (in[1] & 0x000000ffffffffff)) - 1) >> 63);
  583. a &= 0x00ffffffffffffff;
  584. /* turn a into an all-one mask (if a = 0) or an all-zero mask */
  585. a = (a - 1) >> 63;
  586. /* subtract 2^224 - 2^96 + 1 if a is all-one */
  587. tmp[3] &= a ^ 0xffffffffffffffff;
  588. tmp[2] &= a ^ 0xffffffffffffffff;
  589. tmp[1] &= (a ^ 0xffffffffffffffff) | 0x000000ffffffffff;
  590. tmp[0] -= 1 & a;
  591. /*
  592. * eliminate negative coefficients: if tmp[0] is negative, tmp[1] must be
  593. * non-zero, so we only need one step
  594. */
  595. a = tmp[0] >> 63;
  596. tmp[0] += two56 & a;
  597. tmp[1] -= 1 & a;
  598. /* carry 1 -> 2 -> 3 */
  599. tmp[2] += tmp[1] >> 56;
  600. tmp[1] &= 0x00ffffffffffffff;
  601. tmp[3] += tmp[2] >> 56;
  602. tmp[2] &= 0x00ffffffffffffff;
  603. /* Now 0 <= out < p */
  604. out[0] = tmp[0];
  605. out[1] = tmp[1];
  606. out[2] = tmp[2];
  607. out[3] = tmp[3];
  608. }
  609. /*
  610. * Get negative value: out = -in
  611. * Requires in[i] < 2^63,
  612. * ensures out[0] < 2^56, out[1] < 2^56, out[2] < 2^56, out[3] <= 2^56 + 2^16
  613. */
  614. static void felem_neg(felem out, const felem in)
  615. {
  616. widefelem tmp;
  617. memset(tmp, 0, sizeof(tmp));
  618. felem_diff_128_64(tmp, in);
  619. felem_reduce(out, tmp);
  620. }
  621. /*
  622. * Zero-check: returns 1 if input is 0, and 0 otherwise. We know that field
  623. * elements are reduced to in < 2^225, so we only need to check three cases:
  624. * 0, 2^224 - 2^96 + 1, and 2^225 - 2^97 + 2
  625. */
  626. static limb felem_is_zero(const felem in)
  627. {
  628. limb zero, two224m96p1, two225m97p2;
  629. zero = in[0] | in[1] | in[2] | in[3];
  630. zero = (((int64_t) (zero) - 1) >> 63) & 1;
  631. two224m96p1 = (in[0] ^ 1) | (in[1] ^ 0x00ffff0000000000)
  632. | (in[2] ^ 0x00ffffffffffffff) | (in[3] ^ 0x00ffffffffffffff);
  633. two224m96p1 = (((int64_t) (two224m96p1) - 1) >> 63) & 1;
  634. two225m97p2 = (in[0] ^ 2) | (in[1] ^ 0x00fffe0000000000)
  635. | (in[2] ^ 0x00ffffffffffffff) | (in[3] ^ 0x01ffffffffffffff);
  636. two225m97p2 = (((int64_t) (two225m97p2) - 1) >> 63) & 1;
  637. return (zero | two224m96p1 | two225m97p2);
  638. }
  639. static int felem_is_zero_int(const void *in)
  640. {
  641. return (int)(felem_is_zero(in) & ((limb) 1));
  642. }
  643. /* Invert a field element */
  644. /* Computation chain copied from djb's code */
  645. static void felem_inv(felem out, const felem in)
  646. {
  647. felem ftmp, ftmp2, ftmp3, ftmp4;
  648. widefelem tmp;
  649. unsigned i;
  650. felem_square(tmp, in);
  651. felem_reduce(ftmp, tmp); /* 2 */
  652. felem_mul(tmp, in, ftmp);
  653. felem_reduce(ftmp, tmp); /* 2^2 - 1 */
  654. felem_square(tmp, ftmp);
  655. felem_reduce(ftmp, tmp); /* 2^3 - 2 */
  656. felem_mul(tmp, in, ftmp);
  657. felem_reduce(ftmp, tmp); /* 2^3 - 1 */
  658. felem_square(tmp, ftmp);
  659. felem_reduce(ftmp2, tmp); /* 2^4 - 2 */
  660. felem_square(tmp, ftmp2);
  661. felem_reduce(ftmp2, tmp); /* 2^5 - 4 */
  662. felem_square(tmp, ftmp2);
  663. felem_reduce(ftmp2, tmp); /* 2^6 - 8 */
  664. felem_mul(tmp, ftmp2, ftmp);
  665. felem_reduce(ftmp, tmp); /* 2^6 - 1 */
  666. felem_square(tmp, ftmp);
  667. felem_reduce(ftmp2, tmp); /* 2^7 - 2 */
  668. for (i = 0; i < 5; ++i) { /* 2^12 - 2^6 */
  669. felem_square(tmp, ftmp2);
  670. felem_reduce(ftmp2, tmp);
  671. }
  672. felem_mul(tmp, ftmp2, ftmp);
  673. felem_reduce(ftmp2, tmp); /* 2^12 - 1 */
  674. felem_square(tmp, ftmp2);
  675. felem_reduce(ftmp3, tmp); /* 2^13 - 2 */
  676. for (i = 0; i < 11; ++i) { /* 2^24 - 2^12 */
  677. felem_square(tmp, ftmp3);
  678. felem_reduce(ftmp3, tmp);
  679. }
  680. felem_mul(tmp, ftmp3, ftmp2);
  681. felem_reduce(ftmp2, tmp); /* 2^24 - 1 */
  682. felem_square(tmp, ftmp2);
  683. felem_reduce(ftmp3, tmp); /* 2^25 - 2 */
  684. for (i = 0; i < 23; ++i) { /* 2^48 - 2^24 */
  685. felem_square(tmp, ftmp3);
  686. felem_reduce(ftmp3, tmp);
  687. }
  688. felem_mul(tmp, ftmp3, ftmp2);
  689. felem_reduce(ftmp3, tmp); /* 2^48 - 1 */
  690. felem_square(tmp, ftmp3);
  691. felem_reduce(ftmp4, tmp); /* 2^49 - 2 */
  692. for (i = 0; i < 47; ++i) { /* 2^96 - 2^48 */
  693. felem_square(tmp, ftmp4);
  694. felem_reduce(ftmp4, tmp);
  695. }
  696. felem_mul(tmp, ftmp3, ftmp4);
  697. felem_reduce(ftmp3, tmp); /* 2^96 - 1 */
  698. felem_square(tmp, ftmp3);
  699. felem_reduce(ftmp4, tmp); /* 2^97 - 2 */
  700. for (i = 0; i < 23; ++i) { /* 2^120 - 2^24 */
  701. felem_square(tmp, ftmp4);
  702. felem_reduce(ftmp4, tmp);
  703. }
  704. felem_mul(tmp, ftmp2, ftmp4);
  705. felem_reduce(ftmp2, tmp); /* 2^120 - 1 */
  706. for (i = 0; i < 6; ++i) { /* 2^126 - 2^6 */
  707. felem_square(tmp, ftmp2);
  708. felem_reduce(ftmp2, tmp);
  709. }
  710. felem_mul(tmp, ftmp2, ftmp);
  711. felem_reduce(ftmp, tmp); /* 2^126 - 1 */
  712. felem_square(tmp, ftmp);
  713. felem_reduce(ftmp, tmp); /* 2^127 - 2 */
  714. felem_mul(tmp, ftmp, in);
  715. felem_reduce(ftmp, tmp); /* 2^127 - 1 */
  716. for (i = 0; i < 97; ++i) { /* 2^224 - 2^97 */
  717. felem_square(tmp, ftmp);
  718. felem_reduce(ftmp, tmp);
  719. }
  720. felem_mul(tmp, ftmp, ftmp3);
  721. felem_reduce(out, tmp); /* 2^224 - 2^96 - 1 */
  722. }
  723. /*
  724. * Copy in constant time: if icopy == 1, copy in to out, if icopy == 0, copy
  725. * out to itself.
  726. */
  727. static void copy_conditional(felem out, const felem in, limb icopy)
  728. {
  729. unsigned i;
  730. /*
  731. * icopy is a (64-bit) 0 or 1, so copy is either all-zero or all-one
  732. */
  733. const limb copy = -icopy;
  734. for (i = 0; i < 4; ++i) {
  735. const limb tmp = copy & (in[i] ^ out[i]);
  736. out[i] ^= tmp;
  737. }
  738. }
  739. /******************************************************************************/
  740. /*-
  741. * ELLIPTIC CURVE POINT OPERATIONS
  742. *
  743. * Points are represented in Jacobian projective coordinates:
  744. * (X, Y, Z) corresponds to the affine point (X/Z^2, Y/Z^3),
  745. * or to the point at infinity if Z == 0.
  746. *
  747. */
  748. /*-
  749. * Double an elliptic curve point:
  750. * (X', Y', Z') = 2 * (X, Y, Z), where
  751. * X' = (3 * (X - Z^2) * (X + Z^2))^2 - 8 * X * Y^2
  752. * Y' = 3 * (X - Z^2) * (X + Z^2) * (4 * X * Y^2 - X') - 8 * Y^4
  753. * Z' = (Y + Z)^2 - Y^2 - Z^2 = 2 * Y * Z
  754. * Outputs can equal corresponding inputs, i.e., x_out == x_in is allowed,
  755. * while x_out == y_in is not (maybe this works, but it's not tested).
  756. */
  757. static void
  758. point_double(felem x_out, felem y_out, felem z_out,
  759. const felem x_in, const felem y_in, const felem z_in)
  760. {
  761. widefelem tmp, tmp2;
  762. felem delta, gamma, beta, alpha, ftmp, ftmp2;
  763. felem_assign(ftmp, x_in);
  764. felem_assign(ftmp2, x_in);
  765. /* delta = z^2 */
  766. felem_square(tmp, z_in);
  767. felem_reduce(delta, tmp);
  768. /* gamma = y^2 */
  769. felem_square(tmp, y_in);
  770. felem_reduce(gamma, tmp);
  771. /* beta = x*gamma */
  772. felem_mul(tmp, x_in, gamma);
  773. felem_reduce(beta, tmp);
  774. /* alpha = 3*(x-delta)*(x+delta) */
  775. felem_diff(ftmp, delta);
  776. /* ftmp[i] < 2^57 + 2^58 + 2 < 2^59 */
  777. felem_sum(ftmp2, delta);
  778. /* ftmp2[i] < 2^57 + 2^57 = 2^58 */
  779. felem_scalar(ftmp2, 3);
  780. /* ftmp2[i] < 3 * 2^58 < 2^60 */
  781. felem_mul(tmp, ftmp, ftmp2);
  782. /* tmp[i] < 2^60 * 2^59 * 4 = 2^121 */
  783. felem_reduce(alpha, tmp);
  784. /* x' = alpha^2 - 8*beta */
  785. felem_square(tmp, alpha);
  786. /* tmp[i] < 4 * 2^57 * 2^57 = 2^116 */
  787. felem_assign(ftmp, beta);
  788. felem_scalar(ftmp, 8);
  789. /* ftmp[i] < 8 * 2^57 = 2^60 */
  790. felem_diff_128_64(tmp, ftmp);
  791. /* tmp[i] < 2^116 + 2^64 + 8 < 2^117 */
  792. felem_reduce(x_out, tmp);
  793. /* z' = (y + z)^2 - gamma - delta */
  794. felem_sum(delta, gamma);
  795. /* delta[i] < 2^57 + 2^57 = 2^58 */
  796. felem_assign(ftmp, y_in);
  797. felem_sum(ftmp, z_in);
  798. /* ftmp[i] < 2^57 + 2^57 = 2^58 */
  799. felem_square(tmp, ftmp);
  800. /* tmp[i] < 4 * 2^58 * 2^58 = 2^118 */
  801. felem_diff_128_64(tmp, delta);
  802. /* tmp[i] < 2^118 + 2^64 + 8 < 2^119 */
  803. felem_reduce(z_out, tmp);
  804. /* y' = alpha*(4*beta - x') - 8*gamma^2 */
  805. felem_scalar(beta, 4);
  806. /* beta[i] < 4 * 2^57 = 2^59 */
  807. felem_diff(beta, x_out);
  808. /* beta[i] < 2^59 + 2^58 + 2 < 2^60 */
  809. felem_mul(tmp, alpha, beta);
  810. /* tmp[i] < 4 * 2^57 * 2^60 = 2^119 */
  811. felem_square(tmp2, gamma);
  812. /* tmp2[i] < 4 * 2^57 * 2^57 = 2^116 */
  813. widefelem_scalar(tmp2, 8);
  814. /* tmp2[i] < 8 * 2^116 = 2^119 */
  815. widefelem_diff(tmp, tmp2);
  816. /* tmp[i] < 2^119 + 2^120 < 2^121 */
  817. felem_reduce(y_out, tmp);
  818. }
  819. /*-
  820. * Add two elliptic curve points:
  821. * (X_1, Y_1, Z_1) + (X_2, Y_2, Z_2) = (X_3, Y_3, Z_3), where
  822. * X_3 = (Z_1^3 * Y_2 - Z_2^3 * Y_1)^2 - (Z_1^2 * X_2 - Z_2^2 * X_1)^3 -
  823. * 2 * Z_2^2 * X_1 * (Z_1^2 * X_2 - Z_2^2 * X_1)^2
  824. * Y_3 = (Z_1^3 * Y_2 - Z_2^3 * Y_1) * (Z_2^2 * X_1 * (Z_1^2 * X_2 - Z_2^2 * X_1)^2 - X_3) -
  825. * Z_2^3 * Y_1 * (Z_1^2 * X_2 - Z_2^2 * X_1)^3
  826. * Z_3 = (Z_1^2 * X_2 - Z_2^2 * X_1) * (Z_1 * Z_2)
  827. *
  828. * This runs faster if 'mixed' is set, which requires Z_2 = 1 or Z_2 = 0.
  829. */
  830. /*
  831. * This function is not entirely constant-time: it includes a branch for
  832. * checking whether the two input points are equal, (while not equal to the
  833. * point at infinity). This case never happens during single point
  834. * multiplication, so there is no timing leak for ECDH or ECDSA signing.
  835. */
  836. static void point_add(felem x3, felem y3, felem z3,
  837. const felem x1, const felem y1, const felem z1,
  838. const int mixed, const felem x2, const felem y2,
  839. const felem z2)
  840. {
  841. felem ftmp, ftmp2, ftmp3, ftmp4, ftmp5, x_out, y_out, z_out;
  842. widefelem tmp, tmp2;
  843. limb z1_is_zero, z2_is_zero, x_equal, y_equal;
  844. limb points_equal;
  845. if (!mixed) {
  846. /* ftmp2 = z2^2 */
  847. felem_square(tmp, z2);
  848. felem_reduce(ftmp2, tmp);
  849. /* ftmp4 = z2^3 */
  850. felem_mul(tmp, ftmp2, z2);
  851. felem_reduce(ftmp4, tmp);
  852. /* ftmp4 = z2^3*y1 */
  853. felem_mul(tmp2, ftmp4, y1);
  854. felem_reduce(ftmp4, tmp2);
  855. /* ftmp2 = z2^2*x1 */
  856. felem_mul(tmp2, ftmp2, x1);
  857. felem_reduce(ftmp2, tmp2);
  858. } else {
  859. /*
  860. * We'll assume z2 = 1 (special case z2 = 0 is handled later)
  861. */
  862. /* ftmp4 = z2^3*y1 */
  863. felem_assign(ftmp4, y1);
  864. /* ftmp2 = z2^2*x1 */
  865. felem_assign(ftmp2, x1);
  866. }
  867. /* ftmp = z1^2 */
  868. felem_square(tmp, z1);
  869. felem_reduce(ftmp, tmp);
  870. /* ftmp3 = z1^3 */
  871. felem_mul(tmp, ftmp, z1);
  872. felem_reduce(ftmp3, tmp);
  873. /* tmp = z1^3*y2 */
  874. felem_mul(tmp, ftmp3, y2);
  875. /* tmp[i] < 4 * 2^57 * 2^57 = 2^116 */
  876. /* ftmp3 = z1^3*y2 - z2^3*y1 */
  877. felem_diff_128_64(tmp, ftmp4);
  878. /* tmp[i] < 2^116 + 2^64 + 8 < 2^117 */
  879. felem_reduce(ftmp3, tmp);
  880. /* tmp = z1^2*x2 */
  881. felem_mul(tmp, ftmp, x2);
  882. /* tmp[i] < 4 * 2^57 * 2^57 = 2^116 */
  883. /* ftmp = z1^2*x2 - z2^2*x1 */
  884. felem_diff_128_64(tmp, ftmp2);
  885. /* tmp[i] < 2^116 + 2^64 + 8 < 2^117 */
  886. felem_reduce(ftmp, tmp);
  887. /*
  888. * The formulae are incorrect if the points are equal, in affine coordinates
  889. * (X_1, Y_1) == (X_2, Y_2), so we check for this and do doubling if this
  890. * happens.
  891. *
  892. * We use bitwise operations to avoid potential side-channels introduced by
  893. * the short-circuiting behaviour of boolean operators.
  894. */
  895. x_equal = felem_is_zero(ftmp);
  896. y_equal = felem_is_zero(ftmp3);
  897. /*
  898. * The special case of either point being the point at infinity (z1 and/or
  899. * z2 are zero), is handled separately later on in this function, so we
  900. * avoid jumping to point_double here in those special cases.
  901. */
  902. z1_is_zero = felem_is_zero(z1);
  903. z2_is_zero = felem_is_zero(z2);
  904. /*
  905. * Compared to `ecp_nistp256.c` and `ecp_nistp521.c`, in this
  906. * specific implementation `felem_is_zero()` returns truth as `0x1`
  907. * (rather than `0xff..ff`).
  908. *
  909. * This implies that `~true` in this implementation becomes
  910. * `0xff..fe` (rather than `0x0`): for this reason, to be used in
  911. * the if expression, we mask out only the last bit in the next
  912. * line.
  913. */
  914. points_equal = (x_equal & y_equal & (~z1_is_zero) & (~z2_is_zero)) & 1;
  915. if (points_equal) {
  916. /*
  917. * This is obviously not constant-time but, as mentioned before, this
  918. * case never happens during single point multiplication, so there is no
  919. * timing leak for ECDH or ECDSA signing.
  920. */
  921. point_double(x3, y3, z3, x1, y1, z1);
  922. return;
  923. }
  924. /* ftmp5 = z1*z2 */
  925. if (!mixed) {
  926. felem_mul(tmp, z1, z2);
  927. felem_reduce(ftmp5, tmp);
  928. } else {
  929. /* special case z2 = 0 is handled later */
  930. felem_assign(ftmp5, z1);
  931. }
  932. /* z_out = (z1^2*x2 - z2^2*x1)*(z1*z2) */
  933. felem_mul(tmp, ftmp, ftmp5);
  934. felem_reduce(z_out, tmp);
  935. /* ftmp = (z1^2*x2 - z2^2*x1)^2 */
  936. felem_assign(ftmp5, ftmp);
  937. felem_square(tmp, ftmp);
  938. felem_reduce(ftmp, tmp);
  939. /* ftmp5 = (z1^2*x2 - z2^2*x1)^3 */
  940. felem_mul(tmp, ftmp, ftmp5);
  941. felem_reduce(ftmp5, tmp);
  942. /* ftmp2 = z2^2*x1*(z1^2*x2 - z2^2*x1)^2 */
  943. felem_mul(tmp, ftmp2, ftmp);
  944. felem_reduce(ftmp2, tmp);
  945. /* tmp = z2^3*y1*(z1^2*x2 - z2^2*x1)^3 */
  946. felem_mul(tmp, ftmp4, ftmp5);
  947. /* tmp[i] < 4 * 2^57 * 2^57 = 2^116 */
  948. /* tmp2 = (z1^3*y2 - z2^3*y1)^2 */
  949. felem_square(tmp2, ftmp3);
  950. /* tmp2[i] < 4 * 2^57 * 2^57 < 2^116 */
  951. /* tmp2 = (z1^3*y2 - z2^3*y1)^2 - (z1^2*x2 - z2^2*x1)^3 */
  952. felem_diff_128_64(tmp2, ftmp5);
  953. /* tmp2[i] < 2^116 + 2^64 + 8 < 2^117 */
  954. /* ftmp5 = 2*z2^2*x1*(z1^2*x2 - z2^2*x1)^2 */
  955. felem_assign(ftmp5, ftmp2);
  956. felem_scalar(ftmp5, 2);
  957. /* ftmp5[i] < 2 * 2^57 = 2^58 */
  958. /*-
  959. * x_out = (z1^3*y2 - z2^3*y1)^2 - (z1^2*x2 - z2^2*x1)^3 -
  960. * 2*z2^2*x1*(z1^2*x2 - z2^2*x1)^2
  961. */
  962. felem_diff_128_64(tmp2, ftmp5);
  963. /* tmp2[i] < 2^117 + 2^64 + 8 < 2^118 */
  964. felem_reduce(x_out, tmp2);
  965. /* ftmp2 = z2^2*x1*(z1^2*x2 - z2^2*x1)^2 - x_out */
  966. felem_diff(ftmp2, x_out);
  967. /* ftmp2[i] < 2^57 + 2^58 + 2 < 2^59 */
  968. /*
  969. * tmp2 = (z1^3*y2 - z2^3*y1)*(z2^2*x1*(z1^2*x2 - z2^2*x1)^2 - x_out)
  970. */
  971. felem_mul(tmp2, ftmp3, ftmp2);
  972. /* tmp2[i] < 4 * 2^57 * 2^59 = 2^118 */
  973. /*-
  974. * y_out = (z1^3*y2 - z2^3*y1)*(z2^2*x1*(z1^2*x2 - z2^2*x1)^2 - x_out) -
  975. * z2^3*y1*(z1^2*x2 - z2^2*x1)^3
  976. */
  977. widefelem_diff(tmp2, tmp);
  978. /* tmp2[i] < 2^118 + 2^120 < 2^121 */
  979. felem_reduce(y_out, tmp2);
  980. /*
  981. * the result (x_out, y_out, z_out) is incorrect if one of the inputs is
  982. * the point at infinity, so we need to check for this separately
  983. */
  984. /*
  985. * if point 1 is at infinity, copy point 2 to output, and vice versa
  986. */
  987. copy_conditional(x_out, x2, z1_is_zero);
  988. copy_conditional(x_out, x1, z2_is_zero);
  989. copy_conditional(y_out, y2, z1_is_zero);
  990. copy_conditional(y_out, y1, z2_is_zero);
  991. copy_conditional(z_out, z2, z1_is_zero);
  992. copy_conditional(z_out, z1, z2_is_zero);
  993. felem_assign(x3, x_out);
  994. felem_assign(y3, y_out);
  995. felem_assign(z3, z_out);
  996. }
  997. /*
  998. * select_point selects the |idx|th point from a precomputation table and
  999. * copies it to out.
  1000. * The pre_comp array argument should be size of |size| argument
  1001. */
  1002. static void select_point(const u64 idx, unsigned int size,
  1003. const felem pre_comp[][3], felem out[3])
  1004. {
  1005. unsigned i, j;
  1006. limb *outlimbs = &out[0][0];
  1007. memset(out, 0, sizeof(*out) * 3);
  1008. for (i = 0; i < size; i++) {
  1009. const limb *inlimbs = &pre_comp[i][0][0];
  1010. u64 mask = i ^ idx;
  1011. mask |= mask >> 4;
  1012. mask |= mask >> 2;
  1013. mask |= mask >> 1;
  1014. mask &= 1;
  1015. mask--;
  1016. for (j = 0; j < 4 * 3; j++)
  1017. outlimbs[j] |= inlimbs[j] & mask;
  1018. }
  1019. }
  1020. /* get_bit returns the |i|th bit in |in| */
  1021. static char get_bit(const felem_bytearray in, unsigned i)
  1022. {
  1023. if (i >= 224)
  1024. return 0;
  1025. return (in[i >> 3] >> (i & 7)) & 1;
  1026. }
  1027. /*
  1028. * Interleaved point multiplication using precomputed point multiples: The
  1029. * small point multiples 0*P, 1*P, ..., 16*P are in pre_comp[], the scalars
  1030. * in scalars[]. If g_scalar is non-NULL, we also add this multiple of the
  1031. * generator, using certain (large) precomputed multiples in g_pre_comp.
  1032. * Output point (X, Y, Z) is stored in x_out, y_out, z_out
  1033. */
  1034. static void batch_mul(felem x_out, felem y_out, felem z_out,
  1035. const felem_bytearray scalars[],
  1036. const unsigned num_points, const u8 *g_scalar,
  1037. const int mixed, const felem pre_comp[][17][3],
  1038. const felem g_pre_comp[2][16][3])
  1039. {
  1040. int i, skip;
  1041. unsigned num;
  1042. unsigned gen_mul = (g_scalar != NULL);
  1043. felem nq[3], tmp[4];
  1044. u64 bits;
  1045. u8 sign, digit;
  1046. /* set nq to the point at infinity */
  1047. memset(nq, 0, sizeof(nq));
  1048. /*
  1049. * Loop over all scalars msb-to-lsb, interleaving additions of multiples
  1050. * of the generator (two in each of the last 28 rounds) and additions of
  1051. * other points multiples (every 5th round).
  1052. */
  1053. skip = 1; /* save two point operations in the first
  1054. * round */
  1055. for (i = (num_points ? 220 : 27); i >= 0; --i) {
  1056. /* double */
  1057. if (!skip)
  1058. point_double(nq[0], nq[1], nq[2], nq[0], nq[1], nq[2]);
  1059. /* add multiples of the generator */
  1060. if (gen_mul && (i <= 27)) {
  1061. /* first, look 28 bits upwards */
  1062. bits = get_bit(g_scalar, i + 196) << 3;
  1063. bits |= get_bit(g_scalar, i + 140) << 2;
  1064. bits |= get_bit(g_scalar, i + 84) << 1;
  1065. bits |= get_bit(g_scalar, i + 28);
  1066. /* select the point to add, in constant time */
  1067. select_point(bits, 16, g_pre_comp[1], tmp);
  1068. if (!skip) {
  1069. /* value 1 below is argument for "mixed" */
  1070. point_add(nq[0], nq[1], nq[2],
  1071. nq[0], nq[1], nq[2], 1, tmp[0], tmp[1], tmp[2]);
  1072. } else {
  1073. memcpy(nq, tmp, 3 * sizeof(felem));
  1074. skip = 0;
  1075. }
  1076. /* second, look at the current position */
  1077. bits = get_bit(g_scalar, i + 168) << 3;
  1078. bits |= get_bit(g_scalar, i + 112) << 2;
  1079. bits |= get_bit(g_scalar, i + 56) << 1;
  1080. bits |= get_bit(g_scalar, i);
  1081. /* select the point to add, in constant time */
  1082. select_point(bits, 16, g_pre_comp[0], tmp);
  1083. point_add(nq[0], nq[1], nq[2],
  1084. nq[0], nq[1], nq[2],
  1085. 1 /* mixed */ , tmp[0], tmp[1], tmp[2]);
  1086. }
  1087. /* do other additions every 5 doublings */
  1088. if (num_points && (i % 5 == 0)) {
  1089. /* loop over all scalars */
  1090. for (num = 0; num < num_points; ++num) {
  1091. bits = get_bit(scalars[num], i + 4) << 5;
  1092. bits |= get_bit(scalars[num], i + 3) << 4;
  1093. bits |= get_bit(scalars[num], i + 2) << 3;
  1094. bits |= get_bit(scalars[num], i + 1) << 2;
  1095. bits |= get_bit(scalars[num], i) << 1;
  1096. bits |= get_bit(scalars[num], i - 1);
  1097. ec_GFp_nistp_recode_scalar_bits(&sign, &digit, bits);
  1098. /* select the point to add or subtract */
  1099. select_point(digit, 17, pre_comp[num], tmp);
  1100. felem_neg(tmp[3], tmp[1]); /* (X, -Y, Z) is the negative
  1101. * point */
  1102. copy_conditional(tmp[1], tmp[3], sign);
  1103. if (!skip) {
  1104. point_add(nq[0], nq[1], nq[2],
  1105. nq[0], nq[1], nq[2],
  1106. mixed, tmp[0], tmp[1], tmp[2]);
  1107. } else {
  1108. memcpy(nq, tmp, 3 * sizeof(felem));
  1109. skip = 0;
  1110. }
  1111. }
  1112. }
  1113. }
  1114. felem_assign(x_out, nq[0]);
  1115. felem_assign(y_out, nq[1]);
  1116. felem_assign(z_out, nq[2]);
  1117. }
  1118. /******************************************************************************/
  1119. /*
  1120. * FUNCTIONS TO MANAGE PRECOMPUTATION
  1121. */
  1122. static NISTP224_PRE_COMP *nistp224_pre_comp_new(void)
  1123. {
  1124. NISTP224_PRE_COMP *ret = OPENSSL_zalloc(sizeof(*ret));
  1125. if (!ret) {
  1126. ECerr(EC_F_NISTP224_PRE_COMP_NEW, ERR_R_MALLOC_FAILURE);
  1127. return ret;
  1128. }
  1129. ret->references = 1;
  1130. ret->lock = CRYPTO_THREAD_lock_new();
  1131. if (ret->lock == NULL) {
  1132. ECerr(EC_F_NISTP224_PRE_COMP_NEW, ERR_R_MALLOC_FAILURE);
  1133. OPENSSL_free(ret);
  1134. return NULL;
  1135. }
  1136. return ret;
  1137. }
  1138. NISTP224_PRE_COMP *EC_nistp224_pre_comp_dup(NISTP224_PRE_COMP *p)
  1139. {
  1140. int i;
  1141. if (p != NULL)
  1142. CRYPTO_UP_REF(&p->references, &i, p->lock);
  1143. return p;
  1144. }
  1145. void EC_nistp224_pre_comp_free(NISTP224_PRE_COMP *p)
  1146. {
  1147. int i;
  1148. if (p == NULL)
  1149. return;
  1150. CRYPTO_DOWN_REF(&p->references, &i, p->lock);
  1151. REF_PRINT_COUNT("EC_nistp224", x);
  1152. if (i > 0)
  1153. return;
  1154. REF_ASSERT_ISNT(i < 0);
  1155. CRYPTO_THREAD_lock_free(p->lock);
  1156. OPENSSL_free(p);
  1157. }
  1158. /******************************************************************************/
  1159. /*
  1160. * OPENSSL EC_METHOD FUNCTIONS
  1161. */
  1162. int ec_GFp_nistp224_group_init(EC_GROUP *group)
  1163. {
  1164. int ret;
  1165. ret = ec_GFp_simple_group_init(group);
  1166. group->a_is_minus3 = 1;
  1167. return ret;
  1168. }
  1169. int ec_GFp_nistp224_group_set_curve(EC_GROUP *group, const BIGNUM *p,
  1170. const BIGNUM *a, const BIGNUM *b,
  1171. BN_CTX *ctx)
  1172. {
  1173. int ret = 0;
  1174. BIGNUM *curve_p, *curve_a, *curve_b;
  1175. #ifndef FIPS_MODE
  1176. BN_CTX *new_ctx = NULL;
  1177. if (ctx == NULL)
  1178. ctx = new_ctx = BN_CTX_new();
  1179. #endif
  1180. if (ctx == NULL)
  1181. return 0;
  1182. BN_CTX_start(ctx);
  1183. curve_p = BN_CTX_get(ctx);
  1184. curve_a = BN_CTX_get(ctx);
  1185. curve_b = BN_CTX_get(ctx);
  1186. if (curve_b == NULL)
  1187. goto err;
  1188. BN_bin2bn(nistp224_curve_params[0], sizeof(felem_bytearray), curve_p);
  1189. BN_bin2bn(nistp224_curve_params[1], sizeof(felem_bytearray), curve_a);
  1190. BN_bin2bn(nistp224_curve_params[2], sizeof(felem_bytearray), curve_b);
  1191. if ((BN_cmp(curve_p, p)) || (BN_cmp(curve_a, a)) || (BN_cmp(curve_b, b))) {
  1192. ECerr(EC_F_EC_GFP_NISTP224_GROUP_SET_CURVE,
  1193. EC_R_WRONG_CURVE_PARAMETERS);
  1194. goto err;
  1195. }
  1196. group->field_mod_func = BN_nist_mod_224;
  1197. ret = ec_GFp_simple_group_set_curve(group, p, a, b, ctx);
  1198. err:
  1199. BN_CTX_end(ctx);
  1200. #ifndef FIPS_MODE
  1201. BN_CTX_free(new_ctx);
  1202. #endif
  1203. return ret;
  1204. }
  1205. /*
  1206. * Takes the Jacobian coordinates (X, Y, Z) of a point and returns (X', Y') =
  1207. * (X/Z^2, Y/Z^3)
  1208. */
  1209. int ec_GFp_nistp224_point_get_affine_coordinates(const EC_GROUP *group,
  1210. const EC_POINT *point,
  1211. BIGNUM *x, BIGNUM *y,
  1212. BN_CTX *ctx)
  1213. {
  1214. felem z1, z2, x_in, y_in, x_out, y_out;
  1215. widefelem tmp;
  1216. if (EC_POINT_is_at_infinity(group, point)) {
  1217. ECerr(EC_F_EC_GFP_NISTP224_POINT_GET_AFFINE_COORDINATES,
  1218. EC_R_POINT_AT_INFINITY);
  1219. return 0;
  1220. }
  1221. if ((!BN_to_felem(x_in, point->X)) || (!BN_to_felem(y_in, point->Y)) ||
  1222. (!BN_to_felem(z1, point->Z)))
  1223. return 0;
  1224. felem_inv(z2, z1);
  1225. felem_square(tmp, z2);
  1226. felem_reduce(z1, tmp);
  1227. felem_mul(tmp, x_in, z1);
  1228. felem_reduce(x_in, tmp);
  1229. felem_contract(x_out, x_in);
  1230. if (x != NULL) {
  1231. if (!felem_to_BN(x, x_out)) {
  1232. ECerr(EC_F_EC_GFP_NISTP224_POINT_GET_AFFINE_COORDINATES,
  1233. ERR_R_BN_LIB);
  1234. return 0;
  1235. }
  1236. }
  1237. felem_mul(tmp, z1, z2);
  1238. felem_reduce(z1, tmp);
  1239. felem_mul(tmp, y_in, z1);
  1240. felem_reduce(y_in, tmp);
  1241. felem_contract(y_out, y_in);
  1242. if (y != NULL) {
  1243. if (!felem_to_BN(y, y_out)) {
  1244. ECerr(EC_F_EC_GFP_NISTP224_POINT_GET_AFFINE_COORDINATES,
  1245. ERR_R_BN_LIB);
  1246. return 0;
  1247. }
  1248. }
  1249. return 1;
  1250. }
  1251. static void make_points_affine(size_t num, felem points[ /* num */ ][3],
  1252. felem tmp_felems[ /* num+1 */ ])
  1253. {
  1254. /*
  1255. * Runs in constant time, unless an input is the point at infinity (which
  1256. * normally shouldn't happen).
  1257. */
  1258. ec_GFp_nistp_points_make_affine_internal(num,
  1259. points,
  1260. sizeof(felem),
  1261. tmp_felems,
  1262. (void (*)(void *))felem_one,
  1263. felem_is_zero_int,
  1264. (void (*)(void *, const void *))
  1265. felem_assign,
  1266. (void (*)(void *, const void *))
  1267. felem_square_reduce, (void (*)
  1268. (void *,
  1269. const void
  1270. *,
  1271. const void
  1272. *))
  1273. felem_mul_reduce,
  1274. (void (*)(void *, const void *))
  1275. felem_inv,
  1276. (void (*)(void *, const void *))
  1277. felem_contract);
  1278. }
  1279. /*
  1280. * Computes scalar*generator + \sum scalars[i]*points[i], ignoring NULL
  1281. * values Result is stored in r (r can equal one of the inputs).
  1282. */
  1283. int ec_GFp_nistp224_points_mul(const EC_GROUP *group, EC_POINT *r,
  1284. const BIGNUM *scalar, size_t num,
  1285. const EC_POINT *points[],
  1286. const BIGNUM *scalars[], BN_CTX *ctx)
  1287. {
  1288. int ret = 0;
  1289. int j;
  1290. unsigned i;
  1291. int mixed = 0;
  1292. BIGNUM *x, *y, *z, *tmp_scalar;
  1293. felem_bytearray g_secret;
  1294. felem_bytearray *secrets = NULL;
  1295. felem (*pre_comp)[17][3] = NULL;
  1296. felem *tmp_felems = NULL;
  1297. int num_bytes;
  1298. int have_pre_comp = 0;
  1299. size_t num_points = num;
  1300. felem x_in, y_in, z_in, x_out, y_out, z_out;
  1301. NISTP224_PRE_COMP *pre = NULL;
  1302. const felem(*g_pre_comp)[16][3] = NULL;
  1303. EC_POINT *generator = NULL;
  1304. const EC_POINT *p = NULL;
  1305. const BIGNUM *p_scalar = NULL;
  1306. BN_CTX_start(ctx);
  1307. x = BN_CTX_get(ctx);
  1308. y = BN_CTX_get(ctx);
  1309. z = BN_CTX_get(ctx);
  1310. tmp_scalar = BN_CTX_get(ctx);
  1311. if (tmp_scalar == NULL)
  1312. goto err;
  1313. if (scalar != NULL) {
  1314. pre = group->pre_comp.nistp224;
  1315. if (pre)
  1316. /* we have precomputation, try to use it */
  1317. g_pre_comp = (const felem(*)[16][3])pre->g_pre_comp;
  1318. else
  1319. /* try to use the standard precomputation */
  1320. g_pre_comp = &gmul[0];
  1321. generator = EC_POINT_new(group);
  1322. if (generator == NULL)
  1323. goto err;
  1324. /* get the generator from precomputation */
  1325. if (!felem_to_BN(x, g_pre_comp[0][1][0]) ||
  1326. !felem_to_BN(y, g_pre_comp[0][1][1]) ||
  1327. !felem_to_BN(z, g_pre_comp[0][1][2])) {
  1328. ECerr(EC_F_EC_GFP_NISTP224_POINTS_MUL, ERR_R_BN_LIB);
  1329. goto err;
  1330. }
  1331. if (!EC_POINT_set_Jprojective_coordinates_GFp(group,
  1332. generator, x, y, z,
  1333. ctx))
  1334. goto err;
  1335. if (0 == EC_POINT_cmp(group, generator, group->generator, ctx))
  1336. /* precomputation matches generator */
  1337. have_pre_comp = 1;
  1338. else
  1339. /*
  1340. * we don't have valid precomputation: treat the generator as a
  1341. * random point
  1342. */
  1343. num_points = num_points + 1;
  1344. }
  1345. if (num_points > 0) {
  1346. if (num_points >= 3) {
  1347. /*
  1348. * unless we precompute multiples for just one or two points,
  1349. * converting those into affine form is time well spent
  1350. */
  1351. mixed = 1;
  1352. }
  1353. secrets = OPENSSL_zalloc(sizeof(*secrets) * num_points);
  1354. pre_comp = OPENSSL_zalloc(sizeof(*pre_comp) * num_points);
  1355. if (mixed)
  1356. tmp_felems =
  1357. OPENSSL_malloc(sizeof(felem) * (num_points * 17 + 1));
  1358. if ((secrets == NULL) || (pre_comp == NULL)
  1359. || (mixed && (tmp_felems == NULL))) {
  1360. ECerr(EC_F_EC_GFP_NISTP224_POINTS_MUL, ERR_R_MALLOC_FAILURE);
  1361. goto err;
  1362. }
  1363. /*
  1364. * we treat NULL scalars as 0, and NULL points as points at infinity,
  1365. * i.e., they contribute nothing to the linear combination
  1366. */
  1367. for (i = 0; i < num_points; ++i) {
  1368. if (i == num) {
  1369. /* the generator */
  1370. p = EC_GROUP_get0_generator(group);
  1371. p_scalar = scalar;
  1372. } else {
  1373. /* the i^th point */
  1374. p = points[i];
  1375. p_scalar = scalars[i];
  1376. }
  1377. if ((p_scalar != NULL) && (p != NULL)) {
  1378. /* reduce scalar to 0 <= scalar < 2^224 */
  1379. if ((BN_num_bits(p_scalar) > 224)
  1380. || (BN_is_negative(p_scalar))) {
  1381. /*
  1382. * this is an unusual input, and we don't guarantee
  1383. * constant-timeness
  1384. */
  1385. if (!BN_nnmod(tmp_scalar, p_scalar, group->order, ctx)) {
  1386. ECerr(EC_F_EC_GFP_NISTP224_POINTS_MUL, ERR_R_BN_LIB);
  1387. goto err;
  1388. }
  1389. num_bytes = BN_bn2lebinpad(tmp_scalar,
  1390. secrets[i], sizeof(secrets[i]));
  1391. } else {
  1392. num_bytes = BN_bn2lebinpad(p_scalar,
  1393. secrets[i], sizeof(secrets[i]));
  1394. }
  1395. if (num_bytes < 0) {
  1396. ECerr(EC_F_EC_GFP_NISTP224_POINTS_MUL, ERR_R_BN_LIB);
  1397. goto err;
  1398. }
  1399. /* precompute multiples */
  1400. if ((!BN_to_felem(x_out, p->X)) ||
  1401. (!BN_to_felem(y_out, p->Y)) ||
  1402. (!BN_to_felem(z_out, p->Z)))
  1403. goto err;
  1404. felem_assign(pre_comp[i][1][0], x_out);
  1405. felem_assign(pre_comp[i][1][1], y_out);
  1406. felem_assign(pre_comp[i][1][2], z_out);
  1407. for (j = 2; j <= 16; ++j) {
  1408. if (j & 1) {
  1409. point_add(pre_comp[i][j][0], pre_comp[i][j][1],
  1410. pre_comp[i][j][2], pre_comp[i][1][0],
  1411. pre_comp[i][1][1], pre_comp[i][1][2], 0,
  1412. pre_comp[i][j - 1][0],
  1413. pre_comp[i][j - 1][1],
  1414. pre_comp[i][j - 1][2]);
  1415. } else {
  1416. point_double(pre_comp[i][j][0], pre_comp[i][j][1],
  1417. pre_comp[i][j][2], pre_comp[i][j / 2][0],
  1418. pre_comp[i][j / 2][1],
  1419. pre_comp[i][j / 2][2]);
  1420. }
  1421. }
  1422. }
  1423. }
  1424. if (mixed)
  1425. make_points_affine(num_points * 17, pre_comp[0], tmp_felems);
  1426. }
  1427. /* the scalar for the generator */
  1428. if ((scalar != NULL) && (have_pre_comp)) {
  1429. memset(g_secret, 0, sizeof(g_secret));
  1430. /* reduce scalar to 0 <= scalar < 2^224 */
  1431. if ((BN_num_bits(scalar) > 224) || (BN_is_negative(scalar))) {
  1432. /*
  1433. * this is an unusual input, and we don't guarantee
  1434. * constant-timeness
  1435. */
  1436. if (!BN_nnmod(tmp_scalar, scalar, group->order, ctx)) {
  1437. ECerr(EC_F_EC_GFP_NISTP224_POINTS_MUL, ERR_R_BN_LIB);
  1438. goto err;
  1439. }
  1440. num_bytes = BN_bn2lebinpad(tmp_scalar, g_secret, sizeof(g_secret));
  1441. } else {
  1442. num_bytes = BN_bn2lebinpad(scalar, g_secret, sizeof(g_secret));
  1443. }
  1444. /* do the multiplication with generator precomputation */
  1445. batch_mul(x_out, y_out, z_out,
  1446. (const felem_bytearray(*))secrets, num_points,
  1447. g_secret,
  1448. mixed, (const felem(*)[17][3])pre_comp, g_pre_comp);
  1449. } else {
  1450. /* do the multiplication without generator precomputation */
  1451. batch_mul(x_out, y_out, z_out,
  1452. (const felem_bytearray(*))secrets, num_points,
  1453. NULL, mixed, (const felem(*)[17][3])pre_comp, NULL);
  1454. }
  1455. /* reduce the output to its unique minimal representation */
  1456. felem_contract(x_in, x_out);
  1457. felem_contract(y_in, y_out);
  1458. felem_contract(z_in, z_out);
  1459. if ((!felem_to_BN(x, x_in)) || (!felem_to_BN(y, y_in)) ||
  1460. (!felem_to_BN(z, z_in))) {
  1461. ECerr(EC_F_EC_GFP_NISTP224_POINTS_MUL, ERR_R_BN_LIB);
  1462. goto err;
  1463. }
  1464. ret = EC_POINT_set_Jprojective_coordinates_GFp(group, r, x, y, z, ctx);
  1465. err:
  1466. BN_CTX_end(ctx);
  1467. EC_POINT_free(generator);
  1468. OPENSSL_free(secrets);
  1469. OPENSSL_free(pre_comp);
  1470. OPENSSL_free(tmp_felems);
  1471. return ret;
  1472. }
  1473. int ec_GFp_nistp224_precompute_mult(EC_GROUP *group, BN_CTX *ctx)
  1474. {
  1475. int ret = 0;
  1476. NISTP224_PRE_COMP *pre = NULL;
  1477. int i, j;
  1478. BIGNUM *x, *y;
  1479. EC_POINT *generator = NULL;
  1480. felem tmp_felems[32];
  1481. #ifndef FIPS_MODE
  1482. BN_CTX *new_ctx = NULL;
  1483. #endif
  1484. /* throw away old precomputation */
  1485. EC_pre_comp_free(group);
  1486. #ifndef FIPS_MODE
  1487. if (ctx == NULL)
  1488. ctx = new_ctx = BN_CTX_new();
  1489. #endif
  1490. if (ctx == NULL)
  1491. return 0;
  1492. BN_CTX_start(ctx);
  1493. x = BN_CTX_get(ctx);
  1494. y = BN_CTX_get(ctx);
  1495. if (y == NULL)
  1496. goto err;
  1497. /* get the generator */
  1498. if (group->generator == NULL)
  1499. goto err;
  1500. generator = EC_POINT_new(group);
  1501. if (generator == NULL)
  1502. goto err;
  1503. BN_bin2bn(nistp224_curve_params[3], sizeof(felem_bytearray), x);
  1504. BN_bin2bn(nistp224_curve_params[4], sizeof(felem_bytearray), y);
  1505. if (!EC_POINT_set_affine_coordinates(group, generator, x, y, ctx))
  1506. goto err;
  1507. if ((pre = nistp224_pre_comp_new()) == NULL)
  1508. goto err;
  1509. /*
  1510. * if the generator is the standard one, use built-in precomputation
  1511. */
  1512. if (0 == EC_POINT_cmp(group, generator, group->generator, ctx)) {
  1513. memcpy(pre->g_pre_comp, gmul, sizeof(pre->g_pre_comp));
  1514. goto done;
  1515. }
  1516. if ((!BN_to_felem(pre->g_pre_comp[0][1][0], group->generator->X)) ||
  1517. (!BN_to_felem(pre->g_pre_comp[0][1][1], group->generator->Y)) ||
  1518. (!BN_to_felem(pre->g_pre_comp[0][1][2], group->generator->Z)))
  1519. goto err;
  1520. /*
  1521. * compute 2^56*G, 2^112*G, 2^168*G for the first table, 2^28*G, 2^84*G,
  1522. * 2^140*G, 2^196*G for the second one
  1523. */
  1524. for (i = 1; i <= 8; i <<= 1) {
  1525. point_double(pre->g_pre_comp[1][i][0], pre->g_pre_comp[1][i][1],
  1526. pre->g_pre_comp[1][i][2], pre->g_pre_comp[0][i][0],
  1527. pre->g_pre_comp[0][i][1], pre->g_pre_comp[0][i][2]);
  1528. for (j = 0; j < 27; ++j) {
  1529. point_double(pre->g_pre_comp[1][i][0], pre->g_pre_comp[1][i][1],
  1530. pre->g_pre_comp[1][i][2], pre->g_pre_comp[1][i][0],
  1531. pre->g_pre_comp[1][i][1], pre->g_pre_comp[1][i][2]);
  1532. }
  1533. if (i == 8)
  1534. break;
  1535. point_double(pre->g_pre_comp[0][2 * i][0],
  1536. pre->g_pre_comp[0][2 * i][1],
  1537. pre->g_pre_comp[0][2 * i][2], pre->g_pre_comp[1][i][0],
  1538. pre->g_pre_comp[1][i][1], pre->g_pre_comp[1][i][2]);
  1539. for (j = 0; j < 27; ++j) {
  1540. point_double(pre->g_pre_comp[0][2 * i][0],
  1541. pre->g_pre_comp[0][2 * i][1],
  1542. pre->g_pre_comp[0][2 * i][2],
  1543. pre->g_pre_comp[0][2 * i][0],
  1544. pre->g_pre_comp[0][2 * i][1],
  1545. pre->g_pre_comp[0][2 * i][2]);
  1546. }
  1547. }
  1548. for (i = 0; i < 2; i++) {
  1549. /* g_pre_comp[i][0] is the point at infinity */
  1550. memset(pre->g_pre_comp[i][0], 0, sizeof(pre->g_pre_comp[i][0]));
  1551. /* the remaining multiples */
  1552. /* 2^56*G + 2^112*G resp. 2^84*G + 2^140*G */
  1553. point_add(pre->g_pre_comp[i][6][0], pre->g_pre_comp[i][6][1],
  1554. pre->g_pre_comp[i][6][2], pre->g_pre_comp[i][4][0],
  1555. pre->g_pre_comp[i][4][1], pre->g_pre_comp[i][4][2],
  1556. 0, pre->g_pre_comp[i][2][0], pre->g_pre_comp[i][2][1],
  1557. pre->g_pre_comp[i][2][2]);
  1558. /* 2^56*G + 2^168*G resp. 2^84*G + 2^196*G */
  1559. point_add(pre->g_pre_comp[i][10][0], pre->g_pre_comp[i][10][1],
  1560. pre->g_pre_comp[i][10][2], pre->g_pre_comp[i][8][0],
  1561. pre->g_pre_comp[i][8][1], pre->g_pre_comp[i][8][2],
  1562. 0, pre->g_pre_comp[i][2][0], pre->g_pre_comp[i][2][1],
  1563. pre->g_pre_comp[i][2][2]);
  1564. /* 2^112*G + 2^168*G resp. 2^140*G + 2^196*G */
  1565. point_add(pre->g_pre_comp[i][12][0], pre->g_pre_comp[i][12][1],
  1566. pre->g_pre_comp[i][12][2], pre->g_pre_comp[i][8][0],
  1567. pre->g_pre_comp[i][8][1], pre->g_pre_comp[i][8][2],
  1568. 0, pre->g_pre_comp[i][4][0], pre->g_pre_comp[i][4][1],
  1569. pre->g_pre_comp[i][4][2]);
  1570. /*
  1571. * 2^56*G + 2^112*G + 2^168*G resp. 2^84*G + 2^140*G + 2^196*G
  1572. */
  1573. point_add(pre->g_pre_comp[i][14][0], pre->g_pre_comp[i][14][1],
  1574. pre->g_pre_comp[i][14][2], pre->g_pre_comp[i][12][0],
  1575. pre->g_pre_comp[i][12][1], pre->g_pre_comp[i][12][2],
  1576. 0, pre->g_pre_comp[i][2][0], pre->g_pre_comp[i][2][1],
  1577. pre->g_pre_comp[i][2][2]);
  1578. for (j = 1; j < 8; ++j) {
  1579. /* odd multiples: add G resp. 2^28*G */
  1580. point_add(pre->g_pre_comp[i][2 * j + 1][0],
  1581. pre->g_pre_comp[i][2 * j + 1][1],
  1582. pre->g_pre_comp[i][2 * j + 1][2],
  1583. pre->g_pre_comp[i][2 * j][0],
  1584. pre->g_pre_comp[i][2 * j][1],
  1585. pre->g_pre_comp[i][2 * j][2], 0,
  1586. pre->g_pre_comp[i][1][0], pre->g_pre_comp[i][1][1],
  1587. pre->g_pre_comp[i][1][2]);
  1588. }
  1589. }
  1590. make_points_affine(31, &(pre->g_pre_comp[0][1]), tmp_felems);
  1591. done:
  1592. SETPRECOMP(group, nistp224, pre);
  1593. pre = NULL;
  1594. ret = 1;
  1595. err:
  1596. BN_CTX_end(ctx);
  1597. EC_POINT_free(generator);
  1598. #ifndef FIPS_MODE
  1599. BN_CTX_free(new_ctx);
  1600. #endif
  1601. EC_nistp224_pre_comp_free(pre);
  1602. return ret;
  1603. }
  1604. int ec_GFp_nistp224_have_precompute_mult(const EC_GROUP *group)
  1605. {
  1606. return HAVEPRECOMP(group, nistp224);
  1607. }
  1608. #endif