des_locl.h 8.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226
  1. /*
  2. * Copyright 1995-2016 The OpenSSL Project Authors. All Rights Reserved.
  3. *
  4. * Licensed under the OpenSSL license (the "License"). You may not use
  5. * this file except in compliance with the License. You can obtain a copy
  6. * in the file LICENSE in the source distribution or at
  7. * https://www.openssl.org/source/license.html
  8. */
  9. #ifndef HEADER_DES_LOCL_H
  10. # define HEADER_DES_LOCL_H
  11. # include <openssl/e_os2.h>
  12. # include <stdio.h>
  13. # include <stdlib.h>
  14. # include <string.h>
  15. # include <openssl/des.h>
  /*
   * When OPENSSL_BUILD_SHLIBCRYPTO is defined, discard the current
   * OPENSSL_EXTERN definition and make it expand to OPENSSL_EXPORT instead.
   * NOTE(review): both macros presumably originate in <openssl/e_os2.h> -
   * confirm.
   */
  16. # ifdef OPENSSL_BUILD_SHLIBCRYPTO
  17. # undef OPENSSL_EXTERN
  18. # define OPENSSL_EXTERN OPENSSL_EXPORT
  19. # endif
  /*
   * Iteration counts.  Neither constant is referenced inside this header.
   * NOTE(review): presumably the 16 DES rounds and half that number -
   * confirm at the use sites.
   */
  20. # define ITERATIONS 16
  21. # define HALF_ITERATIONS 8
  /*
   * c2l(c,l): read four successive elements through c and assemble them
   * into l, least-significant first (element 0 -> bits 0-7, element 3 ->
   * bits 24-31).  c is post-incremented four times, so it ends four
   * elements further on.  Both c and l must be modifiable lvalues; c is
   * evaluated once per element read.  Expands to a comma expression.
   */
  22. # define c2l(c,l) (l =((DES_LONG)(*((c)++))) , \
  23. l|=((DES_LONG)(*((c)++)))<< 8L, \
  24. l|=((DES_LONG)(*((c)++)))<<16L, \
  25. l|=((DES_LONG)(*((c)++)))<<24L)
  /*
   * c2ln(c,l1,l2,n): load the first n (1..8) elements at c into the pair
   * l1/l2, least-significant first: elements 0-3 fill l1, elements 4-7
   * fill l2.  l1 and l2 are zeroed before anything is read.
   *
   * c is advanced by n up front and then pre-decremented once per element
   * read, so for 1 <= n <= 8 it finishes at its starting value.  The switch
   * has no default: for any other n nothing is read, l1 and l2 stay 0 and c
   * is left advanced by n.
   *
   * Expands to a braced block (a statement, not an expression); c and n are
   * used unparenthesized.
   */
  26. /* NOTE - c is not incremented as per c2l */
  27. # define c2ln(c,l1,l2,n) { \
  28. c+=n; \
  29. l1=l2=0; \
  30. switch (n) { \
  31. case 8: l2 =((DES_LONG)(*(--(c))))<<24L; \
  32. /* fall thru */ \
  33. case 7: l2|=((DES_LONG)(*(--(c))))<<16L; \
  34. /* fall thru */ \
  35. case 6: l2|=((DES_LONG)(*(--(c))))<< 8L; \
  36. /* fall thru */ \
  37. case 5: l2|=((DES_LONG)(*(--(c)))); \
  38. /* fall thru */ \
  39. case 4: l1 =((DES_LONG)(*(--(c))))<<24L; \
  40. /* fall thru */ \
  41. case 3: l1|=((DES_LONG)(*(--(c))))<<16L; \
  42. /* fall thru */ \
  43. case 2: l1|=((DES_LONG)(*(--(c))))<< 8L; \
  44. /* fall thru */ \
  45. case 1: l1|=((DES_LONG)(*(--(c)))); \
  46. } \
  47. }
  /*
   * l2c(l,c): store bits 0-31 of l through c as four bytes,
   * least-significant byte first.  c is post-incremented four times, so it
   * ends four elements further on.  l is evaluated four times; c must be a
   * modifiable lvalue.  Expands to a comma expression.
   */
  48. # define l2c(l,c) (*((c)++)=(unsigned char)(((l) )&0xff), \
  49. *((c)++)=(unsigned char)(((l)>> 8L)&0xff), \
  50. *((c)++)=(unsigned char)(((l)>>16L)&0xff), \
  51. *((c)++)=(unsigned char)(((l)>>24L)&0xff))
  52. /*
  53. * replacements for htonl and ntohl since I have no idea what to do when
  54. * faced with machines with 8 byte longs.
  55. */
  /*
   * n2l(c,l): read four successive elements through c and assemble them
   * into l, most-significant first (element 0 -> bits 24-31, element 3 ->
   * bits 0-7).  c is post-incremented four times.  Both c and l must be
   * modifiable lvalues.  Expands to a comma expression.
   */
  56. # define n2l(c,l) (l =((DES_LONG)(*((c)++)))<<24L, \
  57. l|=((DES_LONG)(*((c)++)))<<16L, \
  58. l|=((DES_LONG)(*((c)++)))<< 8L, \
  59. l|=((DES_LONG)(*((c)++))))
  /*
   * l2n(l,c): store bits 0-31 of l through c as four bytes,
   * most-significant byte first.  c is post-incremented four times.  l is
   * evaluated four times; c must be a modifiable lvalue.  Expands to a
   * comma expression.
   */
  60. # define l2n(l,c) (*((c)++)=(unsigned char)(((l)>>24L)&0xff), \
  61. *((c)++)=(unsigned char)(((l)>>16L)&0xff), \
  62. *((c)++)=(unsigned char)(((l)>> 8L)&0xff), \
  63. *((c)++)=(unsigned char)(((l) )&0xff))
  /*
   * l2cn(l1,l2,c,n): store the first n (1..8) bytes of the pair l1/l2 at c,
   * least-significant first: l1 supplies bytes 0-3 and l2 bytes 4-7.
   *
   * c is advanced by n up front and then pre-decremented once per byte
   * written, so for 1 <= n <= 8 it finishes at its starting value.  The
   * switch has no default: for any other n nothing is written and c is left
   * advanced by n.
   *
   * Expands to a braced block (a statement, not an expression); c and n are
   * used unparenthesized.
   */
  64. /* NOTE - c is not incremented as per l2c */
  65. # define l2cn(l1,l2,c,n) { \
  66. c+=n; \
  67. switch (n) { \
  68. case 8: *(--(c))=(unsigned char)(((l2)>>24L)&0xff); \
  69. /* fall thru */ \
  70. case 7: *(--(c))=(unsigned char)(((l2)>>16L)&0xff); \
  71. /* fall thru */ \
  72. case 6: *(--(c))=(unsigned char)(((l2)>> 8L)&0xff); \
  73. /* fall thru */ \
  74. case 5: *(--(c))=(unsigned char)(((l2) )&0xff); \
  75. /* fall thru */ \
  76. case 4: *(--(c))=(unsigned char)(((l1)>>24L)&0xff); \
  77. /* fall thru */ \
  78. case 3: *(--(c))=(unsigned char)(((l1)>>16L)&0xff); \
  79. /* fall thru */ \
  80. case 2: *(--(c))=(unsigned char)(((l1)>> 8L)&0xff); \
  81. /* fall thru */ \
  82. case 1: *(--(c))=(unsigned char)(((l1) )&0xff); \
  83. } \
  84. }
  /*
   * ROTATE(a,n): rotate the 32-bit value a right by n bits.  Exactly one of
   * four definitions is selected:
   *   - _MSC_VER: the _lrotr() intrinsic;
   *   - __ICC:    the _rotr() intrinsic;
   *   - GNU C (not strict ANSI, not PEDANTIC, inline asm not disabled) on
   *     i386/x86_64: a statement expression wrapped around a "rorl"
   *     instruction.  The "I" constraint means n has to be a compile-time
   *     constant in this variant;
   *   - anything else: the portable shift form at the bottom.  For a 32-bit
   *     a its two terms have no set bits in common, so "+" acts as "|".  It
   *     evaluates a and n twice and shifts by 32-n, so n must stay within
   *     1..31.
   * NOTE(review): if a is wider than 32 bits the portable form leaves stray
   * bits above bit 31 - confirm callers mask the result where that matters.
   */
  85. # if defined(_MSC_VER)
  86. # define ROTATE(a,n) (_lrotr(a,n))
  87. # elif defined(__ICC)
  88. # define ROTATE(a,n) (_rotr(a,n))
  89. # elif defined(__GNUC__) && __GNUC__>=2 && !defined(__STRICT_ANSI__) && !defined(OPENSSL_NO_ASM) && !defined(OPENSSL_NO_INLINE_ASM) && !defined(PEDANTIC)
  90. # if defined(__i386) || defined(__i386__) || defined(__x86_64) || defined(__x86_64__)
  91. # define ROTATE(a,n) ({ register unsigned int ret; \
  92. asm ("rorl %1,%0" \
  93. : "=r"(ret) \
  94. : "I"(n),"0"(a) \
  95. : "cc"); \
  96. ret; \
  97. })
  98. # endif
  99. # endif
  100. # ifndef ROTATE
  101. # define ROTATE(a,n) (((a)>>(n))+((a)<<(32-(n))))
  102. # endif
  103. /*
  104. * Don't worry about the LOAD_DATA() stuff, that is used by fcrypt() to add
  105. * its little bit to the front
  106. */
  /*
   * LOAD_DATA(R,S,u,t,E0,E1,tmp): set u and t from R and the two
   * consecutive entries s[S] and s[S+1].  The array s is not a parameter;
   * it must be in scope wherever the macro is expanded.  The expansion is a
   * bare statement sequence with no trailing semicolon.
   *
   * Default form:     u = R ^ s[S];  t = R ^ s[S+1];
   *   E0, E1 and tmp are ignored.  LOAD_DATA_tmp forwards the placeholder
   *   token g for tmp; that is harmless only because tmp never appears in
   *   this expansion.
   *
   * DES_FCRYPT form:  with x = R ^ (R >> 16), u0 = x & E0, t0 = x & E1:
   *     u = u0 ^ (u0 << 16) ^ R ^ s[S];
   *     t = t0 ^ (t0 << 16) ^ R ^ s[S+1];
   *   tmp is scratch storage; LOAD_DATA_tmp declares it as a local DES_LONG
   *   inside its own braces.
   */
  107. # ifdef DES_FCRYPT
  108. # define LOAD_DATA_tmp(R,S,u,t,E0,E1) \
  109. { DES_LONG tmp; LOAD_DATA(R,S,u,t,E0,E1,tmp); }
  110. # define LOAD_DATA(R,S,u,t,E0,E1,tmp) \
  111. t=R^(R>>16L); \
  112. u=t&E0; t&=E1; \
  113. tmp=(u<<16); u^=R^s[S ]; u^=tmp; \
  114. tmp=(t<<16); t^=R^s[S+1]; t^=tmp
  115. # else
  116. # define LOAD_DATA_tmp(a,b,c,d,e,f) LOAD_DATA(a,b,c,d,e,f,g)
  117. # define LOAD_DATA(R,S,u,t,E0,E1,tmp) \
  118. u=R^s[S ]; \
  119. t=R^s[S+1]
  120. # endif
  121. /*
  122. * It recently occurred to me that 0^0^0^0^0^0^0 == 0, so there is no reason
  123. * to not xor all the sub items together. This potentially saves a register
  124. * since things can be xored directly into L
  125. */
  /*
   * D_ENCRYPT(LL,R,S): XOR into LL a value derived from R and the entries
   * s[S], s[S+1].
   *
   * Steps: LOAD_DATA_tmp fills u and t; t is rotated right by 4; then eight
   * DES_SPtrans lookups are XORed into LL.  Tables 0,2,4,6 are indexed by
   * the 6-bit fields of u at bit offsets 2, 10, 18 and 26; tables 1,3,5,7
   * by the same fields of the rotated t.
   *
   * u and t are not parameters: they (and s, plus E0 and E1 when DES_FCRYPT
   * is defined) must be in scope at the expansion site.  Expands to a
   * braced block, not an expression.
   */
  126. # define D_ENCRYPT(LL,R,S) { \
  127. LOAD_DATA_tmp(R,S,u,t,E0,E1); \
  128. t=ROTATE(t,4); \
  129. LL^= \
  130. DES_SPtrans[0][(u>> 2L)&0x3f]^ \
  131. DES_SPtrans[2][(u>>10L)&0x3f]^ \
  132. DES_SPtrans[4][(u>>18L)&0x3f]^ \
  133. DES_SPtrans[6][(u>>26L)&0x3f]^ \
  134. DES_SPtrans[1][(t>> 2L)&0x3f]^ \
  135. DES_SPtrans[3][(t>>10L)&0x3f]^ \
  136. DES_SPtrans[5][(t>>18L)&0x3f]^ \
  137. DES_SPtrans[7][(t>>26L)&0x3f]; }
  138. /*-
  139. * IP and FP
  140. * The problem is more of a geometric problem than random bit fiddling.
  141. 0 1 2 3 4 5 6 7 62 54 46 38 30 22 14 6
  142. 8 9 10 11 12 13 14 15 60 52 44 36 28 20 12 4
  143. 16 17 18 19 20 21 22 23 58 50 42 34 26 18 10 2
  144. 24 25 26 27 28 29 30 31 to 56 48 40 32 24 16 8 0
  145. 32 33 34 35 36 37 38 39 63 55 47 39 31 23 15 7
  146. 40 41 42 43 44 45 46 47 61 53 45 37 29 21 13 5
  147. 48 49 50 51 52 53 54 55 59 51 43 35 27 19 11 3
  148. 56 57 58 59 60 61 62 63 57 49 41 33 25 17 9 1
  149. The output has been subject to swaps of the form
  150. 0 1 -> 3 1 but the odd and even bits have been put into
  151. 2 3 2 0
  152. different words. The main trick is to remember that
  153. t=((l>>size)^r)&(mask);
  154. r^=t;
  155. l^=(t<<size);
  156. can be used to swap and move bits between words.
  157. So l = 0 1 2 3 r = 16 17 18 19
  158. 4 5 6 7 20 21 22 23
  159. 8 9 10 11 24 25 26 27
  160. 12 13 14 15 28 29 30 31
  161. becomes (for size == 2 and mask == 0x3333)
  162. t = 2^16 3^17 -- -- l = 0 1 16 17 r = 2 3 18 19
  163. 6^20 7^21 -- -- 4 5 20 21 6 7 22 23
  164. 10^24 11^25 -- -- 8 9 24 25 10 11 26 27
  165. 14^28 15^29 -- -- 12 13 28 29 14 15 30 31
  166. Thanks for hints from Richard Outerbridge - he told me IP&FP
  167. could be done in 15 xor, 10 shifts and 5 ands.
  168. When I finally started to think of the problem in 2D
  169. I first got ~42 operations without xors. When I remembered
  170. how to use xors :-) I got it to its final state.
  171. */
  /*
   * PERM_OP(a,b,t,n,m): exchange the bits of b selected by mask m with the
   * bits of a selected by (m << n).
   *
   * t receives ((a >> n) ^ b) & m, i.e. the difference between the two bit
   * groups; XORing t into b and (t << n) into a swaps them.  Applying the
   * same PERM_OP twice therefore restores a and b.
   *
   * a, b and t must be modifiable lvalues; a and b are evaluated twice.
   * Expands to a comma expression.
   */
  172. # define PERM_OP(a,b,t,n,m) ((t)=((((a)>>(n))^(b))&(m)),\
  173. (b)^=(t),\
  174. (a)^=((t)<<(n)))
  /*
   * IP(l,r): permute the bits of the pair l/r in place with five PERM_OP
   * steps, alternating which word is the shifted operand:
   *   (r,l) shift 4,  mask 0x0f0f0f0f
   *   (l,r) shift 16, mask 0x0000ffff
   *   (r,l) shift 2,  mask 0x33333333
   *   (l,r) shift 8,  mask 0x00ff00ff
   *   (r,l) shift 1,  mask 0x55555555
   * tt is a block-local scratch word.  l and r must be modifiable lvalues.
   * Expands to a braced block, not an expression.
   * NOTE(review): by its name this is the DES initial permutation - confirm
   * the bit numbering against the callers.
   */
  175. # define IP(l,r) \
  176. { \
  177. register DES_LONG tt; \
  178. PERM_OP(r,l,tt, 4,0x0f0f0f0fL); \
  179. PERM_OP(l,r,tt,16,0x0000ffffL); \
  180. PERM_OP(r,l,tt, 2,0x33333333L); \
  181. PERM_OP(l,r,tt, 8,0x00ff00ffL); \
  182. PERM_OP(r,l,tt, 1,0x55555555L); \
  183. }
  /*
   * FP(l,r): permute the bits of the pair l/r in place with five PERM_OP
   * steps:
   *   (l,r) shift 1,  mask 0x55555555
   *   (r,l) shift 8,  mask 0x00ff00ff
   *   (l,r) shift 2,  mask 0x33333333
   *   (r,l) shift 16, mask 0x0000ffff
   *   (l,r) shift 4,  mask 0x0f0f0f0f
   * These are the steps of IP in reverse order with the two operands
   * exchanged in every step.  Since each PERM_OP undoes itself, FP(l,r)
   * reverses IP(r,l) - note the swapped arguments - rather than IP(l,r).
   * tt is a block-local scratch word.  l and r must be modifiable lvalues.
   * Expands to a braced block, not an expression.
   */
  184. # define FP(l,r) \
  185. { \
  186. register DES_LONG tt; \
  187. PERM_OP(l,r,tt, 1,0x55555555L); \
  188. PERM_OP(r,l,tt, 8,0x00ff00ffL); \
  189. PERM_OP(l,r,tt, 2,0x33333333L); \
  190. PERM_OP(r,l,tt,16,0x0000ffffL); \
  191. PERM_OP(l,r,tt, 4,0x0f0f0f0fL); \
  192. }
  /*
   * Eight read-only tables of 64 DES_LONG entries each, defined in another
   * translation unit.  D_ENCRYPT indexes them as DES_SPtrans[k][v] with
   * k in 0..7 and v a 6-bit value.
   */
  193. extern const DES_LONG DES_SPtrans[8][64];
  /*
   * Declaration only; the definition lives in another translation unit.
   * NOTE(review): presumably the core of fcrypt(), with Eswap0/Eswap1
   * supplying the E0/E1 masks consumed by the DES_FCRYPT form of LOAD_DATA,
   * ks the key schedule and out the destination for the result - confirm
   * against the definition.
   */
  194. void fcrypt_body(DES_LONG *out, DES_key_schedule *ks,
  195. DES_LONG Eswap0, DES_LONG Eswap1);
  196. #endif