md32_common.h 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437
  1. /* crypto/md32_common.h */
  2. /* ====================================================================
  3. * Copyright (c) 1999-2007 The OpenSSL Project. All rights reserved.
  4. *
  5. * Redistribution and use in source and binary forms, with or without
  6. * modification, are permitted provided that the following conditions
  7. * are met:
  8. *
  9. * 1. Redistributions of source code must retain the above copyright
  10. * notice, this list of conditions and the following disclaimer.
  11. *
  12. * 2. Redistributions in binary form must reproduce the above copyright
  13. * notice, this list of conditions and the following disclaimer in
  14. * the documentation and/or other materials provided with the
  15. * distribution.
  16. *
  17. * 3. All advertising materials mentioning features or use of this
  18. * software must display the following acknowledgment:
  19. * "This product includes software developed by the OpenSSL Project
  20. * for use in the OpenSSL Toolkit. (http://www.OpenSSL.org/)"
  21. *
  22. * 4. The names "OpenSSL Toolkit" and "OpenSSL Project" must not be used to
  23. * endorse or promote products derived from this software without
  24. * prior written permission. For written permission, please contact
  25. * licensing@OpenSSL.org.
  26. *
  27. * 5. Products derived from this software may not be called "OpenSSL"
  28. * nor may "OpenSSL" appear in their names without prior written
  29. * permission of the OpenSSL Project.
  30. *
  31. * 6. Redistributions of any form whatsoever must retain the following
  32. * acknowledgment:
  33. * "This product includes software developed by the OpenSSL Project
  34. * for use in the OpenSSL Toolkit (http://www.OpenSSL.org/)"
  35. *
  36. * THIS SOFTWARE IS PROVIDED BY THE OpenSSL PROJECT ``AS IS'' AND ANY
  37. * EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  38. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
  39. * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE OpenSSL PROJECT OR
  40. * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  41. * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  42. * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  43. * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  44. * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
  45. * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  46. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
  47. * OF THE POSSIBILITY OF SUCH DAMAGE.
  48. * ====================================================================
  49. *
  50. */
  51. /*-
  52. * This is a generic 32 bit "collector" for message digest algorithms.
  53. * Whenever needed it collects input character stream into chunks of
  54. * 32 bit values and invokes a block function that performs actual hash
  55. * calculations.
  56. *
  57. * Porting guide.
  58. *
  59. * Obligatory macros:
  60. *
  61. * DATA_ORDER_IS_BIG_ENDIAN or DATA_ORDER_IS_LITTLE_ENDIAN
  62. * this macro defines byte order of input stream.
  63. * HASH_CBLOCK
  64. * size of a unit chunk HASH_BLOCK operates on.
  65. * HASH_LONG
  66. * has to be at lest 32 bit wide, if it's wider, then
  67. * HASH_LONG_LOG2 *has to* be defined along
  68. * HASH_CTX
  69. * context structure that at least contains following
  70. * members:
  71. * typedef struct {
  72. * ...
  73. * HASH_LONG Nl,Nh;
  74. * either {
  75. * HASH_LONG data[HASH_LBLOCK];
  76. * unsigned char data[HASH_CBLOCK];
  77. * };
  78. * unsigned int num;
  79. * ...
  80. * } HASH_CTX;
  81. * data[] vector is expected to be zeroed upon first call to
  82. * HASH_UPDATE.
  83. * HASH_UPDATE
  84. * name of "Update" function, implemented here.
  85. * HASH_TRANSFORM
  86. * name of "Transform" function, implemented here.
  87. * HASH_FINAL
  88. * name of "Final" function, implemented here.
  89. * HASH_BLOCK_DATA_ORDER
  90. * name of "block" function capable of treating *unaligned* input
  91. * message in original (data) byte order, implemented externally.
  92. * HASH_MAKE_STRING
  93. * macro convering context variables to an ASCII hash string.
  94. *
  95. * MD5 example:
  96. *
  97. * #define DATA_ORDER_IS_LITTLE_ENDIAN
  98. *
  99. * #define HASH_LONG MD5_LONG
  100. * #define HASH_LONG_LOG2 MD5_LONG_LOG2
  101. * #define HASH_CTX MD5_CTX
  102. * #define HASH_CBLOCK MD5_CBLOCK
  103. * #define HASH_UPDATE MD5_Update
  104. * #define HASH_TRANSFORM MD5_Transform
  105. * #define HASH_FINAL MD5_Final
  106. * #define HASH_BLOCK_DATA_ORDER md5_block_data_order
  107. *
  108. * <appro@fy.chalmers.se>
  109. */
  110. #include <openssl/crypto.h>
  111. #if !defined(DATA_ORDER_IS_BIG_ENDIAN) && !defined(DATA_ORDER_IS_LITTLE_ENDIAN)
  112. # error "DATA_ORDER must be defined!"
  113. #endif
  114. #ifndef HASH_CBLOCK
  115. # error "HASH_CBLOCK must be defined!"
  116. #endif
  117. #ifndef HASH_LONG
  118. # error "HASH_LONG must be defined!"
  119. #endif
  120. #ifndef HASH_CTX
  121. # error "HASH_CTX must be defined!"
  122. #endif
  123. #ifndef HASH_UPDATE
  124. # error "HASH_UPDATE must be defined!"
  125. #endif
  126. #ifndef HASH_TRANSFORM
  127. # error "HASH_TRANSFORM must be defined!"
  128. #endif
  129. #ifndef HASH_FINAL
  130. # error "HASH_FINAL must be defined!"
  131. #endif
  132. #ifndef HASH_BLOCK_DATA_ORDER
  133. # error "HASH_BLOCK_DATA_ORDER must be defined!"
  134. #endif
  135. /*
  136. * Engage compiler specific rotate intrinsic function if available.
  137. */
  138. #undef ROTATE
  139. #ifndef PEDANTIC
  140. # if defined(_MSC_VER)
  141. # define ROTATE(a,n) _lrotl(a,n)
  142. # elif defined(__ICC)
  143. # define ROTATE(a,n) _rotl(a,n)
  144. # elif defined(__MWERKS__)
  145. # if defined(__POWERPC__)
  146. # define ROTATE(a,n) __rlwinm(a,n,0,31)
  147. # elif defined(__MC68K__)
  148. /* Motorola specific tweak. <appro@fy.chalmers.se> */
  149. # define ROTATE(a,n) ( n<24 ? __rol(a,n) : __ror(a,32-n) )
  150. # else
  151. # define ROTATE(a,n) __rol(a,n)
  152. # endif
  153. # elif defined(__GNUC__) && __GNUC__>=2 && !defined(OPENSSL_NO_ASM) && !defined(OPENSSL_NO_INLINE_ASM)
  154. /*
  155. * Some GNU C inline assembler templates. Note that these are
  156. * rotates by *constant* number of bits! But that's exactly
  157. * what we need here...
  158. * <appro@fy.chalmers.se>
  159. */
  160. # if defined(__i386) || defined(__i386__) || defined(__x86_64) || defined(__x86_64__)
  161. # define ROTATE(a,n) ({ register unsigned int ret; \
  162. asm ( \
  163. "roll %1,%0" \
  164. : "=r"(ret) \
  165. : "I"(n), "0"((unsigned int)(a)) \
  166. : "cc"); \
  167. ret; \
  168. })
  169. # elif defined(_ARCH_PPC) || defined(_ARCH_PPC64) || \
  170. defined(__powerpc) || defined(__ppc__) || defined(__powerpc64__)
  171. # define ROTATE(a,n) ({ register unsigned int ret; \
  172. asm ( \
  173. "rlwinm %0,%1,%2,0,31" \
  174. : "=r"(ret) \
  175. : "r"(a), "I"(n)); \
  176. ret; \
  177. })
  178. # elif defined(__s390x__)
  179. # define ROTATE(a,n) ({ register unsigned int ret; \
  180. asm ("rll %0,%1,%2" \
  181. : "=r"(ret) \
  182. : "r"(a), "I"(n)); \
  183. ret; \
  184. })
  185. # endif
  186. # endif
  187. #endif /* PEDANTIC */
  188. #ifndef ROTATE
  189. # define ROTATE(a,n) (((a)<<(n))|(((a)&0xffffffff)>>(32-(n))))
  190. #endif
  191. #if defined(DATA_ORDER_IS_BIG_ENDIAN)
  192. # ifndef PEDANTIC
  193. # if defined(__GNUC__) && __GNUC__>=2 && !defined(OPENSSL_NO_ASM) && !defined(OPENSSL_NO_INLINE_ASM)
  194. # if ((defined(__i386) || defined(__i386__)) && !defined(I386_ONLY)) || \
  195. (defined(__x86_64) || defined(__x86_64__))
  196. # if !defined(B_ENDIAN)
  197. /*
  198. * This gives ~30-40% performance improvement in SHA-256 compiled
  199. * with gcc [on P4]. Well, first macro to be frank. We can pull
  200. * this trick on x86* platforms only, because these CPUs can fetch
  201. * unaligned data without raising an exception.
  202. */
  203. # define HOST_c2l(c,l) ({ unsigned int r=*((const unsigned int *)(c)); \
  204. asm ("bswapl %0":"=r"(r):"0"(r)); \
  205. (c)+=4; (l)=r; })
  206. # define HOST_l2c(l,c) ({ unsigned int r=(l); \
  207. asm ("bswapl %0":"=r"(r):"0"(r)); \
  208. *((unsigned int *)(c))=r; (c)+=4; r; })
  209. # endif
  210. # elif defined(__aarch64__)
  211. # if defined(__BYTE_ORDER__)
  212. # if defined(__ORDER_LITTLE_ENDIAN__) && __BYTE_ORDER__==__ORDER_LITTLE_ENDIAN__
  213. # define HOST_c2l(c,l) ({ unsigned int r; \
  214. asm ("rev %w0,%w1" \
  215. :"=r"(r) \
  216. :"r"(*((const unsigned int *)(c))));\
  217. (c)+=4; (l)=r; })
  218. # define HOST_l2c(l,c) ({ unsigned int r; \
  219. asm ("rev %w0,%w1" \
  220. :"=r"(r) \
  221. :"r"((unsigned int)(l)));\
  222. *((unsigned int *)(c))=r; (c)+=4; r; })
  223. # elif defined(__ORDER_BIG_ENDIAN__) && __BYTE_ORDER__==__ORDER_BIG_ENDIAN__
  224. # define HOST_c2l(c,l) ((l)=*((const unsigned int *)(c)), (c)+=4, (l))
  225. # define HOST_l2c(l,c) (*((unsigned int *)(c))=(l), (c)+=4, (l))
  226. # endif
  227. # endif
  228. # endif
  229. # endif
  230. # if defined(__s390__) || defined(__s390x__)
  231. # define HOST_c2l(c,l) ((l)=*((const unsigned int *)(c)), (c)+=4, (l))
  232. # define HOST_l2c(l,c) (*((unsigned int *)(c))=(l), (c)+=4, (l))
  233. # endif
  234. # endif
  235. # ifndef HOST_c2l
  236. # define HOST_c2l(c,l) (l =(((unsigned long)(*((c)++)))<<24), \
  237. l|=(((unsigned long)(*((c)++)))<<16), \
  238. l|=(((unsigned long)(*((c)++)))<< 8), \
  239. l|=(((unsigned long)(*((c)++))) ) )
  240. # endif
  241. # ifndef HOST_l2c
  242. # define HOST_l2c(l,c) (*((c)++)=(unsigned char)(((l)>>24)&0xff), \
  243. *((c)++)=(unsigned char)(((l)>>16)&0xff), \
  244. *((c)++)=(unsigned char)(((l)>> 8)&0xff), \
  245. *((c)++)=(unsigned char)(((l) )&0xff), \
  246. l)
  247. # endif
  248. #elif defined(DATA_ORDER_IS_LITTLE_ENDIAN)
  249. # ifndef PEDANTIC
  250. # if defined(__GNUC__) && __GNUC__>=2 && !defined(OPENSSL_NO_ASM) && !defined(OPENSSL_NO_INLINE_ASM)
  251. # if defined(__s390x__)
  252. # define HOST_c2l(c,l) ({ asm ("lrv %0,%1" \
  253. :"=d"(l) :"m"(*(const unsigned int *)(c)));\
  254. (c)+=4; (l); })
  255. # define HOST_l2c(l,c) ({ asm ("strv %1,%0" \
  256. :"=m"(*(unsigned int *)(c)) :"d"(l));\
  257. (c)+=4; (l); })
  258. # endif
  259. # endif
  260. # if defined(__i386) || defined(__i386__) || defined(__x86_64) || defined(__x86_64__)
  261. # ifndef B_ENDIAN
  262. /* See comment in DATA_ORDER_IS_BIG_ENDIAN section. */
  263. # define HOST_c2l(c,l) ((l)=*((const unsigned int *)(c)), (c)+=4, l)
  264. # define HOST_l2c(l,c) (*((unsigned int *)(c))=(l), (c)+=4, l)
  265. # endif
  266. # endif
  267. # endif
  268. # ifndef HOST_c2l
  269. # define HOST_c2l(c,l) (l =(((unsigned long)(*((c)++))) ), \
  270. l|=(((unsigned long)(*((c)++)))<< 8), \
  271. l|=(((unsigned long)(*((c)++)))<<16), \
  272. l|=(((unsigned long)(*((c)++)))<<24) )
  273. # endif
  274. # ifndef HOST_l2c
  275. # define HOST_l2c(l,c) (*((c)++)=(unsigned char)(((l) )&0xff), \
  276. *((c)++)=(unsigned char)(((l)>> 8)&0xff), \
  277. *((c)++)=(unsigned char)(((l)>>16)&0xff), \
  278. *((c)++)=(unsigned char)(((l)>>24)&0xff), \
  279. l)
  280. # endif
  281. #endif
  282. /*
  283. * Time for some action:-)
  284. */
  285. int HASH_UPDATE(HASH_CTX *c, const void *data_, size_t len)
  286. {
  287. const unsigned char *data = data_;
  288. unsigned char *p;
  289. HASH_LONG l;
  290. size_t n;
  291. if (len == 0)
  292. return 1;
  293. l = (c->Nl + (((HASH_LONG) len) << 3)) & 0xffffffffUL;
  294. /*
  295. * 95-05-24 eay Fixed a bug with the overflow handling, thanks to Wei Dai
  296. * <weidai@eskimo.com> for pointing it out.
  297. */
  298. if (l < c->Nl) /* overflow */
  299. c->Nh++;
  300. c->Nh += (HASH_LONG) (len >> 29); /* might cause compiler warning on
  301. * 16-bit */
  302. c->Nl = l;
  303. n = c->num;
  304. if (n != 0) {
  305. p = (unsigned char *)c->data;
  306. if (len >= HASH_CBLOCK || len + n >= HASH_CBLOCK) {
  307. memcpy(p + n, data, HASH_CBLOCK - n);
  308. HASH_BLOCK_DATA_ORDER(c, p, 1);
  309. n = HASH_CBLOCK - n;
  310. data += n;
  311. len -= n;
  312. c->num = 0;
  313. /*
  314. * We use memset rather than OPENSSL_cleanse() here deliberately.
  315. * Using OPENSSL_cleanse() here could be a performance issue. It
  316. * will get properly cleansed on finalisation so this isn't a
  317. * security problem.
  318. */
  319. memset(p, 0, HASH_CBLOCK); /* keep it zeroed */
  320. } else {
  321. memcpy(p + n, data, len);
  322. c->num += (unsigned int)len;
  323. return 1;
  324. }
  325. }
  326. n = len / HASH_CBLOCK;
  327. if (n > 0) {
  328. HASH_BLOCK_DATA_ORDER(c, data, n);
  329. n *= HASH_CBLOCK;
  330. data += n;
  331. len -= n;
  332. }
  333. if (len != 0) {
  334. p = (unsigned char *)c->data;
  335. c->num = (unsigned int)len;
  336. memcpy(p, data, len);
  337. }
  338. return 1;
  339. }
  340. void HASH_TRANSFORM(HASH_CTX *c, const unsigned char *data)
  341. {
  342. HASH_BLOCK_DATA_ORDER(c, data, 1);
  343. }
  344. int HASH_FINAL(unsigned char *md, HASH_CTX *c)
  345. {
  346. unsigned char *p = (unsigned char *)c->data;
  347. size_t n = c->num;
  348. p[n] = 0x80; /* there is always room for one */
  349. n++;
  350. if (n > (HASH_CBLOCK - 8)) {
  351. memset(p + n, 0, HASH_CBLOCK - n);
  352. n = 0;
  353. HASH_BLOCK_DATA_ORDER(c, p, 1);
  354. }
  355. memset(p + n, 0, HASH_CBLOCK - 8 - n);
  356. p += HASH_CBLOCK - 8;
  357. #if defined(DATA_ORDER_IS_BIG_ENDIAN)
  358. (void)HOST_l2c(c->Nh, p);
  359. (void)HOST_l2c(c->Nl, p);
  360. #elif defined(DATA_ORDER_IS_LITTLE_ENDIAN)
  361. (void)HOST_l2c(c->Nl, p);
  362. (void)HOST_l2c(c->Nh, p);
  363. #endif
  364. p -= HASH_CBLOCK;
  365. HASH_BLOCK_DATA_ORDER(c, p, 1);
  366. c->num = 0;
  367. OPENSSL_cleanse(p, HASH_CBLOCK);
  368. #ifndef HASH_MAKE_STRING
  369. # error "HASH_MAKE_STRING must be defined!"
  370. #else
  371. HASH_MAKE_STRING(c, md);
  372. #endif
  373. return 1;
  374. }
  375. #ifndef MD32_REG_T
  376. # if defined(__alpha) || defined(__sparcv9) || defined(__mips)
  377. # define MD32_REG_T long
  378. /*
  379. * This comment was originaly written for MD5, which is why it
  380. * discusses A-D. But it basically applies to all 32-bit digests,
  381. * which is why it was moved to common header file.
  382. *
  383. * In case you wonder why A-D are declared as long and not
  384. * as MD5_LONG. Doing so results in slight performance
  385. * boost on LP64 architectures. The catch is we don't
  386. * really care if 32 MSBs of a 64-bit register get polluted
  387. * with eventual overflows as we *save* only 32 LSBs in
  388. * *either* case. Now declaring 'em long excuses the compiler
  389. * from keeping 32 MSBs zeroed resulting in 13% performance
  390. * improvement under SPARC Solaris7/64 and 5% under AlphaLinux.
  391. * Well, to be honest it should say that this *prevents*
  392. * performance degradation.
  393. * <appro@fy.chalmers.se>
  394. */
  395. # else
  396. /*
  397. * Above is not absolute and there are LP64 compilers that
  398. * generate better code if MD32_REG_T is defined int. The above
  399. * pre-processor condition reflects the circumstances under which
  400. * the conclusion was made and is subject to further extension.
  401. * <appro@fy.chalmers.se>
  402. */
  403. # define MD32_REG_T int
  404. # endif
  405. #endif