paul | 718e374 | 2002-12-13 20:15:29 +0000 | [diff] [blame] | 1 | /* md5.c - Functions to compute MD5 message digest of files or memory blocks |
| 2 | according to the definition of MD5 in RFC 1321 from April 1992. |
| 3 | Copyright (C) 1995, 1996, 1997 Free Software Foundation, Inc. |
| 4 | This file is part of the GNU C Library. |
| 5 | |
| 6 | The GNU C Library is free software; you can redistribute it and/or |
| 7 | modify it under the terms of the GNU Library General Public License as |
| 8 | published by the Free Software Foundation; either version 2 of the |
| 9 | License, or (at your option) any later version. |
| 10 | |
| 11 | The GNU C Library is distributed in the hope that it will be useful, |
| 12 | but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 13 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 14 | Library General Public License for more details. |
| 15 | |
| 16 | You should have received a copy of the GNU Library General Public |
| 17 | License along with the GNU C Library; see the file COPYING.LIB. If not, |
| 18 | write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330, |
| 19 | Boston, MA 02111-1307, USA. */ |
| 20 | |
| 21 | /* Written by Ulrich Drepper <drepper@gnu.ai.mit.edu>, 1995. */ |
| 22 | |
| 23 | #ifdef HAVE_CONFIG_H |
| 24 | # include <config.h> |
| 25 | #endif |
| 26 | |
| 27 | #include <sys/types.h> |
| 28 | |
| 29 | #if STDC_HEADERS || defined _LIBC |
| 30 | # include <stdlib.h> |
| 31 | # include <string.h> |
| 32 | #else |
| 33 | # ifndef HAVE_MEMCPY |
| 34 | # define memcpy(d, s, n) bcopy ((s), (d), (n)) |
| 35 | # endif |
| 36 | #endif |
| 37 | |
| 38 | #include "md5-gnu.h" |
| 39 | |
| 40 | #ifdef _LIBC |
| 41 | # include <endian.h> |
| 42 | # if __BYTE_ORDER == __BIG_ENDIAN |
| 43 | # define WORDS_BIGENDIAN 1 |
| 44 | # endif |
| 45 | /* We need to keep the namespace clean so define the MD5 function |
| 46 | protected using leading __ and use weak aliases. */ |
| 47 | # define md5_init_ctx __md5_init_ctx |
| 48 | # define md5_process_block __md5_process_block |
| 49 | # define md5_process_bytes __md5_process_bytes |
| 50 | # define md5_finish_ctx __md5_finish_ctx |
| 51 | # define md5_read_ctx __md5_read_ctx |
| 52 | # define md5_stream __md5_stream |
| 53 | # define md5_buffer __md5_buffer |
| 54 | #endif |
| 55 | |
| 56 | #ifdef WORDS_BIGENDIAN |
| 57 | # define SWAP(n) \ |
| 58 | (((n) << 24) | (((n) & 0xff00) << 8) | (((n) >> 8) & 0xff00) | ((n) >> 24)) |
| 59 | #else |
| 60 | # define SWAP(n) (n) |
| 61 | #endif |
| 62 | |
| 63 | |
| 64 | /* This array contains the bytes used to pad the buffer to the next |
| 65 | 64-byte boundary. (RFC 1321, 3.1: Step 1) */ |
| 66 | static const unsigned char fillbuf[64] = { 0x80, 0 /* , 0, 0, ... */ }; |
| 67 | |
| 68 | |
| 69 | /* Initialize structure containing state of computation. |
| 70 | (RFC 1321, 3.3: Step 3) */ |
| 71 | void |
paul | 8cc4198 | 2005-05-06 21:25:49 +0000 | [diff] [blame^] | 72 | md5_init_ctx (struct md5_ctx *ctx) |
paul | 718e374 | 2002-12-13 20:15:29 +0000 | [diff] [blame] | 73 | { |
| 74 | ctx->A = 0x67452301; |
| 75 | ctx->B = 0xefcdab89; |
| 76 | ctx->C = 0x98badcfe; |
| 77 | ctx->D = 0x10325476; |
| 78 | |
| 79 | ctx->total[0] = ctx->total[1] = 0; |
| 80 | ctx->buflen = 0; |
| 81 | } |
| 82 | |
| 83 | /* Put result from CTX in first 16 bytes following RESBUF. The result |
| 84 | must be in little endian byte order. |
| 85 | |
| 86 | IMPORTANT: On some systems it is required that RESBUF is correctly |
| 87 | aligned for a 32 bits value. */ |
| 88 | void * |
paul | 8cc4198 | 2005-05-06 21:25:49 +0000 | [diff] [blame^] | 89 | md5_read_ctx (const struct md5_ctx *ctx, void *resbuf) |
paul | 718e374 | 2002-12-13 20:15:29 +0000 | [diff] [blame] | 90 | { |
| 91 | ((md5_uint32 *) resbuf)[0] = SWAP (ctx->A); |
| 92 | ((md5_uint32 *) resbuf)[1] = SWAP (ctx->B); |
| 93 | ((md5_uint32 *) resbuf)[2] = SWAP (ctx->C); |
| 94 | ((md5_uint32 *) resbuf)[3] = SWAP (ctx->D); |
| 95 | |
| 96 | return resbuf; |
| 97 | } |
| 98 | |
| 99 | /* Process the remaining bytes in the internal buffer and the usual |
| 100 | prolog according to the standard and write the result to RESBUF. |
| 101 | |
| 102 | IMPORTANT: On some systems it is required that RESBUF is correctly |
| 103 | aligned for a 32 bits value. */ |
| 104 | void * |
paul | 8cc4198 | 2005-05-06 21:25:49 +0000 | [diff] [blame^] | 105 | md5_finish_ctx (struct md5_ctx *ctx, void *resbuf) |
paul | 718e374 | 2002-12-13 20:15:29 +0000 | [diff] [blame] | 106 | { |
| 107 | /* Take yet unprocessed bytes into account. */ |
| 108 | md5_uint32 bytes = ctx->buflen; |
| 109 | size_t pad; |
| 110 | |
| 111 | /* Now count remaining bytes. */ |
| 112 | ctx->total[0] += bytes; |
| 113 | if (ctx->total[0] < bytes) |
| 114 | ++ctx->total[1]; |
| 115 | |
| 116 | pad = bytes >= 56 ? 64 + 56 - bytes : 56 - bytes; |
| 117 | memcpy (&ctx->buffer[bytes], fillbuf, pad); |
| 118 | |
| 119 | /* Put the 64-bit file length in *bits* at the end of the buffer. */ |
| 120 | *(md5_uint32 *) &ctx->buffer[bytes + pad] = SWAP (ctx->total[0] << 3); |
| 121 | *(md5_uint32 *) &ctx->buffer[bytes + pad + 4] = SWAP ((ctx->total[1] << 3) | |
| 122 | (ctx->total[0] >> 29)); |
| 123 | |
| 124 | /* Process last bytes. */ |
| 125 | md5_process_block (ctx->buffer, bytes + pad + 8, ctx); |
| 126 | |
| 127 | return md5_read_ctx (ctx, resbuf); |
| 128 | } |
| 129 | |
| 130 | /* Compute MD5 message digest for bytes read from STREAM. The |
| 131 | resulting message digest number will be written into the 16 bytes |
| 132 | beginning at RESBLOCK. */ |
| 133 | int |
paul | 8cc4198 | 2005-05-06 21:25:49 +0000 | [diff] [blame^] | 134 | md5_stream (FILE *stream, void *resblock) |
paul | 718e374 | 2002-12-13 20:15:29 +0000 | [diff] [blame] | 135 | { |
| 136 | /* Important: BLOCKSIZE must be a multiple of 64. */ |
| 137 | #define BLOCKSIZE 4096 |
| 138 | struct md5_ctx ctx; |
| 139 | char buffer[BLOCKSIZE + 72]; |
| 140 | size_t sum; |
| 141 | |
| 142 | /* Initialize the computation context. */ |
| 143 | md5_init_ctx (&ctx); |
| 144 | |
| 145 | /* Iterate over full file contents. */ |
| 146 | while (1) |
| 147 | { |
| 148 | /* We read the file in blocks of BLOCKSIZE bytes. One call of the |
| 149 | computation function processes the whole buffer so that with the |
| 150 | next round of the loop another block can be read. */ |
| 151 | size_t n; |
| 152 | sum = 0; |
| 153 | |
| 154 | /* Read block. Take care for partial reads. */ |
| 155 | do |
| 156 | { |
| 157 | n = fread (buffer + sum, 1, BLOCKSIZE - sum, stream); |
| 158 | |
| 159 | sum += n; |
| 160 | } |
| 161 | while (sum < BLOCKSIZE && n != 0); |
| 162 | if (n == 0 && ferror (stream)) |
| 163 | return 1; |
| 164 | |
| 165 | /* If end of file is reached, end the loop. */ |
| 166 | if (n == 0) |
| 167 | break; |
| 168 | |
| 169 | /* Process buffer with BLOCKSIZE bytes. Note that |
| 170 | BLOCKSIZE % 64 == 0 |
| 171 | */ |
| 172 | md5_process_block (buffer, BLOCKSIZE, &ctx); |
| 173 | } |
| 174 | |
| 175 | /* Add the last bytes if necessary. */ |
| 176 | if (sum > 0) |
| 177 | md5_process_bytes (buffer, sum, &ctx); |
| 178 | |
| 179 | /* Construct result in desired memory. */ |
| 180 | md5_finish_ctx (&ctx, resblock); |
| 181 | return 0; |
| 182 | } |
| 183 | |
| 184 | /* Compute MD5 message digest for LEN bytes beginning at BUFFER. The |
| 185 | result is always in little endian byte order, so that a byte-wise |
| 186 | output yields to the wanted ASCII representation of the message |
| 187 | digest. */ |
| 188 | void * |
paul | 8cc4198 | 2005-05-06 21:25:49 +0000 | [diff] [blame^] | 189 | md5_buffer (const char *buffer, size_t len, void *resblock) |
paul | 718e374 | 2002-12-13 20:15:29 +0000 | [diff] [blame] | 190 | { |
| 191 | struct md5_ctx ctx; |
| 192 | |
| 193 | /* Initialize the computation context. */ |
| 194 | md5_init_ctx (&ctx); |
| 195 | |
| 196 | /* Process whole buffer but last len % 64 bytes. */ |
| 197 | md5_process_bytes (buffer, len, &ctx); |
| 198 | |
| 199 | /* Put result in desired memory area. */ |
| 200 | return md5_finish_ctx (&ctx, resblock); |
| 201 | } |
| 202 | |
| 203 | |
| 204 | void |
paul | 8cc4198 | 2005-05-06 21:25:49 +0000 | [diff] [blame^] | 205 | md5_process_bytes (const void *buffer, size_t len, struct md5_ctx *ctx) |
paul | 718e374 | 2002-12-13 20:15:29 +0000 | [diff] [blame] | 206 | { |
| 207 | /* When we already have some bits in our internal buffer concatenate |
| 208 | both inputs first. */ |
| 209 | if (ctx->buflen != 0) |
| 210 | { |
| 211 | size_t left_over = ctx->buflen; |
| 212 | size_t add = 128 - left_over > len ? len : 128 - left_over; |
| 213 | |
| 214 | memcpy (&ctx->buffer[left_over], buffer, add); |
| 215 | ctx->buflen += add; |
| 216 | |
| 217 | if (left_over + add > 64) |
| 218 | { |
| 219 | md5_process_block (ctx->buffer, (left_over + add) & ~63, ctx); |
| 220 | /* The regions in the following copy operation cannot overlap. */ |
| 221 | memcpy (ctx->buffer, &ctx->buffer[(left_over + add) & ~63], |
| 222 | (left_over + add) & 63); |
| 223 | ctx->buflen = (left_over + add) & 63; |
| 224 | } |
| 225 | |
| 226 | buffer = (const char *) buffer + add; |
| 227 | len -= add; |
| 228 | } |
| 229 | |
| 230 | /* Process available complete blocks. */ |
| 231 | if (len > 64) |
| 232 | { |
| 233 | md5_process_block (buffer, len & ~63, ctx); |
| 234 | buffer = (const char *) buffer + (len & ~63); |
| 235 | len &= 63; |
| 236 | } |
| 237 | |
| 238 | /* Move remaining bytes in internal buffer. */ |
| 239 | if (len > 0) |
| 240 | { |
| 241 | memcpy (ctx->buffer, buffer, len); |
| 242 | ctx->buflen = len; |
| 243 | } |
| 244 | } |
| 245 | |
| 246 | |
| 247 | /* These are the four functions used in the four steps of the MD5 algorithm |
| 248 | and defined in the RFC 1321. The first function is a little bit optimized |
| 249 | (as found in Colin Plumbs public domain implementation). */ |
| 250 | /* #define FF(b, c, d) ((b & c) | (~b & d)) */ |
| 251 | #define FF(b, c, d) (d ^ (b & (c ^ d))) |
| 252 | #define FG(b, c, d) FF (d, b, c) |
| 253 | #define FH(b, c, d) (b ^ c ^ d) |
| 254 | #define FI(b, c, d) (c ^ (b | ~d)) |
| 255 | |
| 256 | /* Process LEN bytes of BUFFER, accumulating context into CTX. |
| 257 | It is assumed that LEN % 64 == 0. */ |
| 258 | |
| 259 | void |
paul | 8cc4198 | 2005-05-06 21:25:49 +0000 | [diff] [blame^] | 260 | md5_process_block (const void *buffer, size_t len, struct md5_ctx *ctx) |
paul | 718e374 | 2002-12-13 20:15:29 +0000 | [diff] [blame] | 261 | { |
| 262 | md5_uint32 correct_words[16]; |
| 263 | const md5_uint32 *words = buffer; |
| 264 | size_t nwords = len / sizeof (md5_uint32); |
| 265 | const md5_uint32 *endp = words + nwords; |
| 266 | md5_uint32 A = ctx->A; |
| 267 | md5_uint32 B = ctx->B; |
| 268 | md5_uint32 C = ctx->C; |
| 269 | md5_uint32 D = ctx->D; |
| 270 | |
| 271 | /* First increment the byte count. RFC 1321 specifies the possible |
| 272 | length of the file up to 2^64 bits. Here we only compute the |
| 273 | number of bytes. Do a double word increment. */ |
| 274 | ctx->total[0] += len; |
| 275 | if (ctx->total[0] < len) |
| 276 | ++ctx->total[1]; |
| 277 | |
| 278 | /* Process all bytes in the buffer with 64 bytes in each round of |
| 279 | the loop. */ |
| 280 | while (words < endp) |
| 281 | { |
| 282 | md5_uint32 *cwp = correct_words; |
| 283 | md5_uint32 A_save = A; |
| 284 | md5_uint32 B_save = B; |
| 285 | md5_uint32 C_save = C; |
| 286 | md5_uint32 D_save = D; |
| 287 | |
| 288 | /* First round: using the given function, the context and a constant |
| 289 | the next context is computed. Because the algorithms processing |
| 290 | unit is a 32-bit word and it is determined to work on words in |
| 291 | little endian byte order we perhaps have to change the byte order |
| 292 | before the computation. To reduce the work for the next steps |
| 293 | we store the swapped words in the array CORRECT_WORDS. */ |
| 294 | |
| 295 | #define OP(a, b, c, d, s, T) \ |
| 296 | do \ |
| 297 | { \ |
| 298 | a += FF (b, c, d) + (*cwp++ = SWAP (*words)) + T; \ |
| 299 | ++words; \ |
| 300 | CYCLIC (a, s); \ |
| 301 | a += b; \ |
| 302 | } \ |
| 303 | while (0) |
| 304 | |
| 305 | /* It is unfortunate that C does not provide an operator for |
| 306 | cyclic rotation. Hope the C compiler is smart enough. */ |
| 307 | #define CYCLIC(w, s) (w = (w << s) | (w >> (32 - s))) |
| 308 | |
| 309 | /* Before we start, one word to the strange constants. |
| 310 | They are defined in RFC 1321 as |
| 311 | |
| 312 | T[i] = (int) (4294967296.0 * fabs (sin (i))), i=1..64 |
| 313 | */ |
| 314 | |
| 315 | /* Round 1. */ |
| 316 | OP (A, B, C, D, 7, 0xd76aa478); |
| 317 | OP (D, A, B, C, 12, 0xe8c7b756); |
| 318 | OP (C, D, A, B, 17, 0x242070db); |
| 319 | OP (B, C, D, A, 22, 0xc1bdceee); |
| 320 | OP (A, B, C, D, 7, 0xf57c0faf); |
| 321 | OP (D, A, B, C, 12, 0x4787c62a); |
| 322 | OP (C, D, A, B, 17, 0xa8304613); |
| 323 | OP (B, C, D, A, 22, 0xfd469501); |
| 324 | OP (A, B, C, D, 7, 0x698098d8); |
| 325 | OP (D, A, B, C, 12, 0x8b44f7af); |
| 326 | OP (C, D, A, B, 17, 0xffff5bb1); |
| 327 | OP (B, C, D, A, 22, 0x895cd7be); |
| 328 | OP (A, B, C, D, 7, 0x6b901122); |
| 329 | OP (D, A, B, C, 12, 0xfd987193); |
| 330 | OP (C, D, A, B, 17, 0xa679438e); |
| 331 | OP (B, C, D, A, 22, 0x49b40821); |
| 332 | |
| 333 | /* For the second to fourth round we have the possibly swapped words |
| 334 | in CORRECT_WORDS. Redefine the macro to take an additional first |
| 335 | argument specifying the function to use. */ |
| 336 | #undef OP |
| 337 | #define OP(f, a, b, c, d, k, s, T) \ |
| 338 | do \ |
| 339 | { \ |
| 340 | a += f (b, c, d) + correct_words[k] + T; \ |
| 341 | CYCLIC (a, s); \ |
| 342 | a += b; \ |
| 343 | } \ |
| 344 | while (0) |
| 345 | |
| 346 | /* Round 2. */ |
| 347 | OP (FG, A, B, C, D, 1, 5, 0xf61e2562); |
| 348 | OP (FG, D, A, B, C, 6, 9, 0xc040b340); |
| 349 | OP (FG, C, D, A, B, 11, 14, 0x265e5a51); |
| 350 | OP (FG, B, C, D, A, 0, 20, 0xe9b6c7aa); |
| 351 | OP (FG, A, B, C, D, 5, 5, 0xd62f105d); |
| 352 | OP (FG, D, A, B, C, 10, 9, 0x02441453); |
| 353 | OP (FG, C, D, A, B, 15, 14, 0xd8a1e681); |
| 354 | OP (FG, B, C, D, A, 4, 20, 0xe7d3fbc8); |
| 355 | OP (FG, A, B, C, D, 9, 5, 0x21e1cde6); |
| 356 | OP (FG, D, A, B, C, 14, 9, 0xc33707d6); |
| 357 | OP (FG, C, D, A, B, 3, 14, 0xf4d50d87); |
| 358 | OP (FG, B, C, D, A, 8, 20, 0x455a14ed); |
| 359 | OP (FG, A, B, C, D, 13, 5, 0xa9e3e905); |
| 360 | OP (FG, D, A, B, C, 2, 9, 0xfcefa3f8); |
| 361 | OP (FG, C, D, A, B, 7, 14, 0x676f02d9); |
| 362 | OP (FG, B, C, D, A, 12, 20, 0x8d2a4c8a); |
| 363 | |
| 364 | /* Round 3. */ |
| 365 | OP (FH, A, B, C, D, 5, 4, 0xfffa3942); |
| 366 | OP (FH, D, A, B, C, 8, 11, 0x8771f681); |
| 367 | OP (FH, C, D, A, B, 11, 16, 0x6d9d6122); |
| 368 | OP (FH, B, C, D, A, 14, 23, 0xfde5380c); |
| 369 | OP (FH, A, B, C, D, 1, 4, 0xa4beea44); |
| 370 | OP (FH, D, A, B, C, 4, 11, 0x4bdecfa9); |
| 371 | OP (FH, C, D, A, B, 7, 16, 0xf6bb4b60); |
| 372 | OP (FH, B, C, D, A, 10, 23, 0xbebfbc70); |
| 373 | OP (FH, A, B, C, D, 13, 4, 0x289b7ec6); |
| 374 | OP (FH, D, A, B, C, 0, 11, 0xeaa127fa); |
| 375 | OP (FH, C, D, A, B, 3, 16, 0xd4ef3085); |
| 376 | OP (FH, B, C, D, A, 6, 23, 0x04881d05); |
| 377 | OP (FH, A, B, C, D, 9, 4, 0xd9d4d039); |
| 378 | OP (FH, D, A, B, C, 12, 11, 0xe6db99e5); |
| 379 | OP (FH, C, D, A, B, 15, 16, 0x1fa27cf8); |
| 380 | OP (FH, B, C, D, A, 2, 23, 0xc4ac5665); |
| 381 | |
| 382 | /* Round 4. */ |
| 383 | OP (FI, A, B, C, D, 0, 6, 0xf4292244); |
| 384 | OP (FI, D, A, B, C, 7, 10, 0x432aff97); |
| 385 | OP (FI, C, D, A, B, 14, 15, 0xab9423a7); |
| 386 | OP (FI, B, C, D, A, 5, 21, 0xfc93a039); |
| 387 | OP (FI, A, B, C, D, 12, 6, 0x655b59c3); |
| 388 | OP (FI, D, A, B, C, 3, 10, 0x8f0ccc92); |
| 389 | OP (FI, C, D, A, B, 10, 15, 0xffeff47d); |
| 390 | OP (FI, B, C, D, A, 1, 21, 0x85845dd1); |
| 391 | OP (FI, A, B, C, D, 8, 6, 0x6fa87e4f); |
| 392 | OP (FI, D, A, B, C, 15, 10, 0xfe2ce6e0); |
| 393 | OP (FI, C, D, A, B, 6, 15, 0xa3014314); |
| 394 | OP (FI, B, C, D, A, 13, 21, 0x4e0811a1); |
| 395 | OP (FI, A, B, C, D, 4, 6, 0xf7537e82); |
| 396 | OP (FI, D, A, B, C, 11, 10, 0xbd3af235); |
| 397 | OP (FI, C, D, A, B, 2, 15, 0x2ad7d2bb); |
| 398 | OP (FI, B, C, D, A, 9, 21, 0xeb86d391); |
| 399 | |
| 400 | /* Add the starting values of the context. */ |
| 401 | A += A_save; |
| 402 | B += B_save; |
| 403 | C += C_save; |
| 404 | D += D_save; |
| 405 | } |
| 406 | |
| 407 | /* Put checksum in context given as argument. */ |
| 408 | ctx->A = A; |
| 409 | ctx->B = B; |
| 410 | ctx->C = C; |
| 411 | ctx->D = D; |
| 412 | } |
| 413 | |
| 414 | |
| 415 | #ifdef _LIBC |
| 416 | /* Define weak aliases. */ |
| 417 | # undef md5_init_ctx |
| 418 | weak_alias (__md5_init_ctx, md5_init_ctx) |
| 419 | # undef md5_process_block |
| 420 | weak_alias (__md5_process_block, md5_process_block) |
| 421 | # undef md5_process_bytes |
| 422 | weak_alias (__md5_process_bytes, md5_process_bytes) |
| 423 | # undef md5_finish_ctx |
| 424 | weak_alias (__md5_finish_ctx, md5_finish_ctx) |
| 425 | # undef md5_read_ctx |
| 426 | weak_alias (__md5_read_ctx, md5_read_ctx) |
| 427 | # undef md5_stream |
| 428 | weak_alias (__md5_stream, md5_stream) |
| 429 | # undef md5_buffer |
| 430 | weak_alias (__md5_buffer, md5_buffer) |
| 431 | #endif |