Chris@43: /* adler32.c -- compute the Adler-32 checksum of a data stream Chris@43: * Copyright (C) 1995-2011 Mark Adler Chris@43: * For conditions of distribution and use, see copyright notice in zlib.h Chris@43: */ Chris@43: Chris@43: /* @(#) $Id$ */ Chris@43: Chris@43: #include "zutil.h" Chris@43: Chris@43: #define local static Chris@43: Chris@43: local uLong adler32_combine_ OF((uLong adler1, uLong adler2, z_off64_t len2)); Chris@43: Chris@43: #define BASE 65521 /* largest prime smaller than 65536 */ Chris@43: #define NMAX 5552 Chris@43: /* NMAX is the largest n such that 255n(n+1)/2 + (n+1)(BASE-1) <= 2^32-1 */ Chris@43: Chris@43: #define DO1(buf,i) {adler += (buf)[i]; sum2 += adler;} Chris@43: #define DO2(buf,i) DO1(buf,i); DO1(buf,i+1); Chris@43: #define DO4(buf,i) DO2(buf,i); DO2(buf,i+2); Chris@43: #define DO8(buf,i) DO4(buf,i); DO4(buf,i+4); Chris@43: #define DO16(buf) DO8(buf,0); DO8(buf,8); Chris@43: Chris@43: /* use NO_DIVIDE if your processor does not do division in hardware -- Chris@43: try it both ways to see which is faster */ Chris@43: #ifdef NO_DIVIDE Chris@43: /* note that this assumes BASE is 65521, where 65536 % 65521 == 15 Chris@43: (thank you to John Reiser for pointing this out) */ Chris@43: # define CHOP(a) \ Chris@43: do { \ Chris@43: unsigned long tmp = a >> 16; \ Chris@43: a &= 0xffffUL; \ Chris@43: a += (tmp << 4) - tmp; \ Chris@43: } while (0) Chris@43: # define MOD28(a) \ Chris@43: do { \ Chris@43: CHOP(a); \ Chris@43: if (a >= BASE) a -= BASE; \ Chris@43: } while (0) Chris@43: # define MOD(a) \ Chris@43: do { \ Chris@43: CHOP(a); \ Chris@43: MOD28(a); \ Chris@43: } while (0) Chris@43: # define MOD63(a) \ Chris@43: do { /* this assumes a is not negative */ \ Chris@43: z_off64_t tmp = a >> 32; \ Chris@43: a &= 0xffffffffL; \ Chris@43: a += (tmp << 8) - (tmp << 5) + tmp; \ Chris@43: tmp = a >> 16; \ Chris@43: a &= 0xffffL; \ Chris@43: a += (tmp << 4) - tmp; \ Chris@43: tmp = a >> 16; \ Chris@43: a &= 0xffffL; \ Chris@43: a += (tmp << 4) - tmp; \ Chris@43: if (a >= BASE) a -= BASE; \ Chris@43: } while (0) Chris@43: #else Chris@43: # define MOD(a) a %= BASE Chris@43: # define MOD28(a) a %= BASE Chris@43: # define MOD63(a) a %= BASE Chris@43: #endif Chris@43: Chris@43: /* ========================================================================= */ Chris@43: uLong ZEXPORT adler32(adler, buf, len) Chris@43: uLong adler; Chris@43: const Bytef *buf; Chris@43: uInt len; Chris@43: { Chris@43: unsigned long sum2; Chris@43: unsigned n; Chris@43: Chris@43: /* split Adler-32 into component sums */ Chris@43: sum2 = (adler >> 16) & 0xffff; Chris@43: adler &= 0xffff; Chris@43: Chris@43: /* in case user likes doing a byte at a time, keep it fast */ Chris@43: if (len == 1) { Chris@43: adler += buf[0]; Chris@43: if (adler >= BASE) Chris@43: adler -= BASE; Chris@43: sum2 += adler; Chris@43: if (sum2 >= BASE) Chris@43: sum2 -= BASE; Chris@43: return adler | (sum2 << 16); Chris@43: } Chris@43: Chris@43: /* initial Adler-32 value (deferred check for len == 1 speed) */ Chris@43: if (buf == Z_NULL) Chris@43: return 1L; Chris@43: Chris@43: /* in case short lengths are provided, keep it somewhat fast */ Chris@43: if (len < 16) { Chris@43: while (len--) { Chris@43: adler += *buf++; Chris@43: sum2 += adler; Chris@43: } Chris@43: if (adler >= BASE) Chris@43: adler -= BASE; Chris@43: MOD28(sum2); /* only added so many BASE's */ Chris@43: return adler | (sum2 << 16); Chris@43: } Chris@43: Chris@43: /* do length NMAX blocks -- requires just one modulo operation */ Chris@43: while (len >= NMAX) { Chris@43: len -= NMAX; Chris@43: n = NMAX / 16; /* NMAX is divisible by 16 */ Chris@43: do { Chris@43: DO16(buf); /* 16 sums unrolled */ Chris@43: buf += 16; Chris@43: } while (--n); Chris@43: MOD(adler); Chris@43: MOD(sum2); Chris@43: } Chris@43: Chris@43: /* do remaining bytes (less than NMAX, still just one modulo) */ Chris@43: if (len) { /* avoid modulos if none remaining */ Chris@43: while (len >= 16) { Chris@43: len -= 16; Chris@43: DO16(buf); Chris@43: buf += 16; Chris@43: } Chris@43: while (len--) { Chris@43: adler += *buf++; Chris@43: sum2 += adler; Chris@43: } Chris@43: MOD(adler); Chris@43: MOD(sum2); Chris@43: } Chris@43: Chris@43: /* return recombined sums */ Chris@43: return adler | (sum2 << 16); Chris@43: } Chris@43: Chris@43: /* ========================================================================= */ Chris@43: local uLong adler32_combine_(adler1, adler2, len2) Chris@43: uLong adler1; Chris@43: uLong adler2; Chris@43: z_off64_t len2; Chris@43: { Chris@43: unsigned long sum1; Chris@43: unsigned long sum2; Chris@43: unsigned rem; Chris@43: Chris@43: /* for negative len, return invalid adler32 as a clue for debugging */ Chris@43: if (len2 < 0) Chris@43: return 0xffffffffUL; Chris@43: Chris@43: /* the derivation of this formula is left as an exercise for the reader */ Chris@43: MOD63(len2); /* assumes len2 >= 0 */ Chris@43: rem = (unsigned)len2; Chris@43: sum1 = adler1 & 0xffff; Chris@43: sum2 = rem * sum1; Chris@43: MOD(sum2); Chris@43: sum1 += (adler2 & 0xffff) + BASE - 1; Chris@43: sum2 += ((adler1 >> 16) & 0xffff) + ((adler2 >> 16) & 0xffff) + BASE - rem; Chris@43: if (sum1 >= BASE) sum1 -= BASE; Chris@43: if (sum1 >= BASE) sum1 -= BASE; Chris@43: if (sum2 >= (BASE << 1)) sum2 -= (BASE << 1); Chris@43: if (sum2 >= BASE) sum2 -= BASE; Chris@43: return sum1 | (sum2 << 16); Chris@43: } Chris@43: Chris@43: /* ========================================================================= */ Chris@43: uLong ZEXPORT adler32_combine(adler1, adler2, len2) Chris@43: uLong adler1; Chris@43: uLong adler2; Chris@43: z_off_t len2; Chris@43: { Chris@43: return adler32_combine_(adler1, adler2, len2); Chris@43: } Chris@43: Chris@43: uLong ZEXPORT adler32_combine64(adler1, adler2, len2) Chris@43: uLong adler1; Chris@43: uLong adler2; Chris@43: z_off64_t len2; Chris@43: { Chris@43: return adler32_combine_(adler1, adler2, len2); Chris@43: }