/* adler32.c -- compute the Adler-32 checksum of a data stream
 * Copyright (C) 1995-2011 Mark Adler
 * For conditions of distribution and use, see copyright notice in zlib.h
 */
5*2d60b848STomohiro Kusumi
6*2d60b848STomohiro Kusumi /* @(#) $Id$ */
7*2d60b848STomohiro Kusumi
8*2d60b848STomohiro Kusumi #include "hammer2_zlib_zutil.h"
9*2d60b848STomohiro Kusumi
/* `local` marks file-private (static) functions. */
#define local static

/*
 * BASE is the Adler-32 modulus.  It is spelled as an unsigned constant so
 * that comparisons and arithmetic against the unsigned running sums never
 * mix in a signed operand.
 */
#define BASE 65521U     /* largest prime smaller than 65536 */
#define NMAX 5552
/* NMAX is the largest n such that 255n(n+1)/2 + (n+1)(BASE-1) <= 2^32-1 */
17*2d60b848STomohiro Kusumi
/*
 * Unrolled accumulation steps.  Each macro reads bytes from `buf` starting at
 * index `i` and updates the variables `adler` and `sum2`, which must exist in
 * the scope where the macro is expanded.  DO16 consumes buf[0..15]; the
 * caller advances `buf` itself.
 *
 * The index argument is parenthesized before an offset is added, and every
 * macro expands to a single statement, so they are safe with arbitrary index
 * expressions and inside unbraced if/else bodies.
 */
#define DO1(buf,i)  do { adler += (buf)[i]; sum2 += adler; } while (0)
#define DO2(buf,i)  do { DO1(buf,i); DO1(buf,(i)+1); } while (0)
#define DO4(buf,i)  do { DO2(buf,i); DO2(buf,(i)+2); } while (0)
#define DO8(buf,i)  do { DO4(buf,i); DO4(buf,(i)+4); } while (0)
#define DO16(buf)   do { DO8(buf,0); DO8(buf,8); } while (0)
23*2d60b848STomohiro Kusumi
/* use NO_DIVIDE if your processor does not do division in hardware --
   try it both ways to see which is faster */
/*
 * Each macro below reduces the lvalue `a` in place and expands to a single
 * statement (use it as `MOD(x);`).  The argument is parenthesized at every
 * use.  BASE is expected to be defined before these macros are expanded.
 *
 *   MOD(a)   - reduce a 32-bit value modulo BASE
 *   MOD28(a) - same, for values known to be below 2^28 (one fold is enough)
 *   MOD63(a) - same, for a non-negative 64-bit value
 */
#ifdef NO_DIVIDE
/* note that this assumes BASE is 65521, where 65536 % 65521 == 15
   (thank you to John Reiser for pointing this out) */
/* CHOP folds the high 16 bits down: a = (a & 0xffff) + 15 * (a >> 16) */
#  define CHOP(a) \
    do { \
        unsigned long tmp = (a) >> 16; \
        (a) &= 0xffffUL; \
        (a) += (tmp << 4) - tmp; \
    } while (0)
#  define MOD28(a) \
    do { \
        CHOP(a); \
        if ((a) >= BASE) (a) -= BASE; \
    } while (0)
#  define MOD(a) \
    do { \
        CHOP(a); \
        MOD28(a); \
    } while (0)
/* first fold uses 2^32 % BASE == 225 == 256 - 32 + 1, then two 16-bit folds */
#  define MOD63(a) \
    do { /* this assumes a is not negative */ \
        z_off64_t tmp = (a) >> 32; \
        (a) &= 0xffffffffL; \
        (a) += (tmp << 8) - (tmp << 5) + tmp; \
        tmp = (a) >> 16; \
        (a) &= 0xffffL; \
        (a) += (tmp << 4) - tmp; \
        tmp = (a) >> 16; \
        (a) &= 0xffffL; \
        (a) += (tmp << 4) - tmp; \
        if ((a) >= BASE) (a) -= BASE; \
    } while (0)
#else
#  define MOD(a)   do { (a) %= BASE; } while (0)
#  define MOD28(a) do { (a) %= BASE; } while (0)
#  define MOD63(a) do { (a) %= BASE; } while (0)
#endif
63*2d60b848STomohiro Kusumi
64*2d60b848STomohiro Kusumi local uLong adler32_combine_(uLong adler1, uLong adler2, z_off64_t len2);
65*2d60b848STomohiro Kusumi uLong adler32_combine(uLong adler1, uLong adler2, z_off_t len2);
66*2d60b848STomohiro Kusumi
67*2d60b848STomohiro Kusumi /* ========================================================================= */
68*2d60b848STomohiro Kusumi uLong
adler32(uLong adler,const Bytef * buf,uInt len)69*2d60b848STomohiro Kusumi adler32(uLong adler, const Bytef *buf, uInt len)
70*2d60b848STomohiro Kusumi {
71*2d60b848STomohiro Kusumi unsigned long sum2;
72*2d60b848STomohiro Kusumi unsigned n;
73*2d60b848STomohiro Kusumi
74*2d60b848STomohiro Kusumi /* split Adler-32 into component sums */
75*2d60b848STomohiro Kusumi sum2 = (adler >> 16) & 0xffff;
76*2d60b848STomohiro Kusumi adler &= 0xffff;
77*2d60b848STomohiro Kusumi
78*2d60b848STomohiro Kusumi /* in case user likes doing a byte at a time, keep it fast */
79*2d60b848STomohiro Kusumi if (len == 1) {
80*2d60b848STomohiro Kusumi adler += buf[0];
81*2d60b848STomohiro Kusumi if (adler >= BASE)
82*2d60b848STomohiro Kusumi adler -= BASE;
83*2d60b848STomohiro Kusumi sum2 += adler;
84*2d60b848STomohiro Kusumi if (sum2 >= BASE)
85*2d60b848STomohiro Kusumi sum2 -= BASE;
86*2d60b848STomohiro Kusumi return adler | (sum2 << 16);
87*2d60b848STomohiro Kusumi }
88*2d60b848STomohiro Kusumi
89*2d60b848STomohiro Kusumi /* initial Adler-32 value (deferred check for len == 1 speed) */
90*2d60b848STomohiro Kusumi if (buf == Z_NULL)
91*2d60b848STomohiro Kusumi return 1L;
92*2d60b848STomohiro Kusumi
93*2d60b848STomohiro Kusumi /* in case short lengths are provided, keep it somewhat fast */
94*2d60b848STomohiro Kusumi if (len < 16) {
95*2d60b848STomohiro Kusumi while (len--) {
96*2d60b848STomohiro Kusumi adler += *buf++;
97*2d60b848STomohiro Kusumi sum2 += adler;
98*2d60b848STomohiro Kusumi }
99*2d60b848STomohiro Kusumi if (adler >= BASE)
100*2d60b848STomohiro Kusumi adler -= BASE;
101*2d60b848STomohiro Kusumi MOD28(sum2); /* only added so many BASE's */
102*2d60b848STomohiro Kusumi return adler | (sum2 << 16);
103*2d60b848STomohiro Kusumi }
104*2d60b848STomohiro Kusumi
105*2d60b848STomohiro Kusumi /* do length NMAX blocks -- requires just one modulo operation */
106*2d60b848STomohiro Kusumi while (len >= NMAX) {
107*2d60b848STomohiro Kusumi len -= NMAX;
108*2d60b848STomohiro Kusumi n = NMAX / 16; /* NMAX is divisible by 16 */
109*2d60b848STomohiro Kusumi do {
110*2d60b848STomohiro Kusumi DO16(buf); /* 16 sums unrolled */
111*2d60b848STomohiro Kusumi buf += 16;
112*2d60b848STomohiro Kusumi } while (--n);
113*2d60b848STomohiro Kusumi MOD(adler);
114*2d60b848STomohiro Kusumi MOD(sum2);
115*2d60b848STomohiro Kusumi }
116*2d60b848STomohiro Kusumi
117*2d60b848STomohiro Kusumi /* do remaining bytes (less than NMAX, still just one modulo) */
118*2d60b848STomohiro Kusumi if (len) { /* avoid modulos if none remaining */
119*2d60b848STomohiro Kusumi while (len >= 16) {
120*2d60b848STomohiro Kusumi len -= 16;
121*2d60b848STomohiro Kusumi DO16(buf);
122*2d60b848STomohiro Kusumi buf += 16;
123*2d60b848STomohiro Kusumi }
124*2d60b848STomohiro Kusumi while (len--) {
125*2d60b848STomohiro Kusumi adler += *buf++;
126*2d60b848STomohiro Kusumi sum2 += adler;
127*2d60b848STomohiro Kusumi }
128*2d60b848STomohiro Kusumi MOD(adler);
129*2d60b848STomohiro Kusumi MOD(sum2);
130*2d60b848STomohiro Kusumi }
131*2d60b848STomohiro Kusumi
132*2d60b848STomohiro Kusumi /* return recombined sums */
133*2d60b848STomohiro Kusumi return adler | (sum2 << 16);
134*2d60b848STomohiro Kusumi }
135*2d60b848STomohiro Kusumi
136*2d60b848STomohiro Kusumi /* ========================================================================= */
137*2d60b848STomohiro Kusumi local
138*2d60b848STomohiro Kusumi uLong
adler32_combine_(uLong adler1,uLong adler2,z_off64_t len2)139*2d60b848STomohiro Kusumi adler32_combine_(uLong adler1, uLong adler2, z_off64_t len2)
140*2d60b848STomohiro Kusumi {
141*2d60b848STomohiro Kusumi unsigned long sum1;
142*2d60b848STomohiro Kusumi unsigned long sum2;
143*2d60b848STomohiro Kusumi unsigned rem;
144*2d60b848STomohiro Kusumi
145*2d60b848STomohiro Kusumi /* for negative len, return invalid adler32 as a clue for debugging */
146*2d60b848STomohiro Kusumi if (len2 < 0)
147*2d60b848STomohiro Kusumi return 0xffffffffUL;
148*2d60b848STomohiro Kusumi
149*2d60b848STomohiro Kusumi /* the derivation of this formula is left as an exercise for the reader */
150*2d60b848STomohiro Kusumi MOD63(len2); /* assumes len2 >= 0 */
151*2d60b848STomohiro Kusumi rem = (unsigned)len2;
152*2d60b848STomohiro Kusumi sum1 = adler1 & 0xffff;
153*2d60b848STomohiro Kusumi sum2 = rem * sum1;
154*2d60b848STomohiro Kusumi MOD(sum2);
155*2d60b848STomohiro Kusumi sum1 += (adler2 & 0xffff) + BASE - 1;
156*2d60b848STomohiro Kusumi sum2 += ((adler1 >> 16) & 0xffff) + ((adler2 >> 16) & 0xffff) + BASE - rem;
157*2d60b848STomohiro Kusumi if (sum1 >= BASE) sum1 -= BASE;
158*2d60b848STomohiro Kusumi if (sum1 >= BASE) sum1 -= BASE;
159*2d60b848STomohiro Kusumi if (sum2 >= (BASE << 1)) sum2 -= (BASE << 1);
160*2d60b848STomohiro Kusumi if (sum2 >= BASE) sum2 -= BASE;
161*2d60b848STomohiro Kusumi return sum1 | (sum2 << 16);
162*2d60b848STomohiro Kusumi }
163*2d60b848STomohiro Kusumi
164*2d60b848STomohiro Kusumi /* ========================================================================= */
165*2d60b848STomohiro Kusumi uLong
adler32_combine(uLong adler1,uLong adler2,z_off_t len2)166*2d60b848STomohiro Kusumi adler32_combine(uLong adler1, uLong adler2, z_off_t len2)
167*2d60b848STomohiro Kusumi {
168*2d60b848STomohiro Kusumi return adler32_combine_(adler1, adler2, len2);
169*2d60b848STomohiro Kusumi }
170*2d60b848STomohiro Kusumi
171*2d60b848STomohiro Kusumi uLong
adler32_combine64(uLong adler1,uLong adler2,z_off64_t len2)172*2d60b848STomohiro Kusumi adler32_combine64(uLong adler1, uLong adler2, z_off64_t len2)
173*2d60b848STomohiro Kusumi {
174*2d60b848STomohiro Kusumi return adler32_combine_(adler1, adler2, len2);
175*2d60b848STomohiro Kusumi }
176