1221b1638SMasahiro Yamada /* adler32.c -- compute the Adler-32 checksum of a data stream
2221b1638SMasahiro Yamada * Copyright (C) 1995-2011, 2016 Mark Adler
3221b1638SMasahiro Yamada * For conditions of distribution and use, see copyright notice in zlib.h
4221b1638SMasahiro Yamada */
5221b1638SMasahiro Yamada
6221b1638SMasahiro Yamada /* @(#) $Id$ */
7221b1638SMasahiro Yamada
8221b1638SMasahiro Yamada #include "zutil.h"
9221b1638SMasahiro Yamada
#define BASE 65521U     /* largest prime smaller than 65536 */
#define NMAX 5552
/* NMAX is the largest n such that 255n(n+1)/2 + (n+1)(BASE-1) <= 2^32-1 */

/*
 * Unrolled accumulation steps.  These macros deliberately read and write two
 * variables named `adler` and `sum2` that must exist in the calling scope:
 * DO1 adds byte (buf)[i] to adler, then adds the new adler to sum2.  DOn
 * performs n consecutive DO1 steps starting at index i; DO16 starts at 0.
 *
 * Each macro is a single do { } while (0) statement so that it stays correct
 * under an unbraced if/else and always takes exactly one trailing semicolon.
 */
#define DO1(buf,i)  do { adler += (buf)[(i)]; sum2 += adler; } while (0)
#define DO2(buf,i)  do { DO1(buf, (i)); DO1(buf, (i) + 1); } while (0)
#define DO4(buf,i)  do { DO2(buf, (i)); DO2(buf, (i) + 2); } while (0)
#define DO8(buf,i)  do { DO4(buf, (i)); DO4(buf, (i) + 4); } while (0)
#define DO16(buf)   do { DO8(buf, 0); DO8(buf, 8); } while (0)

/* use NO_DIVIDE if your processor does not do division in hardware --
   try it both ways to see which is faster */
#ifdef NO_DIVIDE
/* note that this assumes BASE is 65521, where 65536 % 65521 == 15
   (thank you to John Reiser for pointing this out) */

/* CHOP: fold the bits above bit 15 back in as 15 * (a >> 16); the result is
   congruent to a modulo BASE but is not necessarily below BASE yet */
#  define CHOP(a) \
    do { \
        unsigned long tmp = (a) >> 16; \
        (a) &= 0xffffUL; \
        (a) += (tmp << 4) - tmp; \
    } while (0)

/* MOD28: one fold followed by at most one subtraction of BASE */
#  define MOD28(a) \
    do { \
        CHOP(a); \
        if ((a) >= BASE) (a) -= BASE; \
    } while (0)

/* MOD: two folds followed by at most one subtraction of BASE */
#  define MOD(a) \
    do { \
        CHOP(a); \
        MOD28(a); \
    } while (0)

/* MOD63: first fold the bits above bit 31 using the multiplier
   (1 << 8) - (1 << 5) + 1 == 225 == 15 * 15, then fold twice with 15 */
#  define MOD63(a) \
    do { /* this assumes a is not negative */ \
        z_off64_t tmp = (a) >> 32; \
        (a) &= 0xffffffffL; \
        (a) += (tmp << 8) - (tmp << 5) + tmp; \
        tmp = (a) >> 16; \
        (a) &= 0xffffL; \
        (a) += (tmp << 4) - tmp; \
        tmp = (a) >> 16; \
        (a) &= 0xffffL; \
        (a) += (tmp << 4) - tmp; \
        if ((a) >= BASE) (a) -= BASE; \
    } while (0)
#else
/* with hardware division all three reductions are a plain remainder */
#  define MOD(a)   ((a) %= BASE)
#  define MOD28(a) ((a) %= BASE)
#  define MOD63(a) ((a) %= BASE)
#endif
59221b1638SMasahiro Yamada
60221b1638SMasahiro Yamada /* ========================================================================= */
adler32_z(uLong adler,const Bytef * buf,z_size_t len)61*fd39217aSManish Pandey uLong ZEXPORT adler32_z(uLong adler, const Bytef *buf, z_size_t len) {
62221b1638SMasahiro Yamada unsigned long sum2;
63221b1638SMasahiro Yamada unsigned n;
64221b1638SMasahiro Yamada
65221b1638SMasahiro Yamada /* split Adler-32 into component sums */
66221b1638SMasahiro Yamada sum2 = (adler >> 16) & 0xffff;
67221b1638SMasahiro Yamada adler &= 0xffff;
68221b1638SMasahiro Yamada
69221b1638SMasahiro Yamada /* in case user likes doing a byte at a time, keep it fast */
70221b1638SMasahiro Yamada if (len == 1) {
71221b1638SMasahiro Yamada adler += buf[0];
72221b1638SMasahiro Yamada if (adler >= BASE)
73221b1638SMasahiro Yamada adler -= BASE;
74221b1638SMasahiro Yamada sum2 += adler;
75221b1638SMasahiro Yamada if (sum2 >= BASE)
76221b1638SMasahiro Yamada sum2 -= BASE;
77221b1638SMasahiro Yamada return adler | (sum2 << 16);
78221b1638SMasahiro Yamada }
79221b1638SMasahiro Yamada
80221b1638SMasahiro Yamada /* initial Adler-32 value (deferred check for len == 1 speed) */
81221b1638SMasahiro Yamada if (buf == Z_NULL)
82221b1638SMasahiro Yamada return 1L;
83221b1638SMasahiro Yamada
84221b1638SMasahiro Yamada /* in case short lengths are provided, keep it somewhat fast */
85221b1638SMasahiro Yamada if (len < 16) {
86221b1638SMasahiro Yamada while (len--) {
87221b1638SMasahiro Yamada adler += *buf++;
88221b1638SMasahiro Yamada sum2 += adler;
89221b1638SMasahiro Yamada }
90221b1638SMasahiro Yamada if (adler >= BASE)
91221b1638SMasahiro Yamada adler -= BASE;
92221b1638SMasahiro Yamada MOD28(sum2); /* only added so many BASE's */
93221b1638SMasahiro Yamada return adler | (sum2 << 16);
94221b1638SMasahiro Yamada }
95221b1638SMasahiro Yamada
96221b1638SMasahiro Yamada /* do length NMAX blocks -- requires just one modulo operation */
97221b1638SMasahiro Yamada while (len >= NMAX) {
98221b1638SMasahiro Yamada len -= NMAX;
99221b1638SMasahiro Yamada n = NMAX / 16; /* NMAX is divisible by 16 */
100221b1638SMasahiro Yamada do {
101221b1638SMasahiro Yamada DO16(buf); /* 16 sums unrolled */
102221b1638SMasahiro Yamada buf += 16;
103221b1638SMasahiro Yamada } while (--n);
104221b1638SMasahiro Yamada MOD(adler);
105221b1638SMasahiro Yamada MOD(sum2);
106221b1638SMasahiro Yamada }
107221b1638SMasahiro Yamada
108221b1638SMasahiro Yamada /* do remaining bytes (less than NMAX, still just one modulo) */
109221b1638SMasahiro Yamada if (len) { /* avoid modulos if none remaining */
110221b1638SMasahiro Yamada while (len >= 16) {
111221b1638SMasahiro Yamada len -= 16;
112221b1638SMasahiro Yamada DO16(buf);
113221b1638SMasahiro Yamada buf += 16;
114221b1638SMasahiro Yamada }
115221b1638SMasahiro Yamada while (len--) {
116221b1638SMasahiro Yamada adler += *buf++;
117221b1638SMasahiro Yamada sum2 += adler;
118221b1638SMasahiro Yamada }
119221b1638SMasahiro Yamada MOD(adler);
120221b1638SMasahiro Yamada MOD(sum2);
121221b1638SMasahiro Yamada }
122221b1638SMasahiro Yamada
123221b1638SMasahiro Yamada /* return recombined sums */
124221b1638SMasahiro Yamada return adler | (sum2 << 16);
125221b1638SMasahiro Yamada }
126221b1638SMasahiro Yamada
127221b1638SMasahiro Yamada /* ========================================================================= */
adler32(uLong adler,const Bytef * buf,uInt len)128*fd39217aSManish Pandey uLong ZEXPORT adler32(uLong adler, const Bytef *buf, uInt len) {
129221b1638SMasahiro Yamada return adler32_z(adler, buf, len);
130221b1638SMasahiro Yamada }
131221b1638SMasahiro Yamada
132221b1638SMasahiro Yamada /* ========================================================================= */
adler32_combine_(uLong adler1,uLong adler2,z_off64_t len2)133*fd39217aSManish Pandey local uLong adler32_combine_(uLong adler1, uLong adler2, z_off64_t len2) {
134221b1638SMasahiro Yamada unsigned long sum1;
135221b1638SMasahiro Yamada unsigned long sum2;
136221b1638SMasahiro Yamada unsigned rem;
137221b1638SMasahiro Yamada
138221b1638SMasahiro Yamada /* for negative len, return invalid adler32 as a clue for debugging */
139221b1638SMasahiro Yamada if (len2 < 0)
140221b1638SMasahiro Yamada return 0xffffffffUL;
141221b1638SMasahiro Yamada
142221b1638SMasahiro Yamada /* the derivation of this formula is left as an exercise for the reader */
143221b1638SMasahiro Yamada MOD63(len2); /* assumes len2 >= 0 */
144221b1638SMasahiro Yamada rem = (unsigned)len2;
145221b1638SMasahiro Yamada sum1 = adler1 & 0xffff;
146221b1638SMasahiro Yamada sum2 = rem * sum1;
147221b1638SMasahiro Yamada MOD(sum2);
148221b1638SMasahiro Yamada sum1 += (adler2 & 0xffff) + BASE - 1;
149221b1638SMasahiro Yamada sum2 += ((adler1 >> 16) & 0xffff) + ((adler2 >> 16) & 0xffff) + BASE - rem;
150221b1638SMasahiro Yamada if (sum1 >= BASE) sum1 -= BASE;
151221b1638SMasahiro Yamada if (sum1 >= BASE) sum1 -= BASE;
152221b1638SMasahiro Yamada if (sum2 >= ((unsigned long)BASE << 1)) sum2 -= ((unsigned long)BASE << 1);
153221b1638SMasahiro Yamada if (sum2 >= BASE) sum2 -= BASE;
154221b1638SMasahiro Yamada return sum1 | (sum2 << 16);
155221b1638SMasahiro Yamada }
156221b1638SMasahiro Yamada
157221b1638SMasahiro Yamada /* ========================================================================= */
adler32_combine(uLong adler1,uLong adler2,z_off_t len2)158*fd39217aSManish Pandey uLong ZEXPORT adler32_combine(uLong adler1, uLong adler2, z_off_t len2) {
159221b1638SMasahiro Yamada return adler32_combine_(adler1, adler2, len2);
160221b1638SMasahiro Yamada }
161221b1638SMasahiro Yamada
adler32_combine64(uLong adler1,uLong adler2,z_off64_t len2)162*fd39217aSManish Pandey uLong ZEXPORT adler32_combine64(uLong adler1, uLong adler2, z_off64_t len2) {
163221b1638SMasahiro Yamada return adler32_combine_(adler1, adler2, len2);
164221b1638SMasahiro Yamada }
165