/* xref: /aosp_15_r20/external/zlib/adler32.c (revision 86ee64e75fa5f8bce2c8c356138035642429cd05) */
/* adler32.c -- compute the Adler-32 checksum of a data stream
 * Copyright (C) 1995-2011, 2016 Mark Adler
 * For conditions of distribution and use, see copyright notice in zlib.h
 */

/* @(#) $Id$ */

8*86ee64e7SAndroid Build Coastguard Worker #include "zutil.h"
9*86ee64e7SAndroid Build Coastguard Worker 
#define BASE 65521U     /* largest prime smaller than 65536 */
#define NMAX 5552
/* NMAX is the largest n such that 255n(n+1)/2 + (n+1)(BASE-1) <= 2^32-1 */

/*
 * Unrolled accumulation steps.  Each DOn(buf,i) folds n consecutive bytes,
 * starting at buf[i], into the variables `adler` and `sum2`, which must be
 * in scope at the point of use: `adler` gains the byte and `sum2` gains the
 * updated `adler`.  No modulo reduction is performed here.
 *
 * Every macro is wrapped in do { } while (0) so that it expands to exactly
 * one statement; `if (cond) DO16(buf); else ...` therefore parses as
 * expected.  The index argument is parenthesized so that an expression may
 * be passed safely.
 */
#define DO1(buf,i)  do { adler += (buf)[(i)]; sum2 += adler; } while (0)
#define DO2(buf,i)  do { DO1(buf,(i)); DO1(buf,(i)+1); } while (0)
#define DO4(buf,i)  do { DO2(buf,(i)); DO2(buf,(i)+2); } while (0)
#define DO8(buf,i)  do { DO4(buf,(i)); DO4(buf,(i)+4); } while (0)
#define DO16(buf)   do { DO8(buf,0); DO8(buf,8); } while (0)
19*86ee64e7SAndroid Build Coastguard Worker 
/* Define NO_DIVIDE if your processor does not do division in hardware --
   try it both ways to see which is faster. */
#ifdef NO_DIVIDE
/* The reductions below assume BASE is 65521, where 65536 % 65521 == 15
   (thank you to John Reiser for pointing this out). */

/* One folding step: replace a by (a mod 2^16) + 15 * (a div 2^16), which is
   congruent to a modulo BASE.  The result is not fully reduced. */
#  define CHOP(a) \
    do { \
        unsigned long chop_hi_ = (a) >> 16; \
        (a) &= 0xffffUL; \
        (a) += (chop_hi_ << 4) - chop_hi_; \
    } while (0)

/* One folding step followed by a single conditional subtraction of BASE. */
#  define MOD28(a) \
    do { \
        CHOP(a); \
        if ((a) >= BASE) \
            (a) -= BASE; \
    } while (0)

/* Two folding steps followed by a single conditional subtraction of BASE. */
#  define MOD(a) \
    do { \
        CHOP(a); \
        MOD28(a); \
    } while (0)

/* Reduction for a z_off64_t value; this assumes a is not negative.  The top
   32 bits are folded first using 2^32 % BASE == 225 (256 - 32 + 1), then two
   16-bit folding steps and one conditional subtraction follow. */
#  define MOD63(a) \
    do { \
        z_off64_t fold_hi_ = (a) >> 32; \
        (a) &= 0xffffffffL; \
        (a) += (fold_hi_ << 8) - (fold_hi_ << 5) + fold_hi_; \
        fold_hi_ = (a) >> 16; \
        (a) &= 0xffffL; \
        (a) += (fold_hi_ << 4) - fold_hi_; \
        fold_hi_ = (a) >> 16; \
        (a) &= 0xffffL; \
        (a) += (fold_hi_ << 4) - fold_hi_; \
        if ((a) >= BASE) \
            (a) -= BASE; \
    } while (0)
#else
/* Hardware division is available: every variant is a plain remainder. */
#  define MOD(a)   ((a) %= BASE)
#  define MOD28(a) ((a) %= BASE)
#  define MOD63(a) ((a) %= BASE)
#endif
59*86ee64e7SAndroid Build Coastguard Worker 
60*86ee64e7SAndroid Build Coastguard Worker #include "cpu_features.h"
61*86ee64e7SAndroid Build Coastguard Worker #if defined(ADLER32_SIMD_SSSE3) || defined(ADLER32_SIMD_NEON) || defined(ADLER32_SIMD_RVV)
62*86ee64e7SAndroid Build Coastguard Worker #include "adler32_simd.h"
63*86ee64e7SAndroid Build Coastguard Worker #endif
64*86ee64e7SAndroid Build Coastguard Worker 
65*86ee64e7SAndroid Build Coastguard Worker /* ========================================================================= */
adler32_z(uLong adler,const Bytef * buf,z_size_t len)66*86ee64e7SAndroid Build Coastguard Worker uLong ZEXPORT adler32_z(uLong adler, const Bytef *buf, z_size_t len) {
67*86ee64e7SAndroid Build Coastguard Worker     unsigned long sum2;
68*86ee64e7SAndroid Build Coastguard Worker     unsigned n;
69*86ee64e7SAndroid Build Coastguard Worker     /* TODO(cavalcantii): verify if this lengths are optimal for current CPUs. */
70*86ee64e7SAndroid Build Coastguard Worker #if defined(ADLER32_SIMD_SSSE3) || defined(ADLER32_SIMD_NEON) \
71*86ee64e7SAndroid Build Coastguard Worker     || defined(ADLER32_SIMD_RVV)
72*86ee64e7SAndroid Build Coastguard Worker #if defined(ADLER32_SIMD_SSSE3)
73*86ee64e7SAndroid Build Coastguard Worker     if (buf != Z_NULL && len >= 64 && x86_cpu_enable_ssse3)
74*86ee64e7SAndroid Build Coastguard Worker #elif defined(ADLER32_SIMD_NEON)
75*86ee64e7SAndroid Build Coastguard Worker     if (buf != Z_NULL && len >= 64)
76*86ee64e7SAndroid Build Coastguard Worker #elif defined(ADLER32_SIMD_RVV)
77*86ee64e7SAndroid Build Coastguard Worker     if (buf != Z_NULL && len >= 32 && riscv_cpu_enable_rvv)
78*86ee64e7SAndroid Build Coastguard Worker #endif
79*86ee64e7SAndroid Build Coastguard Worker         return adler32_simd_(adler, buf, len);
80*86ee64e7SAndroid Build Coastguard Worker #endif
81*86ee64e7SAndroid Build Coastguard Worker 
82*86ee64e7SAndroid Build Coastguard Worker     /* split Adler-32 into component sums */
83*86ee64e7SAndroid Build Coastguard Worker     sum2 = (adler >> 16) & 0xffff;
84*86ee64e7SAndroid Build Coastguard Worker     adler &= 0xffff;
85*86ee64e7SAndroid Build Coastguard Worker 
86*86ee64e7SAndroid Build Coastguard Worker     /* in case user likes doing a byte at a time, keep it fast */
87*86ee64e7SAndroid Build Coastguard Worker     if (len == 1) {
88*86ee64e7SAndroid Build Coastguard Worker         adler += buf[0];
89*86ee64e7SAndroid Build Coastguard Worker         if (adler >= BASE)
90*86ee64e7SAndroid Build Coastguard Worker             adler -= BASE;
91*86ee64e7SAndroid Build Coastguard Worker         sum2 += adler;
92*86ee64e7SAndroid Build Coastguard Worker         if (sum2 >= BASE)
93*86ee64e7SAndroid Build Coastguard Worker             sum2 -= BASE;
94*86ee64e7SAndroid Build Coastguard Worker         return adler | (sum2 << 16);
95*86ee64e7SAndroid Build Coastguard Worker     }
96*86ee64e7SAndroid Build Coastguard Worker 
97*86ee64e7SAndroid Build Coastguard Worker #if defined(ADLER32_SIMD_SSSE3) || defined(ADLER32_SIMD_NEON) \
98*86ee64e7SAndroid Build Coastguard Worker     || defined(RISCV_RVV)
99*86ee64e7SAndroid Build Coastguard Worker     /*
100*86ee64e7SAndroid Build Coastguard Worker      * Use SIMD to compute the adler32. Since this function can be
101*86ee64e7SAndroid Build Coastguard Worker      * freely used, check CPU features here. zlib convention is to
102*86ee64e7SAndroid Build Coastguard Worker      * call adler32(0, NULL, 0), before making calls to adler32().
103*86ee64e7SAndroid Build Coastguard Worker      * So this is a good early (and infrequent) place to cache CPU
104*86ee64e7SAndroid Build Coastguard Worker      * features for those later, more interesting adler32() calls.
105*86ee64e7SAndroid Build Coastguard Worker      */
106*86ee64e7SAndroid Build Coastguard Worker     if (buf == Z_NULL) {
107*86ee64e7SAndroid Build Coastguard Worker         if (!len) /* Assume user is calling adler32(0, NULL, 0); */
108*86ee64e7SAndroid Build Coastguard Worker             cpu_check_features();
109*86ee64e7SAndroid Build Coastguard Worker         return 1L;
110*86ee64e7SAndroid Build Coastguard Worker     }
111*86ee64e7SAndroid Build Coastguard Worker #else
112*86ee64e7SAndroid Build Coastguard Worker     /* initial Adler-32 value (deferred check for len == 1 speed) */
113*86ee64e7SAndroid Build Coastguard Worker     if (buf == Z_NULL)
114*86ee64e7SAndroid Build Coastguard Worker         return 1L;
115*86ee64e7SAndroid Build Coastguard Worker #endif
116*86ee64e7SAndroid Build Coastguard Worker 
117*86ee64e7SAndroid Build Coastguard Worker     /* in case short lengths are provided, keep it somewhat fast */
118*86ee64e7SAndroid Build Coastguard Worker     if (len < 16) {
119*86ee64e7SAndroid Build Coastguard Worker         while (len--) {
120*86ee64e7SAndroid Build Coastguard Worker             adler += *buf++;
121*86ee64e7SAndroid Build Coastguard Worker             sum2 += adler;
122*86ee64e7SAndroid Build Coastguard Worker         }
123*86ee64e7SAndroid Build Coastguard Worker         if (adler >= BASE)
124*86ee64e7SAndroid Build Coastguard Worker             adler -= BASE;
125*86ee64e7SAndroid Build Coastguard Worker         MOD28(sum2);            /* only added so many BASE's */
126*86ee64e7SAndroid Build Coastguard Worker         return adler | (sum2 << 16);
127*86ee64e7SAndroid Build Coastguard Worker     }
128*86ee64e7SAndroid Build Coastguard Worker 
129*86ee64e7SAndroid Build Coastguard Worker     /* do length NMAX blocks -- requires just one modulo operation */
130*86ee64e7SAndroid Build Coastguard Worker     while (len >= NMAX) {
131*86ee64e7SAndroid Build Coastguard Worker         len -= NMAX;
132*86ee64e7SAndroid Build Coastguard Worker         n = NMAX / 16;          /* NMAX is divisible by 16 */
133*86ee64e7SAndroid Build Coastguard Worker         do {
134*86ee64e7SAndroid Build Coastguard Worker             DO16(buf);          /* 16 sums unrolled */
135*86ee64e7SAndroid Build Coastguard Worker             buf += 16;
136*86ee64e7SAndroid Build Coastguard Worker         } while (--n);
137*86ee64e7SAndroid Build Coastguard Worker         MOD(adler);
138*86ee64e7SAndroid Build Coastguard Worker         MOD(sum2);
139*86ee64e7SAndroid Build Coastguard Worker     }
140*86ee64e7SAndroid Build Coastguard Worker 
141*86ee64e7SAndroid Build Coastguard Worker     /* do remaining bytes (less than NMAX, still just one modulo) */
142*86ee64e7SAndroid Build Coastguard Worker     if (len) {                  /* avoid modulos if none remaining */
143*86ee64e7SAndroid Build Coastguard Worker         while (len >= 16) {
144*86ee64e7SAndroid Build Coastguard Worker             len -= 16;
145*86ee64e7SAndroid Build Coastguard Worker             DO16(buf);
146*86ee64e7SAndroid Build Coastguard Worker             buf += 16;
147*86ee64e7SAndroid Build Coastguard Worker         }
148*86ee64e7SAndroid Build Coastguard Worker         while (len--) {
149*86ee64e7SAndroid Build Coastguard Worker             adler += *buf++;
150*86ee64e7SAndroid Build Coastguard Worker             sum2 += adler;
151*86ee64e7SAndroid Build Coastguard Worker         }
152*86ee64e7SAndroid Build Coastguard Worker         MOD(adler);
153*86ee64e7SAndroid Build Coastguard Worker         MOD(sum2);
154*86ee64e7SAndroid Build Coastguard Worker     }
155*86ee64e7SAndroid Build Coastguard Worker 
156*86ee64e7SAndroid Build Coastguard Worker     /* return recombined sums */
157*86ee64e7SAndroid Build Coastguard Worker     return adler | (sum2 << 16);
158*86ee64e7SAndroid Build Coastguard Worker }
159*86ee64e7SAndroid Build Coastguard Worker 
160*86ee64e7SAndroid Build Coastguard Worker /* ========================================================================= */
adler32(uLong adler,const Bytef * buf,uInt len)161*86ee64e7SAndroid Build Coastguard Worker uLong ZEXPORT adler32(uLong adler, const Bytef *buf, uInt len) {
162*86ee64e7SAndroid Build Coastguard Worker     return adler32_z(adler, buf, len);
163*86ee64e7SAndroid Build Coastguard Worker }
164*86ee64e7SAndroid Build Coastguard Worker 
165*86ee64e7SAndroid Build Coastguard Worker /* ========================================================================= */
adler32_combine_(uLong adler1,uLong adler2,z_off64_t len2)166*86ee64e7SAndroid Build Coastguard Worker local uLong adler32_combine_(uLong adler1, uLong adler2, z_off64_t len2) {
167*86ee64e7SAndroid Build Coastguard Worker     unsigned long sum1;
168*86ee64e7SAndroid Build Coastguard Worker     unsigned long sum2;
169*86ee64e7SAndroid Build Coastguard Worker     unsigned rem;
170*86ee64e7SAndroid Build Coastguard Worker 
171*86ee64e7SAndroid Build Coastguard Worker     /* for negative len, return invalid adler32 as a clue for debugging */
172*86ee64e7SAndroid Build Coastguard Worker     if (len2 < 0)
173*86ee64e7SAndroid Build Coastguard Worker         return 0xffffffffUL;
174*86ee64e7SAndroid Build Coastguard Worker 
175*86ee64e7SAndroid Build Coastguard Worker     /* the derivation of this formula is left as an exercise for the reader */
176*86ee64e7SAndroid Build Coastguard Worker     MOD63(len2);                /* assumes len2 >= 0 */
177*86ee64e7SAndroid Build Coastguard Worker     rem = (unsigned)len2;
178*86ee64e7SAndroid Build Coastguard Worker     sum1 = adler1 & 0xffff;
179*86ee64e7SAndroid Build Coastguard Worker     sum2 = rem * sum1;
180*86ee64e7SAndroid Build Coastguard Worker     MOD(sum2);
181*86ee64e7SAndroid Build Coastguard Worker     sum1 += (adler2 & 0xffff) + BASE - 1;
182*86ee64e7SAndroid Build Coastguard Worker     sum2 += ((adler1 >> 16) & 0xffff) + ((adler2 >> 16) & 0xffff) + BASE - rem;
183*86ee64e7SAndroid Build Coastguard Worker     if (sum1 >= BASE) sum1 -= BASE;
184*86ee64e7SAndroid Build Coastguard Worker     if (sum1 >= BASE) sum1 -= BASE;
185*86ee64e7SAndroid Build Coastguard Worker     if (sum2 >= ((unsigned long)BASE << 1)) sum2 -= ((unsigned long)BASE << 1);
186*86ee64e7SAndroid Build Coastguard Worker     if (sum2 >= BASE) sum2 -= BASE;
187*86ee64e7SAndroid Build Coastguard Worker     return sum1 | (sum2 << 16);
188*86ee64e7SAndroid Build Coastguard Worker }
189*86ee64e7SAndroid Build Coastguard Worker 
190*86ee64e7SAndroid Build Coastguard Worker /* ========================================================================= */
adler32_combine(uLong adler1,uLong adler2,z_off_t len2)191*86ee64e7SAndroid Build Coastguard Worker uLong ZEXPORT adler32_combine(uLong adler1, uLong adler2, z_off_t len2) {
192*86ee64e7SAndroid Build Coastguard Worker     return adler32_combine_(adler1, adler2, len2);
193*86ee64e7SAndroid Build Coastguard Worker }
194*86ee64e7SAndroid Build Coastguard Worker 
adler32_combine64(uLong adler1,uLong adler2,z_off64_t len2)195*86ee64e7SAndroid Build Coastguard Worker uLong ZEXPORT adler32_combine64(uLong adler1, uLong adler2, z_off64_t len2) {
196*86ee64e7SAndroid Build Coastguard Worker     return adler32_combine_(adler1, adler2, len2);
197*86ee64e7SAndroid Build Coastguard Worker }
198