]>
Commit | Line | Data |
---|---|---|
1 | /* crc32.c -- compute the CRC-32 of a data stream | |
2 | * Copyright (C) 1995-2005 Mark Adler | |
3 | * For conditions of distribution and use, see copyright notice in zlib.h | |
4 | * | |
5 | * Thanks to Rodney Brown <rbrown64@csc.com.au> for his contribution of faster | |
6 | * CRC methods: exclusive-oring 32 bits of data at a time, and pre-computing | |
7 | * tables for updating the shift register in one step with three exclusive-ors | |
8 | * instead of four steps with four exclusive-ors. This results in about a | |
9 | * factor of two increase in speed on a Power PC G4 (PPC7455) using gcc -O3. | |
10 | */ | |
11 | ||
12 | /* @(#) $Id$ */ | |
13 | ||
14 | /* | |
15 | Note on the use of DYNAMIC_CRC_TABLE: there is no mutex or semaphore | |
16 | protection on the static variables used to control the first-use generation | |
17 | of the crc tables. Therefore, if you #define DYNAMIC_CRC_TABLE, you should | |
18 | first call get_crc_table() to initialize the tables before allowing more than | |
19 | one thread to use crc32(). | |
20 | */ | |
21 | ||
22 | #ifdef MAKECRCH | |
23 | # include <stdio.h> | |
24 | # ifndef DYNAMIC_CRC_TABLE | |
25 | # define DYNAMIC_CRC_TABLE | |
26 | # endif /* !DYNAMIC_CRC_TABLE */ | |
27 | #endif /* MAKECRCH */ | |
28 | ||
29 | #include "zutil.h" /* for STDC and FAR definitions */ | |
30 | ||
31 | #define local static | |
32 | ||
33 | /* Find a four-byte integer type for crc32_little() and crc32_big(). */ | |
34 | #ifndef NOBYFOUR | |
35 | # ifdef STDC /* need ANSI C limits.h to determine sizes */ | |
36 | # include <limits.h> | |
37 | # define BYFOUR | |
38 | # if (UINT_MAX == 0xffffffffUL) | |
39 | typedef unsigned int u4; | |
40 | # else | |
41 | # if (ULONG_MAX == 0xffffffffUL) | |
42 | typedef unsigned long u4; | |
43 | # else | |
44 | # if (USHRT_MAX == 0xffffffffUL) | |
45 | typedef unsigned short u4; | |
46 | # else | |
47 | # undef BYFOUR /* can't find a four-byte integer type! */ | |
48 | # endif | |
49 | # endif | |
50 | # endif | |
51 | # endif /* STDC */ | |
52 | #endif /* !NOBYFOUR */ | |
53 | ||
54 | /* Definitions for doing the crc four data bytes at a time. */ | |
55 | #ifdef BYFOUR | |
56 | # define REV(w) (((w)>>24)+(((w)>>8)&0xff00)+ \ | |
57 | (((w)&0xff00)<<8)+(((w)&0xff)<<24)) | |
58 | local unsigned long crc32_little OF((unsigned long, | |
59 | const unsigned char FAR *, unsigned)); | |
60 | local unsigned long crc32_big OF((unsigned long, | |
61 | const unsigned char FAR *, unsigned)); | |
62 | # define TBLS 8 | |
63 | #else | |
64 | # define TBLS 1 | |
65 | #endif /* BYFOUR */ | |
66 | ||
67 | /* Local functions for crc concatenation */ | |
68 | local unsigned long gf2_matrix_times OF((unsigned long *mat, | |
69 | unsigned long vec)); | |
70 | local void gf2_matrix_square OF((unsigned long *square, unsigned long *mat)); | |
71 | ||
72 | #ifdef DYNAMIC_CRC_TABLE | |
73 | ||
74 | local volatile int crc_table_empty = 1; | |
75 | local unsigned long FAR crc_table[TBLS][256]; | |
76 | local void make_crc_table OF((void)); | |
77 | #ifdef MAKECRCH | |
78 | local void write_table OF((FILE *, const unsigned long FAR *)); | |
79 | #endif /* MAKECRCH */ | |
80 | /* | |
81 | Generate tables for a byte-wise 32-bit CRC calculation on the polynomial: | |
82 | x^32+x^26+x^23+x^22+x^16+x^12+x^11+x^10+x^8+x^7+x^5+x^4+x^2+x+1. | |
83 | ||
84 | Polynomials over GF(2) are represented in binary, one bit per coefficient, | |
85 | with the lowest powers in the most significant bit. Then adding polynomials | |
86 | is just exclusive-or, and multiplying a polynomial by x is a right shift by | |
87 | one. If we call the above polynomial p, and represent a byte as the | |
88 | polynomial q, also with the lowest power in the most significant bit (so the | |
89 | byte 0xb1 is the polynomial x^7+x^3+x+1), then the CRC is (q*x^32) mod p, | |
90 | where a mod b means the remainder after dividing a by b. | |
91 | ||
92 | This calculation is done using the shift-register method of multiplying and | |
93 | taking the remainder. The register is initialized to zero, and for each | |
94 | incoming bit, x^32 is added mod p to the register if the bit is a one (where | |
95 | x^32 mod p is p+x^32 = x^26+...+1), and the register is multiplied mod p by | |
96 | x (which is shifting right by one and adding x^32 mod p if the bit shifted | |
97 | out is a one). We start with the highest power (least significant bit) of | |
98 | q and repeat for all eight bits of q. | |
99 | ||
100 | The first table is simply the CRC of all possible eight bit values. This is | |
101 | all the information needed to generate CRCs on data a byte at a time for all | |
102 | combinations of CRC register values and incoming bytes. The remaining tables | |
103 | allow for word-at-a-time CRC calculation for both big-endian and little- | |
104 | endian machines, where a word is four bytes. | |
105 | */ | |
106 | local void make_crc_table() | |
107 | { | |
108 | unsigned long c; | |
109 | int n, k; | |
110 | unsigned long poly; /* polynomial exclusive-or pattern */ | |
111 | /* terms of polynomial defining this crc (except x^32): */ | |
112 | static volatile int first = 1; /* flag to limit concurrent making */ | |
113 | static const unsigned char p[] = {0,1,2,4,5,7,8,10,11,12,16,22,23,26}; | |
114 | ||
115 | /* See if another task is already doing this (not thread-safe, but better | |
116 | than nothing -- significantly reduces duration of vulnerability in | |
117 | case the advice about DYNAMIC_CRC_TABLE is ignored) */ | |
118 | if (first) { | |
119 | first = 0; | |
120 | ||
121 | /* make exclusive-or pattern from polynomial (0xedb88320UL) */ | |
122 | poly = 0UL; | |
123 | for (n = 0; n < sizeof(p)/sizeof(unsigned char); n++) | |
124 | poly |= 1UL << (31 - p[n]); | |
125 | ||
126 | /* generate a crc for every 8-bit value */ | |
127 | for (n = 0; n < 256; n++) { | |
128 | c = (unsigned long)n; | |
129 | for (k = 0; k < 8; k++) | |
130 | c = c & 1 ? poly ^ (c >> 1) : c >> 1; | |
131 | crc_table[0][n] = c; | |
132 | } | |
133 | ||
134 | #ifdef BYFOUR | |
135 | /* generate crc for each value followed by one, two, and three zeros, | |
136 | and then the byte reversal of those as well as the first table */ | |
137 | for (n = 0; n < 256; n++) { | |
138 | c = crc_table[0][n]; | |
139 | crc_table[4][n] = REV(c); | |
140 | for (k = 1; k < 4; k++) { | |
141 | c = crc_table[0][c & 0xff] ^ (c >> 8); | |
142 | crc_table[k][n] = c; | |
143 | crc_table[k + 4][n] = REV(c); | |
144 | } | |
145 | } | |
146 | #endif /* BYFOUR */ | |
147 | ||
148 | crc_table_empty = 0; | |
149 | } | |
150 | else { /* not first */ | |
151 | /* wait for the other guy to finish (not efficient, but rare) */ | |
152 | while (crc_table_empty) | |
153 | ; | |
154 | } | |
155 | ||
156 | #ifdef MAKECRCH | |
157 | /* write out CRC tables to crc32.h */ | |
158 | { | |
159 | FILE *out; | |
160 | ||
161 | out = fopen("crc32.h", "w"); | |
162 | if (out == NULL) return; | |
163 | fprintf(out, "/* crc32.h -- tables for rapid CRC calculation\n"); | |
164 | fprintf(out, " * Generated automatically by crc32.c\n */\n\n"); | |
165 | fprintf(out, "local const unsigned long FAR "); | |
166 | fprintf(out, "crc_table[TBLS][256] =\n{\n {\n"); | |
167 | write_table(out, crc_table[0]); | |
168 | # ifdef BYFOUR | |
169 | fprintf(out, "#ifdef BYFOUR\n"); | |
170 | for (k = 1; k < 8; k++) { | |
171 | fprintf(out, " },\n {\n"); | |
172 | write_table(out, crc_table[k]); | |
173 | } | |
174 | fprintf(out, "#endif\n"); | |
175 | # endif /* BYFOUR */ | |
176 | fprintf(out, " }\n};\n"); | |
177 | fclose(out); | |
178 | } | |
179 | #endif /* MAKECRCH */ | |
180 | } | |
181 | ||
182 | #ifdef MAKECRCH | |
183 | local void write_table(out, table) | |
184 | FILE *out; | |
185 | const unsigned long FAR *table; | |
186 | { | |
187 | int n; | |
188 | ||
189 | for (n = 0; n < 256; n++) | |
190 | fprintf(out, "%s0x%08lxUL%s", n % 5 ? "" : " ", table[n], | |
191 | n == 255 ? "\n" : (n % 5 == 4 ? ",\n" : ", ")); | |
192 | } | |
193 | #endif /* MAKECRCH */ | |
194 | ||
195 | #else /* !DYNAMIC_CRC_TABLE */ | |
196 | /* ======================================================================== | |
197 | * Tables of CRC-32s of all single-byte values, made by make_crc_table(). | |
198 | */ | |
199 | #include "crc32.h" | |
200 | #endif /* DYNAMIC_CRC_TABLE */ | |
201 | ||
202 | /* ========================================================================= | |
203 | * This function can be used by asm versions of crc32() | |
204 | */ | |
205 | const unsigned long FAR * ZEXPORT get_crc_table() | |
206 | { | |
207 | #ifdef DYNAMIC_CRC_TABLE | |
208 | if (crc_table_empty) | |
209 | make_crc_table(); | |
210 | #endif /* DYNAMIC_CRC_TABLE */ | |
211 | return (const unsigned long FAR *)crc_table; | |
212 | } | |
213 | ||
214 | /* ========================================================================= */ | |
215 | #define DO1 crc = crc_table[0][((int)crc ^ (*buf++)) & 0xff] ^ (crc >> 8) | |
216 | #define DO8 DO1; DO1; DO1; DO1; DO1; DO1; DO1; DO1 | |
217 | ||
218 | /* ========================================================================= */ | |
219 | unsigned long ZEXPORT crc32(crc, buf, len) | |
220 | unsigned long crc; | |
221 | const unsigned char FAR *buf; | |
222 | unsigned len; | |
223 | { | |
224 | if (buf == Z_NULL) return 0UL; | |
225 | ||
226 | #ifdef DYNAMIC_CRC_TABLE | |
227 | if (crc_table_empty) | |
228 | make_crc_table(); | |
229 | #endif /* DYNAMIC_CRC_TABLE */ | |
230 | ||
231 | #ifdef BYFOUR | |
232 | if (sizeof(void *) == sizeof(ptrdiff_t)) { | |
233 | u4 endian; | |
234 | ||
235 | endian = 1; | |
236 | if (*((unsigned char *)(&endian))) | |
237 | return crc32_little(crc, buf, len); | |
238 | else | |
239 | return crc32_big(crc, buf, len); | |
240 | } | |
241 | #endif /* BYFOUR */ | |
242 | crc = crc ^ 0xffffffffUL; | |
243 | while (len >= 8) { | |
244 | DO8; | |
245 | len -= 8; | |
246 | } | |
247 | if (len) do { | |
248 | DO1; | |
249 | } while (--len); | |
250 | return crc ^ 0xffffffffUL; | |
251 | } | |
252 | ||
253 | #ifdef BYFOUR | |
254 | ||
255 | /* ========================================================================= */ | |
256 | #define DOLIT4 c ^= *buf4++; \ | |
257 | c = crc_table[3][c & 0xff] ^ crc_table[2][(c >> 8) & 0xff] ^ \ | |
258 | crc_table[1][(c >> 16) & 0xff] ^ crc_table[0][c >> 24] | |
259 | #define DOLIT32 DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4 | |
260 | ||
261 | /* ========================================================================= */ | |
262 | local unsigned long crc32_little(crc, buf, len) | |
263 | unsigned long crc; | |
264 | const unsigned char FAR *buf; | |
265 | unsigned len; | |
266 | { | |
267 | register u4 c; | |
268 | register const u4 FAR *buf4; | |
269 | ||
270 | c = (u4)crc; | |
271 | c = ~c; | |
272 | while (len && ((ptrdiff_t)buf & 3)) { | |
273 | c = crc_table[0][(c ^ *buf++) & 0xff] ^ (c >> 8); | |
274 | len--; | |
275 | } | |
276 | ||
277 | buf4 = (const u4 FAR *)(const void FAR *)buf; | |
278 | while (len >= 32) { | |
279 | DOLIT32; | |
280 | len -= 32; | |
281 | } | |
282 | while (len >= 4) { | |
283 | DOLIT4; | |
284 | len -= 4; | |
285 | } | |
286 | buf = (const unsigned char FAR *)buf4; | |
287 | ||
288 | if (len) do { | |
289 | c = crc_table[0][(c ^ *buf++) & 0xff] ^ (c >> 8); | |
290 | } while (--len); | |
291 | c = ~c; | |
292 | return (unsigned long)c; | |
293 | } | |
294 | ||
295 | /* ========================================================================= */ | |
296 | #define DOBIG4 c ^= *++buf4; \ | |
297 | c = crc_table[4][c & 0xff] ^ crc_table[5][(c >> 8) & 0xff] ^ \ | |
298 | crc_table[6][(c >> 16) & 0xff] ^ crc_table[7][c >> 24] | |
299 | #define DOBIG32 DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4 | |
300 | ||
301 | /* ========================================================================= */ | |
302 | local unsigned long crc32_big(crc, buf, len) | |
303 | unsigned long crc; | |
304 | const unsigned char FAR *buf; | |
305 | unsigned len; | |
306 | { | |
307 | register u4 c; | |
308 | register const u4 FAR *buf4; | |
309 | ||
310 | c = REV((u4)crc); | |
311 | c = ~c; | |
312 | while (len && ((ptrdiff_t)buf & 3)) { | |
313 | c = crc_table[4][(c >> 24) ^ *buf++] ^ (c << 8); | |
314 | len--; | |
315 | } | |
316 | ||
317 | buf4 = (const u4 FAR *)(const void FAR *)buf; | |
318 | buf4--; | |
319 | while (len >= 32) { | |
320 | DOBIG32; | |
321 | len -= 32; | |
322 | } | |
323 | while (len >= 4) { | |
324 | DOBIG4; | |
325 | len -= 4; | |
326 | } | |
327 | buf4++; | |
328 | buf = (const unsigned char FAR *)buf4; | |
329 | ||
330 | if (len) do { | |
331 | c = crc_table[4][(c >> 24) ^ *buf++] ^ (c << 8); | |
332 | } while (--len); | |
333 | c = ~c; | |
334 | return (unsigned long)(REV(c)); | |
335 | } | |
336 | ||
337 | #endif /* BYFOUR */ | |
338 | ||
339 | #define GF2_DIM 32 /* dimension of GF(2) vectors (length of CRC) */ | |
340 | ||
341 | /* ========================================================================= */ | |
342 | local unsigned long gf2_matrix_times(mat, vec) | |
343 | unsigned long *mat; | |
344 | unsigned long vec; | |
345 | { | |
346 | unsigned long sum; | |
347 | ||
348 | sum = 0; | |
349 | while (vec) { | |
350 | if (vec & 1) | |
351 | sum ^= *mat; | |
352 | vec >>= 1; | |
353 | mat++; | |
354 | } | |
355 | return sum; | |
356 | } | |
357 | ||
358 | /* ========================================================================= */ | |
359 | local void gf2_matrix_square(square, mat) | |
360 | unsigned long *square; | |
361 | unsigned long *mat; | |
362 | { | |
363 | int n; | |
364 | ||
365 | for (n = 0; n < GF2_DIM; n++) | |
366 | square[n] = gf2_matrix_times(mat, mat[n]); | |
367 | } | |
368 | ||
369 | /* ========================================================================= */ | |
370 | uLong ZEXPORT crc32_combine(crc1, crc2, len2) | |
371 | uLong crc1; | |
372 | uLong crc2; | |
373 | z_off_t len2; | |
374 | { | |
375 | int n; | |
376 | unsigned long row; | |
377 | unsigned long even[GF2_DIM]; /* even-power-of-two zeros operator */ | |
378 | unsigned long odd[GF2_DIM]; /* odd-power-of-two zeros operator */ | |
379 | ||
380 | /* degenerate case */ | |
381 | if (len2 == 0) | |
382 | return crc1; | |
383 | ||
384 | /* put operator for one zero bit in odd */ | |
385 | odd[0] = 0xedb88320L; /* CRC-32 polynomial */ | |
386 | row = 1; | |
387 | for (n = 1; n < GF2_DIM; n++) { | |
388 | odd[n] = row; | |
389 | row <<= 1; | |
390 | } | |
391 | ||
392 | /* put operator for two zero bits in even */ | |
393 | gf2_matrix_square(even, odd); | |
394 | ||
395 | /* put operator for four zero bits in odd */ | |
396 | gf2_matrix_square(odd, even); | |
397 | ||
398 | /* apply len2 zeros to crc1 (first square will put the operator for one | |
399 | zero byte, eight zero bits, in even) */ | |
400 | do { | |
401 | /* apply zeros operator for this bit of len2 */ | |
402 | gf2_matrix_square(even, odd); | |
403 | if (len2 & 1) | |
404 | crc1 = gf2_matrix_times(even, crc1); | |
405 | len2 >>= 1; | |
406 | ||
407 | /* if no more bits set, then done */ | |
408 | if (len2 == 0) | |
409 | break; | |
410 | ||
411 | /* another iteration of the loop with odd and even swapped */ | |
412 | gf2_matrix_square(odd, even); | |
413 | if (len2 & 1) | |
414 | crc1 = gf2_matrix_times(odd, crc1); | |
415 | len2 >>= 1; | |
416 | ||
417 | /* if no more bits set, then done */ | |
418 | } while (len2 != 0); | |
419 | ||
420 | /* return combined crc */ | |
421 | crc1 ^= crc2; | |
422 | return crc1; | |
423 | } |