nuclear@2: /* crc32.c -- compute the CRC-32 of a data stream
nuclear@2:  * Copyright (C) 1995-2005 Mark Adler
nuclear@2:  * For conditions of distribution and use, see copyright notice in zlib.h
nuclear@2:  *
nuclear@2:  * Thanks to Rodney Brown <rbrown64@csc.com.au> for his contribution of faster
nuclear@2:  * CRC methods: exclusive-oring 32 bits of data at a time, and pre-computing
nuclear@2:  * tables for updating the shift register in one step with three exclusive-ors
nuclear@2:  * instead of four steps with four exclusive-ors.  This results in about a
nuclear@2:  * factor of two increase in speed on a Power PC G4 (PPC7455) using gcc -O3.
nuclear@2:  */
nuclear@2: 
nuclear@2: /* @(#) $Id$ */
nuclear@2: 
nuclear@2: /*
nuclear@2:   Note on the use of DYNAMIC_CRC_TABLE: there is no mutex or semaphore
nuclear@2:   protection on the static variables used to control the first-use generation
nuclear@2:   of the crc tables.  Therefore, if you #define DYNAMIC_CRC_TABLE, you should
nuclear@2:   first call get_crc_table() to initialize the tables before allowing more than
nuclear@2:   one thread to use crc32().
nuclear@2:  */
nuclear@2: 
nuclear@2: #ifdef MAKECRCH
nuclear@2: #  include <stdio.h>
nuclear@2: #  ifndef DYNAMIC_CRC_TABLE
nuclear@2: #    define DYNAMIC_CRC_TABLE
nuclear@2: #  endif /* !DYNAMIC_CRC_TABLE */
nuclear@2: #endif /* MAKECRCH */
nuclear@2: 
nuclear@2: #include "zutil.h"      /* for STDC and FAR definitions */
nuclear@2: 
nuclear@2: #define local static
nuclear@2: 
/* Choose u4, an unsigned integer type exactly 32 bits wide, for use by
   crc32_little() and crc32_big().  BYFOUR remains defined only when such a
   type was found; defining NOBYFOUR skips the search entirely. */
#ifndef NOBYFOUR
#  ifdef STDC           /* ANSI C limits.h is required to learn the sizes */
#    include <limits.h>
#    define BYFOUR
#    if (UINT_MAX == 0xffffffffUL)
       typedef unsigned int u4;
#    elif (ULONG_MAX == 0xffffffffUL)
       typedef unsigned long u4;
#    elif (USHRT_MAX == 0xffffffffUL)
       typedef unsigned short u4;
#    else
#      undef BYFOUR     /* no four-byte integer type is available */
#    endif
#  endif /* STDC */
#endif /* !NOBYFOUR */
nuclear@2: 
nuclear@2: /* Definitions for doing the crc four data bytes at a time. */
nuclear@2: #ifdef BYFOUR
nuclear@2: #  define REV(w) (((w)>>24)+(((w)>>8)&0xff00)+ \
nuclear@2:                 (((w)&0xff00)<<8)+(((w)&0xff)<<24))
nuclear@2:    local unsigned long crc32_little OF((unsigned long,
nuclear@2:                         const unsigned char FAR *, unsigned));
nuclear@2:    local unsigned long crc32_big OF((unsigned long,
nuclear@2:                         const unsigned char FAR *, unsigned));
nuclear@2: #  define TBLS 8
nuclear@2: #else
nuclear@2: #  define TBLS 1
nuclear@2: #endif /* BYFOUR */
nuclear@2: 
nuclear@2: /* Local functions for crc concatenation */
nuclear@2: local unsigned long gf2_matrix_times OF((unsigned long *mat,
nuclear@2:                                          unsigned long vec));
nuclear@2: local void gf2_matrix_square OF((unsigned long *square, unsigned long *mat));
nuclear@2: 
nuclear@2: #ifdef DYNAMIC_CRC_TABLE
nuclear@2: 
nuclear@2: local volatile int crc_table_empty = 1;
nuclear@2: local unsigned long FAR crc_table[TBLS][256];
nuclear@2: local void make_crc_table OF((void));
nuclear@2: #ifdef MAKECRCH
nuclear@2:    local void write_table OF((FILE *, const unsigned long FAR *));
nuclear@2: #endif /* MAKECRCH */
nuclear@2: /*
nuclear@2:   Generate tables for a byte-wise 32-bit CRC calculation on the polynomial:
nuclear@2:   x^32+x^26+x^23+x^22+x^16+x^12+x^11+x^10+x^8+x^7+x^5+x^4+x^2+x+1.
nuclear@2: 
  Polynomials over GF(2) are represented in binary, one bit per coefficient,
  with the lowest powers in the most significant bit.  Then adding polynomials
  is just exclusive-or, and multiplying a polynomial by x is a right shift by
  one.  If we call the above polynomial p, and represent a byte as the
  polynomial q, also with the lowest power in the most significant bit (so the
  byte 0xb1 is the polynomial x^7+x^3+x^2+1), then the CRC is (q*x^32) mod p,
  where a mod b means the remainder after dividing a by b.
nuclear@2: 
nuclear@2:   This calculation is done using the shift-register method of multiplying and
nuclear@2:   taking the remainder.  The register is initialized to zero, and for each
nuclear@2:   incoming bit, x^32 is added mod p to the register if the bit is a one (where
nuclear@2:   x^32 mod p is p+x^32 = x^26+...+1), and the register is multiplied mod p by
nuclear@2:   x (which is shifting right by one and adding x^32 mod p if the bit shifted
nuclear@2:   out is a one).  We start with the highest power (least significant bit) of
nuclear@2:   q and repeat for all eight bits of q.
nuclear@2: 
nuclear@2:   The first table is simply the CRC of all possible eight bit values.  This is
nuclear@2:   all the information needed to generate CRCs on data a byte at a time for all
nuclear@2:   combinations of CRC register values and incoming bytes.  The remaining tables
nuclear@2:   allow for word-at-a-time CRC calculation for both big-endian and little-
nuclear@2:   endian machines, where a word is four bytes.
nuclear@2: */
nuclear@2: local void make_crc_table()
nuclear@2: {
nuclear@2:     unsigned long c;
nuclear@2:     int n, k;
nuclear@2:     unsigned long poly;                 /* polynomial exclusive-or pattern */
nuclear@2:     /* terms of polynomial defining this crc (except x^32): */
nuclear@2:     static volatile int first = 1;      /* flag to limit concurrent making */
nuclear@2:     static const unsigned char p[] = {0,1,2,4,5,7,8,10,11,12,16,22,23,26};
nuclear@2: 
nuclear@2:     /* See if another task is already doing this (not thread-safe, but better
nuclear@2:        than nothing -- significantly reduces duration of vulnerability in
nuclear@2:        case the advice about DYNAMIC_CRC_TABLE is ignored) */
nuclear@2:     if (first) {
nuclear@2:         first = 0;
nuclear@2: 
nuclear@2:         /* make exclusive-or pattern from polynomial (0xedb88320UL) */
nuclear@2:         poly = 0UL;
nuclear@2:         for (n = 0; n < sizeof(p)/sizeof(unsigned char); n++)
nuclear@2:             poly |= 1UL << (31 - p[n]);
nuclear@2: 
nuclear@2:         /* generate a crc for every 8-bit value */
nuclear@2:         for (n = 0; n < 256; n++) {
nuclear@2:             c = (unsigned long)n;
nuclear@2:             for (k = 0; k < 8; k++)
nuclear@2:                 c = c & 1 ? poly ^ (c >> 1) : c >> 1;
nuclear@2:             crc_table[0][n] = c;
nuclear@2:         }
nuclear@2: 
nuclear@2: #ifdef BYFOUR
nuclear@2:         /* generate crc for each value followed by one, two, and three zeros,
nuclear@2:            and then the byte reversal of those as well as the first table */
nuclear@2:         for (n = 0; n < 256; n++) {
nuclear@2:             c = crc_table[0][n];
nuclear@2:             crc_table[4][n] = REV(c);
nuclear@2:             for (k = 1; k < 4; k++) {
nuclear@2:                 c = crc_table[0][c & 0xff] ^ (c >> 8);
nuclear@2:                 crc_table[k][n] = c;
nuclear@2:                 crc_table[k + 4][n] = REV(c);
nuclear@2:             }
nuclear@2:         }
nuclear@2: #endif /* BYFOUR */
nuclear@2: 
nuclear@2:         crc_table_empty = 0;
nuclear@2:     }
nuclear@2:     else {      /* not first */
nuclear@2:         /* wait for the other guy to finish (not efficient, but rare) */
nuclear@2:         while (crc_table_empty)
nuclear@2:             ;
nuclear@2:     }
nuclear@2: 
nuclear@2: #ifdef MAKECRCH
nuclear@2:     /* write out CRC tables to crc32.h */
nuclear@2:     {
nuclear@2:         FILE *out;
nuclear@2: 
nuclear@2:         out = fopen("crc32.h", "w");
nuclear@2:         if (out == NULL) return;
nuclear@2:         fprintf(out, "/* crc32.h -- tables for rapid CRC calculation\n");
nuclear@2:         fprintf(out, " * Generated automatically by crc32.c\n */\n\n");
nuclear@2:         fprintf(out, "local const unsigned long FAR ");
nuclear@2:         fprintf(out, "crc_table[TBLS][256] =\n{\n  {\n");
nuclear@2:         write_table(out, crc_table[0]);
nuclear@2: #  ifdef BYFOUR
nuclear@2:         fprintf(out, "#ifdef BYFOUR\n");
nuclear@2:         for (k = 1; k < 8; k++) {
nuclear@2:             fprintf(out, "  },\n  {\n");
nuclear@2:             write_table(out, crc_table[k]);
nuclear@2:         }
nuclear@2:         fprintf(out, "#endif\n");
nuclear@2: #  endif /* BYFOUR */
nuclear@2:         fprintf(out, "  }\n};\n");
nuclear@2:         fclose(out);
nuclear@2:     }
nuclear@2: #endif /* MAKECRCH */
nuclear@2: }
nuclear@2: 
#ifdef MAKECRCH
/* Print the 256 entries of table to out as 8-digit hexadecimal constants
   with a UL suffix, five to a line, each line indented by four spaces.
   Entries are separated by commas; the last entry is followed only by a
   newline. */
local void write_table(out, table)
    FILE *out;
    const unsigned long FAR *table;
{
    int idx;
    const char *lead;       /* indentation at the start of an output line */
    const char *trail;      /* separator written after the entry */

    for (idx = 0; idx < 256; idx++) {
        lead = (idx % 5 == 0) ? "    " : "";
        if (idx == 255)
            trail = "\n";
        else if (idx % 5 == 4)
            trail = ",\n";
        else
            trail = ", ";
        fprintf(out, "%s0x%08lxUL%s", lead, table[idx], trail);
    }
}
#endif /* MAKECRCH */
nuclear@2: 
nuclear@2: #else /* !DYNAMIC_CRC_TABLE */
nuclear@2: /* ========================================================================
nuclear@2:  * Tables of CRC-32s of all single-byte values, made by make_crc_table().
nuclear@2:  */
nuclear@2: #include "crc32.h"
nuclear@2: #endif /* DYNAMIC_CRC_TABLE */
nuclear@2: 
nuclear@2: /* =========================================================================
nuclear@2:  * This function can be used by asm versions of crc32()
nuclear@2:  */
nuclear@2: const unsigned long FAR * ZEXPORT get_crc_table()
nuclear@2: {
nuclear@2: #ifdef DYNAMIC_CRC_TABLE
nuclear@2:     if (crc_table_empty)
nuclear@2:         make_crc_table();
nuclear@2: #endif /* DYNAMIC_CRC_TABLE */
nuclear@2:     return (const unsigned long FAR *)crc_table;
nuclear@2: }
nuclear@2: 
nuclear@2: /* ========================================================================= */
nuclear@2: #define DO1 crc = crc_table[0][((int)crc ^ (*buf++)) & 0xff] ^ (crc >> 8)
nuclear@2: #define DO8 DO1; DO1; DO1; DO1; DO1; DO1; DO1; DO1
nuclear@2: 
nuclear@2: /* ========================================================================= */
nuclear@2: unsigned long ZEXPORT crc32(crc, buf, len)
nuclear@2:     unsigned long crc;
nuclear@2:     const unsigned char FAR *buf;
nuclear@2:     unsigned len;
nuclear@2: {
nuclear@2:     if (buf == Z_NULL) return 0UL;
nuclear@2: 
nuclear@2: #ifdef DYNAMIC_CRC_TABLE
nuclear@2:     if (crc_table_empty)
nuclear@2:         make_crc_table();
nuclear@2: #endif /* DYNAMIC_CRC_TABLE */
nuclear@2: 
nuclear@2: #ifdef BYFOUR
nuclear@2:     if (sizeof(void *) == sizeof(ptrdiff_t)) {
nuclear@2:         u4 endian;
nuclear@2: 
nuclear@2:         endian = 1;
nuclear@2:         if (*((unsigned char *)(&endian)))
nuclear@2:             return crc32_little(crc, buf, len);
nuclear@2:         else
nuclear@2:             return crc32_big(crc, buf, len);
nuclear@2:     }
nuclear@2: #endif /* BYFOUR */
nuclear@2:     crc = crc ^ 0xffffffffUL;
nuclear@2:     while (len >= 8) {
nuclear@2:         DO8;
nuclear@2:         len -= 8;
nuclear@2:     }
nuclear@2:     if (len) do {
nuclear@2:         DO1;
nuclear@2:     } while (--len);
nuclear@2:     return crc ^ 0xffffffffUL;
nuclear@2: }
nuclear@2: 
nuclear@2: #ifdef BYFOUR
nuclear@2: 
nuclear@2: /* ========================================================================= */
nuclear@2: #define DOLIT4 c ^= *buf4++; \
nuclear@2:         c = crc_table[3][c & 0xff] ^ crc_table[2][(c >> 8) & 0xff] ^ \
nuclear@2:             crc_table[1][(c >> 16) & 0xff] ^ crc_table[0][c >> 24]
nuclear@2: #define DOLIT32 DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4
nuclear@2: 
nuclear@2: /* ========================================================================= */
nuclear@2: local unsigned long crc32_little(crc, buf, len)
nuclear@2:     unsigned long crc;
nuclear@2:     const unsigned char FAR *buf;
nuclear@2:     unsigned len;
nuclear@2: {
nuclear@2:     register u4 c;
nuclear@2:     register const u4 FAR *buf4;
nuclear@2: 
nuclear@2:     c = (u4)crc;
nuclear@2:     c = ~c;
nuclear@2:     while (len && ((ptrdiff_t)buf & 3)) {
nuclear@2:         c = crc_table[0][(c ^ *buf++) & 0xff] ^ (c >> 8);
nuclear@2:         len--;
nuclear@2:     }
nuclear@2: 
nuclear@2:     buf4 = (const u4 FAR *)(const void FAR *)buf;
nuclear@2:     while (len >= 32) {
nuclear@2:         DOLIT32;
nuclear@2:         len -= 32;
nuclear@2:     }
nuclear@2:     while (len >= 4) {
nuclear@2:         DOLIT4;
nuclear@2:         len -= 4;
nuclear@2:     }
nuclear@2:     buf = (const unsigned char FAR *)buf4;
nuclear@2: 
nuclear@2:     if (len) do {
nuclear@2:         c = crc_table[0][(c ^ *buf++) & 0xff] ^ (c >> 8);
nuclear@2:     } while (--len);
nuclear@2:     c = ~c;
nuclear@2:     return (unsigned long)c;
nuclear@2: }
nuclear@2: 
nuclear@2: /* ========================================================================= */
nuclear@2: #define DOBIG4 c ^= *++buf4; \
nuclear@2:         c = crc_table[4][c & 0xff] ^ crc_table[5][(c >> 8) & 0xff] ^ \
nuclear@2:             crc_table[6][(c >> 16) & 0xff] ^ crc_table[7][c >> 24]
nuclear@2: #define DOBIG32 DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4
nuclear@2: 
nuclear@2: /* ========================================================================= */
nuclear@2: local unsigned long crc32_big(crc, buf, len)
nuclear@2:     unsigned long crc;
nuclear@2:     const unsigned char FAR *buf;
nuclear@2:     unsigned len;
nuclear@2: {
nuclear@2:     register u4 c;
nuclear@2:     register const u4 FAR *buf4;
nuclear@2: 
nuclear@2:     c = REV((u4)crc);
nuclear@2:     c = ~c;
nuclear@2:     while (len && ((ptrdiff_t)buf & 3)) {
nuclear@2:         c = crc_table[4][(c >> 24) ^ *buf++] ^ (c << 8);
nuclear@2:         len--;
nuclear@2:     }
nuclear@2: 
nuclear@2:     buf4 = (const u4 FAR *)(const void FAR *)buf;
nuclear@2:     buf4--;
nuclear@2:     while (len >= 32) {
nuclear@2:         DOBIG32;
nuclear@2:         len -= 32;
nuclear@2:     }
nuclear@2:     while (len >= 4) {
nuclear@2:         DOBIG4;
nuclear@2:         len -= 4;
nuclear@2:     }
nuclear@2:     buf4++;
nuclear@2:     buf = (const unsigned char FAR *)buf4;
nuclear@2: 
nuclear@2:     if (len) do {
nuclear@2:         c = crc_table[4][(c >> 24) ^ *buf++] ^ (c << 8);
nuclear@2:     } while (--len);
nuclear@2:     c = ~c;
nuclear@2:     return (unsigned long)(REV(c));
nuclear@2: }
nuclear@2: 
nuclear@2: #endif /* BYFOUR */
nuclear@2: 
nuclear@2: #define GF2_DIM 32      /* dimension of GF(2) vectors (length of CRC) */
nuclear@2: 
nuclear@2: /* ========================================================================= */
nuclear@2: local unsigned long gf2_matrix_times(mat, vec)
nuclear@2:     unsigned long *mat;
nuclear@2:     unsigned long vec;
nuclear@2: {
nuclear@2:     unsigned long sum;
nuclear@2: 
nuclear@2:     sum = 0;
nuclear@2:     while (vec) {
nuclear@2:         if (vec & 1)
nuclear@2:             sum ^= *mat;
nuclear@2:         vec >>= 1;
nuclear@2:         mat++;
nuclear@2:     }
nuclear@2:     return sum;
nuclear@2: }
nuclear@2: 
nuclear@2: /* ========================================================================= */
nuclear@2: local void gf2_matrix_square(square, mat)
nuclear@2:     unsigned long *square;
nuclear@2:     unsigned long *mat;
nuclear@2: {
nuclear@2:     int n;
nuclear@2: 
nuclear@2:     for (n = 0; n < GF2_DIM; n++)
nuclear@2:         square[n] = gf2_matrix_times(mat, mat[n]);
nuclear@2: }
nuclear@2: 
nuclear@2: /* ========================================================================= */
nuclear@2: uLong ZEXPORT crc32_combine(crc1, crc2, len2)
nuclear@2:     uLong crc1;
nuclear@2:     uLong crc2;
nuclear@2:     z_off_t len2;
nuclear@2: {
nuclear@2:     int n;
nuclear@2:     unsigned long row;
nuclear@2:     unsigned long even[GF2_DIM];    /* even-power-of-two zeros operator */
nuclear@2:     unsigned long odd[GF2_DIM];     /* odd-power-of-two zeros operator */
nuclear@2: 
nuclear@2:     /* degenerate case */
nuclear@2:     if (len2 == 0)
nuclear@2:         return crc1;
nuclear@2: 
nuclear@2:     /* put operator for one zero bit in odd */
nuclear@2:     odd[0] = 0xedb88320L;           /* CRC-32 polynomial */
nuclear@2:     row = 1;
nuclear@2:     for (n = 1; n < GF2_DIM; n++) {
nuclear@2:         odd[n] = row;
nuclear@2:         row <<= 1;
nuclear@2:     }
nuclear@2: 
nuclear@2:     /* put operator for two zero bits in even */
nuclear@2:     gf2_matrix_square(even, odd);
nuclear@2: 
nuclear@2:     /* put operator for four zero bits in odd */
nuclear@2:     gf2_matrix_square(odd, even);
nuclear@2: 
nuclear@2:     /* apply len2 zeros to crc1 (first square will put the operator for one
nuclear@2:        zero byte, eight zero bits, in even) */
nuclear@2:     do {
nuclear@2:         /* apply zeros operator for this bit of len2 */
nuclear@2:         gf2_matrix_square(even, odd);
nuclear@2:         if (len2 & 1)
nuclear@2:             crc1 = gf2_matrix_times(even, crc1);
nuclear@2:         len2 >>= 1;
nuclear@2: 
nuclear@2:         /* if no more bits set, then done */
nuclear@2:         if (len2 == 0)
nuclear@2:             break;
nuclear@2: 
nuclear@2:         /* another iteration of the loop with odd and even swapped */
nuclear@2:         gf2_matrix_square(odd, even);
nuclear@2:         if (len2 & 1)
nuclear@2:             crc1 = gf2_matrix_times(odd, crc1);
nuclear@2:         len2 >>= 1;
nuclear@2: 
nuclear@2:         /* if no more bits set, then done */
nuclear@2:     } while (len2 != 0);
nuclear@2: 
nuclear@2:     /* return combined crc */
nuclear@2:     crc1 ^= crc2;
nuclear@2:     return crc1;
nuclear@2: }