]> git.ipfire.org Git - thirdparty/libarchive.git/commitdiff
Revert unintentional commit of wip changes for
authorJoerg Sonnenberger <joerg.sonnenberger@gmail.com>
Mon, 4 Aug 2008 07:31:57 +0000 (03:31 -0400)
committerJoerg Sonnenberger <joerg.sonnenberger@gmail.com>
Mon, 4 Aug 2008 07:31:57 +0000 (03:31 -0400)
archive_write_set_compression_compress.c.

SVN-Revision: 178

libarchive/archive_write_set_compression_compress.c

index b62d6fe255722493ea2b0ae52e608a4ec60bd43a..f913a23c53b1d1daae7d9f14ac1d56cf56792f9e 100644 (file)
@@ -74,6 +74,8 @@ __FBSDID("$FreeBSD: src/lib/libarchive/archive_write_set_compression_compress.c,
 #include "archive_private.h"
 #include "archive_write_private.h"
 
+#define        HSIZE           69001   /* 95% occupancy */
+#define        HSHIFT          8       /* 8 - trunc(log2(HSIZE / 65536)) */
 #define        CHECK_GAP 10000         /* Ratio check interval. */
 
 #define        MAXCODE(bits)   ((1 << (bits)) - 1)
@@ -91,10 +93,12 @@ struct private_data {
        int code_len;                   /* Number of bits/code. */
        int cur_maxcode;                /* Maximum code, given n_bits. */
        int max_maxcode;                /* Should NEVER generate this code. */
+       int hashtab [HSIZE];
+       unsigned short codetab [HSIZE];
        int first_free;         /* First unused entry. */
        int compress_ratio;
 
-       size_t cur_code;
+       int cur_code, cur_fcode;
 
        int bit_offset;
        unsigned char bit_buf;
@@ -102,10 +106,6 @@ struct private_data {
        unsigned char   *compressed;
        size_t           compressed_buffer_size;
        size_t           compressed_offset;
-
-       uint8_t code_next[65536];
-       uint16_t code_link[65536];
-       uint16_t code_state[65536];
 };
 
 static int     archive_compressor_compress_finish(struct archive_write *);
@@ -158,6 +158,7 @@ archive_compressor_compress_init(struct archive_write *a)
                    "Can't allocate data for compression");
                return (ARCHIVE_FATAL);
        }
+       memset(state, 0, sizeof(*state));
 
        state->compressed_buffer_size = a->bytes_per_block;
        state->compressed = malloc(state->compressed_buffer_size);
@@ -172,23 +173,18 @@ archive_compressor_compress_init(struct archive_write *a)
        a->compressor.write = archive_compressor_compress_write;
        a->compressor.finish = archive_compressor_compress_finish;
 
-       state->in_count = 0;
-       state->out_count = 0;
-       state->checkpoint = 0;
-
        state->max_maxcode = 0x10000;   /* Should NEVER generate this code. */
+       state->in_count = 0;            /* Length of input. */
        state->bit_buf = 0;
        state->bit_offset = 0;
        state->out_count = 3;           /* Includes 3-byte header mojo. */
        state->compress_ratio = 0;
        state->checkpoint = CHECK_GAP;
        state->code_len = 9;
-       state->cur_code = 256;
        state->cur_maxcode = MAXCODE(state->code_len);
        state->first_free = FIRST;
 
-       state->first_higher = 0;
-       memset(state->code_lower, 0, sizeof(state->code_lower));
+       memset(state->hashtab, 0xff, sizeof(state->hashtab));
 
        /* Prime output buffer with a gzip header. */
        state->compressed[0] = 0x1f; /* Compress */
@@ -215,6 +211,9 @@ archive_compressor_compress_init(struct archive_write *a)
  * code in turn.  When the buffer fills up empty it and start over.
  */
 
+static unsigned char rmask[9] =
+       {0x00, 0x01, 0x03, 0x07, 0x0f, 0x1f, 0x3f, 0x7f, 0xff};
+
 static int
 output_byte(struct archive_write *a, unsigned char c)
 {
@@ -264,7 +263,7 @@ output_code(struct archive_write *a, int ocode)
        }
        /* Last bits. */
        state->bit_offset += state->code_len;
-       state->bit_buf = ocode & ((1 << bits) - 1);
+       state->bit_buf = ocode & rmask[bits];
        if (state->bit_offset == state->code_len * 8)
                state->bit_offset = 0;
 
@@ -292,8 +291,6 @@ output_code(struct archive_write *a, int ocode)
                if (clear_flg) {
                        state->code_len = 9;
                        state->cur_maxcode = MAXCODE(state->code_len);
-                       state->first_higher = 0;
-                       memset(state->code_lower, 0, sizeof(state->code_lower));
                } else {
                        state->code_len++;
                        if (state->code_len == 16)
@@ -333,9 +330,8 @@ archive_compressor_compress_write(struct archive_write *a, const void *buff,
        struct private_data *state;
        int i;
        int ratio;
-       int ret;
+       int c, disp, ret;
        const unsigned char *bp;
-       size_t c, next1, next2;
 
        state = (struct private_data *)a->compressor.data;
        if (a->client_writer == NULL) {
@@ -359,26 +355,40 @@ archive_compressor_compress_write(struct archive_write *a, const void *buff,
        while (length--) {
                c = *bp++;
                state->in_count++;
+               state->cur_fcode = (c << 16) + state->cur_code;
+               i = ((c << HSHIFT) ^ state->cur_code);  /* Xor hashing. */
+
+               if (state->hashtab[i] == state->cur_fcode) {
+                       state->cur_code = state->codetab[i];
+                       continue;
+               }
+               if (state->hashtab[i] < 0)      /* Empty slot. */
+                       goto nomatch;
+               /* Secondary hash (after G. Knott). */
+               if (i == 0)
+                       disp = 1;
+               else
+                       disp = HSIZE - i;
+ probe:                
+               if ((i -= disp) < 0)
+                       i += HSIZE;
 
-               if ((next1 = state->code_lower[state->cur_code * 16 + c / 16]) != 0 &&
-                   (next2 = state->code_higher[next1 * 16 + c % 16]) != 0) {
-                       state->cur_code = next2;
+               if (state->hashtab[i] == state->cur_fcode) {
+                       state->cur_code = state->codetab[i];
                        continue;
                }
+               if (state->hashtab[i] >= 0)
+                       goto probe;
+ nomatch:      
                ret = output_code(a, state->cur_code);
                if (ret != ARCHIVE_OK)
                        return ret;
+               state->cur_code = c;
                if (state->first_free < state->max_maxcode) {
-                       if (next1 == 0) {
-                               next1 = ++state->first_higher;
-                               state->code_lower[state->cur_code * 16 + c / 16] = next1;
-                               memset(state->code_higher + next1 * 16, 0, 32);
-                       }
-                       state->code_higher[next1 * 16 + c % 16] = state->first_free++;
-                       state->cur_code = c;
+                       state->codetab[i] = state->first_free++;        /* code -> hashtable */
+                       state->hashtab[i] = state->cur_fcode;
                        continue;
                }
-               state->cur_code = c;
                if (state->in_count < state->checkpoint)
                        continue;
 
@@ -395,6 +405,7 @@ archive_compressor_compress_write(struct archive_write *a, const void *buff,
                        state->compress_ratio = ratio;
                else {
                        state->compress_ratio = 0;
+                       memset(state->hashtab, 0xff, sizeof(state->hashtab));
                        state->first_free = FIRST;
                        ret = output_code(a, CLEAR);
                        if (ret != ARCHIVE_OK)
@@ -405,6 +416,7 @@ archive_compressor_compress_write(struct archive_write *a, const void *buff,
        return (ARCHIVE_OK);
 }
 
+
 /*
  * Finish the compression...
  */