busybox/archival/libunarchive/decompress_unzip.c

1105 lines
31 KiB
C
Raw Normal View History

2001-04-11 03:11:33 +00:00
/* vi: set sw=4 ts=4: */
/*
* gunzip implementation for busybox
*
* Based on GNU gzip v1.2.4 Copyright (C) 1992-1993 Jean-loup Gailly.
*
* Originally adjusted for busybox by Sven Rudolph <sr1@inf.tu-dresden.de>
* based on gzip sources
*
* Adjusted further by Erik Andersen <andersen@codepoet.org> to support
2001-12-06 08:20:14 +00:00
* files as well as stdin/stdout, and to generally behave itself wrt
2001-04-11 03:11:33 +00:00
* command line handling.
*
* General cleanup to better adhere to the style guide and make use of standard
* busybox functions by Glenn McGrath <bug1@iinet.net.au>
*
* read_gz interface + associated hacking by Laurence Anderson
*
* Fixed huft_build() so decoding end-of-block code does not grab more bits
* than necessary (this is required by unzip applet), added inflate_cleanup()
* to free leaked bytebuffer memory (used in unzip.c), and some minor style
* guide cleanups by Ed Clark
*
2001-04-11 03:11:33 +00:00
* gzip (GNU zip) -- compress files with zip algorithm and 'compress' interface
* Copyright (C) 1992-1993 Jean-loup Gailly
* The unzip code was written and put in the public domain by Mark Adler.
* Portions of the lzw code are derived from the public domain 'compress'
* written by Spencer Thomas, Joe Orost, James Woods, Jim McKie, Steve Davies,
* Ken Turkowski, Dave Mack and Peter Jannesen.
*
* See the file algorithm.doc for the compression algorithms and file formats.
2006-09-17 16:28:10 +00:00
*
* Licensed under GPLv2 or later, see file LICENSE in this tarball for details.
2001-04-11 03:11:33 +00:00
*/
#include "libbb.h"
2002-09-25 02:47:48 +00:00
#include "unarchive.h"
2001-04-11 03:11:33 +00:00
2002-09-25 02:47:48 +00:00
typedef struct huft_s {
unsigned char e; /* number of extra bits or operation */
unsigned char b; /* number of bits in this code or subcode */
union {
unsigned short n; /* literal, length base, or distance base */
struct huft_s *t; /* pointer to next level of table */
} v;
} huft_t;
2001-04-11 03:11:33 +00:00
enum {
/* gunzip_window size--must be a power of two, and
* at least 32K for zip's deflate method */
GUNZIP_WSIZE = 0x8000,
/* If BMAX needs to be larger than 16, then h and x[] should be ulg. */
BMAX = 16, /* maximum bit length of any code (16 for explode) */
N_MAX = 288, /* maximum number of codes in any set */
};
/* This is somewhat complex-looking arrangement, but it allows
* to place decompressor state either in bss or in
* malloc'ed space simply by changing #defines below.
* Sizes on i386:
* text data bss dec hex
* 5256 0 108 5364 14f4 - bss
* 4915 0 0 4915 1333 - malloc
*/
#define STATE_IN_BSS 0
#define STATE_IN_MALLOC 1
typedef struct state_t {
off_t gunzip_bytes_out; /* number of output bytes */
uint32_t gunzip_crc;
int gunzip_src_fd;
unsigned gunzip_outbuf_count; /* bytes in output buffer */
unsigned char *gunzip_window;
uint32_t *gunzip_crc_table;
/* bitbuffer */
unsigned gunzip_bb; /* bit buffer */
unsigned char gunzip_bk; /* bits in bit buffer */
/* These control the size of the STATE()bytebuffer */
unsigned bytebuffer_max;
unsigned char *bytebuffer;
unsigned bytebuffer_offset;
unsigned bytebuffer_size;
/* private data of inflate_codes() */
unsigned inflate_codes_ml; /* masks for bl and bd bits */
unsigned inflate_codes_md; /* masks for bl and bd bits */
unsigned inflate_codes_bb; /* bit buffer */
unsigned inflate_codes_k; /* number of bits in bit buffer */
unsigned inflate_codes_w; /* current gunzip_window position */
huft_t *inflate_codes_tl;
huft_t *inflate_codes_td;
unsigned inflate_codes_bl;
unsigned inflate_codes_bd;
unsigned inflate_codes_nn; /* length and index for copy */
unsigned inflate_codes_dd;
smallint resume_copy;
/* private data of inflate_get_next_window() */
smallint method; /* Method == -1 for stored, -2 for codes */
smallint need_another_block;
smallint end_reached;
/* private data of inflate_stored() */
unsigned inflate_stored_n;
unsigned inflate_stored_b;
unsigned inflate_stored_k;
unsigned inflate_stored_w;
} state_t;
#define gunzip_bytes_out (S()gunzip_bytes_out )
#define gunzip_crc (S()gunzip_crc )
#define gunzip_src_fd (S()gunzip_src_fd )
#define gunzip_outbuf_count (S()gunzip_outbuf_count)
#define gunzip_window (S()gunzip_window )
#define gunzip_crc_table (S()gunzip_crc_table )
#define gunzip_bb (S()gunzip_bb )
#define gunzip_bk (S()gunzip_bk )
#define bytebuffer_max (S()bytebuffer_max )
#define bytebuffer (S()bytebuffer )
#define bytebuffer_offset (S()bytebuffer_offset )
#define bytebuffer_size (S()bytebuffer_size )
#define inflate_codes_ml (S()inflate_codes_ml )
#define inflate_codes_md (S()inflate_codes_md )
#define inflate_codes_bb (S()inflate_codes_bb )
#define inflate_codes_k (S()inflate_codes_k )
#define inflate_codes_w (S()inflate_codes_w )
#define inflate_codes_tl (S()inflate_codes_tl )
#define inflate_codes_td (S()inflate_codes_td )
#define inflate_codes_bl (S()inflate_codes_bl )
#define inflate_codes_bd (S()inflate_codes_bd )
#define inflate_codes_nn (S()inflate_codes_nn )
#define inflate_codes_dd (S()inflate_codes_dd )
#define resume_copy (S()resume_copy )
#define method (S()method )
#define need_another_block (S()need_another_block )
#define end_reached (S()end_reached )
#define inflate_stored_n (S()inflate_stored_n )
#define inflate_stored_b (S()inflate_stored_b )
#define inflate_stored_k (S()inflate_stored_k )
#define inflate_stored_w (S()inflate_stored_w )
#define INIT_STATE ({ bytebuffer_size = 0; method = -1; need_another_block = 1; })
/* This is generic part */
#if STATE_IN_BSS /* Use global data segment */
#define DECLARE_STATE /*nothing*/
#define ALLOC_STATE (init_state())
#define DEALLOC_STATE ((void)0)
#define S() state.
#define PASS_STATE /*nothing*/
#define PASS_STATE_ONLY /*nothing*/
#define STATE_PARAM /*nothing*/
#define STATE_PARAM_ONLY void
static state_t state;
static void init_state(void)
{
INIT_STATE;
}
#endif
#if STATE_IN_MALLOC /* Use malloc space */
#define DECLARE_STATE state_t *state
#define ALLOC_STATE (state = alloc_state())
#define DEALLOC_STATE free(state)
#define S() state->
#define PASS_STATE state,
#define PASS_STATE_ONLY state
#define STATE_PARAM state_t *state,
#define STATE_PARAM_ONLY state_t *state
static state_t* alloc_state(void)
{
state_t* state = xzalloc(sizeof(*state));
INIT_STATE;
return state;
}
#endif
2001-04-11 03:11:33 +00:00
static const unsigned short mask_bits[] = {
2002-09-25 02:47:48 +00:00
0x0000, 0x0001, 0x0003, 0x0007, 0x000f, 0x001f, 0x003f, 0x007f, 0x00ff,
2001-04-11 03:11:33 +00:00
0x01ff, 0x03ff, 0x07ff, 0x0fff, 0x1fff, 0x3fff, 0x7fff, 0xffff
};
2002-09-25 02:47:48 +00:00
/* Copy lengths for literal codes 257..285 */
static const unsigned short cplens[] = {
3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 15, 17, 19, 23, 27, 31, 35, 43, 51, 59,
67, 83, 99, 115, 131, 163, 195, 227, 258, 0, 0
2002-09-25 02:47:48 +00:00
};
/* note: see note #13 above about the 258 in this list. */
/* Extra bits for literal codes 257..285 */
static const unsigned char cplext[] = {
0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3, 4, 4, 4, 4, 5,
5, 5, 5, 0, 99, 99
}; /* 99 == invalid */
2002-09-25 02:47:48 +00:00
/* Copy offsets for distance codes 0..29 */
static const unsigned short cpdist[] = {
1, 2, 3, 4, 5, 7, 9, 13, 17, 25, 33, 49, 65, 97, 129, 193, 257, 385, 513,
769, 1025, 1537, 2049, 3073, 4097, 6145, 8193, 12289, 16385, 24577
2002-09-25 02:47:48 +00:00
};
/* Extra bits for distance codes */
static const unsigned char cpdext[] = {
0, 0, 0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7, 8, 8, 9, 9, 10, 10,
11, 11, 12, 12, 13, 13
2002-09-25 02:47:48 +00:00
};
/* Tables for deflate from PKZIP's appnote.txt. */
/* Order of the bit length code lengths */
static const unsigned char border[] = {
16, 17, 18, 0, 8, 7, 9, 6, 10, 5, 11, 4, 12, 3, 13, 2, 14, 1, 15
};
static unsigned fill_bitbuffer(STATE_PARAM unsigned bitbuffer, unsigned *current, const unsigned required)
2002-09-25 02:47:48 +00:00
{
while (*current < required) {
if (bytebuffer_offset >= bytebuffer_size) {
/* Leave the first 4 bytes empty so we can always unwind the bitbuffer
* to the front of the bytebuffer, leave 4 bytes free at end of tail
* so we can easily top up buffer in check_trailer_gzip() */
bytebuffer_size = safe_read(gunzip_src_fd, &bytebuffer[4], bytebuffer_max - 8);
if (1 > bytebuffer_size)
//shouldn't we propagate error?
bb_error_msg_and_die("unexpected end of file");
bytebuffer_size += 4;
bytebuffer_offset = 4;
}
2007-01-05 19:46:04 +00:00
bitbuffer |= ((unsigned) bytebuffer[bytebuffer_offset]) << *current;
bytebuffer_offset++;
2002-09-25 02:47:48 +00:00
*current += 8;
}
return bitbuffer;
2002-09-25 02:47:48 +00:00
}
2002-08-22 18:41:20 +00:00
2001-04-11 03:11:33 +00:00
/*
* Free the malloc'ed tables built by huft_build(), which makes a linked
* list of the tables it made, with the links in a dummy first entry of
* each table.
2001-04-11 03:11:33 +00:00
* t: table to free
*/
static void huft_free(huft_t * p)
2001-04-11 03:11:33 +00:00
{
2002-09-25 02:47:48 +00:00
huft_t *q;
2001-04-11 03:11:33 +00:00
/* Go through linked list, freeing from the malloced (t[-1]) address. */
while (p) {
2001-04-11 03:11:33 +00:00
q = (--p)->v.t;
free(p);
2001-04-11 03:11:33 +00:00
p = q;
}
}
/* Given a list of code lengths and a maximum table size, make a set of
* tables to decode that set of codes. Return zero on success, one if
* the given code set is incomplete (the tables are still built in this
* case), two if the input is invalid (all zero length codes or an
* oversubscribed set of lengths), and three if not enough memory.
*
* b: code lengths in bits (all assumed <= BMAX)
* n: number of codes (assumed <= N_MAX)
* s: number of simple-valued codes (0..s-1)
* d: list of base values for non-simple codes
* e: list of extra bits for non-simple codes
* t: result: starting table
* m: maximum lookup bits, returns actual
*/
static int huft_build(unsigned *b, const unsigned n,
2007-01-05 19:46:04 +00:00
const unsigned s, const unsigned short *d,
const unsigned char *e, huft_t ** t, unsigned *m)
2001-04-11 03:11:33 +00:00
{
unsigned a; /* counter for codes of length k */
2001-04-11 03:11:33 +00:00
unsigned c[BMAX + 1]; /* bit length count table */
unsigned eob_len; /* length of end-of-block code (value 256) */
unsigned f; /* i repeats in table every f entries */
int g; /* maximum code length */
int htl; /* table level */
unsigned i; /* counter, current code */
unsigned j; /* counter */
int k; /* number of bits in current code */
unsigned *p; /* pointer into c[], b[], or v[] */
huft_t *q; /* points to current table */
huft_t r; /* table entry for structure assignment */
huft_t *u[BMAX]; /* table stack */
unsigned v[N_MAX]; /* values in order of bit length */
int ws[BMAX+1]; /* bits decoded stack */
int w; /* bits decoded */
2001-04-11 03:11:33 +00:00
unsigned x[BMAX + 1]; /* bit offsets, then code stack */
unsigned *xp; /* pointer into x */
int y; /* number of dummy codes added */
unsigned z; /* number of entries in current table */
/* Length of EOB code, if any */
eob_len = n > 256 ? b[256] : BMAX;
2001-04-11 03:11:33 +00:00
/* Generate counts for each bit length */
memset(c, 0, sizeof(c));
2001-04-11 03:11:33 +00:00
p = b;
i = n;
do {
c[*p]++; /* assume all entries <= BMAX */
p++; /* Can't combine with above line (Solaris bug) */
2001-04-11 03:11:33 +00:00
} while (--i);
if (c[0] == n) { /* null input--all zero length codes */
*t = NULL;
2001-04-11 03:11:33 +00:00
*m = 0;
return 2;
2001-04-11 03:11:33 +00:00
}
/* Find minimum and maximum length, bound *m by those */
for (j = 1; (c[j] == 0) && (j <= BMAX); j++);
k = j; /* minimum code length */
for (i = BMAX; (c[i] == 0) && i; i--);
g = i; /* maximum code length */
*m = (*m < j) ? j : ((*m > i) ? i : *m);
2001-04-11 03:11:33 +00:00
/* Adjust last length count to fill out codes, if needed */
2002-09-25 02:47:48 +00:00
for (y = 1 << j; j < i; j++, y <<= 1) {
y -= c[j];
if (y < 0) {
return 2; /* bad input: more codes than bits */
2002-09-25 02:47:48 +00:00
}
}
y -= c[i];
if (y < 0) {
2001-04-11 03:11:33 +00:00
return 2;
2002-09-25 02:47:48 +00:00
}
2001-04-11 03:11:33 +00:00
c[i] += y;
/* Generate starting offsets into the value table for each length */
x[1] = j = 0;
p = c + 1;
xp = x + 2;
while (--i) { /* note that i == g from above */
j += *p++;
*xp++ = j;
2001-04-11 03:11:33 +00:00
}
/* Make a table of values in order of bit lengths */
p = b;
i = 0;
do {
j = *p++;
if (j != 0) {
2001-04-11 03:11:33 +00:00
v[x[j]++] = i;
2002-09-25 02:47:48 +00:00
}
2001-04-11 03:11:33 +00:00
} while (++i < n);
/* Generate the Huffman codes and for each, make the table entries */
x[0] = i = 0; /* first Huffman code is zero */
p = v; /* grab values in bit order */
htl = -1; /* no tables yet--level -1 */
w = ws[0] = 0; /* bits decoded */
u[0] = NULL; /* just to keep compilers happy */
q = NULL; /* ditto */
z = 0; /* ditto */
2001-04-11 03:11:33 +00:00
/* go through the bit lengths (k already is bits in shortest code) */
for (; k <= g; k++) {
a = c[k];
while (a--) {
/* here i is the Huffman code of length k bits for value *p */
/* make tables up to required level */
while (k > ws[htl + 1]) {
w = ws[++htl];
/* compute minimum size table less than or equal to *m bits */
z = g - w;
z = z > *m ? *m : z; /* upper limit on table size */
j = k - w;
f = 1 << j;
if (f > a + 1) { /* try a k-w bit table */
/* too few codes for k-w bit table */
f -= a + 1; /* deduct codes from patterns left */
2001-04-11 03:11:33 +00:00
xp = c + k;
while (++j < z) { /* try smaller tables up to z bits */
f <<= 1;
if (f <= *++xp) {
break; /* enough codes to use up j bits */
2002-09-25 02:47:48 +00:00
}
f -= *xp; /* else deduct codes from patterns */
2001-04-11 03:11:33 +00:00
}
}
j = (w + j > eob_len && w < eob_len) ? eob_len - w : j; /* make EOB code end at table */
2002-08-22 18:41:20 +00:00
z = 1 << j; /* table entries for j-bit table */
ws[htl+1] = w + j; /* set bits decoded in stack */
2001-04-11 03:11:33 +00:00
/* allocate and link in new table */
q = xzalloc((z + 1) * sizeof(huft_t));
2002-08-22 18:41:20 +00:00
*t = q + 1; /* link to list for huft_free() */
t = &(q->v.t);
u[htl] = ++q; /* table starts after link */
2001-04-11 03:11:33 +00:00
/* connect to last table, if there is one */
if (htl) {
x[htl] = i; /* save pattern for backing up */
r.b = (unsigned char) (w - ws[htl - 1]); /* bits to dump before this table */
r.e = (unsigned char) (16 + j); /* bits in this table */
r.v.t = q; /* pointer to this table */
j = (i & ((1 << w) - 1)) >> ws[htl - 1];
u[htl - 1][j] = r; /* connect to last table */
2001-04-11 03:11:33 +00:00
}
}
/* set up table entry in r */
r.b = (unsigned char) (k - w);
2002-09-25 02:47:48 +00:00
if (p >= v + n) {
r.e = 99; /* out of values--invalid code */
2002-09-25 02:47:48 +00:00
} else if (*p < s) {
r.e = (unsigned char) (*p < 256 ? 16 : 15); /* 256 is EOB code */
r.v.n = (unsigned short) (*p++); /* simple code is just the value */
2001-04-11 03:11:33 +00:00
} else {
r.e = (unsigned char) e[*p - s]; /* non-simple--look up in lists */
2001-04-11 03:11:33 +00:00
r.v.n = d[*p++ - s];
}
/* fill code-like entries with r */
f = 1 << (k - w);
2002-09-25 02:47:48 +00:00
for (j = i >> w; j < z; j += f) {
2001-04-11 03:11:33 +00:00
q[j] = r;
2002-09-25 02:47:48 +00:00
}
2001-04-11 03:11:33 +00:00
/* backwards increment the k-bit code i */
2002-09-25 02:47:48 +00:00
for (j = 1 << (k - 1); i & j; j >>= 1) {
2001-04-11 03:11:33 +00:00
i ^= j;
2002-09-25 02:47:48 +00:00
}
2001-04-11 03:11:33 +00:00
i ^= j;
/* backup over finished tables */
while ((i & ((1 << w) - 1)) != x[htl]) {
w = ws[--htl];
2001-04-11 03:11:33 +00:00
}
}
}
/* return actual size of base table */
*m = ws[1];
2001-04-11 03:11:33 +00:00
/* Return true (1) if we were given an incomplete table */
return y != 0 && g != 1;
}
2001-04-11 03:11:33 +00:00
/*
* inflate (decompress) the codes in a deflated (compressed) block.
* Return an error code or zero if it all goes ok.
*
* tl, td: literal/length and distance decoder tables
* bl, bd: number of bits decoded by tl[] and td[]
*/
/* called once from inflate_block */
/* map formerly local static variables to globals */
#define ml inflate_codes_ml
#define md inflate_codes_md
#define bb inflate_codes_bb
#define k inflate_codes_k
#define w inflate_codes_w
#define tl inflate_codes_tl
#define td inflate_codes_td
#define bl inflate_codes_bl
#define bd inflate_codes_bd
#define nn inflate_codes_nn
#define dd inflate_codes_dd
static void inflate_codes_setup(STATE_PARAM huft_t * my_tl, huft_t * my_td, const unsigned my_bl, const unsigned my_bd)
2001-04-11 03:11:33 +00:00
{
tl = my_tl;
td = my_td;
bl = my_bl;
bd = my_bd;
/* make local copies of globals */
bb = gunzip_bb; /* initialize bit buffer */
k = gunzip_bk;
w = gunzip_outbuf_count; /* initialize gunzip_window position */
/* inflate the coded data */
ml = mask_bits[bl]; /* precompute masks for speed */
md = mask_bits[bd];
}
/* called once from inflate_get_next_window */
static int inflate_codes(STATE_PARAM_ONLY)
{
unsigned e; /* table entry flag/number of extra bits */
huft_t *t; /* pointer to table entry */
if (resume_copy) goto do_copy;
2002-09-25 02:47:48 +00:00
while (1) { /* do until end of block */
bb = fill_bitbuffer(PASS_STATE bb, &k, bl);
t = tl + ((unsigned) bb & ml);
e = t->e;
if (e > 16)
2002-08-22 18:41:20 +00:00
do {
if (e == 99) {
//shouldn't we propagate error?
bb_error_msg_and_die("inflate_codes error 1");
2002-08-22 18:41:20 +00:00
}
bb >>= t->b;
2002-08-22 18:41:20 +00:00
k -= t->b;
e -= 16;
bb = fill_bitbuffer(PASS_STATE bb, &k, e);
t = t->v.t + ((unsigned) bb & mask_bits[e]);
e = t->e;
} while (e > 16);
bb >>= t->b;
2001-04-11 03:11:33 +00:00
k -= t->b;
2002-08-22 18:41:20 +00:00
if (e == 16) { /* then it's a literal */
2002-09-25 02:47:48 +00:00
gunzip_window[w++] = (unsigned char) t->v.n;
if (w == GUNZIP_WSIZE) {
gunzip_outbuf_count = w;
2002-11-20 06:46:46 +00:00
//flush_gunzip_window();
2001-04-11 03:11:33 +00:00
w = 0;
return 1; // We have a block to read
2001-04-11 03:11:33 +00:00
}
2002-08-22 18:41:20 +00:00
} else { /* it's an EOB or a length */
2001-04-11 03:11:33 +00:00
/* exit if end of block */
if (e == 15) {
break;
}
/* get length of block to copy */
bb = fill_bitbuffer(PASS_STATE bb, &k, e);
nn = t->v.n + ((unsigned) bb & mask_bits[e]);
bb >>= e;
2001-04-11 03:11:33 +00:00
k -= e;
/* decode distance of block to copy */
bb = fill_bitbuffer(PASS_STATE bb, &k, bd);
t = td + ((unsigned) bb & md);
e = t->e;
if (e > 16)
2001-04-11 03:11:33 +00:00
do {
if (e == 99)
//shouldn't we propagate error?
bb_error_msg_and_die("inflate_codes error 2");
bb >>= t->b;
2001-04-11 03:11:33 +00:00
k -= t->b;
e -= 16;
bb = fill_bitbuffer(PASS_STATE bb, &k, e);
t = t->v.t + ((unsigned) bb & mask_bits[e]);
e = t->e;
} while (e > 16);
bb >>= t->b;
2001-04-11 03:11:33 +00:00
k -= t->b;
bb = fill_bitbuffer(PASS_STATE bb, &k, e);
dd = w - t->v.n - ((unsigned) bb & mask_bits[e]);
bb >>= e;
2001-04-11 03:11:33 +00:00
k -= e;
/* do the copy */
do_copy:
do {
/* Was: nn -= (e = (e = GUNZIP_WSIZE - ((dd &= GUNZIP_WSIZE - 1) > w ? dd : w)) > nn ? nn : e); */
/* Who wrote THAT?? rewritten as: */
dd &= GUNZIP_WSIZE - 1;
e = GUNZIP_WSIZE - (dd > w ? dd : w);
if (e > nn) e = nn;
nn -= e;
/* copy to new buffer to prevent possible overwrite */
if (w - dd >= e) { /* (this test assumes unsigned comparison) */
memcpy(gunzip_window + w, gunzip_window + dd, e);
2001-04-11 03:11:33 +00:00
w += e;
dd += e;
2002-09-25 02:47:48 +00:00
} else {
/* do it slow to avoid memcpy() overlap */
/* !NOMEMCPY */
2001-04-11 03:11:33 +00:00
do {
gunzip_window[w++] = gunzip_window[dd++];
2001-04-11 03:11:33 +00:00
} while (--e);
2002-09-25 02:47:48 +00:00
}
if (w == GUNZIP_WSIZE) {
gunzip_outbuf_count = w;
resume_copy = (nn != 0);
2002-11-20 06:46:46 +00:00
//flush_gunzip_window();
2001-04-11 03:11:33 +00:00
w = 0;
return 1;
2001-04-11 03:11:33 +00:00
}
} while (nn);
resume_copy = 0;
2001-04-11 03:11:33 +00:00
}
}
/* restore the globals from the locals */
gunzip_outbuf_count = w; /* restore global gunzip_window pointer */
gunzip_bb = bb; /* restore global bit buffer */
2002-09-25 02:47:48 +00:00
gunzip_bk = k;
2001-04-11 03:11:33 +00:00
2002-11-20 06:46:46 +00:00
/* normally just after call to inflate_codes, but save code by putting it here */
/* free the decoding tables, return */
huft_free(tl);
huft_free(td);
2001-04-11 03:11:33 +00:00
/* done */
return 0;
}
#undef ml
#undef md
#undef bb
#undef k
#undef w
#undef tl
#undef td
#undef bl
#undef bd
#undef nn
#undef dd
/* called once from inflate_block */
static void inflate_stored_setup(STATE_PARAM int my_n, int my_b, int my_k)
{
inflate_stored_n = my_n;
inflate_stored_b = my_b;
inflate_stored_k = my_k;
/* initialize gunzip_window position */
inflate_stored_w = gunzip_outbuf_count;
}
/* called once from inflate_get_next_window */
static int inflate_stored(STATE_PARAM_ONLY)
2002-11-20 06:46:46 +00:00
{
/* read and output the compressed data */
while (inflate_stored_n--) {
inflate_stored_b = fill_bitbuffer(PASS_STATE inflate_stored_b, &inflate_stored_k, 8);
gunzip_window[inflate_stored_w++] = (unsigned char) inflate_stored_b;
if (inflate_stored_w == GUNZIP_WSIZE) {
gunzip_outbuf_count = inflate_stored_w;
2002-11-20 06:46:46 +00:00
//flush_gunzip_window();
inflate_stored_w = 0;
inflate_stored_b >>= 8;
inflate_stored_k -= 8;
return 1; // We have a block
2002-11-20 06:46:46 +00:00
}
inflate_stored_b >>= 8;
inflate_stored_k -= 8;
2002-11-20 06:46:46 +00:00
}
/* restore the globals from the locals */
gunzip_outbuf_count = inflate_stored_w; /* restore global gunzip_window pointer */
gunzip_bb = inflate_stored_b; /* restore global bit buffer */
gunzip_bk = inflate_stored_k;
2002-11-20 06:46:46 +00:00
return 0; // Finished
}
2001-04-11 03:11:33 +00:00
/*
* decompress an inflated block
* e: last block flag
*
* GLOBAL VARIABLES: bb, kk,
*/
/* Return values: -1 = inflate_stored, -2 = inflate_codes */
/* One callsite in inflate_get_next_window */
static int inflate_block(STATE_PARAM smallint *e)
2001-04-11 03:11:33 +00:00
{
unsigned t; /* block type */
2007-01-05 19:46:04 +00:00
unsigned b; /* bit buffer */
unsigned k; /* number of bits in bit buffer */
2001-04-11 03:11:33 +00:00
/* make local bit buffer */
2002-09-25 02:47:48 +00:00
b = gunzip_bb;
k = gunzip_bk;
2001-04-11 03:11:33 +00:00
/* read in last block bit */
b = fill_bitbuffer(PASS_STATE b, &k, 1);
*e = b & 1;
2001-04-11 03:11:33 +00:00
b >>= 1;
k -= 1;
/* read in block type */
b = fill_bitbuffer(PASS_STATE b, &k, 2);
2001-04-11 03:11:33 +00:00
t = (unsigned) b & 3;
b >>= 2;
k -= 2;
/* restore the global bit buffer */
2002-09-25 02:47:48 +00:00
gunzip_bb = b;
gunzip_bk = k;
2001-04-11 03:11:33 +00:00
/* inflate that block type */
switch (t) {
2002-08-22 18:41:20 +00:00
case 0: /* Inflate stored */
{
2007-01-05 19:46:04 +00:00
unsigned n; /* number of bytes in block */
unsigned b_stored; /* bit buffer */
unsigned k_stored; /* number of bits in bit buffer */
2002-08-22 18:41:20 +00:00
/* make local copies of globals */
2002-09-25 02:47:48 +00:00
b_stored = gunzip_bb; /* initialize bit buffer */
k_stored = gunzip_bk;
2002-08-22 18:41:20 +00:00
/* go to byte boundary */
n = k_stored & 7;
b_stored >>= n;
k_stored -= n;
/* get the length and its complement */
b_stored = fill_bitbuffer(PASS_STATE b_stored, &k_stored, 16);
2002-08-22 18:41:20 +00:00
n = ((unsigned) b_stored & 0xffff);
b_stored >>= 16;
k_stored -= 16;
2002-09-25 02:47:48 +00:00
b_stored = fill_bitbuffer(PASS_STATE b_stored, &k_stored, 16);
2002-08-22 18:41:20 +00:00
if (n != (unsigned) ((~b_stored) & 0xffff)) {
return 1; /* error in compressed data */
}
b_stored >>= 16;
k_stored -= 16;
inflate_stored_setup(PASS_STATE n, b_stored, k_stored); // Setup inflate_stored
2002-11-20 06:46:46 +00:00
return -1;
2002-08-22 18:41:20 +00:00
}
case 1:
/* Inflate fixed
* decompress an inflated type 1 (fixed Huffman codes) block. We should
* either replace this with a custom decoder, or at least precompute the
* Huffman tables. */
2002-08-22 18:41:20 +00:00
{
int i; /* temporary variable */
huft_t *tl; /* literal/length code table */
huft_t *td; /* distance code table */
2007-01-05 19:46:04 +00:00
unsigned bl; /* lookup bits for tl */
unsigned bd; /* lookup bits for td */
unsigned l[288]; /* length list for huft_build */
2002-08-22 18:41:20 +00:00
/* set up literal table */
for (i = 0; i < 144; i++) {
l[i] = 8;
}
for (; i < 256; i++) {
l[i] = 9;
}
for (; i < 280; i++) {
l[i] = 7;
}
for (; i < 288; i++) { /* make a complete, but wrong code set */
l[i] = 8;
}
bl = 7;
i = huft_build(l, 288, 257, cplens, cplext, &tl, &bl);
if (i != 0) {
2002-08-22 18:41:20 +00:00
return i;
2001-04-11 03:11:33 +00:00
}
2002-08-22 18:41:20 +00:00
/* set up distance table */
for (i = 0; i < 30; i++) { /* make an incomplete code set */
l[i] = 5;
}
bd = 5;
i = huft_build(l, 30, 0, cpdist, cpdext, &td, &bd);
if (i > 1) {
2002-08-22 18:41:20 +00:00
huft_free(tl);
return i;
}
2001-04-11 03:11:33 +00:00
2002-08-22 18:41:20 +00:00
/* decompress until an end-of-block code */
inflate_codes_setup(PASS_STATE tl, td, bl, bd); // Setup inflate_codes
2002-11-20 06:46:46 +00:00
/* huft_free code moved into inflate_codes */
2002-11-20 06:46:46 +00:00
return -2;
2002-08-22 18:41:20 +00:00
}
case 2: /* Inflate dynamic */
{
const int dbits = 6; /* bits in base distance lookup table */
const int lbits = 9; /* bits in base literal/length lookup table */
huft_t *tl; /* literal/length code table */
huft_t *td; /* distance code table */
2007-01-05 19:46:04 +00:00
unsigned i; /* temporary variables */
unsigned j;
unsigned l; /* last length */
unsigned m; /* mask for bit lengths table */
unsigned n; /* number of lengths to get */
unsigned bl; /* lookup bits for tl */
unsigned bd; /* lookup bits for td */
unsigned nb; /* number of bit length codes */
unsigned nl; /* number of literal/length codes */
unsigned nd; /* number of distance codes */
unsigned ll[286 + 30]; /* literal/length and distance code lengths */
unsigned b_dynamic; /* bit buffer */
unsigned k_dynamic; /* number of bits in bit buffer */
2002-08-22 18:41:20 +00:00
/* make local bit buffer */
2002-09-25 02:47:48 +00:00
b_dynamic = gunzip_bb;
k_dynamic = gunzip_bk;
2002-08-22 18:41:20 +00:00
/* read in table lengths */
b_dynamic = fill_bitbuffer(PASS_STATE b_dynamic, &k_dynamic, 5);
2007-01-05 19:46:04 +00:00
nl = 257 + ((unsigned) b_dynamic & 0x1f); /* number of literal/length codes */
2002-09-25 02:47:48 +00:00
2002-08-22 18:41:20 +00:00
b_dynamic >>= 5;
k_dynamic -= 5;
b_dynamic = fill_bitbuffer(PASS_STATE b_dynamic, &k_dynamic, 5);
2007-01-05 19:46:04 +00:00
nd = 1 + ((unsigned) b_dynamic & 0x1f); /* number of distance codes */
2002-09-25 02:47:48 +00:00
2002-08-22 18:41:20 +00:00
b_dynamic >>= 5;
k_dynamic -= 5;
b_dynamic = fill_bitbuffer(PASS_STATE b_dynamic, &k_dynamic, 4);
2007-01-05 19:46:04 +00:00
nb = 4 + ((unsigned) b_dynamic & 0xf); /* number of bit length codes */
2002-09-25 02:47:48 +00:00
2002-08-22 18:41:20 +00:00
b_dynamic >>= 4;
k_dynamic -= 4;
if (nl > 286 || nd > 30) {
return 1; /* bad lengths */
2001-04-11 03:11:33 +00:00
}
2002-08-22 18:41:20 +00:00
/* read in bit-length-code lengths */
for (j = 0; j < nb; j++) {
b_dynamic = fill_bitbuffer(PASS_STATE b_dynamic, &k_dynamic, 3);
2007-01-05 19:46:04 +00:00
ll[border[j]] = (unsigned) b_dynamic & 7;
2002-08-22 18:41:20 +00:00
b_dynamic >>= 3;
k_dynamic -= 3;
}
for (; j < 19; j++) {
ll[border[j]] = 0;
}
/* build decoding table for trees--single level, 7 bit lookup */
bl = 7;
2002-09-25 02:47:48 +00:00
i = huft_build(ll, 19, 19, NULL, NULL, &tl, &bl);
if (i != 0) {
2002-08-22 18:41:20 +00:00
if (i == 1) {
huft_free(tl);
2001-04-11 03:11:33 +00:00
}
2002-08-22 18:41:20 +00:00
return i; /* incomplete code set */
}
/* read in literal and distance code lengths */
n = nl + nd;
m = mask_bits[bl];
i = l = 0;
2007-01-05 19:46:04 +00:00
while ((unsigned) i < n) {
b_dynamic = fill_bitbuffer(PASS_STATE b_dynamic, &k_dynamic, (unsigned)bl);
2007-01-05 19:46:04 +00:00
j = (td = tl + ((unsigned) b_dynamic & m))->b;
2002-08-22 18:41:20 +00:00
b_dynamic >>= j;
k_dynamic -= j;
j = td->v.n;
if (j < 16) { /* length of code in bits (0..15) */
ll[i++] = l = j; /* save last length in l */
} else if (j == 16) { /* repeat last length 3 to 6 times */
b_dynamic = fill_bitbuffer(PASS_STATE b_dynamic, &k_dynamic, 2);
2007-01-05 19:46:04 +00:00
j = 3 + ((unsigned) b_dynamic & 3);
2002-08-22 18:41:20 +00:00
b_dynamic >>= 2;
k_dynamic -= 2;
2007-01-05 19:46:04 +00:00
if ((unsigned) i + j > n) {
2002-08-22 18:41:20 +00:00
return 1;
}
while (j--) {
ll[i++] = l;
}
} else if (j == 17) { /* 3 to 10 zero length codes */
b_dynamic = fill_bitbuffer(PASS_STATE b_dynamic, &k_dynamic, 3);
2007-01-05 19:46:04 +00:00
j = 3 + ((unsigned) b_dynamic & 7);
2001-04-11 03:11:33 +00:00
b_dynamic >>= 3;
k_dynamic -= 3;
2007-01-05 19:46:04 +00:00
if ((unsigned) i + j > n) {
2002-08-22 18:41:20 +00:00
return 1;
2001-04-11 03:11:33 +00:00
}
2002-08-22 18:41:20 +00:00
while (j--) {
ll[i++] = 0;
}
l = 0;
} else { /* j == 18: 11 to 138 zero length codes */
b_dynamic = fill_bitbuffer(PASS_STATE b_dynamic, &k_dynamic, 7);
2007-01-05 19:46:04 +00:00
j = 11 + ((unsigned) b_dynamic & 0x7f);
2002-08-22 18:41:20 +00:00
b_dynamic >>= 7;
k_dynamic -= 7;
2007-01-05 19:46:04 +00:00
if ((unsigned) i + j > n) {
2002-08-22 18:41:20 +00:00
return 1;
2001-04-11 03:11:33 +00:00
}
2002-08-22 18:41:20 +00:00
while (j--) {
ll[i++] = 0;
2001-04-11 03:11:33 +00:00
}
2002-08-22 18:41:20 +00:00
l = 0;
2001-04-11 03:11:33 +00:00
}
2002-08-22 18:41:20 +00:00
}
2001-04-11 03:11:33 +00:00
2002-08-22 18:41:20 +00:00
/* free decoding table for trees */
huft_free(tl);
2001-04-11 03:11:33 +00:00
2002-08-22 18:41:20 +00:00
/* restore the global bit buffer */
2002-09-25 02:47:48 +00:00
gunzip_bb = b_dynamic;
gunzip_bk = k_dynamic;
2001-04-11 03:11:33 +00:00
2002-08-22 18:41:20 +00:00
/* build the decoding tables for literal/length and distance codes */
bl = lbits;
2002-09-25 02:47:48 +00:00
i = huft_build(ll, nl, 257, cplens, cplext, &tl, &bl);
if (i != 0) {
2002-08-22 18:41:20 +00:00
if (i == 1) {
//shouldn't we propagate error?
bb_error_msg_and_die("incomplete literal tree");
/* huft_free(tl); */
2001-04-11 03:11:33 +00:00
}
2002-08-22 18:41:20 +00:00
return i; /* incomplete code set */
}
2002-09-25 02:47:48 +00:00
2002-08-22 18:41:20 +00:00
bd = dbits;
i = huft_build(ll + nl, nd, 0, cpdist, cpdext, &td, &bd);
if (i != 0) {
2002-08-22 18:41:20 +00:00
if (i == 1) {
//shouldn't we propagate error?
2003-03-19 09:13:01 +00:00
bb_error_msg_and_die("incomplete distance tree");
/* huft_free(td); */
2002-08-22 18:41:20 +00:00
}
2001-04-11 03:11:33 +00:00
huft_free(tl);
2002-08-22 18:41:20 +00:00
return i; /* incomplete code set */
2001-04-11 03:11:33 +00:00
}
2002-08-22 18:41:20 +00:00
/* decompress until an end-of-block code */
inflate_codes_setup(PASS_STATE tl, td, bl, bd); // Setup inflate_codes
2002-08-22 18:41:20 +00:00
2002-11-20 06:46:46 +00:00
/* huft_free code moved into inflate_codes */
2002-11-20 06:46:46 +00:00
return -2;
2002-08-22 18:41:20 +00:00
}
2001-04-11 03:11:33 +00:00
default:
/* bad block type */
//shouldn't we propagate error?
bb_error_msg_and_die("bad block type %d", t);
}
}
/* Two callsites, both in inflate_get_next_window */
static void calculate_gunzip_crc(STATE_PARAM_ONLY)
{
int n;
for (n = 0; n < gunzip_outbuf_count; n++) {
gunzip_crc = gunzip_crc_table[((int) gunzip_crc ^ (gunzip_window[n])) & 0xff] ^ (gunzip_crc >> 8);
}
gunzip_bytes_out += gunzip_outbuf_count;
}
/* One callsite in inflate_unzip_internal */
static int inflate_get_next_window(STATE_PARAM_ONLY)
{
gunzip_outbuf_count = 0;
while (1) {
int ret;
if (need_another_block) {
if (end_reached) {
calculate_gunzip_crc(PASS_STATE_ONLY);
end_reached = 0;
need_another_block = 1;
return 0; /* Last block */
}
method = inflate_block(PASS_STATE &end_reached);
need_another_block = 0;
}
switch (method) {
case -1:
ret = inflate_stored(PASS_STATE_ONLY);
break;
case -2:
ret = inflate_codes(PASS_STATE_ONLY);
break;
default:
//shouldn't we propagate error?
bb_error_msg_and_die("inflate error %d", method);
}
if (ret == 1) {
calculate_gunzip_crc(PASS_STATE_ONLY);
return 1; // More data left
}
need_another_block = 1; // End of that block
2001-04-11 03:11:33 +00:00
}
/* Doesnt get here */
2001-04-11 03:11:33 +00:00
}
/* Called from unpack_gz_stream() and inflate_unzip() */
/* NB: bytebuffer is allocated here but freeing it is left to the caller! */
static USE_DESKTOP(long long) int
inflate_unzip_internal(STATE_PARAM int in, int out)
{
USE_DESKTOP(long long) int n = 0;
ssize_t nwrote;
2001-04-11 03:11:33 +00:00
/* Allocate all global buffers (for DYN_ALLOC option) */
gunzip_window = xmalloc(GUNZIP_WSIZE);
2002-09-25 02:47:48 +00:00
gunzip_outbuf_count = 0;
gunzip_bytes_out = 0;
gunzip_src_fd = in;
2001-04-11 03:11:33 +00:00
2002-09-25 02:47:48 +00:00
/* initialize gunzip_window, bit buffer */
gunzip_bk = 0;
gunzip_bb = 0;
2001-04-11 03:11:33 +00:00
2002-09-25 02:47:48 +00:00
/* Create the crc table */
gunzip_crc_table = crc32_filltable(NULL, 0);
gunzip_crc = ~0;
2006-09-17 16:28:10 +00:00
/* Allocate space for buffer */
bytebuffer = xmalloc(bytebuffer_max);
while (1) {
int r = inflate_get_next_window(PASS_STATE_ONLY);
nwrote = full_write(out, gunzip_window, gunzip_outbuf_count);
if (nwrote != gunzip_outbuf_count) {
bb_perror_msg("write");
n = -1;
goto ret;
}
USE_DESKTOP(n += nwrote;)
if (r == 0) break;
}
2002-09-25 02:47:48 +00:00
/* Store unused bytes in a global buffer so calling applets can access it */
if (gunzip_bk >= 8) {
/* Undo too much lookahead. The next read will be byte aligned
* so we can discard unused bits in the last meaningful byte. */
bytebuffer_offset--;
bytebuffer[bytebuffer_offset] = gunzip_bb & 0xff;
2002-09-25 02:47:48 +00:00
gunzip_bb >>= 8;
gunzip_bk -= 8;
2001-04-11 03:11:33 +00:00
}
ret:
/* Cleanup */
free(gunzip_window);
free(gunzip_crc_table);
return n;
2001-04-11 03:11:33 +00:00
}
USE_DESKTOP(long long) int
inflate_unzip(inflate_unzip_result *res, unsigned bufsize, int in, int out)
{
USE_DESKTOP(long long) int n;
DECLARE_STATE;
ALLOC_STATE;
bytebuffer_max = bufsize + 8;
bytebuffer_offset = 4;
n = inflate_unzip_internal(PASS_STATE in, out);
res->crc = gunzip_crc;
res->bytes_out = gunzip_bytes_out;
free(bytebuffer);
DEALLOC_STATE;
return n;
}
USE_DESKTOP(long long) int
unpack_gz_stream(int in, int out)
{
uint32_t stored_crc = 0;
2007-01-05 19:46:04 +00:00
unsigned count;
USE_DESKTOP(long long) int n;
DECLARE_STATE;
ALLOC_STATE;
bytebuffer_max = 0x8000;
n = inflate_unzip_internal(PASS_STATE in, out);
if (n < 0) goto ret;
/* top up the input buffer with the rest of the trailer */
count = bytebuffer_size - bytebuffer_offset;
if (count < 8) {
xread(in, &bytebuffer[bytebuffer_size], 8 - count);
//shouldn't we propagate error?
bytebuffer_size += 8 - count;
}
for (count = 0; count != 4; count++) {
stored_crc |= (bytebuffer[bytebuffer_offset] << (count * 8));
bytebuffer_offset++;
}
/* Validate decompression - crc */
if (stored_crc != (~gunzip_crc)) {
bb_error_msg("crc error");
n = -1;
goto ret;
}
/* Validate decompression - size */
if (gunzip_bytes_out !=
(bytebuffer[bytebuffer_offset] | (bytebuffer[bytebuffer_offset+1] << 8) |
(bytebuffer[bytebuffer_offset+2] << 16) | (bytebuffer[bytebuffer_offset+3] << 24))
) {
bb_error_msg("incorrect length");
n = -1;
}
ret:
free(bytebuffer);
DEALLOC_STATE;
return n;
}