decompress_unzip.c

来自「busybox-1.2.0,标准的Linux工具集[最新].对linux下软件的」· C语言 代码 · 共 923 行 · 第 1/2 页

C
923
字号
/* vi: set sw=4 ts=4: *//* * gunzip implementation for busybox * * Based on GNU gzip v1.2.4 Copyright (C) 1992-1993 Jean-loup Gailly. * * Originally adjusted for busybox by Sven Rudolph <sr1@inf.tu-dresden.de> * based on gzip sources * * Adjusted further by Erik Andersen <andersen@codepoet.org> to support * files as well as stdin/stdout, and to generally behave itself wrt * command line handling. * * General cleanup to better adhere to the style guide and make use of standard * busybox functions by Glenn McGrath <bug1@iinet.net.au> * * read_gz interface + associated hacking by Laurence Anderson * * Fixed huft_build() so decoding end-of-block code does not grab more bits * than necessary (this is required by unzip applet), added inflate_cleanup() * to free leaked bytebuffer memory (used in unzip.c), and some minor style * guide cleanups by Ed Clark * * gzip (GNU zip) -- compress files with zip algorithm and 'compress' interface * Copyright (C) 1992-1993 Jean-loup Gailly * The unzip code was written and put in the public domain by Mark Adler. * Portions of the lzw code are derived from the public domain 'compress' * written by Spencer Thomas, Joe Orost, James Woods, Jim McKie, Steve Davies, * Ken Turkowski, Dave Mack and Peter Jannesen. * * See the file algorithm.doc for the compression algorithms and file formats. *  * Licensed under GPLv2 or later, see file LICENSE in this tarball for details. */#include "libbb.h"#include <sys/wait.h>#include <signal.h>#include "unarchive.h"typedef struct huft_s {	unsigned char e;	/* number of extra bits or operation */	unsigned char b;	/* number of bits in this code or subcode */	union {		unsigned short n;	/* literal, length base, or distance base */		struct huft_s *t;	/* pointer to next level of table */	} v;} huft_t;static int gunzip_src_fd;unsigned int gunzip_bytes_out;	/* number of output bytes */static unsigned int gunzip_outbuf_count;	/* bytes in output buffer *//* gunzip_window size--must be a power of two, and *  at least 32K for zip's deflate method */enum { gunzip_wsize = 0x8000 };static unsigned char *gunzip_window;static uint32_t *gunzip_crc_table;uint32_t gunzip_crc;/* If BMAX needs to be larger than 16, then h and x[] should be ulg. */#define BMAX 16	/* maximum bit length of any code (16 for explode) */#define N_MAX 288	/* maximum number of codes in any set *//* bitbuffer */static unsigned int gunzip_bb;	/* bit buffer */static unsigned char gunzip_bk;	/* bits in bit buffer *//* These control the size of the bytebuffer */static unsigned int bytebuffer_max = 0x8000;static unsigned char *bytebuffer = NULL;static unsigned int bytebuffer_offset = 0;static unsigned int bytebuffer_size = 0;static const unsigned short mask_bits[] = {	0x0000, 0x0001, 0x0003, 0x0007, 0x000f, 0x001f, 0x003f, 0x007f, 0x00ff,	0x01ff, 0x03ff, 0x07ff, 0x0fff, 0x1fff, 0x3fff, 0x7fff, 0xffff};/* Copy lengths for literal codes 257..285 */static const unsigned short cplens[] = {	3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 15, 17, 19, 23, 27, 31, 35, 43, 51, 59,	67, 83, 99, 115, 131, 163, 195, 227, 258, 0, 0};/* note: see note #13 above about the 258 in this list. *//* Extra bits for literal codes 257..285 */static const unsigned char cplext[] = {	0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3, 4, 4, 4, 4, 5,	5, 5, 5, 0, 99, 99};						/* 99==invalid *//* Copy offsets for distance codes 0..29 */static const unsigned short cpdist[] = {	1, 2, 3, 4, 5, 7, 9, 13, 17, 25, 33, 49, 65, 97, 129, 193, 257, 385, 513,	769, 1025, 1537, 2049, 3073, 4097, 6145, 8193, 12289, 16385, 24577};/* Extra bits for distance codes */static const unsigned char cpdext[] = {	0, 0, 0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7, 8, 8, 9, 9, 10, 10,	11, 11, 12, 12, 13, 13};/* Tables for deflate from PKZIP's appnote.txt. *//* Order of the bit length code lengths */static const unsigned char border[] = {	16, 17, 18, 0, 8, 7, 9, 6, 10, 5, 11, 4, 12, 3, 13, 2, 14, 1, 15};static unsigned int fill_bitbuffer(unsigned int bitbuffer, unsigned int *current, const unsigned int required){	while (*current < required) {		if (bytebuffer_offset >= bytebuffer_size) {			/* Leave the first 4 bytes empty so we can always unwind the bitbuffer			 * to the front of the bytebuffer, leave 4 bytes free at end of tail			 * so we can easily top up buffer in check_trailer_gzip() */			if (!(bytebuffer_size = bb_xread(gunzip_src_fd, &bytebuffer[4], bytebuffer_max - 8))) {				bb_error_msg_and_die("unexpected end of file");			}			bytebuffer_size += 4;			bytebuffer_offset = 4;		}		bitbuffer |= ((unsigned int) bytebuffer[bytebuffer_offset]) << *current;		bytebuffer_offset++;		*current += 8;	}	return(bitbuffer);}/* * Free the malloc'ed tables built by huft_build(), which makes a linked * list of the tables it made, with the links in a dummy first entry of * each table. * t: table to free */static int huft_free(huft_t * t){	huft_t *p;	huft_t *q;	/* Go through linked list, freeing from the malloced (t[-1]) address. */	p = t;	while (p != (huft_t *) NULL) {		q = (--p)->v.t;		free((char *) p);		p = q;	}	return 0;}/* Given a list of code lengths and a maximum table size, make a set of * tables to decode that set of codes.  Return zero on success, one if * the given code set is incomplete (the tables are still built in this * case), two if the input is invalid (all zero length codes or an * oversubscribed set of lengths), and three if not enough memory. * * b:	code lengths in bits (all assumed <= BMAX) * n:	number of codes (assumed <= N_MAX) * s:	number of simple-valued codes (0..s-1) * d:	list of base values for non-simple codes * e:	list of extra bits for non-simple codes * t:	result: starting table * m:	maximum lookup bits, returns actual */staticint huft_build(unsigned int *b, const unsigned int n,			   const unsigned int s, const unsigned short *d,			   const unsigned char *e, huft_t ** t, unsigned int *m){	unsigned a;				/* counter for codes of length k */	unsigned c[BMAX + 1];	/* bit length count table */	unsigned eob_len;		/* length of end-of-block code (value 256) */	unsigned f;				/* i repeats in table every f entries */	int g;					/* maximum code length */	int htl;				/* table level */	unsigned i;				/* counter, current code */	unsigned j;				/* counter */	int k;					/* number of bits in current code */	unsigned *p;			/* pointer into c[], b[], or v[] */	huft_t *q;				/* points to current table */	huft_t r;				/* table entry for structure assignment */	huft_t *u[BMAX];		/* table stack */	unsigned v[N_MAX];		/* values in order of bit length */	int ws[BMAX+1];			/* bits decoded stack */	int w;					/* bits decoded */	unsigned x[BMAX + 1];	/* bit offsets, then code stack */	unsigned *xp;			/* pointer into x */	int y;					/* number of dummy codes added */	unsigned z;				/* number of entries in current table */	/* Length of EOB code, if any */	eob_len = n > 256 ? b[256] : BMAX;	/* Generate counts for each bit length */	memset((void *)c, 0, sizeof(c));	p = b;	i = n;	do {		c[*p]++; /* assume all entries <= BMAX */		p++; /* Can't combine with above line (Solaris bug) */	} while (--i);	if (c[0] == n) { /* null input--all zero length codes */		*t = (huft_t *) NULL;		*m = 0;		return 2;	}	/* Find minimum and maximum length, bound *m by those */	for (j = 1; (c[j] == 0) && (j <= BMAX); j++);	k = j; /* minimum code length */	for (i = BMAX; (c[i] == 0) && i; i--);	g = i; /* maximum code length */	*m = (*m < j) ? j : ((*m > i) ? i : *m);	/* Adjust last length count to fill out codes, if needed */	for (y = 1 << j; j < i; j++, y <<= 1) {		if ((y -= c[j]) < 0) {			return 2; /* bad input: more codes than bits */		}	}	if ((y -= c[i]) < 0) {		return 2;	}	c[i] += y;	/* Generate starting offsets into the value table for each length */	x[1] = j = 0;	p = c + 1;	xp = x + 2;	while (--i) { /* note that i == g from above */		*xp++ = (j += *p++);	}	/* Make a table of values in order of bit lengths */	p = b;	i = 0;	do {		if ((j = *p++) != 0) {			v[x[j]++] = i;		}	} while (++i < n);	/* Generate the Huffman codes and for each, make the table entries */	x[0] = i = 0;			/* first Huffman code is zero */	p = v;					/* grab values in bit order */	htl = -1;				/* no tables yet--level -1 */	w = ws[0] = 0;			/* bits decoded */	u[0] = (huft_t *) NULL;	/* just to keep compilers happy */	q = (huft_t *) NULL;	/* ditto */	z = 0;					/* ditto */	/* go through the bit lengths (k already is bits in shortest code) */	for (; k <= g; k++) {		a = c[k];		while (a--) {			/* here i is the Huffman code of length k bits for value *p */			/* make tables up to required level */			while (k > ws[htl + 1]) {				w = ws[++htl];				/* compute minimum size table less than or equal to *m bits */				z = (z = g - w) > *m ? *m : z; /* upper limit on table size */				if ((f = 1 << (j = k - w)) > a + 1) { /* try a k-w bit table */					/* too few codes for k-w bit table */					f -= a + 1; /* deduct codes from patterns left */					xp = c + k;					while (++j < z) { /* try smaller tables up to z bits */						if ((f <<= 1) <= *++xp) {							break; /* enough codes to use up j bits */						}						f -= *xp; /* else deduct codes from patterns */					}				}				j = (w + j > eob_len && w < eob_len) ? eob_len - w : j;	/* make EOB code end at table */				z = 1 << j;	/* table entries for j-bit table */				ws[htl+1] = w + j;	/* set bits decoded in stack */				/* allocate and link in new table */				q = (huft_t *) xzalloc((z + 1) * sizeof(huft_t));				*t = q + 1;	/* link to list for huft_free() */				t = &(q->v.t);				u[htl] = ++q;	/* table starts after link */				/* connect to last table, if there is one */				if (htl) {					x[htl] = i; /* save pattern for backing up */					r.b = (unsigned char) (w - ws[htl - 1]); /* bits to dump before this table */					r.e = (unsigned char) (16 + j); /* bits in this table */					r.v.t = q; /* pointer to this table */					j = (i & ((1 << w) - 1)) >> ws[htl - 1];					u[htl - 1][j] = r; /* connect to last table */				}			}			/* set up table entry in r */			r.b = (unsigned char) (k - w);			if (p >= v + n) {				r.e = 99; /* out of values--invalid code */			} else if (*p < s) {				r.e = (unsigned char) (*p < 256 ? 16 : 15);	/* 256 is EOB code */				r.v.n = (unsigned short) (*p++); /* simple code is just the value */			} else {				r.e = (unsigned char) e[*p - s]; /* non-simple--look up in lists */				r.v.n = d[*p++ - s];			}			/* fill code-like entries with r */			f = 1 << (k - w);			for (j = i >> w; j < z; j += f) {				q[j] = r;			}			/* backwards increment the k-bit code i */			for (j = 1 << (k - 1); i & j; j >>= 1) {				i ^= j;			}			i ^= j;			/* backup over finished tables */			while ((i & ((1 << w) - 1)) != x[htl]) {				w = ws[--htl];			}		}	}	/* return actual size of base table */	*m = ws[1];	/* Return true (1) if we were given an incomplete table */	return y != 0 && g != 1;}/* * inflate (decompress) the codes in a deflated (compressed) block. * Return an error code or zero if it all goes ok. * * tl, td: literal/length and distance decoder tables * bl, bd: number of bits decoded by tl[] and td[] */static int inflate_codes(huft_t * my_tl, huft_t * my_td, const unsigned int my_bl, const unsigned int my_bd, int setup){	static unsigned int e;	/* table entry flag/number of extra bits */	static unsigned int n, d;	/* length and index for copy */	static unsigned int w;	/* current gunzip_window position */	static huft_t *t;			/* pointer to table entry */	static unsigned int ml, md;	/* masks for bl and bd bits */	static unsigned int b;	/* bit buffer */	static unsigned int k;			/* number of bits in bit buffer */	static huft_t *tl, *td;	static unsigned int bl, bd;	static int resumeCopy = 0;	if (setup) { // 1st time we are called, copy in variables		tl = my_tl;		td = my_td;		bl = my_bl;		bd = my_bd;		/* make local copies of globals */		b = gunzip_bb;				/* initialize bit buffer */		k = gunzip_bk;		w = gunzip_outbuf_count;			/* initialize gunzip_window position */		/* inflate the coded data */		ml = mask_bits[bl];	/* precompute masks for speed */		md = mask_bits[bd];		return 0; // Don't actually do anything the first time	}	if (resumeCopy) goto do_copy;	while (1) {			/* do until end of block */		b = fill_bitbuffer(b, &k, bl);		if ((e = (t = tl + ((unsigned) b & ml))->e) > 16)			do {				if (e == 99) {					bb_error_msg_and_die("inflate_codes error 1");				}				b >>= t->b;				k -= t->b;				e -= 16;				b = fill_bitbuffer(b, &k, e);			} while ((e =					  (t = t->v.t + ((unsigned) b & mask_bits[e]))->e) > 16);		b >>= t->b;		k -= t->b;		if (e == 16) {	/* then it's a literal */			gunzip_window[w++] = (unsigned char) t->v.n;			if (w == gunzip_wsize) {				gunzip_outbuf_count = (w);				//flush_gunzip_window();				w = 0;				return 1; // We have a block to read			}		} else {		/* it's an EOB or a length */			/* exit if end of block */			if (e == 15) {				break;			}			/* get length of block to copy */			b = fill_bitbuffer(b, &k, e);			n = t->v.n + ((unsigned) b & mask_bits[e]);			b >>= e;			k -= e;			/* decode distance of block to copy */			b = fill_bitbuffer(b, &k, bd);			if ((e = (t = td + ((unsigned) b & md))->e) > 16)				do {					if (e == 99)						bb_error_msg_and_die("inflate_codes error 2");					b >>= t->b;					k -= t->b;					e -= 16;					b = fill_bitbuffer(b, &k, e);				} while ((e =						  (t =						   t->v.t + ((unsigned) b & mask_bits[e]))->e) > 16);			b >>= t->b;			k -= t->b;			b = fill_bitbuffer(b, &k, e);			d = w - t->v.n - ((unsigned) b & mask_bits[e]);			b >>= e;			k -= e;			/* do the copy */do_copy:		do {				n -= (e =					  (e =					   gunzip_wsize - ((d &= gunzip_wsize - 1) > w ? d : w)) > n ? n : e);			   /* copy to new buffer to prevent possible overwrite */				if (w - d >= e) {	/* (this test assumes unsigned comparison) */					memcpy(gunzip_window + w, gunzip_window + d, e);					w += e;					d += e;				} else {				   /* do it slow to avoid memcpy() overlap */				   /* !NOMEMCPY */					do {						gunzip_window[w++] = gunzip_window[d++];					} while (--e);				}				if (w == gunzip_wsize) {					gunzip_outbuf_count = (w);					if (n) resumeCopy = 1;					else resumeCopy = 0;					//flush_gunzip_window();					w = 0;					return 1;				}			} while (n);			resumeCopy = 0;		}	}	/* restore the globals from the locals */	gunzip_outbuf_count = w;			/* restore global gunzip_window pointer */	gunzip_bb = b;				/* restore global bit buffer */	gunzip_bk = k;

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?