|  | // SPDX-License-Identifier: GPL-2.0-or-later | 
|  | /* | 
|  | * lzx_decompress.c - A decompressor for the LZX compression format, which can | 
|  | * be used in "System Compressed" files.  This is based on the code from wimlib. | 
|  | * This code only supports a window size (dictionary size) of 32768 bytes, since | 
|  | * this is the only size used in System Compression. | 
|  | * | 
|  | * Copyright (C) 2015 Eric Biggers | 
|  | */ | 
|  |  | 
|  | #include "decompress_common.h" | 
|  | #include "lib.h" | 
|  |  | 
|  | /* Number of literal byte values  */ | 
|  | #define LZX_NUM_CHARS			256 | 
|  |  | 
|  | /* The smallest and largest allowed match lengths  */ | 
|  | #define LZX_MIN_MATCH_LEN		2 | 
|  | #define LZX_MAX_MATCH_LEN		257 | 
|  |  | 
|  | /* Number of distinct match lengths that can be represented  */ | 
|  | #define LZX_NUM_LENS			(LZX_MAX_MATCH_LEN - LZX_MIN_MATCH_LEN + 1) | 
|  |  | 
|  | /* Number of match lengths for which no length symbol is required  */ | 
|  | #define LZX_NUM_PRIMARY_LENS		7 | 
|  | #define LZX_NUM_LEN_HEADERS		(LZX_NUM_PRIMARY_LENS + 1) | 
|  |  | 
|  | /* Valid values of the 3-bit block type field  */ | 
|  | #define LZX_BLOCKTYPE_VERBATIM		1 | 
|  | #define LZX_BLOCKTYPE_ALIGNED		2 | 
|  | #define LZX_BLOCKTYPE_UNCOMPRESSED	3 | 
|  |  | 
|  | /* Number of offset slots for a window size of 32768  */ | 
|  | #define LZX_NUM_OFFSET_SLOTS		30 | 
|  |  | 
|  | /* Number of symbols in the main code for a window size of 32768  */ | 
|  | #define LZX_MAINCODE_NUM_SYMBOLS	\ | 
|  | (LZX_NUM_CHARS + (LZX_NUM_OFFSET_SLOTS * LZX_NUM_LEN_HEADERS)) | 
|  |  | 
|  | /* Number of symbols in the length code  */ | 
|  | #define LZX_LENCODE_NUM_SYMBOLS		(LZX_NUM_LENS - LZX_NUM_PRIMARY_LENS) | 
|  |  | 
|  | /* Number of symbols in the precode  */ | 
|  | #define LZX_PRECODE_NUM_SYMBOLS		20 | 
|  |  | 
|  | /* Number of bits in which each precode codeword length is represented  */ | 
|  | #define LZX_PRECODE_ELEMENT_SIZE	4 | 
|  |  | 
|  | /* Number of low-order bits of each match offset that are entropy-encoded in | 
|  | * aligned offset blocks | 
|  | */ | 
|  | #define LZX_NUM_ALIGNED_OFFSET_BITS	3 | 
|  |  | 
|  | /* Number of symbols in the aligned offset code  */ | 
|  | #define LZX_ALIGNEDCODE_NUM_SYMBOLS	(1 << LZX_NUM_ALIGNED_OFFSET_BITS) | 
|  |  | 
|  | /* Mask for the match offset bits that are entropy-encoded in aligned offset | 
|  | * blocks | 
|  | */ | 
|  | #define LZX_ALIGNED_OFFSET_BITMASK	((1 << LZX_NUM_ALIGNED_OFFSET_BITS) - 1) | 
|  |  | 
|  | /* Number of bits in which each aligned offset codeword length is represented  */ | 
|  | #define LZX_ALIGNEDCODE_ELEMENT_SIZE	3 | 
|  |  | 
|  | /* Maximum lengths (in bits) of the codewords in each Huffman code  */ | 
|  | #define LZX_MAX_MAIN_CODEWORD_LEN	16 | 
|  | #define LZX_MAX_LEN_CODEWORD_LEN	16 | 
|  | #define LZX_MAX_PRE_CODEWORD_LEN	((1 << LZX_PRECODE_ELEMENT_SIZE) - 1) | 
|  | #define LZX_MAX_ALIGNED_CODEWORD_LEN	((1 << LZX_ALIGNEDCODE_ELEMENT_SIZE) - 1) | 
|  |  | 
|  | /* The default "filesize" value used in pre/post-processing.  In the LZX format | 
|  | * used in cabinet files this value must be given to the decompressor, whereas | 
|  | * in the LZX format used in WIM files and system-compressed files this value is | 
|  | * fixed at 12000000. | 
|  | */ | 
|  | #define LZX_DEFAULT_FILESIZE		12000000 | 
|  |  | 
|  | /* Assumed block size when the encoded block size begins with a 0 bit.  */ | 
|  | #define LZX_DEFAULT_BLOCK_SIZE		32768 | 
|  |  | 
|  | /* Number of offsets in the recent (or "repeat") offsets queue.  */ | 
|  | #define LZX_NUM_RECENT_OFFSETS		3 | 
|  |  | 
|  | /* These values are chosen for fast decompression.  */ | 
|  | #define LZX_MAINCODE_TABLEBITS		11 | 
|  | #define LZX_LENCODE_TABLEBITS		10 | 
|  | #define LZX_PRECODE_TABLEBITS		6 | 
|  | #define LZX_ALIGNEDCODE_TABLEBITS	7 | 
|  |  | 
|  | #define LZX_READ_LENS_MAX_OVERRUN	50 | 
|  |  | 
|  | /* Mapping: offset slot => first match offset that uses that offset slot. | 
|  | */ | 
|  | static const u32 lzx_offset_slot_base[LZX_NUM_OFFSET_SLOTS + 1] = { | 
|  | 0,	1,	2,	3,	4,	/* 0  --- 4  */ | 
|  | 6,	8,	12,	16,	24,	/* 5  --- 9  */ | 
|  | 32,	48,	64,	96,	128,	/* 10 --- 14 */ | 
|  | 192,	256,	384,	512,	768,	/* 15 --- 19 */ | 
|  | 1024,	1536,	2048,	3072,	4096,   /* 20 --- 24 */ | 
|  | 6144,	8192,	12288,	16384,	24576,	/* 25 --- 29 */ | 
|  | 32768,					/* extra     */ | 
|  | }; | 
|  |  | 
|  | /* Mapping: offset slot => how many extra bits must be read and added to the | 
|  | * corresponding offset slot base to decode the match offset. | 
|  | */ | 
|  | static const u8 lzx_extra_offset_bits[LZX_NUM_OFFSET_SLOTS] = { | 
|  | 0,	0,	0,	0,	1, | 
|  | 1,	2,	2,	3,	3, | 
|  | 4,	4,	5,	5,	6, | 
|  | 6,	7,	7,	8,	8, | 
|  | 9,	9,	10,	10,	11, | 
|  | 11,	12,	12,	13,	13, | 
|  | }; | 
|  |  | 
|  | /* Reusable heap-allocated memory for LZX decompression  */ | 
|  | struct lzx_decompressor { | 
|  |  | 
|  | /* Huffman decoding tables, and arrays that map symbols to codeword | 
|  | * lengths | 
|  | */ | 
|  |  | 
|  | u16 maincode_decode_table[(1 << LZX_MAINCODE_TABLEBITS) + | 
|  | (LZX_MAINCODE_NUM_SYMBOLS * 2)]; | 
|  | u8 maincode_lens[LZX_MAINCODE_NUM_SYMBOLS + LZX_READ_LENS_MAX_OVERRUN]; | 
|  |  | 
|  |  | 
|  | u16 lencode_decode_table[(1 << LZX_LENCODE_TABLEBITS) + | 
|  | (LZX_LENCODE_NUM_SYMBOLS * 2)]; | 
|  | u8 lencode_lens[LZX_LENCODE_NUM_SYMBOLS + LZX_READ_LENS_MAX_OVERRUN]; | 
|  |  | 
|  |  | 
|  | u16 alignedcode_decode_table[(1 << LZX_ALIGNEDCODE_TABLEBITS) + | 
|  | (LZX_ALIGNEDCODE_NUM_SYMBOLS * 2)]; | 
|  | u8 alignedcode_lens[LZX_ALIGNEDCODE_NUM_SYMBOLS]; | 
|  |  | 
|  | u16 precode_decode_table[(1 << LZX_PRECODE_TABLEBITS) + | 
|  | (LZX_PRECODE_NUM_SYMBOLS * 2)]; | 
|  | u8 precode_lens[LZX_PRECODE_NUM_SYMBOLS]; | 
|  |  | 
|  | /* Temporary space for make_huffman_decode_table()  */ | 
|  | u16 working_space[2 * (1 + LZX_MAX_MAIN_CODEWORD_LEN) + | 
|  | LZX_MAINCODE_NUM_SYMBOLS]; | 
|  | }; | 
|  |  | 
|  | static void undo_e8_translation(void *target, s32 input_pos) | 
|  | { | 
|  | s32 abs_offset, rel_offset; | 
|  |  | 
|  | abs_offset = get_unaligned_le32(target); | 
|  | if (abs_offset >= 0) { | 
|  | if (abs_offset < LZX_DEFAULT_FILESIZE) { | 
|  | /* "good translation" */ | 
|  | rel_offset = abs_offset - input_pos; | 
|  | put_unaligned_le32(rel_offset, target); | 
|  | } | 
|  | } else { | 
|  | if (abs_offset >= -input_pos) { | 
|  | /* "compensating translation" */ | 
|  | rel_offset = abs_offset + LZX_DEFAULT_FILESIZE; | 
|  | put_unaligned_le32(rel_offset, target); | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | /* | 
|  | * Undo the 'E8' preprocessing used in LZX.  Before compression, the | 
|  | * uncompressed data was preprocessed by changing the targets of suspected x86 | 
|  | * CALL instructions from relative offsets to absolute offsets.  After | 
|  | * match/literal decoding, the decompressor must undo the translation. | 
|  | */ | 
|  | static void lzx_postprocess(u8 *data, u32 size) | 
|  | { | 
|  | /* | 
|  | * A worthwhile optimization is to push the end-of-buffer check into the | 
|  | * relatively rare E8 case.  This is possible if we replace the last six | 
|  | * bytes of data with E8 bytes; then we are guaranteed to hit an E8 byte | 
|  | * before reaching end-of-buffer.  In addition, this scheme guarantees | 
|  | * that no translation can begin following an E8 byte in the last 10 | 
|  | * bytes because a 4-byte offset containing E8 as its high byte is a | 
|  | * large negative number that is not valid for translation.  That is | 
|  | * exactly what we need. | 
|  | */ | 
|  | u8 *tail; | 
|  | u8 saved_bytes[6]; | 
|  | u8 *p; | 
|  |  | 
|  | if (size <= 10) | 
|  | return; | 
|  |  | 
|  | tail = &data[size - 6]; | 
|  | memcpy(saved_bytes, tail, 6); | 
|  | memset(tail, 0xE8, 6); | 
|  | p = data; | 
|  | for (;;) { | 
|  | while (*p != 0xE8) | 
|  | p++; | 
|  | if (p >= tail) | 
|  | break; | 
|  | undo_e8_translation(p + 1, p - data); | 
|  | p += 5; | 
|  | } | 
|  | memcpy(tail, saved_bytes, 6); | 
|  | } | 
|  |  | 
|  | /* Read a Huffman-encoded symbol using the precode.  */ | 
|  | static forceinline u32 read_presym(const struct lzx_decompressor *d, | 
|  | struct input_bitstream *is) | 
|  | { | 
|  | return read_huffsym(is, d->precode_decode_table, | 
|  | LZX_PRECODE_TABLEBITS, LZX_MAX_PRE_CODEWORD_LEN); | 
|  | } | 
|  |  | 
|  | /* Read a Huffman-encoded symbol using the main code.  */ | 
|  | static forceinline u32 read_mainsym(const struct lzx_decompressor *d, | 
|  | struct input_bitstream *is) | 
|  | { | 
|  | return read_huffsym(is, d->maincode_decode_table, | 
|  | LZX_MAINCODE_TABLEBITS, LZX_MAX_MAIN_CODEWORD_LEN); | 
|  | } | 
|  |  | 
|  | /* Read a Huffman-encoded symbol using the length code.  */ | 
|  | static forceinline u32 read_lensym(const struct lzx_decompressor *d, | 
|  | struct input_bitstream *is) | 
|  | { | 
|  | return read_huffsym(is, d->lencode_decode_table, | 
|  | LZX_LENCODE_TABLEBITS, LZX_MAX_LEN_CODEWORD_LEN); | 
|  | } | 
|  |  | 
|  | /* Read a Huffman-encoded symbol using the aligned offset code.  */ | 
|  | static forceinline u32 read_alignedsym(const struct lzx_decompressor *d, | 
|  | struct input_bitstream *is) | 
|  | { | 
|  | return read_huffsym(is, d->alignedcode_decode_table, | 
|  | LZX_ALIGNEDCODE_TABLEBITS, | 
|  | LZX_MAX_ALIGNED_CODEWORD_LEN); | 
|  | } | 
|  |  | 
|  | /* | 
|  | * Read the precode from the compressed input bitstream, then use it to decode | 
|  | * @num_lens codeword length values. | 
|  | * | 
|  | * @is:		The input bitstream. | 
|  | * | 
|  | * @lens:	An array that contains the length values from the previous time | 
|  | *		the codeword lengths for this Huffman code were read, or all 0's | 
|  | *		if this is the first time.  This array must have at least | 
|  | *		(@num_lens + LZX_READ_LENS_MAX_OVERRUN) entries. | 
|  | * | 
|  | * @num_lens:	Number of length values to decode. | 
|  | * | 
|  | * Returns 0 on success, or -1 if the data was invalid. | 
|  | */ | 
|  | static int lzx_read_codeword_lens(struct lzx_decompressor *d, | 
|  | struct input_bitstream *is, | 
|  | u8 *lens, u32 num_lens) | 
|  | { | 
|  | u8 *len_ptr = lens; | 
|  | u8 *lens_end = lens + num_lens; | 
|  | int i; | 
|  |  | 
|  | /* Read the lengths of the precode codewords.  These are given | 
|  | * explicitly. | 
|  | */ | 
|  | for (i = 0; i < LZX_PRECODE_NUM_SYMBOLS; i++) { | 
|  | d->precode_lens[i] = | 
|  | bitstream_read_bits(is, LZX_PRECODE_ELEMENT_SIZE); | 
|  | } | 
|  |  | 
|  | /* Make the decoding table for the precode.  */ | 
|  | if (make_huffman_decode_table(d->precode_decode_table, | 
|  | LZX_PRECODE_NUM_SYMBOLS, | 
|  | LZX_PRECODE_TABLEBITS, | 
|  | d->precode_lens, | 
|  | LZX_MAX_PRE_CODEWORD_LEN, | 
|  | d->working_space)) | 
|  | return -1; | 
|  |  | 
|  | /* Decode the codeword lengths.  */ | 
|  | do { | 
|  | u32 presym; | 
|  | u8 len; | 
|  |  | 
|  | /* Read the next precode symbol.  */ | 
|  | presym = read_presym(d, is); | 
|  | if (presym < 17) { | 
|  | /* Difference from old length  */ | 
|  | len = *len_ptr - presym; | 
|  | if ((s8)len < 0) | 
|  | len += 17; | 
|  | *len_ptr++ = len; | 
|  | } else { | 
|  | /* Special RLE values  */ | 
|  |  | 
|  | u32 run_len; | 
|  |  | 
|  | if (presym == 17) { | 
|  | /* Run of 0's  */ | 
|  | run_len = 4 + bitstream_read_bits(is, 4); | 
|  | len = 0; | 
|  | } else if (presym == 18) { | 
|  | /* Longer run of 0's  */ | 
|  | run_len = 20 + bitstream_read_bits(is, 5); | 
|  | len = 0; | 
|  | } else { | 
|  | /* Run of identical lengths  */ | 
|  | run_len = 4 + bitstream_read_bits(is, 1); | 
|  | presym = read_presym(d, is); | 
|  | if (presym > 17) | 
|  | return -1; | 
|  | len = *len_ptr - presym; | 
|  | if ((s8)len < 0) | 
|  | len += 17; | 
|  | } | 
|  |  | 
|  | do { | 
|  | *len_ptr++ = len; | 
|  | } while (--run_len); | 
|  | /* Worst case overrun is when presym == 18, | 
|  | * run_len == 20 + 31, and only 1 length was remaining. | 
|  | * So LZX_READ_LENS_MAX_OVERRUN == 50. | 
|  | * | 
|  | * Overrun while reading the first half of maincode_lens | 
|  | * can corrupt the previous values in the second half. | 
|  | * This doesn't really matter because the resulting | 
|  | * lengths will still be in range, and data that | 
|  | * generates overruns is invalid anyway. | 
|  | */ | 
|  | } | 
|  | } while (len_ptr < lens_end); | 
|  |  | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | /* | 
|  | * Read the header of an LZX block and save the block type and (uncompressed) | 
|  | * size in *block_type_ret and *block_size_ret, respectively. | 
|  | * | 
|  | * If the block is compressed, also update the Huffman decode @tables with the | 
|  | * new Huffman codes.  If the block is uncompressed, also update the match | 
|  | * offset @queue with the new match offsets. | 
|  | * | 
|  | * Return 0 on success, or -1 if the data was invalid. | 
|  | */ | 
|  | static int lzx_read_block_header(struct lzx_decompressor *d, | 
|  | struct input_bitstream *is, | 
|  | int *block_type_ret, | 
|  | u32 *block_size_ret, | 
|  | u32 recent_offsets[]) | 
|  | { | 
|  | int block_type; | 
|  | u32 block_size; | 
|  | int i; | 
|  |  | 
|  | bitstream_ensure_bits(is, 4); | 
|  |  | 
|  | /* The first three bits tell us what kind of block it is, and should be | 
|  | * one of the LZX_BLOCKTYPE_* values. | 
|  | */ | 
|  | block_type = bitstream_pop_bits(is, 3); | 
|  |  | 
|  | /* Read the block size.  */ | 
|  | if (bitstream_pop_bits(is, 1)) { | 
|  | block_size = LZX_DEFAULT_BLOCK_SIZE; | 
|  | } else { | 
|  | block_size = 0; | 
|  | block_size |= bitstream_read_bits(is, 8); | 
|  | block_size <<= 8; | 
|  | block_size |= bitstream_read_bits(is, 8); | 
|  | } | 
|  |  | 
|  | switch (block_type) { | 
|  |  | 
|  | case LZX_BLOCKTYPE_ALIGNED: | 
|  |  | 
|  | /* Read the aligned offset code and prepare its decode table. | 
|  | */ | 
|  |  | 
|  | for (i = 0; i < LZX_ALIGNEDCODE_NUM_SYMBOLS; i++) { | 
|  | d->alignedcode_lens[i] = | 
|  | bitstream_read_bits(is, | 
|  | LZX_ALIGNEDCODE_ELEMENT_SIZE); | 
|  | } | 
|  |  | 
|  | if (make_huffman_decode_table(d->alignedcode_decode_table, | 
|  | LZX_ALIGNEDCODE_NUM_SYMBOLS, | 
|  | LZX_ALIGNEDCODE_TABLEBITS, | 
|  | d->alignedcode_lens, | 
|  | LZX_MAX_ALIGNED_CODEWORD_LEN, | 
|  | d->working_space)) | 
|  | return -1; | 
|  |  | 
|  | /* Fall though, since the rest of the header for aligned offset | 
|  | * blocks is the same as that for verbatim blocks. | 
|  | */ | 
|  | fallthrough; | 
|  |  | 
|  | case LZX_BLOCKTYPE_VERBATIM: | 
|  |  | 
|  | /* Read the main code and prepare its decode table. | 
|  | * | 
|  | * Note that the codeword lengths in the main code are encoded | 
|  | * in two parts: one part for literal symbols, and one part for | 
|  | * match symbols. | 
|  | */ | 
|  |  | 
|  | if (lzx_read_codeword_lens(d, is, d->maincode_lens, | 
|  | LZX_NUM_CHARS)) | 
|  | return -1; | 
|  |  | 
|  | if (lzx_read_codeword_lens(d, is, | 
|  | d->maincode_lens + LZX_NUM_CHARS, | 
|  | LZX_MAINCODE_NUM_SYMBOLS - LZX_NUM_CHARS)) | 
|  | return -1; | 
|  |  | 
|  | if (make_huffman_decode_table(d->maincode_decode_table, | 
|  | LZX_MAINCODE_NUM_SYMBOLS, | 
|  | LZX_MAINCODE_TABLEBITS, | 
|  | d->maincode_lens, | 
|  | LZX_MAX_MAIN_CODEWORD_LEN, | 
|  | d->working_space)) | 
|  | return -1; | 
|  |  | 
|  | /* Read the length code and prepare its decode table.  */ | 
|  |  | 
|  | if (lzx_read_codeword_lens(d, is, d->lencode_lens, | 
|  | LZX_LENCODE_NUM_SYMBOLS)) | 
|  | return -1; | 
|  |  | 
|  | if (make_huffman_decode_table(d->lencode_decode_table, | 
|  | LZX_LENCODE_NUM_SYMBOLS, | 
|  | LZX_LENCODE_TABLEBITS, | 
|  | d->lencode_lens, | 
|  | LZX_MAX_LEN_CODEWORD_LEN, | 
|  | d->working_space)) | 
|  | return -1; | 
|  |  | 
|  | break; | 
|  |  | 
|  | case LZX_BLOCKTYPE_UNCOMPRESSED: | 
|  |  | 
|  | /* Before reading the three recent offsets from the uncompressed | 
|  | * block header, the stream must be aligned on a 16-bit | 
|  | * boundary.  But if the stream is *already* aligned, then the | 
|  | * next 16 bits must be discarded. | 
|  | */ | 
|  | bitstream_ensure_bits(is, 1); | 
|  | bitstream_align(is); | 
|  |  | 
|  | recent_offsets[0] = bitstream_read_u32(is); | 
|  | recent_offsets[1] = bitstream_read_u32(is); | 
|  | recent_offsets[2] = bitstream_read_u32(is); | 
|  |  | 
|  | /* Offsets of 0 are invalid.  */ | 
|  | if (recent_offsets[0] == 0 || recent_offsets[1] == 0 || | 
|  | recent_offsets[2] == 0) | 
|  | return -1; | 
|  | break; | 
|  |  | 
|  | default: | 
|  | /* Unrecognized block type.  */ | 
|  | return -1; | 
|  | } | 
|  |  | 
|  | *block_type_ret = block_type; | 
|  | *block_size_ret = block_size; | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | /* Decompress a block of LZX-compressed data.  */ | 
|  | static int lzx_decompress_block(const struct lzx_decompressor *d, | 
|  | struct input_bitstream *is, | 
|  | int block_type, u32 block_size, | 
|  | u8 * const out_begin, u8 *out_next, | 
|  | u32 recent_offsets[]) | 
|  | { | 
|  | u8 * const block_end = out_next + block_size; | 
|  | u32 ones_if_aligned = 0U - (block_type == LZX_BLOCKTYPE_ALIGNED); | 
|  |  | 
|  | do { | 
|  | u32 mainsym; | 
|  | u32 match_len; | 
|  | u32 match_offset; | 
|  | u32 offset_slot; | 
|  | u32 num_extra_bits; | 
|  |  | 
|  | mainsym = read_mainsym(d, is); | 
|  | if (mainsym < LZX_NUM_CHARS) { | 
|  | /* Literal  */ | 
|  | *out_next++ = mainsym; | 
|  | continue; | 
|  | } | 
|  |  | 
|  | /* Match  */ | 
|  |  | 
|  | /* Decode the length header and offset slot.  */ | 
|  | mainsym -= LZX_NUM_CHARS; | 
|  | match_len = mainsym % LZX_NUM_LEN_HEADERS; | 
|  | offset_slot = mainsym / LZX_NUM_LEN_HEADERS; | 
|  |  | 
|  | /* If needed, read a length symbol to decode the full length. */ | 
|  | if (match_len == LZX_NUM_PRIMARY_LENS) | 
|  | match_len += read_lensym(d, is); | 
|  | match_len += LZX_MIN_MATCH_LEN; | 
|  |  | 
|  | if (offset_slot < LZX_NUM_RECENT_OFFSETS) { | 
|  | /* Repeat offset  */ | 
|  |  | 
|  | /* Note: This isn't a real LRU queue, since using the R2 | 
|  | * offset doesn't bump the R1 offset down to R2.  This | 
|  | * quirk allows all 3 recent offsets to be handled by | 
|  | * the same code.  (For R0, the swap is a no-op.) | 
|  | */ | 
|  | match_offset = recent_offsets[offset_slot]; | 
|  | recent_offsets[offset_slot] = recent_offsets[0]; | 
|  | recent_offsets[0] = match_offset; | 
|  | } else { | 
|  | /* Explicit offset  */ | 
|  |  | 
|  | /* Look up the number of extra bits that need to be read | 
|  | * to decode offsets with this offset slot. | 
|  | */ | 
|  | num_extra_bits = lzx_extra_offset_bits[offset_slot]; | 
|  |  | 
|  | /* Start with the offset slot base value.  */ | 
|  | match_offset = lzx_offset_slot_base[offset_slot]; | 
|  |  | 
|  | /* In aligned offset blocks, the low-order 3 bits of | 
|  | * each offset are encoded using the aligned offset | 
|  | * code.  Otherwise, all the extra bits are literal. | 
|  | */ | 
|  |  | 
|  | if ((num_extra_bits & ones_if_aligned) >= LZX_NUM_ALIGNED_OFFSET_BITS) { | 
|  | match_offset += | 
|  | bitstream_read_bits(is, num_extra_bits - | 
|  | LZX_NUM_ALIGNED_OFFSET_BITS) | 
|  | << LZX_NUM_ALIGNED_OFFSET_BITS; | 
|  | match_offset += read_alignedsym(d, is); | 
|  | } else { | 
|  | match_offset += bitstream_read_bits(is, num_extra_bits); | 
|  | } | 
|  |  | 
|  | /* Adjust the offset.  */ | 
|  | match_offset -= (LZX_NUM_RECENT_OFFSETS - 1); | 
|  |  | 
|  | /* Update the recent offsets.  */ | 
|  | recent_offsets[2] = recent_offsets[1]; | 
|  | recent_offsets[1] = recent_offsets[0]; | 
|  | recent_offsets[0] = match_offset; | 
|  | } | 
|  |  | 
|  | /* Validate the match, then copy it to the current position.  */ | 
|  |  | 
|  | if (match_len > (size_t)(block_end - out_next)) | 
|  | return -1; | 
|  |  | 
|  | if (match_offset > (size_t)(out_next - out_begin)) | 
|  | return -1; | 
|  |  | 
|  | out_next = lz_copy(out_next, match_len, match_offset, | 
|  | block_end, LZX_MIN_MATCH_LEN); | 
|  |  | 
|  | } while (out_next != block_end); | 
|  |  | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | /* | 
|  | * lzx_allocate_decompressor - Allocate an LZX decompressor | 
|  | * | 
|  | * Return the pointer to the decompressor on success, or return NULL and set | 
|  | * errno on failure. | 
|  | */ | 
|  | struct lzx_decompressor *lzx_allocate_decompressor(void) | 
|  | { | 
|  | return kmalloc(sizeof(struct lzx_decompressor), GFP_NOFS); | 
|  | } | 
|  |  | 
|  | /* | 
|  | * lzx_decompress - Decompress a buffer of LZX-compressed data | 
|  | * | 
|  | * @decompressor:      A decompressor allocated with lzx_allocate_decompressor() | 
|  | * @compressed_data:	The buffer of data to decompress | 
|  | * @compressed_size:	Number of bytes of compressed data | 
|  | * @uncompressed_data:	The buffer in which to store the decompressed data | 
|  | * @uncompressed_size:	The number of bytes the data decompresses into | 
|  | * | 
|  | * Return 0 on success, or return -1 and set errno on failure. | 
|  | */ | 
|  | int lzx_decompress(struct lzx_decompressor *decompressor, | 
|  | const void *compressed_data, size_t compressed_size, | 
|  | void *uncompressed_data, size_t uncompressed_size) | 
|  | { | 
|  | struct lzx_decompressor *d = decompressor; | 
|  | u8 * const out_begin = uncompressed_data; | 
|  | u8 *out_next = out_begin; | 
|  | u8 * const out_end = out_begin + uncompressed_size; | 
|  | struct input_bitstream is; | 
|  | u32 recent_offsets[LZX_NUM_RECENT_OFFSETS] = {1, 1, 1}; | 
|  | int e8_status = 0; | 
|  |  | 
|  | init_input_bitstream(&is, compressed_data, compressed_size); | 
|  |  | 
|  | /* Codeword lengths begin as all 0's for delta encoding purposes.  */ | 
|  | memset(d->maincode_lens, 0, LZX_MAINCODE_NUM_SYMBOLS); | 
|  | memset(d->lencode_lens, 0, LZX_LENCODE_NUM_SYMBOLS); | 
|  |  | 
|  | /* Decompress blocks until we have all the uncompressed data.  */ | 
|  |  | 
|  | while (out_next != out_end) { | 
|  | int block_type; | 
|  | u32 block_size; | 
|  |  | 
|  | if (lzx_read_block_header(d, &is, &block_type, &block_size, | 
|  | recent_offsets)) | 
|  | goto invalid; | 
|  |  | 
|  | if (block_size < 1 || block_size > (size_t)(out_end - out_next)) | 
|  | goto invalid; | 
|  |  | 
|  | if (block_type != LZX_BLOCKTYPE_UNCOMPRESSED) { | 
|  |  | 
|  | /* Compressed block  */ | 
|  |  | 
|  | if (lzx_decompress_block(d, | 
|  | &is, | 
|  | block_type, | 
|  | block_size, | 
|  | out_begin, | 
|  | out_next, | 
|  | recent_offsets)) | 
|  | goto invalid; | 
|  |  | 
|  | e8_status |= d->maincode_lens[0xe8]; | 
|  | out_next += block_size; | 
|  | } else { | 
|  | /* Uncompressed block  */ | 
|  |  | 
|  | out_next = bitstream_read_bytes(&is, out_next, | 
|  | block_size); | 
|  | if (!out_next) | 
|  | goto invalid; | 
|  |  | 
|  | if (block_size & 1) | 
|  | bitstream_read_byte(&is); | 
|  |  | 
|  | e8_status = 1; | 
|  | } | 
|  | } | 
|  |  | 
|  | /* Postprocess the data unless it cannot possibly contain 0xe8 bytes. */ | 
|  | if (e8_status) | 
|  | lzx_postprocess(uncompressed_data, uncompressed_size); | 
|  |  | 
|  | return 0; | 
|  |  | 
|  | invalid: | 
|  | return -1; | 
|  | } | 
|  |  | 
|  | /* | 
|  | * lzx_free_decompressor - Free an LZX decompressor | 
|  | * | 
|  | * @decompressor:       A decompressor that was allocated with | 
|  | *			lzx_allocate_decompressor(), or NULL. | 
|  | */ | 
|  | void lzx_free_decompressor(struct lzx_decompressor *decompressor) | 
|  | { | 
|  | kfree(decompressor); | 
|  | } |