/////////////////////////////////////////////////////////////////////////////// // /// \file block_header_decoder.c /// \brief Decodes Block Header from .lzma files // // Copyright (C) 2007 Lasse Collin // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU // Lesser General Public License for more details. // /////////////////////////////////////////////////////////////////////////////// #include "common.h" #include "check.h" struct lzma_coder_s { lzma_options_block *options; enum { SEQ_FLAGS_1, SEQ_FLAGS_2, SEQ_COMPRESSED_SIZE, SEQ_UNCOMPRESSED_SIZE, SEQ_FILTER_FLAGS_INIT, SEQ_FILTER_FLAGS_DECODE, SEQ_CRC32, SEQ_PADDING } sequence; /// Position in variable-length integers size_t pos; /// CRC32 of the Block Header uint32_t crc32; lzma_next_coder filter_flags_decoder; }; static bool update_sequence(lzma_coder *coder) { switch (coder->sequence) { case SEQ_FLAGS_2: if (coder->options->compressed_size != LZMA_VLI_VALUE_UNKNOWN) { coder->pos = 0; coder->sequence = SEQ_COMPRESSED_SIZE; break; } // Fall through case SEQ_COMPRESSED_SIZE: if (coder->options->uncompressed_size != LZMA_VLI_VALUE_UNKNOWN) { coder->pos = 0; coder->sequence = SEQ_UNCOMPRESSED_SIZE; break; } // Fall through case SEQ_UNCOMPRESSED_SIZE: coder->pos = 0; // Fall through case SEQ_FILTER_FLAGS_DECODE: if (coder->options->filters[coder->pos].id != LZMA_VLI_VALUE_UNKNOWN) { coder->sequence = SEQ_FILTER_FLAGS_INIT; break; } if (coder->options->has_crc32) { coder->pos = 0; coder->sequence = SEQ_CRC32; break; } case SEQ_CRC32: if (coder->options->padding != 0) { coder->pos = 0; coder->sequence = SEQ_PADDING; break; } return true; default: assert(0); return true; } return false; } static lzma_ret block_header_decode(lzma_coder *coder, lzma_allocator *allocator, const uint8_t *restrict in, size_t *restrict in_pos, size_t in_size, uint8_t *restrict out lzma_attribute((unused)), size_t *restrict out_pos lzma_attribute((unused)), size_t out_size lzma_attribute((unused)), lzma_action action lzma_attribute((unused))) { while (*in_pos < in_size) switch (coder->sequence) { case SEQ_FLAGS_1: // Check that the reserved bit is unset. Use HEADER_ERROR // because newer version of liblzma may support the reserved // bit, although it is likely that this is just a broken file. if (in[*in_pos] & 0x40) return LZMA_HEADER_ERROR; // Number of filters: we prepare appropriate amount of // variables for variable-length integer parsing. The // initialization function has already reset the rest // of the values to LZMA_VLI_VALUE_UNKNOWN, which allows // us to later know how many filters there are. for (int i = (int)(in[*in_pos] & 0x07) - 1; i >= 0; --i) coder->options->filters[i].id = 0; // End of Payload Marker flag coder->options->has_eopm = (in[*in_pos] & 0x08) != 0; // Compressed Size: Prepare for variable-length integer // parsing if it is known. if (in[*in_pos] & 0x10) coder->options->compressed_size = 0; // Uncompressed Size: the same. if (in[*in_pos] & 0x20) coder->options->uncompressed_size = 0; // Is Metadata Block flag coder->options->is_metadata = (in[*in_pos] & 0x80) != 0; // We need at least one: Uncompressed Size or EOPM. if (coder->options->uncompressed_size == LZMA_VLI_VALUE_UNKNOWN && !coder->options->has_eopm) return LZMA_DATA_ERROR; // Update header CRC32. coder->crc32 = lzma_crc32(in + *in_pos, 1, coder->crc32); ++*in_pos; coder->sequence = SEQ_FLAGS_2; break; case SEQ_FLAGS_2: // Check that the reserved bits are unset. if (in[*in_pos] & 0xE0) return LZMA_DATA_ERROR; // Get the size of Header Padding. coder->options->padding = in[*in_pos] & 0x1F; coder->crc32 = lzma_crc32(in + *in_pos, 1, coder->crc32); ++*in_pos; if (update_sequence(coder)) return LZMA_STREAM_END; break; case SEQ_COMPRESSED_SIZE: { // Store the old input position to be used when // updating coder->header_crc32. const size_t in_start = *in_pos; const lzma_ret ret = lzma_vli_decode( &coder->options->compressed_size, &coder->pos, in, in_pos, in_size); const size_t in_used = *in_pos - in_start; coder->options->compressed_reserve += in_used; assert(coder->options->compressed_reserve <= LZMA_VLI_BYTES_MAX); coder->options->header_size += in_used; coder->crc32 = lzma_crc32(in + in_start, in_used, coder->crc32); if (ret != LZMA_STREAM_END) return ret; if (update_sequence(coder)) return LZMA_STREAM_END; break; } case SEQ_UNCOMPRESSED_SIZE: { const size_t in_start = *in_pos; const lzma_ret ret = lzma_vli_decode( &coder->options->uncompressed_size, &coder->pos, in, in_pos, in_size); const size_t in_used = *in_pos - in_start; coder->options->uncompressed_reserve += in_used; assert(coder->options->uncompressed_reserve <= LZMA_VLI_BYTES_MAX); coder->options->header_size += in_used; coder->crc32 = lzma_crc32(in + in_start, in_used, coder->crc32); if (ret != LZMA_STREAM_END) return ret; if (update_sequence(coder)) return LZMA_STREAM_END; break; } case SEQ_FILTER_FLAGS_INIT: { assert(coder->options->filters[coder->pos].id != LZMA_VLI_VALUE_UNKNOWN); const lzma_ret ret = lzma_filter_flags_decoder_init( &coder->filter_flags_decoder, allocator, &coder->options->filters[coder->pos]); if (ret != LZMA_OK) return ret; coder->sequence = SEQ_FILTER_FLAGS_DECODE; } // Fall through case SEQ_FILTER_FLAGS_DECODE: { const size_t in_start = *in_pos; const lzma_ret ret = coder->filter_flags_decoder.code( coder->filter_flags_decoder.coder, allocator, in, in_pos, in_size, NULL, NULL, 0, LZMA_RUN); const size_t in_used = *in_pos - in_start; coder->options->header_size += in_used; coder->crc32 = lzma_crc32(in + in_start, in_used, coder->crc32); if (ret != LZMA_STREAM_END) return ret; ++coder->pos; if (update_sequence(coder)) return LZMA_STREAM_END; break; } case SEQ_CRC32: assert(coder->options->has_crc32); if (in[*in_pos] != ((coder->crc32 >> (coder->pos * 8)) & 0xFF)) return LZMA_DATA_ERROR; ++*in_pos; ++coder->pos; // Check if we reached end of the CRC32 field. if (coder->pos == 4) { coder->options->header_size += 4; if (update_sequence(coder)) return LZMA_STREAM_END; } break; case SEQ_PADDING: if (in[*in_pos] != 0x00) return LZMA_DATA_ERROR; ++*in_pos; ++coder->options->header_size; ++coder->pos; if (coder->pos < (size_t)(coder->options->padding)) break; return LZMA_STREAM_END; default: return LZMA_PROG_ERROR; } return LZMA_OK; } static void block_header_decoder_end(lzma_coder *coder, lzma_allocator *allocator) { lzma_next_coder_end(&coder->filter_flags_decoder, allocator); lzma_free(coder, allocator); return; } extern lzma_ret lzma_block_header_decoder_init(lzma_next_coder *next, lzma_allocator *allocator, lzma_options_block *options) { if (next->coder == NULL) { next->coder = lzma_alloc(sizeof(lzma_coder), allocator); if (next->coder == NULL) return LZMA_MEM_ERROR; next->code = &block_header_decode; next->end = &block_header_decoder_end; next->coder->filter_flags_decoder = LZMA_NEXT_CODER_INIT; } // Assume that Compressed Size and Uncompressed Size are unknown. options->compressed_size = LZMA_VLI_VALUE_UNKNOWN; options->uncompressed_size = LZMA_VLI_VALUE_UNKNOWN; // We will calculate the sizes of these fields too so that the // application may rewrite the header if it wishes so. options->compressed_reserve = 0; options->uncompressed_reserve = 0; // The Block Flags field is always present, so include its size here // and we don't need to worry about it in block_header_decode(). options->header_size = 2; // Reset filters[] to indicate empty list of filters. // See SEQ_FLAGS_1 in block_header_decode() for reasoning of this. for (size_t i = 0; i < 8; ++i) { options->filters[i].id = LZMA_VLI_VALUE_UNKNOWN; options->filters[i].options = NULL; } next->coder->options = options; next->coder->sequence = SEQ_FLAGS_1; next->coder->pos = 0; next->coder->crc32 = 0; return LZMA_OK; } extern LZMA_API lzma_ret lzma_block_header_decoder(lzma_stream *strm, lzma_options_block *options) { lzma_next_strm_init(strm, lzma_block_header_decoder_init, options); strm->internal->supported_actions[LZMA_RUN] = true; return LZMA_OK; }