BinaryObjectScanner/BurnOutSharp/External/libmspack/Compression/CompressionStream.cs

/* This file is part of libmspack.
 * (C) 2003-2013 Stuart Caie.
 *
 * The LZX method was created by Jonathan Forbes and Tomi Poutanen, adapted
 * by Microsoft Corporation.
 *
 * libmspack is free software { get; set; } you can redistribute it and/or modify it under
 * the terms of the GNU Lesser General Public License (LGPL) version 2.1
 *
 * For further details, see the file COPYING.LIB distributed with libmspack
 */

using System;

namespace LibMSPackSharp.Compression
{
    public abstract class CompressionStream
    {
        private const int CHAR_BIT = 8;

        private const int BITBUF_WIDTH = 4 * CHAR_BIT;

        /// <summary>
        /// I/O routines
        /// </summary>
        public SystemImpl Sys { get; set; }

        /// <summary>
        /// Input file handle
        /// </summary>
        public object Input { get; set; }

        /// <summary>
        /// Output file handle
        /// </summary>
        public object Output { get; set; }

        public Error Error { get; set; }

        #region I/O buffering

        public byte[] InputBuffer { get; set; }

        public uint InputBufferSize { get; set; }

        public int InputPointer { get; set; }

        public int InputLength { get; set; }

        public int OutputPointer { get; set; }

        public int OutputLength { get; set; }

        public uint BitBuffer { get; set; }

        public uint BitsLeft { get; set; }

        /// <summary>
        /// Have we reached the end of input?
        /// </summary>
        public int InputEnd { get; set; }

        #endregion

        #region ReadBits Methods

        /* This header defines macros that read data streams by
         * the individual bits
         *
         * INIT_BITS         initialises bitstream state in state structure
         * STORE_BITS        stores bitstream state in state structure
         * RESTORE_BITS      restores bitstream state from state structure
         * ENSURE_BITS(n)    ensure there are at least N bits in the bit buffer
         * READ_BITS(var,n)  takes N bits from the buffer and puts them in var
         * PEEK_BITS(n)      extracts without removing N bits from the bit buffer
         * REMOVE_BITS(n)    removes N bits from the bit buffer
         *
         * READ_BITS simply calls ENSURE_BITS, PEEK_BITS and REMOVE_BITS,
         * which means it's limited to reading the number of bits you can
         * ensure at any one time. It also fails if asked to read zero bits.
         * If you need to read zero bits, or more bits than can be ensured in
         * one go, use READ_MANY_BITS instead.
         *
         * These macros have variable names baked into them, so to use them
         * you have to define some macros:
         * - BITS_TYPE: the type name of your state structure
         * - BITS_VAR: the variable that points to your state structure
         * - define BITS_ORDER_MSB if bits are read from the MSB, or
         *   define BITS_ORDER_LSB if bits are read from the LSB
         * - READ_BYTES: some code that reads more data into the bit buffer,
         *   it should use READ_IF_NEEDED (calls read_input if the byte buffer
         *   is empty), then INJECT_BITS(data,n) to put data from the byte
         *   buffer into the bit buffer.
         *
         * You also need to define some variables and structure members:
         * - byte[] i_ptr;    // current position in the byte buffer
         * - byte[] i_end;    // end of the byte buffer
         * - uint bit_buffer; // the bit buffer itself
         * - uint bits_left;  // number of bits remaining
         *
         * If you use read_input() and READ_IF_NEEDED, they also expect these
         * structure members:
         * - struct mspack_system *sys;  // to access sys->read()
         * - uint error;         // to record/return read errors
         * - byte input_end;    // to mark reaching the EOF
         * - byte[] inbuf;       // the input byte buffer
         * - uint inbuf_size;    // the size of the input byte buffer
         *
         * Your READ_BYTES implementation should read data from *i_ptr and
         * put them in the bit buffer. READ_IF_NEEDED will call read_input()
         * if i_ptr reaches i_end, and will fill up inbuf and set i_ptr to
         * the start of inbuf and i_end to the end of inbuf.
         *
         * If you're reading in MSB order, the routines work by using the area
         * beyond the MSB and the LSB of the bit buffer as a free source of
         * zeroes when shifting. This avoids having to mask any bits. So we
         * have to know the bit width of the bit buffer variable. We use
         * <limits.h> and CHAR_BIT to find the size of the bit buffer in bits.
         *
         * If you are reading in LSB order, bits need to be masked. Normally
         * this is done by computing the mask: N bits are masked by the value
         * (1<<N)-1). However, you can define BITS_LSB_TABLE to use a lookup
         * table instead of computing this. This adds two new macros,
         * PEEK_BITS_T and READ_BITS_T which work the same way as PEEK_BITS
         * and READ_BITS, except they use this lookup table. This is useful if
         * you need to look up a number of bits that are only known at
         * runtime, so the bit mask can't be turned into a constant by the
         * compiler.
         * The bit buffer datatype should be at least 32 bits wide: it must be
         * possible to ENSURE_BITS(17), so it must be possible to add 16 new bits
         * to the bit buffer when the bit buffer already has 1 to 15 bits left.
         */

        public void INIT_BITS()
        {
            InputPointer = 0;
            InputLength = 0;
            BitBuffer = 0;
            BitsLeft = 0;
            InputEnd = 0;
        }

        public void STORE_BITS(int inputPointer, int inputLength, uint bitBuffer, uint bitsLeft)
        {
            InputPointer = inputPointer;
            InputLength = inputLength;
            BitBuffer = bitBuffer;
            BitsLeft = bitsLeft;
        }

        public void RESTORE_BITS(ref int inputPointer, ref int inputLength, ref uint bitBuffer, ref uint bitsLeft)
        {
            inputPointer = InputPointer;
            inputLength = InputLength;
            bitBuffer = BitBuffer;
            bitsLeft = BitsLeft;
        }

        public void ENSURE_BITS(int nbits, ref int i_ptr, ref int i_end, ref uint bitsLeft, ref uint bitBuffer)
        {
            while (bitsLeft < nbits)
            {
                READ_BYTES(ref i_ptr, ref i_end, ref bitsLeft, ref bitBuffer);
            }
        }

        public void READ_BITS(ref int val, int nbits, ref int i_ptr, ref int i_end, ref uint bitsLeft, ref uint bitBuffer)
        {
            ENSURE_BITS(nbits, ref i_ptr, ref i_end, ref bitsLeft, ref bitBuffer);
            val = PEEK_BITS(nbits, bitBuffer);
            REMOVE_BITS(nbits, ref bitsLeft, ref bitBuffer);
        }

        public Error READ_MANY_BITS(ref uint val, byte bits, ref int i_ptr, ref int i_end, ref uint bitsLeft, ref uint bitBuffer)
        {
            byte needed = bits, bitrun;
            val = 0;
            while (needed > 0)
            {
                if (bitsLeft <= (BITBUF_WIDTH - 16))
                {
                    Error error = READ_BYTES(ref i_ptr, ref i_end, ref bitsLeft, ref bitBuffer);
                    if (error != Error.MSPACK_ERR_OK)
                        return error;
                }

                bitrun = (byte)((bitsLeft < needed) ? bitsLeft : needed);
                val = (uint)((val << bitrun) | PEEK_BITS(bitrun, bitBuffer));
                REMOVE_BITS(bitrun, ref bitsLeft, ref bitBuffer);
                needed -= bitrun;
            }

            return Error.MSPACK_ERR_OK;
        }

        public int PEEK_BITS(int nbits, uint bitBuffer)
        {
            return (int)(bitBuffer & ((1 << (nbits)) - 1));
        }

        public void REMOVE_BITS(int nbits, ref uint bitsLeft, ref uint bitBuffer)
        {
            bitBuffer >>= nbits;
            bitsLeft -= (uint)nbits;
        }

        public void INJECT_BITS(uint bitdata, int nbits, ref uint bitsLeft, ref uint bitBuffer)
        {
            bitBuffer |= bitdata << (int)bitsLeft;
            bitsLeft += (uint)nbits;
        }

        public abstract Error READ_BYTES(ref int i_ptr, ref int i_end, ref uint bitsLeft, ref uint bitBuffer);

        // lsb_bit_mask[n] = (1 << n) - 1 */
        private static readonly ushort[] lsb_bit_mask = new ushort[17]
        {
            0x0000, 0x0001, 0x0003, 0x0007, 0x000f, 0x001f, 0x003f, 0x007f, 0x00ff,
            0x01ff, 0x03ff, 0x07ff, 0x0fff, 0x1fff, 0x3fff, 0x7fff, 0xffff
        };

        public int PEEK_BITS_T(int nbits)
        {
            return (int)(BitBuffer & lsb_bit_mask[nbits]);
        }

        public void READ_BITS_T(ref int val, int nbits, ref int i_ptr, ref int i_end, ref uint bitsLeft, ref uint bitBuffer)
        {
            ENSURE_BITS(nbits, ref i_ptr, ref i_end, ref bitsLeft, ref bitBuffer);
            val = PEEK_BITS_T(nbits);
            REMOVE_BITS(nbits, ref bitsLeft, ref bitBuffer);
        }

        public Error READ_IF_NEEDED(ref int iPtr, ref int iEnd)
        {
            if (iPtr >= iEnd)
            {
                if (ReadInput(this) != Error.MSPACK_ERR_OK)
                    return Error;

                iPtr = InputPointer;
                iEnd = InputLength;
            }

            return Error.MSPACK_ERR_OK;
        }

        private static Error ReadInput(CompressionStream p)
        {
            int read = p.Sys.Read(p.Input, p.InputBuffer, 0, (int)p.InputBufferSize);
            if (read < 0)
                return p.Error = Error.MSPACK_ERR_READ;

            // We might overrun the input stream by asking for bits we don't use,
            // so fake 2 more bytes at the end of input
            if (read == 0)
            {
                if (p.InputEnd != 0)
                {
                    Console.WriteLine("out of input bytes");
                    return p.Error = Error.MSPACK_ERR_READ;
                }
                else
                {
                    read = 2;
                    p.InputBuffer[0] = p.InputBuffer[1] = 0;
                    p.InputEnd = 1;
                }
            }

            // Update i_ptr and i_end
            p.InputPointer = 0;
            p.InputLength = read;
            return Error.MSPACK_ERR_OK;
        }

        #endregion

        #region ReadHuff Methods

        private const int HUFF_MAXBITS = 16;

        /// <summary>
        /// Decodes the next huffman symbol from the input bitstream into var.
        /// Do not use this macro on a table unless build_decode_table() succeeded.
        /// </summary>
        public int READ_HUFFSYM(ushort[] decodingTable, ref uint var, int tablebits, byte[] lengthTable, int maxsymbols, ref int i, ref ushort sym, ref int i_ptr, ref int i_end, ref uint bitsLeft, ref uint bitBuffer)
        {
            ENSURE_BITS(HUFF_MAXBITS, ref i_ptr, ref i_end, ref bitsLeft, ref bitBuffer);
            sym = decodingTable[PEEK_BITS(tablebits, bitBuffer)];
            if (sym >= maxsymbols)
            {
                int ret = HUFF_TRAVERSE(decodingTable, tablebits, maxsymbols, ref i, ref sym, bitBuffer);
                if (ret != 0)
                    return ret;
            }

            var = sym;
            i = lengthTable[sym];
            REMOVE_BITS(i, ref bitsLeft, ref bitBuffer);
            return (int)Error.MSPACK_ERR_OK;
        }

        public int HUFF_TRAVERSE(ushort[] decodingTable, int tablebits, int maxsymbols, ref int i, ref ushort sym, uint bitBuffer)
        {
            i = tablebits - 1;
            do
            {
                if (i++ > HUFF_MAXBITS)
                    return HUFF_ERROR();

                sym = decodingTable[(sym << 1) | ((bitBuffer >> i) & 1)];
            } while (sym >= maxsymbols);

            return (int)Error.MSPACK_ERR_OK;
        }

        public abstract int HUFF_ERROR();

        /// <summary>
        /// This function was originally coded by David Tritscher.
        ///
        /// It builds a fast huffman decoding table from
        /// a canonical huffman code lengths table.
        /// </summary>
        /// <param name="nsyms">total number of symbols in this huffman tree.</param>
        /// <param name="nbits">any symbols with a code length of nbits or less can be decoded in one lookup of the table.</param>
        /// <param name="length">A table to get code lengths from [0 to nsyms-1]</param>
        /// <param name="table">
        /// The table to fill up with decoded symbols and pointers.
        /// Should be ((1<<nbits) + (nsyms*2)) in length.
        /// </param>
        /// <returns>0 for OK or 1 for error</returns>
        public static int MakeDecodeTable(uint nsyms, uint nbits, byte[] length, ushort[] table)
        {
            ushort sym, next_symbol;
            uint leaf, fill;
            uint reverse;
            byte bit_num;
            uint pos = 0; // The current position in the decode table
            uint table_mask = (uint)(1 << (int)nbits);
            uint bit_mask = table_mask >> 1; // Don't do 0 length codes

            // Fill entries for codes short enough for a direct mapping
            for (bit_num = 1; bit_num <= nbits; bit_num++)
            {
                for (sym = 0; sym < nsyms; sym++)
                {
                    if (length[sym] != bit_num)
                        continue;

                    // Reverse the significant bits
                    fill = length[sym];
                    reverse = pos >> (int)(nbits - fill);
                    leaf = 0;

                    do
                    {
                        leaf <<= 1;
                        leaf |= reverse & 1;
                        reverse >>= 1;
                    } while (--fill != 0);

                    if ((pos += bit_mask) > table_mask)
                        return 1; // Table overrun

                    // Fill all possible lookups of this symbol with the symbol itself
                    fill = bit_mask;
                    next_symbol = (ushort)(1 << bit_num);

                    do
                    {
                        table[leaf] = sym;
                        leaf += next_symbol;
                    } while (--fill != 0);
                }
                bit_mask >>= 1;
            }

            // Exit with success if table is now complete
            if (pos == table_mask)
                return 0;

            // Mark all remaining table entries as unused
            for (sym = (ushort)pos; sym < table_mask; sym++)
            {
                reverse = sym;
                leaf = 0;
                fill = nbits;

                do
                {
                    leaf <<= 1;
                    leaf |= reverse & 1;
                    reverse >>= 1;
                } while (--fill != 0);

                table[leaf] = 0xFFFF;
            }

            // next_symbol = base of allocation for long codes
            next_symbol = (ushort)(((table_mask >> 1) < nsyms) ? nsyms : (table_mask >> 1));

            // Give ourselves room for codes to grow by up to 16 more bits.
            // codes now start at bit nbits+16 and end at (nbits+16-codelength)
            pos <<= 16;
            table_mask <<= 16;
            bit_mask = 1 << 15;

            for (bit_num = (byte)(nbits + 1); bit_num <= HUFF_MAXBITS; bit_num++)
            {
                for (sym = 0; sym < nsyms; sym++)
                {
                    if (length[sym] != bit_num)
                        continue;
                    if (pos >= table_mask)
                        return 1; // Table overflow

                    // Leaf = the first nbits of the code, reversed
                    reverse = pos >> 16;
                    leaf = 0;
                    fill = nbits;

                    do
                    {
                        leaf <<= 1;
                        leaf |= reverse & 1;
                        reverse >>= 1;
                    } while (--fill != 0);

                    for (fill = 0; fill < (bit_num - nbits); fill++)
                    {
                        // Ff this path hasn't been taken yet, 'allocate' two entries
                        if (table[leaf] == 0xFFFF)
                        {
                            table[(next_symbol << 1)] = 0xFFFF;
                            table[(next_symbol << 1) + 1] = 0xFFFF;
                            table[leaf] = next_symbol++;
                        }

                        // Follow the path and select either left or right for next bit
                        leaf = (uint)(table[leaf] << 1);
                        if (((pos >> (int)(15 - fill)) & 1) != 0)
                            leaf++;
                    }

                    table[leaf] = sym;
                    pos += bit_mask;
                }

                bit_mask >>= 1;
            }

            // Full table?
            return (pos == table_mask) ? 0 : 1;
        }

        #endregion
    }
}