123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788 |
- using System;
- using ICSharpCode.SharpZipLib.Checksum;
- using ICSharpCode.SharpZipLib.Zip.Compression.Streams;
- namespace ICSharpCode.SharpZipLib.Zip.Compression
- {
- /// <summary>
- /// Inflater is used to decompress data that has been compressed according
- /// to the "deflate" standard described in rfc1951.
- ///
- /// By default Zlib (rfc1950) headers and footers are expected in the input.
- /// You can use constructor <code> public Inflater(bool noHeader)</code> passing true
- /// if there is no Zlib header information
- ///
- /// The usage is as following. First you have to set some input with
- /// <code>SetInput()</code>, then Inflate() it. If inflate doesn't
- /// inflate any bytes there may be three reasons:
- /// <ul>
- /// <li>IsNeedingInput() returns true because the input buffer is empty.
- /// You have to provide more input with <code>SetInput()</code>.
- /// NOTE: IsNeedingInput() also returns true when, the stream is finished.
- /// </li>
- /// <li>IsNeedingDictionary() returns true, you have to provide a preset
- /// dictionary with <code>SetDictionary()</code>.</li>
- /// <li>IsFinished returns true, the inflater has finished.</li>
- /// </ul>
- /// Once the first output byte is produced, a dictionary will not be
- /// needed at a later stage.
- ///
- /// author of the original java version : John Leuner, Jochen Hoenicke
- /// </summary>
- public class Inflater
- {
- #region Constants/Readonly
- /// <summary>
- /// Copy lengths for literal codes 257..285
- /// </summary>
- static readonly int[] CPLENS = {
- 3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 15, 17, 19, 23, 27, 31,
- 35, 43, 51, 59, 67, 83, 99, 115, 131, 163, 195, 227, 258
- };
- /// <summary>
- /// Extra bits for literal codes 257..285
- /// </summary>
- static readonly int[] CPLEXT = {
- 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2,
- 3, 3, 3, 3, 4, 4, 4, 4, 5, 5, 5, 5, 0
- };
- /// <summary>
- /// Copy offsets for distance codes 0..29
- /// </summary>
- static readonly int[] CPDIST = {
- 1, 2, 3, 4, 5, 7, 9, 13, 17, 25, 33, 49, 65, 97, 129, 193,
- 257, 385, 513, 769, 1025, 1537, 2049, 3073, 4097, 6145,
- 8193, 12289, 16385, 24577
- };
- /// <summary>
- /// Extra bits for distance codes
- /// </summary>
- static readonly int[] CPDEXT = {
- 0, 0, 0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6,
- 7, 7, 8, 8, 9, 9, 10, 10, 11, 11,
- 12, 12, 13, 13
- };
- /// <summary>
- /// These are the possible states for an inflater
- /// </summary>
- const int DECODE_HEADER = 0;
- const int DECODE_DICT = 1;
- const int DECODE_BLOCKS = 2;
- const int DECODE_STORED_LEN1 = 3;
- const int DECODE_STORED_LEN2 = 4;
- const int DECODE_STORED = 5;
- const int DECODE_DYN_HEADER = 6;
- const int DECODE_HUFFMAN = 7;
- const int DECODE_HUFFMAN_LENBITS = 8;
- const int DECODE_HUFFMAN_DIST = 9;
- const int DECODE_HUFFMAN_DISTBITS = 10;
- const int DECODE_CHKSUM = 11;
- const int FINISHED = 12;
- #endregion
- #region Instance Fields
- /// <summary>
- /// This variable contains the current state.
- /// </summary>
- int mode;
- /// <summary>
- /// The adler checksum of the dictionary or of the decompressed
- /// stream, as it is written in the header resp. footer of the
- /// compressed stream.
- /// Only valid if mode is DECODE_DICT or DECODE_CHKSUM.
- /// </summary>
- int readAdler;
- /// <summary>
- /// The number of bits needed to complete the current state. This
- /// is valid, if mode is DECODE_DICT, DECODE_CHKSUM,
- /// DECODE_HUFFMAN_LENBITS or DECODE_HUFFMAN_DISTBITS.
- /// </summary>
- int neededBits;
- int repLength;
- int repDist;
- int uncomprLen;
- /// <summary>
- /// True, if the last block flag was set in the last block of the
- /// inflated stream. This means that the stream ends after the
- /// current block.
- /// </summary>
- bool isLastBlock;
- /// <summary>
- /// The total number of inflated bytes.
- /// </summary>
- long totalOut;
- /// <summary>
- /// The total number of bytes set with setInput(). This is not the
- /// value returned by the TotalIn property, since this also includes the
- /// unprocessed input.
- /// </summary>
- long totalIn;
- /// <summary>
- /// This variable stores the noHeader flag that was given to the constructor.
- /// True means, that the inflated stream doesn't contain a Zlib header or
- /// footer.
- /// </summary>
- bool noHeader;
- readonly StreamManipulator input;
- OutputWindow outputWindow;
- InflaterDynHeader dynHeader;
- InflaterHuffmanTree litlenTree, distTree;
- Adler32 adler;
- #endregion
- #region Constructors
- /// <summary>
- /// Creates a new inflater or RFC1951 decompressor
- /// RFC1950/Zlib headers and footers will be expected in the input data
- /// </summary>
- public Inflater() : this(false)
- {
- }
- /// <summary>
- /// Creates a new inflater.
- /// </summary>
- /// <param name="noHeader">
- /// True if no RFC1950/Zlib header and footer fields are expected in the input data
- ///
- /// This is used for GZIPed/Zipped input.
- ///
- /// For compatibility with
- /// Sun JDK you should provide one byte of input more than needed in
- /// this case.
- /// </param>
- public Inflater(bool noHeader)
- {
- this.noHeader = noHeader;
- this.adler = new Adler32();
- input = new StreamManipulator();
- outputWindow = new OutputWindow();
- mode = noHeader ? DECODE_BLOCKS : DECODE_HEADER;
- }
- #endregion
- /// <summary>
- /// Resets the inflater so that a new stream can be decompressed. All
- /// pending input and output will be discarded.
- /// </summary>
- public void Reset()
- {
- mode = noHeader ? DECODE_BLOCKS : DECODE_HEADER;
- totalIn = 0;
- totalOut = 0;
- input.Reset();
- outputWindow.Reset();
- dynHeader = null;
- litlenTree = null;
- distTree = null;
- isLastBlock = false;
- adler.Reset();
- }
- /// <summary>
- /// Decodes a zlib/RFC1950 header.
- /// </summary>
- /// <returns>
- /// False if more input is needed.
- /// </returns>
- /// <exception cref="SharpZipBaseException">
- /// The header is invalid.
- /// </exception>
- private bool DecodeHeader()
- {
- int header = input.PeekBits(16);
- if (header < 0) {
- return false;
- }
- input.DropBits(16);
- // The header is written in "wrong" byte order
- header = ((header << 8) | (header >> 8)) & 0xffff;
- if (header % 31 != 0) {
- throw new SharpZipBaseException("Header checksum illegal");
- }
- if ((header & 0x0f00) != (Deflater.DEFLATED << 8)) {
- throw new SharpZipBaseException("Compression Method unknown");
- }
- /* Maximum size of the backwards window in bits.
- * We currently ignore this, but we could use it to make the
- * inflater window more space efficient. On the other hand the
- * full window (15 bits) is needed most times, anyway.
- int max_wbits = ((header & 0x7000) >> 12) + 8;
- */
- if ((header & 0x0020) == 0) { // Dictionary flag?
- mode = DECODE_BLOCKS;
- } else {
- mode = DECODE_DICT;
- neededBits = 32;
- }
- return true;
- }
- /// <summary>
- /// Decodes the dictionary checksum after the deflate header.
- /// </summary>
- /// <returns>
- /// False if more input is needed.
- /// </returns>
- private bool DecodeDict()
- {
- while (neededBits > 0) {
- int dictByte = input.PeekBits(8);
- if (dictByte < 0) {
- return false;
- }
- input.DropBits(8);
- readAdler = (readAdler << 8) | dictByte;
- neededBits -= 8;
- }
- return false;
- }
- /// <summary>
- /// Decodes the huffman encoded symbols in the input stream.
- /// </summary>
- /// <returns>
- /// false if more input is needed, true if output window is
- /// full or the current block ends.
- /// </returns>
- /// <exception cref="SharpZipBaseException">
- /// if deflated stream is invalid.
- /// </exception>
- private bool DecodeHuffman()
- {
- int free = outputWindow.GetFreeSpace();
- while (free >= 258) {
- int symbol;
- switch (mode) {
- case DECODE_HUFFMAN:
- // This is the inner loop so it is optimized a bit
- while (((symbol = litlenTree.GetSymbol(input)) & ~0xff) == 0) {
- outputWindow.Write(symbol);
- if (--free < 258) {
- return true;
- }
- }
- if (symbol < 257) {
- if (symbol < 0) {
- return false;
- } else {
- // symbol == 256: end of block
- distTree = null;
- litlenTree = null;
- mode = DECODE_BLOCKS;
- return true;
- }
- }
- try {
- repLength = CPLENS[symbol - 257];
- neededBits = CPLEXT[symbol - 257];
- } catch (Exception) {
- throw new SharpZipBaseException("Illegal rep length code");
- }
- goto case DECODE_HUFFMAN_LENBITS; // fall through
- case DECODE_HUFFMAN_LENBITS:
- if (neededBits > 0) {
- mode = DECODE_HUFFMAN_LENBITS;
- int i = input.PeekBits(neededBits);
- if (i < 0) {
- return false;
- }
- input.DropBits(neededBits);
- repLength += i;
- }
- mode = DECODE_HUFFMAN_DIST;
- goto case DECODE_HUFFMAN_DIST; // fall through
- case DECODE_HUFFMAN_DIST:
- symbol = distTree.GetSymbol(input);
- if (symbol < 0) {
- return false;
- }
- try {
- repDist = CPDIST[symbol];
- neededBits = CPDEXT[symbol];
- } catch (Exception) {
- throw new SharpZipBaseException("Illegal rep dist code");
- }
- goto case DECODE_HUFFMAN_DISTBITS; // fall through
- case DECODE_HUFFMAN_DISTBITS:
- if (neededBits > 0) {
- mode = DECODE_HUFFMAN_DISTBITS;
- int i = input.PeekBits(neededBits);
- if (i < 0) {
- return false;
- }
- input.DropBits(neededBits);
- repDist += i;
- }
- outputWindow.Repeat(repLength, repDist);
- free -= repLength;
- mode = DECODE_HUFFMAN;
- break;
- default:
- throw new SharpZipBaseException("Inflater unknown mode");
- }
- }
- return true;
- }
- /// <summary>
- /// Decodes the adler checksum after the deflate stream.
- /// </summary>
- /// <returns>
- /// false if more input is needed.
- /// </returns>
- /// <exception cref="SharpZipBaseException">
- /// If checksum doesn't match.
- /// </exception>
- private bool DecodeChksum()
- {
- while (neededBits > 0) {
- int chkByte = input.PeekBits(8);
- if (chkByte < 0) {
- return false;
- }
- input.DropBits(8);
- readAdler = (readAdler << 8) | chkByte;
- neededBits -= 8;
- }
- if ((int)adler.Value != readAdler) {
- throw new SharpZipBaseException("Adler chksum doesn't match: " + (int)adler.Value + " vs. " + readAdler);
- }
- mode = FINISHED;
- return false;
- }
- /// <summary>
- /// Decodes the deflated stream.
- /// </summary>
- /// <returns>
- /// false if more input is needed, or if finished.
- /// </returns>
- /// <exception cref="SharpZipBaseException">
- /// if deflated stream is invalid.
- /// </exception>
- private bool Decode()
- {
- switch (mode) {
- case DECODE_HEADER:
- return DecodeHeader();
- case DECODE_DICT:
- return DecodeDict();
- case DECODE_CHKSUM:
- return DecodeChksum();
- case DECODE_BLOCKS:
- if (isLastBlock) {
- if (noHeader) {
- mode = FINISHED;
- return false;
- } else {
- input.SkipToByteBoundary();
- neededBits = 32;
- mode = DECODE_CHKSUM;
- return true;
- }
- }
- int type = input.PeekBits(3);
- if (type < 0) {
- return false;
- }
- input.DropBits(3);
- isLastBlock |= (type & 1) != 0;
- switch (type >> 1) {
- case DeflaterConstants.STORED_BLOCK:
- input.SkipToByteBoundary();
- mode = DECODE_STORED_LEN1;
- break;
- case DeflaterConstants.STATIC_TREES:
- litlenTree = InflaterHuffmanTree.defLitLenTree;
- distTree = InflaterHuffmanTree.defDistTree;
- mode = DECODE_HUFFMAN;
- break;
- case DeflaterConstants.DYN_TREES:
- dynHeader = new InflaterDynHeader();
- mode = DECODE_DYN_HEADER;
- break;
- default:
- throw new SharpZipBaseException("Unknown block type " + type);
- }
- return true;
- case DECODE_STORED_LEN1: {
- if ((uncomprLen = input.PeekBits(16)) < 0) {
- return false;
- }
- input.DropBits(16);
- mode = DECODE_STORED_LEN2;
- }
- goto case DECODE_STORED_LEN2; // fall through
- case DECODE_STORED_LEN2: {
- int nlen = input.PeekBits(16);
- if (nlen < 0) {
- return false;
- }
- input.DropBits(16);
- if (nlen != (uncomprLen ^ 0xffff)) {
- throw new SharpZipBaseException("broken uncompressed block");
- }
- mode = DECODE_STORED;
- }
- goto case DECODE_STORED; // fall through
- case DECODE_STORED: {
- int more = outputWindow.CopyStored(input, uncomprLen);
- uncomprLen -= more;
- if (uncomprLen == 0) {
- mode = DECODE_BLOCKS;
- return true;
- }
- return !input.IsNeedingInput;
- }
- case DECODE_DYN_HEADER:
- if (!dynHeader.Decode(input)) {
- return false;
- }
- litlenTree = dynHeader.BuildLitLenTree();
- distTree = dynHeader.BuildDistTree();
- mode = DECODE_HUFFMAN;
- goto case DECODE_HUFFMAN; // fall through
- case DECODE_HUFFMAN:
- case DECODE_HUFFMAN_LENBITS:
- case DECODE_HUFFMAN_DIST:
- case DECODE_HUFFMAN_DISTBITS:
- return DecodeHuffman();
- case FINISHED:
- return false;
- default:
- throw new SharpZipBaseException("Inflater.Decode unknown mode");
- }
- }
- /// <summary>
- /// Sets the preset dictionary. This should only be called, if
- /// needsDictionary() returns true and it should set the same
- /// dictionary, that was used for deflating. The getAdler()
- /// function returns the checksum of the dictionary needed.
- /// </summary>
- /// <param name="buffer">
- /// The dictionary.
- /// </param>
- public void SetDictionary(byte[] buffer)
- {
- SetDictionary(buffer, 0, buffer.Length);
- }
- /// <summary>
- /// Sets the preset dictionary. This should only be called, if
- /// needsDictionary() returns true and it should set the same
- /// dictionary, that was used for deflating. The getAdler()
- /// function returns the checksum of the dictionary needed.
- /// </summary>
- /// <param name="buffer">
- /// The dictionary.
- /// </param>
- /// <param name="index">
- /// The index into buffer where the dictionary starts.
- /// </param>
- /// <param name="count">
- /// The number of bytes in the dictionary.
- /// </param>
- /// <exception cref="System.InvalidOperationException">
- /// No dictionary is needed.
- /// </exception>
- /// <exception cref="SharpZipBaseException">
- /// The adler checksum for the buffer is invalid
- /// </exception>
- public void SetDictionary(byte[] buffer, int index, int count)
- {
- if (buffer == null) {
- throw new ArgumentNullException("nameof(buffer)");
- }
- if (index < 0) {
- throw new ArgumentOutOfRangeException("nameof(index)");
- }
- if (count < 0) {
- throw new ArgumentOutOfRangeException("nameof(count)");
- }
- if (!IsNeedingDictionary) {
- throw new InvalidOperationException("Dictionary is not needed");
- }
- adler.Update(buffer, index, count);
- if ((int)adler.Value != readAdler) {
- throw new SharpZipBaseException("Wrong adler checksum");
- }
- adler.Reset();
- outputWindow.CopyDict(buffer, index, count);
- mode = DECODE_BLOCKS;
- }
- /// <summary>
- /// Sets the input. This should only be called, if needsInput()
- /// returns true.
- /// </summary>
- /// <param name="buffer">
- /// the input.
- /// </param>
- public void SetInput(byte[] buffer)
- {
- SetInput(buffer, 0, buffer.Length);
- }
- /// <summary>
- /// Sets the input. This should only be called, if needsInput()
- /// returns true.
- /// </summary>
- /// <param name="buffer">
- /// The source of input data
- /// </param>
- /// <param name="index">
- /// The index into buffer where the input starts.
- /// </param>
- /// <param name="count">
- /// The number of bytes of input to use.
- /// </param>
- /// <exception cref="System.InvalidOperationException">
- /// No input is needed.
- /// </exception>
- /// <exception cref="System.ArgumentOutOfRangeException">
- /// The index and/or count are wrong.
- /// </exception>
- public void SetInput(byte[] buffer, int index, int count)
- {
- input.SetInput(buffer, index, count);
- totalIn += (long)count;
- }
- /// <summary>
- /// Inflates the compressed stream to the output buffer. If this
- /// returns 0, you should check, whether IsNeedingDictionary(),
- /// IsNeedingInput() or IsFinished() returns true, to determine why no
- /// further output is produced.
- /// </summary>
- /// <param name="buffer">
- /// the output buffer.
- /// </param>
- /// <returns>
- /// The number of bytes written to the buffer, 0 if no further
- /// output can be produced.
- /// </returns>
- /// <exception cref="System.ArgumentOutOfRangeException">
- /// if buffer has length 0.
- /// </exception>
- /// <exception cref="System.FormatException">
- /// if deflated stream is invalid.
- /// </exception>
- public int Inflate(byte[] buffer)
- {
- if (buffer == null) {
- throw new ArgumentNullException("nameof(buffer)");
- }
- return Inflate(buffer, 0, buffer.Length);
- }
- /// <summary>
- /// Inflates the compressed stream to the output buffer. If this
- /// returns 0, you should check, whether needsDictionary(),
- /// needsInput() or finished() returns true, to determine why no
- /// further output is produced.
- /// </summary>
- /// <param name="buffer">
- /// the output buffer.
- /// </param>
- /// <param name="offset">
- /// the offset in buffer where storing starts.
- /// </param>
- /// <param name="count">
- /// the maximum number of bytes to output.
- /// </param>
- /// <returns>
- /// the number of bytes written to the buffer, 0 if no further output can be produced.
- /// </returns>
- /// <exception cref="System.ArgumentOutOfRangeException">
- /// if count is less than 0.
- /// </exception>
- /// <exception cref="System.ArgumentOutOfRangeException">
- /// if the index and / or count are wrong.
- /// </exception>
- /// <exception cref="System.FormatException">
- /// if deflated stream is invalid.
- /// </exception>
- public int Inflate(byte[] buffer, int offset, int count)
- {
- if (buffer == null) {
- throw new ArgumentNullException("nameof(buffer)");
- }
- if (count < 0) {
- throw new ArgumentOutOfRangeException("nameof(count)", "count cannot be negative");
- }
- if (offset < 0) {
- throw new ArgumentOutOfRangeException("nameof(offset)", "offset cannot be negative");
- }
- if (offset + count > buffer.Length) {
- throw new ArgumentException("count exceeds buffer bounds");
- }
- // Special case: count may be zero
- if (count == 0) {
- if (!IsFinished) { // -jr- 08-Nov-2003 INFLATE_BUG fix..
- Decode();
- }
- return 0;
- }
- int bytesCopied = 0;
- do {
- if (mode != DECODE_CHKSUM) {
- /* Don't give away any output, if we are waiting for the
- * checksum in the input stream.
- *
- * With this trick we have always:
- * IsNeedingInput() and not IsFinished()
- * implies more output can be produced.
- */
- int more = outputWindow.CopyOutput(buffer, offset, count);
- if (more > 0) {
- adler.Update(buffer, offset, more);
- offset += more;
- bytesCopied += more;
- totalOut += (long)more;
- count -= more;
- if (count == 0) {
- return bytesCopied;
- }
- }
- }
- } while (Decode() || ((outputWindow.GetAvailable() > 0) && (mode != DECODE_CHKSUM)));
- return bytesCopied;
- }
- /// <summary>
- /// Returns true, if the input buffer is empty.
- /// You should then call setInput().
- /// NOTE: This method also returns true when the stream is finished.
- /// </summary>
- public bool IsNeedingInput {
- get {
- return input.IsNeedingInput;
- }
- }
- /// <summary>
- /// Returns true, if a preset dictionary is needed to inflate the input.
- /// </summary>
- public bool IsNeedingDictionary {
- get {
- return mode == DECODE_DICT && neededBits == 0;
- }
- }
- /// <summary>
- /// Returns true, if the inflater has finished. This means, that no
- /// input is needed and no output can be produced.
- /// </summary>
- public bool IsFinished {
- get {
- return mode == FINISHED && outputWindow.GetAvailable() == 0;
- }
- }
- /// <summary>
- /// Gets the adler checksum. This is either the checksum of all
- /// uncompressed bytes returned by inflate(), or if needsDictionary()
- /// returns true (and thus no output was yet produced) this is the
- /// adler checksum of the expected dictionary.
- /// </summary>
- /// <returns>
- /// the adler checksum.
- /// </returns>
- public int Adler {
- get {
- return IsNeedingDictionary ? readAdler : (int)adler.Value;
- }
- }
- /// <summary>
- /// Gets the total number of output bytes returned by Inflate().
- /// </summary>
- /// <returns>
- /// the total number of output bytes.
- /// </returns>
- public long TotalOut {
- get {
- return totalOut;
- }
- }
- /// <summary>
- /// Gets the total number of processed compressed input bytes.
- /// </summary>
- /// <returns>
- /// The total number of bytes of processed input bytes.
- /// </returns>
- public long TotalIn {
- get {
- return totalIn - (long)RemainingInput;
- }
- }
- /// <summary>
- /// Gets the number of unprocessed input bytes. Useful, if the end of the
- /// stream is reached and you want to further process the bytes after
- /// the deflate stream.
- /// </summary>
- /// <returns>
- /// The number of bytes of the input which have not been processed.
- /// </returns>
- public int RemainingInput {
- // TODO: This should be a long?
- get {
- return input.AvailableBytes;
- }
- }
- }
- }
|