// Mirror of https://github.com/ClassiCube/ClassiCube.git (synced 2025-01-22 17:12:25 -05:00).
// Listing metadata: 1819 lines, 73 KiB, C#, no EOL at end of file.
// Copyright (c) 2009-2011 Dino Chiesa and Microsoft Corporation.
|
|
// All rights reserved.
|
|
// This code module is part of DotNetZip, a zipfile class library.
|
|
|
|
// This code is licensed under the Microsoft Public License.
|
|
// See the file License.txt for the license details.
|
|
// More info on: http://dotnetzip.codeplex.com
|
|
|
|
|
|
using System;
|
|
|
|
namespace Ionic.Zlib
|
|
{
|
|
|
|
// Outcome reported by a compression routine after one pass over the input.
internal enum BlockState
{
    // Block not completed: more input or more output space is needed.
    NeedMore = 0,

    // A block flush was performed.
    BlockDone = 1,

    // Finish has started: only more output is needed at the next deflate call.
    FinishStarted = 2,

    // Finish is done: no more input or output is accepted.
    FinishDone = 3
}
|
|
|
|
// Tag attached to each compression-level configuration (see
// DeflateManager.Config): level 0 is tagged Store, levels 1-3 Fast and
// levels 4-9 Slow.
internal enum DeflateFlavor
{
    Store = 0,
    Fast = 1,
    Slow = 2
}
|
|
|
|
internal sealed class DeflateManager
|
|
{
|
|
private static readonly int MEM_LEVEL_MAX = 9;
|
|
private static readonly int MEM_LEVEL_DEFAULT = 8;
|
|
|
|
internal delegate BlockState CompressFunc(FlushType flush);
|
|
|
|
// Search-effort parameters for a single compression level, together with the
// table that maps each CompressionLevel value to its parameters.
internal class Config
{
    // Indexed by the integer value of a CompressionLevel (0..9); populated
    // once by the static constructor.
    private static readonly Config[] Table;

    // Use a faster search when the previous match is longer than this.
    internal int GoodLength; // reduce lazy search above this match length

    // Attempt to find a better match only when the current match is strictly
    // smaller than this value. This mechanism is used only for compression
    // levels >= 4. For levels 1,2,3: MaxLazy is actually MaxInsertLength.
    // (See DeflateFast)
    internal int MaxLazy; // do not perform lazy search above this match length

    internal int NiceLength; // quit search above this match length

    // To speed up deflation, hash chains are never searched beyond this
    // length. A higher limit improves compression ratio but degrades the speed.
    internal int MaxChainLength;

    // Which family of compression routine this level is tagged with.
    internal DeflateFlavor Flavor;

    static Config()
    {
        Config[] levels = new Config[10];

        // Level 0: no compression.
        levels[0] = new Config(0, 0, 0, 0, DeflateFlavor.Store);

        // Levels 1-3.
        levels[1] = new Config(4, 4, 8, 4, DeflateFlavor.Fast);
        levels[2] = new Config(4, 5, 16, 8, DeflateFlavor.Fast);
        levels[3] = new Config(4, 6, 32, 32, DeflateFlavor.Fast);

        // Levels 4-9.
        levels[4] = new Config(4, 4, 16, 16, DeflateFlavor.Slow);
        levels[5] = new Config(8, 16, 32, 32, DeflateFlavor.Slow);
        levels[6] = new Config(8, 16, 128, 128, DeflateFlavor.Slow);
        levels[7] = new Config(8, 32, 128, 256, DeflateFlavor.Slow);
        levels[8] = new Config(32, 128, 258, 1024, DeflateFlavor.Slow);
        levels[9] = new Config(32, 258, 258, 4096, DeflateFlavor.Slow);

        Table = levels;
    }

    private Config(int goodLength, int maxLazy, int niceLength, int maxChainLength, DeflateFlavor flavor)
    {
        GoodLength = goodLength;
        MaxLazy = maxLazy;
        NiceLength = niceLength;
        MaxChainLength = maxChainLength;
        Flavor = flavor;
    }

    // Returns the shared configuration for the given level. The level's
    // integer value is used directly as the table index, so a value outside
    // 0..9 makes the array access throw.
    public static Config Lookup(CompressionLevel level)
    {
        int index = (int)level;
        return Table[index];
    }
}
|
|
|
|
|
|
private CompressFunc DeflateFunction;
|
|
|
|
private static readonly System.String[] _ErrorMessage = new System.String[]
|
|
{
|
|
"need dictionary",
|
|
"stream end",
|
|
"",
|
|
"file error",
|
|
"stream error",
|
|
"data error",
|
|
"insufficient memory",
|
|
"buffer error",
|
|
"incompatible version",
|
|
""
|
|
};
|
|
|
|
// preset dictionary flag in zlib header
|
|
private static readonly int PRESET_DICT = 0x20;
|
|
|
|
private static readonly int INIT_STATE = 42;
|
|
private static readonly int BUSY_STATE = 113;
|
|
private static readonly int FINISH_STATE = 666;
|
|
|
|
// The deflate compression method
|
|
private static readonly int Z_DEFLATED = 8;
|
|
|
|
private static readonly int STORED_BLOCK = 0;
|
|
private static readonly int STATIC_TREES = 1;
|
|
private static readonly int DYN_TREES = 2;
|
|
|
|
// The three kinds of block type
|
|
private static readonly int Z_BINARY = 0;
|
|
private static readonly int Z_ASCII = 1;
|
|
private static readonly int Z_UNKNOWN = 2;
|
|
|
|
private static readonly int Buf_size = 8 * 2;
|
|
|
|
private static readonly int MIN_MATCH = 3;
|
|
private static readonly int MAX_MATCH = 258;
|
|
|
|
private static readonly int MIN_LOOKAHEAD = (MAX_MATCH + MIN_MATCH + 1);
|
|
|
|
private static readonly int HEAP_SIZE = (2 * InternalConstants.L_CODES + 1);
|
|
|
|
private static readonly int END_BLOCK = 256;
|
|
|
|
internal ZlibCodec _codec; // the zlib encoder/decoder
|
|
internal int status; // as the name implies
|
|
internal byte[] pending; // output still pending - waiting to be compressed
|
|
internal int nextPending; // index of next pending byte to output to the stream
|
|
internal int pendingCount; // number of bytes in the pending buffer
|
|
|
|
internal sbyte data_type; // UNKNOWN, BINARY or ASCII
|
|
internal int last_flush; // value of flush param for previous deflate call
|
|
|
|
internal int w_size; // LZ77 window size (32K by default)
|
|
internal int w_bits; // log2(w_size) (8..16)
|
|
internal int w_mask; // w_size - 1
|
|
|
|
//internal byte[] dictionary;
|
|
internal byte[] window;
|
|
|
|
// Sliding window. Input bytes are read into the second half of the window,
|
|
// and move to the first half later to keep a dictionary of at least wSize
|
|
// bytes. With this organization, matches are limited to a distance of
|
|
// wSize-MAX_MATCH bytes, but this ensures that IO is always
|
|
// performed with a length multiple of the block size.
|
|
//
|
|
// To do: use the user input buffer as sliding window.
|
|
|
|
internal int window_size;
|
|
// Actual size of window: 2*wSize, except when the user input buffer
|
|
// is directly used as sliding window.
|
|
|
|
internal short[] prev;
|
|
// Link to older string with same hash index. To limit the size of this
|
|
// array to 64K, this link is maintained only for the last 32K strings.
|
|
// An index in this array is thus a window index modulo 32K.
|
|
|
|
internal short[] head; // Heads of the hash chains or NIL.
|
|
|
|
internal int ins_h; // hash index of string to be inserted
|
|
internal int hash_size; // number of elements in hash table
|
|
internal int hash_bits; // log2(hash_size)
|
|
internal int hash_mask; // hash_size-1
|
|
|
|
// Number of bits by which ins_h must be shifted at each input
|
|
// step. It must be such that after MIN_MATCH steps, the oldest
|
|
// byte no longer takes part in the hash key, that is:
|
|
// hash_shift * MIN_MATCH >= hash_bits
|
|
internal int hash_shift;
|
|
|
|
// Window position at the beginning of the current output block. Gets
|
|
// negative when the window is moved backwards.
|
|
|
|
internal int block_start;
|
|
|
|
Config config;
|
|
internal int match_length; // length of best match
|
|
internal int prev_match; // previous match
|
|
internal int match_available; // set if previous match exists
|
|
internal int strstart; // start of string to insert into.....????
|
|
internal int match_start; // start of matching string
|
|
internal int lookahead; // number of valid bytes ahead in window
|
|
|
|
// Length of the best match at previous step. Matches not greater than this
|
|
// are discarded. This is used in the lazy match evaluation.
|
|
internal int prev_length;
|
|
|
|
// Insert new strings in the hash table only if the match length is not
|
|
// greater than this length. This saves time but degrades compression.
|
|
// max_insert_length is used only for compression levels <= 3.
|
|
|
|
internal CompressionLevel compressionLevel; // compression level (1..9)
|
|
internal CompressionStrategy compressionStrategy; // favor or force Huffman coding
|
|
|
|
|
|
internal short[] dyn_ltree; // literal and length tree
|
|
internal short[] dyn_dtree; // distance tree
|
|
internal short[] bl_tree; // Huffman tree for bit lengths
|
|
|
|
internal Tree treeLiterals = new Tree(); // desc for literal tree
|
|
internal Tree treeDistances = new Tree(); // desc for distance tree
|
|
internal Tree treeBitLengths = new Tree(); // desc for bit length tree
|
|
|
|
// number of codes at each bit length for an optimal tree
|
|
internal short[] bl_count = new short[InternalConstants.MAX_BITS + 1];
|
|
|
|
// heap used to build the Huffman trees
|
|
internal int[] heap = new int[2 * InternalConstants.L_CODES + 1];
|
|
|
|
internal int heap_len; // number of elements in the heap
|
|
internal int heap_max; // element of largest frequency
|
|
|
|
// The sons of heap[n] are heap[2*n] and heap[2*n+1]. heap[0] is not used.
|
|
// The same heap array is used to build all trees.
|
|
|
|
// Depth of each subtree used as tie breaker for trees of equal frequency
|
|
internal sbyte[] depth = new sbyte[2 * InternalConstants.L_CODES + 1];
|
|
|
|
internal int _lengthOffset; // index for literals or lengths
|
|
|
|
|
|
// Size of match buffer for literals/lengths. There are 4 reasons for
|
|
// limiting lit_bufsize to 64K:
|
|
// - frequencies can be kept in 16 bit counters
|
|
// - if compression is not successful for the first block, all input
|
|
// data is still in the window so we can still emit a stored block even
|
|
// when input comes from standard input. (This can also be done for
|
|
// all blocks if lit_bufsize is not greater than 32K.)
|
|
// - if compression is not successful for a file smaller than 64K, we can
|
|
// even emit a stored file instead of a stored block (saving 5 bytes).
|
|
// This is applicable only for zip (not gzip or zlib).
|
|
// - creating new Huffman trees less frequently may not provide fast
|
|
// adaptation to changes in the input data statistics. (Take for
|
|
// example a binary file with poorly compressible code followed by
|
|
// a highly compressible string table.) Smaller buffer sizes give
|
|
// fast adaptation but have of course the overhead of transmitting
|
|
// trees more frequently.
|
|
|
|
internal int lit_bufsize;
|
|
|
|
internal int last_lit; // running index in l_buf
|
|
|
|
// Buffer for distances. To simplify the code, d_buf and l_buf have
|
|
// the same number of elements. To use different lengths, an extra flag
|
|
// array would be necessary.
|
|
|
|
internal int _distanceOffset; // index into pending; points to distance data??
|
|
|
|
internal int opt_len; // bit length of current block with optimal trees
|
|
internal int static_len; // bit length of current block with static trees
|
|
internal int matches; // number of string matches in current block
|
|
internal int last_eob_len; // bit length of EOB code for last block
|
|
|
|
// Output buffer. bits are inserted starting at the bottom (least
|
|
// significant bits).
|
|
internal short bi_buf;
|
|
|
|
// Number of valid bits in bi_buf. All bits above the last valid bit
|
|
// are always zero.
|
|
internal int bi_valid;
|
|
|
|
|
|
// Allocates the three dynamic Huffman tree arrays. Each tree is a flat
// short[] with two slots per node, hence the trailing "* 2".
internal DeflateManager()
{
    int literalNodes = HEAP_SIZE;
    int distanceNodes = 2 * InternalConstants.D_CODES + 1;
    int bitLengthNodes = 2 * InternalConstants.BL_CODES + 1;

    dyn_ltree = new short[literalNodes * 2];   // literal and length tree
    dyn_dtree = new short[distanceNodes * 2];  // distance tree
    bl_tree = new short[bitLengthNodes * 2];   // Huffman tree for bit lengths
}
|
|
|
|
|
|
// lm_init: resets the match-finder state. Sizes the window to twice w_size,
// empties the hash heads, picks the Config for the current compression level,
// selects the compression routine via SetDeflater(), and zeroes the
// string/match bookkeeping.
private void _InitializeLazyMatch()
{
    window_size = w_size * 2;

    // clear the hash - workitem 9063
    Array.Clear(head, 0, hash_size);

    config = Config.Lookup(compressionLevel);
    SetDeflater();

    // No match has been found yet: both lengths start just below MIN_MATCH.
    prev_length = MIN_MATCH - 1;
    match_length = prev_length;
    match_available = 0;

    ins_h = 0;
    lookahead = 0;
    block_start = 0;
    strstart = 0;
}
|
|
|
|
// Initialize the tree data structures for a new zlib stream: bind every tree
// descriptor to its dynamic array and static tree, empty the bit buffer, and
// reset the per-block counters.
private void _InitializeTreeData()
{
    // Dynamic arrays.
    treeLiterals.dyn_tree = dyn_ltree;
    treeDistances.dyn_tree = dyn_dtree;
    treeBitLengths.dyn_tree = bl_tree;

    // Matching static trees.
    treeLiterals.staticTree = StaticTree.Literals;
    treeDistances.staticTree = StaticTree.Distances;
    treeBitLengths.staticTree = StaticTree.BitLengths;

    // Empty bit buffer.
    bi_valid = 0;
    bi_buf = 0;

    last_eob_len = 8; // enough lookahead for inflate

    // Initialize the first block of the first file.
    _InitializeBlocks();
}
|
|
|
|
// Prepares the dynamic trees for a new block: zeroes the first (even) slot of
// every node in the three trees, counts one END_BLOCK symbol, and resets the
// per-block length and tally counters.
internal void _InitializeBlocks()
{
    // Walk the even slots directly instead of multiplying a node index by 2.
    for (int slot = 0; slot < InternalConstants.L_CODES * 2; slot += 2)
    {
        dyn_ltree[slot] = 0;
    }
    for (int slot = 0; slot < InternalConstants.D_CODES * 2; slot += 2)
    {
        dyn_dtree[slot] = 0;
    }
    for (int slot = 0; slot < InternalConstants.BL_CODES * 2; slot += 2)
    {
        bl_tree[slot] = 0;
    }

    // Every block ends with exactly one END_BLOCK symbol.
    dyn_ltree[END_BLOCK * 2] = 1;

    static_len = 0;
    opt_len = 0;
    matches = 0;
    last_lit = 0;
}
|
|
|
|
// Restores the heap property by sifting the node at position k down the heap:
// the node is swapped with the smaller of its two sons until it is smaller
// than both (each father smaller than its two sons).
//   tree - tree whose node values order the heap (see _IsSmaller)
//   k    - heap position of the node to move down
internal void pqdownheap(short[] tree, int k)
{
    int moving = heap[k];

    // son starts as the left son of k and is doubled on every level descended.
    for (int son = k << 1; son <= heap_len; son <<= 1)
    {
        // Pick the smaller of the two sons.
        if (son < heap_len && _IsSmaller(tree, heap[son + 1], heap[son], depth))
        {
            son++;
        }

        // Stop once the moving node is smaller than both sons.
        if (_IsSmaller(tree, moving, heap[son], depth))
        {
            break;
        }

        // Pull the smaller son up and continue from its old position.
        heap[k] = heap[son];
        k = son;
    }

    heap[k] = moving;
}
|
|
|
|
// Heap ordering for tree nodes n and m: the node whose first slot
// (tree[node * 2]) is lower is smaller; when those are equal the node with
// the lower-or-equal depth counts as smaller.
internal static bool _IsSmaller(short[] tree, int n, int m, sbyte[] depth)
{
    short valueN = tree[n * 2];
    short valueM = tree[m * 2];

    if (valueN != valueM)
    {
        return valueN < valueM;
    }

    // Tie: fall back to subtree depth.
    return depth[n] <= depth[m];
}
|
|
|
|
|
|
// Scan a literal or distance tree to determine the frequencies of the codes
// in the bit length tree. Runs of equal code lengths are tallied the way
// send_tree will later emit them: short runs count the length itself, longer
// runs count one of the repeat codes (REP_3_6, REPZ_3_10, REPZ_11_138).
//   tree     - tree whose code lengths (odd slots) are scanned
//   max_code - index of the last node to scan
internal void scan_tree(short[] tree, int max_code)
{
    int prevlen = -1;        // last emitted length
    int nextlen = tree[1];   // length of next code (node 0)
    int count = 0;           // repeat count of the current code
    int max_count;           // max repeat count
    int min_count;           // min repeat count

    if (nextlen == 0)
    {
        max_count = 138;
        min_count = 3;
    }
    else
    {
        max_count = 7;
        min_count = 4;
    }

    // Guard: a length no real code has, stored just past the last node so the
    // final run is always terminated.
    tree[(max_code + 1) * 2 + 1] = (short)0x7fff;

    for (int n = 0; n <= max_code; n++)
    {
        int curlen = nextlen; // length of current code
        nextlen = tree[(n + 1) * 2 + 1];
        count++;

        // Still inside a run that can grow: keep counting.
        if (count < max_count && curlen == nextlen)
        {
            continue;
        }

        if (count < min_count)
        {
            // Too short for a repeat code: each length is sent individually.
            bl_tree[curlen * 2] = (short)(bl_tree[curlen * 2] + count);
        }
        else if (curlen != 0)
        {
            if (curlen != prevlen)
            {
                bl_tree[curlen * 2]++;
            }
            bl_tree[InternalConstants.REP_3_6 * 2]++;
        }
        else if (count <= 10)
        {
            bl_tree[InternalConstants.REPZ_3_10 * 2]++;
        }
        else
        {
            bl_tree[InternalConstants.REPZ_11_138 * 2]++;
        }

        // Start a new run and choose its limits from what follows.
        count = 0;
        prevlen = curlen;
        if (nextlen == 0)
        {
            max_count = 138;
            min_count = 3;
        }
        else if (curlen == nextlen)
        {
            max_count = 6;
            min_count = 3;
        }
        else
        {
            max_count = 7;
            min_count = 4;
        }
    }
}
|
|
|
|
// Construct the Huffman tree for the bit lengths and return the index in
// bl_order of the last bit length code to send. Also adds the cost of the
// bit length tree and of the three count fields to opt_len.
internal int build_bl_tree()
{
    // Determine the bit length frequencies for literal and distance trees.
    scan_tree(dyn_ltree, treeLiterals.max_code);
    scan_tree(dyn_dtree, treeDistances.max_code);

    // Build the bit length tree.
    // opt_len now includes the length of the tree representations, except
    // the lengths of the bit lengths codes and the 5+5+4 bits for the counts.
    treeBitLengths.build_tree(this);

    // Determine the number of bit length codes to send. The pkzip format
    // requires that at least 4 bit length codes be sent. (appnote.txt says
    // 3 but the actual value used is 4.) The search therefore never goes
    // below index 3 and ends at 2 only when nothing non-zero was found.
    int lastIndex = InternalConstants.BL_CODES - 1;
    while (lastIndex >= 3 && bl_tree[Tree.bl_order[lastIndex] * 2 + 1] == 0)
    {
        lastIndex--;
    }

    // Update opt_len to include the bit length tree and counts.
    opt_len += 3 * (lastIndex + 1) + 5 + 5 + 4;

    return lastIndex;
}
|
|
|
|
|
|
// Send the header for a block using dynamic Huffman trees: the counts, the
// lengths of the bit length codes, the literal tree and the distance tree.
// IN assertion: lcodes >= 257, dcodes >= 1, blcodes >= 4.
//   lcodes  - number of literal/length codes
//   dcodes  - number of distance codes
//   blcodes - number of bit length codes
internal void send_all_trees(int lcodes, int dcodes, int blcodes)
{
    // The three counts, each biased by its minimum.
    send_bits(lcodes - 257, 5); // not +255 as stated in appnote.txt
    send_bits(dcodes - 1, 5);
    send_bits(blcodes - 4, 4);  // not -3 as stated in appnote.txt

    // Bit length code lengths, 3 bits each, in bl_order order.
    int rank = 0; // index in bl_order
    while (rank < blcodes)
    {
        int lengthSlot = Tree.bl_order[rank] * 2 + 1;
        send_bits(bl_tree[lengthSlot], 3);
        rank++;
    }

    send_tree(dyn_ltree, lcodes - 1); // literal tree
    send_tree(dyn_dtree, dcodes - 1); // distance tree
}
|
|
|
|
// Send a literal or distance tree in compressed form, using the codes in
// bl_tree. Code lengths are run-length encoded: short runs are sent length by
// length, longer runs use REP_3_6 (2 extra bits), REPZ_3_10 (3 extra bits) or
// REPZ_11_138 (7 extra bits).
//   tree     - tree whose code lengths (odd slots) are sent
//   max_code - index of the last node to send
internal void send_tree(short[] tree, int max_code)
{
    int prevlen = -1;        // last emitted length
    int nextlen = tree[1];   // length of next code (node 0)
    int count = 0;           // repeat count of the current code
    int max_count;           // max repeat count
    int min_count;           // min repeat count

    if (nextlen == 0)
    {
        max_count = 138;
        min_count = 3;
    }
    else
    {
        max_count = 7;
        min_count = 4;
    }

    for (int n = 0; n <= max_code; n++)
    {
        int curlen = nextlen; // length of current code
        nextlen = tree[(n + 1) * 2 + 1];
        count++;

        // Still inside a run that can grow: keep counting.
        if (count < max_count && curlen == nextlen)
        {
            continue;
        }

        if (count < min_count)
        {
            // Too short for a repeat code: send the length count times
            // (count is at least 1 here).
            for (int sent = 0; sent < count; sent++)
            {
                send_code(curlen, bl_tree);
            }
        }
        else if (curlen != 0)
        {
            // A new non-zero length is sent once, then the rest as a repeat.
            if (curlen != prevlen)
            {
                send_code(curlen, bl_tree);
                count--;
            }
            send_code(InternalConstants.REP_3_6, bl_tree);
            send_bits(count - 3, 2);
        }
        else if (count <= 10)
        {
            send_code(InternalConstants.REPZ_3_10, bl_tree);
            send_bits(count - 3, 3);
        }
        else
        {
            send_code(InternalConstants.REPZ_11_138, bl_tree);
            send_bits(count - 11, 7);
        }

        // Start a new run and choose its limits from what follows.
        count = 0;
        prevlen = curlen;
        if (nextlen == 0)
        {
            max_count = 138;
            min_count = 3;
        }
        else if (curlen == nextlen)
        {
            max_count = 6;
            min_count = 3;
        }
        else
        {
            max_count = 7;
            min_count = 4;
        }
    }
}
|
|
|
|
// Output a block of bytes on the stream: appends len bytes of p, starting at
// index start, to the pending buffer and advances pendingCount.
// IN assertion: there is enough room in pending_buf.
private void put_bytes(byte[] p, int start, int len)
{
    int destination = pendingCount;
    Array.Copy(p, start, pending, destination, len);
    pendingCount = destination + len;
}
|
|
|
|
#if NOTNEEDED
// Compiled only when NOTNEEDED is defined; the rest of the class writes to
// the pending buffer inline instead of calling these helpers.

// Appends one byte to the pending buffer.
private void put_byte(byte c)
{
    pending[pendingCount] = c;
    pendingCount++;
}

// Appends the low 16 bits of b, least significant byte first.
internal void put_short(int b)
{
    unchecked
    {
        byte low = (byte)b;
        byte high = (byte)(b >> 8);
        pending[pendingCount++] = low;
        pending[pendingCount++] = high;
    }
}

// Appends the low 16 bits of b, most significant byte first.
internal void putShortMSB(int b)
{
    unchecked
    {
        byte high = (byte)(b >> 8);
        byte low = (byte)b;
        pending[pendingCount++] = high;
        pending[pendingCount++] = low;
    }
}
#endif
|
|
|
|
// Sends the code for symbol c from the given tree: the even slot of the node
// holds the bits to send, the odd slot the number of bits. Both are masked to
// 16 bits so the short values are treated as unsigned.
internal void send_code(int c, short[] tree)
{
    int slot = c * 2;
    int codeBits = tree[slot] & 0xffff;
    int codeLength = tree[slot + 1] & 0xffff;
    send_bits(codeBits, codeLength);
}
|
|
|
|
// Appends the low `length` bits of `value` to the 16-bit bit buffer, least
// significant bit first. When the buffer cannot hold all of them it is filled,
// written to the pending buffer as two bytes (low byte first), and the bits
// of value that did not fit become the new buffer contents.
internal void send_bits(int value, int length)
{
    unchecked
    {
        // Decide before touching bi_buf whether the new bits overflow it.
        bool overflows = bi_valid > (int)Buf_size - length;

        // Both cases start by merging whatever fits into the buffer.
        bi_buf |= (short)((value << bi_valid) & 0xffff);

        if (!overflows)
        {
            bi_valid += length;
            return;
        }

        // Buffer is full: write it out.
        pending[pendingCount++] = (byte)bi_buf;
        pending[pendingCount++] = (byte)(bi_buf >> 8);

        // Keep the bits of value that were shifted out above.
        bi_buf = (short)((uint)value >> (Buf_size - bi_valid));
        bi_valid += length - Buf_size;
    }
}
|
|
|
|
// Send one empty static block to give enough lookahead for inflate.
// This takes 10 bits, of which 7 may remain in the bit buffer.
// The current inflate code requires 9 bits of lookahead. If the
// last two codes for the previous block (real code plus EOB) were coded
// on 5 bits or less, inflate may have only 5+3 bits of lookahead to decode
// the last real code. In this case we send two empty static blocks instead
// of one. (There are no problems if the previous block is stored or fixed.)
// To simplify the code, we assume the worst case of last real code encoded
// on one bit only.
internal void _tr_align()
{
    int blockHeader = STATIC_TREES << 1;

    // First empty static block: 3-bit header followed by END_BLOCK.
    send_bits(blockHeader, 3);
    send_code(END_BLOCK, StaticTree.lengthAndLiteralsTreeCodes);
    bi_flush();

    // Of the 10 bits for the empty block, we have already sent
    // (10 - bi_valid) bits. The lookahead for the last real code (before
    // the EOB of the previous block) was thus at least one plus the length
    // of the EOB plus what we have just sent of the empty static block.
    int guaranteedLookahead = 1 + last_eob_len + 10 - bi_valid;
    if (guaranteedLookahead < 9)
    {
        // Not enough yet: send a second empty static block.
        send_bits(blockHeader, 3);
        send_code(END_BLOCK, StaticTree.lengthAndLiteralsTreeCodes);
        bi_flush();
    }

    last_eob_len = 7;
}
|
|
|
|
|
|
// Save the match info and tally the frequency counts. Return true if
// the current block must be flushed.
//   dist - match distance, or 0 when lc is a literal
//   lc   - the unmatched char when dist == 0, otherwise match length - MIN_MATCH
internal bool _tr_tally(int dist, int lc)
{
    // Record the pair: distance as two bytes (high byte first) in the
    // distance area of pending, lc as one byte in the length area.
    int distanceSlot = _distanceOffset + last_lit * 2;
    pending[distanceSlot] = unchecked((byte)((uint)dist >> 8));
    pending[distanceSlot + 1] = unchecked((byte)dist);
    pending[_lengthOffset + last_lit] = unchecked((byte)lc);
    last_lit++;

    if (dist != 0)
    {
        matches++;
        // Here, lc is the match length - MIN_MATCH
        dist--; // dist = match distance - 1
        dyn_ltree[(Tree.LengthCode[lc] + InternalConstants.LITERALS + 1) * 2]++;
        dyn_dtree[Tree.DistanceCode(dist) * 2]++;
    }
    else
    {
        // lc is the unmatched char
        dyn_ltree[lc * 2]++;
    }

    // Every 0x2000 entries (levels above 2 only), estimate whether flushing
    // now is worthwhile.
    bool onCheckpoint = (last_lit & 0x1fff) == 0;
    if (onCheckpoint && (int)compressionLevel > 2)
    {
        // Compute an upper bound for the compressed length
        int out_length = last_lit << 3;
        int in_length = strstart - block_start;

        for (int dcode = 0; dcode < InternalConstants.D_CODES; dcode++)
        {
            out_length = (int)(out_length + (int)dyn_dtree[dcode * 2] * (5L + Tree.ExtraDistanceBits[dcode]));
        }
        out_length >>= 3;

        if (matches < (last_lit / 2) && out_length < in_length / 2)
        {
            return true;
        }
    }

    int capacity = lit_bufsize;
    return last_lit == capacity - 1 || last_lit == capacity;
    // dinoch - wraparound?
    // We avoid equality with lit_bufsize because of wraparound at 64K
    // on 16 bit machines and because stored blocks are restricted to
    // 64K-1 bytes.
}
|
|
|
|
|
|
|
|
// Send the block data compressed using the given Huffman trees: replays the
// literal / (length, distance) entries recorded by _tr_tally, then sends
// END_BLOCK and records its code length in last_eob_len.
//   ltree - literal/length tree to encode with
//   dtree - distance tree to encode with
internal void send_compressed_block(short[] ltree, short[] dtree)
{
    int lx = 0; // running index in l_buf

    if (last_lit != 0)
    {
        do
        {
            // Distance is stored as two bytes, high byte first.
            int ix = _distanceOffset + lx * 2;
            int distance = ((pending[ix] << 8) & 0xff00) | (pending[ix + 1] & 0xff);

            // match length or unmatched char (if distance == 0)
            int lc = pending[_lengthOffset + lx] & 0xff;
            lx++;

            if (distance == 0)
            {
                send_code(lc, ltree); // send a literal byte
                continue;
            }

            // Match pair. Here, lc is the match length - MIN_MATCH.
            int lengthCode = Tree.LengthCode[lc];
            send_code(lengthCode + InternalConstants.LITERALS + 1, ltree);

            int extraLengthBits = Tree.ExtraLengthBits[lengthCode];
            if (extraLengthBits != 0)
            {
                // send the extra length bits
                lc -= Tree.LengthBase[lengthCode];
                send_bits(lc, extraLengthBits);
            }

            distance--; // distance is now the match distance - 1
            int distanceCode = Tree.DistanceCode(distance);
            send_code(distanceCode, dtree);

            int extraDistanceBits = Tree.ExtraDistanceBits[distanceCode];
            if (extraDistanceBits != 0)
            {
                // send the extra distance bits
                distance -= Tree.DistanceBase[distanceCode];
                send_bits(distance, extraDistanceBits);
            }
        }
        while (lx < last_lit);
    }

    send_code(END_BLOCK, ltree);
    last_eob_len = ltree[END_BLOCK * 2 + 1];
}
|
|
|
|
|
|
|
|
// Set the data type to ASCII or BINARY, using a crude approximation:
// binary if more than 20% of the bytes are <= 6 or >= 128, ascii otherwise.
// IN assertion: the fields freq of dyn_ltree are set and the total of all
// frequencies does not exceed 64K (to fit in an int on 16 bit machines).
internal void set_data_type()
{
    int binaryCount = 0;
    int asciiCount = 0;

    // Literals 0..6 count as binary.
    for (int literal = 0; literal < 7; literal++)
    {
        binaryCount += dyn_ltree[literal * 2];
    }

    // Literals 7..127 count as ascii.
    for (int literal = 7; literal < 128; literal++)
    {
        asciiCount += dyn_ltree[literal * 2];
    }

    // Literals 128 and above count as binary.
    for (int literal = 128; literal < InternalConstants.LITERALS; literal++)
    {
        binaryCount += dyn_ltree[literal * 2];
    }

    if (binaryCount > (asciiCount >> 2))
    {
        data_type = (sbyte)Z_BINARY;
    }
    else
    {
        data_type = (sbyte)Z_ASCII;
    }
}
|
|
|
|
|
|
|
|
// Flush the bit buffer, keeping at most 7 bits in it.
// With exactly 16 valid bits both bytes are written (low byte first) and the
// buffer is emptied; with 8..15 valid bits only the low byte is written and
// the remaining bits move down by 8. With fewer than 8 bits nothing happens.
internal void bi_flush()
{
    // The byte casts deliberately truncate bi_buf, so they must run in an
    // unchecked context (as send_bits and copy_block already do); otherwise a
    // build with overflow checking enabled throws OverflowException here.
    unchecked
    {
        if (bi_valid == 16)
        {
            pending[pendingCount++] = (byte)bi_buf;
            pending[pendingCount++] = (byte)(bi_buf >> 8);
            bi_buf = 0;
            bi_valid = 0;
        }
        else if (bi_valid >= 8)
        {
            pending[pendingCount++] = (byte)bi_buf;
            // bi_buf is a signed short, so a plain ">>= 8" is an arithmetic
            // shift that would copy a set bit 15 into the high byte. Masking
            // first makes the shift logical and keeps the "bits above the
            // last valid bit are zero" invariant.
            bi_buf = (short)((bi_buf & 0xffff) >> 8);
            bi_valid -= 8;
        }
    }
}
|
|
|
|
// Flush the bit buffer and align the output on a byte boundary: writes two
// bytes (low byte first) when more than 8 bits are valid, one byte when 1..8
// bits are valid, nothing when the buffer is empty, then clears the buffer.
internal void bi_windup()
{
    // The byte casts deliberately truncate bi_buf, so they must run in an
    // unchecked context (as send_bits and copy_block already do); otherwise a
    // build with overflow checking enabled throws OverflowException here.
    unchecked
    {
        if (bi_valid > 8)
        {
            pending[pendingCount++] = (byte)bi_buf;
            pending[pendingCount++] = (byte)(bi_buf >> 8);
        }
        else if (bi_valid > 0)
        {
            pending[pendingCount++] = (byte)bi_buf;
        }
    }

    bi_buf = 0;
    bi_valid = 0;
}
|
|
|
|
// Copy a stored block, storing first the length and its
// one's complement if requested.
//   buf    - index in window of the first byte to copy
//   len    - number of bytes to copy
//   header - true to write len and ~len (16 bits each, low byte first) first
internal void copy_block(int buf, int len, bool header)
{
    bi_windup();      // align on byte boundary
    last_eob_len = 8; // enough lookahead for inflate

    if (header)
    {
        int complement = ~len;
        unchecked
        {
            // length, low byte first
            pending[pendingCount++] = (byte)len;
            pending[pendingCount++] = (byte)(len >> 8);
            // one's complement of the length, low byte first
            pending[pendingCount++] = (byte)complement;
            pending[pendingCount++] = (byte)(complement >> 8);
        }
    }

    put_bytes(window, buf, len);
}
|
|
|
|
// Flushes the block spanning block_start..strstart through _tr_flush_block,
// starts the next block at strstart, and pushes pending output to the codec.
//   eof - true when this is the last block of the stream
internal void flush_block_only(bool eof)
{
    // A negative block_start means the block's data is no longer addressable
    // in the window; -1 tells _tr_flush_block it cannot emit a stored block.
    int blockOffset;
    if (block_start >= 0)
    {
        blockOffset = block_start;
    }
    else
    {
        blockOffset = -1;
    }

    int blockLength = strstart - block_start;
    _tr_flush_block(blockOffset, blockLength, eof);

    block_start = strstart;
    _codec.flush_pending();
}
|
|
|
|
// Copy without compression as much as possible from the input stream, return
// the current block state.
// This function does not insert new strings in the dictionary since
// uncompressible data is probably not useful. This function is used
// only for the level=0 compression option.
// NOTE: this function should be optimized to avoid extra copying from
// window to pending_buf.
internal BlockState DeflateNone(FlushType flush)
{
    // Stored blocks are limited to 0xffff bytes, pending is limited
    // to pending_buf_size, and each stored block has a 5 byte header.
    int max_block_size = Math.Min(0xffff, pending.Length - 5);

    // Copy as much as possible from input to output:
    while (true)
    {
        // Fill the window as much as possible:
        if (lookahead <= 1)
        {
            _fillWindow();
            if (lookahead == 0)
            {
                if (flush == FlushType.None)
                {
                    return BlockState.NeedMore;
                }
                break; // flush the current block
            }
        }

        // Consume everything that is available.
        strstart += lookahead;
        lookahead = 0;

        // Emit a stored block if pending will be full:
        int max_start = block_start + max_block_size;
        if (strstart == 0 || strstart >= max_start)
        {
            // strstart == 0 is possible when wraparound on 16-bit machine
            lookahead = strstart - max_start;
            strstart = max_start;

            flush_block_only(false);
            if (_codec.AvailableBytesOut == 0)
            {
                return BlockState.NeedMore;
            }
        }

        // Flush if we may have to slide, otherwise block_start may become
        // negative and the data will be gone:
        if (strstart - block_start >= w_size - MIN_LOOKAHEAD)
        {
            flush_block_only(false);
            if (_codec.AvailableBytesOut == 0)
            {
                return BlockState.NeedMore;
            }
        }
    }

    bool finishing = flush == FlushType.Finish;
    flush_block_only(finishing);

    if (_codec.AvailableBytesOut == 0)
    {
        return finishing ? BlockState.FinishStarted : BlockState.NeedMore;
    }

    return finishing ? BlockState.FinishDone : BlockState.BlockDone;
}
|
|
|
|
|
|
// Send a stored block: a 3-bit block header (stored type, with the low bit
// set when eof is true) followed by the raw bytes with their length header.
//   buf        - index in window of the first byte of the block
//   stored_len - number of bytes in the block
//   eof        - true if this is the last block
internal void _tr_stored_block(int buf, int stored_len, bool eof)
{
    int blockHeader = STORED_BLOCK << 1;
    if (eof)
    {
        blockHeader += 1;
    }

    send_bits(blockHeader, 3);          // send block type
    copy_block(buf, stored_len, true);  // with header
}
|
|
|
|
// Determine the best encoding for the current block: dynamic trees, static
// trees or store, and output the encoded block to the zip file.
//   buf        - index in window of the block's first byte, or -1 when the
//                data is no longer available for a stored block
//   stored_len - length of the input block in bytes
//   eof        - true if this is the last block
internal void _tr_flush_block(int buf, int stored_len, bool eof)
{
    int opt_lenb;        // opt_len in bytes
    int static_lenb;     // static_len in bytes
    int max_blindex = 0; // index of last bit length code of non zero freq
    int finalBit = eof ? 1 : 0;

    // Build the Huffman trees unless a stored block is forced
    if (compressionLevel > 0)
    {
        // Check if the file is ascii or binary
        if (data_type == Z_UNKNOWN)
        {
            set_data_type();
        }

        // Construct the literal and distance trees.
        // At this point, opt_len and static_len are the total bit lengths of
        // the compressed block data, excluding the tree representations.
        treeLiterals.build_tree(this);
        treeDistances.build_tree(this);

        // Build the bit length tree for the above two trees, and get the index
        // in bl_order of the last bit length code to send.
        max_blindex = build_bl_tree();

        // Determine the best encoding. Compute first the block length in bytes
        // (3 header bits, rounded up to a whole byte).
        static_lenb = (static_len + 3 + 7) >> 3;
        opt_lenb = Math.Min((opt_len + 3 + 7) >> 3, static_lenb);
    }
    else
    {
        // force a stored block
        static_lenb = stored_len + 5;
        opt_lenb = static_lenb;
    }

    // 4: two words for the lengths
    // The test buf != NULL is only necessary if LIT_BUFSIZE > WSIZE.
    // Otherwise we can't have processed more than WSIZE input bytes since
    // the last block flush, because compression would have been
    // successful. If LIT_BUFSIZE <= WSIZE, it is never too late to
    // transform a block into a stored block.
    bool storeIsBest = stored_len + 4 <= opt_lenb && buf != -1;

    if (storeIsBest)
    {
        _tr_stored_block(buf, stored_len, eof);
    }
    else if (static_lenb == opt_lenb)
    {
        send_bits((STATIC_TREES << 1) + finalBit, 3);
        send_compressed_block(StaticTree.lengthAndLiteralsTreeCodes, StaticTree.distTreeCodes);
    }
    else
    {
        send_bits((DYN_TREES << 1) + finalBit, 3);
        send_all_trees(treeLiterals.max_code + 1, treeDistances.max_code + 1, max_blindex + 1);
        send_compressed_block(dyn_ltree, dyn_dtree);
    }

    // Reset the trees and counters for the next block.
    _InitializeBlocks();

    if (eof)
    {
        bi_windup();
    }
}
|
|
|
|
// Fill the window when the lookahead becomes insufficient.
|
|
// Updates strstart and lookahead.
|
|
//
|
|
// IN assertion: lookahead < MIN_LOOKAHEAD
|
|
// OUT assertions: strstart <= window_size-MIN_LOOKAHEAD
|
|
// At least one byte has been read, or avail_in == 0; reads are
|
|
// performed for at least two bytes (required for the zip translate_eol
|
|
// option -- not supported here).
|
|
// Refills the sliding window from the codec's input.
//
// Each pass works out how much room is left behind the buffered data,
// slides the upper half of the window down (rebasing the hash tables)
// when strstart has moved too close to the end, and then asks the codec
// for more bytes. It stops when the codec has no input left or when
// lookahead has reached MIN_LOOKAHEAD.
private void _fillWindow()
{
    while (true)
    {
        // Room left after the bytes that are already buffered.
        int space = window_size - lookahead - strstart;

        if (space == 0 && strstart == 0 && lookahead == 0)
        {
            // Special case kept from the original "64K limit" handling.
            space = w_size;
        }
        else if (space == -1)
        {
            // Described upstream as very unlikely: possible on a 16 bit
            // machine when strstart == 0 and lookahead == 1.
            space--;
        }
        else if (strstart >= w_size + w_size - MIN_LOOKAHEAD)
        {
            // The window is almost full and lookahead is insufficient:
            // move the upper half onto the lower half to make room.
            Array.Copy(window, w_size, window, 0, w_size);
            match_start -= w_size;
            strstart -= w_size; // we now have strstart >= MAX_DIST
            block_start -= w_size;

            // Rebase every hash head by w_size; entries that pointed into
            // the discarded half become 0. This is done regardless of the
            // compression level so the table stays consistent.
            for (int slot = hash_size - 1; slot >= 0; slot--)
            {
                int position = head[slot] & 0xffff;
                head[slot] = (short)((position >= w_size) ? (position - w_size) : 0);
            }

            // Same rebasing for the chain links. A slot that is not on any
            // hash chain holds garbage, but that value is never used.
            for (int slot = w_size - 1; slot >= 0; slot--)
            {
                int position = prev[slot] & 0xffff;
                prev[slot] = (short)((position >= w_size) ? (position - w_size) : 0);
            }

            space += w_size;
        }

        if (_codec.AvailableBytesIn == 0)
        {
            return;
        }

        // Request up to 'space' bytes placed directly after the data that
        // is already buffered; the returned count extends the lookahead.
        int received = _codec.read_buf(window, strstart + lookahead, space);
        lookahead += received;

        // Seed the rolling hash once there are enough bytes to form a
        // string. With fewer than MIN_MATCH bytes in total ins_h stays
        // stale, which is harmless because only literals get emitted.
        if (lookahead >= MIN_MATCH)
        {
            int firstByte = window[strstart] & 0xff;
            ins_h = ((firstByte << hash_shift) ^ (window[strstart + 1] & 0xff)) & hash_mask;
        }

        if (lookahead >= MIN_LOOKAHEAD || _codec.AvailableBytesIn == 0)
        {
            return;
        }
    }
}
|
|
|
|
// Compress as much as possible from the input stream, return the current
|
|
// block state.
|
|
// This function does not perform lazy evaluation of matches and inserts
|
|
// new strings in the dictionary only for unmatched strings or for short
|
|
// matches. It is used only for the fast compression options.
|
|
// Greedy compressor: takes the first acceptable match at each position
// without checking whether the next position would give a better one.
//
// flush:   the flush mode requested by the caller.
// returns: NeedMore when more input or output space is required,
//          BlockDone after a completed block, FinishStarted/FinishDone
//          when flush is FlushType.Finish.
internal BlockState DeflateFast(FlushType flush)
{
    // Head of the hash chain for the current string. It deliberately
    // lives outside the loop: when fewer than MIN_MATCH bytes remain it
    // keeps the value from the previous insertion.
    int chainHead = 0;
    bool blockFull; // set when the current block must be flushed

    for (;;)
    {
        // Keep at least MIN_LOOKAHEAD bytes buffered except at the very
        // end of the input.
        if (lookahead < MIN_LOOKAHEAD)
        {
            _fillWindow();
            if (lookahead < MIN_LOOKAHEAD && flush == FlushType.None)
            {
                return BlockState.NeedMore;
            }
            if (lookahead == 0)
            {
                break; // nothing left: flush the current block
            }
        }

        // Insert window[strstart .. strstart+2] into the dictionary and
        // remember the previous head of its hash chain.
        if (lookahead >= MIN_MATCH)
        {
            ins_h = ((ins_h << hash_shift) ^ (window[strstart + (MIN_MATCH - 1)] & 0xff)) & hash_mask;
            chainHead = head[ins_h] & 0xffff;
            prev[strstart & w_mask] = head[ins_h];
            head[ins_h] = unchecked((short)strstart);
        }

        // A head of 0 means "no candidate": matches against window index
        // 0 are never attempted, which also rules out a string matching
        // itself at the start of the input.
        bool candidateUsable =
            chainHead != 0 &&
            ((strstart - chainHead) & 0xffff) <= w_size - MIN_LOOKAHEAD;

        if (candidateUsable && compressionStrategy != CompressionStrategy.HuffmanOnly)
        {
            match_length = longest_match(chainHead); // also sets match_start
        }

        if (match_length < MIN_MATCH)
        {
            // No usable match: emit the current byte as a literal.
            blockFull = _tr_tally(0, window[strstart] & 0xff);
            lookahead--;
            strstart++;
        }
        else
        {
            blockFull = _tr_tally(strstart - match_start, match_length - MIN_MATCH);
            lookahead -= match_length;

            if (match_length > config.MaxLazy || lookahead < MIN_MATCH)
            {
                // Long match (or too little input left): skip over it
                // without hashing the covered positions, then re-seed the
                // hash at the new position. If lookahead < MIN_MATCH the
                // seed is garbage, but it is recomputed on the next call.
                strstart += match_length;
                match_length = 0;
                ins_h = window[strstart] & 0xff;
                ins_h = ((ins_h << hash_shift) ^ (window[strstart + 1] & 0xff)) & hash_mask;
            }
            else
            {
                // Short match: hash every position it covers. The string
                // at strstart itself is already in the table.
                match_length--;
                do
                {
                    strstart++;
                    ins_h = ((ins_h << hash_shift) ^ (window[strstart + (MIN_MATCH - 1)] & 0xff)) & hash_mask;
                    chainHead = head[ins_h] & 0xffff;
                    prev[strstart & w_mask] = head[ins_h];
                    head[ins_h] = unchecked((short)strstart);
                }
                while (--match_length != 0);
                strstart++;
            }
        }

        if (blockFull)
        {
            flush_block_only(false);
            if (_codec.AvailableBytesOut == 0)
            {
                return BlockState.NeedMore;
            }
        }
    }

    // Input exhausted: close the block, marking it final when finishing.
    bool finishing = flush == FlushType.Finish;
    flush_block_only(finishing);

    if (_codec.AvailableBytesOut == 0)
    {
        return finishing ? BlockState.FinishStarted : BlockState.NeedMore;
    }
    return finishing ? BlockState.FinishDone : BlockState.BlockDone;
}
|
|
|
|
// Same as above, but achieves better compression. We use a lazy
|
|
// evaluation for matches: a match is finally adopted only if there is
|
|
// no better match at the next window position.
|
|
// Lazy compressor: a match found at one position is only emitted after
// checking that the following position does not give a longer one.
//
// flush:   the flush mode requested by the caller.
// returns: NeedMore when more input or output space is required,
//          BlockDone after a completed block, FinishStarted/FinishDone
//          when flush is FlushType.Finish.
internal BlockState DeflateSlow(FlushType flush)
{
    // Head of the hash chain for the current string; kept across loop
    // iterations because it is only refreshed when a string is inserted.
    int chainHead = 0;
    bool blockFull; // set when the current block must be flushed

    for (;;)
    {
        // Keep at least MIN_LOOKAHEAD bytes buffered except at the very
        // end of the input.
        if (lookahead < MIN_LOOKAHEAD)
        {
            _fillWindow();
            if (lookahead < MIN_LOOKAHEAD && flush == FlushType.None)
            {
                return BlockState.NeedMore;
            }
            if (lookahead == 0)
            {
                break; // nothing left: flush the current block
            }
        }

        // Insert window[strstart .. strstart+2] into the dictionary and
        // remember the previous head of its hash chain.
        if (lookahead >= MIN_MATCH)
        {
            ins_h = ((ins_h << hash_shift) ^ (window[strstart + (MIN_MATCH - 1)] & 0xff)) & hash_mask;
            chainHead = head[ins_h] & 0xffff;
            prev[strstart & w_mask] = head[ins_h];
            head[ins_h] = unchecked((short)strstart);
        }

        // The match from the previous position becomes the one to beat.
        prev_length = match_length;
        prev_match = match_start;
        match_length = MIN_MATCH - 1;

        // A head of 0 means "no candidate": matches against window index
        // 0 are never attempted. No search is made either once the
        // previous match has reached config.MaxLazy.
        if (chainHead != 0 &&
            prev_length < config.MaxLazy &&
            ((strstart - chainHead) & 0xffff) <= w_size - MIN_LOOKAHEAD)
        {
            if (compressionStrategy != CompressionStrategy.HuffmanOnly)
            {
                match_length = longest_match(chainHead); // also sets match_start
            }

            // Discard short matches under the Filtered strategy, and
            // minimum-length matches that lie more than 4096 bytes back.
            // If prev_match is also MIN_MATCH, match_start is garbage,
            // but the current match is ignored anyway.
            bool tooWeak =
                match_length <= 5 &&
                (compressionStrategy == CompressionStrategy.Filtered ||
                 (match_length == MIN_MATCH && strstart - match_start > 4096));
            if (tooWeak)
            {
                match_length = MIN_MATCH - 1;
            }
        }

        bool previousMatchWins = prev_length >= MIN_MATCH && match_length <= prev_length;

        if (previousMatchWins)
        {
            // Strings are not inserted into the hash table beyond this.
            int lastInsertable = strstart + lookahead - MIN_MATCH;

            blockFull = _tr_tally(strstart - 1 - prev_match, prev_length - MIN_MATCH);

            // Hash every position up to the end of the match. strstart-1
            // and strstart are already inserted; when the lookahead is
            // too short the last two strings are left out.
            lookahead -= (prev_length - 1);
            prev_length -= 2;
            do
            {
                strstart++;
                if (strstart <= lastInsertable)
                {
                    ins_h = ((ins_h << hash_shift) ^ (window[strstart + (MIN_MATCH - 1)] & 0xff)) & hash_mask;
                    chainHead = head[ins_h] & 0xffff;
                    prev[strstart & w_mask] = head[ins_h];
                    head[ins_h] = unchecked((short)strstart);
                }
            }
            while (--prev_length != 0);

            match_available = 0;
            match_length = MIN_MATCH - 1;
            strstart++;

            if (blockFull)
            {
                flush_block_only(false);
                if (_codec.AvailableBytesOut == 0)
                {
                    return BlockState.NeedMore;
                }
            }
        }
        else if (match_available != 0)
        {
            // Either there was no match at the previous position, or the
            // current match is longer: the previous byte goes out as a
            // single literal.
            blockFull = _tr_tally(0, window[strstart - 1] & 0xff);
            if (blockFull)
            {
                flush_block_only(false);
            }

            strstart++;
            lookahead--;

            if (_codec.AvailableBytesOut == 0)
            {
                return BlockState.NeedMore;
            }
        }
        else
        {
            // Nothing to compare against yet: defer the decision to the
            // next position.
            match_available = 1;
            strstart++;
            lookahead--;
        }
    }

    // Emit the literal that was still waiting for a decision.
    if (match_available != 0)
    {
        _tr_tally(0, window[strstart - 1] & 0xff);
        match_available = 0;
    }

    bool finishing = flush == FlushType.Finish;
    flush_block_only(finishing);

    if (_codec.AvailableBytesOut == 0)
    {
        return finishing ? BlockState.FinishStarted : BlockState.NeedMore;
    }
    return finishing ? BlockState.FinishDone : BlockState.BlockDone;
}
|
|
|
|
|
|
// Walks the hash chain that starts at cur_match looking for the longest
// earlier occurrence of the string at strstart.
//
// cur_match: window position of the first candidate on the chain.
// returns:   the best length found, capped at lookahead. match_start is
//            updated whenever a candidate beats the running best (which
//            starts at prev_length).
internal int longest_match(int cur_match)
{
    int chainBudget = config.MaxChainLength; // candidates left to try
    int scanPos = strstart;                  // cursor in the current string
    int bestLength = prev_length;            // length to beat
    int maxDistance = w_size - MIN_LOOKAHEAD;

    // The walk stops once cur_match is <= this position. Matches with
    // window index 0 are never considered, which keeps the code simple.
    int oldestAllowed = strstart > maxDistance ? strstart - maxDistance : 0;

    int niceLength = config.NiceLength;
    int chainMask = w_mask;
    int scanLimit = strstart + MAX_MATCH;

    // The two bytes a candidate must reproduce to be able to beat bestLength.
    byte tailMinusOne = window[scanPos + bestLength - 1];
    byte tail = window[scanPos + bestLength];

    // Spend less effort when a good match is already in hand.
    if (prev_length >= config.GoodLength)
    {
        chainBudget >>= 2;
    }

    // Never look for matches beyond the end of the input; this keeps
    // deflate deterministic.
    if (niceLength > lookahead)
    {
        niceLength = lookahead;
    }

    do
    {
        // Quick reject: the candidate cannot improve on bestLength unless
        // it agrees at the two tail positions and on the first two bytes.
        bool worthScanning =
            window[cur_match + bestLength] == tail &&
            window[cur_match + bestLength - 1] == tailMinusOne &&
            window[cur_match] == window[scanPos] &&
            window[cur_match + 1] == window[scanPos + 1];

        if (worthScanning)
        {
            // Byte 2 is not compared: upstream notes it is always equal
            // when the others match, because the hash keys are equal and
            // HASH_BITS >= 8.
            int candidatePos = cur_match + 2;
            scanPos += 2;

            // Compare eight bytes per round; the end-of-string test runs
            // only once per round.
            while (window[++scanPos] == window[++candidatePos] &&
                   window[++scanPos] == window[++candidatePos] &&
                   window[++scanPos] == window[++candidatePos] &&
                   window[++scanPos] == window[++candidatePos] &&
                   window[++scanPos] == window[++candidatePos] &&
                   window[++scanPos] == window[++candidatePos] &&
                   window[++scanPos] == window[++candidatePos] &&
                   window[++scanPos] == window[++candidatePos] &&
                   scanPos < scanLimit)
            {
            }

            // Same value as MAX_MATCH - (scanLimit - scanPos).
            int length = scanPos - strstart;
            scanPos = strstart;

            if (length > bestLength)
            {
                match_start = cur_match;
                bestLength = length;
                if (length >= niceLength)
                {
                    break;
                }
                tailMinusOne = window[scanPos + bestLength - 1];
                tail = window[scanPos + bestLength];
            }
        }
    }
    while ((cur_match = (prev[cur_match & chainMask] & 0xffff)) > oldestAllowed && --chainBudget != 0);

    return bestLength <= lookahead ? bestLength : lookahead;
}
|
|
|
|
|
|
// Set once Deflate has appended the Adler-32 trailer; cleared by Reset.
private bool Rfc1950BytesEmitted;

// Backing field for WantRfc1950HeaderBytes.
private bool _WantRfc1950HeaderBytes = true;

// When true (the default) Reset starts the stream in INIT_STATE and
// Deflate writes the header and trailer; when false Reset starts in
// BUSY_STATE and Deflate skips the trailer.
internal bool WantRfc1950HeaderBytes
{
    get
    {
        return _WantRfc1950HeaderBytes;
    }
    set
    {
        _WantRfc1950HeaderBytes = value;
    }
}
|
|
|
|
|
|
// Initializes the deflater with the maximum window size, the default
// memory level and the default compression strategy.
//
// codec:   the codec this manager reads from and writes to.
// level:   the compression level to use.
// returns: the result of the full five-argument Initialize.
internal int Initialize(ZlibCodec codec, CompressionLevel level)
{
    return Initialize(
        codec,
        level,
        ZlibConstants.WindowBitsMax,
        MEM_LEVEL_DEFAULT,
        CompressionStrategy.Default);
}
|
|
|
|
// Initializes the deflater with a caller-chosen window size, the default
// memory level and the default compression strategy.
//
// codec:   the codec this manager reads from and writes to.
// level:   the compression level to use.
// bits:    base-2 logarithm of the window size.
// returns: the result of the full five-argument Initialize.
internal int Initialize(ZlibCodec codec, CompressionLevel level, int bits)
{
    CompressionStrategy defaultStrategy = CompressionStrategy.Default;
    return Initialize(codec, level, bits, defaultStrategy);
}
|
|
|
|
// Initializes the deflater with a caller-chosen window size and
// strategy, using the default memory level.
//
// codec:               the codec this manager reads from and writes to.
// level:               the compression level to use.
// bits:                base-2 logarithm of the window size.
// compressionStrategy: the strategy to use.
// returns:             the result of the full five-argument Initialize.
internal int Initialize(ZlibCodec codec, CompressionLevel level, int bits, CompressionStrategy compressionStrategy)
{
    int memLevel = MEM_LEVEL_DEFAULT;
    return Initialize(codec, level, bits, memLevel, compressionStrategy);
}
|
|
|
|
// Binds this manager to a codec, validates the sizing parameters,
// allocates all working buffers and resets the stream state.
//
// codec:      the codec this manager reads from and writes to.
// level:      the compression level to use.
// windowBits: base-2 logarithm of the window size; must be 9..15.
// memLevel:   memory level; must be 1..MEM_LEVEL_MAX.
// strategy:   the compression strategy to use.
// returns:    ZlibConstants.Z_OK.
// throws:     ZlibException when windowBits or memLevel is out of range.
internal int Initialize(ZlibCodec codec, CompressionLevel level, int windowBits, int memLevel, CompressionStrategy strategy)
{
    // The codec is attached and its message cleared before validation.
    _codec = codec;
    _codec.Message = null;

    bool windowBitsInRange = windowBits >= 9 && windowBits <= 15;
    if (!windowBitsInRange)
    {
        throw new ZlibException("windowBits must be in the range 9..15.");
    }

    bool memLevelInRange = memLevel >= 1 && memLevel <= MEM_LEVEL_MAX;
    if (!memLevelInRange)
    {
        throw new ZlibException(String.Format("memLevel must be in the range 1.. {0}", MEM_LEVEL_MAX));
    }

    _codec.dstate = this;

    // Sliding-window geometry.
    w_bits = windowBits;
    w_size = 1 << w_bits;
    w_mask = w_size - 1;

    // Hash-table geometry.
    hash_bits = memLevel + 7;
    hash_size = 1 << hash_bits;
    hash_mask = hash_size - 1;
    hash_shift = (hash_bits + MIN_MATCH - 1) / MIN_MATCH;

    window = new byte[w_size * 2];
    prev = new short[w_size];
    head = new short[hash_size];

    // For memLevel == 8 this is 16384 (16k).
    lit_bufsize = 1 << (memLevel + 6);

    // One array holds the bytes pending output, the distance codes and
    // the length codes. For memLevel 8 it is 64k long: the first 16k are
    // pending bytes, the middle 32k are distance codes, and the final
    // 16k are length codes.
    pending = new byte[lit_bufsize * 4];
    _distanceOffset = lit_bufsize;
    _lengthOffset = (1 + 2) * lit_bufsize;

    compressionLevel = level;
    compressionStrategy = strategy;

    Reset();
    return ZlibConstants.Z_OK;
}
|
|
|
|
|
|
// Returns the stream to its initial state: zeroes the codec's byte
// counters and message, empties the pending buffer, restarts the
// Adler-32 checksum and re-initializes the tree and lazy-match data.
internal void Reset()
{
    _codec.TotalBytesOut = 0;
    _codec.TotalBytesIn = 0;
    _codec.Message = null;

    pendingCount = 0;
    nextPending = 0;

    Rfc1950BytesEmitted = false;

    // Start in INIT_STATE when header bytes are wanted, otherwise go
    // straight to BUSY_STATE.
    if (WantRfc1950HeaderBytes)
    {
        status = INIT_STATE;
    }
    else
    {
        status = BUSY_STATE;
    }

    _codec._Adler32 = Adler.Adler32(0, null, 0, 0);
    last_flush = (int)FlushType.None;

    _InitializeTreeData();
    _InitializeLazyMatch();
}
|
|
|
|
|
|
// Releases the working buffers.
//
// returns: Z_STREAM_ERROR (without releasing anything) when status is
//          not one of INIT_STATE, BUSY_STATE or FINISH_STATE;
//          Z_DATA_ERROR when status is BUSY_STATE; Z_OK otherwise.
internal int End()
{
    bool recognisedState =
        status == INIT_STATE ||
        status == BUSY_STATE ||
        status == FINISH_STATE;

    if (!recognisedState)
    {
        return ZlibConstants.Z_STREAM_ERROR;
    }

    // Drop the buffers in reverse order of allocation.
    pending = null;
    head = null;
    prev = null;
    window = null;

    if (status == BUSY_STATE)
    {
        return ZlibConstants.Z_DATA_ERROR;
    }
    return ZlibConstants.Z_OK;
}
|
|
|
|
|
|
// Points DeflateFunction at the routine that matches the flavor of the
// active configuration. A flavor other than Store, Fast or Slow leaves
// DeflateFunction untouched.
private void SetDeflater()
{
    DeflateFlavor flavor = config.Flavor;

    if (flavor == DeflateFlavor.Store)
    {
        DeflateFunction = DeflateNone;
    }
    else if (flavor == DeflateFlavor.Fast)
    {
        DeflateFunction = DeflateFast;
    }
    else if (flavor == DeflateFlavor.Slow)
    {
        DeflateFunction = DeflateSlow;
    }
}
|
|
|
|
|
|
// Changes the compression level and strategy of a stream in progress.
//
// level:    the new compression level.
// strategy: the new compression strategy.
// returns:  Z_OK, or the result of the partial flush issued when the
//           new level uses a different deflate flavor and some input
//           has already been consumed.
internal int SetParams(CompressionLevel level, CompressionStrategy strategy)
{
    int outcome = ZlibConstants.Z_OK;

    if (compressionLevel != level)
    {
        Config replacement = Config.Lookup(level);

        // Switching between the store/fast/slow routines mid-stream:
        // flush what has been buffered under the old routine first.
        bool flavorChanges = replacement.Flavor != config.Flavor;
        if (flavorChanges && _codec.TotalBytesIn != 0)
        {
            outcome = _codec.Deflate(FlushType.Partial);
        }

        compressionLevel = level;
        config = replacement;
        SetDeflater();
    }

    // A strategy change alone is applied without flushing.
    compressionStrategy = strategy;

    return outcome;
}
|
|
|
|
|
|
// Preloads the window and hash table with a preset dictionary.
//
// dictionary: the dictionary bytes. When it is longer than
//             w_size - MIN_LOOKAHEAD only its tail is loaded, although
//             the Adler-32 is still computed over the whole array.
// returns:    ZlibConstants.Z_OK.
// throws:     ZlibException when dictionary is null or when status is
//             not INIT_STATE.
internal int SetDictionary(byte[] dictionary)
{
    // Validate before touching the argument. The original read
    // dictionary.Length first, so a null dictionary surfaced as a
    // NullReferenceException and this guard could never fire.
    if (dictionary == null || status != INIT_STATE)
        throw new ZlibException("Stream error.");

    int length = dictionary.Length;
    int index = 0;

    _codec._Adler32 = Adler.Adler32(_codec._Adler32, dictionary, 0, dictionary.Length);

    // Too short to form even one hashable string: nothing to load.
    if (length < MIN_MATCH)
        return ZlibConstants.Z_OK;

    if (length > w_size - MIN_LOOKAHEAD)
    {
        length = w_size - MIN_LOOKAHEAD;
        index = dictionary.Length - length; // use the tail of the dictionary
    }

    Array.Copy(dictionary, index, window, 0, length);
    strstart = length;
    block_start = length;

    // Insert all strings in the hash table (except for the last two
    // bytes). lookahead is left untouched, so ins_h will be recomputed
    // by the next call to _fillWindow.
    ins_h = window[0] & 0xff;
    ins_h = (((ins_h) << hash_shift) ^ (window[1] & 0xff)) & hash_mask;

    for (int n = 0; n <= length - MIN_MATCH; n++)
    {
        ins_h = (((ins_h) << hash_shift) ^ (window[(n) + (MIN_MATCH - 1)] & 0xff)) & hash_mask;
        prev[n & w_mask] = head[ins_h];
        head[ins_h] = (short)n;
    }
    return ZlibConstants.Z_OK;
}
|
|
|
|
|
|
|
|
// Runs one step of compression: writes the stream header when needed,
// drains pending output, invokes the active deflate routine, handles
// the requested flush and, on Finish, appends the Adler-32 trailer.
//
// flush:   the flush mode requested by the caller.
// returns: Z_OK while more calls are needed, Z_STREAM_END once a Finish
//          has been completely written out.
// throws:  ZlibException when the buffers are missing, when there is no
//          output space, or when input arrives after a Finish.
internal int Deflate(FlushType flush)
{
    bool invalidCall =
        _codec.OutputBuffer == null ||
        (_codec.InputBuffer == null && _codec.AvailableBytesIn != 0) ||
        (status == FINISH_STATE && flush != FlushType.Finish);

    if (invalidCall)
    {
        _codec.Message = _ErrorMessage[ZlibConstants.Z_NEED_DICT - (ZlibConstants.Z_STREAM_ERROR)];
        throw new ZlibException(String.Format("Something is fishy. [{0}]", _codec.Message));
    }

    if (_codec.AvailableBytesOut == 0)
    {
        _codec.Message = _ErrorMessage[ZlibConstants.Z_NEED_DICT - (ZlibConstants.Z_BUF_ERROR)];
        throw new ZlibException("OutputBuffer is full (AvailableBytesOut == 0)");
    }

    int previousFlush = last_flush;
    last_flush = (int)flush;

    // First call on a stream that wants them: queue the two zlib
    // (rfc1950) header bytes.
    if (status == INIT_STATE)
    {
        int header = (Z_DEFLATED + ((w_bits - 8) << 4)) << 8;

        int levelFlags = (((int)compressionLevel - 1) & 0xff) >> 1;
        if (levelFlags > 3)
        {
            levelFlags = 3;
        }
        header |= (levelFlags << 6);

        // A non-zero strstart at this point is treated as "a preset
        // dictionary was loaded".
        bool dictionaryLoaded = strstart != 0;
        if (dictionaryLoaded)
        {
            header |= PRESET_DICT;
        }

        // Round up so that the 16-bit header is a multiple of 31.
        header += 31 - (header % 31);

        status = BUSY_STATE;

        unchecked
        {
            pending[pendingCount++] = (byte)(header >> 8);
            pending[pendingCount++] = (byte)header;
        }

        // The dictionary's Adler-32 follows the header, high byte first.
        if (dictionaryLoaded)
        {
            pending[pendingCount++] = (byte)((_codec._Adler32 & 0xFF000000) >> 24);
            pending[pendingCount++] = (byte)((_codec._Adler32 & 0x00FF0000) >> 16);
            pending[pendingCount++] = (byte)((_codec._Adler32 & 0x0000FF00) >> 8);
            pending[pendingCount++] = (byte)(_codec._Adler32 & 0x000000FF);
        }

        _codec._Adler32 = Adler.Adler32(0, null, 0, 0);
    }

    if (pendingCount != 0)
    {
        // Flush as much pending output as possible.
        _codec.flush_pending();
        if (_codec.AvailableBytesOut == 0)
        {
            // The caller will come back with more output space, possibly
            // with nothing pending and no input. That is not an error,
            // so arrange for the next call to return OK rather than
            // BUF_ERROR.
            last_flush = -1;
            return ZlibConstants.Z_OK;
        }
    }
    else if (_codec.AvailableBytesIn == 0 &&
             (int)flush <= previousFlush &&
             flush != FlushType.Finish)
    {
        // workitem 8557: nothing pending, no input and no stronger flush
        // requested. Upstream treats this as harmless and reports OK
        // instead of raising a buffer error.
        return ZlibConstants.Z_OK;
    }

    // No further input is accepted after the first Finish.
    if (status == FINISH_STATE && _codec.AvailableBytesIn != 0)
    {
        _codec.Message = _ErrorMessage[ZlibConstants.Z_NEED_DICT - (ZlibConstants.Z_BUF_ERROR)];
        throw new ZlibException("status == FINISH_STATE && _codec.AvailableBytesIn != 0");
    }

    // Start a new block or continue the current one.
    if (_codec.AvailableBytesIn != 0 ||
        lookahead != 0 ||
        (flush != FlushType.None && status != FINISH_STATE))
    {
        BlockState outcome = DeflateFunction(flush);

        bool finishStarted = outcome == BlockState.FinishStarted;

        if (finishStarted || outcome == BlockState.FinishDone)
        {
            status = FINISH_STATE;
        }

        if (outcome == BlockState.NeedMore || finishStarted)
        {
            // When flush != None and the output is full, the next call
            // should repeat the same flush value so the flush completes;
            // no empty block is emitted here for that reason.
            if (_codec.AvailableBytesOut == 0)
            {
                last_flush = -1; // avoid BUF_ERROR next call, see above
            }
            return ZlibConstants.Z_OK;
        }

        if (outcome == BlockState.BlockDone)
        {
            if (flush == FlushType.Partial)
            {
                _tr_align();
            }
            else
            {
                // Full or Sync flush: emit an empty stored block. For a
                // full flush that block serves as the marker recognised
                // by inflate_sync().
                _tr_stored_block(0, 0, false);

                if (flush == FlushType.Full)
                {
                    // Clear the hash heads (forget the history).
                    Array.Clear(head, 0, hash_size);
                }
            }

            _codec.flush_pending();
            if (_codec.AvailableBytesOut == 0)
            {
                last_flush = -1; // avoid BUF_ERROR at next call, see above
                return ZlibConstants.Z_OK;
            }
        }
    }

    if (flush != FlushType.Finish)
    {
        return ZlibConstants.Z_OK;
    }

    if (!WantRfc1950HeaderBytes || Rfc1950BytesEmitted)
    {
        return ZlibConstants.Z_STREAM_END;
    }

    // Write the zlib trailer (Adler-32), high byte first.
    pending[pendingCount++] = (byte)((_codec._Adler32 & 0xFF000000) >> 24);
    pending[pendingCount++] = (byte)((_codec._Adler32 & 0x00FF0000) >> 16);
    pending[pendingCount++] = (byte)((_codec._Adler32 & 0x0000FF00) >> 8);
    pending[pendingCount++] = (byte)(_codec._Adler32 & 0x000000FF);

    _codec.flush_pending();

    // If output space ran out, the caller calls again to flush the rest;
    // the flag makes sure the trailer is written only once.
    Rfc1950BytesEmitted = true;

    return pendingCount != 0 ? ZlibConstants.Z_OK : ZlibConstants.Z_STREAM_END;
}
|
|
|
|
}
|
|
} |