/* ECCE @ EIC Software -- source listing of deflate.h.
 * A newer version of this file may be available in the sPHENIX GitHub
 * repository.
 */
/* deflate.h -- internal compression state
 * Copyright (C) 1995-2016 Jean-loup Gailly
 * For conditions of distribution and use, see copyright notice in zlib.h
 */
5 
/* WARNING: this file should *not* be used by applications. It is
   part of the implementation of the compression library and is
   subject to change. Applications should only use zlib.h.
 */
10 
11 
12 #ifndef DEFLATE_H
13 #define DEFLATE_H
14 
15 #include "zutil.h"
16 
/* define NO_GZIP when compiling if you want to disable gzip header and
   trailer creation by deflate().  NO_GZIP would be used to avoid linking in
   the crc code when it is not needed.  For shared libraries, gzip encoding
   should be left enabled. */
#ifndef NO_GZIP
#  define GZIP
#endif
24 
/* ===========================================================================
 * Internal compression state.
 */

#define LENGTH_CODES 29
/* number of length codes, not counting the special END_BLOCK code */

#define LITERALS  256
/* number of literal bytes 0..255 */

#define L_CODES (LITERALS+1+LENGTH_CODES)
/* number of Literal or Length codes, including the END_BLOCK code */

#define D_CODES   30
/* number of distance codes */

#define BL_CODES  19
/* number of codes used to transfer the bit lengths */

#define HEAP_SIZE (2*L_CODES+1)
/* maximum heap size */

#define MAX_BITS 15
/* All codes must not exceed MAX_BITS bits */

#define Buf_size 16
/* size of bit buffer in bi_buf */
52 
/* Stream status.  Each comment names the state(s) that follow the one being
 * defined.
 */
#define INIT_STATE    42    /* zlib header -> BUSY_STATE */
#ifdef GZIP
#  define GZIP_STATE  57    /* gzip header -> BUSY_STATE | EXTRA_STATE */
#endif
#define EXTRA_STATE   69    /* gzip extra block -> NAME_STATE */
#define NAME_STATE    73    /* gzip file name -> COMMENT_STATE */
#define COMMENT_STATE 91    /* gzip comment -> HCRC_STATE */
#define HCRC_STATE   103    /* gzip header CRC -> BUSY_STATE */
#define BUSY_STATE   113    /* deflate -> FINISH_STATE */
#define FINISH_STATE 666    /* stream complete */
64 
65 
66 /* Data structure describing a single value and its code string. */
67 typedef struct ct_data_s {
68  union {
69  ush freq; /* frequency count */
70  ush code; /* bit string */
71  } fc;
72  union {
73  ush dad; /* father node in Huffman tree */
74  ush len; /* length of bit string */
75  } dl;
76 } FAR ct_data;
77 
/* Shorthand member names for ct_data: `node.Freq` expands to `node.fc.freq`,
 * and likewise for the other three union members.
 */
#define Freq fc.freq
#define Code fc.code
#define Dad  dl.dad
#define Len  dl.len
82 
84 
85 typedef struct tree_desc_s {
86  ct_data *dyn_tree; /* the dynamic tree */
87  int max_code; /* largest code with non zero frequency */
88  const static_tree_desc *stat_desc; /* the corresponding static tree */
89 } FAR tree_desc;
90 
91 typedef ush Pos;
92 typedef Pos FAR Posf;
93 typedef unsigned IPos;
94 
95 /* A Pos is an index in the character window. We use short instead of int to
96  * save space in the various tables. IPos is used only for parameter passing.
97  */
98 
99 typedef struct internal_state {
100  z_streamp strm; /* pointer back to this zlib stream */
101  int status; /* as the name implies */
102  Bytef *pending_buf; /* output still pending */
103  ulg pending_buf_size; /* size of pending_buf */
104  Bytef *pending_out; /* next pending byte to output to the stream */
105  ulg pending; /* nb of bytes in the pending buffer */
106  int wrap; /* bit 0 true for zlib, bit 1 true for gzip */
107  gz_headerp gzhead; /* gzip header information to write */
108  ulg gzindex; /* where in extra, name, or comment */
109  Byte method; /* can only be DEFLATED */
110  int last_flush; /* value of flush param for previous deflate call */
111 
112  /* used by deflate.c: */
113 
114  uInt w_size; /* LZ77 window size (32K by default) */
115  uInt w_bits; /* log2(w_size) (8..16) */
116  uInt w_mask; /* w_size - 1 */
117 
118  Bytef *window;
119  /* Sliding window. Input bytes are read into the second half of the window,
120  * and move to the first half later to keep a dictionary of at least wSize
121  * bytes. With this organization, matches are limited to a distance of
122  * wSize-MAX_MATCH bytes, but this ensures that IO is always
123  * performed with a length multiple of the block size. Also, it limits
124  * the window size to 64K, which is quite useful on MSDOS.
125  * To do: use the user input buffer as sliding window.
126  */
127 
129  /* Actual size of window: 2*wSize, except when the user input buffer
130  * is directly used as sliding window.
131  */
132 
134  /* Link to older string with same hash index. To limit the size of this
135  * array to 64K, this link is maintained only for the last 32K strings.
136  * An index in this array is thus a window index modulo 32K.
137  */
138 
139  Posf *head; /* Heads of the hash chains or NIL. */
140 
141  uInt ins_h; /* hash index of string to be inserted */
142  uInt hash_size; /* number of elements in hash table */
143  uInt hash_bits; /* log2(hash_size) */
144  uInt hash_mask; /* hash_size-1 */
145 
147  /* Number of bits by which ins_h must be shifted at each input
148  * step. It must be such that after MIN_MATCH steps, the oldest
149  * byte no longer takes part in the hash key, that is:
150  * hash_shift * MIN_MATCH >= hash_bits
151  */
152 
154  /* Window position at the beginning of the current output block. Gets
155  * negative when the window is moved backwards.
156  */
157 
158  uInt match_length; /* length of best match */
159  IPos prev_match; /* previous match */
160  int match_available; /* set if previous match exists */
161  uInt strstart; /* start of string to insert */
162  uInt match_start; /* start of matching string */
163  uInt lookahead; /* number of valid bytes ahead in window */
164 
166  /* Length of the best match at previous step. Matches not greater than this
167  * are discarded. This is used in the lazy match evaluation.
168  */
169 
171  /* To speed up deflation, hash chains are never searched beyond this
172  * length. A higher limit improves compression ratio but degrades the
173  * speed.
174  */
175 
177  /* Attempt to find a better match only when the current match is strictly
178  * smaller than this value. This mechanism is used only for compression
179  * levels >= 4.
180  */
181 # define max_insert_length max_lazy_match
182  /* Insert new strings in the hash table only if the match length is not
183  * greater than this length. This saves time but degrades compression.
184  * max_insert_length is used only for compression levels <= 3.
185  */
186 
187  int level; /* compression level (1..9) */
188  int strategy; /* favor or force Huffman coding*/
189 
191  /* Use a faster search when the previous match is longer than this */
192 
193  int nice_match; /* Stop searching when current match exceeds this */
194 
195  /* used by trees.c: */
196  /* Didn't use ct_data typedef below to suppress compiler warning */
197  struct ct_data_s dyn_ltree[HEAP_SIZE]; /* literal and length tree */
198  struct ct_data_s dyn_dtree[2*D_CODES+1]; /* distance tree */
199  struct ct_data_s bl_tree[2*BL_CODES+1]; /* Huffman tree for bit lengths */
200 
201  struct tree_desc_s l_desc; /* desc. for literal tree */
202  struct tree_desc_s d_desc; /* desc. for distance tree */
203  struct tree_desc_s bl_desc; /* desc. for bit length tree */
204 
206  /* number of codes at each bit length for an optimal tree */
207 
208  int heap[2*L_CODES+1]; /* heap used to build the Huffman trees */
209  int heap_len; /* number of elements in the heap */
210  int heap_max; /* element of largest frequency */
211  /* The sons of heap[n] are heap[2*n] and heap[2*n+1]. heap[0] is not used.
212  * The same heap array is used to build all trees.
213  */
214 
216  /* Depth of each subtree used as tie breaker for trees of equal frequency
217  */
218 
219  uchf *l_buf; /* buffer for literals or lengths */
220 
222  /* Size of match buffer for literals/lengths. There are 4 reasons for
223  * limiting lit_bufsize to 64K:
224  * - frequencies can be kept in 16 bit counters
225  * - if compression is not successful for the first block, all input
226  * data is still in the window so we can still emit a stored block even
227  * when input comes from standard input. (This can also be done for
228  * all blocks if lit_bufsize is not greater than 32K.)
229  * - if compression is not successful for a file smaller than 64K, we can
230  * even emit a stored file instead of a stored block (saving 5 bytes).
231  * This is applicable only for zip (not gzip or zlib).
232  * - creating new Huffman trees less frequently may not provide fast
233  * adaptation to changes in the input data statistics. (Take for
234  * example a binary file with poorly compressible code followed by
235  * a highly compressible string table.) Smaller buffer sizes give
236  * fast adaptation but have of course the overhead of transmitting
237  * trees more frequently.
238  * - I can't count above 4
239  */
240 
241  uInt last_lit; /* running index in l_buf */
242 
244  /* Buffer for distances. To simplify the code, d_buf and l_buf have
245  * the same number of elements. To use different lengths, an extra flag
246  * array would be necessary.
247  */
248 
249  ulg opt_len; /* bit length of current block with optimal trees */
250  ulg static_len; /* bit length of current block with static trees */
251  uInt matches; /* number of string matches in current block */
252  uInt insert; /* bytes at end of window left to insert */
253 
254 #ifdef ZLIB_DEBUG
255  ulg compressed_len; /* total bit length of compressed file mod 2^32 */
256  ulg bits_sent; /* bit length of compressed data sent mod 2^32 */
257 #endif
258 
260  /* Output buffer. bits are inserted starting at the bottom (least
261  * significant bits).
262  */
263  int bi_valid;
264  /* Number of valid bits in bi_buf. All bits above the last valid bit
265  * are always zero.
266  */
267 
269  /* High water mark offset in window for initialized bytes -- bytes above
270  * this are set to zero in order to avoid memory check warnings when
271  * longest match routines access bytes past the input. This is then
272  * updated to the new high water mark.
273  */
274 
275 } FAR deflate_state;
276 
/* Output a byte on the stream.
 * IN assertion: there is enough room in pending_buf.
 *
 * s is a pointer to the state and is evaluated twice, so it must not have
 * side effects; c is truncated to Bytef.  The do/while(0) wrapper makes the
 * expansion a single statement, so `if (x) put_byte(s, c); else ...` parses
 * as intended.
 */
#define put_byte(s, c) \
    do { (s)->pending_buf[(s)->pending++] = (Bytef)(c); } while (0)
281 
282 
#define MIN_LOOKAHEAD (MAX_MATCH+MIN_MATCH+1)
/* Minimum amount of lookahead, except at the end of the input file.
 * See deflate.c for comments about the MIN_MATCH+1.
 */

#define MAX_DIST(s)  ((s)->w_size-MIN_LOOKAHEAD)
/* In order to simplify the code, particularly on 16 bit machines, match
 * distances are limited to MAX_DIST instead of WSIZE.
 */

#define WIN_INIT MAX_MATCH
/* Number of bytes after end of data in window to initialize in order to avoid
   memory checker errors from longest match routines */
296 
297  /* in trees.c */
299 int ZLIB_INTERNAL _tr_tally OF((deflate_state *s, unsigned dist, unsigned lc));
300 void ZLIB_INTERNAL _tr_flush_block OF((deflate_state *s, charf *buf,
301  ulg stored_len, int last));
304 void ZLIB_INTERNAL _tr_stored_block OF((deflate_state *s, charf *buf,
305  ulg stored_len, int last));
306 
#define d_code(dist) \
   ((dist) < 256 ? _dist_code[(dist)] : _dist_code[256+((dist)>>7)])
/* Mapping from a distance to a distance code. dist is the distance - 1 and
 * must not have side effects (it is evaluated more than once).
 * _dist_code[256] and _dist_code[257] are never used.
 */
313 
314 #ifndef ZLIB_DEBUG
315 /* Inline versions of _tr_tally for speed: */
316 
317 #if defined(GEN_TREES_H) || !defined(STDC)
318  extern uch ZLIB_INTERNAL _length_code[];
319  extern uch ZLIB_INTERNAL _dist_code[];
320 #else
321  extern const uch ZLIB_INTERNAL _length_code[];
322  extern const uch ZLIB_INTERNAL _dist_code[];
323 #endif
324 
325 # define _tr_tally_lit(s, c, flush) \
326  { uch cc = (c); \
327  s->d_buf[s->last_lit] = 0; \
328  s->l_buf[s->last_lit++] = cc; \
329  s->dyn_ltree[cc].Freq++; \
330  flush = (s->last_lit == s->lit_bufsize-1); \
331  }
332 # define _tr_tally_dist(s, distance, length, flush) \
333  { uch len = (uch)(length); \
334  ush dist = (ush)(distance); \
335  s->d_buf[s->last_lit] = dist; \
336  s->l_buf[s->last_lit++] = len; \
337  dist--; \
338  s->dyn_ltree[_length_code[len]+LITERALS+1].Freq++; \
339  s->dyn_dtree[d_code(dist)].Freq++; \
340  flush = (s->last_lit == s->lit_bufsize-1); \
341  }
342 #else
343 # define _tr_tally_lit(s, c, flush) flush = _tr_tally(s, 0, c)
344 # define _tr_tally_dist(s, distance, length, flush) \
345  flush = _tr_tally(s, distance, length)
346 #endif
347 
348 #endif /* DEFLATE_H */