Unit imtrees;

{$T-}
{$define ORG_DEBUG}

{
  trees.c -- output deflated data using Huffman coding
  Copyright (C) 1995-1998 Jean-loup Gailly

  Pascal translation
  Copyright (C) 1998 by Jacques Nomssi Nzali
  For conditions of distribution and use, see copyright notice in readme.txt
}

{
 *  ALGORITHM
 *
 *      The "deflation" process uses several Huffman trees. The more
 *      common source values are represented by shorter bit sequences.
 *
 *      Each code tree is stored in a compressed form which is itself
 *      a Huffman encoding of the lengths of all the code strings (in
 *      ascending order by source values).  The actual code strings are
 *      reconstructed from the lengths in the inflate process, as described
 *      in the deflate specification.
 *
 *  REFERENCES
 *
 *      Deutsch, L.P.,"'Deflate' Compressed Data Format Specification".
 *      Available in ftp.uu.net:/pub/archiving/zip/doc/deflate-1.1.doc
 *
 *      Storer, James A.
 *          Data Compression:  Methods and Theory, pp. 49-50.
 *          Computer Science Press, 1988.  ISBN 0-7167-8156-5.
 *
 *      Sedgewick, R.
 *          Algorithms, p290.
 *          Addison-Wesley, 1983. ISBN 0-201-06672-6.
 }

interface

{$I imzconf.inc}

uses
  {$ifdef DEBUG}
  SysUtils, strutils,
  {$ENDIF}
  imzutil, impaszlib;

{ ===========================================================================
  Internal compression state. }

{ Sizes of the three code alphabets and of the work heap.  L_CODES and
  HEAP_SIZE are derived from the other constants, so the array types declared
  further down follow automatically if one of the base values changes. }
const
  LENGTH_CODES = 29;
{ number of length codes, not counting the special END_BLOCK code }

  LITERALS = 256;
{ number of literal bytes 0..255 }

  L_CODES = (LITERALS+1+LENGTH_CODES);
{ number of Literal or Length codes, including the END_BLOCK code }

  D_CODES = 30;
{ number of distance codes }

  BL_CODES = 19;
{ number of codes used to transfer the bit lengths }

  HEAP_SIZE = (2*L_CODES+1);
{ maximum heap size }

  MAX_BITS = 15;
{ All codes must not exceed MAX_BITS bits }

const
  INIT_STATE =  42;
  BUSY_STATE =  113;
  FINISH_STATE = 666;
{ Stream status }


{ Data structure describing a single value and its code string.
  Each of the two fields is a variant record: fc overlays freq and code in
  the same ush, and dl overlays dad and len in the same ush, so only one
  member of each pair is meaningful at any given time. }
type
  ct_data_ptr = ^ct_data;
  ct_data = record
    fc : record
      case byte of
      0:(freq : ush);       { frequency count }
      1:(code : ush);       { bit string }
    end;
    dl : record
      case byte of
      0:(dad : ush);        { father node in Huffman tree }
      1:(len : ush);        { length of bit string }
    end;
  end;

{ Field name mapping to the C original:
   Freq = fc.freq
   Code = fc.code
   Dad = dl.dad
   Len = dl.len }

type
  ltree_type = array[0..HEAP_SIZE-1] of ct_data;    { literal and length tree }
  dtree_type = array[0..2*D_CODES+1-1] of ct_data;  { distance tree }
  htree_type = array[0..2*BL_CODES+1-1] of ct_data;  { Huffman tree for bit lengths }
  { generic tree type: declared with the largest index range that MaxInt
    allows for ct_data elements; the descriptor records below refer to trees
    through tree_ptr }
  tree_type = array[0..(MaxInt div SizeOf(ct_data))-1] of ct_data;

  tree_ptr = ^tree_type;
  ltree_ptr = ^ltree_type;
  dtree_ptr = ^dtree_type;
  htree_ptr = ^htree_type;

{ Descriptor of a static (predefined) tree together with the extra-bits table
  and the size limits that apply to the corresponding alphabet. }
type
  static_tree_desc_ptr = ^static_tree_desc;
  static_tree_desc =
         record
    {const} static_tree : tree_ptr;     { static tree or NIL }
    {const} extra_bits : pzIntfArray;   { extra bits for each code or NIL }
            extra_base : int;           { base index for extra_bits }
            elems : int;                { max number of elements in the tree }
            max_length : int;           { max bit length for the codes }
          end;

  { Descriptor of a dynamic tree; stat_desc links it to its static
    counterpart. }
  tree_desc_ptr = ^tree_desc;
  tree_desc = record
    dyn_tree : tree_ptr;    { the dynamic tree }
    max_code : int;            { largest code with non zero frequency }
    stat_desc : static_tree_desc_ptr; { the corresponding static tree }
  end;

type
  Pos = ush;
  Posf = Pos; {FAR}
  IPos = uInt;

  pPosf = ^Posf;

  zPosfArray = array[0..(MaxInt div SizeOf(Posf))-1] of Posf;
  pzPosfArray = ^zPosfArray;

{ A Pos is an index in the character window. We use short instead of int to
  save space in the various tables.
IPos is used only for parameter passing.}

{ deflate_state gathers the complete working state of one compression
  stream: the pending output buffer, the sliding window with its hash chains,
  the match-search tuning values, and the Huffman tree data used by this
  unit.  The trailing variant part makes max_lazy_match and max_insert_length
  two names for the same storage. }
type
  deflate_state_ptr = ^deflate_state;
  deflate_state = record
    strm : z_streamp;          { pointer back to this zlib stream }
    status : int;              { as the name implies }
    pending_buf : pzByteArray; { output still pending }
    pending_buf_size : ulg;    { size of pending_buf }
    pending_out : pBytef;      { next pending byte to output to the stream }
    pending : int;             { nb of bytes in the pending buffer }
    noheader : int;            { suppress zlib header and adler32 }
    data_type : Byte;          { UNKNOWN, BINARY or ASCII }
    method : Byte;             { STORED (for zip only) or DEFLATED }
    last_flush : int;          { value of flush param for previous deflate call }

    { used by deflate.pas: }

    w_size : uInt;             { LZ77 window size (32K by default) }
    w_bits : uInt;             { log2(w_size)  (8..16) }
    w_mask : uInt;             { w_size - 1 }

    window : pzByteArray;
    { Sliding window. Input bytes are read into the second half of the window,
      and move to the first half later to keep a dictionary of at least wSize
      bytes. With this organization, matches are limited to a distance of
      wSize-MAX_MATCH bytes, but this ensures that IO is always
      performed with a length multiple of the block size. Also, it limits
      the window size to 64K, which is quite useful on MSDOS.
      To do: use the user input buffer as sliding window. }

    window_size : ulg;
    { Actual size of window: 2*wSize, except when the user input buffer
      is directly used as sliding window. }

    prev : pzPosfArray;
    { Link to older string with same hash index. To limit the size of this
      array to 64K, this link is maintained only for the last 32K strings.
      An index in this array is thus a window index modulo 32K. }

    head : pzPosfArray;    { Heads of the hash chains or NIL. }

    ins_h : uInt;          { hash index of string to be inserted }
    hash_size : uInt;      { number of elements in hash table }
    hash_bits : uInt;      { log2(hash_size) }
    hash_mask : uInt;      { hash_size-1 }

    hash_shift : uInt;
    { Number of bits by which ins_h must be shifted at each input
      step. It must be such that after MIN_MATCH steps, the oldest
      byte no longer takes part in the hash key, that is:
        hash_shift * MIN_MATCH >= hash_bits     }

    block_start : long;
    { Window position at the beginning of the current output block. Gets
      negative when the window is moved backwards. }

    match_length : uInt;           { length of best match }
    prev_match : IPos;             { previous match }
    match_available : boolean;     { set if previous match exists }
    strstart : uInt;               { start of string to insert }
    match_start : uInt;            { start of matching string }
    lookahead : uInt;              { number of valid bytes ahead in window }

    prev_length : uInt;
    { Length of the best match at previous step. Matches not greater than this
      are discarded. This is used in the lazy match evaluation. }

    max_chain_length : uInt;
    { To speed up deflation, hash chains are never searched beyond this
      length.  A higher limit improves compression ratio but degrades the
      speed. }

    { moved to the end because Borland Pascal won't accept the following:
    max_lazy_match : uInt;
    max_insert_length : uInt absolute max_lazy_match;
    }

    level : int;    { compression level (1..9) }
    strategy : int; { favor or force Huffman coding}

    good_match : uInt;
    { Use a faster search when the previous match is longer than this }

    nice_match : int; { Stop searching when current match exceeds this }

    { used by trees.pas: }
    { Didn't use ct_data typedef below to suppress compiler warning }
    dyn_ltree : ltree_type;    { literal and length tree }
    dyn_dtree : dtree_type;  { distance tree }
    bl_tree : htree_type;   { Huffman tree for bit lengths }

    l_desc : tree_desc;                { desc. for literal tree }
    d_desc : tree_desc;                { desc. for distance tree }
    bl_desc : tree_desc;               { desc. for bit length tree }

    bl_count : array[0..MAX_BITS+1-1] of ush;
    { number of codes at each bit length for an optimal tree }

    heap : array[0..2*L_CODES+1-1] of int; { heap used to build the Huffman trees }
    heap_len : int;                   { number of elements in the heap }
    heap_max : int;                   { element of largest frequency }
    { The sons of heap[n] are heap[2*n] and heap[2*n+1]. heap[0] is not used.
      The same heap array is used to build all trees. }

    depth : array[0..2*L_CODES+1-1] of uch;
    { Depth of each subtree used as tie breaker for trees of equal frequency }

    l_buf : puchfArray;       { buffer for literals or lengths }

    lit_bufsize : uInt;
    { Size of match buffer for literals/lengths.  There are 4 reasons for
      limiting lit_bufsize to 64K:
        - frequencies can be kept in 16 bit counters
        - if compression is not successful for the first block, all input
          data is still in the window so we can still emit a stored block even
          when input comes from standard input.  (This can also be done for
          all blocks if lit_bufsize is not greater than 32K.)
        - if compression is not successful for a file smaller than 64K, we can
          even emit a stored file instead of a stored block (saving 5 bytes).
          This is applicable only for zip (not gzip or zlib).
        - creating new Huffman trees less frequently may not provide fast
          adaptation to changes in the input data statistics. (Take for
          example a binary file with poorly compressible code followed by
          a highly compressible string table.) Smaller buffer sizes give
          fast adaptation but have of course the overhead of transmitting
          trees more frequently.
        - I can't count above 4 }

    last_lit : uInt;      { running index in l_buf }

    d_buf : pushfArray;
    { Buffer for distances. To simplify the code, d_buf and l_buf have
      the same number of elements. To use different lengths, an extra flag
      array would be necessary. }

    opt_len : ulg;        { bit length of current block with optimal trees }
    static_len : ulg;     { bit length of current block with static trees }
    compressed_len : ulg; { total bit length of compressed file }
    matches : uInt;       { number of string matches in current block }
    last_eob_len : int;   { bit length of EOB code for last block }

    { bits_sent is part of the record only when DEBUG is defined, so the
      record layout differs between debug and non-debug builds. }
{$ifdef DEBUG}
    bits_sent : ulg;    { bit length of the compressed data }
{$endif}

    bi_buf : ush;
    { Output buffer. bits are inserted starting at the bottom (least
      significant bits). }

    bi_valid : int;
    { Number of valid bits in bi_buf.  All bits above the last valid bit
      are always zero. }

    { Variant part: both members occupy the same storage. }
    case byte of
    0:(max_lazy_match : uInt);
    { Attempt to find a better match only when the current match is strictly
      smaller than this value. This mechanism is used only for compression
      levels >= 4. }

    1:(max_insert_length : uInt);
    { Insert new strings in the hash table only if the match length is not
      greater than this length. This saves time but degrades compression.
      max_insert_length is used only for compression levels <= 3. }
  end;

{ Routines exported by this unit. }
procedure _tr_init (var s : deflate_state);

function _tr_tally (var s : deflate_state;
                    dist : unsigned;
                    lc : unsigned) : boolean;

function _tr_flush_block (var s : deflate_state;
                          buf : pcharf;
                          stored_len : ulg;
                          eof : boolean) : ulg;

procedure _tr_align(var s : deflate_state);

procedure _tr_stored_block(var s : deflate_state;
                           buf : pcharf;
                           stored_len : ulg;
                           eof : boolean);

implementation

{ #define GEN_TREES_H }

{ GEN_TREES_H is not defined here (the define above is only a comment), so
  the precomputed tables that follow are compiled in. }
{$ifndef GEN_TREES_H}
{ header created automatically with -DGEN_TREES_H }

const
  DIST_CODE_LEN = 512; { see definition of array dist_code below }

{ The static literal tree. Since the bit lengths are imposed, there is no
  need for the L_CODES extra codes used during heap construction. However
  The codes 286 and 287 are needed to build a canonical tree (see _tr_init
  below).
} var static_ltree : array[0..L_CODES+2-1] of ct_data = ( { fc:(freq, code) dl:(dad,len) } (fc:(freq: 12);dl:(len: 8)), (fc:(freq:140);dl:(len: 8)), (fc:(freq: 76);dl:(len: 8)), (fc:(freq:204);dl:(len: 8)), (fc:(freq: 44);dl:(len: 8)), (fc:(freq:172);dl:(len: 8)), (fc:(freq:108);dl:(len: 8)), (fc:(freq:236);dl:(len: 8)), (fc:(freq: 28);dl:(len: 8)), (fc:(freq:156);dl:(len: 8)), (fc:(freq: 92);dl:(len: 8)), (fc:(freq:220);dl:(len: 8)), (fc:(freq: 60);dl:(len: 8)), (fc:(freq:188);dl:(len: 8)), (fc:(freq:124);dl:(len: 8)), (fc:(freq:252);dl:(len: 8)), (fc:(freq: 2);dl:(len: 8)), (fc:(freq:130);dl:(len: 8)), (fc:(freq: 66);dl:(len: 8)), (fc:(freq:194);dl:(len: 8)), (fc:(freq: 34);dl:(len: 8)), (fc:(freq:162);dl:(len: 8)), (fc:(freq: 98);dl:(len: 8)), (fc:(freq:226);dl:(len: 8)), (fc:(freq: 18);dl:(len: 8)), (fc:(freq:146);dl:(len: 8)), (fc:(freq: 82);dl:(len: 8)), (fc:(freq:210);dl:(len: 8)), (fc:(freq: 50);dl:(len: 8)), (fc:(freq:178);dl:(len: 8)), (fc:(freq:114);dl:(len: 8)), (fc:(freq:242);dl:(len: 8)), (fc:(freq: 10);dl:(len: 8)), (fc:(freq:138);dl:(len: 8)), (fc:(freq: 74);dl:(len: 8)), (fc:(freq:202);dl:(len: 8)), (fc:(freq: 42);dl:(len: 8)), (fc:(freq:170);dl:(len: 8)), (fc:(freq:106);dl:(len: 8)), (fc:(freq:234);dl:(len: 8)), (fc:(freq: 26);dl:(len: 8)), (fc:(freq:154);dl:(len: 8)), (fc:(freq: 90);dl:(len: 8)), (fc:(freq:218);dl:(len: 8)), (fc:(freq: 58);dl:(len: 8)), (fc:(freq:186);dl:(len: 8)), (fc:(freq:122);dl:(len: 8)), (fc:(freq:250);dl:(len: 8)), (fc:(freq: 6);dl:(len: 8)), (fc:(freq:134);dl:(len: 8)), (fc:(freq: 70);dl:(len: 8)), (fc:(freq:198);dl:(len: 8)), (fc:(freq: 38);dl:(len: 8)), (fc:(freq:166);dl:(len: 8)), (fc:(freq:102);dl:(len: 8)), (fc:(freq:230);dl:(len: 8)), (fc:(freq: 22);dl:(len: 8)), (fc:(freq:150);dl:(len: 8)), (fc:(freq: 86);dl:(len: 8)), (fc:(freq:214);dl:(len: 8)), (fc:(freq: 54);dl:(len: 8)), (fc:(freq:182);dl:(len: 8)), (fc:(freq:118);dl:(len: 8)), (fc:(freq:246);dl:(len: 8)), (fc:(freq: 14);dl:(len: 8)), (fc:(freq:142);dl:(len: 
8)), (fc:(freq: 78);dl:(len: 8)), (fc:(freq:206);dl:(len: 8)), (fc:(freq: 46);dl:(len: 8)), (fc:(freq:174);dl:(len: 8)), (fc:(freq:110);dl:(len: 8)), (fc:(freq:238);dl:(len: 8)), (fc:(freq: 30);dl:(len: 8)), (fc:(freq:158);dl:(len: 8)), (fc:(freq: 94);dl:(len: 8)), (fc:(freq:222);dl:(len: 8)), (fc:(freq: 62);dl:(len: 8)), (fc:(freq:190);dl:(len: 8)), (fc:(freq:126);dl:(len: 8)), (fc:(freq:254);dl:(len: 8)), (fc:(freq: 1);dl:(len: 8)), (fc:(freq:129);dl:(len: 8)), (fc:(freq: 65);dl:(len: 8)), (fc:(freq:193);dl:(len: 8)), (fc:(freq: 33);dl:(len: 8)), (fc:(freq:161);dl:(len: 8)), (fc:(freq: 97);dl:(len: 8)), (fc:(freq:225);dl:(len: 8)), (fc:(freq: 17);dl:(len: 8)), (fc:(freq:145);dl:(len: 8)), (fc:(freq: 81);dl:(len: 8)), (fc:(freq:209);dl:(len: 8)), (fc:(freq: 49);dl:(len: 8)), (fc:(freq:177);dl:(len: 8)), (fc:(freq:113);dl:(len: 8)), (fc:(freq:241);dl:(len: 8)), (fc:(freq: 9);dl:(len: 8)), (fc:(freq:137);dl:(len: 8)), (fc:(freq: 73);dl:(len: 8)), (fc:(freq:201);dl:(len: 8)), (fc:(freq: 41);dl:(len: 8)), (fc:(freq:169);dl:(len: 8)), (fc:(freq:105);dl:(len: 8)), (fc:(freq:233);dl:(len: 8)), (fc:(freq: 25);dl:(len: 8)), (fc:(freq:153);dl:(len: 8)), (fc:(freq: 89);dl:(len: 8)), (fc:(freq:217);dl:(len: 8)), (fc:(freq: 57);dl:(len: 8)), (fc:(freq:185);dl:(len: 8)), (fc:(freq:121);dl:(len: 8)), (fc:(freq:249);dl:(len: 8)), (fc:(freq: 5);dl:(len: 8)), (fc:(freq:133);dl:(len: 8)), (fc:(freq: 69);dl:(len: 8)), (fc:(freq:197);dl:(len: 8)), (fc:(freq: 37);dl:(len: 8)), (fc:(freq:165);dl:(len: 8)), (fc:(freq:101);dl:(len: 8)), (fc:(freq:229);dl:(len: 8)), (fc:(freq: 21);dl:(len: 8)), (fc:(freq:149);dl:(len: 8)), (fc:(freq: 85);dl:(len: 8)), (fc:(freq:213);dl:(len: 8)), (fc:(freq: 53);dl:(len: 8)), (fc:(freq:181);dl:(len: 8)), (fc:(freq:117);dl:(len: 8)), (fc:(freq:245);dl:(len: 8)), (fc:(freq: 13);dl:(len: 8)), (fc:(freq:141);dl:(len: 8)), (fc:(freq: 77);dl:(len: 8)), (fc:(freq:205);dl:(len: 8)), (fc:(freq: 45);dl:(len: 8)), (fc:(freq:173);dl:(len: 8)), (fc:(freq:109);dl:(len: 
8)), (fc:(freq:237);dl:(len: 8)), (fc:(freq: 29);dl:(len: 8)), (fc:(freq:157);dl:(len: 8)), (fc:(freq: 93);dl:(len: 8)), (fc:(freq:221);dl:(len: 8)), (fc:(freq: 61);dl:(len: 8)), (fc:(freq:189);dl:(len: 8)), (fc:(freq:125);dl:(len: 8)), (fc:(freq:253);dl:(len: 8)), (fc:(freq: 19);dl:(len: 9)), (fc:(freq:275);dl:(len: 9)), (fc:(freq:147);dl:(len: 9)), (fc:(freq:403);dl:(len: 9)), (fc:(freq: 83);dl:(len: 9)), (fc:(freq:339);dl:(len: 9)), (fc:(freq:211);dl:(len: 9)), (fc:(freq:467);dl:(len: 9)), (fc:(freq: 51);dl:(len: 9)), (fc:(freq:307);dl:(len: 9)), (fc:(freq:179);dl:(len: 9)), (fc:(freq:435);dl:(len: 9)), (fc:(freq:115);dl:(len: 9)), (fc:(freq:371);dl:(len: 9)), (fc:(freq:243);dl:(len: 9)), (fc:(freq:499);dl:(len: 9)), (fc:(freq: 11);dl:(len: 9)), (fc:(freq:267);dl:(len: 9)), (fc:(freq:139);dl:(len: 9)), (fc:(freq:395);dl:(len: 9)), (fc:(freq: 75);dl:(len: 9)), (fc:(freq:331);dl:(len: 9)), (fc:(freq:203);dl:(len: 9)), (fc:(freq:459);dl:(len: 9)), (fc:(freq: 43);dl:(len: 9)), (fc:(freq:299);dl:(len: 9)), (fc:(freq:171);dl:(len: 9)), (fc:(freq:427);dl:(len: 9)), (fc:(freq:107);dl:(len: 9)), (fc:(freq:363);dl:(len: 9)), (fc:(freq:235);dl:(len: 9)), (fc:(freq:491);dl:(len: 9)), (fc:(freq: 27);dl:(len: 9)), (fc:(freq:283);dl:(len: 9)), (fc:(freq:155);dl:(len: 9)), (fc:(freq:411);dl:(len: 9)), (fc:(freq: 91);dl:(len: 9)), (fc:(freq:347);dl:(len: 9)), (fc:(freq:219);dl:(len: 9)), (fc:(freq:475);dl:(len: 9)), (fc:(freq: 59);dl:(len: 9)), (fc:(freq:315);dl:(len: 9)), (fc:(freq:187);dl:(len: 9)), (fc:(freq:443);dl:(len: 9)), (fc:(freq:123);dl:(len: 9)), (fc:(freq:379);dl:(len: 9)), (fc:(freq:251);dl:(len: 9)), (fc:(freq:507);dl:(len: 9)), (fc:(freq: 7);dl:(len: 9)), (fc:(freq:263);dl:(len: 9)), (fc:(freq:135);dl:(len: 9)), (fc:(freq:391);dl:(len: 9)), (fc:(freq: 71);dl:(len: 9)), (fc:(freq:327);dl:(len: 9)), (fc:(freq:199);dl:(len: 9)), (fc:(freq:455);dl:(len: 9)), (fc:(freq: 39);dl:(len: 9)), (fc:(freq:295);dl:(len: 9)), (fc:(freq:167);dl:(len: 9)), (fc:(freq:423);dl:(len: 
9)), (fc:(freq:103);dl:(len: 9)), (fc:(freq:359);dl:(len: 9)), (fc:(freq:231);dl:(len: 9)), (fc:(freq:487);dl:(len: 9)), (fc:(freq: 23);dl:(len: 9)), (fc:(freq:279);dl:(len: 9)), (fc:(freq:151);dl:(len: 9)), (fc:(freq:407);dl:(len: 9)), (fc:(freq: 87);dl:(len: 9)), (fc:(freq:343);dl:(len: 9)), (fc:(freq:215);dl:(len: 9)), (fc:(freq:471);dl:(len: 9)), (fc:(freq: 55);dl:(len: 9)), (fc:(freq:311);dl:(len: 9)), (fc:(freq:183);dl:(len: 9)), (fc:(freq:439);dl:(len: 9)), (fc:(freq:119);dl:(len: 9)), (fc:(freq:375);dl:(len: 9)), (fc:(freq:247);dl:(len: 9)), (fc:(freq:503);dl:(len: 9)), (fc:(freq: 15);dl:(len: 9)), (fc:(freq:271);dl:(len: 9)), (fc:(freq:143);dl:(len: 9)), (fc:(freq:399);dl:(len: 9)), (fc:(freq: 79);dl:(len: 9)), (fc:(freq:335);dl:(len: 9)), (fc:(freq:207);dl:(len: 9)), (fc:(freq:463);dl:(len: 9)), (fc:(freq: 47);dl:(len: 9)), (fc:(freq:303);dl:(len: 9)), (fc:(freq:175);dl:(len: 9)), (fc:(freq:431);dl:(len: 9)), (fc:(freq:111);dl:(len: 9)), (fc:(freq:367);dl:(len: 9)), (fc:(freq:239);dl:(len: 9)), (fc:(freq:495);dl:(len: 9)), (fc:(freq: 31);dl:(len: 9)), (fc:(freq:287);dl:(len: 9)), (fc:(freq:159);dl:(len: 9)), (fc:(freq:415);dl:(len: 9)), (fc:(freq: 95);dl:(len: 9)), (fc:(freq:351);dl:(len: 9)), (fc:(freq:223);dl:(len: 9)), (fc:(freq:479);dl:(len: 9)), (fc:(freq: 63);dl:(len: 9)), (fc:(freq:319);dl:(len: 9)), (fc:(freq:191);dl:(len: 9)), (fc:(freq:447);dl:(len: 9)), (fc:(freq:127);dl:(len: 9)), (fc:(freq:383);dl:(len: 9)), (fc:(freq:255);dl:(len: 9)), (fc:(freq:511);dl:(len: 9)), (fc:(freq: 0);dl:(len: 7)), (fc:(freq: 64);dl:(len: 7)), (fc:(freq: 32);dl:(len: 7)), (fc:(freq: 96);dl:(len: 7)), (fc:(freq: 16);dl:(len: 7)), (fc:(freq: 80);dl:(len: 7)), (fc:(freq: 48);dl:(len: 7)), (fc:(freq:112);dl:(len: 7)), (fc:(freq: 8);dl:(len: 7)), (fc:(freq: 72);dl:(len: 7)), (fc:(freq: 40);dl:(len: 7)), (fc:(freq:104);dl:(len: 7)), (fc:(freq: 24);dl:(len: 7)), (fc:(freq: 88);dl:(len: 7)), (fc:(freq: 56);dl:(len: 7)), (fc:(freq:120);dl:(len: 7)), (fc:(freq: 4);dl:(len: 
7)), (fc:(freq: 68);dl:(len: 7)), (fc:(freq: 36);dl:(len: 7)), (fc:(freq:100);dl:(len: 7)), (fc:(freq: 20);dl:(len: 7)), (fc:(freq: 84);dl:(len: 7)), (fc:(freq: 52);dl:(len: 7)), (fc:(freq:116);dl:(len: 7)), (fc:(freq: 3);dl:(len: 8)), (fc:(freq:131);dl:(len: 8)), (fc:(freq: 67);dl:(len: 8)), (fc:(freq:195);dl:(len: 8)), (fc:(freq: 35);dl:(len: 8)), (fc:(freq:163);dl:(len: 8)), (fc:(freq: 99);dl:(len: 8)), (fc:(freq:227);dl:(len: 8)) ); { The static distance tree. (Actually a trivial tree since all lens use 5 bits.) } static_dtree : array[0..D_CODES-1] of ct_data = ( (fc:(freq: 0); dl:(len:5)), (fc:(freq:16); dl:(len:5)), (fc:(freq: 8); dl:(len:5)), (fc:(freq:24); dl:(len:5)), (fc:(freq: 4); dl:(len:5)), (fc:(freq:20); dl:(len:5)), (fc:(freq:12); dl:(len:5)), (fc:(freq:28); dl:(len:5)), (fc:(freq: 2); dl:(len:5)), (fc:(freq:18); dl:(len:5)), (fc:(freq:10); dl:(len:5)), (fc:(freq:26); dl:(len:5)), (fc:(freq: 6); dl:(len:5)), (fc:(freq:22); dl:(len:5)), (fc:(freq:14); dl:(len:5)), (fc:(freq:30); dl:(len:5)), (fc:(freq: 1); dl:(len:5)), (fc:(freq:17); dl:(len:5)), (fc:(freq: 9); dl:(len:5)), (fc:(freq:25); dl:(len:5)), (fc:(freq: 5); dl:(len:5)), (fc:(freq:21); dl:(len:5)), (fc:(freq:13); dl:(len:5)), (fc:(freq:29); dl:(len:5)), (fc:(freq: 3); dl:(len:5)), (fc:(freq:19); dl:(len:5)), (fc:(freq:11); dl:(len:5)), (fc:(freq:27); dl:(len:5)), (fc:(freq: 7); dl:(len:5)), (fc:(freq:23); dl:(len:5)) ); { Distance codes. The first 256 values correspond to the distances 3 .. 258, the last 256 values correspond to the top 8 bits of the 15 bit distances. 
} _dist_code : array[0..DIST_CODE_LEN-1] of uch = ( 0, 1, 2, 3, 4, 4, 5, 5, 6, 6, 6, 6, 7, 7, 7, 7, 8, 8, 8, 8, 8, 8, 8, 8, 9, 9, 9, 9, 9, 9, 9, 9, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 14, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 0, 0, 16, 17, 18, 18, 19, 19, 20, 20, 20, 20, 21, 21, 21, 21, 22, 22, 22, 22, 22, 22, 22, 22, 23, 23, 23, 23, 23, 23, 23, 23, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 28, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 
29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29, 29 ); { length code for each normalized match length (0 == MIN_MATCH) } _length_code : array[0..MAX_MATCH-MIN_MATCH+1-1] of uch = ( 0, 1, 2, 3, 4, 5, 6, 7, 8, 8, 9, 9, 10, 10, 11, 11, 12, 12, 12, 12, 13, 13, 13, 13, 14, 14, 14, 14, 15, 15, 15, 15, 16, 16, 16, 16, 16, 16, 16, 16, 17, 17, 17, 17, 17, 17, 17, 17, 18, 18, 18, 18, 18, 18, 18, 18, 19, 19, 19, 19, 19, 19, 19, 19, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 20, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 22, 22, 22, 22, 22, 22, 22, 22, 22, 22, 22, 22, 22, 22, 22, 22, 23, 23, 23, 23, 23, 23, 23, 23, 23, 23, 23, 23, 23, 23, 23, 23, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 24, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 25, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 26, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 28 ); { First normalized length for each code (0 = MIN_MATCH) } base_length : array[0..LENGTH_CODES-1] of int = ( 0, 1, 2, 3, 4, 5, 6, 7, 8, 10, 12, 14, 16, 20, 24, 28, 32, 40, 48, 56, 64, 80, 96, 112, 128, 160, 192, 224, 0 ); { First normalized distance for each code (0 = distance of 1) } base_dist : array[0..D_CODES-1] of int = ( 0, 1, 2, 3, 4, 6, 8, 12, 16, 24, 32, 48, 64, 96, 128, 192, 256, 384, 512, 768, 1024, 1536, 2048, 3072, 4096, 6144, 8192, 12288, 16384, 24576 ); {$endif} { Output a byte on the stream. IN assertion: there is enough room in pending_buf. macro put_byte(s, c) begin s^.pending_buf^[s^.pending] := (c); Inc(s^.pending); end } const MIN_LOOKAHEAD = (MAX_MATCH+MIN_MATCH+1); { Minimum amount of lookahead, except at the end of the input file. 
See deflate.c for comments about the MIN_MATCH+1. }

{macro d_code(dist)
   if (dist) < 256 then
     := _dist_code[dist]
   else
     := _dist_code[256+((dist) shr 7)]);
  Mapping from a distance to a distance code. dist is the distance - 1 and
  must not have side effects. _dist_code[256] and _dist_code[257] are never
  used. }

{ The region below is skipped by the compiler because ORG_DEBUG is defined at
  the top of the unit.  Its content is untranslated macro text, not Pascal. }
{$ifndef ORG_DEBUG}
{ Inline versions of _tr_tally for speed: }

#if defined(GEN_TREES_H) || !defined(STDC)
  extern uch _length_code[];
  extern uch _dist_code[];
#else
  extern const uch _length_code[];
  extern const uch _dist_code[];
#endif

macro _tr_tally_lit(s, c, flush)
var
  cc : uch;
begin
    cc := (c);
    s^.d_buf[s^.last_lit] := 0;
    s^.l_buf[s^.last_lit] := cc;
    Inc(s^.last_lit);
    Inc(s^.dyn_ltree[cc].fc.Freq);
    flush := (s^.last_lit = s^.lit_bufsize-1);
end;

macro _tr_tally_dist(s, distance, length, flush) \
var
  len : uch;
  dist : ush;
begin
    len := (length);
    dist := (distance);
    s^.d_buf[s^.last_lit] := dist;
    s^.l_buf[s^.last_lit] = len;
    Inc(s^.last_lit);
    Dec(dist);
    Inc(s^.dyn_ltree[_length_code[len]+LITERALS+1].fc.Freq);
    Inc(s^.dyn_dtree[d_code(dist)].Freq);
    flush := (s^.last_lit = s^.lit_bufsize-1);
end;

{$endif}

{ ===========================================================================
  Constants }

const
  MAX_BL_BITS = 7;
{ Bit length codes must not exceed MAX_BL_BITS bits }

const
  END_BLOCK = 256;
{ end of block literal code }

const
  REP_3_6 = 16;
{ repeat previous bit length 3-6 times (2 bits of repeat count) }

const
  REPZ_3_10 = 17;
{ repeat a zero length 3-10 times  (3 bits of repeat count) }

const
  REPZ_11_138 = 18;
{ repeat a zero length 11-138 times  (7 bits of repeat count) }

{ The three extra-bits tables below are indexed by code number and are
  referenced by the static tree descriptors declared further down. }
{local}
const
  extra_lbits : array[0..LENGTH_CODES-1] of int
  { extra bits for each length code }
   = (0,0,0,0,0,0,0,0,1,1,1,1,2,2,2,2,3,3,3,3,4,4,4,4,5,5,5,5,0);

{local}
const
  extra_dbits : array[0..D_CODES-1] of int
  { extra bits for each distance code }
   = (0,0,0,0,1,1,2,2,3,3,4,4,5,5,6,6,7,7,8,8,9,9,10,10,11,11,12,12,13,13);

{local}
const
  extra_blbits : array[0..BL_CODES-1] of int { extra bits for each bit length code }
   = (0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,3,7);

{local}
const
  bl_order : array[0..BL_CODES-1] of uch
   = (16,17,18,0,8,7,9,6,10,5,11,4,12,3,13,2,14,1,15);
{ The lengths of the bit length codes are sent in order of decreasing
  probability, to avoid transmitting the lengths for unused bit length codes. }

const
  Buf_size = (8 * 2*sizeof(uch));
{ Number of bits used within bi_buf. (bi_buf might be implemented on
  more than 16 bits on some systems.)
  NOTE(review): this evaluates to 16 only if uch occupies one byte; uch is
  declared outside this unit, confirm there. }

{ ===========================================================================
  Local data. These are initialized only once. }

{ NOTE(review): the directive below carries a stray closing parenthesis after
  the symbol name; confirm that the target compiler still reads the symbol as
  GEN_TREES_H. }
{$ifdef GEN_TREES_H)}
{ non ANSI compilers may not accept trees.h }

const
  DIST_CODE_LEN = 512; { see definition of array dist_code below }

{local}
var
  static_ltree : array[0..L_CODES+2-1] of ct_data;
{ The static literal tree. Since the bit lengths are imposed, there is no
  need for the L_CODES extra codes used during heap construction. However
  The codes 286 and 287 are needed to build a canonical tree (see _tr_init
  below). }

{local}
  static_dtree : array[0..D_CODES-1] of ct_data;
{ The static distance tree. (Actually a trivial tree since all codes use
  5 bits.) }

  _dist_code : array[0..DIST_CODE_LEN-1] of uch;
{ Distance codes. The first 256 values correspond to the distances
  3 .. 258, the last 256 values correspond to the top 8 bits of
  the 15 bit distances. }

  _length_code : array[0..MAX_MATCH-MIN_MATCH+1-1] of uch;
{ length code for each normalized match length (0 == MIN_MATCH) }

{local}
  base_length : array[0..LENGTH_CODES-1] of int;
{ First normalized length for each code (0 = MIN_MATCH) }

{local}
  base_dist : array[0..D_CODES-1] of int;
{ First normalized distance for each code (0 = distance of 1) }

{$endif} { GEN_TREES_H }

{ Static tree descriptors, one per alphabet.  Each one ties a static tree
  (NIL for the bit length alphabet) to its extra-bits table, the base index
  into that table, the alphabet size and the maximum code length. }
{local}
const
  static_l_desc : static_tree_desc =
      (static_tree: {tree_ptr}(@(static_ltree));  { pointer to array of ct_data }
       extra_bits: {pzIntfArray}(@(extra_lbits)); { pointer to array of int }
       extra_base: LITERALS+1;
       elems: L_CODES;
       max_length: MAX_BITS);

{local}
const
  static_d_desc : static_tree_desc =
      (static_tree: {tree_ptr}(@(static_dtree));
       extra_bits: {pzIntfArray}(@(extra_dbits));
       extra_base : 0;
       elems: D_CODES;
       max_length: MAX_BITS);

{local}
const
  static_bl_desc : static_tree_desc =
      (static_tree: {tree_ptr}(NIL);
       extra_bits: {pzIntfArray}@(extra_blbits);
       extra_base : 0;
       elems: BL_CODES;
       max_length: MAX_BL_BITS);

(* ===========================================================================
  Local (static) routines in this file.
} procedure tr_static_init; procedure init_block(var deflate_state); procedure pqdownheap(var s : deflate_state; var tree : ct_data; k : int); procedure gen_bitlen(var s : deflate_state; var desc : tree_desc); procedure gen_codes(var tree : ct_data; max_code : int; bl_count : pushf); procedure build_tree(var s : deflate_state; var desc : tree_desc); procedure scan_tree(var s : deflate_state; var tree : ct_data; max_code : int); procedure send_tree(var s : deflate_state; var tree : ct_data; max_code : int); function build_bl_tree(var deflate_state) : int; procedure send_all_trees(var deflate_state; lcodes : int; dcodes : int; blcodes : int); procedure compress_block(var s : deflate_state; var ltree : ct_data; var dtree : ct_data); procedure set_data_type(var s : deflate_state); function bi_reverse(value : unsigned; length : int) : unsigned; procedure bi_windup(var deflate_state); procedure bi_flush(var deflate_state); procedure copy_block(var deflate_state; buf : pcharf; len : unsigned; header : int); *) {$ifdef GEN_TREES_H} {local} procedure gen_trees_header; {$endif} (* { =========================================================================== Output a short LSB first on the stream. IN assertion: there is enough room in pendingBuf. } macro put_short(s, w) begin {put_byte(s, (uch)((w) & 0xff));} s.pending_buf^[s.pending] := uch((w) and $ff); Inc(s.pending); {put_byte(s, (uch)((ush)(w) >> 8));} s.pending_buf^[s.pending] := uch(ush(w) shr 8);; Inc(s.pending); end *) { =========================================================================== Send a value on a given number of bits. IN assertion: length <= 16 and value fits in length bits. 
} {$ifdef ORG_DEBUG} {local} procedure send_bits(var s : deflate_state; value : int; { value to send } length : int); { number of bits } begin {$ifdef DEBUG} Tracevv(' l '+IntToStr(length)+ ' v '+IntToStr(value)); Assert((length > 0) and (length <= 15), 'invalid length'); Inc(s.bits_sent, ulg(length)); {$ENDIF} { If not enough room in bi_buf, use (valid) bits from bi_buf and (16 - bi_valid) bits from value, leaving (width - (16-bi_valid)) unused bits in value. } {$IFOPT Q+} {$Q-} {$DEFINE NoOverflowCheck} {$ENDIF} {$IFOPT R+} {$R-} {$DEFINE NoRangeCheck} {$ENDIF} if (s.bi_valid > int(Buf_size) - length) then begin s.bi_buf := s.bi_buf or int(value shl s.bi_valid); {put_short(s, s.bi_buf);} s.pending_buf^[s.pending] := uch(s.bi_buf and $ff); Inc(s.pending); s.pending_buf^[s.pending] := uch(ush(s.bi_buf) shr 8);; Inc(s.pending); s.bi_buf := ush(value) shr (Buf_size - s.bi_valid); Inc(s.bi_valid, length - Buf_size); end else begin s.bi_buf := s.bi_buf or int(value shl s.bi_valid); Inc(s.bi_valid, length); end; {$IFDEF NoOverflowCheck} {$Q+} {$UNDEF NoOverflowCheck} {$ENDIF} {$IFDEF NoRangeCheck} {$Q+} {$UNDEF NoRangeCheck} {$ENDIF} end; {$else} { !DEBUG } macro send_code(s, c, tree) begin send_bits(s, tree[c].Code, tree[c].Len); { Send a code of the given tree. 
c and tree must not have side effects }
end

macro send_bits(s, value, length) \
begin int len := length;\
  if (s^.bi_valid > (int)Buf_size - len) begin\
    int val := value;\
    s^.bi_buf |= (val << s^.bi_valid);\
    {put_short(s, s.bi_buf);}
    s.pending_buf^[s.pending] := uch(s.bi_buf and $ff);
    Inc(s.pending);
    s.pending_buf^[s.pending] := uch(ush(s.bi_buf) shr 8);;
    Inc(s.pending);
    s^.bi_buf := (ush)val >> (Buf_size - s^.bi_valid);\
    s^.bi_valid += len - Buf_size;\
  end else begin\
    s^.bi_buf |= (value) << s^.bi_valid;\
    s^.bi_valid += len;\
  end\
end;
{$endif} { DEBUG }

{ ===========================================================================
  bi_reverse returns the lowest len bits of code in mirrored order.
  The bits are moved one at a time; no lookup table is involved.
  IN assertion: 1 <= len <= 15
  The loop body runs at least once, whatever the value of len. }

{local}
function bi_reverse(code : unsigned;         { the value to invert }
                    len : int) : unsigned;   { its bit length }
var
  mirrored : unsigned;
begin
  mirrored := 0;
  repeat
    { take the current low bit of code, then open a free slot below it }
    mirrored := (mirrored or (code and 1)) shl 1;
    code := code shr 1;
    Dec(len);
  until not (len > 0);
  { drop the slot opened by the last pass }
  bi_reverse := mirrored shr 1;
end;

{ ===========================================================================
  gen_codes assigns a code to every tree element whose length is non zero.
  IN assertion: bl_count holds the number of codes for each bit length of
     this tree, and the len field of every element is already set.
  OUT assertion: the code field is set for every element with a non zero
     length; elements of length zero are left untouched.
  The bit counts are not required to describe an optimal tree. }

{local}
procedure gen_codes(tree : tree_ptr;  { the tree to decorate }
                    max_code : int;   { largest code with non zero frequency }
                    var bl_count : array of ushf);
                               { number of codes at each bit length }
var
  first_code : array[0..MAX_BITS+1-1] of ush; { next free code per bit length }
  running : ush;     { code value carried from one bit length to the next }
  width : int;       { bit length being processed }
  sym : int;         { index of the tree element being processed }
  sym_len : int;     { code length of that element }
begin
  running := 0;

  { Pass 1: derive the first (not yet reversed) code of every bit length
    from the distribution counts. }
  width := 1;
  while width <= MAX_BITS do
  begin
    running := ((running + bl_count[width-1]) shl 1);
    first_code[width] := running;
    Inc(width);
  end;

  { The counts are consistent only if the last code consists of ones. }
  {$IFDEF DEBUG}
  Assert (running + bl_count[MAX_BITS]-1 = (1 shl MAX_BITS)-1,
          'inconsistent bit counts');
  Tracev(#13'gen_codes: max_code '+IntToStr(max_code));
  {$ENDIF}

  { Pass 2: hand out the codes in element order, storing each one with its
    bits reversed. }
  for sym := 0 to max_code do
  begin
    sym_len := tree^[sym].dl.Len;
    if sym_len <> 0 then
    begin
      tree^[sym].fc.Code := bi_reverse(first_code[sym_len], sym_len);
      Inc(first_code[sym_len]);
      {$ifdef DEBUG}
      if (sym>31) and (sym<128) then
        Tracecv(tree <> tree_ptr(@static_ltree),
         (^M'n #'+IntToStr(sym)+' '+AnsiChar(sym)+' l '+IntToStr(sym_len)+' c '+
           IntToStr(tree^[sym].fc.Code)+' ('+IntToStr(first_code[sym_len]-1)+')'))
      else
        Tracecv(tree <> tree_ptr(@static_ltree),
        (^M'n #'+IntToStr(sym)+' l '+IntToStr(sym_len)+' c '+
           IntToStr(tree^[sym].fc.Code)+' ('+IntToStr(first_code[sym_len]-1)+')'));
      {$ENDIF}
    end;
  end;
end;

{ ===========================================================================
  Generate the file trees.h describing the static trees.
}
{$ifdef GEN_TREES_H}

macro SEPARATOR(i, last, width)
  if (i) = (last) then
    ( ^M');'^M^M
  else    \
    if (i) mod (width) = (width)-1 then
       ','^M
     else
       ', '

{ Writes the static tables (static_ltree, static_dtree, _dist_code,
  _length_code, base_length, base_dist) to the text file trees.inc.
  NOTE(review): this routine is only compiled when GEN_TREES_H is defined
  and still contains untranslated C idioms (the SEPARATOR macro and printf
  style format strings); it needs a real port before it can be enabled. }
procedure gen_trees_header;
var
  header : system.text;
  i : int;
begin
  system.assign(header, 'trees.inc');
  {$I-}
  ReWrite(header);
  {$I+}
  { IOResult is 0 on success, so that is the condition that must hold }
  Assert (IOresult = 0, 'Can''t open trees.h');
  WriteLn(header,
    '{ header created automatically with -DGEN_TREES_H }'^M);

  WriteLn(header, 'local const ct_data static_ltree[L_CODES+2] := (');
  for i := 0 to L_CODES+2-1 do
  begin
    WriteLn(header, '((%3u),(%3u))%s', static_ltree[i].Code,
            static_ltree[i].Len, SEPARATOR(i, L_CODES+1, 5));
  end;

  WriteLn(header, 'local const ct_data static_dtree[D_CODES] := (');
  for i := 0 to D_CODES-1 do
  begin
    WriteLn(header, '((%2u),(%2u))%s', static_dtree[i].Code,
            static_dtree[i].Len, SEPARATOR(i, D_CODES-1, 5));
  end;

  WriteLn(header, 'const uch _dist_code[DIST_CODE_LEN] := (');
  for i := 0 to DIST_CODE_LEN-1 do
  begin
    WriteLn(header, '%2u%s', _dist_code[i],
            SEPARATOR(i, DIST_CODE_LEN-1, 20));
  end;

  WriteLn(header, 'const uch _length_code[MAX_MATCH-MIN_MATCH+1]= (');
  for i := 0 to MAX_MATCH-MIN_MATCH+1-1 do
  begin
    WriteLn(header, '%2u%s', _length_code[i],
            SEPARATOR(i, MAX_MATCH-MIN_MATCH, 20));
  end;

  WriteLn(header, 'local const int base_length[LENGTH_CODES] := (');
  for i := 0 to LENGTH_CODES-1 do
  begin
    WriteLn(header, '%1u%s', base_length[i],
            SEPARATOR(i, LENGTH_CODES-1, 20));
  end;

  WriteLn(header, 'local const int base_dist[D_CODES] := (');
  for i := 0 to D_CODES-1 do
  begin
    WriteLn(header, '%5u%s', base_dist[i],
            SEPARATOR(i, D_CODES-1, 10));
  end;

  close(header);
end;
{$endif} { GEN_TREES_H }


{ ===========================================================================
  Initialize the various 'constant' tables.
}
{ When GEN_TREES_H is defined, the tables base_length, _length_code,
  base_dist, _dist_code, static_ltree and static_dtree are computed once
  (guarded by static_init_done) and then written out by gen_trees_header.
  Without GEN_TREES_H the procedure body is empty. }
{local}
procedure tr_static_init;

{$ifdef GEN_TREES_H}
const
  static_init_done : boolean = FALSE;
var
  n : int;        { iterates over tree elements }
  bits : int;     { bit counter }
  length : int;   { length value }
  code : int;     { code value }
  dist : int;     { distance index }
  bl_count : array[0..MAX_BITS+1-1] of ush;
    { number of codes at each bit length for an optimal tree }
begin
  if (static_init_done) then
    exit;

  { Initialize the mapping length (0..255) -> length code (0..28) }
  length := 0;
  for code := 0 to LENGTH_CODES-1-1 do
  begin
    base_length[code] := length;
    for n := 0 to (1 shl extra_lbits[code])-1 do
    begin
      _length_code[length] := uch(code);
      Inc(length);
    end;
  end;
  Assert (length = 256, 'tr_static_init: length <> 256');
  { Note that the length 255 (match length 258) can be represented
    in two different ways: code 284 + 5 bits or code 285, so we
    overwrite length_code[255] to use the best encoding: }

  { The control variable of a for loop is undefined once the loop has
    finished, so the last length code is named explicitly here instead of
    reusing "code". }
  _length_code[length-1] := uch(LENGTH_CODES-1);

  { Initialize the mapping dist (0..32K) -> dist code (0..29) }
  dist := 0;
  for code := 0 to 16-1 do
  begin
    base_dist[code] := dist;
    for n := 0 to (1 shl extra_dbits[code])-1 do
    begin
      _dist_code[dist] := uch(code);
      Inc(dist);
    end;
  end;
  Assert (dist = 256, 'tr_static_init: dist <> 256');
  dist := dist shr 7; { from now on, all distances are divided by 128 }
  for code := 16 to D_CODES-1 do
  begin
    base_dist[code] := dist shl 7;
    for n := 0 to (1 shl (extra_dbits[code]-7))-1 do
    begin
      _dist_code[256 + dist] := uch(code);
      Inc(dist);
    end;
  end;
  Assert (dist = 256, 'tr_static_init: 256+dist <> 512');

  { Construct the codes of the static literal tree }
  for bits := 0 to MAX_BITS do
    bl_count[bits] := 0;
  n := 0;
  while (n <= 143) do
  begin
    static_ltree[n].dl.Len := 8;
    Inc(n);
    Inc(bl_count[8]);
  end;
  while (n <= 255) do
  begin
    static_ltree[n].dl.Len := 9;
    Inc(n);
    Inc(bl_count[9]);
  end;
  while (n <= 279) do
  begin
    static_ltree[n].dl.Len := 7;
    Inc(n);
    Inc(bl_count[7]);
  end;
  while (n <= 287) do
  begin
    static_ltree[n].dl.Len := 8;
    Inc(n);
    Inc(bl_count[8]);
  end;

  { Codes 286 and 287 do not exist, but we must include them in the
    tree construction to get a canonical Huffman tree (longest code
    all ones)  }

  gen_codes(tree_ptr(@static_ltree), L_CODES+1, bl_count);

  { The static distance tree is trivial: }
  for n := 0 to D_CODES-1 do
  begin
    static_dtree[n].dl.Len := 5;
    static_dtree[n].fc.Code := bi_reverse(unsigned(n), 5);
  end;
  static_init_done := TRUE;

  gen_trees_header;  { save to include file }
{$else}
begin
{$endif} { GEN_TREES_H) }
end;

{ ===========================================================================
  Initialize a new block.

  Clears every frequency counter of the three dynamic trees, counts the
  END_BLOCK symbol once, and resets the per-block totals kept in s. }
{local}
procedure init_block(var s : deflate_state);
var
  n : int; { iterates over tree elements }
begin
  { Initialize the trees. }
  for n := 0 to L_CODES-1 do
    s.dyn_ltree[n].fc.Freq := 0;
  for n := 0 to D_CODES-1 do
    s.dyn_dtree[n].fc.Freq := 0;
  for n := 0 to BL_CODES-1 do
    s.bl_tree[n].fc.Freq := 0;

  s.dyn_ltree[END_BLOCK].fc.Freq := 1;
  s.static_len := Long(0);
  s.opt_len := Long(0);
  s.matches := 0;
  s.last_lit := 0;
end;

const
  SMALLEST = 1;
{ Index within the heap array of least frequent node in the Huffman tree }

{ ===========================================================================
  Initialize the tree data structures for a new zlib stream.

  Binds the three tree descriptors of s to their dynamic trees and static
  descriptors, empties the bit buffer and starts the first block. }
procedure _tr_init(var s : deflate_state);
begin
  tr_static_init;

  s.compressed_len := Long(0);

  s.l_desc.dyn_tree := tree_ptr(@s.dyn_ltree);
  s.l_desc.stat_desc := @static_l_desc;

  s.d_desc.dyn_tree := tree_ptr(@s.dyn_dtree);
  s.d_desc.stat_desc := @static_d_desc;

  s.bl_desc.dyn_tree := tree_ptr(@s.bl_tree);
  s.bl_desc.stat_desc := @static_bl_desc;

  s.bi_buf := 0;
  s.bi_valid := 0;
  s.last_eob_len := 8; { enough lookahead for inflate }
  {$ifdef DEBUG}
  s.bits_sent := Long(0);
  {$endif}

  { Initialize the first block of the first file: }
  init_block(s);
end;

{ ===========================================================================
  Remove the smallest element from the heap and recreate the heap with
  one less element. Updates heap and heap_len.
macro pqremove(s, tree, top)
begin
    top := s.heap[SMALLEST];
    s.heap[SMALLEST] := s.heap[s.heap_len];
    Dec(s.heap_len);
    pqdownheap(s, tree, SMALLEST);
end
}

{ ===========================================================================
  Compares to subtrees, using the tree depth as tie breaker when
  the subtrees have equal frequency. This minimizes the worst case length.

macro smaller(tree, n, m, depth)
   ( (tree[n].Freq < tree[m].Freq) or
     ((tree[n].Freq = tree[m].Freq) and (depth[n] <= depth[m])) )
}

{ ===========================================================================
  Sift the node stored at heap position k down until neither of its sons
  is smaller, so that the heap property (each father smaller than its two
  sons) holds again below k. Only s.heap is modified. }
{local}
procedure pqdownheap(var s : deflate_state;
                     var tree : tree_type;   { the tree to restore }
                     k : int);               { node to move down }
var
  moving : int;   { tree index of the node being moved down }
  son : int;      { heap position of the son under consideration }

  { TRUE when tree node a sorts before tree node b: lower frequency first,
    and on equal frequency the node with the lower or equal depth. }
  function smaller(a, b : int) : boolean;
  begin
    smaller := (tree[a].fc.Freq < tree[b].fc.Freq) or
               ((tree[a].fc.Freq = tree[b].fc.Freq) and
                (s.depth[a] <= s.depth[b]));
  end;

begin
  moving := s.heap[k];
  son := k shl 1;  { left son of k }
  while (son <= s.heap_len) do
  begin
    { Pick the smaller of the two sons when a right son exists }
    if (son < s.heap_len) and smaller(s.heap[son+1], s.heap[son]) then
      Inc(son);

    { Stop as soon as the moving node is smaller than both sons }
    if smaller(moving, s.heap[son]) then
      break;

    { Pull the smaller son up and descend into its former place }
    s.heap[k] := s.heap[son];
    k := son;
    son := son shl 1;
  end;
  s.heap[k] := moving;
end;

{ ===========================================================================
  Compute the optimal bit lengths for a tree and update the total bit length
  for the current block.
  IN assertion: the fields freq and dad are set, heap[heap_max] and
     above are the tree nodes sorted by increasing frequency.
  OUT assertions: the field len is set to the optimal bit length, the
      array bl_count contains the frequencies for each bit length.
      The length opt_len is updated; static_len is also updated if stree is
      not null. }

{ Lengths are derived top-down from the father links, clamped to the
  max_length of the static descriptor; when clamping happened, bl_count is
  rebalanced and the leaf lengths are reassigned from it. }
{local}
procedure gen_bitlen(var s : deflate_state;
                     var desc : tree_desc);   { the tree descriptor }
var
  tree : tree_ptr;
  max_code : int;
  stree : tree_ptr; {const}
  extra : pzIntfArray; {const}
  base : int;
  max_length : int;
  h : int;              { heap index }
  n, m : int;           { iterate over the tree elements }
  bits : int;           { bit length }
  xbits : int;          { extra bits }
  f : ush;              { frequency }
  overflow : int;   { number of elements with bit length too large }
begin
  { Cache the descriptor fields used throughout the routine }
  tree := desc.dyn_tree;
  max_code := desc.max_code;
  stree := desc.stat_desc^.static_tree;
  extra := desc.stat_desc^.extra_bits;
  base := desc.stat_desc^.extra_base;
  max_length := desc.stat_desc^.max_length;
  overflow := 0;

  for bits := 0 to MAX_BITS do
    s.bl_count[bits] := 0;

  { In a first pass, compute the optimal bit lengths (which may
    overflow in the case of the bit length tree). }

  tree^[s.heap[s.heap_max]].dl.Len := 0; { root of the heap }

  { Every father precedes its sons in heap[heap_max..], so the length of
    the father is already known when a node is visited }
  for h := s.heap_max+1 to HEAP_SIZE-1 do
  begin
    n := s.heap[h];
    bits := tree^[tree^[n].dl.Dad].dl.Len + 1;
    if (bits > max_length) then
    begin
      bits := max_length;
      Inc(overflow);
    end;
    tree^[n].dl.Len := ush(bits);
    { We overwrite tree[n].dl.Dad which is no longer needed }

    if (n > max_code) then
      continue; { not a leaf node }

    Inc(s.bl_count[bits]);
    xbits := 0;
    if (n >= base) then
      xbits := extra^[n-base];
    f := tree^[n].fc.Freq;
    { Each occurrence costs the code length plus its extra bits }
    Inc(s.opt_len, ulg(f) * (bits + xbits));
    if (stree <> NIL) then
      Inc(s.static_len, ulg(f) * (stree^[n].dl.Len + xbits));
  end;
  if (overflow = 0) then
    exit;
  {$ifdef DEBUG}
  Tracev(^M'bit length overflow');
  {$endif}
  { This happens for example on obj2 and pic of the Calgary corpus }

  { Find the first bit length which could increase: }
  repeat
    bits := max_length-1;
    while (s.bl_count[bits] = 0) do
      Dec(bits);
    Dec(s.bl_count[bits]);      { move one leaf down the tree }
    Inc(s.bl_count[bits+1], 2); { move one overflow item as its brother }
    Dec(s.bl_count[max_length]);
    { The brother of the overflow item also moves one step up,
      but this does not affect bl_count[max_length] }

    Dec(overflow, 2);
  until (overflow <= 0);

  { Now recompute all bit lengths, scanning in increasing frequency.
    h is still equal to HEAP_SIZE. (It is simpler to reconstruct all
    lengths instead of fixing only the wrong ones. This idea is taken
    from 'ar' written by Haruhiko Okumura.) }
  h := HEAP_SIZE;  { Delphi3: compiler warning w/o this }
  for bits := max_length downto 1 do
  begin
    n := s.bl_count[bits];
    { Hand out this length to the next n leaves, walking the heap array
      backwards from its end }
    while (n <> 0) do
    begin
      Dec(h);
      m := s.heap[h];
      if (m > max_code) then
        continue;   { internal node: does not consume a length }
      if (tree^[m].dl.Len <> unsigned(bits)) then
      begin
        {$ifdef DEBUG}
        Trace('code '+IntToStr(m)+' bits '+IntToStr(tree^[m].dl.Len)
              +'.'+IntToStr(bits));
        {$ENDIF}
        { Adjust opt_len by the change in length times the frequency }
        Inc(s.opt_len, (long(bits) - long(tree^[m].dl.Len))
                        * long(tree^[m].fc.Freq) );
        tree^[m].dl.Len := ush(bits);
      end;
      Dec(n);
    end;
  end;
end;

{ ===========================================================================
  Construct one Huffman tree and assigns the code bit strings and lengths.
  Update the total bit length for the current block.
  IN assertion: the field freq is set for all tree elements.
  OUT assertions: the fields len and code are set to the optimal bit length
      and corresponding code. The length opt_len is updated; static_len is
      also updated if stree is not null. The field max_code is set. }

{ Uses s.heap, s.heap_len, s.heap_max and s.depth as working storage and
  finishes by calling gen_bitlen and gen_codes. }
{local}
procedure build_tree(var s : deflate_state;
                     var desc : tree_desc); { the tree descriptor }

var
  tree : tree_ptr;
  stree : tree_ptr; {const}
  elems : int;
  n, m : int;          { iterate over heap elements }
  max_code : int;      { largest code with non zero frequency }
  node : int;          { new node being created }
begin
  tree := desc.dyn_tree;
  stree := desc.stat_desc^.static_tree;
  elems := desc.stat_desc^.elems;
  max_code := -1;

  { Construct the initial heap, with least frequent element in
    heap[SMALLEST]. The sons of heap[n] are heap[2*n] and heap[2*n+1].
    heap[0] is not used. }
  s.heap_len := 0;
  s.heap_max := HEAP_SIZE;

  for n := 0 to elems-1 do
  begin
    if (tree^[n].fc.Freq <> 0) then
    begin
      max_code := n;
      Inc(s.heap_len);
      s.heap[s.heap_len] := n;
      s.depth[n] := 0;
    end
    else
    begin
      { unused symbol: gets code length 0 }
      tree^[n].dl.Len := 0;
    end;
  end;

  { The pkzip format requires that at least one distance code exists,
    and that at least one bit should be sent even if there is only one
    possible code. So to avoid special checks later on we force at least
    two codes of non zero frequency. }

  while (s.heap_len < 2) do
  begin
    Inc(s.heap_len);
    if (max_code < 2) then
    begin
      Inc(max_code);
      s.heap[s.heap_len] := max_code;
      node := max_code;
    end
    else
    begin
      s.heap[s.heap_len] := 0;
      node := 0;
    end;
    tree^[node].fc.Freq := 1;
    s.depth[node] := 0;
    { Compensate in advance for the bits gen_bitlen will count for this
      artificial symbol }
    Dec(s.opt_len);
    if (stree <> NIL) then
      Dec(s.static_len, stree^[node].dl.Len);
    { node is 0 or 1 so it does not have extra bits }
  end;
  desc.max_code := max_code;

  { The elements heap[heap_len/2+1 .. heap_len] are leaves of the tree,
    establish sub-heaps of increasing lengths: }

  for n := s.heap_len div 2 downto 1 do
    pqdownheap(s, tree^, n);

  { Construct the Huffman tree by repeatedly combining the least two
    frequent nodes. }

  node := elems;              { next internal node of the tree }
  repeat
    {pqremove(s, tree, n);}  { n := node of least frequency }
    n := s.heap[SMALLEST];
    s.heap[SMALLEST] := s.heap[s.heap_len];
    Dec(s.heap_len);
    pqdownheap(s, tree^, SMALLEST);

    m := s.heap[SMALLEST]; { m := node of next least frequency }

    { The removed nodes are stored downwards from the top of the heap
      array, which is where gen_bitlen reads them back }
    Dec(s.heap_max);
    s.heap[s.heap_max] := n; { keep the nodes sorted by frequency }
    Dec(s.heap_max);
    s.heap[s.heap_max] := m;

    { Create a new node father of n and m }
    tree^[node].fc.Freq := tree^[n].fc.Freq + tree^[m].fc.Freq;
    { maximum }
    if (s.depth[n] >= s.depth[m]) then
      s.depth[node] := uch (s.depth[n] + 1)
    else
      s.depth[node] := uch (s.depth[m] + 1);

    tree^[m].dl.Dad := ush(node);
    tree^[n].dl.Dad := ush(node);
    {$ifdef DUMP_BL_TREE}
    if (tree = tree_ptr(@s.bl_tree)) then
    begin
      WriteLn(#13'node ',node,'(',tree^[node].fc.Freq,') sons ',n,
              '(',tree^[n].fc.Freq,') ', m, '(',tree^[m].fc.Freq,')');
    end;
    {$endif}
    { and insert the new node in the heap }
    s.heap[SMALLEST] := node;
    Inc(node);
    pqdownheap(s, tree^, SMALLEST);

  until (s.heap_len < 2);

  { The last remaining heap element is the root of the tree }
  Dec(s.heap_max);
  s.heap[s.heap_max] := s.heap[SMALLEST];

  { At this point, the fields freq and dad are set. We can now
    generate the bit lengths. }

  gen_bitlen(s, desc);

  { The field len is now set, we can generate the bit codes }
  gen_codes (tree, max_code, s.bl_count);
end;

{ ===========================================================================
  Scan a literal or distance tree to determine the frequencies of the codes
  in the bit length tree. }

{ Runs of equal code lengths in tree[0..max_code] are counted into
  s.bl_tree[..].fc.Freq, either under the length itself or under one of the
  repeat symbols REP_3_6, REPZ_3_10 and REPZ_11_138. The element
  tree[max_code+1] is overwritten with a guard length. }
{local}
procedure scan_tree(var s : deflate_state;
                    var tree : array of ct_data;    { the tree to be scanned }
                    max_code : int);    { and its largest code of non zero frequency }
var
  n : int;                 { iterates over all tree elements }
  prevlen : int;           { last emitted length }
  curlen : int;            { length of current code }
  nextlen : int;           { length of next code }
  count : int;             { repeat count of the current code }
  max_count : int;         { max repeat count }
  min_count : int;         { min repeat count }
begin
  prevlen := -1;
  nextlen := tree[0].dl.Len;
  count := 0;
  max_count := 7;
  min_count := 4;

  { A run of zero lengths may be longer than a run of non zero lengths }
  if (nextlen = 0) then
  begin
    max_count := 138;
    min_count := 3;
  end;
  tree[max_code+1].dl.Len := ush($ffff); { guard }

  for n := 0 to max_code do
  begin
    curlen := nextlen;
    nextlen := tree[n+1].dl.Len;
    Inc(count);
    if (count < max_count) and (curlen = nextlen) then
      continue   { the run goes on }
    else
      if (count < min_count) then
        { too short for a repeat symbol: count each length separately }
        Inc(s.bl_tree[curlen].fc.Freq, count)
      else
        if (curlen <> 0) then
        begin
          if (curlen <> prevlen) then
            Inc(s.bl_tree[curlen].fc.Freq);
          Inc(s.bl_tree[REP_3_6].fc.Freq);
        end
        else
          if (count <= 10) then
            Inc(s.bl_tree[REPZ_3_10].fc.Freq)
          else
            Inc(s.bl_tree[REPZ_11_138].fc.Freq);

    { Start a new run and choose its limits from the upcoming length }
    count := 0;
    prevlen := curlen;
    if (nextlen = 0) then
    begin
      max_count := 138;
      min_count := 3;
    end
    else
      if (curlen = nextlen) then
      begin
        max_count := 6;
        min_count := 3;
      end
      else
      begin
        max_count := 7;
        min_count := 4;
      end;
  end;
end;

{ ===========================================================================
  Send a literal or distance tree in compressed form, using the codes in
  bl_tree.
}

{ Walks tree[0..max_code] with the same run detection as scan_tree and
  emits, through send_bits, either the bl_tree code of each length or one
  of the repeat codes REP_3_6, REPZ_3_10, REPZ_11_138 followed by the
  repeat count in 2, 3 or 7 bits. Reads tree[max_code+1], which is expected
  to hold the guard written by scan_tree. }
{local}
procedure send_tree(var s : deflate_state;
                    var tree : array of ct_data;    { the tree to be scanned }
                    max_code : int);    { and its largest code of non zero frequency }

var
  n : int;                { iterates over all tree elements }
  prevlen : int;          { last emitted length }
  curlen : int;           { length of current code }
  nextlen : int;          { length of next code }
  count : int;            { repeat count of the current code }
  max_count : int;        { max repeat count }
  min_count : int;        { min repeat count }
begin
  prevlen := -1;
  nextlen := tree[0].dl.Len;
  count := 0;
  max_count := 7;
  min_count := 4;

  { tree[max_code+1].dl.Len := -1; }  { guard already set }
  if (nextlen = 0) then
  begin
    max_count := 138;
    min_count := 3;
  end;

  for n := 0 to max_code do
  begin
    curlen := nextlen;
    nextlen := tree[n+1].dl.Len;
    Inc(count);
    if (count < max_count) and (curlen = nextlen) then
      continue   { the run goes on }
    else
      if (count < min_count) then
      begin
        { run too short for a repeat code: send the length count times }
        repeat
          {$ifdef DEBUG}
          Tracevvv(#13'cd '+IntToStr(curlen));
          {$ENDIF}
          send_bits(s, s.bl_tree[curlen].fc.Code, s.bl_tree[curlen].dl.Len);
          Dec(count);
        until (count = 0);
      end
      else
        if (curlen <> 0) then
        begin
          { a new non zero length is sent once, then repeated with REP_3_6 }
          if (curlen <> prevlen) then
          begin
            {$ifdef DEBUG}
            Tracevvv(#13'cd '+IntToStr(curlen));
            {$ENDIF}
            send_bits(s, s.bl_tree[curlen].fc.Code, s.bl_tree[curlen].dl.Len);
            Dec(count);
          end;
          {$IFDEF DEBUG}
          Assert((count >= 3) and (count <= 6), ' 3_6?');
          {$ENDIF}
          {$ifdef DEBUG}
          Tracevvv(#13'cd '+IntToStr(REP_3_6));
          {$ENDIF}
          send_bits(s, s.bl_tree[REP_3_6].fc.Code, s.bl_tree[REP_3_6].dl.Len);
          send_bits(s, count-3, 2);
        end
        else
          if (count <= 10) then
          begin
            {$ifdef DEBUG}
            Tracevvv(#13'cd '+IntToStr(REPZ_3_10));
            {$ENDIF}
            send_bits(s, s.bl_tree[REPZ_3_10].fc.Code, s.bl_tree[REPZ_3_10].dl.Len);
            send_bits(s, count-3, 3);
          end
          else
          begin
            {$ifdef DEBUG}
            Tracevvv(#13'cd '+IntToStr(REPZ_11_138));
            {$ENDIF}
            send_bits(s, s.bl_tree[REPZ_11_138].fc.Code, s.bl_tree[REPZ_11_138].dl.Len);
            send_bits(s, count-11, 7);
          end;

    { Start a new run and choose its limits from the upcoming length }
    count := 0;
    prevlen := curlen;
    if (nextlen = 0) then
    begin
      max_count := 138;
      min_count := 3;
    end
    else
      if (curlen = nextlen) then
      begin
        max_count := 6;
        min_count := 3;
      end
      else
      begin
        max_count := 7;
        min_count := 4;
      end;
  end;
end;

{ ===========================================================================
  Construct the Huffman tree for the bit lengths and return the index in
  bl_order of the last bit length code to send.

  Also adds to s.opt_len the 3 bits needed per transmitted bit length code
  and the 5+5+4 bits of the three counts. }
{local}
function build_bl_tree(var s : deflate_state) : int;
var
  max_blindex : int;  { index of last bit length code of non zero freq }
begin
  { Determine the bit length frequencies for literal and distance trees }
  scan_tree(s, s.dyn_ltree, s.l_desc.max_code);
  scan_tree(s, s.dyn_dtree, s.d_desc.max_code);

  { Build the bit length tree: }
  build_tree(s, s.bl_desc);
  { opt_len now includes the length of the tree representations, except
    the lengths of the bit lengths codes and the 5+5+4 bits for the counts. }

  { Determine the number of bit length codes to send. The pkzip format
    requires that at least 4 bit length codes be sent. (appnote.txt says
    3 but the actual value used is 4.) }

  { A while loop is used because the control variable of a for loop is
    undefined once the loop has run to completion; here the index is 2
    when no used code is found at positions 3..BL_CODES-1. }
  max_blindex := BL_CODES-1;
  while (max_blindex >= 3) and
        (s.bl_tree[bl_order[max_blindex]].dl.Len = 0) do
    Dec(max_blindex);

  { Update opt_len to include the bit length tree and counts }
  Inc(s.opt_len, 3*(max_blindex+1) + 5+5+4);
  {$ifdef DEBUG}
  Tracev(^M'dyn trees: dyn %ld, stat %ld {s.opt_len, s.static_len}');
  {$ENDIF}

  build_bl_tree := max_blindex;
end;

{ ===========================================================================
  Send the header for a block using dynamic Huffman trees: the counts, the
  lengths of the bit length codes, the literal tree and the distance tree.
  IN assertion: lcodes >= 257, dcodes >= 1, blcodes >= 4.
}

{ Emits, in this order: the three counts (5, 5 and 4 bits), one 3 bit
  length per bit length code in bl_order sequence, then the literal tree
  and the distance tree through send_tree. }
{local}
procedure send_all_trees(var s : deflate_state;
                         lcodes : int;
                         dcodes : int;
                         blcodes : int); { number of codes for each tree }
var
  idx : int;   { position in bl_order }
begin
  {$IFDEF DEBUG}
  Assert ((lcodes >= 257) and (dcodes >= 1) and (blcodes >= 4),
          'not enough codes');
  Assert ((lcodes <= L_CODES) and (dcodes <= D_CODES)
          and (blcodes <= BL_CODES), 'too many codes');
  Tracev(^M'bl counts: ');
  {$ENDIF}

  { Counts are stored with their minimum subtracted }
  send_bits(s, lcodes-257, 5); { not +255 as stated in appnote.txt }
  send_bits(s, dcodes-1,   5);
  send_bits(s, blcodes-4,  4); { not -3 as stated in appnote.txt }

  idx := 0;
  while (idx < blcodes) do
  begin
    {$ifdef DEBUG}
    Tracev(^M'bl code '+IntToStr(bl_order[idx]));
    {$ENDIF}
    send_bits(s, s.bl_tree[bl_order[idx]].dl.Len, 3);
    Inc(idx);
  end;
  {$ifdef DEBUG}
  Tracev(^M'bl tree: sent '+IntToStr(s.bits_sent));
  {$ENDIF}

  { literal tree }
  send_tree(s, s.dyn_ltree, lcodes-1);
  {$ifdef DEBUG}
  Tracev(^M'lit tree: sent '+IntToStr(s.bits_sent));
  {$ENDIF}

  { distance tree }
  send_tree(s, s.dyn_dtree, dcodes-1);
  {$ifdef DEBUG}
  Tracev(^M'dist tree: sent '+IntToStr(s.bits_sent));
  {$ENDIF}
end;

{ ===========================================================================
  Write out whatever is left in the bit buffer, padded to whole bytes, and
  leave the buffer empty: two bytes when more than 8 bits are pending, one
  byte when 1 to 8 bits are pending, nothing otherwise. }
{local}
procedure bi_windup(var s : deflate_state);
begin
  if (s.bi_valid > 0) then
  begin
    if (s.bi_valid > 8) then
    begin
      {put_short(s, s.bi_buf);}
      s.pending_buf^[s.pending] := uch(s.bi_buf and $ff);
      Inc(s.pending);
      s.pending_buf^[s.pending] := uch(ush(s.bi_buf) shr 8);
      Inc(s.pending);
    end
    else
    begin
      {put_byte(s, (Byte)s^.bi_buf);}
      s.pending_buf^[s.pending] := Byte(s.bi_buf);
      Inc(s.pending);
    end;
  end;

  s.bi_valid := 0;
  s.bi_buf := 0;
  {$ifdef DEBUG}
  s.bits_sent := (s.bits_sent+7) and (not 7);
  {$endif}
end;

{ ===========================================================================
  Copy a stored block, storing first the length and its
  one's complement if requested.
}

{ Aligns the output on a byte boundary with bi_windup, optionally writes
  len and (not len) as two 16 bit words, low byte first, and then appends
  len bytes read from buf to s.pending_buf. }
{local}
procedure copy_block(var s : deflate_state;
                     buf : pcharf;       { the input data }
                     len : unsigned;     { its length }
                     header : boolean);  { true if block header must be written }
var
  remaining : unsigned;   { bytes still to be copied }

  { Append a 16 bit word to the pending buffer, low byte first }
  procedure put_short(w : ush);
  begin
    s.pending_buf^[s.pending] := uch(w and $ff);
    Inc(s.pending);
    s.pending_buf^[s.pending] := uch(w shr 8);
    Inc(s.pending);
  end;

begin
  bi_windup(s);           { align on byte boundary }
  s.last_eob_len := 8;    { enough lookahead for inflate }

  if (header) then
  begin
    put_short(ush(len));
    put_short(ush(not len));
    {$ifdef DEBUG}
    Inc(s.bits_sent, 2*16);
    {$endif}
  end;
  {$ifdef DEBUG}
  Inc(s.bits_sent, ulg(len shl 3));
  {$endif}

  remaining := len;
  while (remaining > 0) do
  begin
    {put_byte(s, *buf++);}
    s.pending_buf^[s.pending] := buf^;
    Inc(s.pending);
    Inc(buf);
    Dec(remaining);
  end;
end;


{ ===========================================================================
  Send a stored block: the 3 bit block header, then the data with its
  length words through copy_block. s.compressed_len is rounded up to a
  byte boundary and advanced by the data plus 4 header bytes. }
procedure _tr_stored_block(var s : deflate_state;
                           buf : pcharf;     { input block }
                           stored_len : ulg; { length of input block }
                           eof : boolean);   { true if this is the last block for a file }
begin
  { send block type }
  send_bits(s, (STORED_BLOCK shl 1)+ord(eof), 3);

  s.compressed_len := (s.compressed_len + 3 + 7) and ulg(not Long(7));
  Inc(s.compressed_len, (stored_len + 4) shl 3);

  { with header }
  copy_block(s, buf, unsigned(stored_len), TRUE);
end;

{ ===========================================================================
  Flush the bit buffer, keeping at most 7 bits in it.
}

{ With exactly 16 bits pending the whole buffer is written and cleared;
  with 8 or more bits pending the low byte is written and the rest is
  shifted down. Fewer than 8 pending bits are left untouched. }
{local}
procedure bi_flush(var s : deflate_state);
begin
  if (s.bi_valid >= 8) then
  begin
    if (s.bi_valid = 16) then
    begin
      {put_short(s, s.bi_buf);}
      s.pending_buf^[s.pending] := uch(s.bi_buf and $ff);
      Inc(s.pending);
      s.pending_buf^[s.pending] := uch(ush(s.bi_buf) shr 8);
      Inc(s.pending);

      s.bi_buf := 0;
      s.bi_valid := 0;
    end
    else
    begin
      {put_byte(s, (Byte)s^.bi_buf);}
      s.pending_buf^[s.pending] := Byte(s.bi_buf);
      Inc(s.pending);

      s.bi_buf := s.bi_buf shr 8;
      Dec(s.bi_valid, 8);
    end;
  end;
end;


{ ===========================================================================
  Send one empty static block to give enough lookahead for inflate.
  This takes 10 bits, of which 7 may remain in the bit buffer.
  The current inflate code requires 9 bits of lookahead. If the
  last two codes for the previous block (real code plus EOB) were coded
  on 5 bits or less, inflate may have only 5+3 bits of lookahead to decode
  the last real code. In this case we send two empty static blocks instead
  of one. (There are no problems if the previous block is stored or fixed.)
  To simplify the code, we assume the worst case of last real code encoded
  on one bit only. }
procedure _tr_align(var s : deflate_state);

  { Emit one empty static block (3 bit header plus the END_BLOCK code),
    account for its 10 bits and flush the complete bytes. }
  procedure send_empty_static_block;
  begin
    send_bits(s, STATIC_TREES shl 1, 3);
    {$ifdef DEBUG}
    Tracevvv(#13'cd '+IntToStr(END_BLOCK));
    {$ENDIF}
    send_bits(s, static_ltree[END_BLOCK].fc.Code, static_ltree[END_BLOCK].dl.Len);
    Inc(s.compressed_len, Long(10)); { 3 for block type, 7 for EOB }
    bi_flush(s);
  end;

begin
  send_empty_static_block;

  { Of the 10 bits for the empty block, we have already sent
    (10 - bi_valid) bits. The lookahead for the last real code (before
    the EOB of the previous block) was thus at least one plus the length
    of the EOB plus what we have just sent of the empty static block. }
  if (1 + s.last_eob_len + 10 - s.bi_valid < 9) then
    send_empty_static_block;

  s.last_eob_len := 7;
end;

{ ===========================================================================
  Set the data type to ASCII or BINARY, using a crude approximation:
  binary if more than 20% of the bytes are <= 6 or >= 128, ascii otherwise.
  IN assertion: the fields freq of dyn_ltree are set and the total of all
  frequencies does not exceed 64K (to fit in an int on 16 bit machines). }
{local}
procedure set_data_type(var s : deflate_state);
var
  n : int;
  ascii_freq : unsigned;
  bin_freq : unsigned;
begin
  ascii_freq := 0;
  bin_freq := 0;

  { literals 0..6 count as binary }
  for n := 0 to 6 do
    Inc(bin_freq, s.dyn_ltree[n].fc.Freq);

  { literals 7..127 count as text }
  for n := 7 to 127 do
    Inc(ascii_freq, s.dyn_ltree[n].fc.Freq);

  { literals 128..LITERALS-1 count as binary }
  for n := 128 to LITERALS-1 do
    Inc(bin_freq, s.dyn_ltree[n].fc.Freq);

  if (bin_freq > (ascii_freq shr 2)) then
    s.data_type := Byte(Z_BINARY)
  else
    s.data_type := Byte(Z_ASCII);
end;

{ ===========================================================================
  Send the block data compressed using the given Huffman trees

  Replays the s.last_lit entries recorded in s.d_buf and s.l_buf: a zero
  distance means a literal, anything else a length and distance pair with
  their extra bits. The END_BLOCK code is sent last and its length is
  remembered in s.last_eob_len. }
{local}
procedure compress_block(var s : deflate_state;
                         var ltree : array of ct_data;   { literal tree }
                         var dtree : array of ct_data);  { distance tree }
var
  dist : unsigned;      { distance of matched string }
  lc : int;             { match length or unmatched char (if dist == 0) }
  lx : unsigned;        { running index in l_buf }
  code : unsigned;      { the code to send }
  extra : int;          { number of extra bits to send }
  lsym : unsigned;      { index of the length symbol in ltree }
begin
  lx := 0;
  if (s.last_lit <> 0) then
  repeat
    dist := s.d_buf^[lx];
    lc := s.l_buf^[lx];
    Inc(lx);

    if (dist = 0) then
    begin
      { send a literal byte }
      {$ifdef DEBUG}
      Tracevvv(#13'cd '+IntToStr(lc));
      Tracecv((lc > 31) and (lc < 128), ' '+AnsiChar(lc)+' ');
      {$ENDIF}
      send_bits(s, ltree[lc].fc.Code, ltree[lc].dl.Len);
    end
    else
    begin
      { Here, lc is the match length - MIN_MATCH }
      code := _length_code[lc];
      lsym := code+LITERALS+1;
      { send the length code }
      {$ifdef DEBUG}
      Tracevvv(#13'cd '+IntToStr(code+LITERALS+1));
      {$ENDIF}
      send_bits(s, ltree[lsym].fc.Code, ltree[lsym].dl.Len);

      extra := extra_lbits[code];
      if (extra <> 0) then
      begin
        Dec(lc, base_length[code]);
        send_bits(s, lc, extra);       { send the extra length bits }
      end;

      Dec(dist); { dist is now the match distance - 1 }
      {code := d_code(dist);}
      if (dist >= 256) then
        code := _dist_code[256+(dist shr 7)]
      else
        code := _dist_code[dist];

      {$IFDEF DEBUG}
      Assert (code < D_CODES, 'bad d_code');
      {$ENDIF}

      { send the distance code }
      {$ifdef DEBUG}
      Tracevvv(#13'cd '+IntToStr(code));
      {$ENDIF}
      send_bits(s, dtree[code].fc.Code, dtree[code].dl.Len);

      extra := extra_dbits[code];
      if (extra <> 0) then
      begin
        Dec(dist, base_dist[code]);
        send_bits(s, dist, extra);   { send the extra distance bits }
      end;
    end; { literal or match pair ? }

    { Check that the overlay between pending_buf and d_buf+l_buf is ok: }
    {$IFDEF DEBUG}
    Assert(s.pending < s.lit_bufsize + 2*lx, 'pendingBuf overflow');
    {$ENDIF}
  until (lx >= s.last_lit);

  {$ifdef DEBUG}
  Tracevvv(#13'cd '+IntToStr(END_BLOCK));
  {$ENDIF}
  send_bits(s, ltree[END_BLOCK].fc.Code, ltree[END_BLOCK].dl.Len);
  s.last_eob_len := ltree[END_BLOCK].dl.Len;
end;


{ ===========================================================================
  Determine the best encoding for the current block: dynamic trees, static
  trees or store, and output the encoded block to the zip file. This function
  returns the total compressed length for the file so far.
}

{ Outline: when s.level > 0 the literal, distance and bit length trees are
  built and the dynamic and static sizes are compared in bytes; otherwise a
  stored block is forced. The block is then written as stored, static or
  dynamic, the per-block state is reset with init_block, and on eof the bit
  buffer is flushed. The result is s.compressed_len shr 3.
  The branches are chained with "end else" across conditional compilation
  sections, so the statement order below must not be changed. }
function _tr_flush_block (var s : deflate_state;
         buf : pcharf;         { input block, or NULL if too old }
         stored_len : ulg;     { length of input block }
         eof : boolean) : ulg; { true if this is the last block for a file }
var
  opt_lenb, static_lenb : ulg; { opt_len and static_len in bytes }
  max_blindex : int;  { index of last bit length code of non zero freq }
begin
  max_blindex := 0;

  { Build the Huffman trees unless a stored block is forced }
  if (s.level > 0) then
  begin
    { Check if the file is ascii or binary }
    if (s.data_type = Z_UNKNOWN) then
      set_data_type(s);

    { Construct the literal and distance trees }
    build_tree(s, s.l_desc);
    {$ifdef DEBUG}
    Tracev(^M'lit data: dyn %ld, stat %ld {s.opt_len, s.static_len}');
    {$ENDIF}

    build_tree(s, s.d_desc);
    {$ifdef DEBUG}
    Tracev(^M'dist data: dyn %ld, stat %ld {s.opt_len, s.static_len}');
    {$ENDIF}
    { At this point, opt_len and static_len are the total bit lengths of
      the compressed block data, excluding the tree representations. }

    { Build the bit length tree for the above two trees, and get the index
      in bl_order of the last bit length code to send. }
    max_blindex := build_bl_tree(s);

    { Determine the best encoding. Compute first the block length in bytes}
    { (3 bits of block header are added, then rounded up to whole bytes) }
    opt_lenb := (s.opt_len+3+7) shr 3;
    static_lenb := (s.static_len+3+7) shr 3;

    {$ifdef DEBUG}
    Tracev(^M'opt %lu(%lu) stat %lu(%lu) stored %lu lit %u '+
            '{opt_lenb, s.opt_len, static_lenb, s.static_len, stored_len,'+
            's.last_lit}');
    {$ENDIF}

    { From here on opt_lenb is the smaller of the two sizes; equality with
      static_lenb later selects the static trees }
    if (static_lenb <= opt_lenb) then
      opt_lenb := static_lenb;

  end
  else
  begin
    {$IFDEF DEBUG}
    Assert(buf <> pcharf(NIL), 'lost buf');
    {$ENDIF}
    static_lenb := stored_len + 5;
    opt_lenb := static_lenb;        { force a stored block }
  end;

  { If compression failed and this is the first and last block,
    and if the .zip file can be seeked (to rewrite the local header),
    the whole file is transformed into a stored file:  }

  { NOTE(review): the STORED_FILE_OK section below is untranslated
    pseudo-code and is only seen by the compiler if that symbol is defined. }
{$ifdef STORED_FILE_OK}
{$ifdef FORCE_STORED_FILE}
  if eof and (s.compressed_len = Long(0)) then
  begin { force stored file }
{$else}
  if (stored_len <= opt_lenb) and eof and (s.compressed_len=Long(0))
     and seekable()) do
  begin
{$endif}
    { Since LIT_BUFSIZE <= 2*WSIZE, the input data must be there: }
    if (buf = pcharf(0)) then
      error ('block vanished');

    copy_block(buf, unsigned(stored_len), 0); { without header }
    s.compressed_len := stored_len shl 3;
    s.method := STORED;
  end
  else
{$endif} { STORED_FILE_OK }

{$ifdef FORCE_STORED}
  if (buf <> pcharf(0)) then
  begin { force stored block }
{$else}
  if (stored_len+4 <= opt_lenb) and (buf <> pcharf(0)) then
  begin
                     { 4: two words for the lengths }
{$endif}
    { The test buf <> NULL is only necessary if LIT_BUFSIZE > WSIZE.
      Otherwise we can't have processed more than WSIZE input bytes since
      the last block flush, because compression would have been
      successful. If LIT_BUFSIZE <= WSIZE, it is never too late to
      transform a block into a stored block. }

    _tr_stored_block(s, buf, stored_len, eof);

{$ifdef FORCE_STATIC}
  end
  else
    if (static_lenb >= 0) then
    begin { force static trees }
{$else}
  end
  else
    if (static_lenb = opt_lenb) then
    begin
{$endif}
      { Static trees: block header, then the data coded with the fixed
        tables }
      send_bits(s, (STATIC_TREES shl 1)+ord(eof), 3);
      compress_block(s, static_ltree, static_dtree);
      Inc(s.compressed_len, 3 + s.static_len);
    end
    else
    begin
      { Dynamic trees: block header, the tree descriptions, then the data }
      send_bits(s, (DYN_TREES shl 1)+ord(eof), 3);
      send_all_trees(s, s.l_desc.max_code+1, s.d_desc.max_code+1,
                     max_blindex+1);
      compress_block(s, s.dyn_ltree, s.dyn_dtree);
      Inc(s.compressed_len, 3 + s.opt_len);
    end;
  {$ifdef DEBUG}
  Assert (s.compressed_len = s.bits_sent, 'bad compressed size');
  {$ENDIF}
  { Reset the frequency counters and totals for the next block }
  init_block(s);

  if (eof) then
  begin
    bi_windup(s);
    Inc(s.compressed_len, 7);  { align on byte boundary }
  end;
  {$ifdef DEBUG}
  Tracev(#13'comprlen %lu(%lu) {s.compressed_len shr 3,'+
         's.compressed_len-7*ord(eof)}');
  {$ENDIF}

  _tr_flush_block := s.compressed_len shr 3;
end;


{ ===========================================================================
  Save the match info and tally the frequency counts. Return true if
  the current block must be flushed.
}
{ _tr_tally
  Records one symbol of the current block and updates the dynamic tree
  frequency counts.

  s    : deflate state; d_buf, l_buf, last_lit, matches and the dynamic
         tree frequencies are updated.
  dist : distance of the matched string, or 0 for an unmatched char.
  lc   : match length - MIN_MATCH, or the unmatched char when dist = 0.

  The result is true when s.last_lit has reached s.lit_bufsize-1 or, when
  TRUNCATE_BLOCK is defined, when the size estimate below decides to stop
  the block early. }
function _tr_tally (var s : deflate_state;
   dist : unsigned;          { distance of matched string }
   lc : unsigned) : boolean; { match length-MIN_MATCH or unmatched char (if dist=0) }
var
{$IFDEF DEBUG}
  limit : ush;      { s.w_size-MIN_LOOKAHEAD, used by the sanity check only }
{$ENDIF}
  slot : ush;       { distance code looked up for the match }
{$ifdef TRUNCATE_BLOCK}
var
  est_out : ulg;    { estimated output size: bits first, then bytes }
  consumed : ulg;   { s.strstart - s.block_start }
  idx : int;        { distance code index for the estimate loop }
{$endif}
begin
  { Store the pair at the current position, then advance the position. }
  s.d_buf^[s.last_lit] := ush(dist);
  s.l_buf^[s.last_lit] := uch(lc);
  Inc(s.last_lit);

  if (dist <> 0) then
  begin
    { A match: lc is the match length - MIN_MATCH. }
    Inc(s.matches);
    Dec(dist);             { dist := match distance - 1 }

    { Distance code lookup: values from 256 upwards use the second part
      of _dist_code, indexed by dist shr 7. }
    if (dist >= 256) then
      slot := _dist_code[256+(dist shr 7)]
    else
      slot := _dist_code[dist];

    {$IFDEF DEBUG}
    { The distance is checked against s.w_size-MIN_LOOKAHEAD rather than
      against the window size itself. }
    limit := ush(s.w_size-MIN_LOOKAHEAD);
    Assert((dist < ush(limit)) and
           (ush(lc) <= ush(MAX_MATCH-MIN_MATCH)) and
           (ush(slot) < ush(D_CODES)), '_tr_tally: bad match');
    {$ENDIF}

    { Length codes are counted in the literal/length tree after the
      LITERALS+1 leading entries. }
    Inc(s.dyn_ltree[_length_code[lc]+LITERALS+1].fc.Freq);
    Inc(s.dyn_dtree[slot].fc.Freq);
  end
  else
  begin
    { No match: lc is the unmatched char itself. }
    Inc(s.dyn_ltree[lc].fc.Freq);
  end;

{$ifdef TRUNCATE_BLOCK}
  { Try to guess if it is profitable to stop the current block here.
    The estimate is only made when the low 13 bits of last_lit are zero
    and the level is above 2. }
  if ((s.last_lit and $1fff) = 0) and (s.level > 2) then
  begin
    { Upper bound for the compressed length: 8 bits per recorded symbol
      plus, per distance code, its frequency times 5 bits and extra bits. }
    est_out := ulg(s.last_lit)*Long(8);
    consumed := ulg(long(s.strstart) - s.block_start);
    for idx := 0 to D_CODES-1 do
      Inc(est_out, ulg(s.dyn_dtree[idx].fc.Freq *
                       (Long(5)+extra_dbits[idx])) );
    est_out := est_out shr 3;     { bits to bytes }
    {$ifdef DEBUG}
    { Only the format string is traced; no values are passed along. }
    Tracev(^M'last_lit %u, in %ld, out ~%ld(%ld%%) ');
    {$ENDIF}
    if (s.matches < s.last_lit div 2) and (est_out < consumed div 2) then
    begin
      _tr_tally := TRUE;
      exit;
    end;
  end;
{$endif}

  { We avoid equality with lit_bufsize because of wraparound at 64K
    on 16 bit machines and because stored blocks are restricted to
    64K-1 bytes. }
  _tr_tally := (s.lit_bufsize-1 = s.last_lit);
end;

end.