deflate.c 80 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
7177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146
  1. /* deflate.c -- compress data using the deflation algorithm
  2. * Copyright (C) 1995-2024 Jean-loup Gailly and Mark Adler
  3. * For conditions of distribution and use, see copyright notice in zlib.h
  4. */
  5. /*
  6. * ALGORITHM
  7. *
  8. * The "deflation" process depends on being able to identify portions
  9. * of the input text which are identical to earlier input (within a
  10. * sliding window trailing behind the input currently being processed).
  11. *
  12. * The most straightforward technique turns out to be the fastest for
  13. * most input files: try all possible matches and select the longest.
  14. * The key feature of this algorithm is that insertions into the string
  15. * dictionary are very simple and thus fast, and deletions are avoided
  16. * completely. Insertions are performed at each input character, whereas
  17. * string matches are performed only when the previous match ends. So it
  18. * is preferable to spend more time in matches to allow very fast string
  19. * insertions and avoid deletions. The matching algorithm for small
  20. * strings is inspired from that of Rabin & Karp. A brute force approach
  21. * is used to find longer strings when a small match has been found.
  22. * A similar algorithm is used in comic (by Jan-Mark Wams) and freeze
  23. * (by Leonid Broukhis).
  24. * A previous version of this file used a more sophisticated algorithm
  25. * (by Fiala and Greene) which is guaranteed to run in linear amortized
  26. * time, but has a larger average cost, uses more memory and is patented.
  27. * However the F&G algorithm may be faster for some highly redundant
  28. * files if the parameter max_chain_length (described below) is too large.
  29. *
  30. * ACKNOWLEDGEMENTS
  31. *
  32. * The idea of lazy evaluation of matches is due to Jan-Mark Wams, and
  33. * I found it in 'freeze' written by Leonid Broukhis.
  34. * Thanks to many people for bug reports and testing.
  35. *
  36. * REFERENCES
  37. *
  38. * Deutsch, L.P.,"DEFLATE Compressed Data Format Specification".
  39. * Available in http://tools.ietf.org/html/rfc1951
  40. *
  41. * A description of the Rabin and Karp algorithm is given in the book
  42. * "Algorithms" by R. Sedgewick, Addison-Wesley, p252.
  43. *
  44. * Fiala,E.R., and Greene,D.H.
  45. * Data Compression with Finite Windows, Comm.ACM, 32,4 (1989) 490-505
  46. *
  47. */
  48. /* @(#) $Id$ */
  49. #include "deflate.h"
  /* Copyright notice stored as a string.
   *
   * If you use the zlib library in a product, an acknowledgment is welcome
   * in the documentation of your product. If for some reason you cannot
   * include such an acknowledgment, I would appreciate that you keep this
   * copyright string in the executable of your product.
   */
  const char deflate_copyright[] =
      " deflate 1.3.1 Copyright 1995-2024 Jean-loup Gailly and Mark Adler ";
  /* State reported by a compression function after each call. */
  typedef enum {
      need_more      = 0, /* block not completed: more input or output needed */
      block_done     = 1, /* a block flush was performed */
      finish_started = 2, /* finish started: only more output is needed at the
                           * next deflate */
      finish_done    = 3  /* finish done: no more input or output accepted */
  } block_state;
  64. typedef block_state (*compress_func)(deflate_state *s, int flush);
  65. /* Compression function. Returns the block state after the call. */
  66. local block_state deflate_stored(deflate_state *s, int flush);
  67. local block_state deflate_fast(deflate_state *s, int flush);
  68. #ifndef FASTEST
  69. local block_state deflate_slow(deflate_state *s, int flush);
  70. #endif
  71. local block_state deflate_rle(deflate_state *s, int flush);
  72. local block_state deflate_huff(deflate_state *s, int flush);
  73. /* ===========================================================================
  74. * Local data
  75. */
  /* Value that marks the tail of a hash chain. */
  #define NIL 0

  /* Matches of length 3 are discarded if their distance exceeds TOO_FAR.
   * The value may be overridden at build time.
   */
  #if !defined(TOO_FAR)
  #  define TOO_FAR 4096
  #endif
  82. /* Values for max_lazy_match, good_match and max_chain_length, depending on
  83. * the desired pack level (0..9). The values given below have been tuned to
  84. * exclude worst case performance for pathological files. Better values may be
  85. * found for specific files.
  86. */
  87. typedef struct config_s {
  88. ush good_length; /* reduce lazy search above this match length */
  89. ush max_lazy; /* do not perform lazy search above this match length */
  90. ush nice_length; /* quit search above this match length */
  91. ush max_chain;
  92. compress_func func;
  93. } config;
  94. #ifdef FASTEST
  95. local const config configuration_table[2] = {
  96. /* good lazy nice chain */
  97. /* 0 */ {0, 0, 0, 0, deflate_stored}, /* store only */
  98. /* 1 */ {4, 4, 8, 4, deflate_fast}}; /* max speed, no lazy matches */
  99. #else
  100. local const config configuration_table[10] = {
  101. /* good lazy nice chain */
  102. /* 0 */ {0, 0, 0, 0, deflate_stored}, /* store only */
  103. /* 1 */ {4, 4, 8, 4, deflate_fast}, /* max speed, no lazy matches */
  104. /* 2 */ {4, 5, 16, 8, deflate_fast},
  105. /* 3 */ {4, 6, 32, 32, deflate_fast},
  106. /* 4 */ {4, 4, 16, 16, deflate_slow}, /* lazy matches */
  107. /* 5 */ {8, 16, 32, 32, deflate_slow},
  108. /* 6 */ {8, 16, 128, 128, deflate_slow},
  109. /* 7 */ {8, 32, 128, 256, deflate_slow},
  110. /* 8 */ {32, 128, 258, 1024, deflate_slow},
  111. /* 9 */ {32, 258, 258, 4096, deflate_slow}}; /* max compression */
  112. #endif
  113. /* Note: the deflate() code requires max_lazy >= MIN_MATCH and max_chain >= 4
  114. * For deflate_fast() (levels <= 3) good is ignored and lazy has a different
  115. * meaning.
  116. */
  /* Map a flush value to a rank so that Z_BLOCK is ranked between Z_NO_FLUSH
   * and Z_PARTIAL_FLUSH: values above 4 yield 2*f - 9, all others 2*f.
   */
  #define RANK(f) ((f) > 4 ? (f) * 2 - 9 : (f) * 2)
  /* ===========================================================================
   * Fold one more input byte c into the running hash value h: h is shifted
   * left by s->hash_shift, combined with c by exclusive-or, and masked with
   * s->hash_mask. The result is stored back into h.
   * IN assertion: all calls to UPDATE_HASH are made with consecutive input
   *    characters, so that a running hash key can be computed from the
   *    previous key instead of complete recalculation each time.
   */
  #define UPDATE_HASH(s,h,c) \
      (h = ((c) ^ ((h) << (s)->hash_shift)) & (s)->hash_mask)
  /* ===========================================================================
   * Insert string str in the dictionary and set match_head to the previous
   * head of the hash chain (the most recent string with same hash key).
   * The running hash s->ins_h is updated first with the byte at
   * str + MIN_MATCH-1; afterwards s->head[s->ins_h] refers to str.
   * If this file is compiled with -DFASTEST, the compression level is forced
   * to 1, and no hash chains are maintained (s->prev is not written).
   * IN assertion: all calls to INSERT_STRING are made with consecutive input
   *    characters and the first MIN_MATCH bytes of str are valid (except for
   *    the last MIN_MATCH-1 bytes of the input file).
   */
  #ifndef FASTEST
  #  define INSERT_STRING(s, str, match_head) \
       (UPDATE_HASH(s, s->ins_h, s->window[(str) + (MIN_MATCH-1)]), \
        match_head = s->head[s->ins_h], \
        s->prev[(str) & s->w_mask] = s->head[s->ins_h], \
        s->head[s->ins_h] = (Pos)(str))
  #else
  #  define INSERT_STRING(s, str, match_head) \
       (UPDATE_HASH(s, s->ins_h, s->window[(str) + (MIN_MATCH-1)]), \
        match_head = s->head[s->ins_h], \
        s->head[s->ins_h] = (Pos)(str))
  #endif
  /* ===========================================================================
   * Reset every entry of the hash table s->head to NIL. The last entry is
   * assigned separately and the remaining hash_size - 1 entries are zeroed
   * in bulk (avoiding 64K overflow for 16 bit systems).
   * prev[] will be initialized on the fly.
   */
  #define CLEAR_HASH(s) \
      do { \
          zmemzero((Bytef *)s->head, \
                   (unsigned)(s->hash_size - 1)*sizeof(*s->head)); \
          s->head[s->hash_size - 1] = NIL; \
      } while (0)
  157. /* ===========================================================================
  158. * Slide the hash table when sliding the window down (could be avoided with 32
  159. * bit values at the expense of memory usage). We slide even when level == 0 to
  160. * keep the hash table consistent if we switch back to level > 0 later.
  161. */
  162. #if defined(__has_feature)
  163. # if __has_feature(memory_sanitizer)
  164. __attribute__((no_sanitize("memory")))
  165. # endif
  166. #endif
  167. local void slide_hash(deflate_state *s) {
  168. unsigned n, m;
  169. Posf *p;
  170. uInt wsize = s->w_size;
  171. n = s->hash_size;
  172. p = &s->head[n];
  173. do {
  174. m = *--p;
  175. *p = (Pos)(m >= wsize ? m - wsize : NIL);
  176. } while (--n);
  177. n = wsize;
  178. #ifndef FASTEST
  179. p = &s->prev[n];
  180. do {
  181. m = *--p;
  182. *p = (Pos)(m >= wsize ? m - wsize : NIL);
  183. /* If n is not on any hash chain, prev[n] is garbage but
  184. * its value will never be used.
  185. */
  186. } while (--n);
  187. #endif
  188. }
  189. /* ===========================================================================
  190. * Read a new buffer from the current input stream, update the adler32
  191. * and total number of bytes read. All deflate() input goes through
  192. * this function so some applications may wish to modify it to avoid
  193. * allocating a large strm->next_in buffer and copying from it.
  194. * (See also flush_pending()).
  195. */
  196. local unsigned read_buf(z_streamp strm, Bytef *buf, unsigned size) {
  197. unsigned len = strm->avail_in;
  198. if (len > size) len = size;
  199. if (len == 0) return 0;
  200. strm->avail_in -= len;
  201. zmemcpy(buf, strm->next_in, len);
  202. if (strm->state->wrap == 1) {
  203. strm->adler = adler32(strm->adler, buf, len);
  204. }
  205. #ifdef GZIP
  206. else if (strm->state->wrap == 2) {
  207. strm->adler = crc32(strm->adler, buf, len);
  208. }
  209. #endif
  210. strm->next_in += len;
  211. strm->total_in += len;
  212. return len;
  213. }
  214. /* ===========================================================================
  215. * Fill the window when the lookahead becomes insufficient.
  216. * Updates strstart and lookahead.
  217. *
  218. * IN assertion: lookahead < MIN_LOOKAHEAD
  219. * OUT assertions: strstart <= window_size-MIN_LOOKAHEAD
  220. * At least one byte has been read, or avail_in == 0; reads are
  221. * performed for at least two bytes (required for the zip translate_eol
  222. * option -- not supported here).
  223. */
  224. local void fill_window(deflate_state *s) {
  225. unsigned n;
  226. unsigned more; /* Amount of free space at the end of the window. */
  227. uInt wsize = s->w_size;
  228. Assert(s->lookahead < MIN_LOOKAHEAD, "already enough lookahead");
  229. do {
  230. more = (unsigned)(s->window_size -(ulg)s->lookahead -(ulg)s->strstart);
  231. /* Deal with !@#$% 64K limit: */
  232. if (sizeof(int) <= 2) {
  233. if (more == 0 && s->strstart == 0 && s->lookahead == 0) {
  234. more = wsize;
  235. } else if (more == (unsigned)(-1)) {
  236. /* Very unlikely, but possible on 16 bit machine if
  237. * strstart == 0 && lookahead == 1 (input done a byte at time)
  238. */
  239. more--;
  240. }
  241. }
  242. /* If the window is almost full and there is insufficient lookahead,
  243. * move the upper half to the lower one to make room in the upper half.
  244. */
  245. if (s->strstart >= wsize + MAX_DIST(s)) {
  246. zmemcpy(s->window, s->window + wsize, (unsigned)wsize - more);
  247. s->match_start -= wsize;
  248. s->strstart -= wsize; /* we now have strstart >= MAX_DIST */
  249. s->block_start -= (long) wsize;
  250. if (s->insert > s->strstart)
  251. s->insert = s->strstart;
  252. slide_hash(s);
  253. more += wsize;
  254. }
  255. if (s->strm->avail_in == 0) break;
  256. /* If there was no sliding:
  257. * strstart <= WSIZE+MAX_DIST-1 && lookahead <= MIN_LOOKAHEAD - 1 &&
  258. * more == window_size - lookahead - strstart
  259. * => more >= window_size - (MIN_LOOKAHEAD-1 + WSIZE + MAX_DIST-1)
  260. * => more >= window_size - 2*WSIZE + 2
  261. * In the BIG_MEM or MMAP case (not yet supported),
  262. * window_size == input_size + MIN_LOOKAHEAD &&
  263. * strstart + s->lookahead <= input_size => more >= MIN_LOOKAHEAD.
  264. * Otherwise, window_size == 2*WSIZE so more >= 2.
  265. * If there was sliding, more >= WSIZE. So in all cases, more >= 2.
  266. */
  267. Assert(more >= 2, "more < 2");
  268. n = read_buf(s->strm, s->window + s->strstart + s->lookahead, more);
  269. s->lookahead += n;
  270. /* Initialize the hash value now that we have some input: */
  271. if (s->lookahead + s->insert >= MIN_MATCH) {
  272. uInt str = s->strstart - s->insert;
  273. s->ins_h = s->window[str];
  274. UPDATE_HASH(s, s->ins_h, s->window[str + 1]);
  275. #if MIN_MATCH != 3
  276. Call UPDATE_HASH() MIN_MATCH-3 more times
  277. #endif
  278. while (s->insert) {
  279. UPDATE_HASH(s, s->ins_h, s->window[str + MIN_MATCH-1]);
  280. #ifndef FASTEST
  281. s->prev[str & s->w_mask] = s->head[s->ins_h];
  282. #endif
  283. s->head[s->ins_h] = (Pos)str;
  284. str++;
  285. s->insert--;
  286. if (s->lookahead + s->insert < MIN_MATCH)
  287. break;
  288. }
  289. }
  290. /* If the whole input has less than MIN_MATCH bytes, ins_h is garbage,
  291. * but this is not important since only literal bytes will be emitted.
  292. */
  293. } while (s->lookahead < MIN_LOOKAHEAD && s->strm->avail_in != 0);
  294. /* If the WIN_INIT bytes after the end of the current data have never been
  295. * written, then zero those bytes in order to avoid memory check reports of
  296. * the use of uninitialized (or uninitialised as Julian writes) bytes by
  297. * the longest match routines. Update the high water mark for the next
  298. * time through here. WIN_INIT is set to MAX_MATCH since the longest match
  299. * routines allow scanning to strstart + MAX_MATCH, ignoring lookahead.
  300. */
  301. if (s->high_water < s->window_size) {
  302. ulg curr = s->strstart + (ulg)(s->lookahead);
  303. ulg init;
  304. if (s->high_water < curr) {
  305. /* Previous high water mark below current data -- zero WIN_INIT
  306. * bytes or up to end of window, whichever is less.
  307. */
  308. init = s->window_size - curr;
  309. if (init > WIN_INIT)
  310. init = WIN_INIT;
  311. zmemzero(s->window + curr, (unsigned)init);
  312. s->high_water = curr + init;
  313. }
  314. else if (s->high_water < (ulg)curr + WIN_INIT) {
  315. /* High water mark at or above current data, but below current data
  316. * plus WIN_INIT -- zero out to current data plus WIN_INIT, or up
  317. * to end of window, whichever is less.
  318. */
  319. init = (ulg)curr + WIN_INIT - s->high_water;
  320. if (init > s->window_size - s->high_water)
  321. init = s->window_size - s->high_water;
  322. zmemzero(s->window + s->high_water, (unsigned)init);
  323. s->high_water += init;
  324. }
  325. }
  326. Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
  327. "not enough room for search");
  328. }
  329. /* ========================================================================= */
  330. int ZEXPORT deflateInit_(z_streamp strm, int level, const char *version,
  331. int stream_size) {
  332. return deflateInit2_(strm, level, Z_DEFLATED, MAX_WBITS, DEF_MEM_LEVEL,
  333. Z_DEFAULT_STRATEGY, version, stream_size);
  334. /* To do: ignore strm->next_in if we use it as window */
  335. }
  336. /* ========================================================================= */
  337. int ZEXPORT deflateInit2_(z_streamp strm, int level, int method,
  338. int windowBits, int memLevel, int strategy,
  339. const char *version, int stream_size) {
  340. deflate_state *s;
  341. int wrap = 1;
  342. static const char my_version[] = ZLIB_VERSION;
  343. if (version == Z_NULL || version[0] != my_version[0] ||
  344. stream_size != sizeof(z_stream)) {
  345. return Z_VERSION_ERROR;
  346. }
  347. if (strm == Z_NULL) return Z_STREAM_ERROR;
  348. strm->msg = Z_NULL;
  349. if (strm->zalloc == (alloc_func)0) {
  350. #ifdef Z_SOLO
  351. return Z_STREAM_ERROR;
  352. #else
  353. strm->zalloc = zcalloc;
  354. strm->opaque = (voidpf)0;
  355. #endif
  356. }
  357. if (strm->zfree == (free_func)0)
  358. #ifdef Z_SOLO
  359. return Z_STREAM_ERROR;
  360. #else
  361. strm->zfree = zcfree;
  362. #endif
  363. #ifdef FASTEST
  364. if (level != 0) level = 1;
  365. #else
  366. if (level == Z_DEFAULT_COMPRESSION) level = 6;
  367. #endif
  368. if (windowBits < 0) { /* suppress zlib wrapper */
  369. wrap = 0;
  370. if (windowBits < -15)
  371. return Z_STREAM_ERROR;
  372. windowBits = -windowBits;
  373. }
  374. #ifdef GZIP
  375. else if (windowBits > 15) {
  376. wrap = 2; /* write gzip wrapper instead */
  377. windowBits -= 16;
  378. }
  379. #endif
  380. if (memLevel < 1 || memLevel > MAX_MEM_LEVEL || method != Z_DEFLATED ||
  381. windowBits < 8 || windowBits > 15 || level < 0 || level > 9 ||
  382. strategy < 0 || strategy > Z_FIXED || (windowBits == 8 && wrap != 1)) {
  383. return Z_STREAM_ERROR;
  384. }
  385. if (windowBits == 8) windowBits = 9; /* until 256-byte window bug fixed */
  386. s = (deflate_state *) ZALLOC(strm, 1, sizeof(deflate_state));
  387. if (s == Z_NULL) return Z_MEM_ERROR;
  388. strm->state = (struct internal_state FAR *)s;
  389. s->strm = strm;
  390. s->status = INIT_STATE; /* to pass state test in deflateReset() */
  391. s->wrap = wrap;
  392. s->gzhead = Z_NULL;
  393. s->w_bits = (uInt)windowBits;
  394. s->w_size = 1 << s->w_bits;
  395. s->w_mask = s->w_size - 1;
  396. s->hash_bits = (uInt)memLevel + 7;
  397. s->hash_size = 1 << s->hash_bits;
  398. s->hash_mask = s->hash_size - 1;
  399. s->hash_shift = ((s->hash_bits + MIN_MATCH-1) / MIN_MATCH);
  400. s->window = (Bytef *) ZALLOC(strm, s->w_size, 2*sizeof(Byte));
  401. /* The following memset eliminates the valgrind uninitialized warning
  402. "swept under the carpet" here:
  403. http://www.zlib.net/zlib_faq.html#faq36 */
  404. memset(s->window, 0, s->w_size*2*sizeof(Byte));
  405. s->prev = (Posf *) ZALLOC(strm, s->w_size, sizeof(Pos));
  406. s->head = (Posf *) ZALLOC(strm, s->hash_size, sizeof(Pos));
  407. s->high_water = 0; /* nothing written to s->window yet */
  408. s->lit_bufsize = 1 << (memLevel + 6); /* 16K elements by default */
  409. /* We overlay pending_buf and sym_buf. This works since the average size
  410. * for length/distance pairs over any compressed block is assured to be 31
  411. * bits or less.
  412. *
  413. * Analysis: The longest fixed codes are a length code of 8 bits plus 5
  414. * extra bits, for lengths 131 to 257. The longest fixed distance codes are
  415. * 5 bits plus 13 extra bits, for distances 16385 to 32768. The longest
  416. * possible fixed-codes length/distance pair is then 31 bits total.
  417. *
  418. * sym_buf starts one-fourth of the way into pending_buf. So there are
  419. * three bytes in sym_buf for every four bytes in pending_buf. Each symbol
  420. * in sym_buf is three bytes -- two for the distance and one for the
  421. * literal/length. As each symbol is consumed, the pointer to the next
  422. * sym_buf value to read moves forward three bytes. From that symbol, up to
  423. * 31 bits are written to pending_buf. The closest the written pending_buf
  424. * bits gets to the next sym_buf symbol to read is just before the last
  425. * code is written. At that time, 31*(n - 2) bits have been written, just
  426. * after 24*(n - 2) bits have been consumed from sym_buf. sym_buf starts at
  427. * 8*n bits into pending_buf. (Note that the symbol buffer fills when n - 1
  428. * symbols are written.) The closest the writing gets to what is unread is
  429. * then n + 14 bits. Here n is lit_bufsize, which is 16384 by default, and
  430. * can range from 128 to 32768.
  431. *
  432. * Therefore, at a minimum, there are 142 bits of space between what is
  433. * written and what is read in the overlain buffers, so the symbols cannot
  434. * be overwritten by the compressed data. That space is actually 139 bits,
  435. * due to the three-bit fixed-code block header.
  436. *
  437. * That covers the case where either Z_FIXED is specified, forcing fixed
  438. * codes, or when the use of fixed codes is chosen, because that choice
  439. * results in a smaller compressed block than dynamic codes. That latter
  440. * condition then assures that the above analysis also covers all dynamic
  441. * blocks. A dynamic-code block will only be chosen to be emitted if it has
  442. * fewer bits than a fixed-code block would for the same set of symbols.
  443. * Therefore its average symbol length is assured to be less than 31. So
  444. * the compressed data for a dynamic block also cannot overwrite the
  445. * symbols from which it is being constructed.
  446. */
  447. s->pending_buf = (uchf *) ZALLOC(strm, s->lit_bufsize, LIT_BUFS);
  448. s->pending_buf_size = (ulg)s->lit_bufsize * 4;
  449. if (s->window == Z_NULL || s->prev == Z_NULL || s->head == Z_NULL ||
  450. s->pending_buf == Z_NULL) {
  451. s->status = FINISH_STATE;
  452. strm->msg = ERR_MSG(Z_MEM_ERROR);
  453. deflateEnd (strm);
  454. return Z_MEM_ERROR;
  455. }
  456. #ifdef LIT_MEM
  457. s->d_buf = (ushf *)(s->pending_buf + (s->lit_bufsize << 1));
  458. s->l_buf = s->pending_buf + (s->lit_bufsize << 2);
  459. s->sym_end = s->lit_bufsize - 1;
  460. #else
  461. s->sym_buf = s->pending_buf + s->lit_bufsize;
  462. s->sym_end = (s->lit_bufsize - 1) * 3;
  463. #endif
  464. /* We avoid equality with lit_bufsize*3 because of wraparound at 64K
  465. * on 16 bit machines and because stored blocks are restricted to
  466. * 64K-1 bytes.
  467. */
  468. s->level = level;
  469. s->strategy = strategy;
  470. s->method = (Byte)method;
  471. return deflateReset(strm);
  472. }
  473. /* =========================================================================
  474. * Check for a valid deflate stream state. Return 0 if ok, 1 if not.
  475. */
  476. local int deflateStateCheck(z_streamp strm) {
  477. deflate_state *s;
  478. if (strm == Z_NULL ||
  479. strm->zalloc == (alloc_func)0 || strm->zfree == (free_func)0)
  480. return 1;
  481. s = strm->state;
  482. if (s == Z_NULL || s->strm != strm || (s->status != INIT_STATE &&
  483. #ifdef GZIP
  484. s->status != GZIP_STATE &&
  485. #endif
  486. s->status != EXTRA_STATE &&
  487. s->status != NAME_STATE &&
  488. s->status != COMMENT_STATE &&
  489. s->status != HCRC_STATE &&
  490. s->status != BUSY_STATE &&
  491. s->status != FINISH_STATE))
  492. return 1;
  493. return 0;
  494. }
  495. /* ========================================================================= */
  496. int ZEXPORT deflateSetDictionary(z_streamp strm, const Bytef *dictionary,
  497. uInt dictLength) {
  498. deflate_state *s;
  499. uInt str, n;
  500. int wrap;
  501. unsigned avail;
  502. z_const unsigned char *next;
  503. if (deflateStateCheck(strm) || dictionary == Z_NULL)
  504. return Z_STREAM_ERROR;
  505. s = strm->state;
  506. wrap = s->wrap;
  507. if (wrap == 2 || (wrap == 1 && s->status != INIT_STATE) || s->lookahead)
  508. return Z_STREAM_ERROR;
  509. /* when using zlib wrappers, compute Adler-32 for provided dictionary */
  510. if (wrap == 1)
  511. strm->adler = adler32(strm->adler, dictionary, dictLength);
  512. s->wrap = 0; /* avoid computing Adler-32 in read_buf */
  513. /* if dictionary would fill window, just replace the history */
  514. if (dictLength >= s->w_size) {
  515. if (wrap == 0) { /* already empty otherwise */
  516. CLEAR_HASH(s);
  517. s->strstart = 0;
  518. s->block_start = 0L;
  519. s->insert = 0;
  520. }
  521. dictionary += dictLength - s->w_size; /* use the tail */
  522. dictLength = s->w_size;
  523. }
  524. /* insert dictionary into window and hash */
  525. avail = strm->avail_in;
  526. next = strm->next_in;
  527. strm->avail_in = dictLength;
  528. strm->next_in = (z_const Bytef *)dictionary;
  529. fill_window(s);
  530. while (s->lookahead >= MIN_MATCH) {
  531. str = s->strstart;
  532. n = s->lookahead - (MIN_MATCH-1);
  533. do {
  534. UPDATE_HASH(s, s->ins_h, s->window[str + MIN_MATCH-1]);
  535. #ifndef FASTEST
  536. s->prev[str & s->w_mask] = s->head[s->ins_h];
  537. #endif
  538. s->head[s->ins_h] = (Pos)str;
  539. str++;
  540. } while (--n);
  541. s->strstart = str;
  542. s->lookahead = MIN_MATCH-1;
  543. fill_window(s);
  544. }
  545. s->strstart += s->lookahead;
  546. s->block_start = (long)s->strstart;
  547. s->insert = s->lookahead;
  548. s->lookahead = 0;
  549. s->match_length = s->prev_length = MIN_MATCH-1;
  550. s->match_available = 0;
  551. strm->next_in = next;
  552. strm->avail_in = avail;
  553. s->wrap = wrap;
  554. return Z_OK;
  555. }
  556. /* ========================================================================= */
  557. int ZEXPORT deflateGetDictionary(z_streamp strm, Bytef *dictionary,
  558. uInt *dictLength) {
  559. deflate_state *s;
  560. uInt len;
  561. if (deflateStateCheck(strm))
  562. return Z_STREAM_ERROR;
  563. s = strm->state;
  564. len = s->strstart + s->lookahead;
  565. if (len > s->w_size)
  566. len = s->w_size;
  567. if (dictionary != Z_NULL && len)
  568. zmemcpy(dictionary, s->window + s->strstart + s->lookahead - len, len);
  569. if (dictLength != Z_NULL)
  570. *dictLength = len;
  571. return Z_OK;
  572. }
  573. /* ========================================================================= */
  574. int ZEXPORT deflateResetKeep(z_streamp strm) {
  575. deflate_state *s;
  576. if (deflateStateCheck(strm)) {
  577. return Z_STREAM_ERROR;
  578. }
  579. strm->total_in = strm->total_out = 0;
  580. strm->msg = Z_NULL; /* use zfree if we ever allocate msg dynamically */
  581. strm->data_type = Z_UNKNOWN;
  582. s = (deflate_state *)strm->state;
  583. s->pending = 0;
  584. s->pending_out = s->pending_buf;
  585. if (s->wrap < 0) {
  586. s->wrap = -s->wrap; /* was made negative by deflate(..., Z_FINISH); */
  587. }
  588. s->status =
  589. #ifdef GZIP
  590. s->wrap == 2 ? GZIP_STATE :
  591. #endif
  592. INIT_STATE;
  593. strm->adler =
  594. #ifdef GZIP
  595. s->wrap == 2 ? crc32(0L, Z_NULL, 0) :
  596. #endif
  597. adler32(0L, Z_NULL, 0);
  598. s->last_flush = -2;
  599. _tr_init(s);
  600. return Z_OK;
  601. }
  602. /* ===========================================================================
  603. * Initialize the "longest match" routines for a new zlib stream
  604. */
  605. local void lm_init(deflate_state *s) {
  606. s->window_size = (ulg)2L*s->w_size;
  607. CLEAR_HASH(s);
  608. /* Set the default configuration parameters:
  609. */
  610. s->max_lazy_match = configuration_table[s->level].max_lazy;
  611. s->good_match = configuration_table[s->level].good_length;
  612. s->nice_match = configuration_table[s->level].nice_length;
  613. s->max_chain_length = configuration_table[s->level].max_chain;
  614. s->strstart = 0;
  615. s->block_start = 0L;
  616. s->lookahead = 0;
  617. s->insert = 0;
  618. s->match_length = s->prev_length = MIN_MATCH-1;
  619. s->match_available = 0;
  620. s->ins_h = 0;
  621. }
  622. /* ========================================================================= */
  623. int ZEXPORT deflateReset(z_streamp strm) {
  624. int ret;
  625. ret = deflateResetKeep(strm);
  626. if (ret == Z_OK)
  627. lm_init(strm->state);
  628. return ret;
  629. }
  630. /* ========================================================================= */
  631. int ZEXPORT deflateSetHeader(z_streamp strm, gz_headerp head) {
  632. if (deflateStateCheck(strm) || strm->state->wrap != 2)
  633. return Z_STREAM_ERROR;
  634. strm->state->gzhead = head;
  635. return Z_OK;
  636. }
  637. /* ========================================================================= */
  638. int ZEXPORT deflatePending(z_streamp strm, unsigned *pending, int *bits) {
  639. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  640. if (pending != Z_NULL)
  641. *pending = strm->state->pending;
  642. if (bits != Z_NULL)
  643. *bits = strm->state->bi_valid;
  644. return Z_OK;
  645. }
  646. /* ========================================================================= */
  647. int ZEXPORT deflatePrime(z_streamp strm, int bits, int value) {
  648. deflate_state *s;
  649. int put;
  650. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  651. s = strm->state;
  652. #ifdef LIT_MEM
  653. if (bits < 0 || bits > 16 ||
  654. (uchf *)s->d_buf < s->pending_out + ((Buf_size + 7) >> 3))
  655. return Z_BUF_ERROR;
  656. #else
  657. if (bits < 0 || bits > 16 ||
  658. s->sym_buf < s->pending_out + ((Buf_size + 7) >> 3))
  659. return Z_BUF_ERROR;
  660. #endif
  661. do {
  662. put = Buf_size - s->bi_valid;
  663. if (put > bits)
  664. put = bits;
  665. s->bi_buf |= (ush)((value & ((1 << put) - 1)) << s->bi_valid);
  666. s->bi_valid += put;
  667. _tr_flush_bits(s);
  668. value >>= put;
  669. bits -= put;
  670. } while (bits);
  671. return Z_OK;
  672. }
  673. /* ========================================================================= */
  674. int ZEXPORT deflateParams(z_streamp strm, int level, int strategy) {
  675. deflate_state *s;
  676. compress_func func;
  677. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  678. s = strm->state;
  679. #ifdef FASTEST
  680. if (level != 0) level = 1;
  681. #else
  682. if (level == Z_DEFAULT_COMPRESSION) level = 6;
  683. #endif
  684. if (level < 0 || level > 9 || strategy < 0 || strategy > Z_FIXED) {
  685. return Z_STREAM_ERROR;
  686. }
  687. func = configuration_table[s->level].func;
  688. if ((strategy != s->strategy || func != configuration_table[level].func) &&
  689. s->last_flush != -2) {
  690. /* Flush the last buffer: */
  691. int err = deflate(strm, Z_BLOCK);
  692. if (err == Z_STREAM_ERROR)
  693. return err;
  694. if (strm->avail_in || (s->strstart - s->block_start) + s->lookahead)
  695. return Z_BUF_ERROR;
  696. }
  697. if (s->level != level) {
  698. if (s->level == 0 && s->matches != 0) {
  699. if (s->matches == 1)
  700. slide_hash(s);
  701. else
  702. CLEAR_HASH(s);
  703. s->matches = 0;
  704. }
  705. s->level = level;
  706. s->max_lazy_match = configuration_table[level].max_lazy;
  707. s->good_match = configuration_table[level].good_length;
  708. s->nice_match = configuration_table[level].nice_length;
  709. s->max_chain_length = configuration_table[level].max_chain;
  710. }
  711. s->strategy = strategy;
  712. return Z_OK;
  713. }
  714. /* ========================================================================= */
  715. int ZEXPORT deflateTune(z_streamp strm, int good_length, int max_lazy,
  716. int nice_length, int max_chain) {
  717. deflate_state *s;
  718. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  719. s = strm->state;
  720. s->good_match = (uInt)good_length;
  721. s->max_lazy_match = (uInt)max_lazy;
  722. s->nice_match = nice_length;
  723. s->max_chain_length = (uInt)max_chain;
  724. return Z_OK;
  725. }
  726. /* =========================================================================
  727. * For the default windowBits of 15 and memLevel of 8, this function returns a
  728. * close to exact, as well as small, upper bound on the compressed size. This
  729. * is an expansion of ~0.03%, plus a small constant.
  730. *
  731. * For any setting other than those defaults for windowBits and memLevel, one
  732. * of two worst case bounds is returned. This is at most an expansion of ~4% or
  733. * ~13%, plus a small constant.
  734. *
  735. * Both the 0.03% and 4% derive from the overhead of stored blocks. The first
  736. * one is for stored blocks of 16383 bytes (memLevel == 8), whereas the second
  737. * is for stored blocks of 127 bytes (the worst case memLevel == 1). The
  738. * expansion results from five bytes of header for each stored block.
  739. *
  740. * The larger expansion of 13% results from a window size less than or equal to
  741. * the symbols buffer size (windowBits <= memLevel + 7). In that case some of
  742. * the data being compressed may have slid out of the sliding window, impeding
  743. * a stored block from being emitted. Then the only choice is a fixed or
  744. * dynamic block, where a fixed block limits the maximum expansion to 9 bits
  745. * per 8-bit byte, plus 10 bits for every block. The smallest block size for
  746. * which this can occur is 255 (memLevel == 2).
  747. *
  748. * Shifts are used to approximate divisions, for speed.
  749. */
  750. uLong ZEXPORT deflateBound(z_streamp strm, uLong sourceLen) {
  751. deflate_state *s;
  752. uLong fixedlen, storelen, wraplen;
  753. /* upper bound for fixed blocks with 9-bit literals and length 255
  754. (memLevel == 2, which is the lowest that may not use stored blocks) --
  755. ~13% overhead plus a small constant */
  756. fixedlen = sourceLen + (sourceLen >> 3) + (sourceLen >> 8) +
  757. (sourceLen >> 9) + 4;
  758. /* upper bound for stored blocks with length 127 (memLevel == 1) --
  759. ~4% overhead plus a small constant */
  760. storelen = sourceLen + (sourceLen >> 5) + (sourceLen >> 7) +
  761. (sourceLen >> 11) + 7;
  762. /* if can't get parameters, return larger bound plus a zlib wrapper */
  763. if (deflateStateCheck(strm))
  764. return (fixedlen > storelen ? fixedlen : storelen) + 6;
  765. /* compute wrapper length */
  766. s = strm->state;
  767. switch (s->wrap) {
  768. case 0: /* raw deflate */
  769. wraplen = 0;
  770. break;
  771. case 1: /* zlib wrapper */
  772. wraplen = 6 + (s->strstart ? 4 : 0);
  773. break;
  774. #ifdef GZIP
  775. case 2: /* gzip wrapper */
  776. wraplen = 18;
  777. if (s->gzhead != Z_NULL) { /* user-supplied gzip header */
  778. Bytef *str;
  779. if (s->gzhead->extra != Z_NULL)
  780. wraplen += 2 + s->gzhead->extra_len;
  781. str = s->gzhead->name;
  782. if (str != Z_NULL)
  783. do {
  784. wraplen++;
  785. } while (*str++);
  786. str = s->gzhead->comment;
  787. if (str != Z_NULL)
  788. do {
  789. wraplen++;
  790. } while (*str++);
  791. if (s->gzhead->hcrc)
  792. wraplen += 2;
  793. }
  794. break;
  795. #endif
  796. default: /* for compiler happiness */
  797. wraplen = 6;
  798. }
  799. /* if not default parameters, return one of the conservative bounds */
  800. if (s->w_bits != 15 || s->hash_bits != 8 + 7)
  801. return (s->w_bits <= s->hash_bits && s->level ? fixedlen : storelen) +
  802. wraplen;
  803. /* default settings: return tight bound for that case -- ~0.03% overhead
  804. plus a small constant */
  805. return sourceLen + (sourceLen >> 12) + (sourceLen >> 14) +
  806. (sourceLen >> 25) + 13 - 6 + wraplen;
  807. }
  808. /* =========================================================================
  809. * Put a short in the pending buffer. The 16-bit value is put in MSB order.
  810. * IN assertion: the stream state is correct and there is enough room in
  811. * pending_buf.
  812. */
  813. local void putShortMSB(deflate_state *s, uInt b) {
  814. put_byte(s, (Byte)(b >> 8));
  815. put_byte(s, (Byte)(b & 0xff));
  816. }
  817. /* =========================================================================
  818. * Flush as much pending output as possible. All deflate() output, except for
  819. * some deflate_stored() output, goes through this function so some
  820. * applications may wish to modify it to avoid allocating a large
  821. * strm->next_out buffer and copying into it. (See also read_buf()).
  822. */
  823. local void flush_pending(z_streamp strm) {
  824. unsigned len;
  825. deflate_state *s = strm->state;
  826. _tr_flush_bits(s);
  827. len = s->pending;
  828. if (len > strm->avail_out) len = strm->avail_out;
  829. if (len == 0) return;
  830. zmemcpy(strm->next_out, s->pending_out, len);
  831. strm->next_out += len;
  832. s->pending_out += len;
  833. strm->total_out += len;
  834. strm->avail_out -= len;
  835. s->pending -= len;
  836. if (s->pending == 0) {
  837. s->pending_out = s->pending_buf;
  838. }
  839. }
  840. /* ===========================================================================
  841. * Update the header CRC with the bytes s->pending_buf[beg..s->pending - 1].
  842. */
  843. #define HCRC_UPDATE(beg) \
  844. do { \
  845. if (s->gzhead->hcrc && s->pending > (beg)) \
  846. strm->adler = crc32(strm->adler, s->pending_buf + (beg), \
  847. s->pending - (beg)); \
  848. } while (0)
  849. /* ========================================================================= */
/*
 * Main compression entry point: consume input from strm->next_in, produce
 * output at strm->next_out, and honor the requested flush mode.
 *
 * The function proceeds in stages:
 *   1. validate the stream, the flush value and the buffers;
 *   2. drain output left pending by a previous call;
 *   3. emit the zlib or gzip header, driven by s->status (the gzip header is
 *      written piecewise through EXTRA/NAME/COMMENT/HCRC states so that it
 *      can be resumed when the output buffer fills up);
 *   4. run the block compressor selected by level and strategy;
 *   5. for Z_FINISH, write the trailer exactly once.
 *
 * Returns Z_STREAM_ERROR for an invalid stream state, flush value or buffer
 * pointers (or a non-finish call after finishing), Z_BUF_ERROR when no
 * progress is possible, Z_STREAM_END when flush is Z_FINISH and nothing is
 * left pending, and Z_OK otherwise.
 */
int ZEXPORT deflate(z_streamp strm, int flush) {
    int old_flush; /* value of flush param for previous deflate call */
    deflate_state *s;

    if (deflateStateCheck(strm) || flush > Z_BLOCK || flush < 0) {
        return Z_STREAM_ERROR;
    }
    s = strm->state;

    /* Reject a missing output buffer, input bytes without an input pointer,
     * and any non-finish call once the stream has been finished.
     */
    if (strm->next_out == Z_NULL ||
        (strm->avail_in != 0 && strm->next_in == Z_NULL) ||
        (s->status == FINISH_STATE && flush != Z_FINISH)) {
        ERR_RETURN(strm, Z_STREAM_ERROR);
    }
    if (strm->avail_out == 0) ERR_RETURN(strm, Z_BUF_ERROR);

    old_flush = s->last_flush;
    s->last_flush = flush;

    /* Flush as much pending output as possible */
    if (s->pending != 0) {
        flush_pending(strm);
        if (strm->avail_out == 0) {
            /* Since avail_out is 0, deflate will be called again with
             * more output space, but possibly with both pending and
             * avail_in equal to zero. There won't be anything to do,
             * but this is not an error situation so make sure we
             * return OK instead of BUF_ERROR at next call of deflate:
             */
            s->last_flush = -1;
            return Z_OK;
        }

    /* Make sure there is something to do and avoid duplicate consecutive
     * flushes. For repeated and useless calls with Z_FINISH, we keep
     * returning Z_STREAM_END instead of Z_BUF_ERROR.
     */
    } else if (strm->avail_in == 0 && RANK(flush) <= RANK(old_flush) &&
               flush != Z_FINISH) {
        ERR_RETURN(strm, Z_BUF_ERROR);
    }

    /* User must not provide more input after the first FINISH: */
    if (s->status == FINISH_STATE && strm->avail_in != 0) {
        ERR_RETURN(strm, Z_BUF_ERROR);
    }

    /* Write the header */
    /* A raw stream (wrap == 0) has no header: go straight to BUSY_STATE. */
    if (s->status == INIT_STATE && s->wrap == 0)
        s->status = BUSY_STATE;
    if (s->status == INIT_STATE) {
        /* zlib header */
        uInt header = (Z_DEFLATED + ((s->w_bits - 8) << 4)) << 8;
        uInt level_flags;

        /* two-bit hint derived from the strategy and level in use */
        if (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2)
            level_flags = 0;
        else if (s->level < 6)
            level_flags = 1;
        else if (s->level == 6)
            level_flags = 2;
        else
            level_flags = 3;
        header |= (level_flags << 6);
        if (s->strstart != 0) header |= PRESET_DICT;
        /* round the 16-bit header up to a multiple of 31 */
        header += 31 - (header % 31);

        putShortMSB(s, header);

        /* Save the adler32 of the preset dictionary: */
        if (s->strstart != 0) {
            putShortMSB(s, (uInt)(strm->adler >> 16));
            putShortMSB(s, (uInt)(strm->adler & 0xffff));
        }
        strm->adler = adler32(0L, Z_NULL, 0);
        s->status = BUSY_STATE;

        /* Compression must start with an empty pending buffer */
        flush_pending(strm);
        if (s->pending != 0) {
            s->last_flush = -1;
            return Z_OK;
        }
    }
#ifdef GZIP
    if (s->status == GZIP_STATE) {
        /* gzip header */
        strm->adler = crc32(0L, Z_NULL, 0);
        /* fixed leading bytes: 31, 139, then 8 */
        put_byte(s, 31);
        put_byte(s, 139);
        put_byte(s, 8);
        if (s->gzhead == Z_NULL) {
            /* no user header: five zero bytes, a level/strategy hint byte
             * and the OS code
             */
            put_byte(s, 0);
            put_byte(s, 0);
            put_byte(s, 0);
            put_byte(s, 0);
            put_byte(s, 0);
            put_byte(s, s->level == 9 ? 2 :
                     (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2 ?
                      4 : 0));
            put_byte(s, OS_CODE);
            s->status = BUSY_STATE;

            /* Compression must start with an empty pending buffer */
            flush_pending(strm);
            if (s->pending != 0) {
                s->last_flush = -1;
                return Z_OK;
            }
        }
        else {
            /* flag byte built from which optional parts the user supplied */
            put_byte(s, (s->gzhead->text ? 1 : 0) +
                     (s->gzhead->hcrc ? 2 : 0) +
                     (s->gzhead->extra == Z_NULL ? 0 : 4) +
                     (s->gzhead->name == Z_NULL ? 0 : 8) +
                     (s->gzhead->comment == Z_NULL ? 0 : 16)
                     );
            /* time, least significant byte first */
            put_byte(s, (Byte)(s->gzhead->time & 0xff));
            put_byte(s, (Byte)((s->gzhead->time >> 8) & 0xff));
            put_byte(s, (Byte)((s->gzhead->time >> 16) & 0xff));
            put_byte(s, (Byte)((s->gzhead->time >> 24) & 0xff));
            put_byte(s, s->level == 9 ? 2 :
                     (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2 ?
                      4 : 0));
            put_byte(s, s->gzhead->os & 0xff);
            if (s->gzhead->extra != Z_NULL) {
                /* 16-bit extra field length, least significant byte first */
                put_byte(s, s->gzhead->extra_len & 0xff);
                put_byte(s, (s->gzhead->extra_len >> 8) & 0xff);
            }
            if (s->gzhead->hcrc)
                strm->adler = crc32(strm->adler, s->pending_buf,
                                    s->pending);
            /* gzindex tracks progress through the variable-length fields */
            s->gzindex = 0;
            s->status = EXTRA_STATE;
        }
    }
    if (s->status == EXTRA_STATE) {
        if (s->gzhead->extra != Z_NULL) {
            ulg beg = s->pending;   /* start of bytes to update crc */
            uInt left = (s->gzhead->extra_len & 0xffff) - s->gzindex;
            /* Copy the extra field in pending-buffer-sized pieces; return to
             * the caller (remaining in EXTRA_STATE) whenever a piece cannot
             * be fully flushed.
             */
            while (s->pending + left > s->pending_buf_size) {
                uInt copy = s->pending_buf_size - s->pending;
                zmemcpy(s->pending_buf + s->pending,
                        s->gzhead->extra + s->gzindex, copy);
                s->pending = s->pending_buf_size;
                HCRC_UPDATE(beg);
                s->gzindex += copy;
                flush_pending(strm);
                if (s->pending != 0) {
                    s->last_flush = -1;
                    return Z_OK;
                }
                beg = 0;
                left -= copy;
            }
            zmemcpy(s->pending_buf + s->pending,
                    s->gzhead->extra + s->gzindex, left);
            s->pending += left;
            HCRC_UPDATE(beg);
            s->gzindex = 0;
        }
        s->status = NAME_STATE;
    }
    if (s->status == NAME_STATE) {
        if (s->gzhead->name != Z_NULL) {
            ulg beg = s->pending;   /* start of bytes to update crc */
            int val;
            /* copy the name up to and including its terminating zero,
             * flushing whenever the pending buffer is full
             */
            do {
                if (s->pending == s->pending_buf_size) {
                    HCRC_UPDATE(beg);
                    flush_pending(strm);
                    if (s->pending != 0) {
                        s->last_flush = -1;
                        return Z_OK;
                    }
                    beg = 0;
                }
                val = s->gzhead->name[s->gzindex++];
                put_byte(s, val);
            } while (val != 0);
            HCRC_UPDATE(beg);
            s->gzindex = 0;
        }
        s->status = COMMENT_STATE;
    }
    if (s->status == COMMENT_STATE) {
        if (s->gzhead->comment != Z_NULL) {
            ulg beg = s->pending;   /* start of bytes to update crc */
            int val;
            /* same scheme as for the name above */
            do {
                if (s->pending == s->pending_buf_size) {
                    HCRC_UPDATE(beg);
                    flush_pending(strm);
                    if (s->pending != 0) {
                        s->last_flush = -1;
                        return Z_OK;
                    }
                    beg = 0;
                }
                val = s->gzhead->comment[s->gzindex++];
                put_byte(s, val);
            } while (val != 0);
            HCRC_UPDATE(beg);
        }
        s->status = HCRC_STATE;
    }
    if (s->status == HCRC_STATE) {
        if (s->gzhead->hcrc) {
            /* make sure the two CRC bytes fit in the pending buffer */
            if (s->pending + 2 > s->pending_buf_size) {
                flush_pending(strm);
                if (s->pending != 0) {
                    s->last_flush = -1;
                    return Z_OK;
                }
            }
            /* low 16 bits of the header CRC, least significant byte first */
            put_byte(s, (Byte)(strm->adler & 0xff));
            put_byte(s, (Byte)((strm->adler >> 8) & 0xff));
            /* restart the CRC for the data that follows */
            strm->adler = crc32(0L, Z_NULL, 0);
        }
        s->status = BUSY_STATE;

        /* Compression must start with an empty pending buffer */
        flush_pending(strm);
        if (s->pending != 0) {
            s->last_flush = -1;
            return Z_OK;
        }
    }
#endif

    /* Start a new block or continue the current one.
     */
    if (strm->avail_in != 0 || s->lookahead != 0 ||
        (flush != Z_NO_FLUSH && s->status != FINISH_STATE)) {
        block_state bstate;

        /* level 0 stores; otherwise the strategy, then the level's table
         * entry, picks the compressor
         */
        bstate = s->level == 0 ? deflate_stored(s, flush) :
                 s->strategy == Z_HUFFMAN_ONLY ? deflate_huff(s, flush) :
                 s->strategy == Z_RLE ? deflate_rle(s, flush) :
                 (*(configuration_table[s->level].func))(s, flush);

        if (bstate == finish_started || bstate == finish_done) {
            s->status = FINISH_STATE;
        }
        if (bstate == need_more || bstate == finish_started) {
            if (strm->avail_out == 0) {
                s->last_flush = -1; /* avoid BUF_ERROR next call, see above */
            }
            return Z_OK;
            /* If flush != Z_NO_FLUSH && avail_out == 0, the next call
             * of deflate should use the same flush parameter to make sure
             * that the flush is complete. So we don't have to output an
             * empty block here, this will be done at next call. This also
             * ensures that for a very small output buffer, we emit at most
             * one empty block.
             */
        }
        if (bstate == block_done) {
            if (flush == Z_PARTIAL_FLUSH) {
                _tr_align(s);
            } else if (flush != Z_BLOCK) { /* FULL_FLUSH or SYNC_FLUSH */
                _tr_stored_block(s, (char*)0, 0L, 0);
                /* For a full flush, this empty block will be recognized
                 * as a special marker by inflate_sync().
                 */
                if (flush == Z_FULL_FLUSH) {
                    CLEAR_HASH(s);             /* forget history */
                    if (s->lookahead == 0) {
                        s->strstart = 0;
                        s->block_start = 0L;
                        s->insert = 0;
                    }
                }
            }
            flush_pending(strm);
            if (strm->avail_out == 0) {
              s->last_flush = -1; /* avoid BUF_ERROR at next call, see above */
              return Z_OK;
            }
        }
    }

    if (flush != Z_FINISH) return Z_OK;
    /* wrap == 0: raw stream, no trailer; wrap < 0: trailer already written */
    if (s->wrap <= 0) return Z_STREAM_END;

    /* Write the trailer */
#ifdef GZIP
    if (s->wrap == 2) {
        /* gzip: check value then total_in, each as four bytes, least
         * significant byte first
         */
        put_byte(s, (Byte)(strm->adler & 0xff));
        put_byte(s, (Byte)((strm->adler >> 8) & 0xff));
        put_byte(s, (Byte)((strm->adler >> 16) & 0xff));
        put_byte(s, (Byte)((strm->adler >> 24) & 0xff));
        put_byte(s, (Byte)(strm->total_in & 0xff));
        put_byte(s, (Byte)((strm->total_in >> 8) & 0xff));
        put_byte(s, (Byte)((strm->total_in >> 16) & 0xff));
        put_byte(s, (Byte)((strm->total_in >> 24) & 0xff));
    }
    else
#endif
    {
        /* zlib: 32-bit check value, most significant byte first */
        putShortMSB(s, (uInt)(strm->adler >> 16));
        putShortMSB(s, (uInt)(strm->adler & 0xffff));
    }
    flush_pending(strm);
    /* If avail_out is zero, the application will call deflate again
     * to flush the rest.
     */
    if (s->wrap > 0) s->wrap = -s->wrap; /* write the trailer only once! */
    return s->pending != 0 ? Z_OK : Z_STREAM_END;
}
  1142. /* ========================================================================= */
  1143. int ZEXPORT deflateEnd(z_streamp strm) {
  1144. int status;
  1145. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  1146. status = strm->state->status;
  1147. /* Deallocate in reverse order of allocations: */
  1148. TRY_FREE(strm, strm->state->pending_buf);
  1149. TRY_FREE(strm, strm->state->head);
  1150. TRY_FREE(strm, strm->state->prev);
  1151. TRY_FREE(strm, strm->state->window);
  1152. ZFREE(strm, strm->state);
  1153. strm->state = Z_NULL;
  1154. return status == BUSY_STATE ? Z_DATA_ERROR : Z_OK;
  1155. }
  1156. /* =========================================================================
  1157. * Copy the source state to the destination state.
  1158. * To simplify the source, this is not supported for 16-bit MSDOS (which
  1159. * doesn't have enough memory anyway to duplicate compression states).
  1160. */
  1161. int ZEXPORT deflateCopy(z_streamp dest, z_streamp source) {
  1162. #ifdef MAXSEG_64K
  1163. (void)dest;
  1164. (void)source;
  1165. return Z_STREAM_ERROR;
  1166. #else
  1167. deflate_state *ds;
  1168. deflate_state *ss;
  1169. if (deflateStateCheck(source) || dest == Z_NULL) {
  1170. return Z_STREAM_ERROR;
  1171. }
  1172. ss = source->state;
  1173. zmemcpy((voidpf)dest, (voidpf)source, sizeof(z_stream));
  1174. ds = (deflate_state *) ZALLOC(dest, 1, sizeof(deflate_state));
  1175. if (ds == Z_NULL) return Z_MEM_ERROR;
  1176. dest->state = (struct internal_state FAR *) ds;
  1177. zmemcpy((voidpf)ds, (voidpf)ss, sizeof(deflate_state));
  1178. ds->strm = dest;
  1179. ds->window = (Bytef *) ZALLOC(dest, ds->w_size, 2*sizeof(Byte));
  1180. ds->prev = (Posf *) ZALLOC(dest, ds->w_size, sizeof(Pos));
  1181. ds->head = (Posf *) ZALLOC(dest, ds->hash_size, sizeof(Pos));
  1182. ds->pending_buf = (uchf *) ZALLOC(dest, ds->lit_bufsize, LIT_BUFS);
  1183. if (ds->window == Z_NULL || ds->prev == Z_NULL || ds->head == Z_NULL ||
  1184. ds->pending_buf == Z_NULL) {
  1185. deflateEnd (dest);
  1186. return Z_MEM_ERROR;
  1187. }
  1188. /* following zmemcpy do not work for 16-bit MSDOS */
  1189. zmemcpy(ds->window, ss->window, ds->w_size * 2 * sizeof(Byte));
  1190. zmemcpy((voidpf)ds->prev, (voidpf)ss->prev, ds->w_size * sizeof(Pos));
  1191. zmemcpy((voidpf)ds->head, (voidpf)ss->head, ds->hash_size * sizeof(Pos));
  1192. zmemcpy(ds->pending_buf, ss->pending_buf, ds->lit_bufsize * LIT_BUFS);
  1193. ds->pending_out = ds->pending_buf + (ss->pending_out - ss->pending_buf);
  1194. #ifdef LIT_MEM
  1195. ds->d_buf = (ushf *)(ds->pending_buf + (ds->lit_bufsize << 1));
  1196. ds->l_buf = ds->pending_buf + (ds->lit_bufsize << 2);
  1197. #else
  1198. ds->sym_buf = ds->pending_buf + ds->lit_bufsize;
  1199. #endif
  1200. ds->l_desc.dyn_tree = ds->dyn_ltree;
  1201. ds->d_desc.dyn_tree = ds->dyn_dtree;
  1202. ds->bl_desc.dyn_tree = ds->bl_tree;
  1203. return Z_OK;
  1204. #endif /* MAXSEG_64K */
  1205. }
  1206. #ifndef FASTEST
/* ===========================================================================
 * Set match_start to the longest match starting at the given string and
 * return its length. Matches shorter or equal to prev_length are discarded,
 * in which case the result is equal to prev_length and match_start is
 * garbage.
 *
 * The hash chain starting at cur_match is followed through s->prev until a
 * candidate at or below the distance limit is reached, max_chain_length
 * candidates have been examined (a quarter of that when prev_length is
 * already >= good_match), or a match of at least nice_match bytes is found.
 * The returned length is capped at s->lookahead.
 *
 * IN assertions: cur_match is the head of the hash chain for the current
 *   string (strstart) and its distance is <= MAX_DIST, and prev_length >= 1
 * OUT assertion: the match length is not greater than s->lookahead.
 */
local uInt longest_match(deflate_state *s, IPos cur_match) {
    unsigned chain_length = s->max_chain_length;/* max hash chain length */
    register Bytef *scan = s->window + s->strstart; /* current string */
    register Bytef *match;                      /* matched string */
    register int len;                           /* length of current match */
    int best_len = (int)s->prev_length;         /* best match length so far */
    int nice_match = s->nice_match;             /* stop if match long enough */
    IPos limit = s->strstart > (IPos)MAX_DIST(s) ?
        s->strstart - (IPos)MAX_DIST(s) : NIL;
    /* Stop when cur_match becomes <= limit. To simplify the code,
     * we prevent matches with the string of window index 0.
     */
    Posf *prev = s->prev;
    uInt wmask = s->w_mask;

#ifdef UNALIGNED_OK
    /* Compare two bytes at a time. Note: this is not always beneficial.
     * Try with and without -DUNALIGNED_OK to check.
     */
    register Bytef *strend = s->window + s->strstart + MAX_MATCH - 1;
    register ush scan_start = *(ushf*)scan;
    register ush scan_end   = *(ushf*)(scan + best_len - 1);
#else
    register Bytef *strend = s->window + s->strstart + MAX_MATCH;
    /* the two bytes a candidate must reproduce to beat best_len */
    register Byte scan_end1  = scan[best_len - 1];
    register Byte scan_end   = scan[best_len];
#endif

    /* The code is optimized for HASH_BITS >= 8 and MAX_MATCH-2 multiple of 16.
     * It is easy to get rid of this optimization if necessary.
     */
    Assert(s->hash_bits >= 8 && MAX_MATCH == 258, "Code too clever");

    /* Do not waste too much time if we already have a good match: */
    if (s->prev_length >= s->good_match) {
        chain_length >>= 2;
    }
    /* Do not look for matches beyond the end of the input. This is necessary
     * to make deflate deterministic.
     */
    if ((uInt)nice_match > s->lookahead) nice_match = (int)s->lookahead;

    Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
           "need lookahead");

    do {
        Assert(cur_match < s->strstart, "no future");
        match = s->window + cur_match;

        /* Skip to next match if the match length cannot increase
         * or if the match length is less than 2.  Note that the checks below
         * for insufficient lookahead only occur occasionally for performance
         * reasons.  Therefore uninitialized memory will be accessed, and
         * conditional jumps will be made that depend on those values.
         * However the length of the match is limited to the lookahead, so
         * the output of deflate is not affected by the uninitialized values.
         */
#if (defined(UNALIGNED_OK) && MAX_MATCH == 258)
        /* This code assumes sizeof(unsigned short) == 2. Do not use
         * UNALIGNED_OK if your compiler uses a different size.
         */
        if (*(ushf*)(match + best_len - 1) != scan_end ||
            *(ushf*)match != scan_start) continue;

        /* It is not necessary to compare scan[2] and match[2] since they are
         * always equal when the other bytes match, given that the hash keys
         * are equal and that HASH_BITS >= 8. Compare 2 bytes at a time at
         * strstart + 3, + 5, up to strstart + 257. We check for insufficient
         * lookahead only every 4th comparison; the 128th check will be made
         * at strstart + 257. If MAX_MATCH-2 is not a multiple of 8, it is
         * necessary to put more guard bytes at the end of the window, or
         * to check more often for insufficient lookahead.
         */
        Assert(scan[2] == match[2], "scan[2]?");
        scan++, match++;
        do {
        } while (*(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
                 *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
                 *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
                 *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
                 scan < strend);
        /* The funny "do {}" generates better code on most compilers */

        /* Here, scan <= window + strstart + 257 */
        Assert(scan <= s->window + (unsigned)(s->window_size - 1),
               "wild scan");
        /* the last 16-bit compare may have failed on its second byte only */
        if (*scan == *match) scan++;

        len = (MAX_MATCH - 1) - (int)(strend - scan);
        /* rewind scan to the start of the current string */
        scan = strend - (MAX_MATCH-1);

#else /* UNALIGNED_OK */

        if (match[best_len]   != scan_end  ||
            match[best_len - 1] != scan_end1 ||
            *match            != *scan     ||
            *++match          != scan[1])      continue;

        /* The check at best_len - 1 can be removed because it will be made
         * again later. (This heuristic is not always a win.)
         * It is not necessary to compare scan[2] and match[2] since they
         * are always equal when the other bytes match, given that
         * the hash keys are equal and that HASH_BITS >= 8.
         */
        scan += 2, match++;
        Assert(*scan == *match, "match[2]?");

        /* We check for insufficient lookahead only every 8th comparison;
         * the 256th check will be made at strstart + 258.
         */
        do {
        } while (*++scan == *++match && *++scan == *++match &&
                 *++scan == *++match && *++scan == *++match &&
                 *++scan == *++match && *++scan == *++match &&
                 *++scan == *++match && *++scan == *++match &&
                 scan < strend);

        Assert(scan <= s->window + (unsigned)(s->window_size - 1),
               "wild scan");

        len = MAX_MATCH - (int)(strend - scan);
        /* rewind scan to the start of the current string */
        scan = strend - MAX_MATCH;

#endif /* UNALIGNED_OK */

        if (len > best_len) {
            /* new best candidate: record it and refresh the quick-reject
             * bytes unless it is already long enough to stop searching
             */
            s->match_start = cur_match;
            best_len = len;
            if (len >= nice_match) break;
#ifdef UNALIGNED_OK
            scan_end = *(ushf*)(scan + best_len - 1);
#else
            scan_end1  = scan[best_len - 1];
            scan_end   = scan[best_len];
#endif
        }
    } while ((cur_match = prev[cur_match & wmask]) > limit
             && --chain_length != 0);

    /* never report more than the available lookahead */
    if ((uInt)best_len <= s->lookahead) return (uInt)best_len;
    return s->lookahead;
}
  1340. #else /* FASTEST */
/* ---------------------------------------------------------------------------
 * Optimized version for FASTEST only.
 *
 * Only the single candidate at cur_match is examined; no hash chain is
 * followed. Returns MIN_MATCH-1 when the candidate matches fewer than
 * MIN_MATCH bytes; otherwise sets s->match_start to cur_match and returns
 * the match length, capped at s->lookahead.
 */
local uInt longest_match(deflate_state *s, IPos cur_match) {
    register Bytef *scan = s->window + s->strstart; /* current string */
    register Bytef *match;                       /* matched string */
    register int len;                           /* length of current match */
    register Bytef *strend = s->window + s->strstart + MAX_MATCH;

    /* The code is optimized for HASH_BITS >= 8 and MAX_MATCH-2 multiple of 16.
     * It is easy to get rid of this optimization if necessary.
     */
    Assert(s->hash_bits >= 8 && MAX_MATCH == 258, "Code too clever");

    Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
           "need lookahead");

    Assert(cur_match < s->strstart, "no future");

    match = s->window + cur_match;

    /* Return failure if the match length is less than 2:
     */
    if (match[0] != scan[0] || match[1] != scan[1]) return MIN_MATCH-1;

    /* It is not necessary to compare scan[2] and match[2] since they
     * are always equal when the other bytes match, given that
     * the hash keys are equal and that HASH_BITS >= 8.
     * (Unlike the general version, there is no best_len to pre-check here.)
     */
    scan += 2, match += 2;
    Assert(*scan == *match, "match[2]?");

    /* We check for insufficient lookahead only every 8th comparison;
     * the 256th check will be made at strstart + 258.
     */
    do {
    } while (*++scan == *++match && *++scan == *++match &&
             *++scan == *++match && *++scan == *++match &&
             *++scan == *++match && *++scan == *++match &&
             *++scan == *++match && *++scan == *++match &&
             scan < strend);

    Assert(scan <= s->window + (unsigned)(s->window_size - 1), "wild scan");

    /* scan stopped at the first mismatch or at strend */
    len = MAX_MATCH - (int)(strend - scan);

    if (len < MIN_MATCH) return MIN_MATCH - 1;

    s->match_start = cur_match;
    /* never report more than the available lookahead */
    return (uInt)len <= s->lookahead ? (uInt)len : s->lookahead;
}
  1383. #endif /* FASTEST */
  #ifdef ZLIB_DEBUG

  #define EQUAL 0
  /* result of memcmp for equal strings */

  /* ===========================================================================
   * Debug-build check that the `length` bytes at window position `match` equal
   * the bytes at window position `start`. On a mismatch the offending byte
   * pairs are dumped to stderr and z_error() is called. When z_verbose > 1 the
   * accepted match is also traced to stderr.
   */
  local void check_match(deflate_state *s, IPos start, IPos match, int length) {
      Bytef *earlier = s->window + (int)match;
      Bytef *current = s->window + start;
      IPos remaining = length;

      if (match == (IPos)-1) {
          /* match starts one byte before the current window -- just compare
             the subsequent length-1 bytes */
          earlier += 1;
          current += 1;
          remaining -= 1;
      }

      if (zmemcmp(earlier, current, remaining) != EQUAL) {
          fprintf(stderr, " start %u, match %d, length %d\n",
                  start, (int)match, length);
          do {
              fprintf(stderr, "(%02x %02x)", *earlier++, *current++);
          } while (--remaining != 0);
          z_error("invalid match");
      }

      if (z_verbose > 1) {
          fprintf(stderr,"\\[%d,%d]", start - match, length);
          /* Echo the matched bytes; always runs at least once. */
          for (;;) {
              putc(s->window[start++], stderr);
              if (--length == 0) {
                  break;
              }
          }
      }
  }
  #else
  #  define check_match(s, start, match, length)
  #endif /* ZLIB_DEBUG */
  /* ===========================================================================
   * Flush the current block, with given end-of-file flag.
   * IN assertion: strstart is set to the end of the current match.
   *
   * s    - deflate_state pointer expression; expanded several times, so it
   *        must be free of side effects. It is parenthesized at every use so
   *        that any pointer-valued expression is accepted.
   * last - passed through unchanged as the final argument of _tr_flush_block().
   *
   * A null buffer pointer is handed to _tr_flush_block() when block_start is
   * negative. Afterwards block_start is reset to strstart and pending output
   * is flushed.
   */
  #define FLUSH_BLOCK_ONLY(s, last) { \
     _tr_flush_block((s), ((s)->block_start >= 0L ? \
                     (charf *)&(s)->window[(unsigned)(s)->block_start] : \
                     (charf *)Z_NULL), \
                  (ulg)((long)(s)->strstart - (s)->block_start), \
                  (last)); \
     (s)->block_start = (s)->strstart; \
     flush_pending((s)->strm); \
     Tracev((stderr,"[FLUSH]")); \
  }
  /* Same but force premature exit if necessary: once the block is flushed, if
   * no output space remains (avail_out == 0) the ENCLOSING FUNCTION returns
   * finish_started when `last` is non-zero, or need_more otherwise.
   * `s` is expanded more than once and is parenthesized where dereferenced.
   */
  #define FLUSH_BLOCK(s, last) { \
     FLUSH_BLOCK_ONLY(s, last); \
     if ((s)->strm->avail_out == 0) return (last) ? finish_started : need_more; \
  }
  /* Maximum stored block length in deflate format (not including header). */
  #define MAX_STORED 65535

  /* Minimum of a and b. Each argument may be evaluated twice, so do not pass
   * expressions with side effects.
   */
  #define MIN(a, b) ((a) < (b) ? (a) : (b))
  1440. /* ===========================================================================
  1441. * Copy without compression as much as possible from the input stream, return
  1442. * the current block state.
  1443. *
  1444. * In case deflateParams() is used to later switch to a non-zero compression
  1445. * level, s->matches (otherwise unused when storing) keeps track of the number
  1446. * of hash table slides to perform. If s->matches is 1, then one hash table
  1447. * slide will be done when switching. If s->matches is 2, the maximum value
  1448. * allowed here, then the hash table will be cleared, since two or more slides
  1449. * is the same as a clear.
  1450. *
  1451. * deflate_stored() is written to minimize the number of times an input byte is
  1452. * copied. It is most efficient with large input and output buffers, which
  1453. * maximizes the opportunities to have a single copy from next_in to next_out.
  1454. */
  1455. local block_state deflate_stored(deflate_state *s, int flush) {
  1456. /* Smallest worthy block size when not flushing or finishing. By default
  1457. * this is 32K. This can be as small as 507 bytes for memLevel == 1. For
  1458. * large input and output buffers, the stored block size will be larger.
  1459. */
  1460. unsigned min_block = MIN(s->pending_buf_size - 5, s->w_size);
  1461. /* Copy as many min_block or larger stored blocks directly to next_out as
  1462. * possible. If flushing, copy the remaining available input to next_out as
  1463. * stored blocks, if there is enough space.
  1464. */
  1465. unsigned len, left, have, last = 0;
  1466. unsigned used = s->strm->avail_in;
  1467. do {
  1468. /* Set len to the maximum size block that we can copy directly with the
  1469. * available input data and output space. Set left to how much of that
  1470. * would be copied from what's left in the window.
  1471. */
  1472. len = MAX_STORED; /* maximum deflate stored block length */
  1473. have = (s->bi_valid + 42) >> 3; /* number of header bytes */
  1474. if (s->strm->avail_out < have) /* need room for header */
  1475. break;
  1476. /* maximum stored block length that will fit in avail_out: */
  1477. have = s->strm->avail_out - have;
  1478. left = s->strstart - s->block_start; /* bytes left in window */
  1479. if (len > (ulg)left + s->strm->avail_in)
  1480. len = left + s->strm->avail_in; /* limit len to the input */
  1481. if (len > have)
  1482. len = have; /* limit len to the output */
  1483. /* If the stored block would be less than min_block in length, or if
  1484. * unable to copy all of the available input when flushing, then try
  1485. * copying to the window and the pending buffer instead. Also don't
  1486. * write an empty block when flushing -- deflate() does that.
  1487. */
  1488. if (len < min_block && ((len == 0 && flush != Z_FINISH) ||
  1489. flush == Z_NO_FLUSH ||
  1490. len != left + s->strm->avail_in))
  1491. break;
  1492. /* Make a dummy stored block in pending to get the header bytes,
  1493. * including any pending bits. This also updates the debugging counts.
  1494. */
  1495. last = flush == Z_FINISH && len == left + s->strm->avail_in ? 1 : 0;
  1496. _tr_stored_block(s, (char *)0, 0L, last);
  1497. /* Replace the lengths in the dummy stored block with len. */
  1498. s->pending_buf[s->pending - 4] = len;
  1499. s->pending_buf[s->pending - 3] = len >> 8;
  1500. s->pending_buf[s->pending - 2] = ~len;
  1501. s->pending_buf[s->pending - 1] = ~len >> 8;
  1502. /* Write the stored block header bytes. */
  1503. flush_pending(s->strm);
  1504. #ifdef ZLIB_DEBUG
  1505. /* Update debugging counts for the data about to be copied. */
  1506. s->compressed_len += len << 3;
  1507. s->bits_sent += len << 3;
  1508. #endif
  1509. /* Copy uncompressed bytes from the window to next_out. */
  1510. if (left) {
  1511. if (left > len)
  1512. left = len;
  1513. zmemcpy(s->strm->next_out, s->window + s->block_start, left);
  1514. s->strm->next_out += left;
  1515. s->strm->avail_out -= left;
  1516. s->strm->total_out += left;
  1517. s->block_start += left;
  1518. len -= left;
  1519. }
  1520. /* Copy uncompressed bytes directly from next_in to next_out, updating
  1521. * the check value.
  1522. */
  1523. if (len) {
  1524. read_buf(s->strm, s->strm->next_out, len);
  1525. s->strm->next_out += len;
  1526. s->strm->avail_out -= len;
  1527. s->strm->total_out += len;
  1528. }
  1529. } while (last == 0);
  1530. /* Update the sliding window with the last s->w_size bytes of the copied
  1531. * data, or append all of the copied data to the existing window if less
  1532. * than s->w_size bytes were copied. Also update the number of bytes to
  1533. * insert in the hash tables, in the event that deflateParams() switches to
  1534. * a non-zero compression level.
  1535. */
  1536. used -= s->strm->avail_in; /* number of input bytes directly copied */
  1537. if (used) {
  1538. /* If any input was used, then no unused input remains in the window,
  1539. * therefore s->block_start == s->strstart.
  1540. */
  1541. if (used >= s->w_size) { /* supplant the previous history */
  1542. s->matches = 2; /* clear hash */
  1543. zmemcpy(s->window, s->strm->next_in - s->w_size, s->w_size);
  1544. s->strstart = s->w_size;
  1545. s->insert = s->strstart;
  1546. }
  1547. else {
  1548. if (s->window_size - s->strstart <= used) {
  1549. /* Slide the window down. */
  1550. s->strstart -= s->w_size;
  1551. zmemcpy(s->window, s->window + s->w_size, s->strstart);
  1552. if (s->matches < 2)
  1553. s->matches++; /* add a pending slide_hash() */
  1554. if (s->insert > s->strstart)
  1555. s->insert = s->strstart;
  1556. }
  1557. zmemcpy(s->window + s->strstart, s->strm->next_in - used, used);
  1558. s->strstart += used;
  1559. s->insert += MIN(used, s->w_size - s->insert);
  1560. }
  1561. s->block_start = s->strstart;
  1562. }
  1563. if (s->high_water < s->strstart)
  1564. s->high_water = s->strstart;
  1565. /* If the last block was written to next_out, then done. */
  1566. if (last)
  1567. return finish_done;
  1568. /* If flushing and all input has been consumed, then done. */
  1569. if (flush != Z_NO_FLUSH && flush != Z_FINISH &&
  1570. s->strm->avail_in == 0 && (long)s->strstart == s->block_start)
  1571. return block_done;
  1572. /* Fill the window with any remaining input. */
  1573. have = s->window_size - s->strstart;
  1574. if (s->strm->avail_in > have && s->block_start >= (long)s->w_size) {
  1575. /* Slide the window down. */
  1576. s->block_start -= s->w_size;
  1577. s->strstart -= s->w_size;
  1578. zmemcpy(s->window, s->window + s->w_size, s->strstart);
  1579. if (s->matches < 2)
  1580. s->matches++; /* add a pending slide_hash() */
  1581. have += s->w_size; /* more space now */
  1582. if (s->insert > s->strstart)
  1583. s->insert = s->strstart;
  1584. }
  1585. if (have > s->strm->avail_in)
  1586. have = s->strm->avail_in;
  1587. if (have) {
  1588. read_buf(s->strm, s->window + s->strstart, have);
  1589. s->strstart += have;
  1590. s->insert += MIN(have, s->w_size - s->insert);
  1591. }
  1592. if (s->high_water < s->strstart)
  1593. s->high_water = s->strstart;
  1594. /* There was not enough avail_out to write a complete worthy or flushed
  1595. * stored block to next_out. Write a stored block to pending instead, if we
  1596. * have enough input for a worthy block, or if flushing and there is enough
  1597. * room for the remaining input as a stored block in the pending buffer.
  1598. */
  1599. have = (s->bi_valid + 42) >> 3; /* number of header bytes */
  1600. /* maximum stored block length that will fit in pending: */
  1601. have = MIN(s->pending_buf_size - have, MAX_STORED);
  1602. min_block = MIN(have, s->w_size);
  1603. left = s->strstart - s->block_start;
  1604. if (left >= min_block ||
  1605. ((left || flush == Z_FINISH) && flush != Z_NO_FLUSH &&
  1606. s->strm->avail_in == 0 && left <= have)) {
  1607. len = MIN(left, have);
  1608. last = flush == Z_FINISH && s->strm->avail_in == 0 &&
  1609. len == left ? 1 : 0;
  1610. _tr_stored_block(s, (charf *)s->window + s->block_start, len, last);
  1611. s->block_start += len;
  1612. flush_pending(s->strm);
  1613. }
  1614. /* We've done all we can with the available input and output. */
  1615. return last ? finish_started : need_more;
  1616. }
  1617. /* ===========================================================================
  1618. * Compress as much as possible from the input stream, return the current
  1619. * block state.
  1620. * This function does not perform lazy evaluation of matches and inserts
  1621. * new strings in the dictionary only for unmatched strings or for short
  1622. * matches. It is used only for the fast compression options.
  1623. */
  1624. local block_state deflate_fast(deflate_state *s, int flush) {
  1625. IPos hash_head; /* head of the hash chain */
  1626. int bflush; /* set if current block must be flushed */
  1627. for (;;) {
  1628. /* Make sure that we always have enough lookahead, except
  1629. * at the end of the input file. We need MAX_MATCH bytes
  1630. * for the next match, plus MIN_MATCH bytes to insert the
  1631. * string following the next match.
  1632. */
  1633. if (s->lookahead < MIN_LOOKAHEAD) {
  1634. fill_window(s);
  1635. if (s->lookahead < MIN_LOOKAHEAD && flush == Z_NO_FLUSH) {
  1636. return need_more;
  1637. }
  1638. if (s->lookahead == 0) break; /* flush the current block */
  1639. }
  1640. /* Insert the string window[strstart .. strstart + 2] in the
  1641. * dictionary, and set hash_head to the head of the hash chain:
  1642. */
  1643. hash_head = NIL;
  1644. if (s->lookahead >= MIN_MATCH) {
  1645. INSERT_STRING(s, s->strstart, hash_head);
  1646. }
  1647. /* Find the longest match, discarding those <= prev_length.
  1648. * At this point we have always match_length < MIN_MATCH
  1649. */
  1650. if (hash_head != NIL && s->strstart - hash_head <= MAX_DIST(s)) {
  1651. /* To simplify the code, we prevent matches with the string
  1652. * of window index 0 (in particular we have to avoid a match
  1653. * of the string with itself at the start of the input file).
  1654. */
  1655. s->match_length = longest_match (s, hash_head);
  1656. /* longest_match() sets match_start */
  1657. }
  1658. if (s->match_length >= MIN_MATCH) {
  1659. check_match(s, s->strstart, s->match_start, s->match_length);
  1660. _tr_tally_dist(s, s->strstart - s->match_start,
  1661. s->match_length - MIN_MATCH, bflush);
  1662. s->lookahead -= s->match_length;
  1663. /* Insert new strings in the hash table only if the match length
  1664. * is not too large. This saves time but degrades compression.
  1665. */
  1666. #ifndef FASTEST
  1667. if (s->match_length <= s->max_insert_length &&
  1668. s->lookahead >= MIN_MATCH) {
  1669. s->match_length--; /* string at strstart already in table */
  1670. do {
  1671. s->strstart++;
  1672. INSERT_STRING(s, s->strstart, hash_head);
  1673. /* strstart never exceeds WSIZE-MAX_MATCH, so there are
  1674. * always MIN_MATCH bytes ahead.
  1675. */
  1676. } while (--s->match_length != 0);
  1677. s->strstart++;
  1678. } else
  1679. #endif
  1680. {
  1681. s->strstart += s->match_length;
  1682. s->match_length = 0;
  1683. s->ins_h = s->window[s->strstart];
  1684. UPDATE_HASH(s, s->ins_h, s->window[s->strstart + 1]);
  1685. #if MIN_MATCH != 3
  1686. Call UPDATE_HASH() MIN_MATCH-3 more times
  1687. #endif
  1688. /* If lookahead < MIN_MATCH, ins_h is garbage, but it does not
  1689. * matter since it will be recomputed at next deflate call.
  1690. */
  1691. }
  1692. } else {
  1693. /* No match, output a literal byte */
  1694. Tracevv((stderr,"%c", s->window[s->strstart]));
  1695. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1696. s->lookahead--;
  1697. s->strstart++;
  1698. }
  1699. if (bflush) FLUSH_BLOCK(s, 0);
  1700. }
  1701. s->insert = s->strstart < MIN_MATCH-1 ? s->strstart : MIN_MATCH-1;
  1702. if (flush == Z_FINISH) {
  1703. FLUSH_BLOCK(s, 1);
  1704. return finish_done;
  1705. }
  1706. if (s->sym_next)
  1707. FLUSH_BLOCK(s, 0);
  1708. return block_done;
  1709. }
  1710. #ifndef FASTEST
  1711. /* ===========================================================================
  1712. * Same as above, but achieves better compression. We use a lazy
  1713. * evaluation for matches: a match is finally adopted only if there is
  1714. * no better match at the next window position.
  1715. */
  1716. local block_state deflate_slow(deflate_state *s, int flush) {
  1717. IPos hash_head; /* head of hash chain */
  1718. int bflush; /* set if current block must be flushed */
  1719. /* Process the input block. */
  1720. for (;;) {
  1721. /* Make sure that we always have enough lookahead, except
  1722. * at the end of the input file. We need MAX_MATCH bytes
  1723. * for the next match, plus MIN_MATCH bytes to insert the
  1724. * string following the next match.
  1725. */
  1726. if (s->lookahead < MIN_LOOKAHEAD) {
  1727. fill_window(s);
  1728. if (s->lookahead < MIN_LOOKAHEAD && flush == Z_NO_FLUSH) {
  1729. return need_more;
  1730. }
  1731. if (s->lookahead == 0) break; /* flush the current block */
  1732. }
  1733. /* Insert the string window[strstart .. strstart + 2] in the
  1734. * dictionary, and set hash_head to the head of the hash chain:
  1735. */
  1736. hash_head = NIL;
  1737. if (s->lookahead >= MIN_MATCH) {
  1738. INSERT_STRING(s, s->strstart, hash_head);
  1739. }
  1740. /* Find the longest match, discarding those <= prev_length.
  1741. */
  1742. s->prev_length = s->match_length, s->prev_match = s->match_start;
  1743. s->match_length = MIN_MATCH-1;
  1744. if (hash_head != NIL && s->prev_length < s->max_lazy_match &&
  1745. s->strstart - hash_head <= MAX_DIST(s)) {
  1746. /* To simplify the code, we prevent matches with the string
  1747. * of window index 0 (in particular we have to avoid a match
  1748. * of the string with itself at the start of the input file).
  1749. */
  1750. s->match_length = longest_match (s, hash_head);
  1751. /* longest_match() sets match_start */
  1752. if (s->match_length <= 5 && (s->strategy == Z_FILTERED
  1753. #if TOO_FAR <= 32767
  1754. || (s->match_length == MIN_MATCH &&
  1755. s->strstart - s->match_start > TOO_FAR)
  1756. #endif
  1757. )) {
  1758. /* If prev_match is also MIN_MATCH, match_start is garbage
  1759. * but we will ignore the current match anyway.
  1760. */
  1761. s->match_length = MIN_MATCH-1;
  1762. }
  1763. }
  1764. /* If there was a match at the previous step and the current
  1765. * match is not better, output the previous match:
  1766. */
  1767. if (s->prev_length >= MIN_MATCH && s->match_length <= s->prev_length) {
  1768. uInt max_insert = s->strstart + s->lookahead - MIN_MATCH;
  1769. /* Do not insert strings in hash table beyond this. */
  1770. check_match(s, s->strstart - 1, s->prev_match, s->prev_length);
  1771. _tr_tally_dist(s, s->strstart - 1 - s->prev_match,
  1772. s->prev_length - MIN_MATCH, bflush);
  1773. /* Insert in hash table all strings up to the end of the match.
  1774. * strstart - 1 and strstart are already inserted. If there is not
  1775. * enough lookahead, the last two strings are not inserted in
  1776. * the hash table.
  1777. */
  1778. s->lookahead -= s->prev_length - 1;
  1779. s->prev_length -= 2;
  1780. do {
  1781. if (++s->strstart <= max_insert) {
  1782. INSERT_STRING(s, s->strstart, hash_head);
  1783. }
  1784. } while (--s->prev_length != 0);
  1785. s->match_available = 0;
  1786. s->match_length = MIN_MATCH-1;
  1787. s->strstart++;
  1788. if (bflush) FLUSH_BLOCK(s, 0);
  1789. } else if (s->match_available) {
  1790. /* If there was no match at the previous position, output a
  1791. * single literal. If there was a match but the current match
  1792. * is longer, truncate the previous match to a single literal.
  1793. */
  1794. Tracevv((stderr,"%c", s->window[s->strstart - 1]));
  1795. _tr_tally_lit(s, s->window[s->strstart - 1], bflush);
  1796. if (bflush) {
  1797. FLUSH_BLOCK_ONLY(s, 0);
  1798. }
  1799. s->strstart++;
  1800. s->lookahead--;
  1801. if (s->strm->avail_out == 0) return need_more;
  1802. } else {
  1803. /* There is no previous match to compare with, wait for
  1804. * the next step to decide.
  1805. */
  1806. s->match_available = 1;
  1807. s->strstart++;
  1808. s->lookahead--;
  1809. }
  1810. }
  1811. Assert (flush != Z_NO_FLUSH, "no flush?");
  1812. if (s->match_available) {
  1813. Tracevv((stderr,"%c", s->window[s->strstart - 1]));
  1814. _tr_tally_lit(s, s->window[s->strstart - 1], bflush);
  1815. s->match_available = 0;
  1816. }
  1817. s->insert = s->strstart < MIN_MATCH-1 ? s->strstart : MIN_MATCH-1;
  1818. if (flush == Z_FINISH) {
  1819. FLUSH_BLOCK(s, 1);
  1820. return finish_done;
  1821. }
  1822. if (s->sym_next)
  1823. FLUSH_BLOCK(s, 0);
  1824. return block_done;
  1825. }
  1826. #endif /* FASTEST */
  1827. /* ===========================================================================
  1828. * For Z_RLE, simply look for runs of bytes, generate matches only of distance
  1829. * one. Do not maintain a hash table. (It will be regenerated if this run of
  1830. * deflate switches away from Z_RLE.)
  1831. */
  1832. local block_state deflate_rle(deflate_state *s, int flush) {
  1833. int bflush; /* set if current block must be flushed */
  1834. uInt prev; /* byte at distance one to match */
  1835. Bytef *scan, *strend; /* scan goes up to strend for length of run */
  1836. for (;;) {
  1837. /* Make sure that we always have enough lookahead, except
  1838. * at the end of the input file. We need MAX_MATCH bytes
  1839. * for the longest run, plus one for the unrolled loop.
  1840. */
  1841. if (s->lookahead <= MAX_MATCH) {
  1842. fill_window(s);
  1843. if (s->lookahead <= MAX_MATCH && flush == Z_NO_FLUSH) {
  1844. return need_more;
  1845. }
  1846. if (s->lookahead == 0) break; /* flush the current block */
  1847. }
  1848. /* See how many times the previous byte repeats */
  1849. s->match_length = 0;
  1850. if (s->lookahead >= MIN_MATCH && s->strstart > 0) {
  1851. scan = s->window + s->strstart - 1;
  1852. prev = *scan;
  1853. if (prev == *++scan && prev == *++scan && prev == *++scan) {
  1854. strend = s->window + s->strstart + MAX_MATCH;
  1855. do {
  1856. } while (prev == *++scan && prev == *++scan &&
  1857. prev == *++scan && prev == *++scan &&
  1858. prev == *++scan && prev == *++scan &&
  1859. prev == *++scan && prev == *++scan &&
  1860. scan < strend);
  1861. s->match_length = MAX_MATCH - (uInt)(strend - scan);
  1862. if (s->match_length > s->lookahead)
  1863. s->match_length = s->lookahead;
  1864. }
  1865. Assert(scan <= s->window + (uInt)(s->window_size - 1),
  1866. "wild scan");
  1867. }
  1868. /* Emit match if have run of MIN_MATCH or longer, else emit literal */
  1869. if (s->match_length >= MIN_MATCH) {
  1870. check_match(s, s->strstart, s->strstart - 1, s->match_length);
  1871. _tr_tally_dist(s, 1, s->match_length - MIN_MATCH, bflush);
  1872. s->lookahead -= s->match_length;
  1873. s->strstart += s->match_length;
  1874. s->match_length = 0;
  1875. } else {
  1876. /* No match, output a literal byte */
  1877. Tracevv((stderr,"%c", s->window[s->strstart]));
  1878. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1879. s->lookahead--;
  1880. s->strstart++;
  1881. }
  1882. if (bflush) FLUSH_BLOCK(s, 0);
  1883. }
  1884. s->insert = 0;
  1885. if (flush == Z_FINISH) {
  1886. FLUSH_BLOCK(s, 1);
  1887. return finish_done;
  1888. }
  1889. if (s->sym_next)
  1890. FLUSH_BLOCK(s, 0);
  1891. return block_done;
  1892. }
  1893. /* ===========================================================================
  1894. * For Z_HUFFMAN_ONLY, do not look for matches. Do not maintain a hash table.
  1895. * (It will be regenerated if this run of deflate switches away from Huffman.)
  1896. */
  1897. local block_state deflate_huff(deflate_state *s, int flush) {
  1898. int bflush; /* set if current block must be flushed */
  1899. for (;;) {
  1900. /* Make sure that we have a literal to write. */
  1901. if (s->lookahead == 0) {
  1902. fill_window(s);
  1903. if (s->lookahead == 0) {
  1904. if (flush == Z_NO_FLUSH)
  1905. return need_more;
  1906. break; /* flush the current block */
  1907. }
  1908. }
  1909. /* Output a literal byte */
  1910. s->match_length = 0;
  1911. Tracevv((stderr,"%c", s->window[s->strstart]));
  1912. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1913. s->lookahead--;
  1914. s->strstart++;
  1915. if (bflush) FLUSH_BLOCK(s, 0);
  1916. }
  1917. s->insert = 0;
  1918. if (flush == Z_FINISH) {
  1919. FLUSH_BLOCK(s, 1);
  1920. return finish_done;
  1921. }
  1922. if (s->sym_next)
  1923. FLUSH_BLOCK(s, 0);
  1924. return block_done;
  1925. }