deflate.c 80 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
7177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143
  1. /* deflate.c -- compress data using the deflation algorithm
  2. * Copyright (C) 1995-2024 Jean-loup Gailly and Mark Adler
  3. * For conditions of distribution and use, see copyright notice in zlib.h
  4. */
  5. /*
  6. * ALGORITHM
  7. *
  8. * The "deflation" process depends on being able to identify portions
  9. * of the input text which are identical to earlier input (within a
  10. * sliding window trailing behind the input currently being processed).
  11. *
  12. * The most straightforward technique turns out to be the fastest for
  13. * most input files: try all possible matches and select the longest.
  14. * The key feature of this algorithm is that insertions into the string
  15. * dictionary are very simple and thus fast, and deletions are avoided
  16. * completely. Insertions are performed at each input character, whereas
  17. * string matches are performed only when the previous match ends. So it
  18. * is preferable to spend more time in matches to allow very fast string
  19. * insertions and avoid deletions. The matching algorithm for small
  20. * strings is inspired from that of Rabin & Karp. A brute force approach
  21. * is used to find longer strings when a small match has been found.
  22. * A similar algorithm is used in comic (by Jan-Mark Wams) and freeze
  23. * (by Leonid Broukhis).
  24. * A previous version of this file used a more sophisticated algorithm
  25. * (by Fiala and Greene) which is guaranteed to run in linear amortized
  26. * time, but has a larger average cost, uses more memory and is patented.
  27. * However the F&G algorithm may be faster for some highly redundant
  28. * files if the parameter max_chain_length (described below) is too large.
  29. *
  30. * ACKNOWLEDGEMENTS
  31. *
  32. * The idea of lazy evaluation of matches is due to Jan-Mark Wams, and
  33. * I found it in 'freeze' written by Leonid Broukhis.
  34. * Thanks to many people for bug reports and testing.
  35. *
  36. * REFERENCES
  37. *
  38. * Deutsch, L.P.,"DEFLATE Compressed Data Format Specification".
  39. * Available in http://tools.ietf.org/html/rfc1951
  40. *
  41. * A description of the Rabin and Karp algorithm is given in the book
  42. * "Algorithms" by R. Sedgewick, Addison-Wesley, p252.
  43. *
  44. * Fiala,E.R., and Greene,D.H.
  45. * Data Compression with Finite Windows, Comm.ACM, 32,4 (1989) 490-505
  46. *
  47. */
  48. /* @(#) $Id$ */
  49. #include "deflate.h"
  50. #include <util/system/compiler.h>
/* Version and copyright banner. It is defined as a named object (rather than
 * only appearing in a comment) so that the text can be kept in the executable
 * of products that embed the library, as requested in the note below.
 */
const char deflate_copyright[] =
   " deflate 1.3.1 Copyright 1995-2024 Jean-loup Gailly and Mark Adler ";
/*
  If you use the zlib library in a product, an acknowledgment is welcome
  in the documentation of your product. If for some reason you cannot
  include such an acknowledgment, I would appreciate that you keep this
  copyright string in the executable of your product.
 */
/* Result reported by a compression function (see compress_func) describing
 * how far the current block has progressed.
 */
typedef enum {
    need_more,      /* block not completed, need more input or more output */
    block_done,     /* block flush performed */
    finish_started, /* finish started, need only more output at next deflate */
    finish_done     /* finish done, accept no more input or output */
} block_state;
/* Compression function. Takes the deflate state and the flush mode and
 * returns the block state after the call.
 */
typedef block_state (*compress_func)(deflate_state *s, int flush);
/* Compression function. Returns the block state after the call. */

/* Forward declarations of the compression functions defined later in this
 * file. deflate_stored, deflate_fast and deflate_slow are referenced from
 * configuration_table; deflate_slow is not declared when FASTEST is defined.
 */
local block_state deflate_stored(deflate_state *s, int flush);
local block_state deflate_fast(deflate_state *s, int flush);
#ifndef FASTEST
local block_state deflate_slow(deflate_state *s, int flush);
#endif
local block_state deflate_rle(deflate_state *s, int flush);
local block_state deflate_huff(deflate_state *s, int flush);
  74. /* ===========================================================================
  75. * Local data
  76. */
#define NIL 0
/* Tail of hash chains. slide_hash() also stores NIL for entries that fall
 * out of the window when it slides.
 */

/* TOO_FAR may be overridden at build time; 4096 is the default. */
#ifndef TOO_FAR
#  define TOO_FAR 4096
#endif
/* Matches of length 3 are discarded if their distance exceeds TOO_FAR */
/* Values for max_lazy_match, good_match and max_chain_length, depending on
 * the desired pack level (0..9). The values given below have been tuned to
 * exclude worst case performance for pathological files. Better values may be
 * found for specific files.
 */
typedef struct config_s {
   ush good_length; /* reduce lazy search above this match length */
   ush max_lazy;    /* do not perform lazy search above this match length */
   ush nice_length; /* quit search above this match length */
   ush max_chain;   /* the "chain" column below; presumably the
                     * max_chain_length for the level -- confirm at the use
                     * site, which is outside this part of the file */
   compress_func func; /* compression function used for the level */
} config;

/* One row per compression level, indexed by level. When FASTEST is defined
 * only levels 0 and 1 exist (deflateInit2_ maps every non-zero level to 1).
 */
#ifdef FASTEST
local const config configuration_table[2] = {
/*      good lazy nice chain */
/* 0 */ {0,    0,  0,    0, deflate_stored},  /* store only */
/* 1 */ {4,    4,  8,    4, deflate_fast}}; /* max speed, no lazy matches */
#else
local const config configuration_table[10] = {
/*      good lazy nice chain */
/* 0 */ {0,    0,  0,    0, deflate_stored},  /* store only */
/* 1 */ {4,    4,  8,    4, deflate_fast}, /* max speed, no lazy matches */
/* 2 */ {4,    5, 16,    8, deflate_fast},
/* 3 */ {4,    6, 32,   32, deflate_fast},

/* 4 */ {4,    4, 16,   16, deflate_slow},  /* lazy matches */
/* 5 */ {8,   16, 32,   32, deflate_slow},
/* 6 */ {8,   16, 128, 128, deflate_slow},
/* 7 */ {8,   32, 128, 256, deflate_slow},
/* 8 */ {32, 128, 258, 1024, deflate_slow},
/* 9 */ {32, 258, 258, 4096, deflate_slow}}; /* max compression */
#endif

/* Note: the deflate() code requires max_lazy >= MIN_MATCH and max_chain >= 4
 * For deflate_fast() (levels <= 3) good is ignored and lazy has a different
 * meaning.
 */
/* rank Z_BLOCK between Z_NO_FLUSH and Z_PARTIAL_FLUSH */
/* Maps a flush value f to an ordering key: 2*f for f <= 4 and 2*f - 9 for
 * f > 4 (so f == 5 yields 1, which lies between the keys 0 and 2 produced by
 * f == 0 and f == 1). The argument is evaluated twice, so it must not have
 * side effects.
 */
#define RANK(f) (((f) * 2) - ((f) > 4 ? 9 : 0))
/* ===========================================================================
 * Update a hash value with the given input byte
 * IN  assertion: all calls to UPDATE_HASH are made with consecutive input
 *    characters, so that a running hash key can be computed from the previous
 *    key instead of complete recalculation each time.
 *
 * s is the deflate state (supplies hash_shift and hash_mask), h is the
 * running hash and c the next input byte. h is assigned to, so it must be a
 * modifiable lvalue; it is also read once, so the expression passed for h is
 * evaluated twice. s is expanded without surrounding parentheses, so pass a
 * plain pointer expression.
 */
#define UPDATE_HASH(s,h,c) (h = (((h) << s->hash_shift) ^ (c)) & s->hash_mask)
/* ===========================================================================
 * Insert string str in the dictionary and set match_head to the previous head
 * of the hash chain (the most recent string with same hash key).
 *
 * The macro is a comma expression whose own value is that of the final
 * assignment, i.e. (Pos)(str); it is NOT the length of the hash chain. The
 * useful result is delivered through match_head.
 *
 * Steps performed: the running hash s->ins_h is updated with the byte at
 * str + MIN_MATCH-1, the current head of that hash bucket is stored in
 * match_head (and, unless FASTEST is defined, linked into s->prev at index
 * str & s->w_mask), and finally str becomes the new head of the bucket.
 *
 * If this file is compiled with -DFASTEST, the compression level is forced
 * to 1, and no hash chains are maintained.
 * IN  assertion: all calls to INSERT_STRING are made with consecutive input
 *    characters and the first MIN_MATCH bytes of str are valid (except for
 *    the last MIN_MATCH-1 bytes of the input file).
 *
 * str is evaluated more than once, so it must not have side effects.
 */
#ifdef FASTEST
#define INSERT_STRING(s, str, match_head) \
   (UPDATE_HASH(s, s->ins_h, s->window[(str) + (MIN_MATCH-1)]), \
    match_head = s->head[s->ins_h], \
    s->head[s->ins_h] = (Pos)(str))
#else
#define INSERT_STRING(s, str, match_head) \
   (UPDATE_HASH(s, s->ins_h, s->window[(str) + (MIN_MATCH-1)]), \
    match_head = s->prev[(str) & s->w_mask] = s->head[s->ins_h], \
    s->head[s->ins_h] = (Pos)(str))
#endif
/* ===========================================================================
 * Initialize the hash table (avoiding 64K overflow for 16 bit systems).
 * prev[] will be initialized on the fly.
 *
 * The last entry of s->head is set to NIL by a direct store and the remaining
 * hash_size - 1 entries are zeroed with zmemzero(), so the byte count passed
 * to zmemzero() is one entry short of the full table size.
 */
#define CLEAR_HASH(s) \
    do { \
        s->head[s->hash_size - 1] = NIL; \
        zmemzero((Bytef *)s->head, \
                 (unsigned)(s->hash_size - 1)*sizeof(*s->head)); \
    } while (0)
  158. /* ===========================================================================
  159. * Slide the hash table when sliding the window down (could be avoided with 32
  160. * bit values at the expense of memory usage). We slide even when level == 0 to
  161. * keep the hash table consistent if we switch back to level > 0 later.
  162. */
  163. #if defined(__has_feature)
  164. # if __has_feature(memory_sanitizer)
  165. __attribute__((no_sanitize("memory")))
  166. # endif
  167. #endif
  168. local void slide_hash(deflate_state *s) {
  169. unsigned n, m;
  170. Posf *p;
  171. uInt wsize = s->w_size;
  172. n = s->hash_size;
  173. p = &s->head[n];
  174. do {
  175. m = *--p;
  176. *p = (Pos)(m >= wsize ? m - wsize : NIL);
  177. } while (--n);
  178. n = wsize;
  179. #ifndef FASTEST
  180. p = &s->prev[n];
  181. do {
  182. m = *--p;
  183. *p = (Pos)(m >= wsize ? m - wsize : NIL);
  184. /* If n is not on any hash chain, prev[n] is garbage but
  185. * its value will never be used.
  186. */
  187. } while (--n);
  188. #endif
  189. }
  190. /* ===========================================================================
  191. * Read a new buffer from the current input stream, update the adler32
  192. * and total number of bytes read. All deflate() input goes through
  193. * this function so some applications may wish to modify it to avoid
  194. * allocating a large strm->next_in buffer and copying from it.
  195. * (See also flush_pending()).
  196. */
  197. local unsigned read_buf(z_streamp strm, Bytef *buf, unsigned size) {
  198. unsigned len = strm->avail_in;
  199. if (len > size) len = size;
  200. if (len == 0) return 0;
  201. strm->avail_in -= len;
  202. zmemcpy(buf, strm->next_in, len);
  203. if (strm->state->wrap == 1) {
  204. strm->adler = adler32(strm->adler, buf, len);
  205. }
  206. #ifdef GZIP
  207. else if (strm->state->wrap == 2) {
  208. strm->adler = crc32(strm->adler, buf, len);
  209. }
  210. #endif
  211. strm->next_in += len;
  212. strm->total_in += len;
  213. return len;
  214. }
/* ===========================================================================
 * Fill the window when the lookahead becomes insufficient.
 * Updates strstart and lookahead.
 *
 * Each pass of the main loop (1) computes the free space at the end of the
 * window, (2) slides the upper half of the window down when strstart has
 * reached wsize + MAX_DIST(s), (3) reads new input behind the current
 * lookahead via read_buf(), and (4) hashes any positions that were deferred
 * in s->insert. After the loop, up to WIN_INIT bytes past the valid data are
 * zeroed and s->high_water is advanced accordingly.
 *
 * IN  assertion: lookahead < MIN_LOOKAHEAD
 * OUT assertions: strstart <= window_size-MIN_LOOKAHEAD
 *    At least one byte has been read, or avail_in == 0; reads are
 *    performed for at least two bytes (required for the zip translate_eol
 *    option -- not supported here).
 */
local void fill_window(deflate_state *s) {
    unsigned n;       /* number of bytes delivered by read_buf() this pass */
    unsigned more;    /* Amount of free space at the end of the window. */
    uInt wsize = s->w_size;

    Assert(s->lookahead < MIN_LOOKAHEAD, "already enough lookahead");

    do {
        more = (unsigned)(s->window_size -(ulg)s->lookahead -(ulg)s->strstart);

        /* Deal with !@#$% 64K limit: */
        if (sizeof(int) <= 2) {
            if (more == 0 && s->strstart == 0 && s->lookahead == 0) {
                more = wsize;

            } else if (more == (unsigned)(-1)) {
                /* Very unlikely, but possible on 16 bit machine if
                 * strstart == 0 && lookahead == 1 (input done a byte at time)
                 */
                more--;
            }
        }

        /* If the window is almost full and there is insufficient lookahead,
         * move the upper half to the lower one to make room in the upper half.
         */
        if (s->strstart >= wsize + MAX_DIST(s)) {

            /* Only the part of the upper half that holds data is copied:
             * wsize bytes minus the free space at the end of the window.
             */
            zmemcpy(s->window, s->window + wsize, (unsigned)wsize - more);
            /* Every stored position moves down by wsize with the data. */
            s->match_start -= wsize;
            s->strstart    -= wsize; /* we now have strstart >= MAX_DIST */
            s->block_start -= (long) wsize;
            /* Never keep more deferred insertions than there are bytes
             * before strstart.
             */
            if (s->insert > s->strstart)
                s->insert = s->strstart;
            slide_hash(s);
            more += wsize;
        }
        /* Nothing left to read: leave the loop (the high-water handling
         * below still runs).
         */
        if (s->strm->avail_in == 0) break;

        /* If there was no sliding:
         *    strstart <= WSIZE+MAX_DIST-1 && lookahead <= MIN_LOOKAHEAD - 1 &&
         *    more == window_size - lookahead - strstart
         * => more >= window_size - (MIN_LOOKAHEAD-1 + WSIZE + MAX_DIST-1)
         * => more >= window_size - 2*WSIZE + 2
         * In the BIG_MEM or MMAP case (not yet supported),
         *   window_size == input_size + MIN_LOOKAHEAD  &&
         *   strstart + s->lookahead <= input_size => more >= MIN_LOOKAHEAD.
         * Otherwise, window_size == 2*WSIZE so more >= 2.
         * If there was sliding, more >= WSIZE. So in all cases, more >= 2.
         */
        Assert(more >= 2, "more < 2");

        /* New input is appended directly after the current lookahead. */
        n = read_buf(s->strm, s->window + s->strstart + s->lookahead, more);
        s->lookahead += n;

        /* Initialize the hash value now that we have some input: */
        if (s->lookahead + s->insert >= MIN_MATCH) {
            /* First position whose insertion into the hash was deferred. */
            uInt str = s->strstart - s->insert;
            s->ins_h = s->window[str];
            UPDATE_HASH(s, s->ins_h, s->window[str + 1]);
#if MIN_MATCH != 3
            Call UPDATE_HASH() MIN_MATCH-3 more times
#endif
            /* Insert the deferred positions one by one; stop early as soon
             * as fewer than MIN_MATCH bytes remain for the next one.
             */
            while (s->insert) {
                UPDATE_HASH(s, s->ins_h, s->window[str + MIN_MATCH-1]);
#ifndef FASTEST
                s->prev[str & s->w_mask] = s->head[s->ins_h];
#endif
                s->head[s->ins_h] = (Pos)str;
                str++;
                s->insert--;
                if (s->lookahead + s->insert < MIN_MATCH)
                    break;
            }
        }
        /* If the whole input has less than MIN_MATCH bytes, ins_h is garbage,
         * but this is not important since only literal bytes will be emitted.
         */

    } while (s->lookahead < MIN_LOOKAHEAD && s->strm->avail_in != 0);

    /* If the WIN_INIT bytes after the end of the current data have never been
     * written, then zero those bytes in order to avoid memory check reports of
     * the use of uninitialized (or uninitialised as Julian writes) bytes by
     * the longest match routines.  Update the high water mark for the next
     * time through here.  WIN_INIT is set to MAX_MATCH since the longest match
     * routines allow scanning to strstart + MAX_MATCH, ignoring lookahead.
     */
    if (s->high_water < s->window_size) {
        ulg curr = s->strstart + (ulg)(s->lookahead); /* end of valid data */
        ulg init;                                     /* bytes to zero */

        if (s->high_water < curr) {
            /* Previous high water mark below current data -- zero WIN_INIT
             * bytes or up to end of window, whichever is less.
             */
            init = s->window_size - curr;
            if (init > WIN_INIT)
                init = WIN_INIT;
            zmemzero(s->window + curr, (unsigned)init);
            s->high_water = curr + init;
        }
        else if (s->high_water < (ulg)curr + WIN_INIT) {
            /* High water mark at or above current data, but below current data
             * plus WIN_INIT -- zero out to current data plus WIN_INIT, or up
             * to end of window, whichever is less.
             */
            init = (ulg)curr + WIN_INIT - s->high_water;
            if (init > s->window_size - s->high_water)
                init = s->window_size - s->high_water;
            zmemzero(s->window + s->high_water, (unsigned)init);
            s->high_water += init;
        }
    }

    Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
           "not enough room for search");
}
  330. /* ========================================================================= */
  331. int ZEXPORT deflateInit_(z_streamp strm, int level, const char *version,
  332. int stream_size) {
  333. return deflateInit2_(strm, level, Z_DEFLATED, MAX_WBITS, DEF_MEM_LEVEL,
  334. Z_DEFAULT_STRATEGY, version, stream_size);
  335. /* To do: ignore strm->next_in if we use it as window */
  336. }
  337. /* ========================================================================= */
  338. int ZEXPORT deflateInit2_(z_streamp strm, int level, int method,
  339. int windowBits, int memLevel, int strategy,
  340. const char *version, int stream_size) {
  341. deflate_state *s;
  342. int wrap = 1;
  343. static const char my_version[] = ZLIB_VERSION;
  344. if (version == Z_NULL || version[0] != my_version[0] ||
  345. stream_size != sizeof(z_stream)) {
  346. return Z_VERSION_ERROR;
  347. }
  348. if (strm == Z_NULL) return Z_STREAM_ERROR;
  349. strm->msg = Z_NULL;
  350. if (strm->zalloc == (alloc_func)0) {
  351. #ifdef Z_SOLO
  352. return Z_STREAM_ERROR;
  353. #else
  354. strm->zalloc = zcalloc;
  355. strm->opaque = (voidpf)0;
  356. #endif
  357. }
  358. if (strm->zfree == (free_func)0)
  359. #ifdef Z_SOLO
  360. return Z_STREAM_ERROR;
  361. #else
  362. strm->zfree = zcfree;
  363. #endif
  364. #ifdef FASTEST
  365. if (level != 0) level = 1;
  366. #else
  367. if (level == Z_DEFAULT_COMPRESSION) level = 6;
  368. #endif
  369. if (windowBits < 0) { /* suppress zlib wrapper */
  370. wrap = 0;
  371. if (windowBits < -15)
  372. return Z_STREAM_ERROR;
  373. windowBits = -windowBits;
  374. }
  375. #ifdef GZIP
  376. else if (windowBits > 15) {
  377. wrap = 2; /* write gzip wrapper instead */
  378. windowBits -= 16;
  379. }
  380. #endif
  381. if (memLevel < 1 || memLevel > MAX_MEM_LEVEL || method != Z_DEFLATED ||
  382. windowBits < 8 || windowBits > 15 || level < 0 || level > 9 ||
  383. strategy < 0 || strategy > Z_FIXED || (windowBits == 8 && wrap != 1)) {
  384. return Z_STREAM_ERROR;
  385. }
  386. if (windowBits == 8) windowBits = 9; /* until 256-byte window bug fixed */
  387. s = (deflate_state *) ZALLOC(strm, 1, sizeof(deflate_state));
  388. if (s == Z_NULL) return Z_MEM_ERROR;
  389. strm->state = (struct internal_state FAR *)s;
  390. s->strm = strm;
  391. s->status = INIT_STATE; /* to pass state test in deflateReset() */
  392. s->wrap = wrap;
  393. s->gzhead = Z_NULL;
  394. s->w_bits = (uInt)windowBits;
  395. s->w_size = 1 << s->w_bits;
  396. s->w_mask = s->w_size - 1;
  397. s->hash_bits = (uInt)memLevel + 7;
  398. s->hash_size = 1 << s->hash_bits;
  399. s->hash_mask = s->hash_size - 1;
  400. s->hash_shift = ((s->hash_bits + MIN_MATCH-1) / MIN_MATCH);
  401. s->window = (Bytef *) ZALLOC(strm, s->w_size, 2*sizeof(Byte));
  402. memset(s->window, 0, s->w_size * 2*sizeof(Byte));
  403. s->prev = (Posf *) ZALLOC(strm, s->w_size, sizeof(Pos));
  404. memset(s->prev, 0, s->w_size * sizeof(Pos));
  405. s->head = (Posf *) ZALLOC(strm, s->hash_size, sizeof(Pos));
  406. s->high_water = 0; /* nothing written to s->window yet */
  407. s->lit_bufsize = 1 << (memLevel + 6); /* 16K elements by default */
  408. /* We overlay pending_buf and sym_buf. This works since the average size
  409. * for length/distance pairs over any compressed block is assured to be 31
  410. * bits or less.
  411. *
  412. * Analysis: The longest fixed codes are a length code of 8 bits plus 5
  413. * extra bits, for lengths 131 to 257. The longest fixed distance codes are
  414. * 5 bits plus 13 extra bits, for distances 16385 to 32768. The longest
  415. * possible fixed-codes length/distance pair is then 31 bits total.
  416. *
  417. * sym_buf starts one-fourth of the way into pending_buf. So there are
  418. * three bytes in sym_buf for every four bytes in pending_buf. Each symbol
  419. * in sym_buf is three bytes -- two for the distance and one for the
  420. * literal/length. As each symbol is consumed, the pointer to the next
  421. * sym_buf value to read moves forward three bytes. From that symbol, up to
  422. * 31 bits are written to pending_buf. The closest the written pending_buf
  423. * bits gets to the next sym_buf symbol to read is just before the last
  424. * code is written. At that time, 31*(n - 2) bits have been written, just
  425. * after 24*(n - 2) bits have been consumed from sym_buf. sym_buf starts at
  426. * 8*n bits into pending_buf. (Note that the symbol buffer fills when n - 1
  427. * symbols are written.) The closest the writing gets to what is unread is
  428. * then n + 14 bits. Here n is lit_bufsize, which is 16384 by default, and
  429. * can range from 128 to 32768.
  430. *
  431. * Therefore, at a minimum, there are 142 bits of space between what is
  432. * written and what is read in the overlain buffers, so the symbols cannot
  433. * be overwritten by the compressed data. That space is actually 139 bits,
  434. * due to the three-bit fixed-code block header.
  435. *
  436. * That covers the case where either Z_FIXED is specified, forcing fixed
  437. * codes, or when the use of fixed codes is chosen, because that choice
  438. * results in a smaller compressed block than dynamic codes. That latter
  439. * condition then assures that the above analysis also covers all dynamic
  440. * blocks. A dynamic-code block will only be chosen to be emitted if it has
  441. * fewer bits than a fixed-code block would for the same set of symbols.
  442. * Therefore its average symbol length is assured to be less than 31. So
  443. * the compressed data for a dynamic block also cannot overwrite the
  444. * symbols from which it is being constructed.
  445. */
  446. s->pending_buf = (uchf *) ZALLOC(strm, s->lit_bufsize, LIT_BUFS);
  447. s->pending_buf_size = (ulg)s->lit_bufsize * 4;
  448. if (s->window == Z_NULL || s->prev == Z_NULL || s->head == Z_NULL ||
  449. s->pending_buf == Z_NULL) {
  450. s->status = FINISH_STATE;
  451. strm->msg = ERR_MSG(Z_MEM_ERROR);
  452. deflateEnd (strm);
  453. return Z_MEM_ERROR;
  454. }
  455. #ifdef LIT_MEM
  456. s->d_buf = (ushf *)(s->pending_buf + (s->lit_bufsize << 1));
  457. s->l_buf = s->pending_buf + (s->lit_bufsize << 2);
  458. s->sym_end = s->lit_bufsize - 1;
  459. #else
  460. s->sym_buf = s->pending_buf + s->lit_bufsize;
  461. s->sym_end = (s->lit_bufsize - 1) * 3;
  462. #endif
  463. /* We avoid equality with lit_bufsize*3 because of wraparound at 64K
  464. * on 16 bit machines and because stored blocks are restricted to
  465. * 64K-1 bytes.
  466. */
  467. s->level = level;
  468. s->strategy = strategy;
  469. s->method = (Byte)method;
  470. return deflateReset(strm);
  471. }
  472. /* =========================================================================
  473. * Check for a valid deflate stream state. Return 0 if ok, 1 if not.
  474. */
  475. local int deflateStateCheck(z_streamp strm) {
  476. deflate_state *s;
  477. if (strm == Z_NULL ||
  478. strm->zalloc == (alloc_func)0 || strm->zfree == (free_func)0)
  479. return 1;
  480. s = strm->state;
  481. if (s == Z_NULL || s->strm != strm || (s->status != INIT_STATE &&
  482. #ifdef GZIP
  483. s->status != GZIP_STATE &&
  484. #endif
  485. s->status != EXTRA_STATE &&
  486. s->status != NAME_STATE &&
  487. s->status != COMMENT_STATE &&
  488. s->status != HCRC_STATE &&
  489. s->status != BUSY_STATE &&
  490. s->status != FINISH_STATE))
  491. return 1;
  492. return 0;
  493. }
  494. /* ========================================================================= */
  495. int ZEXPORT deflateSetDictionary(z_streamp strm, const Bytef *dictionary,
  496. uInt dictLength) {
  497. deflate_state *s;
  498. uInt str, n;
  499. int wrap;
  500. unsigned avail;
  501. z_const unsigned char *next;
  502. if (deflateStateCheck(strm) || dictionary == Z_NULL)
  503. return Z_STREAM_ERROR;
  504. s = strm->state;
  505. wrap = s->wrap;
  506. if (wrap == 2 || (wrap == 1 && s->status != INIT_STATE) || s->lookahead)
  507. return Z_STREAM_ERROR;
  508. /* when using zlib wrappers, compute Adler-32 for provided dictionary */
  509. if (wrap == 1)
  510. strm->adler = adler32(strm->adler, dictionary, dictLength);
  511. s->wrap = 0; /* avoid computing Adler-32 in read_buf */
  512. /* if dictionary would fill window, just replace the history */
  513. if (dictLength >= s->w_size) {
  514. if (wrap == 0) { /* already empty otherwise */
  515. CLEAR_HASH(s);
  516. s->strstart = 0;
  517. s->block_start = 0L;
  518. s->insert = 0;
  519. }
  520. dictionary += dictLength - s->w_size; /* use the tail */
  521. dictLength = s->w_size;
  522. }
  523. /* insert dictionary into window and hash */
  524. avail = strm->avail_in;
  525. next = strm->next_in;
  526. strm->avail_in = dictLength;
  527. strm->next_in = (z_const Bytef *)dictionary;
  528. fill_window(s);
  529. while (s->lookahead >= MIN_MATCH) {
  530. str = s->strstart;
  531. n = s->lookahead - (MIN_MATCH-1);
  532. do {
  533. UPDATE_HASH(s, s->ins_h, s->window[str + MIN_MATCH-1]);
  534. #ifndef FASTEST
  535. s->prev[str & s->w_mask] = s->head[s->ins_h];
  536. #endif
  537. s->head[s->ins_h] = (Pos)str;
  538. str++;
  539. } while (--n);
  540. s->strstart = str;
  541. s->lookahead = MIN_MATCH-1;
  542. fill_window(s);
  543. }
  544. s->strstart += s->lookahead;
  545. s->block_start = (long)s->strstart;
  546. s->insert = s->lookahead;
  547. s->lookahead = 0;
  548. s->match_length = s->prev_length = MIN_MATCH-1;
  549. s->match_available = 0;
  550. strm->next_in = next;
  551. strm->avail_in = avail;
  552. s->wrap = wrap;
  553. return Z_OK;
  554. }
  555. /* ========================================================================= */
  556. int ZEXPORT deflateGetDictionary(z_streamp strm, Bytef *dictionary,
  557. uInt *dictLength) {
  558. deflate_state *s;
  559. uInt len;
  560. if (deflateStateCheck(strm))
  561. return Z_STREAM_ERROR;
  562. s = strm->state;
  563. len = s->strstart + s->lookahead;
  564. if (len > s->w_size)
  565. len = s->w_size;
  566. if (dictionary != Z_NULL && len)
  567. zmemcpy(dictionary, s->window + s->strstart + s->lookahead - len, len);
  568. if (dictLength != Z_NULL)
  569. *dictLength = len;
  570. return Z_OK;
  571. }
  572. /* ========================================================================= */
  573. int ZEXPORT deflateResetKeep(z_streamp strm) {
  574. deflate_state *s;
  575. if (deflateStateCheck(strm)) {
  576. return Z_STREAM_ERROR;
  577. }
  578. strm->total_in = strm->total_out = 0;
  579. strm->msg = Z_NULL; /* use zfree if we ever allocate msg dynamically */
  580. strm->data_type = Z_UNKNOWN;
  581. s = (deflate_state *)strm->state;
  582. s->pending = 0;
  583. s->pending_out = s->pending_buf;
  584. if (s->wrap < 0) {
  585. s->wrap = -s->wrap; /* was made negative by deflate(..., Z_FINISH); */
  586. }
  587. s->status =
  588. #ifdef GZIP
  589. s->wrap == 2 ? GZIP_STATE :
  590. #endif
  591. INIT_STATE;
  592. strm->adler =
  593. #ifdef GZIP
  594. s->wrap == 2 ? crc32(0L, Z_NULL, 0) :
  595. #endif
  596. adler32(0L, Z_NULL, 0);
  597. s->last_flush = -2;
  598. _tr_init(s);
  599. return Z_OK;
  600. }
  601. /* ===========================================================================
  602. * Initialize the "longest match" routines for a new zlib stream
  603. */
  604. local void lm_init(deflate_state *s) {
  605. s->window_size = (ulg)2L*s->w_size;
  606. CLEAR_HASH(s);
  607. /* Set the default configuration parameters:
  608. */
  609. s->max_lazy_match = configuration_table[s->level].max_lazy;
  610. s->good_match = configuration_table[s->level].good_length;
  611. s->nice_match = configuration_table[s->level].nice_length;
  612. s->max_chain_length = configuration_table[s->level].max_chain;
  613. s->strstart = 0;
  614. s->block_start = 0L;
  615. s->lookahead = 0;
  616. s->insert = 0;
  617. s->match_length = s->prev_length = MIN_MATCH-1;
  618. s->match_available = 0;
  619. s->ins_h = 0;
  620. }
  621. /* ========================================================================= */
  622. int ZEXPORT deflateReset(z_streamp strm) {
  623. int ret;
  624. ret = deflateResetKeep(strm);
  625. if (ret == Z_OK)
  626. lm_init(strm->state);
  627. return ret;
  628. }
  629. /* ========================================================================= */
  630. int ZEXPORT deflateSetHeader(z_streamp strm, gz_headerp head) {
  631. if (deflateStateCheck(strm) || strm->state->wrap != 2)
  632. return Z_STREAM_ERROR;
  633. strm->state->gzhead = head;
  634. return Z_OK;
  635. }
  636. /* ========================================================================= */
  637. int ZEXPORT deflatePending(z_streamp strm, unsigned *pending, int *bits) {
  638. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  639. if (pending != Z_NULL)
  640. *pending = strm->state->pending;
  641. if (bits != Z_NULL)
  642. *bits = strm->state->bi_valid;
  643. return Z_OK;
  644. }
  645. /* ========================================================================= */
  646. int ZEXPORT deflatePrime(z_streamp strm, int bits, int value) {
  647. deflate_state *s;
  648. int put;
  649. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  650. s = strm->state;
  651. #ifdef LIT_MEM
  652. if (bits < 0 || bits > 16 ||
  653. (uchf *)s->d_buf < s->pending_out + ((Buf_size + 7) >> 3))
  654. return Z_BUF_ERROR;
  655. #else
  656. if (bits < 0 || bits > 16 ||
  657. s->sym_buf < s->pending_out + ((Buf_size + 7) >> 3))
  658. return Z_BUF_ERROR;
  659. #endif
  660. do {
  661. put = Buf_size - s->bi_valid;
  662. if (put > bits)
  663. put = bits;
  664. s->bi_buf |= (ush)((value & ((1 << put) - 1)) << s->bi_valid);
  665. s->bi_valid += put;
  666. _tr_flush_bits(s);
  667. value >>= put;
  668. bits -= put;
  669. } while (bits);
  670. return Z_OK;
  671. }
  672. /* ========================================================================= */
  673. int ZEXPORT deflateParams(z_streamp strm, int level, int strategy) {
  674. deflate_state *s;
  675. compress_func func;
  676. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  677. s = strm->state;
  678. #ifdef FASTEST
  679. if (level != 0) level = 1;
  680. #else
  681. if (level == Z_DEFAULT_COMPRESSION) level = 6;
  682. #endif
  683. if (level < 0 || level > 9 || strategy < 0 || strategy > Z_FIXED) {
  684. return Z_STREAM_ERROR;
  685. }
  686. func = configuration_table[s->level].func;
  687. if ((strategy != s->strategy || func != configuration_table[level].func) &&
  688. s->last_flush != -2) {
  689. /* Flush the last buffer: */
  690. int err = deflate(strm, Z_BLOCK);
  691. if (err == Z_STREAM_ERROR)
  692. return err;
  693. if (strm->avail_in || (s->strstart - s->block_start) + s->lookahead)
  694. return Z_BUF_ERROR;
  695. }
  696. if (s->level != level) {
  697. if (s->level == 0 && s->matches != 0) {
  698. if (s->matches == 1)
  699. slide_hash(s);
  700. else
  701. CLEAR_HASH(s);
  702. s->matches = 0;
  703. }
  704. s->level = level;
  705. s->max_lazy_match = configuration_table[level].max_lazy;
  706. s->good_match = configuration_table[level].good_length;
  707. s->nice_match = configuration_table[level].nice_length;
  708. s->max_chain_length = configuration_table[level].max_chain;
  709. }
  710. s->strategy = strategy;
  711. return Z_OK;
  712. }
  713. /* ========================================================================= */
  714. int ZEXPORT deflateTune(z_streamp strm, int good_length, int max_lazy,
  715. int nice_length, int max_chain) {
  716. deflate_state *s;
  717. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  718. s = strm->state;
  719. s->good_match = (uInt)good_length;
  720. s->max_lazy_match = (uInt)max_lazy;
  721. s->nice_match = nice_length;
  722. s->max_chain_length = (uInt)max_chain;
  723. return Z_OK;
  724. }
  725. /* =========================================================================
  726. * For the default windowBits of 15 and memLevel of 8, this function returns a
  727. * close to exact, as well as small, upper bound on the compressed size. This
  728. * is an expansion of ~0.03%, plus a small constant.
  729. *
  730. * For any setting other than those defaults for windowBits and memLevel, one
  731. * of two worst case bounds is returned. This is at most an expansion of ~4% or
  732. * ~13%, plus a small constant.
  733. *
  734. * Both the 0.03% and 4% derive from the overhead of stored blocks. The first
  735. * one is for stored blocks of 16383 bytes (memLevel == 8), whereas the second
  736. * is for stored blocks of 127 bytes (the worst case memLevel == 1). The
  737. * expansion results from five bytes of header for each stored block.
  738. *
  739. * The larger expansion of 13% results from a window size less than or equal to
  740. * the symbols buffer size (windowBits <= memLevel + 7). In that case some of
  741. * the data being compressed may have slid out of the sliding window, impeding
  742. * a stored block from being emitted. Then the only choice is a fixed or
  743. * dynamic block, where a fixed block limits the maximum expansion to 9 bits
  744. * per 8-bit byte, plus 10 bits for every block. The smallest block size for
  745. * which this can occur is 255 (memLevel == 2).
  746. *
  747. * Shifts are used to approximate divisions, for speed.
  748. */
  749. uLong ZEXPORT deflateBound(z_streamp strm, uLong sourceLen) {
  750. deflate_state *s;
  751. uLong fixedlen, storelen, wraplen;
  752. /* upper bound for fixed blocks with 9-bit literals and length 255
  753. (memLevel == 2, which is the lowest that may not use stored blocks) --
  754. ~13% overhead plus a small constant */
  755. fixedlen = sourceLen + (sourceLen >> 3) + (sourceLen >> 8) +
  756. (sourceLen >> 9) + 4;
  757. /* upper bound for stored blocks with length 127 (memLevel == 1) --
  758. ~4% overhead plus a small constant */
  759. storelen = sourceLen + (sourceLen >> 5) + (sourceLen >> 7) +
  760. (sourceLen >> 11) + 7;
  761. /* if can't get parameters, return larger bound plus a zlib wrapper */
  762. if (deflateStateCheck(strm))
  763. return (fixedlen > storelen ? fixedlen : storelen) + 6;
  764. /* compute wrapper length */
  765. s = strm->state;
  766. switch (s->wrap) {
  767. case 0: /* raw deflate */
  768. wraplen = 0;
  769. break;
  770. case 1: /* zlib wrapper */
  771. wraplen = 6 + (s->strstart ? 4 : 0);
  772. break;
  773. #ifdef GZIP
  774. case 2: /* gzip wrapper */
  775. wraplen = 18;
  776. if (s->gzhead != Z_NULL) { /* user-supplied gzip header */
  777. Bytef *str;
  778. if (s->gzhead->extra != Z_NULL)
  779. wraplen += 2 + s->gzhead->extra_len;
  780. str = s->gzhead->name;
  781. if (str != Z_NULL)
  782. do {
  783. wraplen++;
  784. } while (*str++);
  785. str = s->gzhead->comment;
  786. if (str != Z_NULL)
  787. do {
  788. wraplen++;
  789. } while (*str++);
  790. if (s->gzhead->hcrc)
  791. wraplen += 2;
  792. }
  793. break;
  794. #endif
  795. default: /* for compiler happiness */
  796. wraplen = 6;
  797. }
  798. /* if not default parameters, return one of the conservative bounds */
  799. if (s->w_bits != 15 || s->hash_bits != 8 + 7)
  800. return (s->w_bits <= s->hash_bits && s->level ? fixedlen : storelen) +
  801. wraplen;
  802. /* default settings: return tight bound for that case -- ~0.03% overhead
  803. plus a small constant */
  804. return sourceLen + (sourceLen >> 12) + (sourceLen >> 14) +
  805. (sourceLen >> 25) + 13 - 6 + wraplen;
  806. }
  807. /* =========================================================================
  808. * Put a short in the pending buffer. The 16-bit value is put in MSB order.
  809. * IN assertion: the stream state is correct and there is enough room in
  810. * pending_buf.
  811. */
  812. local void putShortMSB(deflate_state *s, uInt b) {
  813. put_byte(s, (Byte)(b >> 8));
  814. put_byte(s, (Byte)(b & 0xff));
  815. }
  816. /* =========================================================================
  817. * Flush as much pending output as possible. All deflate() output, except for
  818. * some deflate_stored() output, goes through this function so some
  819. * applications may wish to modify it to avoid allocating a large
  820. * strm->next_out buffer and copying into it. (See also read_buf()).
  821. */
  822. local void flush_pending(z_streamp strm) {
  823. unsigned len;
  824. deflate_state *s = strm->state;
  825. _tr_flush_bits(s);
  826. len = s->pending;
  827. if (len > strm->avail_out) len = strm->avail_out;
  828. if (len == 0) return;
  829. zmemcpy(strm->next_out, s->pending_out, len);
  830. strm->next_out += len;
  831. s->pending_out += len;
  832. strm->total_out += len;
  833. strm->avail_out -= len;
  834. s->pending -= len;
  835. if (s->pending == 0) {
  836. s->pending_out = s->pending_buf;
  837. }
  838. }
  839. /* ===========================================================================
  840. * Update the header CRC with the bytes s->pending_buf[beg..s->pending - 1].
  841. */
  842. #define HCRC_UPDATE(beg) \
  843. do { \
  844. if (s->gzhead->hcrc && s->pending > (beg)) \
  845. strm->adler = crc32(strm->adler, s->pending_buf + (beg), \
  846. s->pending - (beg)); \
  847. } while (0)
  848. /* ========================================================================= */
  /*
   * Compress input from strm->next_in into strm->next_out, emitting the
   * zlib or gzip header and trailer as selected by s->wrap and s->status.
   *
   * Returns Z_STREAM_ERROR for an invalid stream, a flush value outside
   * 0..Z_BLOCK, a Z_NULL next_out, a Z_NULL next_in while avail_in != 0, or
   * a call with flush != Z_FINISH once the stream is in FINISH_STATE.
   * Returns Z_BUF_ERROR when avail_out is 0 on entry, when there is neither
   * pending output nor input and the flush rank did not increase (Z_FINISH
   * excepted), or when input is supplied in FINISH_STATE.
   * Returns Z_STREAM_END when flush == Z_FINISH and nothing is left pending
   * after the trailer (if any) has been handled.
   * Returns Z_OK otherwise.
   */
  849. int ZEXPORT deflate(z_streamp strm, int flush) {
  850. int old_flush; /* value of flush param for previous deflate call */
  851. deflate_state *s;
  852. if (deflateStateCheck(strm) || flush > Z_BLOCK || flush < 0) {
  853. return Z_STREAM_ERROR;
  854. }
  855. s = strm->state;
  856. if (strm->next_out == Z_NULL ||
  857. (strm->avail_in != 0 && strm->next_in == Z_NULL) ||
  858. (s->status == FINISH_STATE && flush != Z_FINISH)) {
  859. ERR_RETURN(strm, Z_STREAM_ERROR);
  860. }
  861. if (strm->avail_out == 0) ERR_RETURN(strm, Z_BUF_ERROR);
  /* remember the previous flush value for the duplicate-flush test below */
  862. old_flush = s->last_flush;
  863. s->last_flush = flush;
  864. /* Flush as much pending output as possible */
  865. if (s->pending != 0) {
  866. flush_pending(strm);
  867. if (strm->avail_out == 0) {
  868. /* Since avail_out is 0, deflate will be called again with
  869. * more output space, but possibly with both pending and
  870. * avail_in equal to zero. There won't be anything to do,
  871. * but this is not an error situation so make sure we
  872. * return OK instead of BUF_ERROR at next call of deflate:
  873. */
  874. s->last_flush = -1;
  875. return Z_OK;
  876. }
  877. /* Make sure there is something to do and avoid duplicate consecutive
  878. * flushes. For repeated and useless calls with Z_FINISH, we keep
  879. * returning Z_STREAM_END instead of Z_BUF_ERROR.
  880. */
  881. } else if (strm->avail_in == 0 && RANK(flush) <= RANK(old_flush) &&
  882. flush != Z_FINISH) {
  883. ERR_RETURN(strm, Z_BUF_ERROR);
  884. }
  885. /* User must not provide more input after the first FINISH: */
  886. if (s->status == FINISH_STATE && strm->avail_in != 0) {
  887. ERR_RETURN(strm, Z_BUF_ERROR);
  888. }
  889. /* Write the header */
  /* raw deflate (wrap == 0) has no header: go straight to BUSY_STATE */
  890. if (s->status == INIT_STATE && s->wrap == 0)
  891. s->status = BUSY_STATE;
  892. if (s->status == INIT_STATE) {
  893. /* zlib header */
  894. uInt header = (Z_DEFLATED + ((s->w_bits - 8) << 4)) << 8;
  895. uInt level_flags;
  /* map strategy and level onto the two-bit level field of the header */
  896. if (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2)
  897. level_flags = 0;
  898. else if (s->level < 6)
  899. level_flags = 1;
  900. else if (s->level == 6)
  901. level_flags = 2;
  902. else
  903. level_flags = 3;
  904. header |= (level_flags << 6);
  /* a non-zero strstart here means a preset dictionary was loaded */
  905. if (s->strstart != 0) header |= PRESET_DICT;
  /* round the 16-bit header value up to the next multiple of 31 */
  906. header += 31 - (header % 31);
  907. putShortMSB(s, header);
  908. /* Save the adler32 of the preset dictionary: */
  909. if (s->strstart != 0) {
  910. putShortMSB(s, (uInt)(strm->adler >> 16));
  911. putShortMSB(s, (uInt)(strm->adler & 0xffff));
  912. }
  913. strm->adler = adler32(0L, Z_NULL, 0);
  914. s->status = BUSY_STATE;
  915. /* Compression must start with an empty pending buffer */
  916. flush_pending(strm);
  917. if (s->pending != 0) {
  918. s->last_flush = -1;
  919. return Z_OK;
  920. }
  921. }
  922. #ifdef GZIP
  923. if (s->status == GZIP_STATE) {
  924. /* gzip header */
  925. strm->adler = crc32(0L, Z_NULL, 0);
  926. put_byte(s, 31);
  927. put_byte(s, 139);
  928. put_byte(s, 8);
  /* no user header: write fixed default fields and start compressing */
  929. if (s->gzhead == Z_NULL) {
  930. put_byte(s, 0);
  931. put_byte(s, 0);
  932. put_byte(s, 0);
  933. put_byte(s, 0);
  934. put_byte(s, 0);
  935. put_byte(s, s->level == 9 ? 2 :
  936. (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2 ?
  937. 4 : 0));
  938. put_byte(s, OS_CODE);
  939. s->status = BUSY_STATE;
  940. /* Compression must start with an empty pending buffer */
  941. flush_pending(strm);
  942. if (s->pending != 0) {
  943. s->last_flush = -1;
  944. return Z_OK;
  945. }
  946. }
  947. else {
  /* flag byte: one bit per optional header part present in gzhead */
  948. put_byte(s, (s->gzhead->text ? 1 : 0) +
  949. (s->gzhead->hcrc ? 2 : 0) +
  950. (s->gzhead->extra == Z_NULL ? 0 : 4) +
  951. (s->gzhead->name == Z_NULL ? 0 : 8) +
  952. (s->gzhead->comment == Z_NULL ? 0 : 16)
  953. );
  /* gzhead->time as four bytes, least significant first */
  954. put_byte(s, (Byte)(s->gzhead->time & 0xff));
  955. put_byte(s, (Byte)((s->gzhead->time >> 8) & 0xff));
  956. put_byte(s, (Byte)((s->gzhead->time >> 16) & 0xff));
  957. put_byte(s, (Byte)((s->gzhead->time >> 24) & 0xff));
  958. put_byte(s, s->level == 9 ? 2 :
  959. (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2 ?
  960. 4 : 0));
  961. put_byte(s, s->gzhead->os & 0xff);
  962. if (s->gzhead->extra != Z_NULL) {
  963. put_byte(s, s->gzhead->extra_len & 0xff);
  964. put_byte(s, (s->gzhead->extra_len >> 8) & 0xff);
  965. }
  966. if (s->gzhead->hcrc)
  967. strm->adler = crc32(strm->adler, s->pending_buf,
  968. s->pending);
  /* gzindex tracks progress through the extra, name and comment fields */
  969. s->gzindex = 0;
  970. s->status = EXTRA_STATE;
  971. }
  972. }
  973. if (s->status == EXTRA_STATE) {
  974. if (s->gzhead->extra != Z_NULL) {
  975. ulg beg = s->pending; /* start of bytes to update crc */
  976. uInt left = (s->gzhead->extra_len & 0xffff) - s->gzindex;
  /* while the rest does not fit: fill the buffer, flush, and return
   * early if output space runs out (gzindex records where to resume) */
  977. while (s->pending + left > s->pending_buf_size) {
  978. uInt copy = s->pending_buf_size - s->pending;
  979. zmemcpy(s->pending_buf + s->pending,
  980. s->gzhead->extra + s->gzindex, copy);
  981. s->pending = s->pending_buf_size;
  982. HCRC_UPDATE(beg);
  983. s->gzindex += copy;
  984. flush_pending(strm);
  985. if (s->pending != 0) {
  986. s->last_flush = -1;
  987. return Z_OK;
  988. }
  989. beg = 0;
  990. left -= copy;
  991. }
  992. zmemcpy(s->pending_buf + s->pending,
  993. s->gzhead->extra + s->gzindex, left);
  994. s->pending += left;
  995. HCRC_UPDATE(beg);
  996. s->gzindex = 0;
  997. }
  998. s->status = NAME_STATE;
  999. }
  1000. if (s->status == NAME_STATE) {
  1001. if (s->gzhead->name != Z_NULL) {
  1002. ulg beg = s->pending; /* start of bytes to update crc */
  1003. int val;
  /* copy the name including its terminating zero, flushing when full */
  1004. do {
  1005. if (s->pending == s->pending_buf_size) {
  1006. HCRC_UPDATE(beg);
  1007. flush_pending(strm);
  1008. if (s->pending != 0) {
  1009. s->last_flush = -1;
  1010. return Z_OK;
  1011. }
  1012. beg = 0;
  1013. }
  1014. val = s->gzhead->name[s->gzindex++];
  1015. put_byte(s, val);
  1016. } while (val != 0);
  1017. HCRC_UPDATE(beg);
  1018. s->gzindex = 0;
  1019. }
  1020. s->status = COMMENT_STATE;
  1021. }
  1022. if (s->status == COMMENT_STATE) {
  1023. if (s->gzhead->comment != Z_NULL) {
  1024. ulg beg = s->pending; /* start of bytes to update crc */
  1025. int val;
  /* copy the comment including its terminating zero, flushing when full */
  1026. do {
  1027. if (s->pending == s->pending_buf_size) {
  1028. HCRC_UPDATE(beg);
  1029. flush_pending(strm);
  1030. if (s->pending != 0) {
  1031. s->last_flush = -1;
  1032. return Z_OK;
  1033. }
  1034. beg = 0;
  1035. }
  1036. val = s->gzhead->comment[s->gzindex++];
  1037. put_byte(s, val);
  1038. } while (val != 0);
  1039. HCRC_UPDATE(beg);
  1040. }
  1041. s->status = HCRC_STATE;
  1042. }
  1043. if (s->status == HCRC_STATE) {
  1044. if (s->gzhead->hcrc) {
  /* make room for the two header CRC bytes */
  1045. if (s->pending + 2 > s->pending_buf_size) {
  1046. flush_pending(strm);
  1047. if (s->pending != 0) {
  1048. s->last_flush = -1;
  1049. return Z_OK;
  1050. }
  1051. }
  /* low 16 bits of the header CRC, least significant byte first;
   * then restart the CRC for the data that follows */
  1052. put_byte(s, (Byte)(strm->adler & 0xff));
  1053. put_byte(s, (Byte)((strm->adler >> 8) & 0xff));
  1054. strm->adler = crc32(0L, Z_NULL, 0);
  1055. }
  1056. s->status = BUSY_STATE;
  1057. /* Compression must start with an empty pending buffer */
  1058. flush_pending(strm);
  1059. if (s->pending != 0) {
  1060. s->last_flush = -1;
  1061. return Z_OK;
  1062. }
  1063. }
  1064. #endif
  1065. /* Start a new block or continue the current one.
  1066. */
  1067. if (strm->avail_in != 0 || s->lookahead != 0 ||
  1068. (flush != Z_NO_FLUSH && s->status != FINISH_STATE)) {
  1069. block_state bstate;
  /* pick the compressor: stored for level 0, then by strategy, else the
   * function configured for the level */
  1070. bstate = s->level == 0 ? deflate_stored(s, flush) :
  1071. s->strategy == Z_HUFFMAN_ONLY ? deflate_huff(s, flush) :
  1072. s->strategy == Z_RLE ? deflate_rle(s, flush) :
  1073. (*(configuration_table[s->level].func))(s, flush);
  1074. if (bstate == finish_started || bstate == finish_done) {
  1075. s->status = FINISH_STATE;
  1076. }
  1077. if (bstate == need_more || bstate == finish_started) {
  1078. if (strm->avail_out == 0) {
  1079. s->last_flush = -1; /* avoid BUF_ERROR next call, see above */
  1080. }
  1081. return Z_OK;
  1082. /* If flush != Z_NO_FLUSH && avail_out == 0, the next call
  1083. * of deflate should use the same flush parameter to make sure
  1084. * that the flush is complete. So we don't have to output an
  1085. * empty block here, this will be done at next call. This also
  1086. * ensures that for a very small output buffer, we emit at most
  1087. * one empty block.
  1088. */
  1089. }
  1090. if (bstate == block_done) {
  1091. if (flush == Z_PARTIAL_FLUSH) {
  1092. _tr_align(s);
  1093. } else if (flush != Z_BLOCK) { /* FULL_FLUSH or SYNC_FLUSH */
  1094. _tr_stored_block(s, (char*)0, 0L, 0);
  1095. /* For a full flush, this empty block will be recognized
  1096. * as a special marker by inflate_sync().
  1097. */
  1098. if (flush == Z_FULL_FLUSH) {
  1099. CLEAR_HASH(s); /* forget history */
  1100. if (s->lookahead == 0) {
  1101. s->strstart = 0;
  1102. s->block_start = 0L;
  1103. s->insert = 0;
  1104. }
  1105. }
  1106. }
  1107. flush_pending(strm);
  1108. if (strm->avail_out == 0) {
  1109. s->last_flush = -1; /* avoid BUF_ERROR at next call, see above */
  1110. return Z_OK;
  1111. }
  1112. }
  1113. }
  1114. if (flush != Z_FINISH) return Z_OK;
  /* raw deflate (wrap == 0), or trailer already written (wrap negated below) */
  1115. if (s->wrap <= 0) return Z_STREAM_END;
  1116. /* Write the trailer */
  1117. #ifdef GZIP
  1118. if (s->wrap == 2) {
  /* gzip: check value, then total_in, each as four bytes, least
   * significant byte first */
  1119. put_byte(s, (Byte)(strm->adler & 0xff));
  1120. put_byte(s, (Byte)((strm->adler >> 8) & 0xff));
  1121. put_byte(s, (Byte)((strm->adler >> 16) & 0xff));
  1122. put_byte(s, (Byte)((strm->adler >> 24) & 0xff));
  1123. put_byte(s, (Byte)(strm->total_in & 0xff));
  1124. put_byte(s, (Byte)((strm->total_in >> 8) & 0xff));
  1125. put_byte(s, (Byte)((strm->total_in >> 16) & 0xff));
  1126. put_byte(s, (Byte)((strm->total_in >> 24) & 0xff));
  1127. }
  1128. else
  1129. #endif
  1130. {
  /* zlib: check value as two 16-bit halves, most significant first */
  1131. putShortMSB(s, (uInt)(strm->adler >> 16));
  1132. putShortMSB(s, (uInt)(strm->adler & 0xffff));
  1133. }
  1134. flush_pending(strm);
  1135. /* If avail_out is zero, the application will call deflate again
  1136. * to flush the rest.
  1137. */
  1138. if (s->wrap > 0) s->wrap = -s->wrap; /* write the trailer only once! */
  1139. return s->pending != 0 ? Z_OK : Z_STREAM_END;
  1140. }
  1141. /* ========================================================================= */
  1142. int ZEXPORT deflateEnd(z_streamp strm) {
  1143. int status;
  1144. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  1145. status = strm->state->status;
  1146. /* Deallocate in reverse order of allocations: */
  1147. TRY_FREE(strm, strm->state->pending_buf);
  1148. TRY_FREE(strm, strm->state->head);
  1149. TRY_FREE(strm, strm->state->prev);
  1150. TRY_FREE(strm, strm->state->window);
  1151. ZFREE(strm, strm->state);
  1152. strm->state = Z_NULL;
  1153. return status == BUSY_STATE ? Z_DATA_ERROR : Z_OK;
  1154. }
  1155. /* =========================================================================
  1156. * Copy the source state to the destination state.
  1157. * To simplify the source, this is not supported for 16-bit MSDOS (which
  1158. * doesn't have enough memory anyway to duplicate compression states).
  1159. */
  1160. int ZEXPORT deflateCopy(z_streamp dest, z_streamp source) {
  1161. #ifdef MAXSEG_64K
  1162. (void)dest;
  1163. (void)source;
  1164. return Z_STREAM_ERROR;
  1165. #else
  1166. deflate_state *ds;
  1167. deflate_state *ss;
  1168. if (deflateStateCheck(source) || dest == Z_NULL) {
  1169. return Z_STREAM_ERROR;
  1170. }
  1171. ss = source->state;
  1172. zmemcpy((voidpf)dest, (voidpf)source, sizeof(z_stream));
  1173. ds = (deflate_state *) ZALLOC(dest, 1, sizeof(deflate_state));
  1174. if (ds == Z_NULL) return Z_MEM_ERROR;
  1175. dest->state = (struct internal_state FAR *) ds;
  1176. zmemcpy((voidpf)ds, (voidpf)ss, sizeof(deflate_state));
  1177. ds->strm = dest;
  1178. ds->window = (Bytef *) ZALLOC(dest, ds->w_size, 2*sizeof(Byte));
  1179. ds->prev = (Posf *) ZALLOC(dest, ds->w_size, sizeof(Pos));
  1180. ds->head = (Posf *) ZALLOC(dest, ds->hash_size, sizeof(Pos));
  1181. ds->pending_buf = (uchf *) ZALLOC(dest, ds->lit_bufsize, LIT_BUFS);
  1182. if (ds->window == Z_NULL || ds->prev == Z_NULL || ds->head == Z_NULL ||
  1183. ds->pending_buf == Z_NULL) {
  1184. deflateEnd (dest);
  1185. return Z_MEM_ERROR;
  1186. }
  1187. /* following zmemcpy do not work for 16-bit MSDOS */
  1188. zmemcpy(ds->window, ss->window, ds->w_size * 2 * sizeof(Byte));
  1189. zmemcpy((voidpf)ds->prev, (voidpf)ss->prev, ds->w_size * sizeof(Pos));
  1190. zmemcpy((voidpf)ds->head, (voidpf)ss->head, ds->hash_size * sizeof(Pos));
  1191. zmemcpy(ds->pending_buf, ss->pending_buf, ds->lit_bufsize * LIT_BUFS);
  1192. ds->pending_out = ds->pending_buf + (ss->pending_out - ss->pending_buf);
  1193. #ifdef LIT_MEM
  1194. ds->d_buf = (ushf *)(ds->pending_buf + (ds->lit_bufsize << 1));
  1195. ds->l_buf = ds->pending_buf + (ds->lit_bufsize << 2);
  1196. #else
  1197. ds->sym_buf = ds->pending_buf + ds->lit_bufsize;
  1198. #endif
  1199. ds->l_desc.dyn_tree = ds->dyn_ltree;
  1200. ds->d_desc.dyn_tree = ds->dyn_dtree;
  1201. ds->bl_desc.dyn_tree = ds->bl_tree;
  1202. return Z_OK;
  1203. #endif /* MAXSEG_64K */
  1204. }
  1205. #ifndef FASTEST
  1206. /* ===========================================================================
  1207. * Set match_start to the longest match starting at the given string and
  1208. * return its length. Matches shorter or equal to prev_length are discarded,
  1209. * in which case the result is equal to prev_length and match_start is
  1210. * garbage.
  1211. * IN assertions: cur_match is the head of the hash chain for the current
  1212. * string (strstart) and its distance is <= MAX_DIST, and prev_length >= 1
  1213. * OUT assertion: the match length is not greater than s->lookahead.
  1214. */
  /* NOTE(review): Y_NO_SANITIZE is defined outside this chunk; presumably it
   * switches off the named sanitizer for this function -- confirm. */
  1215. Y_NO_SANITIZE("undefined")
  1216. local uInt longest_match(deflate_state *s, IPos cur_match) {
  1217. unsigned chain_length = s->max_chain_length;/* max hash chain length */
  1218. register Bytef *scan = s->window + s->strstart; /* current string */
  1219. register Bytef *match; /* matched string */
  1220. register int len; /* length of current match */
  1221. int best_len = (int)s->prev_length; /* best match length so far */
  1222. int nice_match = s->nice_match; /* stop if match long enough */
  /* lowest window index still within MAX_DIST of strstart, or NIL */
  1223. IPos limit = s->strstart > (IPos)MAX_DIST(s) ?
  1224. s->strstart - (IPos)MAX_DIST(s) : NIL;
  1225. /* Stop when cur_match becomes <= limit. To simplify the code,
  1226. * we prevent matches with the string of window index 0.
  1227. */
  1228. Posf *prev = s->prev;
  1229. uInt wmask = s->w_mask;
  /* cache the bytes at the current best length so that a candidate can be
   * rejected before the full comparison */
  1230. #ifdef UNALIGNED_OK
  1231. /* Compare two bytes at a time. Note: this is not always beneficial.
  1232. * Try with and without -DUNALIGNED_OK to check.
  1233. */
  1234. register Bytef *strend = s->window + s->strstart + MAX_MATCH - 1;
  1235. register ush scan_start = *(ushf*)scan;
  1236. register ush scan_end = *(ushf*)(scan + best_len - 1);
  1237. #else
  1238. register Bytef *strend = s->window + s->strstart + MAX_MATCH;
  1239. register Byte scan_end1 = scan[best_len - 1];
  1240. register Byte scan_end = scan[best_len];
  1241. #endif
  1242. /* The code is optimized for HASH_BITS >= 8 and MAX_MATCH-2 multiple of 16.
  1243. * It is easy to get rid of this optimization if necessary.
  1244. */
  1245. Assert(s->hash_bits >= 8 && MAX_MATCH == 258, "Code too clever");
  1246. /* Do not waste too much time if we already have a good match: */
  1247. if (s->prev_length >= s->good_match) {
  1248. chain_length >>= 2;
  1249. }
  1250. /* Do not look for matches beyond the end of the input. This is necessary
  1251. * to make deflate deterministic.
  1252. */
  1253. if ((uInt)nice_match > s->lookahead) nice_match = (int)s->lookahead;
  1254. Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
  1255. "need lookahead");
  /* walk the hash chain starting at cur_match; each pass tests one
   * candidate position */
  1256. do {
  1257. Assert(cur_match < s->strstart, "no future");
  1258. match = s->window + cur_match;
  1259. /* Skip to next match if the match length cannot increase
  1260. * or if the match length is less than 2. Note that the checks below
  1261. * for insufficient lookahead only occur occasionally for performance
  1262. * reasons. Therefore uninitialized memory will be accessed, and
  1263. * conditional jumps will be made that depend on those values.
  1264. * However the length of the match is limited to the lookahead, so
  1265. * the output of deflate is not affected by the uninitialized values.
  1266. */
  1267. #if (defined(UNALIGNED_OK) && MAX_MATCH == 258)
  1268. /* This code assumes sizeof(unsigned short) == 2. Do not use
  1269. * UNALIGNED_OK if your compiler uses a different size.
  1270. */
  1271. if (*(ushf*)(match + best_len - 1) != scan_end ||
  1272. *(ushf*)match != scan_start) continue;
  1273. /* It is not necessary to compare scan[2] and match[2] since they are
  1274. * always equal when the other bytes match, given that the hash keys
  1275. * are equal and that HASH_BITS >= 8. Compare 2 bytes at a time at
  1276. * strstart + 3, + 5, up to strstart + 257. We check for insufficient
  1277. * lookahead only every 4th comparison; the 128th check will be made
  1278. * at strstart + 257. If MAX_MATCH-2 is not a multiple of 8, it is
  1279. * necessary to put more guard bytes at the end of the window, or
  1280. * to check more often for insufficient lookahead.
  1281. */
  1282. Assert(scan[2] == match[2], "scan[2]?");
  1283. scan++, match++;
  1284. do {
  1285. } while (*(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1286. *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1287. *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1288. *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1289. scan < strend);
  1290. /* The funny "do {}" generates better code on most compilers */
  1291. /* Here, scan <= window + strstart + 257 */
  1292. Assert(scan <= s->window + (unsigned)(s->window_size - 1),
  1293. "wild scan");
  /* the two-byte compare stopped on a pair: count its first byte if it
   * still matches */
  1294. if (*scan == *match) scan++;
  1295. len = (MAX_MATCH - 1) - (int)(strend - scan);
  /* rewind scan to the start of the current string for the next candidate */
  1296. scan = strend - (MAX_MATCH-1);
  1297. #else /* UNALIGNED_OK */
  1298. if (match[best_len] != scan_end ||
  1299. match[best_len - 1] != scan_end1 ||
  1300. *match != *scan ||
  1301. *++match != scan[1]) continue;
  1302. /* The check at best_len - 1 can be removed because it will be made
  1303. * again later. (This heuristic is not always a win.)
  1304. * It is not necessary to compare scan[2] and match[2] since they
  1305. * are always equal when the other bytes match, given that
  1306. * the hash keys are equal and that HASH_BITS >= 8.
  1307. */
  1308. scan += 2, match++;
  1309. Assert(*scan == *match, "match[2]?");
  1310. /* We check for insufficient lookahead only every 8th comparison;
  1311. * the 256th check will be made at strstart + 258.
  1312. */
  1313. do {
  1314. } while (*++scan == *++match && *++scan == *++match &&
  1315. *++scan == *++match && *++scan == *++match &&
  1316. *++scan == *++match && *++scan == *++match &&
  1317. *++scan == *++match && *++scan == *++match &&
  1318. scan < strend);
  1319. Assert(scan <= s->window + (unsigned)(s->window_size - 1),
  1320. "wild scan");
  1321. len = MAX_MATCH - (int)(strend - scan);
  /* rewind scan to the start of the current string for the next candidate */
  1322. scan = strend - MAX_MATCH;
  1323. #endif /* UNALIGNED_OK */
  /* new best: record it, stop if it is long enough, otherwise refresh the
   * cached bytes used by the quick rejection test */
  1324. if (len > best_len) {
  1325. s->match_start = cur_match;
  1326. best_len = len;
  1327. if (len >= nice_match) break;
  1328. #ifdef UNALIGNED_OK
  1329. scan_end = *(ushf*)(scan + best_len - 1);
  1330. #else
  1331. scan_end1 = scan[best_len - 1];
  1332. scan_end = scan[best_len];
  1333. #endif
  1334. }
  /* follow the chain to the previous position with the same hash until it
   * falls to limit or below, or the chain budget is used up */
  1335. } while ((cur_match = prev[cur_match & wmask]) > limit
  1336. && --chain_length != 0);
  /* never report more than the available lookahead */
  1337. if ((uInt)best_len <= s->lookahead) return (uInt)best_len;
  1338. return s->lookahead;
  1339. }
  1340. #else /* FASTEST */
  1341. /* ---------------------------------------------------------------------------
  1342. * Optimized version for FASTEST only
  1343. */
  1344. local uInt longest_match(deflate_state *s, IPos cur_match) {
  1345. register Bytef *scan = s->window + s->strstart; /* current string */
  1346. register Bytef *match; /* matched string */
  1347. register int len; /* length of current match */
  1348. register Bytef *strend = s->window + s->strstart + MAX_MATCH;
  1349. /* The code is optimized for HASH_BITS >= 8 and MAX_MATCH-2 multiple of 16.
  1350. * It is easy to get rid of this optimization if necessary.
  1351. */
  1352. Assert(s->hash_bits >= 8 && MAX_MATCH == 258, "Code too clever");
  1353. Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
  1354. "need lookahead");
  1355. Assert(cur_match < s->strstart, "no future");
  1356. match = s->window + cur_match;
  1357. /* Return failure if the match length is less than 2:
  1358. */
  1359. if (match[0] != scan[0] || match[1] != scan[1]) return MIN_MATCH-1;
  1360. /* The check at best_len - 1 can be removed because it will be made
  1361. * again later. (This heuristic is not always a win.)
  1362. * It is not necessary to compare scan[2] and match[2] since they
  1363. * are always equal when the other bytes match, given that
  1364. * the hash keys are equal and that HASH_BITS >= 8.
  1365. */
  1366. scan += 2, match += 2;
  1367. Assert(*scan == *match, "match[2]?");
  1368. /* We check for insufficient lookahead only every 8th comparison;
  1369. * the 256th check will be made at strstart + 258.
  1370. */
  1371. do {
  1372. } while (*++scan == *++match && *++scan == *++match &&
  1373. *++scan == *++match && *++scan == *++match &&
  1374. *++scan == *++match && *++scan == *++match &&
  1375. *++scan == *++match && *++scan == *++match &&
  1376. scan < strend);
  1377. Assert(scan <= s->window + (unsigned)(s->window_size - 1), "wild scan");
  1378. len = MAX_MATCH - (int)(strend - scan);
  1379. if (len < MIN_MATCH) return MIN_MATCH - 1;
  1380. s->match_start = cur_match;
  1381. return (uInt)len <= s->lookahead ? (uInt)len : s->lookahead;
  1382. }
  1383. #endif /* FASTEST */
  #ifdef ZLIB_DEBUG

  /* Value zmemcmp() is compared against to detect equal strings. */
  #define EQUAL 0

  /* ===========================================================================
   * Debug check that the `length` bytes at window offset `match` are the same
   * as the `length` bytes at window offset `start`. On a mismatch the
   * offsets and the differing byte pairs are written to stderr and z_error()
   * is called. When z_verbose > 1 the match is also traced to stderr.
   */
  local void check_match(deflate_state *s, IPos start, IPos match, int length) {
      Bytef *earlier = s->window + (int)match;
      Bytef *current = s->window + start;
      IPos count = length;

      if (match == (IPos)-1) {
          /* The match begins one byte before the window, so only the
             following length-1 bytes can be compared. */
          earlier++;
          current++;
          count--;
      }

      if (zmemcmp(earlier, current, count) != EQUAL) {
          fprintf(stderr, " start %u, match %d, length %d\n",
                  start, (int)match, length);
          do {
              fprintf(stderr, "(%02x %02x)", *earlier++, *current++);
          } while (--count != 0);
          z_error("invalid match");
      }

      if (z_verbose > 1) {
          fprintf(stderr,"\\[%d,%d]", start - match, length);
          do {
              putc(s->window[start++], stderr);
          } while (--length != 0);
      }
  }

  #else

  /* Without ZLIB_DEBUG the check expands to nothing; arguments are not
   * evaluated.
   */
  #  define check_match(s, start, match, length)

  #endif /* ZLIB_DEBUG */
  /* ===========================================================================
   * Flush the current block, with given end-of-file flag.
   * IN assertion: strstart is set to the end of the current match.
   *
   * FLUSH_BLOCK_ONLY(s, last) passes the bytes from s->block_start up to
   * s->strstart to _tr_flush_block() (a null buffer pointer is passed when
   * block_start is negative), moves block_start up to strstart and calls
   * flush_pending() on the stream.
   *
   * The macro expands to a single do { ... } while (0) statement so that a
   * call followed by a semicolon can be used as the body of an unbraced
   * if/else without detaching the else.
   */
  #define FLUSH_BLOCK_ONLY(s, last) do { \
      _tr_flush_block(s, ((s)->block_start >= 0L ? \
                     (charf *)&(s)->window[(unsigned)(s)->block_start] : \
                     (charf *)Z_NULL), \
                  (ulg)((long)(s)->strstart - (s)->block_start), \
                  (last)); \
      (s)->block_start = (s)->strstart; \
      flush_pending((s)->strm); \
      Tracev((stderr,"[FLUSH]")); \
  } while (0)

  /* Same but force premature exit if necessary: when no output space is left
   * after the flush, the ENCLOSING function returns finish_started (if last
   * is nonzero) or need_more.
   */
  #define FLUSH_BLOCK(s, last) do { \
      FLUSH_BLOCK_ONLY(s, last); \
      if ((s)->strm->avail_out == 0) \
          return (last) ? finish_started : need_more; \
  } while (0)
  /* Largest payload a single deflate stored block can carry (header bytes
   * are not counted).
   */
  #define MAX_STORED 65535

  /* Smaller of a and b. Each argument can be evaluated more than once, so do
   * not pass expressions with side effects.
   */
  #define MIN(a, b) ((b) < (a) ? (b) : (a))
  1440. /* ===========================================================================
  1441. * Copy without compression as much as possible from the input stream, return
  1442. * the current block state.
  1443. *
  1444. * In case deflateParams() is used to later switch to a non-zero compression
  1445. * level, s->matches (otherwise unused when storing) keeps track of the number
  1446. * of hash table slides to perform. If s->matches is 1, then one hash table
  1447. * slide will be done when switching. If s->matches is 2, the maximum value
  1448. * allowed here, then the hash table will be cleared, since two or more slides
  1449. * is the same as a clear.
  1450. *
  1451. * deflate_stored() is written to minimize the number of times an input byte is
  1452. * copied. It is most efficient with large input and output buffers, which
  1453. * maximizes the opportunities to have a single copy from next_in to next_out.
  1454. */
  1455. local block_state deflate_stored(deflate_state *s, int flush) {
  1456. /* Smallest worthy block size when not flushing or finishing. By default
  1457. * this is 32K. This can be as small as 507 bytes for memLevel == 1. For
  1458. * large input and output buffers, the stored block size will be larger.
  1459. */
  1460. unsigned min_block = MIN(s->pending_buf_size - 5, s->w_size);
  1461. /* Copy as many min_block or larger stored blocks directly to next_out as
  1462. * possible. If flushing, copy the remaining available input to next_out as
  1463. * stored blocks, if there is enough space.
  1464. */
  1465. unsigned len, left, have, last = 0;
  1466. unsigned used = s->strm->avail_in;
  1467. do {
  1468. /* Set len to the maximum size block that we can copy directly with the
  1469. * available input data and output space. Set left to how much of that
  1470. * would be copied from what's left in the window.
  1471. */
  1472. len = MAX_STORED; /* maximum deflate stored block length */
  1473. have = (s->bi_valid + 42) >> 3; /* number of header bytes */
  1474. if (s->strm->avail_out < have) /* need room for header */
  1475. break;
  1476. /* maximum stored block length that will fit in avail_out: */
  1477. have = s->strm->avail_out - have;
  1478. left = s->strstart - s->block_start; /* bytes left in window */
  1479. if (len > (ulg)left + s->strm->avail_in)
  1480. len = left + s->strm->avail_in; /* limit len to the input */
  1481. if (len > have)
  1482. len = have; /* limit len to the output */
  1483. /* If the stored block would be less than min_block in length, or if
  1484. * unable to copy all of the available input when flushing, then try
  1485. * copying to the window and the pending buffer instead. Also don't
  1486. * write an empty block when flushing -- deflate() does that.
  1487. */
  1488. if (len < min_block && ((len == 0 && flush != Z_FINISH) ||
  1489. flush == Z_NO_FLUSH ||
  1490. len != left + s->strm->avail_in))
  1491. break;
  1492. /* Make a dummy stored block in pending to get the header bytes,
  1493. * including any pending bits. This also updates the debugging counts.
  1494. */
  1495. last = flush == Z_FINISH && len == left + s->strm->avail_in ? 1 : 0;
  1496. _tr_stored_block(s, (char *)0, 0L, last);
  1497. /* Replace the lengths in the dummy stored block with len. */
  1498. s->pending_buf[s->pending - 4] = len;
  1499. s->pending_buf[s->pending - 3] = len >> 8;
  1500. s->pending_buf[s->pending - 2] = ~len;
  1501. s->pending_buf[s->pending - 1] = ~len >> 8;
  1502. /* Write the stored block header bytes. */
  1503. flush_pending(s->strm);
  1504. #ifdef ZLIB_DEBUG
  1505. /* Update debugging counts for the data about to be copied. */
  1506. s->compressed_len += len << 3;
  1507. s->bits_sent += len << 3;
  1508. #endif
  1509. /* Copy uncompressed bytes from the window to next_out. */
  1510. if (left) {
  1511. if (left > len)
  1512. left = len;
  1513. zmemcpy(s->strm->next_out, s->window + s->block_start, left);
  1514. s->strm->next_out += left;
  1515. s->strm->avail_out -= left;
  1516. s->strm->total_out += left;
  1517. s->block_start += left;
  1518. len -= left;
  1519. }
  1520. /* Copy uncompressed bytes directly from next_in to next_out, updating
  1521. * the check value.
  1522. */
  1523. if (len) {
  1524. read_buf(s->strm, s->strm->next_out, len);
  1525. s->strm->next_out += len;
  1526. s->strm->avail_out -= len;
  1527. s->strm->total_out += len;
  1528. }
  1529. } while (last == 0);
  1530. /* Update the sliding window with the last s->w_size bytes of the copied
  1531. * data, or append all of the copied data to the existing window if less
  1532. * than s->w_size bytes were copied. Also update the number of bytes to
  1533. * insert in the hash tables, in the event that deflateParams() switches to
  1534. * a non-zero compression level.
  1535. */
  1536. used -= s->strm->avail_in; /* number of input bytes directly copied */
  1537. if (used) {
  1538. /* If any input was used, then no unused input remains in the window,
  1539. * therefore s->block_start == s->strstart.
  1540. */
  1541. if (used >= s->w_size) { /* supplant the previous history */
  1542. s->matches = 2; /* clear hash */
  1543. zmemcpy(s->window, s->strm->next_in - s->w_size, s->w_size);
  1544. s->strstart = s->w_size;
  1545. s->insert = s->strstart;
  1546. }
  1547. else {
  1548. if (s->window_size - s->strstart <= used) {
  1549. /* Slide the window down. */
  1550. s->strstart -= s->w_size;
  1551. zmemcpy(s->window, s->window + s->w_size, s->strstart);
  1552. if (s->matches < 2)
  1553. s->matches++; /* add a pending slide_hash() */
  1554. if (s->insert > s->strstart)
  1555. s->insert = s->strstart;
  1556. }
  1557. zmemcpy(s->window + s->strstart, s->strm->next_in - used, used);
  1558. s->strstart += used;
  1559. s->insert += MIN(used, s->w_size - s->insert);
  1560. }
  1561. s->block_start = s->strstart;
  1562. }
  1563. if (s->high_water < s->strstart)
  1564. s->high_water = s->strstart;
  1565. /* If the last block was written to next_out, then done. */
  1566. if (last)
  1567. return finish_done;
  1568. /* If flushing and all input has been consumed, then done. */
  1569. if (flush != Z_NO_FLUSH && flush != Z_FINISH &&
  1570. s->strm->avail_in == 0 && (long)s->strstart == s->block_start)
  1571. return block_done;
  1572. /* Fill the window with any remaining input. */
  1573. have = s->window_size - s->strstart;
  1574. if (s->strm->avail_in > have && s->block_start >= (long)s->w_size) {
  1575. /* Slide the window down. */
  1576. s->block_start -= s->w_size;
  1577. s->strstart -= s->w_size;
  1578. zmemcpy(s->window, s->window + s->w_size, s->strstart);
  1579. if (s->matches < 2)
  1580. s->matches++; /* add a pending slide_hash() */
  1581. have += s->w_size; /* more space now */
  1582. if (s->insert > s->strstart)
  1583. s->insert = s->strstart;
  1584. }
  1585. if (have > s->strm->avail_in)
  1586. have = s->strm->avail_in;
  1587. if (have) {
  1588. read_buf(s->strm, s->window + s->strstart, have);
  1589. s->strstart += have;
  1590. s->insert += MIN(have, s->w_size - s->insert);
  1591. }
  1592. if (s->high_water < s->strstart)
  1593. s->high_water = s->strstart;
  1594. /* There was not enough avail_out to write a complete worthy or flushed
  1595. * stored block to next_out. Write a stored block to pending instead, if we
  1596. * have enough input for a worthy block, or if flushing and there is enough
  1597. * room for the remaining input as a stored block in the pending buffer.
  1598. */
  1599. have = (s->bi_valid + 42) >> 3; /* number of header bytes */
  1600. /* maximum stored block length that will fit in pending: */
  1601. have = MIN(s->pending_buf_size - have, MAX_STORED);
  1602. min_block = MIN(have, s->w_size);
  1603. left = s->strstart - s->block_start;
  1604. if (left >= min_block ||
  1605. ((left || flush == Z_FINISH) && flush != Z_NO_FLUSH &&
  1606. s->strm->avail_in == 0 && left <= have)) {
  1607. len = MIN(left, have);
  1608. last = flush == Z_FINISH && s->strm->avail_in == 0 &&
  1609. len == left ? 1 : 0;
  1610. _tr_stored_block(s, (charf *)s->window + s->block_start, len, last);
  1611. s->block_start += len;
  1612. flush_pending(s->strm);
  1613. }
  1614. /* We've done all we can with the available input and output. */
  1615. return last ? finish_started : need_more;
  1616. }
  1617. /* ===========================================================================
  1618. * Compress as much as possible from the input stream, return the current
  1619. * block state.
  1620. * This function does not perform lazy evaluation of matches and inserts
  1621. * new strings in the dictionary only for unmatched strings or for short
  1622. * matches. It is used only for the fast compression options.
  1623. */
  1624. local block_state deflate_fast(deflate_state *s, int flush) {
  1625. IPos hash_head; /* head of the hash chain */
  1626. int bflush; /* set if current block must be flushed */
  1627. for (;;) {
  1628. /* Make sure that we always have enough lookahead, except
  1629. * at the end of the input file. We need MAX_MATCH bytes
  1630. * for the next match, plus MIN_MATCH bytes to insert the
  1631. * string following the next match.
  1632. */
  1633. if (s->lookahead < MIN_LOOKAHEAD) {
  1634. fill_window(s);
  1635. if (s->lookahead < MIN_LOOKAHEAD && flush == Z_NO_FLUSH) {
  1636. return need_more;
  1637. }
  1638. if (s->lookahead == 0) break; /* flush the current block */
  1639. }
  1640. /* Insert the string window[strstart .. strstart + 2] in the
  1641. * dictionary, and set hash_head to the head of the hash chain:
  1642. */
  1643. hash_head = NIL;
  1644. if (s->lookahead >= MIN_MATCH) {
  1645. INSERT_STRING(s, s->strstart, hash_head);
  1646. }
  1647. /* Find the longest match, discarding those <= prev_length.
  1648. * At this point we have always match_length < MIN_MATCH
  1649. */
  1650. if (hash_head != NIL && s->strstart - hash_head <= MAX_DIST(s)) {
  1651. /* To simplify the code, we prevent matches with the string
  1652. * of window index 0 (in particular we have to avoid a match
  1653. * of the string with itself at the start of the input file).
  1654. */
  1655. s->match_length = longest_match (s, hash_head);
  1656. /* longest_match() sets match_start */
  1657. }
  1658. if (s->match_length >= MIN_MATCH) {
  1659. check_match(s, s->strstart, s->match_start, s->match_length);
  1660. _tr_tally_dist(s, s->strstart - s->match_start,
  1661. s->match_length - MIN_MATCH, bflush);
  1662. s->lookahead -= s->match_length;
  1663. /* Insert new strings in the hash table only if the match length
  1664. * is not too large. This saves time but degrades compression.
  1665. */
  1666. #ifndef FASTEST
  1667. if (s->match_length <= s->max_insert_length &&
  1668. s->lookahead >= MIN_MATCH) {
  1669. s->match_length--; /* string at strstart already in table */
  1670. do {
  1671. s->strstart++;
  1672. INSERT_STRING(s, s->strstart, hash_head);
  1673. /* strstart never exceeds WSIZE-MAX_MATCH, so there are
  1674. * always MIN_MATCH bytes ahead.
  1675. */
  1676. } while (--s->match_length != 0);
  1677. s->strstart++;
  1678. } else
  1679. #endif
  1680. {
  1681. s->strstart += s->match_length;
  1682. s->match_length = 0;
  1683. s->ins_h = s->window[s->strstart];
  1684. UPDATE_HASH(s, s->ins_h, s->window[s->strstart + 1]);
  1685. #if MIN_MATCH != 3
  1686. Call UPDATE_HASH() MIN_MATCH-3 more times
  1687. #endif
  1688. /* If lookahead < MIN_MATCH, ins_h is garbage, but it does not
  1689. * matter since it will be recomputed at next deflate call.
  1690. */
  1691. }
  1692. } else {
  1693. /* No match, output a literal byte */
  1694. Tracevv((stderr,"%c", s->window[s->strstart]));
  1695. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1696. s->lookahead--;
  1697. s->strstart++;
  1698. }
  1699. if (bflush) FLUSH_BLOCK(s, 0);
  1700. }
  1701. s->insert = s->strstart < MIN_MATCH-1 ? s->strstart : MIN_MATCH-1;
  1702. if (flush == Z_FINISH) {
  1703. FLUSH_BLOCK(s, 1);
  1704. return finish_done;
  1705. }
  1706. if (s->sym_next)
  1707. FLUSH_BLOCK(s, 0);
  1708. return block_done;
  1709. }
  1710. #ifndef FASTEST
  1711. /* ===========================================================================
  1712. * Same as above, but achieves better compression. We use a lazy
  1713. * evaluation for matches: a match is finally adopted only if there is
  1714. * no better match at the next window position.
  1715. */
  1716. local block_state deflate_slow(deflate_state *s, int flush) {
  1717. IPos hash_head; /* head of hash chain */
  1718. int bflush; /* set if current block must be flushed */
  1719. /* Process the input block. */
  1720. for (;;) {
  1721. /* Make sure that we always have enough lookahead, except
  1722. * at the end of the input file. We need MAX_MATCH bytes
  1723. * for the next match, plus MIN_MATCH bytes to insert the
  1724. * string following the next match.
  1725. */
  1726. if (s->lookahead < MIN_LOOKAHEAD) {
  1727. fill_window(s);
  1728. if (s->lookahead < MIN_LOOKAHEAD && flush == Z_NO_FLUSH) {
  1729. return need_more;
  1730. }
  1731. if (s->lookahead == 0) break; /* flush the current block */
  1732. }
  1733. /* Insert the string window[strstart .. strstart + 2] in the
  1734. * dictionary, and set hash_head to the head of the hash chain:
  1735. */
  1736. hash_head = NIL;
  1737. if (s->lookahead >= MIN_MATCH) {
  1738. INSERT_STRING(s, s->strstart, hash_head);
  1739. }
  1740. /* Find the longest match, discarding those <= prev_length.
  1741. */
  1742. s->prev_length = s->match_length, s->prev_match = s->match_start;
  1743. s->match_length = MIN_MATCH-1;
  1744. if (hash_head != NIL && s->prev_length < s->max_lazy_match &&
  1745. s->strstart - hash_head <= MAX_DIST(s)) {
  1746. /* To simplify the code, we prevent matches with the string
  1747. * of window index 0 (in particular we have to avoid a match
  1748. * of the string with itself at the start of the input file).
  1749. */
  1750. s->match_length = longest_match (s, hash_head);
  1751. /* longest_match() sets match_start */
  1752. if (s->match_length <= 5 && (s->strategy == Z_FILTERED
  1753. #if TOO_FAR <= 32767
  1754. || (s->match_length == MIN_MATCH &&
  1755. s->strstart - s->match_start > TOO_FAR)
  1756. #endif
  1757. )) {
  1758. /* If prev_match is also MIN_MATCH, match_start is garbage
  1759. * but we will ignore the current match anyway.
  1760. */
  1761. s->match_length = MIN_MATCH-1;
  1762. }
  1763. }
  1764. /* If there was a match at the previous step and the current
  1765. * match is not better, output the previous match:
  1766. */
  1767. if (s->prev_length >= MIN_MATCH && s->match_length <= s->prev_length) {
  1768. uInt max_insert = s->strstart + s->lookahead - MIN_MATCH;
  1769. /* Do not insert strings in hash table beyond this. */
  1770. check_match(s, s->strstart - 1, s->prev_match, s->prev_length);
  1771. _tr_tally_dist(s, s->strstart - 1 - s->prev_match,
  1772. s->prev_length - MIN_MATCH, bflush);
  1773. /* Insert in hash table all strings up to the end of the match.
  1774. * strstart - 1 and strstart are already inserted. If there is not
  1775. * enough lookahead, the last two strings are not inserted in
  1776. * the hash table.
  1777. */
  1778. s->lookahead -= s->prev_length - 1;
  1779. s->prev_length -= 2;
  1780. do {
  1781. if (++s->strstart <= max_insert) {
  1782. INSERT_STRING(s, s->strstart, hash_head);
  1783. }
  1784. } while (--s->prev_length != 0);
  1785. s->match_available = 0;
  1786. s->match_length = MIN_MATCH-1;
  1787. s->strstart++;
  1788. if (bflush) FLUSH_BLOCK(s, 0);
  1789. } else if (s->match_available) {
  1790. /* If there was no match at the previous position, output a
  1791. * single literal. If there was a match but the current match
  1792. * is longer, truncate the previous match to a single literal.
  1793. */
  1794. Tracevv((stderr,"%c", s->window[s->strstart - 1]));
  1795. _tr_tally_lit(s, s->window[s->strstart - 1], bflush);
  1796. if (bflush) {
  1797. FLUSH_BLOCK_ONLY(s, 0);
  1798. }
  1799. s->strstart++;
  1800. s->lookahead--;
  1801. if (s->strm->avail_out == 0) return need_more;
  1802. } else {
  1803. /* There is no previous match to compare with, wait for
  1804. * the next step to decide.
  1805. */
  1806. s->match_available = 1;
  1807. s->strstart++;
  1808. s->lookahead--;
  1809. }
  1810. }
  1811. Assert (flush != Z_NO_FLUSH, "no flush?");
  1812. if (s->match_available) {
  1813. Tracevv((stderr,"%c", s->window[s->strstart - 1]));
  1814. _tr_tally_lit(s, s->window[s->strstart - 1], bflush);
  1815. s->match_available = 0;
  1816. }
  1817. s->insert = s->strstart < MIN_MATCH-1 ? s->strstart : MIN_MATCH-1;
  1818. if (flush == Z_FINISH) {
  1819. FLUSH_BLOCK(s, 1);
  1820. return finish_done;
  1821. }
  1822. if (s->sym_next)
  1823. FLUSH_BLOCK(s, 0);
  1824. return block_done;
  1825. }
  1826. #endif /* FASTEST */
  1827. /* ===========================================================================
  1828. * For Z_RLE, simply look for runs of bytes, generate matches only of distance
  1829. * one. Do not maintain a hash table. (It will be regenerated if this run of
  1830. * deflate switches away from Z_RLE.)
  1831. */
  1832. local block_state deflate_rle(deflate_state *s, int flush) {
  1833. int bflush; /* set if current block must be flushed */
  1834. uInt prev; /* byte at distance one to match */
  1835. Bytef *scan, *strend; /* scan goes up to strend for length of run */
  1836. for (;;) {
  1837. /* Make sure that we always have enough lookahead, except
  1838. * at the end of the input file. We need MAX_MATCH bytes
  1839. * for the longest run, plus one for the unrolled loop.
  1840. */
  1841. if (s->lookahead <= MAX_MATCH) {
  1842. fill_window(s);
  1843. if (s->lookahead <= MAX_MATCH && flush == Z_NO_FLUSH) {
  1844. return need_more;
  1845. }
  1846. if (s->lookahead == 0) break; /* flush the current block */
  1847. }
  1848. /* See how many times the previous byte repeats */
  1849. s->match_length = 0;
  1850. if (s->lookahead >= MIN_MATCH && s->strstart > 0) {
  1851. scan = s->window + s->strstart - 1;
  1852. prev = *scan;
  1853. if (prev == *++scan && prev == *++scan && prev == *++scan) {
  1854. strend = s->window + s->strstart + MAX_MATCH;
  1855. do {
  1856. } while (prev == *++scan && prev == *++scan &&
  1857. prev == *++scan && prev == *++scan &&
  1858. prev == *++scan && prev == *++scan &&
  1859. prev == *++scan && prev == *++scan &&
  1860. scan < strend);
  1861. s->match_length = MAX_MATCH - (uInt)(strend - scan);
  1862. if (s->match_length > s->lookahead)
  1863. s->match_length = s->lookahead;
  1864. }
  1865. Assert(scan <= s->window + (uInt)(s->window_size - 1),
  1866. "wild scan");
  1867. }
  1868. /* Emit match if have run of MIN_MATCH or longer, else emit literal */
  1869. if (s->match_length >= MIN_MATCH) {
  1870. check_match(s, s->strstart, s->strstart - 1, s->match_length);
  1871. _tr_tally_dist(s, 1, s->match_length - MIN_MATCH, bflush);
  1872. s->lookahead -= s->match_length;
  1873. s->strstart += s->match_length;
  1874. s->match_length = 0;
  1875. } else {
  1876. /* No match, output a literal byte */
  1877. Tracevv((stderr,"%c", s->window[s->strstart]));
  1878. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1879. s->lookahead--;
  1880. s->strstart++;
  1881. }
  1882. if (bflush) FLUSH_BLOCK(s, 0);
  1883. }
  1884. s->insert = 0;
  1885. if (flush == Z_FINISH) {
  1886. FLUSH_BLOCK(s, 1);
  1887. return finish_done;
  1888. }
  1889. if (s->sym_next)
  1890. FLUSH_BLOCK(s, 0);
  1891. return block_done;
  1892. }
  1893. /* ===========================================================================
  1894. * For Z_HUFFMAN_ONLY, do not look for matches. Do not maintain a hash table.
  1895. * (It will be regenerated if this run of deflate switches away from Huffman.)
  1896. */
  1897. local block_state deflate_huff(deflate_state *s, int flush) {
  1898. int bflush; /* set if current block must be flushed */
  1899. for (;;) {
  1900. /* Make sure that we have a literal to write. */
  1901. if (s->lookahead == 0) {
  1902. fill_window(s);
  1903. if (s->lookahead == 0) {
  1904. if (flush == Z_NO_FLUSH)
  1905. return need_more;
  1906. break; /* flush the current block */
  1907. }
  1908. }
  1909. /* Output a literal byte */
  1910. s->match_length = 0;
  1911. Tracevv((stderr,"%c", s->window[s->strstart]));
  1912. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1913. s->lookahead--;
  1914. s->strstart++;
  1915. if (bflush) FLUSH_BLOCK(s, 0);
  1916. }
  1917. s->insert = 0;
  1918. if (flush == Z_FINISH) {
  1919. FLUSH_BLOCK(s, 1);
  1920. return finish_done;
  1921. }
  1922. if (s->sym_next)
  1923. FLUSH_BLOCK(s, 0);
  1924. return block_done;
  1925. }