deflate.c 80 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152
  1. /* deflate.c -- compress data using the deflation algorithm
  2. * Copyright (C) 1995-2024 Jean-loup Gailly and Mark Adler
  3. * For conditions of distribution and use, see copyright notice in zlib.h
  4. */
  5. /*
  6. * ALGORITHM
  7. *
  8. * The "deflation" process depends on being able to identify portions
  9. * of the input text which are identical to earlier input (within a
  10. * sliding window trailing behind the input currently being processed).
  11. *
  12. * The most straightforward technique turns out to be the fastest for
  13. * most input files: try all possible matches and select the longest.
  14. * The key feature of this algorithm is that insertions into the string
  15. * dictionary are very simple and thus fast, and deletions are avoided
  16. * completely. Insertions are performed at each input character, whereas
  17. * string matches are performed only when the previous match ends. So it
  18. * is preferable to spend more time in matches to allow very fast string
  19. * insertions and avoid deletions. The matching algorithm for small
  20. * strings is inspired from that of Rabin & Karp. A brute force approach
  21. * is used to find longer strings when a small match has been found.
  22. * A similar algorithm is used in comic (by Jan-Mark Wams) and freeze
  23. * (by Leonid Broukhis).
  24. * A previous version of this file used a more sophisticated algorithm
  25. * (by Fiala and Greene) which is guaranteed to run in linear amortized
  26. * time, but has a larger average cost, uses more memory and is patented.
  27. * However the F&G algorithm may be faster for some highly redundant
  28. * files if the parameter max_chain_length (described below) is too large.
  29. *
  30. * ACKNOWLEDGEMENTS
  31. *
  32. * The idea of lazy evaluation of matches is due to Jan-Mark Wams, and
  33. * I found it in 'freeze' written by Leonid Broukhis.
  34. * Thanks to many people for bug reports and testing.
  35. *
  36. * REFERENCES
  37. *
  38. * Deutsch, L.P.,"DEFLATE Compressed Data Format Specification".
  39. * Available in http://tools.ietf.org/html/rfc1951
  40. *
  41. * A description of the Rabin and Karp algorithm is given in the book
  42. * "Algorithms" by R. Sedgewick, Addison-Wesley, p252.
  43. *
  44. * Fiala,E.R., and Greene,D.H.
  45. * Data Compression with Finite Windows, Comm.ACM, 32,4 (1989) 490-595
  46. *
  47. */
  48. /* @(#) $Id$ */
  49. #include "deflate.h"
  50. const char deflate_copyright[] =
  51. " deflate 1.3.1.1 Copyright 1995-2024 Jean-loup Gailly and Mark Adler ";
  52. /*
  53. If you use the zlib library in a product, an acknowledgment is welcome
  54. in the documentation of your product. If for some reason you cannot
  55. include such an acknowledgment, I would appreciate that you keep this
  56. copyright string in the executable of your product.
  57. */
  58. typedef enum {
  59. need_more, /* block not completed, need more input or more output */
  60. block_done, /* block flush performed */
  61. finish_started, /* finish started, need only more output at next deflate */
  62. finish_done /* finish done, accept no more input or output */
  63. } block_state;
  64. typedef block_state (*compress_func)(deflate_state *s, int flush);
  65. /* Compression function. Returns the block state after the call. */
  66. local block_state deflate_stored(deflate_state *s, int flush);
  67. local block_state deflate_fast(deflate_state *s, int flush);
  68. #ifndef FASTEST
  69. local block_state deflate_slow(deflate_state *s, int flush);
  70. #endif
  71. local block_state deflate_rle(deflate_state *s, int flush);
  72. local block_state deflate_huff(deflate_state *s, int flush);
  73. /* ===========================================================================
  74. * Local data
  75. */
  76. #define NIL 0
  77. /* Tail of hash chains */
  78. #ifndef TOO_FAR
  79. # define TOO_FAR 4096
  80. #endif
  81. /* Matches of length 3 are discarded if their distance exceeds TOO_FAR */
  82. /* Values for max_lazy_match, good_match and max_chain_length, depending on
  83. * the desired pack level (0..9). The values given below have been tuned to
  84. * exclude worst case performance for pathological files. Better values may be
  85. * found for specific files.
  86. */
  87. typedef struct config_s {
  88. ush good_length; /* reduce lazy search above this match length */
  89. ush max_lazy; /* do not perform lazy search above this match length */
  90. ush nice_length; /* quit search above this match length */
  91. ush max_chain;
  92. compress_func func;
  93. } config;
  94. #ifdef FASTEST
  95. local const config configuration_table[2] = {
  96. /* good lazy nice chain */
  97. /* 0 */ {0, 0, 0, 0, deflate_stored}, /* store only */
  98. /* 1 */ {4, 4, 8, 4, deflate_fast}}; /* max speed, no lazy matches */
  99. #else
  100. local const config configuration_table[10] = {
  101. /* good lazy nice chain */
  102. /* 0 */ {0, 0, 0, 0, deflate_stored}, /* store only */
  103. /* 1 */ {4, 4, 8, 4, deflate_fast}, /* max speed, no lazy matches */
  104. /* 2 */ {4, 5, 16, 8, deflate_fast},
  105. /* 3 */ {4, 6, 32, 32, deflate_fast},
  106. /* 4 */ {4, 4, 16, 16, deflate_slow}, /* lazy matches */
  107. /* 5 */ {8, 16, 32, 32, deflate_slow},
  108. /* 6 */ {8, 16, 128, 128, deflate_slow},
  109. /* 7 */ {8, 32, 128, 256, deflate_slow},
  110. /* 8 */ {32, 128, 258, 1024, deflate_slow},
  111. /* 9 */ {32, 258, 258, 4096, deflate_slow}}; /* max compression */
  112. #endif
  113. /* Note: the deflate() code requires max_lazy >= MIN_MATCH and max_chain >= 4
  114. * For deflate_fast() (levels <= 3) good is ignored and lazy has a different
  115. * meaning.
  116. */
  117. /* rank Z_BLOCK between Z_NO_FLUSH and Z_PARTIAL_FLUSH */
  118. #define RANK(f) (((f) * 2) - ((f) > 4 ? 9 : 0))
  119. /* ===========================================================================
  120. * Update a hash value with the given input byte
  121. * IN assertion: all calls to UPDATE_HASH are made with consecutive input
  122. * characters, so that a running hash key can be computed from the previous
  123. * key instead of complete recalculation each time.
  124. */
  125. #define UPDATE_HASH(s,h,c) (h = (((h) << s->hash_shift) ^ (c)) & s->hash_mask)
  126. /* ===========================================================================
  127. * Insert string str in the dictionary and set match_head to the previous head
  128. * of the hash chain (the most recent string with same hash key). Return
  129. * the previous length of the hash chain.
  130. * If this file is compiled with -DFASTEST, the compression level is forced
  131. * to 1, and no hash chains are maintained.
  132. * IN assertion: all calls to INSERT_STRING are made with consecutive input
  133. * characters and the first MIN_MATCH bytes of str are valid (except for
  134. * the last MIN_MATCH-1 bytes of the input file).
  135. */
  136. #ifdef FASTEST
  137. #define INSERT_STRING(s, str, match_head) \
  138. (UPDATE_HASH(s, s->ins_h, s->window[(str) + (MIN_MATCH-1)]), \
  139. match_head = s->head[s->ins_h], \
  140. s->head[s->ins_h] = (Pos)(str))
  141. #else
  142. #define INSERT_STRING(s, str, match_head) \
  143. (UPDATE_HASH(s, s->ins_h, s->window[(str) + (MIN_MATCH-1)]), \
  144. match_head = s->prev[(str) & s->w_mask] = s->head[s->ins_h], \
  145. s->head[s->ins_h] = (Pos)(str))
  146. #endif
  147. /* ===========================================================================
  148. * Initialize the hash table (avoiding 64K overflow for 16 bit systems).
  149. * prev[] will be initialized on the fly.
  150. */
  151. #define CLEAR_HASH(s) \
  152. do { \
  153. s->head[s->hash_size - 1] = NIL; \
  154. zmemzero((Bytef *)s->head, \
  155. (unsigned)(s->hash_size - 1)*sizeof(*s->head)); \
  156. } while (0)
  157. /* ===========================================================================
  158. * Slide the hash table when sliding the window down (could be avoided with 32
  159. * bit values at the expense of memory usage). We slide even when level == 0 to
  160. * keep the hash table consistent if we switch back to level > 0 later.
  161. */
  162. #if defined(__has_feature)
  163. # if __has_feature(memory_sanitizer)
  164. __attribute__((no_sanitize("memory")))
  165. # endif
  166. #endif
  167. local void slide_hash(deflate_state *s) {
  168. unsigned n, m;
  169. Posf *p;
  170. uInt wsize = s->w_size;
  171. n = s->hash_size;
  172. p = &s->head[n];
  173. do {
  174. m = *--p;
  175. *p = (Pos)(m >= wsize ? m - wsize : NIL);
  176. } while (--n);
  177. n = wsize;
  178. #ifndef FASTEST
  179. p = &s->prev[n];
  180. do {
  181. m = *--p;
  182. *p = (Pos)(m >= wsize ? m - wsize : NIL);
  183. /* If n is not on any hash chain, prev[n] is garbage but
  184. * its value will never be used.
  185. */
  186. } while (--n);
  187. #endif
  188. }
  189. /* ===========================================================================
  190. * Read a new buffer from the current input stream, update the adler32
  191. * and total number of bytes read. All deflate() input goes through
  192. * this function so some applications may wish to modify it to avoid
  193. * allocating a large strm->next_in buffer and copying from it.
  194. * (See also flush_pending()).
  195. */
  196. local unsigned read_buf(z_streamp strm, Bytef *buf, unsigned size) {
  197. unsigned len = strm->avail_in;
  198. if (len > size) len = size;
  199. if (len == 0) return 0;
  200. strm->avail_in -= len;
  201. zmemcpy(buf, strm->next_in, len);
  202. if (strm->state->wrap == 1) {
  203. strm->adler = adler32(strm->adler, buf, len);
  204. }
  205. #ifdef GZIP
  206. else if (strm->state->wrap == 2) {
  207. strm->adler = crc32(strm->adler, buf, len);
  208. }
  209. #endif
  210. strm->next_in += len;
  211. strm->total_in += len;
  212. return len;
  213. }
  214. /* ===========================================================================
  215. * Fill the window when the lookahead becomes insufficient.
  216. * Updates strstart and lookahead.
  217. *
  218. * IN assertion: lookahead < MIN_LOOKAHEAD
  219. * OUT assertions: strstart <= window_size-MIN_LOOKAHEAD
  220. * At least one byte has been read, or avail_in == 0; reads are
  221. * performed for at least two bytes (required for the zip translate_eol
  222. * option -- not supported here).
  223. */
  224. local void fill_window(deflate_state *s) {
  225. unsigned n;
  226. unsigned more; /* Amount of free space at the end of the window. */
  227. uInt wsize = s->w_size;
  228. Assert(s->lookahead < MIN_LOOKAHEAD, "already enough lookahead");
  229. do {
  230. more = (unsigned)(s->window_size -(ulg)s->lookahead -(ulg)s->strstart);
  231. /* Deal with !@#$% 64K limit: */
  232. if (sizeof(int) <= 2) {
  233. if (more == 0 && s->strstart == 0 && s->lookahead == 0) {
  234. more = wsize;
  235. } else if (more == (unsigned)(-1)) {
  236. /* Very unlikely, but possible on 16 bit machine if
  237. * strstart == 0 && lookahead == 1 (input done a byte at time)
  238. */
  239. more--;
  240. }
  241. }
  242. /* If the window is almost full and there is insufficient lookahead,
  243. * move the upper half to the lower one to make room in the upper half.
  244. */
  245. if (s->strstart >= wsize + MAX_DIST(s)) {
  246. zmemcpy(s->window, s->window + wsize, (unsigned)wsize - more);
  247. s->match_start -= wsize;
  248. s->strstart -= wsize; /* we now have strstart >= MAX_DIST */
  249. s->block_start -= (long) wsize;
  250. if (s->insert > s->strstart)
  251. s->insert = s->strstart;
  252. slide_hash(s);
  253. more += wsize;
  254. }
  255. if (s->strm->avail_in == 0) break;
  256. /* If there was no sliding:
  257. * strstart <= WSIZE+MAX_DIST-1 && lookahead <= MIN_LOOKAHEAD - 1 &&
  258. * more == window_size - lookahead - strstart
  259. * => more >= window_size - (MIN_LOOKAHEAD-1 + WSIZE + MAX_DIST-1)
  260. * => more >= window_size - 2*WSIZE + 2
  261. * In the BIG_MEM or MMAP case (not yet supported),
  262. * window_size == input_size + MIN_LOOKAHEAD &&
  263. * strstart + s->lookahead <= input_size => more >= MIN_LOOKAHEAD.
  264. * Otherwise, window_size == 2*WSIZE so more >= 2.
  265. * If there was sliding, more >= WSIZE. So in all cases, more >= 2.
  266. */
  267. Assert(more >= 2, "more < 2");
  268. n = read_buf(s->strm, s->window + s->strstart + s->lookahead, more);
  269. s->lookahead += n;
  270. /* Initialize the hash value now that we have some input: */
  271. if (s->lookahead + s->insert >= MIN_MATCH) {
  272. uInt str = s->strstart - s->insert;
  273. s->ins_h = s->window[str];
  274. UPDATE_HASH(s, s->ins_h, s->window[str + 1]);
  275. #if MIN_MATCH != 3
  276. Call UPDATE_HASH() MIN_MATCH-3 more times
  277. #endif
  278. while (s->insert) {
  279. UPDATE_HASH(s, s->ins_h, s->window[str + MIN_MATCH-1]);
  280. #ifndef FASTEST
  281. s->prev[str & s->w_mask] = s->head[s->ins_h];
  282. #endif
  283. s->head[s->ins_h] = (Pos)str;
  284. str++;
  285. s->insert--;
  286. if (s->lookahead + s->insert < MIN_MATCH)
  287. break;
  288. }
  289. }
  290. /* If the whole input has less than MIN_MATCH bytes, ins_h is garbage,
  291. * but this is not important since only literal bytes will be emitted.
  292. */
  293. } while (s->lookahead < MIN_LOOKAHEAD && s->strm->avail_in != 0);
  294. /* If the WIN_INIT bytes after the end of the current data have never been
  295. * written, then zero those bytes in order to avoid memory check reports of
  296. * the use of uninitialized (or uninitialised as Julian writes) bytes by
  297. * the longest match routines. Update the high water mark for the next
  298. * time through here. WIN_INIT is set to MAX_MATCH since the longest match
  299. * routines allow scanning to strstart + MAX_MATCH, ignoring lookahead.
  300. */
  301. if (s->high_water < s->window_size) {
  302. ulg curr = s->strstart + (ulg)(s->lookahead);
  303. ulg init;
  304. if (s->high_water < curr) {
  305. /* Previous high water mark below current data -- zero WIN_INIT
  306. * bytes or up to end of window, whichever is less.
  307. */
  308. init = s->window_size - curr;
  309. if (init > WIN_INIT)
  310. init = WIN_INIT;
  311. zmemzero(s->window + curr, (unsigned)init);
  312. s->high_water = curr + init;
  313. }
  314. else if (s->high_water < (ulg)curr + WIN_INIT) {
  315. /* High water mark at or above current data, but below current data
  316. * plus WIN_INIT -- zero out to current data plus WIN_INIT, or up
  317. * to end of window, whichever is less.
  318. */
  319. init = (ulg)curr + WIN_INIT - s->high_water;
  320. if (init > s->window_size - s->high_water)
  321. init = s->window_size - s->high_water;
  322. zmemzero(s->window + s->high_water, (unsigned)init);
  323. s->high_water += init;
  324. }
  325. }
  326. Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
  327. "not enough room for search");
  328. }
  329. /* ========================================================================= */
  330. int ZEXPORT deflateInit_(z_streamp strm, int level, const char *version,
  331. int stream_size) {
  332. return deflateInit2_(strm, level, Z_DEFLATED, MAX_WBITS, DEF_MEM_LEVEL,
  333. Z_DEFAULT_STRATEGY, version, stream_size);
  334. /* To do: ignore strm->next_in if we use it as window */
  335. }
  336. /* ========================================================================= */
  337. int ZEXPORT deflateInit2_(z_streamp strm, int level, int method,
  338. int windowBits, int memLevel, int strategy,
  339. const char *version, int stream_size) {
  340. deflate_state *s;
  341. int wrap = 1;
  342. static const char my_version[] = ZLIB_VERSION;
  343. if (version == Z_NULL || version[0] != my_version[0] ||
  344. stream_size != sizeof(z_stream)) {
  345. return Z_VERSION_ERROR;
  346. }
  347. if (strm == Z_NULL) return Z_STREAM_ERROR;
  348. strm->msg = Z_NULL;
  349. if (strm->zalloc == (alloc_func)0) {
  350. #ifdef Z_SOLO
  351. return Z_STREAM_ERROR;
  352. #else
  353. strm->zalloc = zcalloc;
  354. strm->opaque = (voidpf)0;
  355. #endif
  356. }
  357. if (strm->zfree == (free_func)0)
  358. #ifdef Z_SOLO
  359. return Z_STREAM_ERROR;
  360. #else
  361. strm->zfree = zcfree;
  362. #endif
  363. #ifdef FASTEST
  364. if (level != 0) level = 1;
  365. #else
  366. if (level == Z_DEFAULT_COMPRESSION) level = 6;
  367. #endif
  368. if (windowBits < 0) { /* suppress zlib wrapper */
  369. wrap = 0;
  370. if (windowBits < -15)
  371. return Z_STREAM_ERROR;
  372. windowBits = -windowBits;
  373. }
  374. #ifdef GZIP
  375. else if (windowBits > 15) {
  376. wrap = 2; /* write gzip wrapper instead */
  377. windowBits -= 16;
  378. }
  379. #endif
  380. if (memLevel < 1 || memLevel > MAX_MEM_LEVEL || method != Z_DEFLATED ||
  381. windowBits < 8 || windowBits > 15 || level < 0 || level > 9 ||
  382. strategy < 0 || strategy > Z_FIXED || (windowBits == 8 && wrap != 1)) {
  383. return Z_STREAM_ERROR;
  384. }
  385. if (windowBits == 8) windowBits = 9; /* until 256-byte window bug fixed */
  386. s = (deflate_state *) ZALLOC(strm, 1, sizeof(deflate_state));
  387. if (s == Z_NULL) return Z_MEM_ERROR;
  388. strm->state = (struct internal_state FAR *)s;
  389. s->strm = strm;
  390. s->status = INIT_STATE; /* to pass state test in deflateReset() */
  391. s->wrap = wrap;
  392. s->gzhead = Z_NULL;
  393. s->w_bits = (uInt)windowBits;
  394. s->w_size = 1 << s->w_bits;
  395. s->w_mask = s->w_size - 1;
  396. s->hash_bits = (uInt)memLevel + 7;
  397. s->hash_size = 1 << s->hash_bits;
  398. s->hash_mask = s->hash_size - 1;
  399. s->hash_shift = ((s->hash_bits + MIN_MATCH-1) / MIN_MATCH);
  400. s->window = (Bytef *) ZALLOC(strm, s->w_size, 2*sizeof(Byte));
  401. s->prev = (Posf *) ZALLOC(strm, s->w_size, sizeof(Pos));
  402. s->head = (Posf *) ZALLOC(strm, s->hash_size, sizeof(Pos));
  403. s->high_water = 0; /* nothing written to s->window yet */
  404. s->lit_bufsize = 1 << (memLevel + 6); /* 16K elements by default */
  405. /* We overlay pending_buf and sym_buf. This works since the average size
  406. * for length/distance pairs over any compressed block is assured to be 31
  407. * bits or less.
  408. *
  409. * Analysis: The longest fixed codes are a length code of 8 bits plus 5
  410. * extra bits, for lengths 131 to 257. The longest fixed distance codes are
  411. * 5 bits plus 13 extra bits, for distances 16385 to 32768. The longest
  412. * possible fixed-codes length/distance pair is then 31 bits total.
  413. *
  414. * sym_buf starts one-fourth of the way into pending_buf. So there are
  415. * three bytes in sym_buf for every four bytes in pending_buf. Each symbol
  416. * in sym_buf is three bytes -- two for the distance and one for the
  417. * literal/length. As each symbol is consumed, the pointer to the next
  418. * sym_buf value to read moves forward three bytes. From that symbol, up to
  419. * 31 bits are written to pending_buf. The closest the written pending_buf
  420. * bits gets to the next sym_buf symbol to read is just before the last
  421. * code is written. At that time, 31*(n - 2) bits have been written, just
  422. * after 24*(n - 2) bits have been consumed from sym_buf. sym_buf starts at
  423. * 8*n bits into pending_buf. (Note that the symbol buffer fills when n - 1
  424. * symbols are written.) The closest the writing gets to what is unread is
  425. * then n + 14 bits. Here n is lit_bufsize, which is 16384 by default, and
  426. * can range from 128 to 32768.
  427. *
  428. * Therefore, at a minimum, there are 142 bits of space between what is
  429. * written and what is read in the overlain buffers, so the symbols cannot
  430. * be overwritten by the compressed data. That space is actually 139 bits,
  431. * due to the three-bit fixed-code block header.
  432. *
  433. * That covers the case where either Z_FIXED is specified, forcing fixed
  434. * codes, or when the use of fixed codes is chosen, because that choice
  435. * results in a smaller compressed block than dynamic codes. That latter
  436. * condition then assures that the above analysis also covers all dynamic
  437. * blocks. A dynamic-code block will only be chosen to be emitted if it has
  438. * fewer bits than a fixed-code block would for the same set of symbols.
  439. * Therefore its average symbol length is assured to be less than 31. So
  440. * the compressed data for a dynamic block also cannot overwrite the
  441. * symbols from which it is being constructed.
  442. */
  443. s->pending_buf = (uchf *) ZALLOC(strm, s->lit_bufsize, LIT_BUFS);
  444. s->pending_buf_size = (ulg)s->lit_bufsize * 4;
  445. if (s->window == Z_NULL || s->prev == Z_NULL || s->head == Z_NULL ||
  446. s->pending_buf == Z_NULL) {
  447. s->status = FINISH_STATE;
  448. strm->msg = ERR_MSG(Z_MEM_ERROR);
  449. deflateEnd (strm);
  450. return Z_MEM_ERROR;
  451. }
  452. #ifdef LIT_MEM
  453. s->d_buf = (ushf *)(s->pending_buf + (s->lit_bufsize << 1));
  454. s->l_buf = s->pending_buf + (s->lit_bufsize << 2);
  455. s->sym_end = s->lit_bufsize - 1;
  456. #else
  457. s->sym_buf = s->pending_buf + s->lit_bufsize;
  458. s->sym_end = (s->lit_bufsize - 1) * 3;
  459. #endif
  460. /* We avoid equality with lit_bufsize*3 because of wraparound at 64K
  461. * on 16 bit machines and because stored blocks are restricted to
  462. * 64K-1 bytes.
  463. */
  464. s->level = level;
  465. s->strategy = strategy;
  466. s->method = (Byte)method;
  467. return deflateReset(strm);
  468. }
  469. /* =========================================================================
  470. * Check for a valid deflate stream state. Return 0 if ok, 1 if not.
  471. */
  472. local int deflateStateCheck(z_streamp strm) {
  473. deflate_state *s;
  474. if (strm == Z_NULL ||
  475. strm->zalloc == (alloc_func)0 || strm->zfree == (free_func)0)
  476. return 1;
  477. s = strm->state;
  478. if (s == Z_NULL || s->strm != strm || (s->status != INIT_STATE &&
  479. #ifdef GZIP
  480. s->status != GZIP_STATE &&
  481. #endif
  482. s->status != EXTRA_STATE &&
  483. s->status != NAME_STATE &&
  484. s->status != COMMENT_STATE &&
  485. s->status != HCRC_STATE &&
  486. s->status != BUSY_STATE &&
  487. s->status != FINISH_STATE))
  488. return 1;
  489. return 0;
  490. }
  491. /* ========================================================================= */
  492. int ZEXPORT deflateSetDictionary(z_streamp strm, const Bytef *dictionary,
  493. uInt dictLength) {
  494. deflate_state *s;
  495. uInt str, n;
  496. int wrap;
  497. unsigned avail;
  498. z_const unsigned char *next;
  499. if (deflateStateCheck(strm) || dictionary == Z_NULL)
  500. return Z_STREAM_ERROR;
  501. s = strm->state;
  502. wrap = s->wrap;
  503. if (wrap == 2 || (wrap == 1 && s->status != INIT_STATE) || s->lookahead)
  504. return Z_STREAM_ERROR;
  505. /* when using zlib wrappers, compute Adler-32 for provided dictionary */
  506. if (wrap == 1)
  507. strm->adler = adler32(strm->adler, dictionary, dictLength);
  508. s->wrap = 0; /* avoid computing Adler-32 in read_buf */
  509. /* if dictionary would fill window, just replace the history */
  510. if (dictLength >= s->w_size) {
  511. if (wrap == 0) { /* already empty otherwise */
  512. CLEAR_HASH(s);
  513. s->strstart = 0;
  514. s->block_start = 0L;
  515. s->insert = 0;
  516. }
  517. dictionary += dictLength - s->w_size; /* use the tail */
  518. dictLength = s->w_size;
  519. }
  520. /* insert dictionary into window and hash */
  521. avail = strm->avail_in;
  522. next = strm->next_in;
  523. strm->avail_in = dictLength;
  524. strm->next_in = (z_const Bytef *)dictionary;
  525. fill_window(s);
  526. while (s->lookahead >= MIN_MATCH) {
  527. str = s->strstart;
  528. n = s->lookahead - (MIN_MATCH-1);
  529. do {
  530. UPDATE_HASH(s, s->ins_h, s->window[str + MIN_MATCH-1]);
  531. #ifndef FASTEST
  532. s->prev[str & s->w_mask] = s->head[s->ins_h];
  533. #endif
  534. s->head[s->ins_h] = (Pos)str;
  535. str++;
  536. } while (--n);
  537. s->strstart = str;
  538. s->lookahead = MIN_MATCH-1;
  539. fill_window(s);
  540. }
  541. s->strstart += s->lookahead;
  542. s->block_start = (long)s->strstart;
  543. s->insert = s->lookahead;
  544. s->lookahead = 0;
  545. s->match_length = s->prev_length = MIN_MATCH-1;
  546. s->match_available = 0;
  547. strm->next_in = next;
  548. strm->avail_in = avail;
  549. s->wrap = wrap;
  550. return Z_OK;
  551. }
  552. /* ========================================================================= */
  553. int ZEXPORT deflateGetDictionary(z_streamp strm, Bytef *dictionary,
  554. uInt *dictLength) {
  555. deflate_state *s;
  556. uInt len;
  557. if (deflateStateCheck(strm))
  558. return Z_STREAM_ERROR;
  559. s = strm->state;
  560. len = s->strstart + s->lookahead;
  561. if (len > s->w_size)
  562. len = s->w_size;
  563. if (dictionary != Z_NULL && len)
  564. zmemcpy(dictionary, s->window + s->strstart + s->lookahead - len, len);
  565. if (dictLength != Z_NULL)
  566. *dictLength = len;
  567. return Z_OK;
  568. }
  569. /* ========================================================================= */
  570. int ZEXPORT deflateResetKeep(z_streamp strm) {
  571. deflate_state *s;
  572. if (deflateStateCheck(strm)) {
  573. return Z_STREAM_ERROR;
  574. }
  575. strm->total_in = strm->total_out = 0;
  576. strm->msg = Z_NULL; /* use zfree if we ever allocate msg dynamically */
  577. strm->data_type = Z_UNKNOWN;
  578. s = (deflate_state *)strm->state;
  579. s->pending = 0;
  580. s->pending_out = s->pending_buf;
  581. if (s->wrap < 0) {
  582. s->wrap = -s->wrap; /* was made negative by deflate(..., Z_FINISH); */
  583. }
  584. s->status =
  585. #ifdef GZIP
  586. s->wrap == 2 ? GZIP_STATE :
  587. #endif
  588. INIT_STATE;
  589. strm->adler =
  590. #ifdef GZIP
  591. s->wrap == 2 ? crc32(0L, Z_NULL, 0) :
  592. #endif
  593. adler32(0L, Z_NULL, 0);
  594. s->last_flush = -2;
  595. _tr_init(s);
  596. return Z_OK;
  597. }
  598. /* ===========================================================================
  599. * Initialize the "longest match" routines for a new zlib stream
  600. */
  601. local void lm_init(deflate_state *s) {
  602. s->window_size = (ulg)2L*s->w_size;
  603. CLEAR_HASH(s);
  604. /* Set the default configuration parameters:
  605. */
  606. s->max_lazy_match = configuration_table[s->level].max_lazy;
  607. s->good_match = configuration_table[s->level].good_length;
  608. s->nice_match = configuration_table[s->level].nice_length;
  609. s->max_chain_length = configuration_table[s->level].max_chain;
  610. s->strstart = 0;
  611. s->block_start = 0L;
  612. s->lookahead = 0;
  613. s->insert = 0;
  614. s->match_length = s->prev_length = MIN_MATCH-1;
  615. s->match_available = 0;
  616. s->ins_h = 0;
  617. }
  618. /* ========================================================================= */
  619. int ZEXPORT deflateReset(z_streamp strm) {
  620. int ret;
  621. ret = deflateResetKeep(strm);
  622. if (ret == Z_OK)
  623. lm_init(strm->state);
  624. return ret;
  625. }
  626. /* ========================================================================= */
  627. int ZEXPORT deflateSetHeader(z_streamp strm, gz_headerp head) {
  628. if (deflateStateCheck(strm) || strm->state->wrap != 2)
  629. return Z_STREAM_ERROR;
  630. strm->state->gzhead = head;
  631. return Z_OK;
  632. }
  633. /* ========================================================================= */
  634. int ZEXPORT deflatePending(z_streamp strm, unsigned *pending, int *bits) {
  635. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  636. if (pending != Z_NULL)
  637. *pending = strm->state->pending;
  638. if (bits != Z_NULL)
  639. *bits = strm->state->bi_valid;
  640. return Z_OK;
  641. }
  642. /* ========================================================================= */
  643. int ZEXPORT deflateUsed(z_streamp strm, int *bits) {
  644. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  645. if (bits != Z_NULL)
  646. *bits = strm->state->bi_used;
  647. return Z_OK;
  648. }
  649. /* ========================================================================= */
  650. int ZEXPORT deflatePrime(z_streamp strm, int bits, int value) {
  651. deflate_state *s;
  652. int put;
  653. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  654. s = strm->state;
  655. #ifdef LIT_MEM
  656. if (bits < 0 || bits > 16 ||
  657. (uchf *)s->d_buf < s->pending_out + ((Buf_size + 7) >> 3))
  658. return Z_BUF_ERROR;
  659. #else
  660. if (bits < 0 || bits > 16 ||
  661. s->sym_buf < s->pending_out + ((Buf_size + 7) >> 3))
  662. return Z_BUF_ERROR;
  663. #endif
  664. do {
  665. put = Buf_size - s->bi_valid;
  666. if (put > bits)
  667. put = bits;
  668. s->bi_buf |= (ush)((value & ((1 << put) - 1)) << s->bi_valid);
  669. s->bi_valid += put;
  670. _tr_flush_bits(s);
  671. value >>= put;
  672. bits -= put;
  673. } while (bits);
  674. return Z_OK;
  675. }
  676. /* ========================================================================= */
  677. int ZEXPORT deflateParams(z_streamp strm, int level, int strategy) {
  678. deflate_state *s;
  679. compress_func func;
  680. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  681. s = strm->state;
  682. #ifdef FASTEST
  683. if (level != 0) level = 1;
  684. #else
  685. if (level == Z_DEFAULT_COMPRESSION) level = 6;
  686. #endif
  687. if (level < 0 || level > 9 || strategy < 0 || strategy > Z_FIXED) {
  688. return Z_STREAM_ERROR;
  689. }
  690. func = configuration_table[s->level].func;
  691. if ((strategy != s->strategy || func != configuration_table[level].func) &&
  692. s->last_flush != -2) {
  693. /* Flush the last buffer: */
  694. int err = deflate(strm, Z_BLOCK);
  695. if (err == Z_STREAM_ERROR)
  696. return err;
  697. if (strm->avail_in || (s->strstart - s->block_start) + s->lookahead)
  698. return Z_BUF_ERROR;
  699. }
  700. if (s->level != level) {
  701. if (s->level == 0 && s->matches != 0) {
  702. if (s->matches == 1)
  703. slide_hash(s);
  704. else
  705. CLEAR_HASH(s);
  706. s->matches = 0;
  707. }
  708. s->level = level;
  709. s->max_lazy_match = configuration_table[level].max_lazy;
  710. s->good_match = configuration_table[level].good_length;
  711. s->nice_match = configuration_table[level].nice_length;
  712. s->max_chain_length = configuration_table[level].max_chain;
  713. }
  714. s->strategy = strategy;
  715. return Z_OK;
  716. }
  717. /* ========================================================================= */
  718. int ZEXPORT deflateTune(z_streamp strm, int good_length, int max_lazy,
  719. int nice_length, int max_chain) {
  720. deflate_state *s;
  721. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  722. s = strm->state;
  723. s->good_match = (uInt)good_length;
  724. s->max_lazy_match = (uInt)max_lazy;
  725. s->nice_match = nice_length;
  726. s->max_chain_length = (uInt)max_chain;
  727. return Z_OK;
  728. }
  729. /* =========================================================================
  730. * For the default windowBits of 15 and memLevel of 8, this function returns a
  731. * close to exact, as well as small, upper bound on the compressed size. This
  732. * is an expansion of ~0.03%, plus a small constant.
  733. *
  734. * For any setting other than those defaults for windowBits and memLevel, one
  735. * of two worst case bounds is returned. This is at most an expansion of ~4% or
  736. * ~13%, plus a small constant.
  737. *
  738. * Both the 0.03% and 4% derive from the overhead of stored blocks. The first
  739. * one is for stored blocks of 16383 bytes (memLevel == 8), whereas the second
  740. * is for stored blocks of 127 bytes (the worst case memLevel == 1). The
  741. * expansion results from five bytes of header for each stored block.
  742. *
  743. * The larger expansion of 13% results from a window size less than or equal to
  744. * the symbols buffer size (windowBits <= memLevel + 7). In that case some of
  745. * the data being compressed may have slid out of the sliding window, impeding
  746. * a stored block from being emitted. Then the only choice is a fixed or
  747. * dynamic block, where a fixed block limits the maximum expansion to 9 bits
  748. * per 8-bit byte, plus 10 bits for every block. The smallest block size for
  749. * which this can occur is 255 (memLevel == 2).
  750. *
  751. * Shifts are used to approximate divisions, for speed.
  752. */
  753. uLong ZEXPORT deflateBound(z_streamp strm, uLong sourceLen) {
  754. deflate_state *s;
  755. uLong fixedlen, storelen, wraplen;
  756. /* upper bound for fixed blocks with 9-bit literals and length 255
  757. (memLevel == 2, which is the lowest that may not use stored blocks) --
  758. ~13% overhead plus a small constant */
  759. fixedlen = sourceLen + (sourceLen >> 3) + (sourceLen >> 8) +
  760. (sourceLen >> 9) + 4;
  761. /* upper bound for stored blocks with length 127 (memLevel == 1) --
  762. ~4% overhead plus a small constant */
  763. storelen = sourceLen + (sourceLen >> 5) + (sourceLen >> 7) +
  764. (sourceLen >> 11) + 7;
  765. /* if can't get parameters, return larger bound plus a wrapper */
  766. if (deflateStateCheck(strm))
  767. return (fixedlen > storelen ? fixedlen : storelen) + 18;
  768. /* compute wrapper length */
  769. s = strm->state;
  770. switch (s->wrap < 0 ? -s->wrap : s->wrap) {
  771. case 0: /* raw deflate */
  772. wraplen = 0;
  773. break;
  774. case 1: /* zlib wrapper */
  775. wraplen = 6 + (s->strstart ? 4 : 0);
  776. break;
  777. #ifdef GZIP
  778. case 2: /* gzip wrapper */
  779. wraplen = 18;
  780. if (s->gzhead != Z_NULL) { /* user-supplied gzip header */
  781. Bytef *str;
  782. if (s->gzhead->extra != Z_NULL)
  783. wraplen += 2 + s->gzhead->extra_len;
  784. str = s->gzhead->name;
  785. if (str != Z_NULL)
  786. do {
  787. wraplen++;
  788. } while (*str++);
  789. str = s->gzhead->comment;
  790. if (str != Z_NULL)
  791. do {
  792. wraplen++;
  793. } while (*str++);
  794. if (s->gzhead->hcrc)
  795. wraplen += 2;
  796. }
  797. break;
  798. #endif
  799. default: /* for compiler happiness */
  800. wraplen = 18;
  801. }
  802. /* if not default parameters, return one of the conservative bounds */
  803. if (s->w_bits != 15 || s->hash_bits != 8 + 7)
  804. return (s->w_bits <= s->hash_bits && s->level ? fixedlen : storelen) +
  805. wraplen;
  806. /* default settings: return tight bound for that case -- ~0.03% overhead
  807. plus a small constant */
  808. return sourceLen + (sourceLen >> 12) + (sourceLen >> 14) +
  809. (sourceLen >> 25) + 13 - 6 + wraplen;
  810. }
  811. /* =========================================================================
  812. * Put a short in the pending buffer. The 16-bit value is put in MSB order.
  813. * IN assertion: the stream state is correct and there is enough room in
  814. * pending_buf.
  815. */
  816. local void putShortMSB(deflate_state *s, uInt b) {
  817. put_byte(s, (Byte)(b >> 8));
  818. put_byte(s, (Byte)(b & 0xff));
  819. }
  820. /* =========================================================================
  821. * Flush as much pending output as possible. All deflate() output, except for
  822. * some deflate_stored() output, goes through this function so some
  823. * applications may wish to modify it to avoid allocating a large
  824. * strm->next_out buffer and copying into it. (See also read_buf()).
  825. */
  826. local void flush_pending(z_streamp strm) {
  827. unsigned len;
  828. deflate_state *s = strm->state;
  829. _tr_flush_bits(s);
  830. len = s->pending;
  831. if (len > strm->avail_out) len = strm->avail_out;
  832. if (len == 0) return;
  833. zmemcpy(strm->next_out, s->pending_out, len);
  834. strm->next_out += len;
  835. s->pending_out += len;
  836. strm->total_out += len;
  837. strm->avail_out -= len;
  838. s->pending -= len;
  839. if (s->pending == 0) {
  840. s->pending_out = s->pending_buf;
  841. }
  842. }
  843. /* ===========================================================================
  844. * Update the header CRC with the bytes s->pending_buf[beg..s->pending - 1].
  845. */
  846. #define HCRC_UPDATE(beg) \
  847. do { \
  848. if (s->gzhead->hcrc && s->pending > (beg)) \
  849. strm->adler = crc32(strm->adler, s->pending_buf + (beg), \
  850. s->pending - (beg)); \
  851. } while (0)
  852. /* ========================================================================= */
  853. int ZEXPORT deflate(z_streamp strm, int flush) {
  854. int old_flush; /* value of flush param for previous deflate call */
  855. deflate_state *s;
  856. if (deflateStateCheck(strm) || flush > Z_BLOCK || flush < 0) {
  857. return Z_STREAM_ERROR;
  858. }
  859. s = strm->state;
  860. if (strm->next_out == Z_NULL ||
  861. (strm->avail_in != 0 && strm->next_in == Z_NULL) ||
  862. (s->status == FINISH_STATE && flush != Z_FINISH)) {
  863. ERR_RETURN(strm, Z_STREAM_ERROR);
  864. }
  865. if (strm->avail_out == 0) ERR_RETURN(strm, Z_BUF_ERROR);
  866. old_flush = s->last_flush;
  867. s->last_flush = flush;
  868. /* Flush as much pending output as possible */
  869. if (s->pending != 0) {
  870. flush_pending(strm);
  871. if (strm->avail_out == 0) {
  872. /* Since avail_out is 0, deflate will be called again with
  873. * more output space, but possibly with both pending and
  874. * avail_in equal to zero. There won't be anything to do,
  875. * but this is not an error situation so make sure we
  876. * return OK instead of BUF_ERROR at next call of deflate:
  877. */
  878. s->last_flush = -1;
  879. return Z_OK;
  880. }
  881. /* Make sure there is something to do and avoid duplicate consecutive
  882. * flushes. For repeated and useless calls with Z_FINISH, we keep
  883. * returning Z_STREAM_END instead of Z_BUF_ERROR.
  884. */
  885. } else if (strm->avail_in == 0 && RANK(flush) <= RANK(old_flush) &&
  886. flush != Z_FINISH) {
  887. ERR_RETURN(strm, Z_BUF_ERROR);
  888. }
  889. /* User must not provide more input after the first FINISH: */
  890. if (s->status == FINISH_STATE && strm->avail_in != 0) {
  891. ERR_RETURN(strm, Z_BUF_ERROR);
  892. }
  893. /* Write the header */
  894. if (s->status == INIT_STATE && s->wrap == 0)
  895. s->status = BUSY_STATE;
  896. if (s->status == INIT_STATE) {
  897. /* zlib header */
  898. uInt header = (Z_DEFLATED + ((s->w_bits - 8) << 4)) << 8;
  899. uInt level_flags;
  900. if (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2)
  901. level_flags = 0;
  902. else if (s->level < 6)
  903. level_flags = 1;
  904. else if (s->level == 6)
  905. level_flags = 2;
  906. else
  907. level_flags = 3;
  908. header |= (level_flags << 6);
  909. if (s->strstart != 0) header |= PRESET_DICT;
  910. header += 31 - (header % 31);
  911. putShortMSB(s, header);
  912. /* Save the adler32 of the preset dictionary: */
  913. if (s->strstart != 0) {
  914. putShortMSB(s, (uInt)(strm->adler >> 16));
  915. putShortMSB(s, (uInt)(strm->adler & 0xffff));
  916. }
  917. strm->adler = adler32(0L, Z_NULL, 0);
  918. s->status = BUSY_STATE;
  919. /* Compression must start with an empty pending buffer */
  920. flush_pending(strm);
  921. if (s->pending != 0) {
  922. s->last_flush = -1;
  923. return Z_OK;
  924. }
  925. }
  926. #ifdef GZIP
  927. if (s->status == GZIP_STATE) {
  928. /* gzip header */
  929. strm->adler = crc32(0L, Z_NULL, 0);
  930. put_byte(s, 31);
  931. put_byte(s, 139);
  932. put_byte(s, 8);
  933. if (s->gzhead == Z_NULL) {
  934. put_byte(s, 0);
  935. put_byte(s, 0);
  936. put_byte(s, 0);
  937. put_byte(s, 0);
  938. put_byte(s, 0);
  939. put_byte(s, s->level == 9 ? 2 :
  940. (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2 ?
  941. 4 : 0));
  942. put_byte(s, OS_CODE);
  943. s->status = BUSY_STATE;
  944. /* Compression must start with an empty pending buffer */
  945. flush_pending(strm);
  946. if (s->pending != 0) {
  947. s->last_flush = -1;
  948. return Z_OK;
  949. }
  950. }
  951. else {
  952. put_byte(s, (s->gzhead->text ? 1 : 0) +
  953. (s->gzhead->hcrc ? 2 : 0) +
  954. (s->gzhead->extra == Z_NULL ? 0 : 4) +
  955. (s->gzhead->name == Z_NULL ? 0 : 8) +
  956. (s->gzhead->comment == Z_NULL ? 0 : 16)
  957. );
  958. put_byte(s, (Byte)(s->gzhead->time & 0xff));
  959. put_byte(s, (Byte)((s->gzhead->time >> 8) & 0xff));
  960. put_byte(s, (Byte)((s->gzhead->time >> 16) & 0xff));
  961. put_byte(s, (Byte)((s->gzhead->time >> 24) & 0xff));
  962. put_byte(s, s->level == 9 ? 2 :
  963. (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2 ?
  964. 4 : 0));
  965. put_byte(s, s->gzhead->os & 0xff);
  966. if (s->gzhead->extra != Z_NULL) {
  967. put_byte(s, s->gzhead->extra_len & 0xff);
  968. put_byte(s, (s->gzhead->extra_len >> 8) & 0xff);
  969. }
  970. if (s->gzhead->hcrc)
  971. strm->adler = crc32(strm->adler, s->pending_buf,
  972. s->pending);
  973. s->gzindex = 0;
  974. s->status = EXTRA_STATE;
  975. }
  976. }
  977. if (s->status == EXTRA_STATE) {
  978. if (s->gzhead->extra != Z_NULL) {
  979. ulg beg = s->pending; /* start of bytes to update crc */
  980. uInt left = (s->gzhead->extra_len & 0xffff) - s->gzindex;
  981. while (s->pending + left > s->pending_buf_size) {
  982. uInt copy = s->pending_buf_size - s->pending;
  983. zmemcpy(s->pending_buf + s->pending,
  984. s->gzhead->extra + s->gzindex, copy);
  985. s->pending = s->pending_buf_size;
  986. HCRC_UPDATE(beg);
  987. s->gzindex += copy;
  988. flush_pending(strm);
  989. if (s->pending != 0) {
  990. s->last_flush = -1;
  991. return Z_OK;
  992. }
  993. beg = 0;
  994. left -= copy;
  995. }
  996. zmemcpy(s->pending_buf + s->pending,
  997. s->gzhead->extra + s->gzindex, left);
  998. s->pending += left;
  999. HCRC_UPDATE(beg);
  1000. s->gzindex = 0;
  1001. }
  1002. s->status = NAME_STATE;
  1003. }
  1004. if (s->status == NAME_STATE) {
  1005. if (s->gzhead->name != Z_NULL) {
  1006. ulg beg = s->pending; /* start of bytes to update crc */
  1007. int val;
  1008. do {
  1009. if (s->pending == s->pending_buf_size) {
  1010. HCRC_UPDATE(beg);
  1011. flush_pending(strm);
  1012. if (s->pending != 0) {
  1013. s->last_flush = -1;
  1014. return Z_OK;
  1015. }
  1016. beg = 0;
  1017. }
  1018. val = s->gzhead->name[s->gzindex++];
  1019. put_byte(s, val);
  1020. } while (val != 0);
  1021. HCRC_UPDATE(beg);
  1022. s->gzindex = 0;
  1023. }
  1024. s->status = COMMENT_STATE;
  1025. }
  1026. if (s->status == COMMENT_STATE) {
  1027. if (s->gzhead->comment != Z_NULL) {
  1028. ulg beg = s->pending; /* start of bytes to update crc */
  1029. int val;
  1030. do {
  1031. if (s->pending == s->pending_buf_size) {
  1032. HCRC_UPDATE(beg);
  1033. flush_pending(strm);
  1034. if (s->pending != 0) {
  1035. s->last_flush = -1;
  1036. return Z_OK;
  1037. }
  1038. beg = 0;
  1039. }
  1040. val = s->gzhead->comment[s->gzindex++];
  1041. put_byte(s, val);
  1042. } while (val != 0);
  1043. HCRC_UPDATE(beg);
  1044. }
  1045. s->status = HCRC_STATE;
  1046. }
  1047. if (s->status == HCRC_STATE) {
  1048. if (s->gzhead->hcrc) {
  1049. if (s->pending + 2 > s->pending_buf_size) {
  1050. flush_pending(strm);
  1051. if (s->pending != 0) {
  1052. s->last_flush = -1;
  1053. return Z_OK;
  1054. }
  1055. }
  1056. put_byte(s, (Byte)(strm->adler & 0xff));
  1057. put_byte(s, (Byte)((strm->adler >> 8) & 0xff));
  1058. strm->adler = crc32(0L, Z_NULL, 0);
  1059. }
  1060. s->status = BUSY_STATE;
  1061. /* Compression must start with an empty pending buffer */
  1062. flush_pending(strm);
  1063. if (s->pending != 0) {
  1064. s->last_flush = -1;
  1065. return Z_OK;
  1066. }
  1067. }
  1068. #endif
  1069. /* Start a new block or continue the current one.
  1070. */
  1071. if (strm->avail_in != 0 || s->lookahead != 0 ||
  1072. (flush != Z_NO_FLUSH && s->status != FINISH_STATE)) {
  1073. block_state bstate;
  1074. bstate = s->level == 0 ? deflate_stored(s, flush) :
  1075. s->strategy == Z_HUFFMAN_ONLY ? deflate_huff(s, flush) :
  1076. s->strategy == Z_RLE ? deflate_rle(s, flush) :
  1077. (*(configuration_table[s->level].func))(s, flush);
  1078. if (bstate == finish_started || bstate == finish_done) {
  1079. s->status = FINISH_STATE;
  1080. }
  1081. if (bstate == need_more || bstate == finish_started) {
  1082. if (strm->avail_out == 0) {
  1083. s->last_flush = -1; /* avoid BUF_ERROR next call, see above */
  1084. }
  1085. return Z_OK;
  1086. /* If flush != Z_NO_FLUSH && avail_out == 0, the next call
  1087. * of deflate should use the same flush parameter to make sure
  1088. * that the flush is complete. So we don't have to output an
  1089. * empty block here, this will be done at next call. This also
  1090. * ensures that for a very small output buffer, we emit at most
  1091. * one empty block.
  1092. */
  1093. }
  1094. if (bstate == block_done) {
  1095. if (flush == Z_PARTIAL_FLUSH) {
  1096. _tr_align(s);
  1097. } else if (flush != Z_BLOCK) { /* FULL_FLUSH or SYNC_FLUSH */
  1098. _tr_stored_block(s, (char*)0, 0L, 0);
  1099. /* For a full flush, this empty block will be recognized
  1100. * as a special marker by inflate_sync().
  1101. */
  1102. if (flush == Z_FULL_FLUSH) {
  1103. CLEAR_HASH(s); /* forget history */
  1104. if (s->lookahead == 0) {
  1105. s->strstart = 0;
  1106. s->block_start = 0L;
  1107. s->insert = 0;
  1108. }
  1109. }
  1110. }
  1111. flush_pending(strm);
  1112. if (strm->avail_out == 0) {
  1113. s->last_flush = -1; /* avoid BUF_ERROR at next call, see above */
  1114. return Z_OK;
  1115. }
  1116. }
  1117. }
  1118. if (flush != Z_FINISH) return Z_OK;
  1119. if (s->wrap <= 0) return Z_STREAM_END;
  1120. /* Write the trailer */
  1121. #ifdef GZIP
  1122. if (s->wrap == 2) {
  1123. put_byte(s, (Byte)(strm->adler & 0xff));
  1124. put_byte(s, (Byte)((strm->adler >> 8) & 0xff));
  1125. put_byte(s, (Byte)((strm->adler >> 16) & 0xff));
  1126. put_byte(s, (Byte)((strm->adler >> 24) & 0xff));
  1127. put_byte(s, (Byte)(strm->total_in & 0xff));
  1128. put_byte(s, (Byte)((strm->total_in >> 8) & 0xff));
  1129. put_byte(s, (Byte)((strm->total_in >> 16) & 0xff));
  1130. put_byte(s, (Byte)((strm->total_in >> 24) & 0xff));
  1131. }
  1132. else
  1133. #endif
  1134. {
  1135. putShortMSB(s, (uInt)(strm->adler >> 16));
  1136. putShortMSB(s, (uInt)(strm->adler & 0xffff));
  1137. }
  1138. flush_pending(strm);
  1139. /* If avail_out is zero, the application will call deflate again
  1140. * to flush the rest.
  1141. */
  1142. if (s->wrap > 0) s->wrap = -s->wrap; /* write the trailer only once! */
  1143. return s->pending != 0 ? Z_OK : Z_STREAM_END;
  1144. }
  1145. /* ========================================================================= */
  1146. int ZEXPORT deflateEnd(z_streamp strm) {
  1147. int status;
  1148. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  1149. status = strm->state->status;
  1150. /* Deallocate in reverse order of allocations: */
  1151. TRY_FREE(strm, strm->state->pending_buf);
  1152. TRY_FREE(strm, strm->state->head);
  1153. TRY_FREE(strm, strm->state->prev);
  1154. TRY_FREE(strm, strm->state->window);
  1155. ZFREE(strm, strm->state);
  1156. strm->state = Z_NULL;
  1157. return status == BUSY_STATE ? Z_DATA_ERROR : Z_OK;
  1158. }
  1159. /* =========================================================================
  1160. * Copy the source state to the destination state.
  1161. * To simplify the source, this is not supported for 16-bit MSDOS (which
  1162. * doesn't have enough memory anyway to duplicate compression states).
  1163. */
  1164. int ZEXPORT deflateCopy(z_streamp dest, z_streamp source) {
  1165. #ifdef MAXSEG_64K
  1166. (void)dest;
  1167. (void)source;
  1168. return Z_STREAM_ERROR;
  1169. #else
  1170. deflate_state *ds;
  1171. deflate_state *ss;
  1172. if (deflateStateCheck(source) || dest == Z_NULL) {
  1173. return Z_STREAM_ERROR;
  1174. }
  1175. ss = source->state;
  1176. zmemcpy((voidpf)dest, (voidpf)source, sizeof(z_stream));
  1177. ds = (deflate_state *) ZALLOC(dest, 1, sizeof(deflate_state));
  1178. if (ds == Z_NULL) return Z_MEM_ERROR;
  1179. dest->state = (struct internal_state FAR *) ds;
  1180. zmemcpy((voidpf)ds, (voidpf)ss, sizeof(deflate_state));
  1181. ds->strm = dest;
  1182. ds->window = (Bytef *) ZALLOC(dest, ds->w_size, 2*sizeof(Byte));
  1183. ds->prev = (Posf *) ZALLOC(dest, ds->w_size, sizeof(Pos));
  1184. ds->head = (Posf *) ZALLOC(dest, ds->hash_size, sizeof(Pos));
  1185. ds->pending_buf = (uchf *) ZALLOC(dest, ds->lit_bufsize, LIT_BUFS);
  1186. if (ds->window == Z_NULL || ds->prev == Z_NULL || ds->head == Z_NULL ||
  1187. ds->pending_buf == Z_NULL) {
  1188. deflateEnd (dest);
  1189. return Z_MEM_ERROR;
  1190. }
  1191. /* following zmemcpy do not work for 16-bit MSDOS */
  1192. zmemcpy(ds->window, ss->window, ds->w_size * 2 * sizeof(Byte));
  1193. zmemcpy((voidpf)ds->prev, (voidpf)ss->prev, ds->w_size * sizeof(Pos));
  1194. zmemcpy((voidpf)ds->head, (voidpf)ss->head, ds->hash_size * sizeof(Pos));
  1195. zmemcpy(ds->pending_buf, ss->pending_buf, ds->lit_bufsize * LIT_BUFS);
  1196. ds->pending_out = ds->pending_buf + (ss->pending_out - ss->pending_buf);
  1197. #ifdef LIT_MEM
  1198. ds->d_buf = (ushf *)(ds->pending_buf + (ds->lit_bufsize << 1));
  1199. ds->l_buf = ds->pending_buf + (ds->lit_bufsize << 2);
  1200. #else
  1201. ds->sym_buf = ds->pending_buf + ds->lit_bufsize;
  1202. #endif
  1203. ds->l_desc.dyn_tree = ds->dyn_ltree;
  1204. ds->d_desc.dyn_tree = ds->dyn_dtree;
  1205. ds->bl_desc.dyn_tree = ds->bl_tree;
  1206. return Z_OK;
  1207. #endif /* MAXSEG_64K */
  1208. }
  1209. #ifndef FASTEST
  1210. /* ===========================================================================
  1211. * Set match_start to the longest match starting at the given string and
  1212. * return its length. Matches shorter or equal to prev_length are discarded,
  1213. * in which case the result is equal to prev_length and match_start is
  1214. * garbage.
  1215. * IN assertions: cur_match is the head of the hash chain for the current
  1216. * string (strstart) and its distance is <= MAX_DIST, and prev_length >= 1
  1217. * OUT assertion: the match length is not greater than s->lookahead.
  1218. */
  1219. local uInt longest_match(deflate_state *s, IPos cur_match) {
  1220. unsigned chain_length = s->max_chain_length;/* max hash chain length */
  1221. register Bytef *scan = s->window + s->strstart; /* current string */
  1222. register Bytef *match; /* matched string */
  1223. register int len; /* length of current match */
  1224. int best_len = (int)s->prev_length; /* best match length so far */
  1225. int nice_match = s->nice_match; /* stop if match long enough */
  1226. IPos limit = s->strstart > (IPos)MAX_DIST(s) ?
  1227. s->strstart - (IPos)MAX_DIST(s) : NIL;
  1228. /* Stop when cur_match becomes <= limit. To simplify the code,
  1229. * we prevent matches with the string of window index 0.
  1230. */
  1231. Posf *prev = s->prev;
  1232. uInt wmask = s->w_mask;
  1233. #ifdef UNALIGNED_OK
  1234. /* Compare two bytes at a time. Note: this is not always beneficial.
  1235. * Try with and without -DUNALIGNED_OK to check.
  1236. */
  1237. register Bytef *strend = s->window + s->strstart + MAX_MATCH - 1;
  1238. register ush scan_start = *(ushf*)scan;
  1239. register ush scan_end = *(ushf*)(scan + best_len - 1);
  1240. #else
  1241. register Bytef *strend = s->window + s->strstart + MAX_MATCH;
  1242. register Byte scan_end1 = scan[best_len - 1];
  1243. register Byte scan_end = scan[best_len];
  1244. #endif
  1245. /* The code is optimized for HASH_BITS >= 8 and MAX_MATCH-2 multiple of 16.
  1246. * It is easy to get rid of this optimization if necessary.
  1247. */
  1248. Assert(s->hash_bits >= 8 && MAX_MATCH == 258, "Code too clever");
  1249. /* Do not waste too much time if we already have a good match: */
  1250. if (s->prev_length >= s->good_match) {
  1251. chain_length >>= 2;
  1252. }
  1253. /* Do not look for matches beyond the end of the input. This is necessary
  1254. * to make deflate deterministic.
  1255. */
  1256. if ((uInt)nice_match > s->lookahead) nice_match = (int)s->lookahead;
  1257. Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
  1258. "need lookahead");
  1259. do {
  1260. Assert(cur_match < s->strstart, "no future");
  1261. match = s->window + cur_match;
  1262. /* Skip to next match if the match length cannot increase
  1263. * or if the match length is less than 2. Note that the checks below
  1264. * for insufficient lookahead only occur occasionally for performance
  1265. * reasons. Therefore uninitialized memory will be accessed, and
  1266. * conditional jumps will be made that depend on those values.
  1267. * However the length of the match is limited to the lookahead, so
  1268. * the output of deflate is not affected by the uninitialized values.
  1269. */
  1270. #if (defined(UNALIGNED_OK) && MAX_MATCH == 258)
  1271. /* This code assumes sizeof(unsigned short) == 2. Do not use
  1272. * UNALIGNED_OK if your compiler uses a different size.
  1273. */
  1274. if (*(ushf*)(match + best_len - 1) != scan_end ||
  1275. *(ushf*)match != scan_start) continue;
  1276. /* It is not necessary to compare scan[2] and match[2] since they are
  1277. * always equal when the other bytes match, given that the hash keys
  1278. * are equal and that HASH_BITS >= 8. Compare 2 bytes at a time at
  1279. * strstart + 3, + 5, up to strstart + 257. We check for insufficient
  1280. * lookahead only every 4th comparison; the 128th check will be made
  1281. * at strstart + 257. If MAX_MATCH-2 is not a multiple of 8, it is
  1282. * necessary to put more guard bytes at the end of the window, or
  1283. * to check more often for insufficient lookahead.
  1284. */
  1285. Assert(scan[2] == match[2], "scan[2]?");
  1286. scan++, match++;
  1287. do {
  1288. } while (*(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1289. *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1290. *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1291. *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1292. scan < strend);
  1293. /* The funny "do {}" generates better code on most compilers */
  1294. /* Here, scan <= window + strstart + 257 */
  1295. Assert(scan <= s->window + (unsigned)(s->window_size - 1),
  1296. "wild scan");
  1297. if (*scan == *match) scan++;
  1298. len = (MAX_MATCH - 1) - (int)(strend - scan);
  1299. scan = strend - (MAX_MATCH-1);
  1300. #else /* UNALIGNED_OK */
  1301. if (match[best_len] != scan_end ||
  1302. match[best_len - 1] != scan_end1 ||
  1303. *match != *scan ||
  1304. *++match != scan[1]) continue;
  1305. /* The check at best_len - 1 can be removed because it will be made
  1306. * again later. (This heuristic is not always a win.)
  1307. * It is not necessary to compare scan[2] and match[2] since they
  1308. * are always equal when the other bytes match, given that
  1309. * the hash keys are equal and that HASH_BITS >= 8.
  1310. */
  1311. scan += 2, match++;
  1312. Assert(*scan == *match, "match[2]?");
  1313. /* We check for insufficient lookahead only every 8th comparison;
  1314. * the 256th check will be made at strstart + 258.
  1315. */
  1316. do {
  1317. } while (*++scan == *++match && *++scan == *++match &&
  1318. *++scan == *++match && *++scan == *++match &&
  1319. *++scan == *++match && *++scan == *++match &&
  1320. *++scan == *++match && *++scan == *++match &&
  1321. scan < strend);
  1322. Assert(scan <= s->window + (unsigned)(s->window_size - 1),
  1323. "wild scan");
  1324. len = MAX_MATCH - (int)(strend - scan);
  1325. scan = strend - MAX_MATCH;
  1326. #endif /* UNALIGNED_OK */
  1327. if (len > best_len) {
  1328. s->match_start = cur_match;
  1329. best_len = len;
  1330. if (len >= nice_match) break;
  1331. #ifdef UNALIGNED_OK
  1332. scan_end = *(ushf*)(scan + best_len - 1);
  1333. #else
  1334. scan_end1 = scan[best_len - 1];
  1335. scan_end = scan[best_len];
  1336. #endif
  1337. }
  1338. } while ((cur_match = prev[cur_match & wmask]) > limit
  1339. && --chain_length != 0);
  1340. if ((uInt)best_len <= s->lookahead) return (uInt)best_len;
  1341. return s->lookahead;
  1342. }
  1343. #else /* FASTEST */
  1344. /* ---------------------------------------------------------------------------
  1345. * Optimized version for FASTEST only
  1346. */
  1347. local uInt longest_match(deflate_state *s, IPos cur_match) {
  1348. register Bytef *scan = s->window + s->strstart; /* current string */
  1349. register Bytef *match; /* matched string */
  1350. register int len; /* length of current match */
  1351. register Bytef *strend = s->window + s->strstart + MAX_MATCH;
  1352. /* The code is optimized for HASH_BITS >= 8 and MAX_MATCH-2 multiple of 16.
  1353. * It is easy to get rid of this optimization if necessary.
  1354. */
  1355. Assert(s->hash_bits >= 8 && MAX_MATCH == 258, "Code too clever");
  1356. Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
  1357. "need lookahead");
  1358. Assert(cur_match < s->strstart, "no future");
  1359. match = s->window + cur_match;
  1360. /* Return failure if the match length is less than 2:
  1361. */
  1362. if (match[0] != scan[0] || match[1] != scan[1]) return MIN_MATCH-1;
  1363. /* The check at best_len - 1 can be removed because it will be made
  1364. * again later. (This heuristic is not always a win.)
  1365. * It is not necessary to compare scan[2] and match[2] since they
  1366. * are always equal when the other bytes match, given that
  1367. * the hash keys are equal and that HASH_BITS >= 8.
  1368. */
  1369. scan += 2, match += 2;
  1370. Assert(*scan == *match, "match[2]?");
  1371. /* We check for insufficient lookahead only every 8th comparison;
  1372. * the 256th check will be made at strstart + 258.
  1373. */
  1374. do {
  1375. } while (*++scan == *++match && *++scan == *++match &&
  1376. *++scan == *++match && *++scan == *++match &&
  1377. *++scan == *++match && *++scan == *++match &&
  1378. *++scan == *++match && *++scan == *++match &&
  1379. scan < strend);
  1380. Assert(scan <= s->window + (unsigned)(s->window_size - 1), "wild scan");
  1381. len = MAX_MATCH - (int)(strend - scan);
  1382. if (len < MIN_MATCH) return MIN_MATCH - 1;
  1383. s->match_start = cur_match;
  1384. return (uInt)len <= s->lookahead ? (uInt)len : s->lookahead;
  1385. }
  1386. #endif /* FASTEST */
  1387. #ifdef ZLIB_DEBUG
  1388. #define EQUAL 0
  1389. /* result of memcmp for equal strings */
  1390. /* ===========================================================================
  1391. * Check that the match at match_start is indeed a match.
  1392. */
  1393. local void check_match(deflate_state *s, IPos start, IPos match, int length) {
  1394. /* check that the match is indeed a match */
  1395. Bytef *back = s->window + (int)match, *here = s->window + start;
  1396. IPos len = length;
  1397. if (match == (IPos)-1) {
  1398. /* match starts one byte before the current window -- just compare the
  1399. subsequent length-1 bytes */
  1400. back++;
  1401. here++;
  1402. len--;
  1403. }
  1404. if (zmemcmp(back, here, len) != EQUAL) {
  1405. fprintf(stderr, " start %u, match %d, length %d\n",
  1406. start, (int)match, length);
  1407. do {
  1408. fprintf(stderr, "(%02x %02x)", *back++, *here++);
  1409. } while (--len != 0);
  1410. z_error("invalid match");
  1411. }
  1412. if (z_verbose > 1) {
  1413. fprintf(stderr,"\\[%d,%d]", start - match, length);
  1414. do { putc(s->window[start++], stderr); } while (--length != 0);
  1415. }
  1416. }
  1417. #else
  1418. # define check_match(s, start, match, length)
  1419. #endif /* ZLIB_DEBUG */
  1420. /* ===========================================================================
  1421. * Flush the current block, with given end-of-file flag.
  1422. * IN assertion: strstart is set to the end of the current match.
  1423. */
  1424. #define FLUSH_BLOCK_ONLY(s, last) { \
  1425. _tr_flush_block(s, (s->block_start >= 0L ? \
  1426. (charf *)&s->window[(unsigned)s->block_start] : \
  1427. (charf *)Z_NULL), \
  1428. (ulg)((long)s->strstart - s->block_start), \
  1429. (last)); \
  1430. s->block_start = s->strstart; \
  1431. flush_pending(s->strm); \
  1432. Tracev((stderr,"[FLUSH]")); \
  1433. }
  1434. /* Same but force premature exit if necessary. */
  1435. #define FLUSH_BLOCK(s, last) { \
  1436. FLUSH_BLOCK_ONLY(s, last); \
  1437. if (s->strm->avail_out == 0) return (last) ? finish_started : need_more; \
  1438. }
  1439. /* Maximum stored block length in deflate format (not including header). */
  1440. #define MAX_STORED 65535
  1441. /* Minimum of a and b. */
  1442. #define MIN(a, b) ((a) > (b) ? (b) : (a))
  1443. /* ===========================================================================
  1444. * Copy without compression as much as possible from the input stream, return
  1445. * the current block state.
  1446. *
  1447. * In case deflateParams() is used to later switch to a non-zero compression
  1448. * level, s->matches (otherwise unused when storing) keeps track of the number
  1449. * of hash table slides to perform. If s->matches is 1, then one hash table
  1450. * slide will be done when switching. If s->matches is 2, the maximum value
  1451. * allowed here, then the hash table will be cleared, since two or more slides
  1452. * is the same as a clear.
  1453. *
  1454. * deflate_stored() is written to minimize the number of times an input byte is
  1455. * copied. It is most efficient with large input and output buffers, which
  1456. * maximizes the opportunities to have a single copy from next_in to next_out.
  1457. */
  1458. local block_state deflate_stored(deflate_state *s, int flush) {
  1459. /* Smallest worthy block size when not flushing or finishing. By default
  1460. * this is 32K. This can be as small as 507 bytes for memLevel == 1. For
  1461. * large input and output buffers, the stored block size will be larger.
  1462. */
  1463. unsigned min_block = MIN(s->pending_buf_size - 5, s->w_size);
  1464. /* Copy as many min_block or larger stored blocks directly to next_out as
  1465. * possible. If flushing, copy the remaining available input to next_out as
  1466. * stored blocks, if there is enough space.
  1467. */
  1468. int last = 0;
  1469. unsigned len, left, have;
  1470. unsigned used = s->strm->avail_in;
  1471. do {
  1472. /* Set len to the maximum size block that we can copy directly with the
  1473. * available input data and output space. Set left to how much of that
  1474. * would be copied from what's left in the window.
  1475. */
  1476. len = MAX_STORED; /* maximum deflate stored block length */
  1477. have = (s->bi_valid + 42) >> 3; /* number of header bytes */
  1478. if (s->strm->avail_out < have) /* need room for header */
  1479. break;
  1480. /* maximum stored block length that will fit in avail_out: */
  1481. have = s->strm->avail_out - have;
  1482. left = s->strstart - s->block_start; /* bytes left in window */
  1483. if (len > (ulg)left + s->strm->avail_in)
  1484. len = left + s->strm->avail_in; /* limit len to the input */
  1485. if (len > have)
  1486. len = have; /* limit len to the output */
  1487. /* If the stored block would be less than min_block in length, or if
  1488. * unable to copy all of the available input when flushing, then try
  1489. * copying to the window and the pending buffer instead. Also don't
  1490. * write an empty block when flushing -- deflate() does that.
  1491. */
  1492. if (len < min_block && ((len == 0 && flush != Z_FINISH) ||
  1493. flush == Z_NO_FLUSH ||
  1494. len != left + s->strm->avail_in))
  1495. break;
  1496. /* Make a dummy stored block in pending to get the header bytes,
  1497. * including any pending bits. This also updates the debugging counts.
  1498. */
  1499. last = flush == Z_FINISH && len == left + s->strm->avail_in ? 1 : 0;
  1500. _tr_stored_block(s, (char *)0, 0L, last);
  1501. /* Replace the lengths in the dummy stored block with len. */
  1502. s->pending_buf[s->pending - 4] = (Bytef)len;
  1503. s->pending_buf[s->pending - 3] = (Bytef)(len >> 8);
  1504. s->pending_buf[s->pending - 2] = (Bytef)~len;
  1505. s->pending_buf[s->pending - 1] = (Bytef)(~len >> 8);
  1506. /* Write the stored block header bytes. */
  1507. flush_pending(s->strm);
  1508. #ifdef ZLIB_DEBUG
  1509. /* Update debugging counts for the data about to be copied. */
  1510. s->compressed_len += len << 3;
  1511. s->bits_sent += len << 3;
  1512. #endif
  1513. /* Copy uncompressed bytes from the window to next_out. */
  1514. if (left) {
  1515. if (left > len)
  1516. left = len;
  1517. zmemcpy(s->strm->next_out, s->window + s->block_start, left);
  1518. s->strm->next_out += left;
  1519. s->strm->avail_out -= left;
  1520. s->strm->total_out += left;
  1521. s->block_start += left;
  1522. len -= left;
  1523. }
  1524. /* Copy uncompressed bytes directly from next_in to next_out, updating
  1525. * the check value.
  1526. */
  1527. if (len) {
  1528. read_buf(s->strm, s->strm->next_out, len);
  1529. s->strm->next_out += len;
  1530. s->strm->avail_out -= len;
  1531. s->strm->total_out += len;
  1532. }
  1533. } while (last == 0);
  1534. /* Update the sliding window with the last s->w_size bytes of the copied
  1535. * data, or append all of the copied data to the existing window if less
  1536. * than s->w_size bytes were copied. Also update the number of bytes to
  1537. * insert in the hash tables, in the event that deflateParams() switches to
  1538. * a non-zero compression level.
  1539. */
  1540. used -= s->strm->avail_in; /* number of input bytes directly copied */
  1541. if (used) {
  1542. /* If any input was used, then no unused input remains in the window,
  1543. * therefore s->block_start == s->strstart.
  1544. */
  1545. if (used >= s->w_size) { /* supplant the previous history */
  1546. s->matches = 2; /* clear hash */
  1547. zmemcpy(s->window, s->strm->next_in - s->w_size, s->w_size);
  1548. s->strstart = s->w_size;
  1549. s->insert = s->strstart;
  1550. }
  1551. else {
  1552. if (s->window_size - s->strstart <= used) {
  1553. /* Slide the window down. */
  1554. s->strstart -= s->w_size;
  1555. zmemcpy(s->window, s->window + s->w_size, s->strstart);
  1556. if (s->matches < 2)
  1557. s->matches++; /* add a pending slide_hash() */
  1558. if (s->insert > s->strstart)
  1559. s->insert = s->strstart;
  1560. }
  1561. zmemcpy(s->window + s->strstart, s->strm->next_in - used, used);
  1562. s->strstart += used;
  1563. s->insert += MIN(used, s->w_size - s->insert);
  1564. }
  1565. s->block_start = s->strstart;
  1566. }
  1567. if (s->high_water < s->strstart)
  1568. s->high_water = s->strstart;
  1569. /* If the last block was written to next_out, then done. */
  1570. if (last) {
  1571. s->bi_used = 8;
  1572. return finish_done;
  1573. }
  1574. /* If flushing and all input has been consumed, then done. */
  1575. if (flush != Z_NO_FLUSH && flush != Z_FINISH &&
  1576. s->strm->avail_in == 0 && (long)s->strstart == s->block_start)
  1577. return block_done;
  1578. /* Fill the window with any remaining input. */
  1579. have = s->window_size - s->strstart;
  1580. if (s->strm->avail_in > have && s->block_start >= (long)s->w_size) {
  1581. /* Slide the window down. */
  1582. s->block_start -= s->w_size;
  1583. s->strstart -= s->w_size;
  1584. zmemcpy(s->window, s->window + s->w_size, s->strstart);
  1585. if (s->matches < 2)
  1586. s->matches++; /* add a pending slide_hash() */
  1587. have += s->w_size; /* more space now */
  1588. if (s->insert > s->strstart)
  1589. s->insert = s->strstart;
  1590. }
  1591. if (have > s->strm->avail_in)
  1592. have = s->strm->avail_in;
  1593. if (have) {
  1594. read_buf(s->strm, s->window + s->strstart, have);
  1595. s->strstart += have;
  1596. s->insert += MIN(have, s->w_size - s->insert);
  1597. }
  1598. if (s->high_water < s->strstart)
  1599. s->high_water = s->strstart;
  1600. /* There was not enough avail_out to write a complete worthy or flushed
  1601. * stored block to next_out. Write a stored block to pending instead, if we
  1602. * have enough input for a worthy block, or if flushing and there is enough
  1603. * room for the remaining input as a stored block in the pending buffer.
  1604. */
  1605. have = (s->bi_valid + 42) >> 3; /* number of header bytes */
  1606. /* maximum stored block length that will fit in pending: */
  1607. have = MIN(s->pending_buf_size - have, MAX_STORED);
  1608. min_block = MIN(have, s->w_size);
  1609. left = s->strstart - s->block_start;
  1610. if (left >= min_block ||
  1611. ((left || flush == Z_FINISH) && flush != Z_NO_FLUSH &&
  1612. s->strm->avail_in == 0 && left <= have)) {
  1613. len = MIN(left, have);
  1614. last = flush == Z_FINISH && s->strm->avail_in == 0 &&
  1615. len == left ? 1 : 0;
  1616. _tr_stored_block(s, (charf *)s->window + s->block_start, len, last);
  1617. s->block_start += len;
  1618. flush_pending(s->strm);
  1619. }
  1620. /* We've done all we can with the available input and output. */
  1621. if (last)
  1622. s->bi_used = 8;
  1623. return last ? finish_started : need_more;
  1624. }
  1625. /* ===========================================================================
  1626. * Compress as much as possible from the input stream, return the current
  1627. * block state.
  1628. * This function does not perform lazy evaluation of matches and inserts
  1629. * new strings in the dictionary only for unmatched strings or for short
  1630. * matches. It is used only for the fast compression options.
  1631. */
  1632. local block_state deflate_fast(deflate_state *s, int flush) {
  1633. IPos hash_head; /* head of the hash chain */
  1634. int bflush; /* set if current block must be flushed */
  1635. for (;;) {
  1636. /* Make sure that we always have enough lookahead, except
  1637. * at the end of the input file. We need MAX_MATCH bytes
  1638. * for the next match, plus MIN_MATCH bytes to insert the
  1639. * string following the next match.
  1640. */
  1641. if (s->lookahead < MIN_LOOKAHEAD) {
  1642. fill_window(s);
  1643. if (s->lookahead < MIN_LOOKAHEAD && flush == Z_NO_FLUSH) {
  1644. return need_more;
  1645. }
  1646. if (s->lookahead == 0) break; /* flush the current block */
  1647. }
  1648. /* Insert the string window[strstart .. strstart + 2] in the
  1649. * dictionary, and set hash_head to the head of the hash chain:
  1650. */
  1651. hash_head = NIL;
  1652. if (s->lookahead >= MIN_MATCH) {
  1653. INSERT_STRING(s, s->strstart, hash_head);
  1654. }
  1655. /* Find the longest match, discarding those <= prev_length.
  1656. * At this point we have always match_length < MIN_MATCH
  1657. */
  1658. if (hash_head != NIL && s->strstart - hash_head <= MAX_DIST(s)) {
  1659. /* To simplify the code, we prevent matches with the string
  1660. * of window index 0 (in particular we have to avoid a match
  1661. * of the string with itself at the start of the input file).
  1662. */
  1663. s->match_length = longest_match (s, hash_head);
  1664. /* longest_match() sets match_start */
  1665. }
  1666. if (s->match_length >= MIN_MATCH) {
  1667. check_match(s, s->strstart, s->match_start, s->match_length);
  1668. _tr_tally_dist(s, s->strstart - s->match_start,
  1669. s->match_length - MIN_MATCH, bflush);
  1670. s->lookahead -= s->match_length;
  1671. /* Insert new strings in the hash table only if the match length
  1672. * is not too large. This saves time but degrades compression.
  1673. */
  1674. #ifndef FASTEST
  1675. if (s->match_length <= s->max_insert_length &&
  1676. s->lookahead >= MIN_MATCH) {
  1677. s->match_length--; /* string at strstart already in table */
  1678. do {
  1679. s->strstart++;
  1680. INSERT_STRING(s, s->strstart, hash_head);
  1681. /* strstart never exceeds WSIZE-MAX_MATCH, so there are
  1682. * always MIN_MATCH bytes ahead.
  1683. */
  1684. } while (--s->match_length != 0);
  1685. s->strstart++;
  1686. } else
  1687. #endif
  1688. {
  1689. s->strstart += s->match_length;
  1690. s->match_length = 0;
  1691. s->ins_h = s->window[s->strstart];
  1692. UPDATE_HASH(s, s->ins_h, s->window[s->strstart + 1]);
  1693. #if MIN_MATCH != 3
  1694. Call UPDATE_HASH() MIN_MATCH-3 more times
  1695. #endif
  1696. /* If lookahead < MIN_MATCH, ins_h is garbage, but it does not
  1697. * matter since it will be recomputed at next deflate call.
  1698. */
  1699. }
  1700. } else {
  1701. /* No match, output a literal byte */
  1702. Tracevv((stderr,"%c", s->window[s->strstart]));
  1703. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1704. s->lookahead--;
  1705. s->strstart++;
  1706. }
  1707. if (bflush) FLUSH_BLOCK(s, 0);
  1708. }
  1709. s->insert = s->strstart < MIN_MATCH-1 ? s->strstart : MIN_MATCH-1;
  1710. if (flush == Z_FINISH) {
  1711. FLUSH_BLOCK(s, 1);
  1712. return finish_done;
  1713. }
  1714. if (s->sym_next)
  1715. FLUSH_BLOCK(s, 0);
  1716. return block_done;
  1717. }
  1718. #ifndef FASTEST
  1719. /* ===========================================================================
  1720. * Same as above, but achieves better compression. We use a lazy
  1721. * evaluation for matches: a match is finally adopted only if there is
  1722. * no better match at the next window position.
  1723. */
  1724. local block_state deflate_slow(deflate_state *s, int flush) {
  1725. IPos hash_head; /* head of hash chain */
  1726. int bflush; /* set if current block must be flushed */
  1727. /* Process the input block. */
  1728. for (;;) {
  1729. /* Make sure that we always have enough lookahead, except
  1730. * at the end of the input file. We need MAX_MATCH bytes
  1731. * for the next match, plus MIN_MATCH bytes to insert the
  1732. * string following the next match.
  1733. */
  1734. if (s->lookahead < MIN_LOOKAHEAD) {
  1735. fill_window(s);
  1736. if (s->lookahead < MIN_LOOKAHEAD && flush == Z_NO_FLUSH) {
  1737. return need_more;
  1738. }
  1739. if (s->lookahead == 0) break; /* flush the current block */
  1740. }
  1741. /* Insert the string window[strstart .. strstart + 2] in the
  1742. * dictionary, and set hash_head to the head of the hash chain:
  1743. */
  1744. hash_head = NIL;
  1745. if (s->lookahead >= MIN_MATCH) {
  1746. INSERT_STRING(s, s->strstart, hash_head);
  1747. }
  1748. /* Find the longest match, discarding those <= prev_length.
  1749. */
  1750. s->prev_length = s->match_length, s->prev_match = s->match_start;
  1751. s->match_length = MIN_MATCH-1;
  1752. if (hash_head != NIL && s->prev_length < s->max_lazy_match &&
  1753. s->strstart - hash_head <= MAX_DIST(s)) {
  1754. /* To simplify the code, we prevent matches with the string
  1755. * of window index 0 (in particular we have to avoid a match
  1756. * of the string with itself at the start of the input file).
  1757. */
  1758. s->match_length = longest_match (s, hash_head);
  1759. /* longest_match() sets match_start */
  1760. if (s->match_length <= 5 && (s->strategy == Z_FILTERED
  1761. #if TOO_FAR <= 32767
  1762. || (s->match_length == MIN_MATCH &&
  1763. s->strstart - s->match_start > TOO_FAR)
  1764. #endif
  1765. )) {
  1766. /* If prev_match is also MIN_MATCH, match_start is garbage
  1767. * but we will ignore the current match anyway.
  1768. */
  1769. s->match_length = MIN_MATCH-1;
  1770. }
  1771. }
  1772. /* If there was a match at the previous step and the current
  1773. * match is not better, output the previous match:
  1774. */
  1775. if (s->prev_length >= MIN_MATCH && s->match_length <= s->prev_length) {
  1776. uInt max_insert = s->strstart + s->lookahead - MIN_MATCH;
  1777. /* Do not insert strings in hash table beyond this. */
  1778. check_match(s, s->strstart - 1, s->prev_match, s->prev_length);
  1779. _tr_tally_dist(s, s->strstart - 1 - s->prev_match,
  1780. s->prev_length - MIN_MATCH, bflush);
  1781. /* Insert in hash table all strings up to the end of the match.
  1782. * strstart - 1 and strstart are already inserted. If there is not
  1783. * enough lookahead, the last two strings are not inserted in
  1784. * the hash table.
  1785. */
  1786. s->lookahead -= s->prev_length - 1;
  1787. s->prev_length -= 2;
  1788. do {
  1789. if (++s->strstart <= max_insert) {
  1790. INSERT_STRING(s, s->strstart, hash_head);
  1791. }
  1792. } while (--s->prev_length != 0);
  1793. s->match_available = 0;
  1794. s->match_length = MIN_MATCH-1;
  1795. s->strstart++;
  1796. if (bflush) FLUSH_BLOCK(s, 0);
  1797. } else if (s->match_available) {
  1798. /* If there was no match at the previous position, output a
  1799. * single literal. If there was a match but the current match
  1800. * is longer, truncate the previous match to a single literal.
  1801. */
  1802. Tracevv((stderr,"%c", s->window[s->strstart - 1]));
  1803. _tr_tally_lit(s, s->window[s->strstart - 1], bflush);
  1804. if (bflush) {
  1805. FLUSH_BLOCK_ONLY(s, 0);
  1806. }
  1807. s->strstart++;
  1808. s->lookahead--;
  1809. if (s->strm->avail_out == 0) return need_more;
  1810. } else {
  1811. /* There is no previous match to compare with, wait for
  1812. * the next step to decide.
  1813. */
  1814. s->match_available = 1;
  1815. s->strstart++;
  1816. s->lookahead--;
  1817. }
  1818. }
  1819. Assert (flush != Z_NO_FLUSH, "no flush?");
  1820. if (s->match_available) {
  1821. Tracevv((stderr,"%c", s->window[s->strstart - 1]));
  1822. _tr_tally_lit(s, s->window[s->strstart - 1], bflush);
  1823. s->match_available = 0;
  1824. }
  1825. s->insert = s->strstart < MIN_MATCH-1 ? s->strstart : MIN_MATCH-1;
  1826. if (flush == Z_FINISH) {
  1827. FLUSH_BLOCK(s, 1);
  1828. return finish_done;
  1829. }
  1830. if (s->sym_next)
  1831. FLUSH_BLOCK(s, 0);
  1832. return block_done;
  1833. }
  1834. #endif /* FASTEST */
  1835. /* ===========================================================================
  1836. * For Z_RLE, simply look for runs of bytes, generate matches only of distance
  1837. * one. Do not maintain a hash table. (It will be regenerated if this run of
  1838. * deflate switches away from Z_RLE.)
  1839. */
  1840. local block_state deflate_rle(deflate_state *s, int flush) {
  1841. int bflush; /* set if current block must be flushed */
  1842. uInt prev; /* byte at distance one to match */
  1843. Bytef *scan, *strend; /* scan goes up to strend for length of run */
  1844. for (;;) {
  1845. /* Make sure that we always have enough lookahead, except
  1846. * at the end of the input file. We need MAX_MATCH bytes
  1847. * for the longest run, plus one for the unrolled loop.
  1848. */
  1849. if (s->lookahead <= MAX_MATCH) {
  1850. fill_window(s);
  1851. if (s->lookahead <= MAX_MATCH && flush == Z_NO_FLUSH) {
  1852. return need_more;
  1853. }
  1854. if (s->lookahead == 0) break; /* flush the current block */
  1855. }
  1856. /* See how many times the previous byte repeats */
  1857. s->match_length = 0;
  1858. if (s->lookahead >= MIN_MATCH && s->strstart > 0) {
  1859. scan = s->window + s->strstart - 1;
  1860. prev = *scan;
  1861. if (prev == *++scan && prev == *++scan && prev == *++scan) {
  1862. strend = s->window + s->strstart + MAX_MATCH;
  1863. do {
  1864. } while (prev == *++scan && prev == *++scan &&
  1865. prev == *++scan && prev == *++scan &&
  1866. prev == *++scan && prev == *++scan &&
  1867. prev == *++scan && prev == *++scan &&
  1868. scan < strend);
  1869. s->match_length = MAX_MATCH - (uInt)(strend - scan);
  1870. if (s->match_length > s->lookahead)
  1871. s->match_length = s->lookahead;
  1872. }
  1873. Assert(scan <= s->window + (uInt)(s->window_size - 1),
  1874. "wild scan");
  1875. }
  1876. /* Emit match if have run of MIN_MATCH or longer, else emit literal */
  1877. if (s->match_length >= MIN_MATCH) {
  1878. check_match(s, s->strstart, s->strstart - 1, s->match_length);
  1879. _tr_tally_dist(s, 1, s->match_length - MIN_MATCH, bflush);
  1880. s->lookahead -= s->match_length;
  1881. s->strstart += s->match_length;
  1882. s->match_length = 0;
  1883. } else {
  1884. /* No match, output a literal byte */
  1885. Tracevv((stderr,"%c", s->window[s->strstart]));
  1886. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1887. s->lookahead--;
  1888. s->strstart++;
  1889. }
  1890. if (bflush) FLUSH_BLOCK(s, 0);
  1891. }
  1892. s->insert = 0;
  1893. if (flush == Z_FINISH) {
  1894. FLUSH_BLOCK(s, 1);
  1895. return finish_done;
  1896. }
  1897. if (s->sym_next)
  1898. FLUSH_BLOCK(s, 0);
  1899. return block_done;
  1900. }
  1901. /* ===========================================================================
  1902. * For Z_HUFFMAN_ONLY, do not look for matches. Do not maintain a hash table.
  1903. * (It will be regenerated if this run of deflate switches away from Huffman.)
  1904. */
  1905. local block_state deflate_huff(deflate_state *s, int flush) {
  1906. int bflush; /* set if current block must be flushed */
  1907. for (;;) {
  1908. /* Make sure that we have a literal to write. */
  1909. if (s->lookahead == 0) {
  1910. fill_window(s);
  1911. if (s->lookahead == 0) {
  1912. if (flush == Z_NO_FLUSH)
  1913. return need_more;
  1914. break; /* flush the current block */
  1915. }
  1916. }
  1917. /* Output a literal byte */
  1918. s->match_length = 0;
  1919. Tracevv((stderr,"%c", s->window[s->strstart]));
  1920. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1921. s->lookahead--;
  1922. s->strstart++;
  1923. if (bflush) FLUSH_BLOCK(s, 0);
  1924. }
  1925. s->insert = 0;
  1926. if (flush == Z_FINISH) {
  1927. FLUSH_BLOCK(s, 1);
  1928. return finish_done;
  1929. }
  1930. if (s->sym_next)
  1931. FLUSH_BLOCK(s, 0);
  1932. return block_done;
  1933. }