deflate.c 80 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140
  1. /* deflate.c -- compress data using the deflation algorithm
  2. * Copyright (C) 1995-2024 Jean-loup Gailly and Mark Adler
  3. * For conditions of distribution and use, see copyright notice in zlib.h
  4. */
  5. /*
  6. * ALGORITHM
  7. *
  8. * The "deflation" process depends on being able to identify portions
  9. * of the input text which are identical to earlier input (within a
  10. * sliding window trailing behind the input currently being processed).
  11. *
  12. * The most straightforward technique turns out to be the fastest for
  13. * most input files: try all possible matches and select the longest.
  14. * The key feature of this algorithm is that insertions into the string
  15. * dictionary are very simple and thus fast, and deletions are avoided
  16. * completely. Insertions are performed at each input character, whereas
  17. * string matches are performed only when the previous match ends. So it
  18. * is preferable to spend more time in matches to allow very fast string
  19. * insertions and avoid deletions. The matching algorithm for small
  20. * strings is inspired from that of Rabin & Karp. A brute force approach
  21. * is used to find longer strings when a small match has been found.
  22. * A similar algorithm is used in comic (by Jan-Mark Wams) and freeze
  23. * (by Leonid Broukhis).
  24. * A previous version of this file used a more sophisticated algorithm
  25. * (by Fiala and Greene) which is guaranteed to run in linear amortized
  26. * time, but has a larger average cost, uses more memory and is patented.
  27. * However the F&G algorithm may be faster for some highly redundant
  28. * files if the parameter max_chain_length (described below) is too large.
  29. *
  30. * ACKNOWLEDGEMENTS
  31. *
  32. * The idea of lazy evaluation of matches is due to Jan-Mark Wams, and
  33. * I found it in 'freeze' written by Leonid Broukhis.
  34. * Thanks to many people for bug reports and testing.
  35. *
  36. * REFERENCES
  37. *
  38. * Deutsch, L.P.,"DEFLATE Compressed Data Format Specification".
  39. * Available in http://tools.ietf.org/html/rfc1951
  40. *
  41. * A description of the Rabin and Karp algorithm is given in the book
  42. * "Algorithms" by R. Sedgewick, Addison-Wesley, p252.
  43. *
  44. * Fiala,E.R., and Greene,D.H.
  45. * Data Compression with Finite Windows, Comm.ACM, 32,4 (1989) 490-595
  46. *
  47. */
  48. /* @(#) $Id$ */
  49. #include "deflate.h"
  50. const char deflate_copyright[] =
  51. " deflate 1.3.1 Copyright 1995-2024 Jean-loup Gailly and Mark Adler ";
  52. /*
  53. If you use the zlib library in a product, an acknowledgment is welcome
  54. in the documentation of your product. If for some reason you cannot
  55. include such an acknowledgment, I would appreciate that you keep this
  56. copyright string in the executable of your product.
  57. */
  58. typedef enum {
  59. need_more, /* block not completed, need more input or more output */
  60. block_done, /* block flush performed */
  61. finish_started, /* finish started, need only more output at next deflate */
  62. finish_done /* finish done, accept no more input or output */
  63. } block_state;
  64. typedef block_state (*compress_func)(deflate_state *s, int flush);
  65. /* Compression function. Returns the block state after the call. */
  66. local block_state deflate_stored(deflate_state *s, int flush);
  67. local block_state deflate_fast(deflate_state *s, int flush);
  68. #ifndef FASTEST
  69. local block_state deflate_slow(deflate_state *s, int flush);
  70. #endif
  71. local block_state deflate_rle(deflate_state *s, int flush);
  72. local block_state deflate_huff(deflate_state *s, int flush);
  73. /* ===========================================================================
  74. * Local data
  75. */
  76. #define NIL 0
  77. /* Tail of hash chains */
  78. #ifndef TOO_FAR
  79. # define TOO_FAR 4096
  80. #endif
  81. /* Matches of length 3 are discarded if their distance exceeds TOO_FAR */
  82. /* Values for max_lazy_match, good_match and max_chain_length, depending on
  83. * the desired pack level (0..9). The values given below have been tuned to
  84. * exclude worst case performance for pathological files. Better values may be
  85. * found for specific files.
  86. */
  87. typedef struct config_s {
  88. ush good_length; /* reduce lazy search above this match length */
  89. ush max_lazy; /* do not perform lazy search above this match length */
  90. ush nice_length; /* quit search above this match length */
  91. ush max_chain;
  92. compress_func func;
  93. } config;
  94. #ifdef FASTEST
  95. local const config configuration_table[2] = {
  96. /* good lazy nice chain */
  97. /* 0 */ {0, 0, 0, 0, deflate_stored}, /* store only */
  98. /* 1 */ {4, 4, 8, 4, deflate_fast}}; /* max speed, no lazy matches */
  99. #else
  100. local const config configuration_table[10] = {
  101. /* good lazy nice chain */
  102. /* 0 */ {0, 0, 0, 0, deflate_stored}, /* store only */
  103. /* 1 */ {4, 4, 8, 4, deflate_fast}, /* max speed, no lazy matches */
  104. /* 2 */ {4, 5, 16, 8, deflate_fast},
  105. /* 3 */ {4, 6, 32, 32, deflate_fast},
  106. /* 4 */ {4, 4, 16, 16, deflate_slow}, /* lazy matches */
  107. /* 5 */ {8, 16, 32, 32, deflate_slow},
  108. /* 6 */ {8, 16, 128, 128, deflate_slow},
  109. /* 7 */ {8, 32, 128, 256, deflate_slow},
  110. /* 8 */ {32, 128, 258, 1024, deflate_slow},
  111. /* 9 */ {32, 258, 258, 4096, deflate_slow}}; /* max compression */
  112. #endif
  113. /* Note: the deflate() code requires max_lazy >= MIN_MATCH and max_chain >= 4
  114. * For deflate_fast() (levels <= 3) good is ignored and lazy has a different
  115. * meaning.
  116. */
  117. /* rank Z_BLOCK between Z_NO_FLUSH and Z_PARTIAL_FLUSH */
  118. #define RANK(f) (((f) * 2) - ((f) > 4 ? 9 : 0))
  119. /* ===========================================================================
  120. * Update a hash value with the given input byte
  121. * IN assertion: all calls to UPDATE_HASH are made with consecutive input
  122. * characters, so that a running hash key can be computed from the previous
  123. * key instead of complete recalculation each time.
  124. */
  125. #define UPDATE_HASH(s,h,c) (h = (((h) << s->hash_shift) ^ (c)) & s->hash_mask)
  126. /* ===========================================================================
  127. * Insert string str in the dictionary and set match_head to the previous head
  128. * of the hash chain (the most recent string with same hash key). Return
  129. * the previous length of the hash chain.
  130. * If this file is compiled with -DFASTEST, the compression level is forced
  131. * to 1, and no hash chains are maintained.
  132. * IN assertion: all calls to INSERT_STRING are made with consecutive input
  133. * characters and the first MIN_MATCH bytes of str are valid (except for
  134. * the last MIN_MATCH-1 bytes of the input file).
  135. */
  136. #ifdef FASTEST
  137. #define INSERT_STRING(s, str, match_head) \
  138. (UPDATE_HASH(s, s->ins_h, s->window[(str) + (MIN_MATCH-1)]), \
  139. match_head = s->head[s->ins_h], \
  140. s->head[s->ins_h] = (Pos)(str))
  141. #else
  142. #define INSERT_STRING(s, str, match_head) \
  143. (UPDATE_HASH(s, s->ins_h, s->window[(str) + (MIN_MATCH-1)]), \
  144. match_head = s->prev[(str) & s->w_mask] = s->head[s->ins_h], \
  145. s->head[s->ins_h] = (Pos)(str))
  146. #endif
  147. /* ===========================================================================
  148. * Initialize the hash table (avoiding 64K overflow for 16 bit systems).
  149. * prev[] will be initialized on the fly.
  150. */
  151. #define CLEAR_HASH(s) \
  152. do { \
  153. s->head[s->hash_size - 1] = NIL; \
  154. zmemzero((Bytef *)s->head, \
  155. (unsigned)(s->hash_size - 1)*sizeof(*s->head)); \
  156. } while (0)
  157. /* ===========================================================================
  158. * Slide the hash table when sliding the window down (could be avoided with 32
  159. * bit values at the expense of memory usage). We slide even when level == 0 to
  160. * keep the hash table consistent if we switch back to level > 0 later.
  161. */
  162. #if defined(__has_feature)
  163. # if __has_feature(memory_sanitizer)
  164. __attribute__((no_sanitize("memory")))
  165. # endif
  166. #endif
  167. local void slide_hash(deflate_state *s) {
  168. unsigned n, m;
  169. Posf *p;
  170. uInt wsize = s->w_size;
  171. n = s->hash_size;
  172. p = &s->head[n];
  173. do {
  174. m = *--p;
  175. *p = (Pos)(m >= wsize ? m - wsize : NIL);
  176. } while (--n);
  177. n = wsize;
  178. #ifndef FASTEST
  179. p = &s->prev[n];
  180. do {
  181. m = *--p;
  182. *p = (Pos)(m >= wsize ? m - wsize : NIL);
  183. /* If n is not on any hash chain, prev[n] is garbage but
  184. * its value will never be used.
  185. */
  186. } while (--n);
  187. #endif
  188. }
  189. /* ===========================================================================
  190. * Read a new buffer from the current input stream, update the adler32
  191. * and total number of bytes read. All deflate() input goes through
  192. * this function so some applications may wish to modify it to avoid
  193. * allocating a large strm->next_in buffer and copying from it.
  194. * (See also flush_pending()).
  195. */
  196. local unsigned read_buf(z_streamp strm, Bytef *buf, unsigned size) {
  197. unsigned len = strm->avail_in;
  198. if (len > size) len = size;
  199. if (len == 0) return 0;
  200. strm->avail_in -= len;
  201. zmemcpy(buf, strm->next_in, len);
  202. if (strm->state->wrap == 1) {
  203. strm->adler = adler32(strm->adler, buf, len);
  204. }
  205. #ifdef GZIP
  206. else if (strm->state->wrap == 2) {
  207. strm->adler = crc32(strm->adler, buf, len);
  208. }
  209. #endif
  210. strm->next_in += len;
  211. strm->total_in += len;
  212. return len;
  213. }
  214. /* ===========================================================================
  215. * Fill the window when the lookahead becomes insufficient.
  216. * Updates strstart and lookahead.
  217. *
  218. * IN assertion: lookahead < MIN_LOOKAHEAD
  219. * OUT assertions: strstart <= window_size-MIN_LOOKAHEAD
  220. * At least one byte has been read, or avail_in == 0; reads are
  221. * performed for at least two bytes (required for the zip translate_eol
  222. * option -- not supported here).
  223. */
  224. local void fill_window(deflate_state *s) {
  225. unsigned n;
  226. unsigned more; /* Amount of free space at the end of the window. */
  227. uInt wsize = s->w_size;
  228. Assert(s->lookahead < MIN_LOOKAHEAD, "already enough lookahead");
  229. do {
  230. more = (unsigned)(s->window_size -(ulg)s->lookahead -(ulg)s->strstart);
  231. /* Deal with !@#$% 64K limit: */
  232. if (sizeof(int) <= 2) {
  233. if (more == 0 && s->strstart == 0 && s->lookahead == 0) {
  234. more = wsize;
  235. } else if (more == (unsigned)(-1)) {
  236. /* Very unlikely, but possible on 16 bit machine if
  237. * strstart == 0 && lookahead == 1 (input done a byte at time)
  238. */
  239. more--;
  240. }
  241. }
  242. /* If the window is almost full and there is insufficient lookahead,
  243. * move the upper half to the lower one to make room in the upper half.
  244. */
  245. if (s->strstart >= wsize + MAX_DIST(s)) {
  246. zmemcpy(s->window, s->window + wsize, (unsigned)wsize - more);
  247. s->match_start -= wsize;
  248. s->strstart -= wsize; /* we now have strstart >= MAX_DIST */
  249. s->block_start -= (long) wsize;
  250. if (s->insert > s->strstart)
  251. s->insert = s->strstart;
  252. slide_hash(s);
  253. more += wsize;
  254. }
  255. if (s->strm->avail_in == 0) break;
  256. /* If there was no sliding:
  257. * strstart <= WSIZE+MAX_DIST-1 && lookahead <= MIN_LOOKAHEAD - 1 &&
  258. * more == window_size - lookahead - strstart
  259. * => more >= window_size - (MIN_LOOKAHEAD-1 + WSIZE + MAX_DIST-1)
  260. * => more >= window_size - 2*WSIZE + 2
  261. * In the BIG_MEM or MMAP case (not yet supported),
  262. * window_size == input_size + MIN_LOOKAHEAD &&
  263. * strstart + s->lookahead <= input_size => more >= MIN_LOOKAHEAD.
  264. * Otherwise, window_size == 2*WSIZE so more >= 2.
  265. * If there was sliding, more >= WSIZE. So in all cases, more >= 2.
  266. */
  267. Assert(more >= 2, "more < 2");
  268. n = read_buf(s->strm, s->window + s->strstart + s->lookahead, more);
  269. s->lookahead += n;
  270. /* Initialize the hash value now that we have some input: */
  271. if (s->lookahead + s->insert >= MIN_MATCH) {
  272. uInt str = s->strstart - s->insert;
  273. s->ins_h = s->window[str];
  274. UPDATE_HASH(s, s->ins_h, s->window[str + 1]);
  275. #if MIN_MATCH != 3
  276. Call UPDATE_HASH() MIN_MATCH-3 more times
  277. #endif
  278. while (s->insert) {
  279. UPDATE_HASH(s, s->ins_h, s->window[str + MIN_MATCH-1]);
  280. #ifndef FASTEST
  281. s->prev[str & s->w_mask] = s->head[s->ins_h];
  282. #endif
  283. s->head[s->ins_h] = (Pos)str;
  284. str++;
  285. s->insert--;
  286. if (s->lookahead + s->insert < MIN_MATCH)
  287. break;
  288. }
  289. }
  290. /* If the whole input has less than MIN_MATCH bytes, ins_h is garbage,
  291. * but this is not important since only literal bytes will be emitted.
  292. */
  293. } while (s->lookahead < MIN_LOOKAHEAD && s->strm->avail_in != 0);
  294. /* If the WIN_INIT bytes after the end of the current data have never been
  295. * written, then zero those bytes in order to avoid memory check reports of
  296. * the use of uninitialized (or uninitialised as Julian writes) bytes by
  297. * the longest match routines. Update the high water mark for the next
  298. * time through here. WIN_INIT is set to MAX_MATCH since the longest match
  299. * routines allow scanning to strstart + MAX_MATCH, ignoring lookahead.
  300. */
  301. if (s->high_water < s->window_size) {
  302. ulg curr = s->strstart + (ulg)(s->lookahead);
  303. ulg init;
  304. if (s->high_water < curr) {
  305. /* Previous high water mark below current data -- zero WIN_INIT
  306. * bytes or up to end of window, whichever is less.
  307. */
  308. init = s->window_size - curr;
  309. if (init > WIN_INIT)
  310. init = WIN_INIT;
  311. zmemzero(s->window + curr, (unsigned)init);
  312. s->high_water = curr + init;
  313. }
  314. else if (s->high_water < (ulg)curr + WIN_INIT) {
  315. /* High water mark at or above current data, but below current data
  316. * plus WIN_INIT -- zero out to current data plus WIN_INIT, or up
  317. * to end of window, whichever is less.
  318. */
  319. init = (ulg)curr + WIN_INIT - s->high_water;
  320. if (init > s->window_size - s->high_water)
  321. init = s->window_size - s->high_water;
  322. zmemzero(s->window + s->high_water, (unsigned)init);
  323. s->high_water += init;
  324. }
  325. }
  326. Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
  327. "not enough room for search");
  328. }
  329. /* ========================================================================= */
  330. int ZEXPORT deflateInit_(z_streamp strm, int level, const char *version,
  331. int stream_size) {
  332. return deflateInit2_(strm, level, Z_DEFLATED, MAX_WBITS, DEF_MEM_LEVEL,
  333. Z_DEFAULT_STRATEGY, version, stream_size);
  334. /* To do: ignore strm->next_in if we use it as window */
  335. }
  336. /* ========================================================================= */
  337. int ZEXPORT deflateInit2_(z_streamp strm, int level, int method,
  338. int windowBits, int memLevel, int strategy,
  339. const char *version, int stream_size) {
  340. deflate_state *s;
  341. int wrap = 1;
  342. static const char my_version[] = ZLIB_VERSION;
  343. if (version == Z_NULL || version[0] != my_version[0] ||
  344. stream_size != sizeof(z_stream)) {
  345. return Z_VERSION_ERROR;
  346. }
  347. if (strm == Z_NULL) return Z_STREAM_ERROR;
  348. strm->msg = Z_NULL;
  349. if (strm->zalloc == (alloc_func)0) {
  350. #ifdef Z_SOLO
  351. return Z_STREAM_ERROR;
  352. #else
  353. strm->zalloc = zcalloc;
  354. strm->opaque = (voidpf)0;
  355. #endif
  356. }
  357. if (strm->zfree == (free_func)0)
  358. #ifdef Z_SOLO
  359. return Z_STREAM_ERROR;
  360. #else
  361. strm->zfree = zcfree;
  362. #endif
  363. #ifdef FASTEST
  364. if (level != 0) level = 1;
  365. #else
  366. if (level == Z_DEFAULT_COMPRESSION) level = 6;
  367. #endif
  368. if (windowBits < 0) { /* suppress zlib wrapper */
  369. wrap = 0;
  370. if (windowBits < -15)
  371. return Z_STREAM_ERROR;
  372. windowBits = -windowBits;
  373. }
  374. #ifdef GZIP
  375. else if (windowBits > 15) {
  376. wrap = 2; /* write gzip wrapper instead */
  377. windowBits -= 16;
  378. }
  379. #endif
  380. if (memLevel < 1 || memLevel > MAX_MEM_LEVEL || method != Z_DEFLATED ||
  381. windowBits < 8 || windowBits > 15 || level < 0 || level > 9 ||
  382. strategy < 0 || strategy > Z_FIXED || (windowBits == 8 && wrap != 1)) {
  383. return Z_STREAM_ERROR;
  384. }
  385. if (windowBits == 8) windowBits = 9; /* until 256-byte window bug fixed */
  386. s = (deflate_state *) ZALLOC(strm, 1, sizeof(deflate_state));
  387. if (s == Z_NULL) return Z_MEM_ERROR;
  388. strm->state = (struct internal_state FAR *)s;
  389. s->strm = strm;
  390. s->status = INIT_STATE; /* to pass state test in deflateReset() */
  391. s->wrap = wrap;
  392. s->gzhead = Z_NULL;
  393. s->w_bits = (uInt)windowBits;
  394. s->w_size = 1 << s->w_bits;
  395. s->w_mask = s->w_size - 1;
  396. s->hash_bits = (uInt)memLevel + 7;
  397. s->hash_size = 1 << s->hash_bits;
  398. s->hash_mask = s->hash_size - 1;
  399. s->hash_shift = ((s->hash_bits + MIN_MATCH-1) / MIN_MATCH);
  400. s->window = (Bytef *) ZALLOC(strm, s->w_size, 2*sizeof(Byte));
  401. s->prev = (Posf *) ZALLOC(strm, s->w_size, sizeof(Pos));
  402. s->head = (Posf *) ZALLOC(strm, s->hash_size, sizeof(Pos));
  403. s->high_water = 0; /* nothing written to s->window yet */
  404. s->lit_bufsize = 1 << (memLevel + 6); /* 16K elements by default */
  405. /* We overlay pending_buf and sym_buf. This works since the average size
  406. * for length/distance pairs over any compressed block is assured to be 31
  407. * bits or less.
  408. *
  409. * Analysis: The longest fixed codes are a length code of 8 bits plus 5
  410. * extra bits, for lengths 131 to 257. The longest fixed distance codes are
  411. * 5 bits plus 13 extra bits, for distances 16385 to 32768. The longest
  412. * possible fixed-codes length/distance pair is then 31 bits total.
  413. *
  414. * sym_buf starts one-fourth of the way into pending_buf. So there are
  415. * three bytes in sym_buf for every four bytes in pending_buf. Each symbol
  416. * in sym_buf is three bytes -- two for the distance and one for the
  417. * literal/length. As each symbol is consumed, the pointer to the next
  418. * sym_buf value to read moves forward three bytes. From that symbol, up to
  419. * 31 bits are written to pending_buf. The closest the written pending_buf
  420. * bits gets to the next sym_buf symbol to read is just before the last
  421. * code is written. At that time, 31*(n - 2) bits have been written, just
  422. * after 24*(n - 2) bits have been consumed from sym_buf. sym_buf starts at
  423. * 8*n bits into pending_buf. (Note that the symbol buffer fills when n - 1
  424. * symbols are written.) The closest the writing gets to what is unread is
  425. * then n + 14 bits. Here n is lit_bufsize, which is 16384 by default, and
  426. * can range from 128 to 32768.
  427. *
  428. * Therefore, at a minimum, there are 142 bits of space between what is
  429. * written and what is read in the overlain buffers, so the symbols cannot
  430. * be overwritten by the compressed data. That space is actually 139 bits,
  431. * due to the three-bit fixed-code block header.
  432. *
  433. * That covers the case where either Z_FIXED is specified, forcing fixed
  434. * codes, or when the use of fixed codes is chosen, because that choice
  435. * results in a smaller compressed block than dynamic codes. That latter
  436. * condition then assures that the above analysis also covers all dynamic
  437. * blocks. A dynamic-code block will only be chosen to be emitted if it has
  438. * fewer bits than a fixed-code block would for the same set of symbols.
  439. * Therefore its average symbol length is assured to be less than 31. So
  440. * the compressed data for a dynamic block also cannot overwrite the
  441. * symbols from which it is being constructed.
  442. */
  443. s->pending_buf = (uchf *) ZALLOC(strm, s->lit_bufsize, LIT_BUFS);
  444. s->pending_buf_size = (ulg)s->lit_bufsize * 4;
  445. if (s->window == Z_NULL || s->prev == Z_NULL || s->head == Z_NULL ||
  446. s->pending_buf == Z_NULL) {
  447. s->status = FINISH_STATE;
  448. strm->msg = ERR_MSG(Z_MEM_ERROR);
  449. deflateEnd (strm);
  450. return Z_MEM_ERROR;
  451. }
  452. #ifdef LIT_MEM
  453. s->d_buf = (ushf *)(s->pending_buf + (s->lit_bufsize << 1));
  454. s->l_buf = s->pending_buf + (s->lit_bufsize << 2);
  455. s->sym_end = s->lit_bufsize - 1;
  456. #else
  457. s->sym_buf = s->pending_buf + s->lit_bufsize;
  458. s->sym_end = (s->lit_bufsize - 1) * 3;
  459. #endif
  460. /* We avoid equality with lit_bufsize*3 because of wraparound at 64K
  461. * on 16 bit machines and because stored blocks are restricted to
  462. * 64K-1 bytes.
  463. */
  464. s->level = level;
  465. s->strategy = strategy;
  466. s->method = (Byte)method;
  467. return deflateReset(strm);
  468. }
  469. /* =========================================================================
  470. * Check for a valid deflate stream state. Return 0 if ok, 1 if not.
  471. */
  472. local int deflateStateCheck(z_streamp strm) {
  473. deflate_state *s;
  474. if (strm == Z_NULL ||
  475. strm->zalloc == (alloc_func)0 || strm->zfree == (free_func)0)
  476. return 1;
  477. s = strm->state;
  478. if (s == Z_NULL || s->strm != strm || (s->status != INIT_STATE &&
  479. #ifdef GZIP
  480. s->status != GZIP_STATE &&
  481. #endif
  482. s->status != EXTRA_STATE &&
  483. s->status != NAME_STATE &&
  484. s->status != COMMENT_STATE &&
  485. s->status != HCRC_STATE &&
  486. s->status != BUSY_STATE &&
  487. s->status != FINISH_STATE))
  488. return 1;
  489. return 0;
  490. }
  491. /* ========================================================================= */
  492. int ZEXPORT deflateSetDictionary(z_streamp strm, const Bytef *dictionary,
  493. uInt dictLength) {
  494. deflate_state *s;
  495. uInt str, n;
  496. int wrap;
  497. unsigned avail;
  498. z_const unsigned char *next;
  499. if (deflateStateCheck(strm) || dictionary == Z_NULL)
  500. return Z_STREAM_ERROR;
  501. s = strm->state;
  502. wrap = s->wrap;
  503. if (wrap == 2 || (wrap == 1 && s->status != INIT_STATE) || s->lookahead)
  504. return Z_STREAM_ERROR;
  505. /* when using zlib wrappers, compute Adler-32 for provided dictionary */
  506. if (wrap == 1)
  507. strm->adler = adler32(strm->adler, dictionary, dictLength);
  508. s->wrap = 0; /* avoid computing Adler-32 in read_buf */
  509. /* if dictionary would fill window, just replace the history */
  510. if (dictLength >= s->w_size) {
  511. if (wrap == 0) { /* already empty otherwise */
  512. CLEAR_HASH(s);
  513. s->strstart = 0;
  514. s->block_start = 0L;
  515. s->insert = 0;
  516. }
  517. dictionary += dictLength - s->w_size; /* use the tail */
  518. dictLength = s->w_size;
  519. }
  520. /* insert dictionary into window and hash */
  521. avail = strm->avail_in;
  522. next = strm->next_in;
  523. strm->avail_in = dictLength;
  524. strm->next_in = (z_const Bytef *)dictionary;
  525. fill_window(s);
  526. while (s->lookahead >= MIN_MATCH) {
  527. str = s->strstart;
  528. n = s->lookahead - (MIN_MATCH-1);
  529. do {
  530. UPDATE_HASH(s, s->ins_h, s->window[str + MIN_MATCH-1]);
  531. #ifndef FASTEST
  532. s->prev[str & s->w_mask] = s->head[s->ins_h];
  533. #endif
  534. s->head[s->ins_h] = (Pos)str;
  535. str++;
  536. } while (--n);
  537. s->strstart = str;
  538. s->lookahead = MIN_MATCH-1;
  539. fill_window(s);
  540. }
  541. s->strstart += s->lookahead;
  542. s->block_start = (long)s->strstart;
  543. s->insert = s->lookahead;
  544. s->lookahead = 0;
  545. s->match_length = s->prev_length = MIN_MATCH-1;
  546. s->match_available = 0;
  547. strm->next_in = next;
  548. strm->avail_in = avail;
  549. s->wrap = wrap;
  550. return Z_OK;
  551. }
  552. /* ========================================================================= */
  553. int ZEXPORT deflateGetDictionary(z_streamp strm, Bytef *dictionary,
  554. uInt *dictLength) {
  555. deflate_state *s;
  556. uInt len;
  557. if (deflateStateCheck(strm))
  558. return Z_STREAM_ERROR;
  559. s = strm->state;
  560. len = s->strstart + s->lookahead;
  561. if (len > s->w_size)
  562. len = s->w_size;
  563. if (dictionary != Z_NULL && len)
  564. zmemcpy(dictionary, s->window + s->strstart + s->lookahead - len, len);
  565. if (dictLength != Z_NULL)
  566. *dictLength = len;
  567. return Z_OK;
  568. }
  569. /* ========================================================================= */
  570. int ZEXPORT deflateResetKeep(z_streamp strm) {
  571. deflate_state *s;
  572. if (deflateStateCheck(strm)) {
  573. return Z_STREAM_ERROR;
  574. }
  575. strm->total_in = strm->total_out = 0;
  576. strm->msg = Z_NULL; /* use zfree if we ever allocate msg dynamically */
  577. strm->data_type = Z_UNKNOWN;
  578. s = (deflate_state *)strm->state;
  579. s->pending = 0;
  580. s->pending_out = s->pending_buf;
  581. if (s->wrap < 0) {
  582. s->wrap = -s->wrap; /* was made negative by deflate(..., Z_FINISH); */
  583. }
  584. s->status =
  585. #ifdef GZIP
  586. s->wrap == 2 ? GZIP_STATE :
  587. #endif
  588. INIT_STATE;
  589. strm->adler =
  590. #ifdef GZIP
  591. s->wrap == 2 ? crc32(0L, Z_NULL, 0) :
  592. #endif
  593. adler32(0L, Z_NULL, 0);
  594. s->last_flush = -2;
  595. _tr_init(s);
  596. return Z_OK;
  597. }
  598. /* ===========================================================================
  599. * Initialize the "longest match" routines for a new zlib stream
  600. */
  601. local void lm_init(deflate_state *s) {
  602. s->window_size = (ulg)2L*s->w_size;
  603. CLEAR_HASH(s);
  604. /* Set the default configuration parameters:
  605. */
  606. s->max_lazy_match = configuration_table[s->level].max_lazy;
  607. s->good_match = configuration_table[s->level].good_length;
  608. s->nice_match = configuration_table[s->level].nice_length;
  609. s->max_chain_length = configuration_table[s->level].max_chain;
  610. s->strstart = 0;
  611. s->block_start = 0L;
  612. s->lookahead = 0;
  613. s->insert = 0;
  614. s->match_length = s->prev_length = MIN_MATCH-1;
  615. s->match_available = 0;
  616. s->ins_h = 0;
  617. }
  618. /* ========================================================================= */
  619. int ZEXPORT deflateReset(z_streamp strm) {
  620. int ret;
  621. ret = deflateResetKeep(strm);
  622. if (ret == Z_OK)
  623. lm_init(strm->state);
  624. return ret;
  625. }
  626. /* ========================================================================= */
  627. int ZEXPORT deflateSetHeader(z_streamp strm, gz_headerp head) {
  628. if (deflateStateCheck(strm) || strm->state->wrap != 2)
  629. return Z_STREAM_ERROR;
  630. strm->state->gzhead = head;
  631. return Z_OK;
  632. }
  633. /* ========================================================================= */
  634. int ZEXPORT deflatePending(z_streamp strm, unsigned *pending, int *bits) {
  635. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  636. if (pending != Z_NULL)
  637. *pending = strm->state->pending;
  638. if (bits != Z_NULL)
  639. *bits = strm->state->bi_valid;
  640. return Z_OK;
  641. }
  642. /* ========================================================================= */
  643. int ZEXPORT deflatePrime(z_streamp strm, int bits, int value) {
  644. deflate_state *s;
  645. int put;
  646. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  647. s = strm->state;
  648. #ifdef LIT_MEM
  649. if (bits < 0 || bits > 16 ||
  650. (uchf *)s->d_buf < s->pending_out + ((Buf_size + 7) >> 3))
  651. return Z_BUF_ERROR;
  652. #else
  653. if (bits < 0 || bits > 16 ||
  654. s->sym_buf < s->pending_out + ((Buf_size + 7) >> 3))
  655. return Z_BUF_ERROR;
  656. #endif
  657. do {
  658. put = Buf_size - s->bi_valid;
  659. if (put > bits)
  660. put = bits;
  661. s->bi_buf |= (ush)((value & ((1 << put) - 1)) << s->bi_valid);
  662. s->bi_valid += put;
  663. _tr_flush_bits(s);
  664. value >>= put;
  665. bits -= put;
  666. } while (bits);
  667. return Z_OK;
  668. }
  669. /* ========================================================================= */
  670. int ZEXPORT deflateParams(z_streamp strm, int level, int strategy) {
  671. deflate_state *s;
  672. compress_func func;
  673. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  674. s = strm->state;
  675. #ifdef FASTEST
  676. if (level != 0) level = 1;
  677. #else
  678. if (level == Z_DEFAULT_COMPRESSION) level = 6;
  679. #endif
  680. if (level < 0 || level > 9 || strategy < 0 || strategy > Z_FIXED) {
  681. return Z_STREAM_ERROR;
  682. }
  683. func = configuration_table[s->level].func;
  684. if ((strategy != s->strategy || func != configuration_table[level].func) &&
  685. s->last_flush != -2) {
  686. /* Flush the last buffer: */
  687. int err = deflate(strm, Z_BLOCK);
  688. if (err == Z_STREAM_ERROR)
  689. return err;
  690. if (strm->avail_in || (s->strstart - s->block_start) + s->lookahead)
  691. return Z_BUF_ERROR;
  692. }
  693. if (s->level != level) {
  694. if (s->level == 0 && s->matches != 0) {
  695. if (s->matches == 1)
  696. slide_hash(s);
  697. else
  698. CLEAR_HASH(s);
  699. s->matches = 0;
  700. }
  701. s->level = level;
  702. s->max_lazy_match = configuration_table[level].max_lazy;
  703. s->good_match = configuration_table[level].good_length;
  704. s->nice_match = configuration_table[level].nice_length;
  705. s->max_chain_length = configuration_table[level].max_chain;
  706. }
  707. s->strategy = strategy;
  708. return Z_OK;
  709. }
  710. /* ========================================================================= */
  711. int ZEXPORT deflateTune(z_streamp strm, int good_length, int max_lazy,
  712. int nice_length, int max_chain) {
  713. deflate_state *s;
  714. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  715. s = strm->state;
  716. s->good_match = (uInt)good_length;
  717. s->max_lazy_match = (uInt)max_lazy;
  718. s->nice_match = nice_length;
  719. s->max_chain_length = (uInt)max_chain;
  720. return Z_OK;
  721. }
  722. /* =========================================================================
  723. * For the default windowBits of 15 and memLevel of 8, this function returns a
  724. * close to exact, as well as small, upper bound on the compressed size. This
  725. * is an expansion of ~0.03%, plus a small constant.
  726. *
  727. * For any setting other than those defaults for windowBits and memLevel, one
  728. * of two worst case bounds is returned. This is at most an expansion of ~4% or
  729. * ~13%, plus a small constant.
  730. *
  731. * Both the 0.03% and 4% derive from the overhead of stored blocks. The first
  732. * one is for stored blocks of 16383 bytes (memLevel == 8), whereas the second
  733. * is for stored blocks of 127 bytes (the worst case memLevel == 1). The
  734. * expansion results from five bytes of header for each stored block.
  735. *
  736. * The larger expansion of 13% results from a window size less than or equal to
  737. * the symbols buffer size (windowBits <= memLevel + 7). In that case some of
  738. * the data being compressed may have slid out of the sliding window, impeding
  739. * a stored block from being emitted. Then the only choice is a fixed or
  740. * dynamic block, where a fixed block limits the maximum expansion to 9 bits
  741. * per 8-bit byte, plus 10 bits for every block. The smallest block size for
  742. * which this can occur is 255 (memLevel == 2).
  743. *
  744. * Shifts are used to approximate divisions, for speed.
  745. */
  746. uLong ZEXPORT deflateBound(z_streamp strm, uLong sourceLen) {
  747. deflate_state *s;
  748. uLong fixedlen, storelen, wraplen;
  749. /* upper bound for fixed blocks with 9-bit literals and length 255
  750. (memLevel == 2, which is the lowest that may not use stored blocks) --
  751. ~13% overhead plus a small constant */
  752. fixedlen = sourceLen + (sourceLen >> 3) + (sourceLen >> 8) +
  753. (sourceLen >> 9) + 4;
  754. /* upper bound for stored blocks with length 127 (memLevel == 1) --
  755. ~4% overhead plus a small constant */
  756. storelen = sourceLen + (sourceLen >> 5) + (sourceLen >> 7) +
  757. (sourceLen >> 11) + 7;
  758. /* if can't get parameters, return larger bound plus a zlib wrapper */
  759. if (deflateStateCheck(strm))
  760. return (fixedlen > storelen ? fixedlen : storelen) + 6;
  761. /* compute wrapper length */
  762. s = strm->state;
  763. switch (s->wrap) {
  764. case 0: /* raw deflate */
  765. wraplen = 0;
  766. break;
  767. case 1: /* zlib wrapper */
  768. wraplen = 6 + (s->strstart ? 4 : 0);
  769. break;
  770. #ifdef GZIP
  771. case 2: /* gzip wrapper */
  772. wraplen = 18;
  773. if (s->gzhead != Z_NULL) { /* user-supplied gzip header */
  774. Bytef *str;
  775. if (s->gzhead->extra != Z_NULL)
  776. wraplen += 2 + s->gzhead->extra_len;
  777. str = s->gzhead->name;
  778. if (str != Z_NULL)
  779. do {
  780. wraplen++;
  781. } while (*str++);
  782. str = s->gzhead->comment;
  783. if (str != Z_NULL)
  784. do {
  785. wraplen++;
  786. } while (*str++);
  787. if (s->gzhead->hcrc)
  788. wraplen += 2;
  789. }
  790. break;
  791. #endif
  792. default: /* for compiler happiness */
  793. wraplen = 6;
  794. }
  795. /* if not default parameters, return one of the conservative bounds */
  796. if (s->w_bits != 15 || s->hash_bits != 8 + 7)
  797. return (s->w_bits <= s->hash_bits && s->level ? fixedlen : storelen) +
  798. wraplen;
  799. /* default settings: return tight bound for that case -- ~0.03% overhead
  800. plus a small constant */
  801. return sourceLen + (sourceLen >> 12) + (sourceLen >> 14) +
  802. (sourceLen >> 25) + 13 - 6 + wraplen;
  803. }
  804. /* =========================================================================
  805. * Put a short in the pending buffer. The 16-bit value is put in MSB order.
  806. * IN assertion: the stream state is correct and there is enough room in
  807. * pending_buf.
  808. */
  809. local void putShortMSB(deflate_state *s, uInt b) {
  810. put_byte(s, (Byte)(b >> 8));
  811. put_byte(s, (Byte)(b & 0xff));
  812. }
  813. /* =========================================================================
  814. * Flush as much pending output as possible. All deflate() output, except for
  815. * some deflate_stored() output, goes through this function so some
  816. * applications may wish to modify it to avoid allocating a large
  817. * strm->next_out buffer and copying into it. (See also read_buf()).
  818. */
  819. local void flush_pending(z_streamp strm) {
  820. unsigned len;
  821. deflate_state *s = strm->state;
  822. _tr_flush_bits(s);
  823. len = s->pending;
  824. if (len > strm->avail_out) len = strm->avail_out;
  825. if (len == 0) return;
  826. zmemcpy(strm->next_out, s->pending_out, len);
  827. strm->next_out += len;
  828. s->pending_out += len;
  829. strm->total_out += len;
  830. strm->avail_out -= len;
  831. s->pending -= len;
  832. if (s->pending == 0) {
  833. s->pending_out = s->pending_buf;
  834. }
  835. }
  836. /* ===========================================================================
  837. * Update the header CRC with the bytes s->pending_buf[beg..s->pending - 1].
  838. */
  839. #define HCRC_UPDATE(beg) \
  840. do { \
  841. if (s->gzhead->hcrc && s->pending > (beg)) \
  842. strm->adler = crc32(strm->adler, s->pending_buf + (beg), \
  843. s->pending - (beg)); \
  844. } while (0)
  845. /* ========================================================================= */
  846. int ZEXPORT deflate(z_streamp strm, int flush) {
  847. int old_flush; /* value of flush param for previous deflate call */
  848. deflate_state *s;
  849. if (deflateStateCheck(strm) || flush > Z_BLOCK || flush < 0) {
  850. return Z_STREAM_ERROR;
  851. }
  852. s = strm->state;
  853. if (strm->next_out == Z_NULL ||
  854. (strm->avail_in != 0 && strm->next_in == Z_NULL) ||
  855. (s->status == FINISH_STATE && flush != Z_FINISH)) {
  856. ERR_RETURN(strm, Z_STREAM_ERROR);
  857. }
  858. if (strm->avail_out == 0) ERR_RETURN(strm, Z_BUF_ERROR);
  859. old_flush = s->last_flush;
  860. s->last_flush = flush;
  861. /* Flush as much pending output as possible */
  862. if (s->pending != 0) {
  863. flush_pending(strm);
  864. if (strm->avail_out == 0) {
  865. /* Since avail_out is 0, deflate will be called again with
  866. * more output space, but possibly with both pending and
  867. * avail_in equal to zero. There won't be anything to do,
  868. * but this is not an error situation so make sure we
  869. * return OK instead of BUF_ERROR at next call of deflate:
  870. */
  871. s->last_flush = -1;
  872. return Z_OK;
  873. }
  874. /* Make sure there is something to do and avoid duplicate consecutive
  875. * flushes. For repeated and useless calls with Z_FINISH, we keep
  876. * returning Z_STREAM_END instead of Z_BUF_ERROR.
  877. */
  878. } else if (strm->avail_in == 0 && RANK(flush) <= RANK(old_flush) &&
  879. flush != Z_FINISH) {
  880. ERR_RETURN(strm, Z_BUF_ERROR);
  881. }
  882. /* User must not provide more input after the first FINISH: */
  883. if (s->status == FINISH_STATE && strm->avail_in != 0) {
  884. ERR_RETURN(strm, Z_BUF_ERROR);
  885. }
  886. /* Write the header */
  887. if (s->status == INIT_STATE && s->wrap == 0)
  888. s->status = BUSY_STATE;
  889. if (s->status == INIT_STATE) {
  890. /* zlib header */
  891. uInt header = (Z_DEFLATED + ((s->w_bits - 8) << 4)) << 8;
  892. uInt level_flags;
  893. if (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2)
  894. level_flags = 0;
  895. else if (s->level < 6)
  896. level_flags = 1;
  897. else if (s->level == 6)
  898. level_flags = 2;
  899. else
  900. level_flags = 3;
  901. header |= (level_flags << 6);
  902. if (s->strstart != 0) header |= PRESET_DICT;
  903. header += 31 - (header % 31);
  904. putShortMSB(s, header);
  905. /* Save the adler32 of the preset dictionary: */
  906. if (s->strstart != 0) {
  907. putShortMSB(s, (uInt)(strm->adler >> 16));
  908. putShortMSB(s, (uInt)(strm->adler & 0xffff));
  909. }
  910. strm->adler = adler32(0L, Z_NULL, 0);
  911. s->status = BUSY_STATE;
  912. /* Compression must start with an empty pending buffer */
  913. flush_pending(strm);
  914. if (s->pending != 0) {
  915. s->last_flush = -1;
  916. return Z_OK;
  917. }
  918. }
  919. #ifdef GZIP
  920. if (s->status == GZIP_STATE) {
  921. /* gzip header */
  922. strm->adler = crc32(0L, Z_NULL, 0);
  923. put_byte(s, 31);
  924. put_byte(s, 139);
  925. put_byte(s, 8);
  926. if (s->gzhead == Z_NULL) {
  927. put_byte(s, 0);
  928. put_byte(s, 0);
  929. put_byte(s, 0);
  930. put_byte(s, 0);
  931. put_byte(s, 0);
  932. put_byte(s, s->level == 9 ? 2 :
  933. (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2 ?
  934. 4 : 0));
  935. put_byte(s, OS_CODE);
  936. s->status = BUSY_STATE;
  937. /* Compression must start with an empty pending buffer */
  938. flush_pending(strm);
  939. if (s->pending != 0) {
  940. s->last_flush = -1;
  941. return Z_OK;
  942. }
  943. }
  944. else {
  945. put_byte(s, (s->gzhead->text ? 1 : 0) +
  946. (s->gzhead->hcrc ? 2 : 0) +
  947. (s->gzhead->extra == Z_NULL ? 0 : 4) +
  948. (s->gzhead->name == Z_NULL ? 0 : 8) +
  949. (s->gzhead->comment == Z_NULL ? 0 : 16)
  950. );
  951. put_byte(s, (Byte)(s->gzhead->time & 0xff));
  952. put_byte(s, (Byte)((s->gzhead->time >> 8) & 0xff));
  953. put_byte(s, (Byte)((s->gzhead->time >> 16) & 0xff));
  954. put_byte(s, (Byte)((s->gzhead->time >> 24) & 0xff));
  955. put_byte(s, s->level == 9 ? 2 :
  956. (s->strategy >= Z_HUFFMAN_ONLY || s->level < 2 ?
  957. 4 : 0));
  958. put_byte(s, s->gzhead->os & 0xff);
  959. if (s->gzhead->extra != Z_NULL) {
  960. put_byte(s, s->gzhead->extra_len & 0xff);
  961. put_byte(s, (s->gzhead->extra_len >> 8) & 0xff);
  962. }
  963. if (s->gzhead->hcrc)
  964. strm->adler = crc32(strm->adler, s->pending_buf,
  965. s->pending);
  966. s->gzindex = 0;
  967. s->status = EXTRA_STATE;
  968. }
  969. }
  970. if (s->status == EXTRA_STATE) {
  971. if (s->gzhead->extra != Z_NULL) {
  972. ulg beg = s->pending; /* start of bytes to update crc */
  973. uInt left = (s->gzhead->extra_len & 0xffff) - s->gzindex;
  974. while (s->pending + left > s->pending_buf_size) {
  975. uInt copy = s->pending_buf_size - s->pending;
  976. zmemcpy(s->pending_buf + s->pending,
  977. s->gzhead->extra + s->gzindex, copy);
  978. s->pending = s->pending_buf_size;
  979. HCRC_UPDATE(beg);
  980. s->gzindex += copy;
  981. flush_pending(strm);
  982. if (s->pending != 0) {
  983. s->last_flush = -1;
  984. return Z_OK;
  985. }
  986. beg = 0;
  987. left -= copy;
  988. }
  989. zmemcpy(s->pending_buf + s->pending,
  990. s->gzhead->extra + s->gzindex, left);
  991. s->pending += left;
  992. HCRC_UPDATE(beg);
  993. s->gzindex = 0;
  994. }
  995. s->status = NAME_STATE;
  996. }
  997. if (s->status == NAME_STATE) {
  998. if (s->gzhead->name != Z_NULL) {
  999. ulg beg = s->pending; /* start of bytes to update crc */
  1000. int val;
  1001. do {
  1002. if (s->pending == s->pending_buf_size) {
  1003. HCRC_UPDATE(beg);
  1004. flush_pending(strm);
  1005. if (s->pending != 0) {
  1006. s->last_flush = -1;
  1007. return Z_OK;
  1008. }
  1009. beg = 0;
  1010. }
  1011. val = s->gzhead->name[s->gzindex++];
  1012. put_byte(s, val);
  1013. } while (val != 0);
  1014. HCRC_UPDATE(beg);
  1015. s->gzindex = 0;
  1016. }
  1017. s->status = COMMENT_STATE;
  1018. }
  1019. if (s->status == COMMENT_STATE) {
  1020. if (s->gzhead->comment != Z_NULL) {
  1021. ulg beg = s->pending; /* start of bytes to update crc */
  1022. int val;
  1023. do {
  1024. if (s->pending == s->pending_buf_size) {
  1025. HCRC_UPDATE(beg);
  1026. flush_pending(strm);
  1027. if (s->pending != 0) {
  1028. s->last_flush = -1;
  1029. return Z_OK;
  1030. }
  1031. beg = 0;
  1032. }
  1033. val = s->gzhead->comment[s->gzindex++];
  1034. put_byte(s, val);
  1035. } while (val != 0);
  1036. HCRC_UPDATE(beg);
  1037. }
  1038. s->status = HCRC_STATE;
  1039. }
  1040. if (s->status == HCRC_STATE) {
  1041. if (s->gzhead->hcrc) {
  1042. if (s->pending + 2 > s->pending_buf_size) {
  1043. flush_pending(strm);
  1044. if (s->pending != 0) {
  1045. s->last_flush = -1;
  1046. return Z_OK;
  1047. }
  1048. }
  1049. put_byte(s, (Byte)(strm->adler & 0xff));
  1050. put_byte(s, (Byte)((strm->adler >> 8) & 0xff));
  1051. strm->adler = crc32(0L, Z_NULL, 0);
  1052. }
  1053. s->status = BUSY_STATE;
  1054. /* Compression must start with an empty pending buffer */
  1055. flush_pending(strm);
  1056. if (s->pending != 0) {
  1057. s->last_flush = -1;
  1058. return Z_OK;
  1059. }
  1060. }
  1061. #endif
  1062. /* Start a new block or continue the current one.
  1063. */
  1064. if (strm->avail_in != 0 || s->lookahead != 0 ||
  1065. (flush != Z_NO_FLUSH && s->status != FINISH_STATE)) {
  1066. block_state bstate;
  1067. bstate = s->level == 0 ? deflate_stored(s, flush) :
  1068. s->strategy == Z_HUFFMAN_ONLY ? deflate_huff(s, flush) :
  1069. s->strategy == Z_RLE ? deflate_rle(s, flush) :
  1070. (*(configuration_table[s->level].func))(s, flush);
  1071. if (bstate == finish_started || bstate == finish_done) {
  1072. s->status = FINISH_STATE;
  1073. }
  1074. if (bstate == need_more || bstate == finish_started) {
  1075. if (strm->avail_out == 0) {
  1076. s->last_flush = -1; /* avoid BUF_ERROR next call, see above */
  1077. }
  1078. return Z_OK;
  1079. /* If flush != Z_NO_FLUSH && avail_out == 0, the next call
  1080. * of deflate should use the same flush parameter to make sure
  1081. * that the flush is complete. So we don't have to output an
  1082. * empty block here, this will be done at next call. This also
  1083. * ensures that for a very small output buffer, we emit at most
  1084. * one empty block.
  1085. */
  1086. }
  1087. if (bstate == block_done) {
  1088. if (flush == Z_PARTIAL_FLUSH) {
  1089. _tr_align(s);
  1090. } else if (flush != Z_BLOCK) { /* FULL_FLUSH or SYNC_FLUSH */
  1091. _tr_stored_block(s, (char*)0, 0L, 0);
  1092. /* For a full flush, this empty block will be recognized
  1093. * as a special marker by inflate_sync().
  1094. */
  1095. if (flush == Z_FULL_FLUSH) {
  1096. CLEAR_HASH(s); /* forget history */
  1097. if (s->lookahead == 0) {
  1098. s->strstart = 0;
  1099. s->block_start = 0L;
  1100. s->insert = 0;
  1101. }
  1102. }
  1103. }
  1104. flush_pending(strm);
  1105. if (strm->avail_out == 0) {
  1106. s->last_flush = -1; /* avoid BUF_ERROR at next call, see above */
  1107. return Z_OK;
  1108. }
  1109. }
  1110. }
  1111. if (flush != Z_FINISH) return Z_OK;
  1112. if (s->wrap <= 0) return Z_STREAM_END;
  1113. /* Write the trailer */
  1114. #ifdef GZIP
  1115. if (s->wrap == 2) {
  1116. put_byte(s, (Byte)(strm->adler & 0xff));
  1117. put_byte(s, (Byte)((strm->adler >> 8) & 0xff));
  1118. put_byte(s, (Byte)((strm->adler >> 16) & 0xff));
  1119. put_byte(s, (Byte)((strm->adler >> 24) & 0xff));
  1120. put_byte(s, (Byte)(strm->total_in & 0xff));
  1121. put_byte(s, (Byte)((strm->total_in >> 8) & 0xff));
  1122. put_byte(s, (Byte)((strm->total_in >> 16) & 0xff));
  1123. put_byte(s, (Byte)((strm->total_in >> 24) & 0xff));
  1124. }
  1125. else
  1126. #endif
  1127. {
  1128. putShortMSB(s, (uInt)(strm->adler >> 16));
  1129. putShortMSB(s, (uInt)(strm->adler & 0xffff));
  1130. }
  1131. flush_pending(strm);
  1132. /* If avail_out is zero, the application will call deflate again
  1133. * to flush the rest.
  1134. */
  1135. if (s->wrap > 0) s->wrap = -s->wrap; /* write the trailer only once! */
  1136. return s->pending != 0 ? Z_OK : Z_STREAM_END;
  1137. }
  1138. /* ========================================================================= */
  1139. int ZEXPORT deflateEnd(z_streamp strm) {
  1140. int status;
  1141. if (deflateStateCheck(strm)) return Z_STREAM_ERROR;
  1142. status = strm->state->status;
  1143. /* Deallocate in reverse order of allocations: */
  1144. TRY_FREE(strm, strm->state->pending_buf);
  1145. TRY_FREE(strm, strm->state->head);
  1146. TRY_FREE(strm, strm->state->prev);
  1147. TRY_FREE(strm, strm->state->window);
  1148. ZFREE(strm, strm->state);
  1149. strm->state = Z_NULL;
  1150. return status == BUSY_STATE ? Z_DATA_ERROR : Z_OK;
  1151. }
  1152. /* =========================================================================
  1153. * Copy the source state to the destination state.
  1154. * To simplify the source, this is not supported for 16-bit MSDOS (which
  1155. * doesn't have enough memory anyway to duplicate compression states).
  1156. */
  1157. int ZEXPORT deflateCopy(z_streamp dest, z_streamp source) {
  1158. #ifdef MAXSEG_64K
  1159. (void)dest;
  1160. (void)source;
  1161. return Z_STREAM_ERROR;
  1162. #else
  1163. deflate_state *ds;
  1164. deflate_state *ss;
  1165. if (deflateStateCheck(source) || dest == Z_NULL) {
  1166. return Z_STREAM_ERROR;
  1167. }
  1168. ss = source->state;
  1169. zmemcpy((voidpf)dest, (voidpf)source, sizeof(z_stream));
  1170. ds = (deflate_state *) ZALLOC(dest, 1, sizeof(deflate_state));
  1171. if (ds == Z_NULL) return Z_MEM_ERROR;
  1172. dest->state = (struct internal_state FAR *) ds;
  1173. zmemcpy((voidpf)ds, (voidpf)ss, sizeof(deflate_state));
  1174. ds->strm = dest;
  1175. ds->window = (Bytef *) ZALLOC(dest, ds->w_size, 2*sizeof(Byte));
  1176. ds->prev = (Posf *) ZALLOC(dest, ds->w_size, sizeof(Pos));
  1177. ds->head = (Posf *) ZALLOC(dest, ds->hash_size, sizeof(Pos));
  1178. ds->pending_buf = (uchf *) ZALLOC(dest, ds->lit_bufsize, LIT_BUFS);
  1179. if (ds->window == Z_NULL || ds->prev == Z_NULL || ds->head == Z_NULL ||
  1180. ds->pending_buf == Z_NULL) {
  1181. deflateEnd (dest);
  1182. return Z_MEM_ERROR;
  1183. }
  1184. /* following zmemcpy do not work for 16-bit MSDOS */
  1185. zmemcpy(ds->window, ss->window, ds->w_size * 2 * sizeof(Byte));
  1186. zmemcpy((voidpf)ds->prev, (voidpf)ss->prev, ds->w_size * sizeof(Pos));
  1187. zmemcpy((voidpf)ds->head, (voidpf)ss->head, ds->hash_size * sizeof(Pos));
  1188. zmemcpy(ds->pending_buf, ss->pending_buf, ds->lit_bufsize * LIT_BUFS);
  1189. ds->pending_out = ds->pending_buf + (ss->pending_out - ss->pending_buf);
  1190. #ifdef LIT_MEM
  1191. ds->d_buf = (ushf *)(ds->pending_buf + (ds->lit_bufsize << 1));
  1192. ds->l_buf = ds->pending_buf + (ds->lit_bufsize << 2);
  1193. #else
  1194. ds->sym_buf = ds->pending_buf + ds->lit_bufsize;
  1195. #endif
  1196. ds->l_desc.dyn_tree = ds->dyn_ltree;
  1197. ds->d_desc.dyn_tree = ds->dyn_dtree;
  1198. ds->bl_desc.dyn_tree = ds->bl_tree;
  1199. return Z_OK;
  1200. #endif /* MAXSEG_64K */
  1201. }
  1202. #ifndef FASTEST
  1203. /* ===========================================================================
  1204. * Set match_start to the longest match starting at the given string and
  1205. * return its length. Matches shorter or equal to prev_length are discarded,
  1206. * in which case the result is equal to prev_length and match_start is
  1207. * garbage.
  1208. * IN assertions: cur_match is the head of the hash chain for the current
  1209. * string (strstart) and its distance is <= MAX_DIST, and prev_length >= 1
  1210. * OUT assertion: the match length is not greater than s->lookahead.
  1211. */
  1212. local uInt longest_match(deflate_state *s, IPos cur_match) {
  1213. unsigned chain_length = s->max_chain_length;/* max hash chain length */
  1214. register Bytef *scan = s->window + s->strstart; /* current string */
  1215. register Bytef *match; /* matched string */
  1216. register int len; /* length of current match */
  1217. int best_len = (int)s->prev_length; /* best match length so far */
  1218. int nice_match = s->nice_match; /* stop if match long enough */
  1219. IPos limit = s->strstart > (IPos)MAX_DIST(s) ?
  1220. s->strstart - (IPos)MAX_DIST(s) : NIL;
  1221. /* Stop when cur_match becomes <= limit. To simplify the code,
  1222. * we prevent matches with the string of window index 0.
  1223. */
  1224. Posf *prev = s->prev;
  1225. uInt wmask = s->w_mask;
  1226. #ifdef UNALIGNED_OK
  1227. /* Compare two bytes at a time. Note: this is not always beneficial.
  1228. * Try with and without -DUNALIGNED_OK to check.
  1229. */
  1230. register Bytef *strend = s->window + s->strstart + MAX_MATCH - 1;
  1231. register ush scan_start = *(ushf*)scan;
  1232. register ush scan_end = *(ushf*)(scan + best_len - 1);
  1233. #else
  1234. register Bytef *strend = s->window + s->strstart + MAX_MATCH;
  1235. register Byte scan_end1 = scan[best_len - 1];
  1236. register Byte scan_end = scan[best_len];
  1237. #endif
  1238. /* The code is optimized for HASH_BITS >= 8 and MAX_MATCH-2 multiple of 16.
  1239. * It is easy to get rid of this optimization if necessary.
  1240. */
  1241. Assert(s->hash_bits >= 8 && MAX_MATCH == 258, "Code too clever");
  1242. /* Do not waste too much time if we already have a good match: */
  1243. if (s->prev_length >= s->good_match) {
  1244. chain_length >>= 2;
  1245. }
  1246. /* Do not look for matches beyond the end of the input. This is necessary
  1247. * to make deflate deterministic.
  1248. */
  1249. if ((uInt)nice_match > s->lookahead) nice_match = (int)s->lookahead;
  1250. Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
  1251. "need lookahead");
  1252. do {
  1253. Assert(cur_match < s->strstart, "no future");
  1254. match = s->window + cur_match;
  1255. /* Skip to next match if the match length cannot increase
  1256. * or if the match length is less than 2. Note that the checks below
  1257. * for insufficient lookahead only occur occasionally for performance
  1258. * reasons. Therefore uninitialized memory will be accessed, and
  1259. * conditional jumps will be made that depend on those values.
  1260. * However the length of the match is limited to the lookahead, so
  1261. * the output of deflate is not affected by the uninitialized values.
  1262. */
  1263. #if (defined(UNALIGNED_OK) && MAX_MATCH == 258)
  1264. /* This code assumes sizeof(unsigned short) == 2. Do not use
  1265. * UNALIGNED_OK if your compiler uses a different size.
  1266. */
  1267. if (*(ushf*)(match + best_len - 1) != scan_end ||
  1268. *(ushf*)match != scan_start) continue;
  1269. /* It is not necessary to compare scan[2] and match[2] since they are
  1270. * always equal when the other bytes match, given that the hash keys
  1271. * are equal and that HASH_BITS >= 8. Compare 2 bytes at a time at
  1272. * strstart + 3, + 5, up to strstart + 257. We check for insufficient
  1273. * lookahead only every 4th comparison; the 128th check will be made
  1274. * at strstart + 257. If MAX_MATCH-2 is not a multiple of 8, it is
  1275. * necessary to put more guard bytes at the end of the window, or
  1276. * to check more often for insufficient lookahead.
  1277. */
  1278. Assert(scan[2] == match[2], "scan[2]?");
  1279. scan++, match++;
  1280. do {
  1281. } while (*(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1282. *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1283. *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1284. *(ushf*)(scan += 2) == *(ushf*)(match += 2) &&
  1285. scan < strend);
  1286. /* The funny "do {}" generates better code on most compilers */
  1287. /* Here, scan <= window + strstart + 257 */
  1288. Assert(scan <= s->window + (unsigned)(s->window_size - 1),
  1289. "wild scan");
  1290. if (*scan == *match) scan++;
  1291. len = (MAX_MATCH - 1) - (int)(strend - scan);
  1292. scan = strend - (MAX_MATCH-1);
  1293. #else /* UNALIGNED_OK */
  1294. if (match[best_len] != scan_end ||
  1295. match[best_len - 1] != scan_end1 ||
  1296. *match != *scan ||
  1297. *++match != scan[1]) continue;
  1298. /* The check at best_len - 1 can be removed because it will be made
  1299. * again later. (This heuristic is not always a win.)
  1300. * It is not necessary to compare scan[2] and match[2] since they
  1301. * are always equal when the other bytes match, given that
  1302. * the hash keys are equal and that HASH_BITS >= 8.
  1303. */
  1304. scan += 2, match++;
  1305. Assert(*scan == *match, "match[2]?");
  1306. /* We check for insufficient lookahead only every 8th comparison;
  1307. * the 256th check will be made at strstart + 258.
  1308. */
  1309. do {
  1310. } while (*++scan == *++match && *++scan == *++match &&
  1311. *++scan == *++match && *++scan == *++match &&
  1312. *++scan == *++match && *++scan == *++match &&
  1313. *++scan == *++match && *++scan == *++match &&
  1314. scan < strend);
  1315. Assert(scan <= s->window + (unsigned)(s->window_size - 1),
  1316. "wild scan");
  1317. len = MAX_MATCH - (int)(strend - scan);
  1318. scan = strend - MAX_MATCH;
  1319. #endif /* UNALIGNED_OK */
  1320. if (len > best_len) {
  1321. s->match_start = cur_match;
  1322. best_len = len;
  1323. if (len >= nice_match) break;
  1324. #ifdef UNALIGNED_OK
  1325. scan_end = *(ushf*)(scan + best_len - 1);
  1326. #else
  1327. scan_end1 = scan[best_len - 1];
  1328. scan_end = scan[best_len];
  1329. #endif
  1330. }
  1331. } while ((cur_match = prev[cur_match & wmask]) > limit
  1332. && --chain_length != 0);
  1333. if ((uInt)best_len <= s->lookahead) return (uInt)best_len;
  1334. return s->lookahead;
  1335. }
  1336. #else /* FASTEST */
  1337. /* ---------------------------------------------------------------------------
  1338. * Optimized version for FASTEST only
  1339. */
  1340. local uInt longest_match(deflate_state *s, IPos cur_match) {
  1341. register Bytef *scan = s->window + s->strstart; /* current string */
  1342. register Bytef *match; /* matched string */
  1343. register int len; /* length of current match */
  1344. register Bytef *strend = s->window + s->strstart + MAX_MATCH;
  1345. /* The code is optimized for HASH_BITS >= 8 and MAX_MATCH-2 multiple of 16.
  1346. * It is easy to get rid of this optimization if necessary.
  1347. */
  1348. Assert(s->hash_bits >= 8 && MAX_MATCH == 258, "Code too clever");
  1349. Assert((ulg)s->strstart <= s->window_size - MIN_LOOKAHEAD,
  1350. "need lookahead");
  1351. Assert(cur_match < s->strstart, "no future");
  1352. match = s->window + cur_match;
  1353. /* Return failure if the match length is less than 2:
  1354. */
  1355. if (match[0] != scan[0] || match[1] != scan[1]) return MIN_MATCH-1;
  1356. /* The check at best_len - 1 can be removed because it will be made
  1357. * again later. (This heuristic is not always a win.)
  1358. * It is not necessary to compare scan[2] and match[2] since they
  1359. * are always equal when the other bytes match, given that
  1360. * the hash keys are equal and that HASH_BITS >= 8.
  1361. */
  1362. scan += 2, match += 2;
  1363. Assert(*scan == *match, "match[2]?");
  1364. /* We check for insufficient lookahead only every 8th comparison;
  1365. * the 256th check will be made at strstart + 258.
  1366. */
  1367. do {
  1368. } while (*++scan == *++match && *++scan == *++match &&
  1369. *++scan == *++match && *++scan == *++match &&
  1370. *++scan == *++match && *++scan == *++match &&
  1371. *++scan == *++match && *++scan == *++match &&
  1372. scan < strend);
  1373. Assert(scan <= s->window + (unsigned)(s->window_size - 1), "wild scan");
  1374. len = MAX_MATCH - (int)(strend - scan);
  1375. if (len < MIN_MATCH) return MIN_MATCH - 1;
  1376. s->match_start = cur_match;
  1377. return (uInt)len <= s->lookahead ? (uInt)len : s->lookahead;
  1378. }
  1379. #endif /* FASTEST */
  1380. #ifdef ZLIB_DEBUG
  1381. #define EQUAL 0
  1382. /* result of memcmp for equal strings */
  1383. /* ===========================================================================
  1384. * Check that the match at match_start is indeed a match.
  1385. */
  1386. local void check_match(deflate_state *s, IPos start, IPos match, int length) {
  1387. /* check that the match is indeed a match */
  1388. Bytef *back = s->window + (int)match, *here = s->window + start;
  1389. IPos len = length;
  1390. if (match == (IPos)-1) {
  1391. /* match starts one byte before the current window -- just compare the
  1392. subsequent length-1 bytes */
  1393. back++;
  1394. here++;
  1395. len--;
  1396. }
  1397. if (zmemcmp(back, here, len) != EQUAL) {
  1398. fprintf(stderr, " start %u, match %d, length %d\n",
  1399. start, (int)match, length);
  1400. do {
  1401. fprintf(stderr, "(%02x %02x)", *back++, *here++);
  1402. } while (--len != 0);
  1403. z_error("invalid match");
  1404. }
  1405. if (z_verbose > 1) {
  1406. fprintf(stderr,"\\[%d,%d]", start - match, length);
  1407. do { putc(s->window[start++], stderr); } while (--length != 0);
  1408. }
  1409. }
  1410. #else
  1411. # define check_match(s, start, match, length)
  1412. #endif /* ZLIB_DEBUG */
  1413. /* ===========================================================================
  1414. * Flush the current block, with given end-of-file flag.
  1415. * IN assertion: strstart is set to the end of the current match.
  1416. */
  1417. #define FLUSH_BLOCK_ONLY(s, last) { \
  1418. _tr_flush_block(s, (s->block_start >= 0L ? \
  1419. (charf *)&s->window[(unsigned)s->block_start] : \
  1420. (charf *)Z_NULL), \
  1421. (ulg)((long)s->strstart - s->block_start), \
  1422. (last)); \
  1423. s->block_start = s->strstart; \
  1424. flush_pending(s->strm); \
  1425. Tracev((stderr,"[FLUSH]")); \
  1426. }
  1427. /* Same but force premature exit if necessary. */
  1428. #define FLUSH_BLOCK(s, last) { \
  1429. FLUSH_BLOCK_ONLY(s, last); \
  1430. if (s->strm->avail_out == 0) return (last) ? finish_started : need_more; \
  1431. }
  1432. /* Maximum stored block length in deflate format (not including header). */
  1433. #define MAX_STORED 65535
  1434. /* Minimum of a and b. */
  1435. #define MIN(a, b) ((a) > (b) ? (b) : (a))
  1436. /* ===========================================================================
  1437. * Copy without compression as much as possible from the input stream, return
  1438. * the current block state.
  1439. *
  1440. * In case deflateParams() is used to later switch to a non-zero compression
  1441. * level, s->matches (otherwise unused when storing) keeps track of the number
  1442. * of hash table slides to perform. If s->matches is 1, then one hash table
  1443. * slide will be done when switching. If s->matches is 2, the maximum value
  1444. * allowed here, then the hash table will be cleared, since two or more slides
  1445. * is the same as a clear.
  1446. *
  1447. * deflate_stored() is written to minimize the number of times an input byte is
  1448. * copied. It is most efficient with large input and output buffers, which
  1449. * maximizes the opportunities to have a single copy from next_in to next_out.
  1450. */
  1451. local block_state deflate_stored(deflate_state *s, int flush) {
  1452. /* Smallest worthy block size when not flushing or finishing. By default
  1453. * this is 32K. This can be as small as 507 bytes for memLevel == 1. For
  1454. * large input and output buffers, the stored block size will be larger.
  1455. */
  1456. unsigned min_block = MIN(s->pending_buf_size - 5, s->w_size);
  1457. /* Copy as many min_block or larger stored blocks directly to next_out as
  1458. * possible. If flushing, copy the remaining available input to next_out as
  1459. * stored blocks, if there is enough space.
  1460. */
  1461. unsigned len, left, have, last = 0;
  1462. unsigned used = s->strm->avail_in;
  1463. do {
  1464. /* Set len to the maximum size block that we can copy directly with the
  1465. * available input data and output space. Set left to how much of that
  1466. * would be copied from what's left in the window.
  1467. */
  1468. len = MAX_STORED; /* maximum deflate stored block length */
  1469. have = (s->bi_valid + 42) >> 3; /* number of header bytes */
  1470. if (s->strm->avail_out < have) /* need room for header */
  1471. break;
  1472. /* maximum stored block length that will fit in avail_out: */
  1473. have = s->strm->avail_out - have;
  1474. left = s->strstart - s->block_start; /* bytes left in window */
  1475. if (len > (ulg)left + s->strm->avail_in)
  1476. len = left + s->strm->avail_in; /* limit len to the input */
  1477. if (len > have)
  1478. len = have; /* limit len to the output */
  1479. /* If the stored block would be less than min_block in length, or if
  1480. * unable to copy all of the available input when flushing, then try
  1481. * copying to the window and the pending buffer instead. Also don't
  1482. * write an empty block when flushing -- deflate() does that.
  1483. */
  1484. if (len < min_block && ((len == 0 && flush != Z_FINISH) ||
  1485. flush == Z_NO_FLUSH ||
  1486. len != left + s->strm->avail_in))
  1487. break;
  1488. /* Make a dummy stored block in pending to get the header bytes,
  1489. * including any pending bits. This also updates the debugging counts.
  1490. */
  1491. last = flush == Z_FINISH && len == left + s->strm->avail_in ? 1 : 0;
  1492. _tr_stored_block(s, (char *)0, 0L, last);
  1493. /* Replace the lengths in the dummy stored block with len. */
  1494. s->pending_buf[s->pending - 4] = len;
  1495. s->pending_buf[s->pending - 3] = len >> 8;
  1496. s->pending_buf[s->pending - 2] = ~len;
  1497. s->pending_buf[s->pending - 1] = ~len >> 8;
  1498. /* Write the stored block header bytes. */
  1499. flush_pending(s->strm);
  1500. #ifdef ZLIB_DEBUG
  1501. /* Update debugging counts for the data about to be copied. */
  1502. s->compressed_len += len << 3;
  1503. s->bits_sent += len << 3;
  1504. #endif
  1505. /* Copy uncompressed bytes from the window to next_out. */
  1506. if (left) {
  1507. if (left > len)
  1508. left = len;
  1509. zmemcpy(s->strm->next_out, s->window + s->block_start, left);
  1510. s->strm->next_out += left;
  1511. s->strm->avail_out -= left;
  1512. s->strm->total_out += left;
  1513. s->block_start += left;
  1514. len -= left;
  1515. }
  1516. /* Copy uncompressed bytes directly from next_in to next_out, updating
  1517. * the check value.
  1518. */
  1519. if (len) {
  1520. read_buf(s->strm, s->strm->next_out, len);
  1521. s->strm->next_out += len;
  1522. s->strm->avail_out -= len;
  1523. s->strm->total_out += len;
  1524. }
  1525. } while (last == 0);
  1526. /* Update the sliding window with the last s->w_size bytes of the copied
  1527. * data, or append all of the copied data to the existing window if less
  1528. * than s->w_size bytes were copied. Also update the number of bytes to
  1529. * insert in the hash tables, in the event that deflateParams() switches to
  1530. * a non-zero compression level.
  1531. */
  1532. used -= s->strm->avail_in; /* number of input bytes directly copied */
  1533. if (used) {
  1534. /* If any input was used, then no unused input remains in the window,
  1535. * therefore s->block_start == s->strstart.
  1536. */
  1537. if (used >= s->w_size) { /* supplant the previous history */
  1538. s->matches = 2; /* clear hash */
  1539. zmemcpy(s->window, s->strm->next_in - s->w_size, s->w_size);
  1540. s->strstart = s->w_size;
  1541. s->insert = s->strstart;
  1542. }
  1543. else {
  1544. if (s->window_size - s->strstart <= used) {
  1545. /* Slide the window down. */
  1546. s->strstart -= s->w_size;
  1547. zmemcpy(s->window, s->window + s->w_size, s->strstart);
  1548. if (s->matches < 2)
  1549. s->matches++; /* add a pending slide_hash() */
  1550. if (s->insert > s->strstart)
  1551. s->insert = s->strstart;
  1552. }
  1553. zmemcpy(s->window + s->strstart, s->strm->next_in - used, used);
  1554. s->strstart += used;
  1555. s->insert += MIN(used, s->w_size - s->insert);
  1556. }
  1557. s->block_start = s->strstart;
  1558. }
  1559. if (s->high_water < s->strstart)
  1560. s->high_water = s->strstart;
  1561. /* If the last block was written to next_out, then done. */
  1562. if (last)
  1563. return finish_done;
  1564. /* If flushing and all input has been consumed, then done. */
  1565. if (flush != Z_NO_FLUSH && flush != Z_FINISH &&
  1566. s->strm->avail_in == 0 && (long)s->strstart == s->block_start)
  1567. return block_done;
  1568. /* Fill the window with any remaining input. */
  1569. have = s->window_size - s->strstart;
  1570. if (s->strm->avail_in > have && s->block_start >= (long)s->w_size) {
  1571. /* Slide the window down. */
  1572. s->block_start -= s->w_size;
  1573. s->strstart -= s->w_size;
  1574. zmemcpy(s->window, s->window + s->w_size, s->strstart);
  1575. if (s->matches < 2)
  1576. s->matches++; /* add a pending slide_hash() */
  1577. have += s->w_size; /* more space now */
  1578. if (s->insert > s->strstart)
  1579. s->insert = s->strstart;
  1580. }
  1581. if (have > s->strm->avail_in)
  1582. have = s->strm->avail_in;
  1583. if (have) {
  1584. read_buf(s->strm, s->window + s->strstart, have);
  1585. s->strstart += have;
  1586. s->insert += MIN(have, s->w_size - s->insert);
  1587. }
  1588. if (s->high_water < s->strstart)
  1589. s->high_water = s->strstart;
  1590. /* There was not enough avail_out to write a complete worthy or flushed
  1591. * stored block to next_out. Write a stored block to pending instead, if we
  1592. * have enough input for a worthy block, or if flushing and there is enough
  1593. * room for the remaining input as a stored block in the pending buffer.
  1594. */
  1595. have = (s->bi_valid + 42) >> 3; /* number of header bytes */
  1596. /* maximum stored block length that will fit in pending: */
  1597. have = MIN(s->pending_buf_size - have, MAX_STORED);
  1598. min_block = MIN(have, s->w_size);
  1599. left = s->strstart - s->block_start;
  1600. if (left >= min_block ||
  1601. ((left || flush == Z_FINISH) && flush != Z_NO_FLUSH &&
  1602. s->strm->avail_in == 0 && left <= have)) {
  1603. len = MIN(left, have);
  1604. last = flush == Z_FINISH && s->strm->avail_in == 0 &&
  1605. len == left ? 1 : 0;
  1606. _tr_stored_block(s, (charf *)s->window + s->block_start, len, last);
  1607. s->block_start += len;
  1608. flush_pending(s->strm);
  1609. }
  1610. /* We've done all we can with the available input and output. */
  1611. return last ? finish_started : need_more;
  1612. }
  1613. /* ===========================================================================
  1614. * Compress as much as possible from the input stream, return the current
  1615. * block state.
  1616. * This function does not perform lazy evaluation of matches and inserts
  1617. * new strings in the dictionary only for unmatched strings or for short
  1618. * matches. It is used only for the fast compression options.
  1619. */
  1620. local block_state deflate_fast(deflate_state *s, int flush) {
  1621. IPos hash_head; /* head of the hash chain */
  1622. int bflush; /* set if current block must be flushed */
  1623. for (;;) {
  1624. /* Make sure that we always have enough lookahead, except
  1625. * at the end of the input file. We need MAX_MATCH bytes
  1626. * for the next match, plus MIN_MATCH bytes to insert the
  1627. * string following the next match.
  1628. */
  1629. if (s->lookahead < MIN_LOOKAHEAD) {
  1630. fill_window(s);
  1631. if (s->lookahead < MIN_LOOKAHEAD && flush == Z_NO_FLUSH) {
  1632. return need_more;
  1633. }
  1634. if (s->lookahead == 0) break; /* flush the current block */
  1635. }
  1636. /* Insert the string window[strstart .. strstart + 2] in the
  1637. * dictionary, and set hash_head to the head of the hash chain:
  1638. */
  1639. hash_head = NIL;
  1640. if (s->lookahead >= MIN_MATCH) {
  1641. INSERT_STRING(s, s->strstart, hash_head);
  1642. }
  1643. /* Find the longest match, discarding those <= prev_length.
  1644. * At this point we have always match_length < MIN_MATCH
  1645. */
  1646. if (hash_head != NIL && s->strstart - hash_head <= MAX_DIST(s)) {
  1647. /* To simplify the code, we prevent matches with the string
  1648. * of window index 0 (in particular we have to avoid a match
  1649. * of the string with itself at the start of the input file).
  1650. */
  1651. s->match_length = longest_match (s, hash_head);
  1652. /* longest_match() sets match_start */
  1653. }
  1654. if (s->match_length >= MIN_MATCH) {
  1655. check_match(s, s->strstart, s->match_start, s->match_length);
  1656. _tr_tally_dist(s, s->strstart - s->match_start,
  1657. s->match_length - MIN_MATCH, bflush);
  1658. s->lookahead -= s->match_length;
  1659. /* Insert new strings in the hash table only if the match length
  1660. * is not too large. This saves time but degrades compression.
  1661. */
  1662. #ifndef FASTEST
  1663. if (s->match_length <= s->max_insert_length &&
  1664. s->lookahead >= MIN_MATCH) {
  1665. s->match_length--; /* string at strstart already in table */
  1666. do {
  1667. s->strstart++;
  1668. INSERT_STRING(s, s->strstart, hash_head);
  1669. /* strstart never exceeds WSIZE-MAX_MATCH, so there are
  1670. * always MIN_MATCH bytes ahead.
  1671. */
  1672. } while (--s->match_length != 0);
  1673. s->strstart++;
  1674. } else
  1675. #endif
  1676. {
  1677. s->strstart += s->match_length;
  1678. s->match_length = 0;
  1679. s->ins_h = s->window[s->strstart];
  1680. UPDATE_HASH(s, s->ins_h, s->window[s->strstart + 1]);
  1681. #if MIN_MATCH != 3
  1682. Call UPDATE_HASH() MIN_MATCH-3 more times
  1683. #endif
  1684. /* If lookahead < MIN_MATCH, ins_h is garbage, but it does not
  1685. * matter since it will be recomputed at next deflate call.
  1686. */
  1687. }
  1688. } else {
  1689. /* No match, output a literal byte */
  1690. Tracevv((stderr,"%c", s->window[s->strstart]));
  1691. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1692. s->lookahead--;
  1693. s->strstart++;
  1694. }
  1695. if (bflush) FLUSH_BLOCK(s, 0);
  1696. }
  1697. s->insert = s->strstart < MIN_MATCH-1 ? s->strstart : MIN_MATCH-1;
  1698. if (flush == Z_FINISH) {
  1699. FLUSH_BLOCK(s, 1);
  1700. return finish_done;
  1701. }
  1702. if (s->sym_next)
  1703. FLUSH_BLOCK(s, 0);
  1704. return block_done;
  1705. }
  1706. #ifndef FASTEST
  1707. /* ===========================================================================
  1708. * Same as above, but achieves better compression. We use a lazy
  1709. * evaluation for matches: a match is finally adopted only if there is
  1710. * no better match at the next window position.
  1711. */
  1712. local block_state deflate_slow(deflate_state *s, int flush) {
  1713. IPos hash_head; /* head of hash chain */
  1714. int bflush; /* set if current block must be flushed */
  1715. /* Process the input block. */
  1716. for (;;) {
  1717. /* Make sure that we always have enough lookahead, except
  1718. * at the end of the input file. We need MAX_MATCH bytes
  1719. * for the next match, plus MIN_MATCH bytes to insert the
  1720. * string following the next match.
  1721. */
  1722. if (s->lookahead < MIN_LOOKAHEAD) {
  1723. fill_window(s);
  1724. if (s->lookahead < MIN_LOOKAHEAD && flush == Z_NO_FLUSH) {
  1725. return need_more;
  1726. }
  1727. if (s->lookahead == 0) break; /* flush the current block */
  1728. }
  1729. /* Insert the string window[strstart .. strstart + 2] in the
  1730. * dictionary, and set hash_head to the head of the hash chain:
  1731. */
  1732. hash_head = NIL;
  1733. if (s->lookahead >= MIN_MATCH) {
  1734. INSERT_STRING(s, s->strstart, hash_head);
  1735. }
  1736. /* Find the longest match, discarding those <= prev_length.
  1737. */
  1738. s->prev_length = s->match_length, s->prev_match = s->match_start;
  1739. s->match_length = MIN_MATCH-1;
  1740. if (hash_head != NIL && s->prev_length < s->max_lazy_match &&
  1741. s->strstart - hash_head <= MAX_DIST(s)) {
  1742. /* To simplify the code, we prevent matches with the string
  1743. * of window index 0 (in particular we have to avoid a match
  1744. * of the string with itself at the start of the input file).
  1745. */
  1746. s->match_length = longest_match (s, hash_head);
  1747. /* longest_match() sets match_start */
  1748. if (s->match_length <= 5 && (s->strategy == Z_FILTERED
  1749. #if TOO_FAR <= 32767
  1750. || (s->match_length == MIN_MATCH &&
  1751. s->strstart - s->match_start > TOO_FAR)
  1752. #endif
  1753. )) {
  1754. /* If prev_match is also MIN_MATCH, match_start is garbage
  1755. * but we will ignore the current match anyway.
  1756. */
  1757. s->match_length = MIN_MATCH-1;
  1758. }
  1759. }
  1760. /* If there was a match at the previous step and the current
  1761. * match is not better, output the previous match:
  1762. */
  1763. if (s->prev_length >= MIN_MATCH && s->match_length <= s->prev_length) {
  1764. uInt max_insert = s->strstart + s->lookahead - MIN_MATCH;
  1765. /* Do not insert strings in hash table beyond this. */
  1766. check_match(s, s->strstart - 1, s->prev_match, s->prev_length);
  1767. _tr_tally_dist(s, s->strstart - 1 - s->prev_match,
  1768. s->prev_length - MIN_MATCH, bflush);
  1769. /* Insert in hash table all strings up to the end of the match.
  1770. * strstart - 1 and strstart are already inserted. If there is not
  1771. * enough lookahead, the last two strings are not inserted in
  1772. * the hash table.
  1773. */
  1774. s->lookahead -= s->prev_length - 1;
  1775. s->prev_length -= 2;
  1776. do {
  1777. if (++s->strstart <= max_insert) {
  1778. INSERT_STRING(s, s->strstart, hash_head);
  1779. }
  1780. } while (--s->prev_length != 0);
  1781. s->match_available = 0;
  1782. s->match_length = MIN_MATCH-1;
  1783. s->strstart++;
  1784. if (bflush) FLUSH_BLOCK(s, 0);
  1785. } else if (s->match_available) {
  1786. /* If there was no match at the previous position, output a
  1787. * single literal. If there was a match but the current match
  1788. * is longer, truncate the previous match to a single literal.
  1789. */
  1790. Tracevv((stderr,"%c", s->window[s->strstart - 1]));
  1791. _tr_tally_lit(s, s->window[s->strstart - 1], bflush);
  1792. if (bflush) {
  1793. FLUSH_BLOCK_ONLY(s, 0);
  1794. }
  1795. s->strstart++;
  1796. s->lookahead--;
  1797. if (s->strm->avail_out == 0) return need_more;
  1798. } else {
  1799. /* There is no previous match to compare with, wait for
  1800. * the next step to decide.
  1801. */
  1802. s->match_available = 1;
  1803. s->strstart++;
  1804. s->lookahead--;
  1805. }
  1806. }
  1807. Assert (flush != Z_NO_FLUSH, "no flush?");
  1808. if (s->match_available) {
  1809. Tracevv((stderr,"%c", s->window[s->strstart - 1]));
  1810. _tr_tally_lit(s, s->window[s->strstart - 1], bflush);
  1811. s->match_available = 0;
  1812. }
  1813. s->insert = s->strstart < MIN_MATCH-1 ? s->strstart : MIN_MATCH-1;
  1814. if (flush == Z_FINISH) {
  1815. FLUSH_BLOCK(s, 1);
  1816. return finish_done;
  1817. }
  1818. if (s->sym_next)
  1819. FLUSH_BLOCK(s, 0);
  1820. return block_done;
  1821. }
  1822. #endif /* FASTEST */
  1823. /* ===========================================================================
  1824. * For Z_RLE, simply look for runs of bytes, generate matches only of distance
  1825. * one. Do not maintain a hash table. (It will be regenerated if this run of
  1826. * deflate switches away from Z_RLE.)
  1827. */
  1828. local block_state deflate_rle(deflate_state *s, int flush) {
  1829. int bflush; /* set if current block must be flushed */
  1830. uInt prev; /* byte at distance one to match */
  1831. Bytef *scan, *strend; /* scan goes up to strend for length of run */
  1832. for (;;) {
  1833. /* Make sure that we always have enough lookahead, except
  1834. * at the end of the input file. We need MAX_MATCH bytes
  1835. * for the longest run, plus one for the unrolled loop.
  1836. */
  1837. if (s->lookahead <= MAX_MATCH) {
  1838. fill_window(s);
  1839. if (s->lookahead <= MAX_MATCH && flush == Z_NO_FLUSH) {
  1840. return need_more;
  1841. }
  1842. if (s->lookahead == 0) break; /* flush the current block */
  1843. }
  1844. /* See how many times the previous byte repeats */
  1845. s->match_length = 0;
  1846. if (s->lookahead >= MIN_MATCH && s->strstart > 0) {
  1847. scan = s->window + s->strstart - 1;
  1848. prev = *scan;
  1849. if (prev == *++scan && prev == *++scan && prev == *++scan) {
  1850. strend = s->window + s->strstart + MAX_MATCH;
  1851. do {
  1852. } while (prev == *++scan && prev == *++scan &&
  1853. prev == *++scan && prev == *++scan &&
  1854. prev == *++scan && prev == *++scan &&
  1855. prev == *++scan && prev == *++scan &&
  1856. scan < strend);
  1857. s->match_length = MAX_MATCH - (uInt)(strend - scan);
  1858. if (s->match_length > s->lookahead)
  1859. s->match_length = s->lookahead;
  1860. }
  1861. Assert(scan <= s->window + (uInt)(s->window_size - 1),
  1862. "wild scan");
  1863. }
  1864. /* Emit match if have run of MIN_MATCH or longer, else emit literal */
  1865. if (s->match_length >= MIN_MATCH) {
  1866. check_match(s, s->strstart, s->strstart - 1, s->match_length);
  1867. _tr_tally_dist(s, 1, s->match_length - MIN_MATCH, bflush);
  1868. s->lookahead -= s->match_length;
  1869. s->strstart += s->match_length;
  1870. s->match_length = 0;
  1871. } else {
  1872. /* No match, output a literal byte */
  1873. Tracevv((stderr,"%c", s->window[s->strstart]));
  1874. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1875. s->lookahead--;
  1876. s->strstart++;
  1877. }
  1878. if (bflush) FLUSH_BLOCK(s, 0);
  1879. }
  1880. s->insert = 0;
  1881. if (flush == Z_FINISH) {
  1882. FLUSH_BLOCK(s, 1);
  1883. return finish_done;
  1884. }
  1885. if (s->sym_next)
  1886. FLUSH_BLOCK(s, 0);
  1887. return block_done;
  1888. }
  1889. /* ===========================================================================
  1890. * For Z_HUFFMAN_ONLY, do not look for matches. Do not maintain a hash table.
  1891. * (It will be regenerated if this run of deflate switches away from Huffman.)
  1892. */
  1893. local block_state deflate_huff(deflate_state *s, int flush) {
  1894. int bflush; /* set if current block must be flushed */
  1895. for (;;) {
  1896. /* Make sure that we have a literal to write. */
  1897. if (s->lookahead == 0) {
  1898. fill_window(s);
  1899. if (s->lookahead == 0) {
  1900. if (flush == Z_NO_FLUSH)
  1901. return need_more;
  1902. break; /* flush the current block */
  1903. }
  1904. }
  1905. /* Output a literal byte */
  1906. s->match_length = 0;
  1907. Tracevv((stderr,"%c", s->window[s->strstart]));
  1908. _tr_tally_lit(s, s->window[s->strstart], bflush);
  1909. s->lookahead--;
  1910. s->strstart++;
  1911. if (bflush) FLUSH_BLOCK(s, 0);
  1912. }
  1913. s->insert = 0;
  1914. if (flush == Z_FINISH) {
  1915. FLUSH_BLOCK(s, 1);
  1916. return finish_done;
  1917. }
  1918. if (s->sym_next)
  1919. FLUSH_BLOCK(s, 0);
  1920. return block_done;
  1921. }