12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411 |
- From 6bac7a3e0ebcd3147294b73acb34606eba18ae7f Mon Sep 17 00:00:00 2001
- From: Simon Hosie <simon.hosie@arm.com>
- Date: Wed, 12 Apr 2017 12:52:33 -0700
- Subject: [PATCH 1/2] Prepare ARM-specific contrib directory.
- Change-Id: Id4cda552b39bfb39ab35ec499dbe122b43b6d1a1
- ---
- contrib/arm/inffast.c | 323 ++++++++++
- contrib/arm/inflate.c | 1561 +++++++++++++++++++++++++++++++++++++++++++++++++
- 2 files changed, 1884 insertions(+)
- create mode 100644 contrib/arm/inffast.c
- create mode 100644 contrib/arm/inflate.c
- diff --git a/contrib/arm/inffast.c b/contrib/arm/inffast.c
- new file mode 100644
- index 00000000..0dbd1dbc
- --- /dev/null
- +++ b/contrib/arm/inffast.c
- @@ -0,0 +1,323 @@
- +/* inffast.c -- fast decoding
- + * Copyright (C) 1995-2017 Mark Adler
- + * For conditions of distribution and use, see copyright notice in zlib.h
- + */
- +
- +#include "zutil.h"
- +#include "inftrees.h"
- +#include "inflate.h"
- +#include "inffast.h"
- +
- +#ifdef ASMINF
- +# pragma message("Assembler code may have bugs -- use at your own risk")
- +#else
- +
- +/*
- + Decode literal, length, and distance codes and write out the resulting
- + literal and match bytes until either not enough input or output is
- + available, an end-of-block is encountered, or a data error is encountered.
- + When large enough input and output buffers are supplied to inflate(), for
- + example, a 16K input buffer and a 64K output buffer, more than 95% of the
- + inflate execution time is spent in this routine.
- +
- + Entry assumptions:
- +
- + state->mode == LEN
- + strm->avail_in >= 6
- + strm->avail_out >= 258
- + start >= strm->avail_out
- + state->bits < 8
- +
- + On return, state->mode is one of:
- +
- + LEN -- ran out of enough output space or enough available input
- + TYPE -- reached end of block code, inflate() to interpret next block
- + BAD -- error in block data
- +
- + Notes:
- +
- + - The maximum input bits used by a length/distance pair is 15 bits for the
- + length code, 5 bits for the length extra, 15 bits for the distance code,
- + and 13 bits for the distance extra. This totals 48 bits, or six bytes.
- + Therefore if strm->avail_in >= 6, then there is enough input to avoid
- + checking for available input while decoding.
- +
- + - The maximum bytes that a single length/distance pair can output is 258
- + bytes, which is the maximum length that can be coded. inflate_fast()
- + requires strm->avail_out >= 258 for each loop to avoid checking for
- + output space.
- + */
- +void ZLIB_INTERNAL inflate_fast(strm, start)
- +z_streamp strm;
- +unsigned start; /* inflate()'s starting value for strm->avail_out */
- +{
- + struct inflate_state FAR *state;
- + z_const unsigned char FAR *in; /* local strm->next_in */
- + z_const unsigned char FAR *last; /* have enough input while in < last */
- + unsigned char FAR *out; /* local strm->next_out */
- + unsigned char FAR *beg; /* inflate()'s initial strm->next_out */
- + unsigned char FAR *end; /* while out < end, enough space available */
- +#ifdef INFLATE_STRICT
- + unsigned dmax; /* maximum distance from zlib header */
- +#endif
- + unsigned wsize; /* window size or zero if not using window */
- + unsigned whave; /* valid bytes in the window */
- + unsigned wnext; /* window write index */
- + unsigned char FAR *window; /* allocated sliding window, if wsize != 0 */
- + unsigned long hold; /* local strm->hold */
- + unsigned bits; /* local strm->bits */
- + code const FAR *lcode; /* local strm->lencode */
- + code const FAR *dcode; /* local strm->distcode */
- + unsigned lmask; /* mask for first level of length codes */
- + unsigned dmask; /* mask for first level of distance codes */
- + code here; /* retrieved table entry */
- + unsigned op; /* code bits, operation, extra bits, or */
- + /* window position, window bytes to copy */
- + unsigned len; /* match length, unused bytes */
- + unsigned dist; /* match distance */
- + unsigned char FAR *from; /* where to copy match from */
- +
- + /* copy state to local variables */
- + state = (struct inflate_state FAR *)strm->state;
- + in = strm->next_in;
- + last = in + (strm->avail_in - 5);
- + out = strm->next_out;
- + beg = out - (start - strm->avail_out);
- + end = out + (strm->avail_out - 257);
- +#ifdef INFLATE_STRICT
- + dmax = state->dmax;
- +#endif
- + wsize = state->wsize;
- + whave = state->whave;
- + wnext = state->wnext;
- + window = state->window;
- + hold = state->hold;
- + bits = state->bits;
- + lcode = state->lencode;
- + dcode = state->distcode;
- + lmask = (1U << state->lenbits) - 1;
- + dmask = (1U << state->distbits) - 1;
- +
- + /* decode literals and length/distances until end-of-block or not enough
- + input data or output space */
- + do {
- + if (bits < 15) {
- + hold += (unsigned long)(*in++) << bits;
- + bits += 8;
- + hold += (unsigned long)(*in++) << bits;
- + bits += 8;
- + }
- + here = lcode[hold & lmask];
- + dolen:
- + op = (unsigned)(here.bits);
- + hold >>= op;
- + bits -= op;
- + op = (unsigned)(here.op);
- + if (op == 0) { /* literal */
- + Tracevv((stderr, here.val >= 0x20 && here.val < 0x7f ?
- + "inflate: literal '%c'\n" :
- + "inflate: literal 0x%02x\n", here.val));
- + *out++ = (unsigned char)(here.val);
- + }
- + else if (op & 16) { /* length base */
- + len = (unsigned)(here.val);
- + op &= 15; /* number of extra bits */
- + if (op) {
- + if (bits < op) {
- + hold += (unsigned long)(*in++) << bits;
- + bits += 8;
- + }
- + len += (unsigned)hold & ((1U << op) - 1);
- + hold >>= op;
- + bits -= op;
- + }
- + Tracevv((stderr, "inflate: length %u\n", len));
- + if (bits < 15) {
- + hold += (unsigned long)(*in++) << bits;
- + bits += 8;
- + hold += (unsigned long)(*in++) << bits;
- + bits += 8;
- + }
- + here = dcode[hold & dmask];
- + dodist:
- + op = (unsigned)(here.bits);
- + hold >>= op;
- + bits -= op;
- + op = (unsigned)(here.op);
- + if (op & 16) { /* distance base */
- + dist = (unsigned)(here.val);
- + op &= 15; /* number of extra bits */
- + if (bits < op) {
- + hold += (unsigned long)(*in++) << bits;
- + bits += 8;
- + if (bits < op) {
- + hold += (unsigned long)(*in++) << bits;
- + bits += 8;
- + }
- + }
- + dist += (unsigned)hold & ((1U << op) - 1);
- +#ifdef INFLATE_STRICT
- + if (dist > dmax) {
- + strm->msg = (char *)"invalid distance too far back";
- + state->mode = BAD;
- + break;
- + }
- +#endif
- + hold >>= op;
- + bits -= op;
- + Tracevv((stderr, "inflate: distance %u\n", dist));
- + op = (unsigned)(out - beg); /* max distance in output */
- + if (dist > op) { /* see if copy from window */
- + op = dist - op; /* distance back in window */
- + if (op > whave) {
- + if (state->sane) {
- + strm->msg =
- + (char *)"invalid distance too far back";
- + state->mode = BAD;
- + break;
- + }
- +#ifdef INFLATE_ALLOW_INVALID_DISTANCE_TOOFAR_ARRR
- + if (len <= op - whave) {
- + do {
- + *out++ = 0;
- + } while (--len);
- + continue;
- + }
- + len -= op - whave;
- + do {
- + *out++ = 0;
- + } while (--op > whave);
- + if (op == 0) {
- + from = out - dist;
- + do {
- + *out++ = *from++;
- + } while (--len);
- + continue;
- + }
- +#endif
- + }
- + from = window;
- + if (wnext == 0) { /* very common case */
- + from += wsize - op;
- + if (op < len) { /* some from window */
- + len -= op;
- + do {
- + *out++ = *from++;
- + } while (--op);
- + from = out - dist; /* rest from output */
- + }
- + }
- + else if (wnext < op) { /* wrap around window */
- + from += wsize + wnext - op;
- + op -= wnext;
- + if (op < len) { /* some from end of window */
- + len -= op;
- + do {
- + *out++ = *from++;
- + } while (--op);
- + from = window;
- + if (wnext < len) { /* some from start of window */
- + op = wnext;
- + len -= op;
- + do {
- + *out++ = *from++;
- + } while (--op);
- + from = out - dist; /* rest from output */
- + }
- + }
- + }
- + else { /* contiguous in window */
- + from += wnext - op;
- + if (op < len) { /* some from window */
- + len -= op;
- + do {
- + *out++ = *from++;
- + } while (--op);
- + from = out - dist; /* rest from output */
- + }
- + }
- + while (len > 2) {
- + *out++ = *from++;
- + *out++ = *from++;
- + *out++ = *from++;
- + len -= 3;
- + }
- + if (len) {
- + *out++ = *from++;
- + if (len > 1)
- + *out++ = *from++;
- + }
- + }
- + else {
- + from = out - dist; /* copy direct from output */
- + do { /* minimum length is three */
- + *out++ = *from++;
- + *out++ = *from++;
- + *out++ = *from++;
- + len -= 3;
- + } while (len > 2);
- + if (len) {
- + *out++ = *from++;
- + if (len > 1)
- + *out++ = *from++;
- + }
- + }
- + }
- + else if ((op & 64) == 0) { /* 2nd level distance code */
- + here = dcode[here.val + (hold & ((1U << op) - 1))];
- + goto dodist;
- + }
- + else {
- + strm->msg = (char *)"invalid distance code";
- + state->mode = BAD;
- + break;
- + }
- + }
- + else if ((op & 64) == 0) { /* 2nd level length code */
- + here = lcode[here.val + (hold & ((1U << op) - 1))];
- + goto dolen;
- + }
- + else if (op & 32) { /* end-of-block */
- + Tracevv((stderr, "inflate: end of block\n"));
- + state->mode = TYPE;
- + break;
- + }
- + else {
- + strm->msg = (char *)"invalid literal/length code";
- + state->mode = BAD;
- + break;
- + }
- + } while (in < last && out < end);
- +
- + /* return unused bytes (on entry, bits < 8, so in won't go too far back) */
- + len = bits >> 3;
- + in -= len;
- + bits -= len << 3;
- + hold &= (1U << bits) - 1;
- +
- + /* update state and return */
- + strm->next_in = in;
- + strm->next_out = out;
- + strm->avail_in = (unsigned)(in < last ? 5 + (last - in) : 5 - (in - last));
- + strm->avail_out = (unsigned)(out < end ?
- + 257 + (end - out) : 257 - (out - end));
- + state->hold = hold;
- + state->bits = bits;
- + return;
- +}
- +
- +/*
- + inflate_fast() speedups that turned out slower (on a PowerPC G3 750CXe):
- + - Using bit fields for code structure
- + - Different op definition to avoid & for extra bits (do & for table bits)
- + - Three separate decoding do-loops for direct, window, and wnext == 0
- + - Special case for distance > 1 copies to do overlapped load and store copy
- + - Explicit branch predictions (based on measured branch probabilities)
- + - Deferring match copy and interspersed it with decoding subsequent codes
- + - Swapping literal/length else
- + - Swapping window/direct else
- + - Larger unrolled copy loops (three is about right)
- + - Moving len -= 3 statement into middle of loop
- + */
- +
- +#endif /* !ASMINF */
- diff --git a/contrib/arm/inflate.c b/contrib/arm/inflate.c
- new file mode 100644
- index 00000000..ac333e8c
- --- /dev/null
- +++ b/contrib/arm/inflate.c
- @@ -0,0 +1,1561 @@
- +/* inflate.c -- zlib decompression
- + * Copyright (C) 1995-2016 Mark Adler
- + * For conditions of distribution and use, see copyright notice in zlib.h
- + */
- +
- +/*
- + * Change history:
- + *
- + * 1.2.beta0 24 Nov 2002
- + * - First version -- complete rewrite of inflate to simplify code, avoid
- + * creation of window when not needed, minimize use of window when it is
- + * needed, make inffast.c even faster, implement gzip decoding, and to
- + * improve code readability and style over the previous zlib inflate code
- + *
- + * 1.2.beta1 25 Nov 2002
- + * - Use pointers for available input and output checking in inffast.c
- + * - Remove input and output counters in inffast.c
- + * - Change inffast.c entry and loop from avail_in >= 7 to >= 6
- + * - Remove unnecessary second byte pull from length extra in inffast.c
- + * - Unroll direct copy to three copies per loop in inffast.c
- + *
- + * 1.2.beta2 4 Dec 2002
- + * - Change external routine names to reduce potential conflicts
- + * - Correct filename to inffixed.h for fixed tables in inflate.c
- + * - Make hbuf[] unsigned char to match parameter type in inflate.c
- + * - Change strm->next_out[-state->offset] to *(strm->next_out - state->offset)
- + * to avoid negation problem on Alphas (64 bit) in inflate.c
- + *
- + * 1.2.beta3 22 Dec 2002
- + * - Add comments on state->bits assertion in inffast.c
- + * - Add comments on op field in inftrees.h
- + * - Fix bug in reuse of allocated window after inflateReset()
- + * - Remove bit fields--back to byte structure for speed
- + * - Remove distance extra == 0 check in inflate_fast()--only helps for lengths
- + * - Change post-increments to pre-increments in inflate_fast(), PPC biased?
- + * - Add compile time option, POSTINC, to use post-increments instead (Intel?)
- + * - Make MATCH copy in inflate() much faster for when inflate_fast() not used
- + * - Use local copies of stream next and avail values, as well as local bit
- + * buffer and bit count in inflate()--for speed when inflate_fast() not used
- + *
- + * 1.2.beta4 1 Jan 2003
- + * - Split ptr - 257 statements in inflate_table() to avoid compiler warnings
- + * - Move a comment on output buffer sizes from inffast.c to inflate.c
- + * - Add comments in inffast.c to introduce the inflate_fast() routine
- + * - Rearrange window copies in inflate_fast() for speed and simplification
- + * - Unroll last copy for window match in inflate_fast()
- + * - Use local copies of window variables in inflate_fast() for speed
- + * - Pull out common wnext == 0 case for speed in inflate_fast()
- + * - Make op and len in inflate_fast() unsigned for consistency
- + * - Add FAR to lcode and dcode declarations in inflate_fast()
- + * - Simplified bad distance check in inflate_fast()
- + * - Added inflateBackInit(), inflateBack(), and inflateBackEnd() in new
- + * source file infback.c to provide a call-back interface to inflate for
- + * programs like gzip and unzip -- uses window as output buffer to avoid
- + * window copying
- + *
- + * 1.2.beta5 1 Jan 2003
- + * - Improved inflateBack() interface to allow the caller to provide initial
- + * input in strm.
- + * - Fixed stored blocks bug in inflateBack()
- + *
- + * 1.2.beta6 4 Jan 2003
- + * - Added comments in inffast.c on effectiveness of POSTINC
- + * - Typecasting all around to reduce compiler warnings
- + * - Changed loops from while (1) or do {} while (1) to for (;;), again to
- + * make compilers happy
- + * - Changed type of window in inflateBackInit() to unsigned char *
- + *
- + * 1.2.beta7 27 Jan 2003
- + * - Changed many types to unsigned or unsigned short to avoid warnings
- + * - Added inflateCopy() function
- + *
- + * 1.2.0 9 Mar 2003
- + * - Changed inflateBack() interface to provide separate opaque descriptors
- + * for the in() and out() functions
- + * - Changed inflateBack() argument and in_func typedef to swap the length
- + * and buffer address return values for the input function
- + * - Check next_in and next_out for Z_NULL on entry to inflate()
- + *
- + * The history for versions after 1.2.0 are in ChangeLog in zlib distribution.
- + */
- +
- +#include "zutil.h"
- +#include "inftrees.h"
- +#include "inflate.h"
- +#include "inffast.h"
- +
- +#ifdef MAKEFIXED
- +# ifndef BUILDFIXED
- +# define BUILDFIXED
- +# endif
- +#endif
- +
- +/* function prototypes */
- +local int inflateStateCheck OF((z_streamp strm));
- +local void fixedtables OF((struct inflate_state FAR *state));
- +local int updatewindow OF((z_streamp strm, const unsigned char FAR *end,
- + unsigned copy));
- +#ifdef BUILDFIXED
- + void makefixed OF((void));
- +#endif
- +local unsigned syncsearch OF((unsigned FAR *have, const unsigned char FAR *buf,
- + unsigned len));
- +
- +local int inflateStateCheck(strm)
- +z_streamp strm;
- +{
- + struct inflate_state FAR *state;
- + if (strm == Z_NULL ||
- + strm->zalloc == (alloc_func)0 || strm->zfree == (free_func)0)
- + return 1;
- + state = (struct inflate_state FAR *)strm->state;
- + if (state == Z_NULL || state->strm != strm ||
- + state->mode < HEAD || state->mode > SYNC)
- + return 1;
- + return 0;
- +}
- +
- +int ZEXPORT inflateResetKeep(strm)
- +z_streamp strm;
- +{
- + struct inflate_state FAR *state;
- +
- + if (inflateStateCheck(strm)) return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- + strm->total_in = strm->total_out = state->total = 0;
- + strm->msg = Z_NULL;
- + if (state->wrap) /* to support ill-conceived Java test suite */
- + strm->adler = state->wrap & 1;
- + state->mode = HEAD;
- + state->last = 0;
- + state->havedict = 0;
- + state->dmax = 32768U;
- + state->head = Z_NULL;
- + state->hold = 0;
- + state->bits = 0;
- + state->lencode = state->distcode = state->next = state->codes;
- + state->sane = 1;
- + state->back = -1;
- + Tracev((stderr, "inflate: reset\n"));
- + return Z_OK;
- +}
- +
- +int ZEXPORT inflateReset(strm)
- +z_streamp strm;
- +{
- + struct inflate_state FAR *state;
- +
- + if (inflateStateCheck(strm)) return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- + state->wsize = 0;
- + state->whave = 0;
- + state->wnext = 0;
- + return inflateResetKeep(strm);
- +}
- +
- +int ZEXPORT inflateReset2(strm, windowBits)
- +z_streamp strm;
- +int windowBits;
- +{
- + int wrap;
- + struct inflate_state FAR *state;
- +
- + /* get the state */
- + if (inflateStateCheck(strm)) return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- +
- + /* extract wrap request from windowBits parameter */
- + if (windowBits < 0) {
- + wrap = 0;
- + windowBits = -windowBits;
- + }
- + else {
- + wrap = (windowBits >> 4) + 5;
- +#ifdef GUNZIP
- + if (windowBits < 48)
- + windowBits &= 15;
- +#endif
- + }
- +
- + /* set number of window bits, free window if different */
- + if (windowBits && (windowBits < 8 || windowBits > 15))
- + return Z_STREAM_ERROR;
- + if (state->window != Z_NULL && state->wbits != (unsigned)windowBits) {
- + ZFREE(strm, state->window);
- + state->window = Z_NULL;
- + }
- +
- + /* update state and reset the rest of it */
- + state->wrap = wrap;
- + state->wbits = (unsigned)windowBits;
- + return inflateReset(strm);
- +}
- +
- +int ZEXPORT inflateInit2_(strm, windowBits, version, stream_size)
- +z_streamp strm;
- +int windowBits;
- +const char *version;
- +int stream_size;
- +{
- + int ret;
- + struct inflate_state FAR *state;
- +
- + if (version == Z_NULL || version[0] != ZLIB_VERSION[0] ||
- + stream_size != (int)(sizeof(z_stream)))
- + return Z_VERSION_ERROR;
- + if (strm == Z_NULL) return Z_STREAM_ERROR;
- + strm->msg = Z_NULL; /* in case we return an error */
- + if (strm->zalloc == (alloc_func)0) {
- +#ifdef Z_SOLO
- + return Z_STREAM_ERROR;
- +#else
- + strm->zalloc = zcalloc;
- + strm->opaque = (voidpf)0;
- +#endif
- + }
- + if (strm->zfree == (free_func)0)
- +#ifdef Z_SOLO
- + return Z_STREAM_ERROR;
- +#else
- + strm->zfree = zcfree;
- +#endif
- + state = (struct inflate_state FAR *)
- + ZALLOC(strm, 1, sizeof(struct inflate_state));
- + if (state == Z_NULL) return Z_MEM_ERROR;
- + Tracev((stderr, "inflate: allocated\n"));
- + strm->state = (struct internal_state FAR *)state;
- + state->strm = strm;
- + state->window = Z_NULL;
- + state->mode = HEAD; /* to pass state test in inflateReset2() */
- + ret = inflateReset2(strm, windowBits);
- + if (ret != Z_OK) {
- + ZFREE(strm, state);
- + strm->state = Z_NULL;
- + }
- + return ret;
- +}
- +
- +int ZEXPORT inflateInit_(strm, version, stream_size)
- +z_streamp strm;
- +const char *version;
- +int stream_size;
- +{
- + return inflateInit2_(strm, DEF_WBITS, version, stream_size);
- +}
- +
- +int ZEXPORT inflatePrime(strm, bits, value)
- +z_streamp strm;
- +int bits;
- +int value;
- +{
- + struct inflate_state FAR *state;
- +
- + if (inflateStateCheck(strm)) return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- + if (bits < 0) {
- + state->hold = 0;
- + state->bits = 0;
- + return Z_OK;
- + }
- + if (bits > 16 || state->bits + (uInt)bits > 32) return Z_STREAM_ERROR;
- + value &= (1L << bits) - 1;
- + state->hold += (unsigned)value << state->bits;
- + state->bits += (uInt)bits;
- + return Z_OK;
- +}
- +
- +/*
- + Return state with length and distance decoding tables and index sizes set to
- + fixed code decoding. Normally this returns fixed tables from inffixed.h.
- + If BUILDFIXED is defined, then instead this routine builds the tables the
- + first time it's called, and returns those tables the first time and
- + thereafter. This reduces the size of the code by about 2K bytes, in
- + exchange for a little execution time. However, BUILDFIXED should not be
- + used for threaded applications, since the rewriting of the tables and virgin
- + may not be thread-safe.
- + */
- +local void fixedtables(state)
- +struct inflate_state FAR *state;
- +{
- +#ifdef BUILDFIXED
- + static int virgin = 1;
- + static code *lenfix, *distfix;
- + static code fixed[544];
- +
- + /* build fixed huffman tables if first call (may not be thread safe) */
- + if (virgin) {
- + unsigned sym, bits;
- + static code *next;
- +
- + /* literal/length table */
- + sym = 0;
- + while (sym < 144) state->lens[sym++] = 8;
- + while (sym < 256) state->lens[sym++] = 9;
- + while (sym < 280) state->lens[sym++] = 7;
- + while (sym < 288) state->lens[sym++] = 8;
- + next = fixed;
- + lenfix = next;
- + bits = 9;
- + inflate_table(LENS, state->lens, 288, &(next), &(bits), state->work);
- +
- + /* distance table */
- + sym = 0;
- + while (sym < 32) state->lens[sym++] = 5;
- + distfix = next;
- + bits = 5;
- + inflate_table(DISTS, state->lens, 32, &(next), &(bits), state->work);
- +
- + /* do this just once */
- + virgin = 0;
- + }
- +#else /* !BUILDFIXED */
- +# include "inffixed.h"
- +#endif /* BUILDFIXED */
- + state->lencode = lenfix;
- + state->lenbits = 9;
- + state->distcode = distfix;
- + state->distbits = 5;
- +}
- +
- +#ifdef MAKEFIXED
- +#include <stdio.h>
- +
- +/*
- + Write out the inffixed.h that is #include'd above. Defining MAKEFIXED also
- + defines BUILDFIXED, so the tables are built on the fly. makefixed() writes
- + those tables to stdout, which would be piped to inffixed.h. A small program
- + can simply call makefixed to do this:
- +
- + void makefixed(void);
- +
- + int main(void)
- + {
- + makefixed();
- + return 0;
- + }
- +
- + Then that can be linked with zlib built with MAKEFIXED defined and run:
- +
- + a.out > inffixed.h
- + */
- +void makefixed()
- +{
- + unsigned low, size;
- + struct inflate_state state;
- +
- + fixedtables(&state);
- + puts(" /* inffixed.h -- table for decoding fixed codes");
- + puts(" * Generated automatically by makefixed().");
- + puts(" */");
- + puts("");
- + puts(" /* WARNING: this file should *not* be used by applications.");
- + puts(" It is part of the implementation of this library and is");
- + puts(" subject to change. Applications should only use zlib.h.");
- + puts(" */");
- + puts("");
- + size = 1U << 9;
- + printf(" static const code lenfix[%u] = {", size);
- + low = 0;
- + for (;;) {
- + if ((low % 7) == 0) printf("\n ");
- + printf("{%u,%u,%d}", (low & 127) == 99 ? 64 : state.lencode[low].op,
- + state.lencode[low].bits, state.lencode[low].val);
- + if (++low == size) break;
- + putchar(',');
- + }
- + puts("\n };");
- + size = 1U << 5;
- + printf("\n static const code distfix[%u] = {", size);
- + low = 0;
- + for (;;) {
- + if ((low % 6) == 0) printf("\n ");
- + printf("{%u,%u,%d}", state.distcode[low].op, state.distcode[low].bits,
- + state.distcode[low].val);
- + if (++low == size) break;
- + putchar(',');
- + }
- + puts("\n };");
- +}
- +#endif /* MAKEFIXED */
- +
- +/*
- + Update the window with the last wsize (normally 32K) bytes written before
- + returning. If window does not exist yet, create it. This is only called
- + when a window is already in use, or when output has been written during this
- + inflate call, but the end of the deflate stream has not been reached yet.
- + It is also called to create a window for dictionary data when a dictionary
- + is loaded.
- +
- + Providing output buffers larger than 32K to inflate() should provide a speed
- + advantage, since only the last 32K of output is copied to the sliding window
- + upon return from inflate(), and since all distances after the first 32K of
- + output will fall in the output data, making match copies simpler and faster.
- + The advantage may be dependent on the size of the processor's data caches.
- + */
- +local int updatewindow(strm, end, copy)
- +z_streamp strm;
- +const Bytef *end;
- +unsigned copy;
- +{
- + struct inflate_state FAR *state;
- + unsigned dist;
- +
- + state = (struct inflate_state FAR *)strm->state;
- +
- + /* if it hasn't been done already, allocate space for the window */
- + if (state->window == Z_NULL) {
- + state->window = (unsigned char FAR *)
- + ZALLOC(strm, 1U << state->wbits,
- + sizeof(unsigned char));
- + if (state->window == Z_NULL) return 1;
- + }
- +
- + /* if window not in use yet, initialize */
- + if (state->wsize == 0) {
- + state->wsize = 1U << state->wbits;
- + state->wnext = 0;
- + state->whave = 0;
- + }
- +
- + /* copy state->wsize or less output bytes into the circular window */
- + if (copy >= state->wsize) {
- + zmemcpy(state->window, end - state->wsize, state->wsize);
- + state->wnext = 0;
- + state->whave = state->wsize;
- + }
- + else {
- + dist = state->wsize - state->wnext;
- + if (dist > copy) dist = copy;
- + zmemcpy(state->window + state->wnext, end - copy, dist);
- + copy -= dist;
- + if (copy) {
- + zmemcpy(state->window, end - copy, copy);
- + state->wnext = copy;
- + state->whave = state->wsize;
- + }
- + else {
- + state->wnext += dist;
- + if (state->wnext == state->wsize) state->wnext = 0;
- + if (state->whave < state->wsize) state->whave += dist;
- + }
- + }
- + return 0;
- +}
- +
- +/* Macros for inflate(): */
- +
- +/* check function to use adler32() for zlib or crc32() for gzip */
- +#ifdef GUNZIP
- +# define UPDATE(check, buf, len) \
- + (state->flags ? crc32(check, buf, len) : adler32(check, buf, len))
- +#else
- +# define UPDATE(check, buf, len) adler32(check, buf, len)
- +#endif
- +
- +/* check macros for header crc */
- +#ifdef GUNZIP
- +# define CRC2(check, word) \
- + do { \
- + hbuf[0] = (unsigned char)(word); \
- + hbuf[1] = (unsigned char)((word) >> 8); \
- + check = crc32(check, hbuf, 2); \
- + } while (0)
- +
- +# define CRC4(check, word) \
- + do { \
- + hbuf[0] = (unsigned char)(word); \
- + hbuf[1] = (unsigned char)((word) >> 8); \
- + hbuf[2] = (unsigned char)((word) >> 16); \
- + hbuf[3] = (unsigned char)((word) >> 24); \
- + check = crc32(check, hbuf, 4); \
- + } while (0)
- +#endif
- +
- +/* Load registers with state in inflate() for speed */
- +#define LOAD() \
- + do { \
- + put = strm->next_out; \
- + left = strm->avail_out; \
- + next = strm->next_in; \
- + have = strm->avail_in; \
- + hold = state->hold; \
- + bits = state->bits; \
- + } while (0)
- +
- +/* Restore state from registers in inflate() */
- +#define RESTORE() \
- + do { \
- + strm->next_out = put; \
- + strm->avail_out = left; \
- + strm->next_in = next; \
- + strm->avail_in = have; \
- + state->hold = hold; \
- + state->bits = bits; \
- + } while (0)
- +
- +/* Clear the input bit accumulator */
- +#define INITBITS() \
- + do { \
- + hold = 0; \
- + bits = 0; \
- + } while (0)
- +
- +/* Get a byte of input into the bit accumulator, or return from inflate()
- + if there is no input available. */
- +#define PULLBYTE() \
- + do { \
- + if (have == 0) goto inf_leave; \
- + have--; \
- + hold += (unsigned long)(*next++) << bits; \
- + bits += 8; \
- + } while (0)
- +
- +/* Assure that there are at least n bits in the bit accumulator. If there is
- + not enough available input to do that, then return from inflate(). */
- +#define NEEDBITS(n) \
- + do { \
- + while (bits < (unsigned)(n)) \
- + PULLBYTE(); \
- + } while (0)
- +
- +/* Return the low n bits of the bit accumulator (n < 16) */
- +#define BITS(n) \
- + ((unsigned)hold & ((1U << (n)) - 1))
- +
- +/* Remove n bits from the bit accumulator */
- +#define DROPBITS(n) \
- + do { \
- + hold >>= (n); \
- + bits -= (unsigned)(n); \
- + } while (0)
- +
- +/* Remove zero to seven bits as needed to go to a byte boundary */
- +#define BYTEBITS() \
- + do { \
- + hold >>= bits & 7; \
- + bits -= bits & 7; \
- + } while (0)
- +
- +/*
- + inflate() uses a state machine to process as much input data and generate as
- + much output data as possible before returning. The state machine is
- + structured roughly as follows:
- +
- + for (;;) switch (state) {
- + ...
- + case STATEn:
- + if (not enough input data or output space to make progress)
- + return;
- + ... make progress ...
- + state = STATEm;
- + break;
- + ...
- + }
- +
- + so when inflate() is called again, the same case is attempted again, and
- + if the appropriate resources are provided, the machine proceeds to the
- + next state. The NEEDBITS() macro is usually the way the state evaluates
- + whether it can proceed or should return. NEEDBITS() does the return if
- + the requested bits are not available. The typical use of the BITS macros
- + is:
- +
- + NEEDBITS(n);
- + ... do something with BITS(n) ...
- + DROPBITS(n);
- +
- + where NEEDBITS(n) either returns from inflate() if there isn't enough
- + input left to load n bits into the accumulator, or it continues. BITS(n)
- + gives the low n bits in the accumulator. When done, DROPBITS(n) drops
- + the low n bits off the accumulator. INITBITS() clears the accumulator
- + and sets the number of available bits to zero. BYTEBITS() discards just
- + enough bits to put the accumulator on a byte boundary. After BYTEBITS()
- + and a NEEDBITS(8), then BITS(8) would return the next byte in the stream.
- +
- + NEEDBITS(n) uses PULLBYTE() to get an available byte of input, or to return
- + if there is no input available. The decoding of variable length codes uses
- + PULLBYTE() directly in order to pull just enough bytes to decode the next
- + code, and no more.
- +
- + Some states loop until they get enough input, making sure that enough
- + state information is maintained to continue the loop where it left off
- + if NEEDBITS() returns in the loop. For example, want, need, and keep
- + would all have to actually be part of the saved state in case NEEDBITS()
- + returns:
- +
- + case STATEw:
- + while (want < need) {
- + NEEDBITS(n);
- + keep[want++] = BITS(n);
- + DROPBITS(n);
- + }
- + state = STATEx;
- + case STATEx:
- +
- + As shown above, if the next state is also the next case, then the break
- + is omitted.
- +
- + A state may also return if there is not enough output space available to
- + complete that state. Those states are copying stored data, writing a
- + literal byte, and copying a matching string.
- +
- + When returning, a "goto inf_leave" is used to update the total counters,
- + update the check value, and determine whether any progress has been made
- + during that inflate() call in order to return the proper return code.
- + Progress is defined as a change in either strm->avail_in or strm->avail_out.
- + When there is a window, goto inf_leave will update the window with the last
- + output written. If a goto inf_leave occurs in the middle of decompression
- + and there is no window currently, goto inf_leave will create one and copy
- + output to the window for the next call of inflate().
- +
- + In this implementation, the flush parameter of inflate() only affects the
- + return code (per zlib.h). inflate() always writes as much as possible to
- + strm->next_out, given the space available and the provided input--the effect
- + documented in zlib.h of Z_SYNC_FLUSH. Furthermore, inflate() always defers
- + the allocation of and copying into a sliding window until necessary, which
- + provides the effect documented in zlib.h for Z_FINISH when the entire input
- + stream available. So the only thing the flush parameter actually does is:
- + when flush is set to Z_FINISH, inflate() cannot return Z_OK. Instead it
- + will return Z_BUF_ERROR if it has not reached the end of the stream.
- + */
- +
- +int ZEXPORT inflate(strm, flush)
- +z_streamp strm;
- +int flush;
- +{
- + struct inflate_state FAR *state;
- + z_const unsigned char FAR *next; /* next input */
- + unsigned char FAR *put; /* next output */
- + unsigned have, left; /* available input and output */
- + unsigned long hold; /* bit buffer */
- + unsigned bits; /* bits in bit buffer */
- + unsigned in, out; /* save starting available input and output */
- + unsigned copy; /* number of stored or match bytes to copy */
- + unsigned char FAR *from; /* where to copy match bytes from */
- + code here; /* current decoding table entry */
- + code last; /* parent table entry */
- + unsigned len; /* length to copy for repeats, bits to drop */
- + int ret; /* return code */
- +#ifdef GUNZIP
- + unsigned char hbuf[4]; /* buffer for gzip header crc calculation */
- +#endif
- + static const unsigned short order[19] = /* permutation of code lengths */
- + {16, 17, 18, 0, 8, 7, 9, 6, 10, 5, 11, 4, 12, 3, 13, 2, 14, 1, 15};
- +
- + if (inflateStateCheck(strm) || strm->next_out == Z_NULL ||
- + (strm->next_in == Z_NULL && strm->avail_in != 0))
- + return Z_STREAM_ERROR;
- +
- + state = (struct inflate_state FAR *)strm->state;
- + if (state->mode == TYPE) state->mode = TYPEDO; /* skip check */
- + LOAD();
- + in = have;
- + out = left;
- + ret = Z_OK;
- + for (;;)
- + switch (state->mode) {
- + case HEAD:
- + if (state->wrap == 0) {
- + state->mode = TYPEDO;
- + break;
- + }
- + NEEDBITS(16);
- +#ifdef GUNZIP
- + if ((state->wrap & 2) && hold == 0x8b1f) { /* gzip header */
- + if (state->wbits == 0)
- + state->wbits = 15;
- + state->check = crc32(0L, Z_NULL, 0);
- + CRC2(state->check, hold);
- + INITBITS();
- + state->mode = FLAGS;
- + break;
- + }
- + state->flags = 0; /* expect zlib header */
- + if (state->head != Z_NULL)
- + state->head->done = -1;
- + if (!(state->wrap & 1) || /* check if zlib header allowed */
- +#else
- + if (
- +#endif
- + ((BITS(8) << 8) + (hold >> 8)) % 31) {
- + strm->msg = (char *)"incorrect header check";
- + state->mode = BAD;
- + break;
- + }
- + if (BITS(4) != Z_DEFLATED) {
- + strm->msg = (char *)"unknown compression method";
- + state->mode = BAD;
- + break;
- + }
- + DROPBITS(4);
- + len = BITS(4) + 8;
- + if (state->wbits == 0)
- + state->wbits = len;
- + if (len > 15 || len > state->wbits) {
- + strm->msg = (char *)"invalid window size";
- + state->mode = BAD;
- + break;
- + }
- + state->dmax = 1U << len;
- + Tracev((stderr, "inflate: zlib header ok\n"));
- + strm->adler = state->check = adler32(0L, Z_NULL, 0);
- + state->mode = hold & 0x200 ? DICTID : TYPE;
- + INITBITS();
- + break;
- +#ifdef GUNZIP
- + case FLAGS:
- + NEEDBITS(16);
- + state->flags = (int)(hold);
- + if ((state->flags & 0xff) != Z_DEFLATED) {
- + strm->msg = (char *)"unknown compression method";
- + state->mode = BAD;
- + break;
- + }
- + if (state->flags & 0xe000) {
- + strm->msg = (char *)"unknown header flags set";
- + state->mode = BAD;
- + break;
- + }
- + if (state->head != Z_NULL)
- + state->head->text = (int)((hold >> 8) & 1);
- + if ((state->flags & 0x0200) && (state->wrap & 4))
- + CRC2(state->check, hold);
- + INITBITS();
- + state->mode = TIME;
- + case TIME:
- + NEEDBITS(32);
- + if (state->head != Z_NULL)
- + state->head->time = hold;
- + if ((state->flags & 0x0200) && (state->wrap & 4))
- + CRC4(state->check, hold);
- + INITBITS();
- + state->mode = OS;
- + case OS:
- + NEEDBITS(16);
- + if (state->head != Z_NULL) {
- + state->head->xflags = (int)(hold & 0xff);
- + state->head->os = (int)(hold >> 8);
- + }
- + if ((state->flags & 0x0200) && (state->wrap & 4))
- + CRC2(state->check, hold);
- + INITBITS();
- + state->mode = EXLEN;
- + case EXLEN:
- + if (state->flags & 0x0400) {
- + NEEDBITS(16);
- + state->length = (unsigned)(hold);
- + if (state->head != Z_NULL)
- + state->head->extra_len = (unsigned)hold;
- + if ((state->flags & 0x0200) && (state->wrap & 4))
- + CRC2(state->check, hold);
- + INITBITS();
- + }
- + else if (state->head != Z_NULL)
- + state->head->extra = Z_NULL;
- + state->mode = EXTRA;
- + case EXTRA:
- + if (state->flags & 0x0400) {
- + copy = state->length;
- + if (copy > have) copy = have;
- + if (copy) {
- + if (state->head != Z_NULL &&
- + state->head->extra != Z_NULL) {
- + len = state->head->extra_len - state->length;
- + zmemcpy(state->head->extra + len, next,
- + len + copy > state->head->extra_max ?
- + state->head->extra_max - len : copy);
- + }
- + if ((state->flags & 0x0200) && (state->wrap & 4))
- + state->check = crc32(state->check, next, copy);
- + have -= copy;
- + next += copy;
- + state->length -= copy;
- + }
- + if (state->length) goto inf_leave;
- + }
- + state->length = 0;
- + state->mode = NAME;
- + case NAME:
- + if (state->flags & 0x0800) {
- + if (have == 0) goto inf_leave;
- + copy = 0;
- + do {
- + len = (unsigned)(next[copy++]);
- + if (state->head != Z_NULL &&
- + state->head->name != Z_NULL &&
- + state->length < state->head->name_max)
- + state->head->name[state->length++] = (Bytef)len;
- + } while (len && copy < have);
- + if ((state->flags & 0x0200) && (state->wrap & 4))
- + state->check = crc32(state->check, next, copy);
- + have -= copy;
- + next += copy;
- + if (len) goto inf_leave;
- + }
- + else if (state->head != Z_NULL)
- + state->head->name = Z_NULL;
- + state->length = 0;
- + state->mode = COMMENT;
- + case COMMENT:
- + if (state->flags & 0x1000) {
- + if (have == 0) goto inf_leave;
- + copy = 0;
- + do {
- + len = (unsigned)(next[copy++]);
- + if (state->head != Z_NULL &&
- + state->head->comment != Z_NULL &&
- + state->length < state->head->comm_max)
- + state->head->comment[state->length++] = (Bytef)len;
- + } while (len && copy < have);
- + if ((state->flags & 0x0200) && (state->wrap & 4))
- + state->check = crc32(state->check, next, copy);
- + have -= copy;
- + next += copy;
- + if (len) goto inf_leave;
- + }
- + else if (state->head != Z_NULL)
- + state->head->comment = Z_NULL;
- + state->mode = HCRC;
- + case HCRC:
- + if (state->flags & 0x0200) {
- + NEEDBITS(16);
- + if ((state->wrap & 4) && hold != (state->check & 0xffff)) {
- + strm->msg = (char *)"header crc mismatch";
- + state->mode = BAD;
- + break;
- + }
- + INITBITS();
- + }
- + if (state->head != Z_NULL) {
- + state->head->hcrc = (int)((state->flags >> 9) & 1);
- + state->head->done = 1;
- + }
- + strm->adler = state->check = crc32(0L, Z_NULL, 0);
- + state->mode = TYPE;
- + break;
- +#endif
- + case DICTID:
- + NEEDBITS(32);
- + strm->adler = state->check = ZSWAP32(hold);
- + INITBITS();
- + state->mode = DICT;
- + case DICT:
- + if (state->havedict == 0) {
- + RESTORE();
- + return Z_NEED_DICT;
- + }
- + strm->adler = state->check = adler32(0L, Z_NULL, 0);
- + state->mode = TYPE;
- + case TYPE:
- + if (flush == Z_BLOCK || flush == Z_TREES) goto inf_leave;
- + case TYPEDO:
- + if (state->last) {
- + BYTEBITS();
- + state->mode = CHECK;
- + break;
- + }
- + NEEDBITS(3);
- + state->last = BITS(1);
- + DROPBITS(1);
- + switch (BITS(2)) {
- + case 0: /* stored block */
- + Tracev((stderr, "inflate: stored block%s\n",
- + state->last ? " (last)" : ""));
- + state->mode = STORED;
- + break;
- + case 1: /* fixed block */
- + fixedtables(state);
- + Tracev((stderr, "inflate: fixed codes block%s\n",
- + state->last ? " (last)" : ""));
- + state->mode = LEN_; /* decode codes */
- + if (flush == Z_TREES) {
- + DROPBITS(2);
- + goto inf_leave;
- + }
- + break;
- + case 2: /* dynamic block */
- + Tracev((stderr, "inflate: dynamic codes block%s\n",
- + state->last ? " (last)" : ""));
- + state->mode = TABLE;
- + break;
- + case 3:
- + strm->msg = (char *)"invalid block type";
- + state->mode = BAD;
- + }
- + DROPBITS(2);
- + break;
- + case STORED:
- + BYTEBITS(); /* go to byte boundary */
- + NEEDBITS(32);
- + if ((hold & 0xffff) != ((hold >> 16) ^ 0xffff)) {
- + strm->msg = (char *)"invalid stored block lengths";
- + state->mode = BAD;
- + break;
- + }
- + state->length = (unsigned)hold & 0xffff;
- + Tracev((stderr, "inflate: stored length %u\n",
- + state->length));
- + INITBITS();
- + state->mode = COPY_;
- + if (flush == Z_TREES) goto inf_leave;
- + case COPY_:
- + state->mode = COPY;
- + case COPY:
- + copy = state->length;
- + if (copy) {
- + if (copy > have) copy = have;
- + if (copy > left) copy = left;
- + if (copy == 0) goto inf_leave;
- + zmemcpy(put, next, copy);
- + have -= copy;
- + next += copy;
- + left -= copy;
- + put += copy;
- + state->length -= copy;
- + break;
- + }
- + Tracev((stderr, "inflate: stored end\n"));
- + state->mode = TYPE;
- + break;
- + case TABLE:
- + NEEDBITS(14);
- + state->nlen = BITS(5) + 257;
- + DROPBITS(5);
- + state->ndist = BITS(5) + 1;
- + DROPBITS(5);
- + state->ncode = BITS(4) + 4;
- + DROPBITS(4);
- +#ifndef PKZIP_BUG_WORKAROUND
- + if (state->nlen > 286 || state->ndist > 30) {
- + strm->msg = (char *)"too many length or distance symbols";
- + state->mode = BAD;
- + break;
- + }
- +#endif
- + Tracev((stderr, "inflate: table sizes ok\n"));
- + state->have = 0;
- + state->mode = LENLENS;
- + case LENLENS:
- + while (state->have < state->ncode) {
- + NEEDBITS(3);
- + state->lens[order[state->have++]] = (unsigned short)BITS(3);
- + DROPBITS(3);
- + }
- + while (state->have < 19)
- + state->lens[order[state->have++]] = 0;
- + state->next = state->codes;
- + state->lencode = (const code FAR *)(state->next);
- + state->lenbits = 7;
- + ret = inflate_table(CODES, state->lens, 19, &(state->next),
- + &(state->lenbits), state->work);
- + if (ret) {
- + strm->msg = (char *)"invalid code lengths set";
- + state->mode = BAD;
- + break;
- + }
- + Tracev((stderr, "inflate: code lengths ok\n"));
- + state->have = 0;
- + state->mode = CODELENS;
- + case CODELENS:
- + while (state->have < state->nlen + state->ndist) {
- + for (;;) {
- + here = state->lencode[BITS(state->lenbits)];
- + if ((unsigned)(here.bits) <= bits) break;
- + PULLBYTE();
- + }
- + if (here.val < 16) {
- + DROPBITS(here.bits);
- + state->lens[state->have++] = here.val;
- + }
- + else {
- + if (here.val == 16) {
- + NEEDBITS(here.bits + 2);
- + DROPBITS(here.bits);
- + if (state->have == 0) {
- + strm->msg = (char *)"invalid bit length repeat";
- + state->mode = BAD;
- + break;
- + }
- + len = state->lens[state->have - 1];
- + copy = 3 + BITS(2);
- + DROPBITS(2);
- + }
- + else if (here.val == 17) {
- + NEEDBITS(here.bits + 3);
- + DROPBITS(here.bits);
- + len = 0;
- + copy = 3 + BITS(3);
- + DROPBITS(3);
- + }
- + else {
- + NEEDBITS(here.bits + 7);
- + DROPBITS(here.bits);
- + len = 0;
- + copy = 11 + BITS(7);
- + DROPBITS(7);
- + }
- + if (state->have + copy > state->nlen + state->ndist) {
- + strm->msg = (char *)"invalid bit length repeat";
- + state->mode = BAD;
- + break;
- + }
- + while (copy--)
- + state->lens[state->have++] = (unsigned short)len;
- + }
- + }
- +
- + /* handle error breaks in while */
- + if (state->mode == BAD) break;
- +
- + /* check for end-of-block code (better have one) */
- + if (state->lens[256] == 0) {
- + strm->msg = (char *)"invalid code -- missing end-of-block";
- + state->mode = BAD;
- + break;
- + }
- +
- + /* build code tables -- note: do not change the lenbits or distbits
- + values here (9 and 6) without reading the comments in inftrees.h
- + concerning the ENOUGH constants, which depend on those values */
- + state->next = state->codes;
- + state->lencode = (const code FAR *)(state->next);
- + state->lenbits = 9;
- + ret = inflate_table(LENS, state->lens, state->nlen, &(state->next),
- + &(state->lenbits), state->work);
- + if (ret) {
- + strm->msg = (char *)"invalid literal/lengths set";
- + state->mode = BAD;
- + break;
- + }
- + state->distcode = (const code FAR *)(state->next);
- + state->distbits = 6;
- + ret = inflate_table(DISTS, state->lens + state->nlen, state->ndist,
- + &(state->next), &(state->distbits), state->work);
- + if (ret) {
- + strm->msg = (char *)"invalid distances set";
- + state->mode = BAD;
- + break;
- + }
- + Tracev((stderr, "inflate: codes ok\n"));
- + state->mode = LEN_;
- + if (flush == Z_TREES) goto inf_leave;
- + case LEN_:
- + state->mode = LEN;
- + case LEN:
- + if (have >= 6 && left >= 258) {
- + RESTORE();
- + inflate_fast(strm, out);
- + LOAD();
- + if (state->mode == TYPE)
- + state->back = -1;
- + break;
- + }
- + state->back = 0;
- + for (;;) {
- + here = state->lencode[BITS(state->lenbits)];
- + if ((unsigned)(here.bits) <= bits) break;
- + PULLBYTE();
- + }
- + if (here.op && (here.op & 0xf0) == 0) {
- + last = here;
- + for (;;) {
- + here = state->lencode[last.val +
- + (BITS(last.bits + last.op) >> last.bits)];
- + if ((unsigned)(last.bits + here.bits) <= bits) break;
- + PULLBYTE();
- + }
- + DROPBITS(last.bits);
- + state->back += last.bits;
- + }
- + DROPBITS(here.bits);
- + state->back += here.bits;
- + state->length = (unsigned)here.val;
- + if ((int)(here.op) == 0) {
- + Tracevv((stderr, here.val >= 0x20 && here.val < 0x7f ?
- + "inflate: literal '%c'\n" :
- + "inflate: literal 0x%02x\n", here.val));
- + state->mode = LIT;
- + break;
- + }
- + if (here.op & 32) {
- + Tracevv((stderr, "inflate: end of block\n"));
- + state->back = -1;
- + state->mode = TYPE;
- + break;
- + }
- + if (here.op & 64) {
- + strm->msg = (char *)"invalid literal/length code";
- + state->mode = BAD;
- + break;
- + }
- + state->extra = (unsigned)(here.op) & 15;
- + state->mode = LENEXT;
- + case LENEXT:
- + if (state->extra) {
- + NEEDBITS(state->extra);
- + state->length += BITS(state->extra);
- + DROPBITS(state->extra);
- + state->back += state->extra;
- + }
- + Tracevv((stderr, "inflate: length %u\n", state->length));
- + state->was = state->length;
- + state->mode = DIST;
- + case DIST:
- + for (;;) {
- + here = state->distcode[BITS(state->distbits)];
- + if ((unsigned)(here.bits) <= bits) break;
- + PULLBYTE();
- + }
- + if ((here.op & 0xf0) == 0) {
- + last = here;
- + for (;;) {
- + here = state->distcode[last.val +
- + (BITS(last.bits + last.op) >> last.bits)];
- + if ((unsigned)(last.bits + here.bits) <= bits) break;
- + PULLBYTE();
- + }
- + DROPBITS(last.bits);
- + state->back += last.bits;
- + }
- + DROPBITS(here.bits);
- + state->back += here.bits;
- + if (here.op & 64) {
- + strm->msg = (char *)"invalid distance code";
- + state->mode = BAD;
- + break;
- + }
- + state->offset = (unsigned)here.val;
- + state->extra = (unsigned)(here.op) & 15;
- + state->mode = DISTEXT;
- + case DISTEXT:
- + if (state->extra) {
- + NEEDBITS(state->extra);
- + state->offset += BITS(state->extra);
- + DROPBITS(state->extra);
- + state->back += state->extra;
- + }
- +#ifdef INFLATE_STRICT
- + if (state->offset > state->dmax) {
- + strm->msg = (char *)"invalid distance too far back";
- + state->mode = BAD;
- + break;
- + }
- +#endif
- + Tracevv((stderr, "inflate: distance %u\n", state->offset));
- + state->mode = MATCH;
- + case MATCH:
- + if (left == 0) goto inf_leave;
- + copy = out - left;
- + if (state->offset > copy) { /* copy from window */
- + copy = state->offset - copy;
- + if (copy > state->whave) {
- + if (state->sane) {
- + strm->msg = (char *)"invalid distance too far back";
- + state->mode = BAD;
- + break;
- + }
- +#ifdef INFLATE_ALLOW_INVALID_DISTANCE_TOOFAR_ARRR
- + Trace((stderr, "inflate.c too far\n"));
- + copy -= state->whave;
- + if (copy > state->length) copy = state->length;
- + if (copy > left) copy = left;
- + left -= copy;
- + state->length -= copy;
- + do {
- + *put++ = 0;
- + } while (--copy);
- + if (state->length == 0) state->mode = LEN;
- + break;
- +#endif
- + }
- + if (copy > state->wnext) {
- + copy -= state->wnext;
- + from = state->window + (state->wsize - copy);
- + }
- + else
- + from = state->window + (state->wnext - copy);
- + if (copy > state->length) copy = state->length;
- + }
- + else { /* copy from output */
- + from = put - state->offset;
- + copy = state->length;
- + }
- + if (copy > left) copy = left;
- + left -= copy;
- + state->length -= copy;
- + do {
- + *put++ = *from++;
- + } while (--copy);
- + if (state->length == 0) state->mode = LEN;
- + break;
- + case LIT:
- + if (left == 0) goto inf_leave;
- + *put++ = (unsigned char)(state->length);
- + left--;
- + state->mode = LEN;
- + break;
- + case CHECK:
- + if (state->wrap) {
- + NEEDBITS(32);
- + out -= left;
- + strm->total_out += out;
- + state->total += out;
- + if ((state->wrap & 4) && out)
- + strm->adler = state->check =
- + UPDATE(state->check, put - out, out);
- + out = left;
- + if ((state->wrap & 4) && (
- +#ifdef GUNZIP
- + state->flags ? hold :
- +#endif
- + ZSWAP32(hold)) != state->check) {
- + strm->msg = (char *)"incorrect data check";
- + state->mode = BAD;
- + break;
- + }
- + INITBITS();
- + Tracev((stderr, "inflate: check matches trailer\n"));
- + }
- +#ifdef GUNZIP
- + state->mode = LENGTH;
- + case LENGTH:
- + if (state->wrap && state->flags) {
- + NEEDBITS(32);
- + if (hold != (state->total & 0xffffffffUL)) {
- + strm->msg = (char *)"incorrect length check";
- + state->mode = BAD;
- + break;
- + }
- + INITBITS();
- + Tracev((stderr, "inflate: length matches trailer\n"));
- + }
- +#endif
- + state->mode = DONE;
- + case DONE:
- + ret = Z_STREAM_END;
- + goto inf_leave;
- + case BAD:
- + ret = Z_DATA_ERROR;
- + goto inf_leave;
- + case MEM:
- + return Z_MEM_ERROR;
- + case SYNC:
- + default:
- + return Z_STREAM_ERROR;
- + }
- +
- + /*
- + Return from inflate(), updating the total counts and the check value.
- + If there was no progress during the inflate() call, return a buffer
- + error. Call updatewindow() to create and/or update the window state.
- + Note: a memory error from inflate() is non-recoverable.
- + */
- + inf_leave:
- + RESTORE();
- + if (state->wsize || (out != strm->avail_out && state->mode < BAD &&
- + (state->mode < CHECK || flush != Z_FINISH)))
- + if (updatewindow(strm, strm->next_out, out - strm->avail_out)) {
- + state->mode = MEM;
- + return Z_MEM_ERROR;
- + }
- + in -= strm->avail_in;
- + out -= strm->avail_out;
- + strm->total_in += in;
- + strm->total_out += out;
- + state->total += out;
- + if ((state->wrap & 4) && out)
- + strm->adler = state->check =
- + UPDATE(state->check, strm->next_out - out, out);
- + strm->data_type = (int)state->bits + (state->last ? 64 : 0) +
- + (state->mode == TYPE ? 128 : 0) +
- + (state->mode == LEN_ || state->mode == COPY_ ? 256 : 0);
- + if (((in == 0 && out == 0) || flush == Z_FINISH) && ret == Z_OK)
- + ret = Z_BUF_ERROR;
- + return ret;
- +}
- +
- +int ZEXPORT inflateEnd(strm)
- +z_streamp strm;
- +{
- + struct inflate_state FAR *state;
- + if (inflateStateCheck(strm))
- + return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- + if (state->window != Z_NULL) ZFREE(strm, state->window);
- + ZFREE(strm, strm->state);
- + strm->state = Z_NULL;
- + Tracev((stderr, "inflate: end\n"));
- + return Z_OK;
- +}
- +
- +int ZEXPORT inflateGetDictionary(strm, dictionary, dictLength)
- +z_streamp strm;
- +Bytef *dictionary;
- +uInt *dictLength;
- +{
- + struct inflate_state FAR *state;
- +
- + /* check state */
- + if (inflateStateCheck(strm)) return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- +
- + /* copy dictionary */
- + if (state->whave && dictionary != Z_NULL) {
- + zmemcpy(dictionary, state->window + state->wnext,
- + state->whave - state->wnext);
- + zmemcpy(dictionary + state->whave - state->wnext,
- + state->window, state->wnext);
- + }
- + if (dictLength != Z_NULL)
- + *dictLength = state->whave;
- + return Z_OK;
- +}
- +
- +int ZEXPORT inflateSetDictionary(strm, dictionary, dictLength)
- +z_streamp strm;
- +const Bytef *dictionary;
- +uInt dictLength;
- +{
- + struct inflate_state FAR *state;
- + unsigned long dictid;
- + int ret;
- +
- + /* check state */
- + if (inflateStateCheck(strm)) return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- + if (state->wrap != 0 && state->mode != DICT)
- + return Z_STREAM_ERROR;
- +
- + /* check for correct dictionary identifier */
- + if (state->mode == DICT) {
- + dictid = adler32(0L, Z_NULL, 0);
- + dictid = adler32(dictid, dictionary, dictLength);
- + if (dictid != state->check)
- + return Z_DATA_ERROR;
- + }
- +
- + /* copy dictionary to window using updatewindow(), which will amend the
- + existing dictionary if appropriate */
- + ret = updatewindow(strm, dictionary + dictLength, dictLength);
- + if (ret) {
- + state->mode = MEM;
- + return Z_MEM_ERROR;
- + }
- + state->havedict = 1;
- + Tracev((stderr, "inflate: dictionary set\n"));
- + return Z_OK;
- +}
- +
- +int ZEXPORT inflateGetHeader(strm, head)
- +z_streamp strm;
- +gz_headerp head;
- +{
- + struct inflate_state FAR *state;
- +
- + /* check state */
- + if (inflateStateCheck(strm)) return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- + if ((state->wrap & 2) == 0) return Z_STREAM_ERROR;
- +
- + /* save header structure */
- + state->head = head;
- + head->done = 0;
- + return Z_OK;
- +}
- +
- +/*
- + Search buf[0..len-1] for the pattern: 0, 0, 0xff, 0xff. Return when found
- + or when out of input. When called, *have is the number of pattern bytes
- + found in order so far, in 0..3. On return *have is updated to the new
- + state. If on return *have equals four, then the pattern was found and the
- + return value is how many bytes were read including the last byte of the
- + pattern. If *have is less than four, then the pattern has not been found
- + yet and the return value is len. In the latter case, syncsearch() can be
- + called again with more data and the *have state. *have is initialized to
- + zero for the first call.
- + */
- +local unsigned syncsearch(have, buf, len)
- +unsigned FAR *have;
- +const unsigned char FAR *buf;
- +unsigned len;
- +{
- + unsigned got;
- + unsigned next;
- +
- + got = *have;
- + next = 0;
- + while (next < len && got < 4) {
- + if ((int)(buf[next]) == (got < 2 ? 0 : 0xff))
- + got++;
- + else if (buf[next])
- + got = 0;
- + else
- + got = 4 - got;
- + next++;
- + }
- + *have = got;
- + return next;
- +}
- +
- +int ZEXPORT inflateSync(strm)
- +z_streamp strm;
- +{
- + unsigned len; /* number of bytes to look at or looked at */
- + unsigned long in, out; /* temporary to save total_in and total_out */
- + unsigned char buf[4]; /* to restore bit buffer to byte string */
- + struct inflate_state FAR *state;
- +
- + /* check parameters */
- + if (inflateStateCheck(strm)) return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- + if (strm->avail_in == 0 && state->bits < 8) return Z_BUF_ERROR;
- +
- + /* if first time, start search in bit buffer */
- + if (state->mode != SYNC) {
- + state->mode = SYNC;
- + state->hold <<= state->bits & 7;
- + state->bits -= state->bits & 7;
- + len = 0;
- + while (state->bits >= 8) {
- + buf[len++] = (unsigned char)(state->hold);
- + state->hold >>= 8;
- + state->bits -= 8;
- + }
- + state->have = 0;
- + syncsearch(&(state->have), buf, len);
- + }
- +
- + /* search available input */
- + len = syncsearch(&(state->have), strm->next_in, strm->avail_in);
- + strm->avail_in -= len;
- + strm->next_in += len;
- + strm->total_in += len;
- +
- + /* return no joy or set up to restart inflate() on a new block */
- + if (state->have != 4) return Z_DATA_ERROR;
- + in = strm->total_in; out = strm->total_out;
- + inflateReset(strm);
- + strm->total_in = in; strm->total_out = out;
- + state->mode = TYPE;
- + return Z_OK;
- +}
- +
- +/*
- + Returns true if inflate is currently at the end of a block generated by
- + Z_SYNC_FLUSH or Z_FULL_FLUSH. This function is used by one PPP
- + implementation to provide an additional safety check. PPP uses
- + Z_SYNC_FLUSH but removes the length bytes of the resulting empty stored
- + block. When decompressing, PPP checks that at the end of input packet,
- + inflate is waiting for these length bytes.
- + */
- +int ZEXPORT inflateSyncPoint(strm)
- +z_streamp strm;
- +{
- + struct inflate_state FAR *state;
- +
- + if (inflateStateCheck(strm)) return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- + return state->mode == STORED && state->bits == 0;
- +}
- +
- +int ZEXPORT inflateCopy(dest, source)
- +z_streamp dest;
- +z_streamp source;
- +{
- + struct inflate_state FAR *state;
- + struct inflate_state FAR *copy;
- + unsigned char FAR *window;
- + unsigned wsize;
- +
- + /* check input */
- + if (inflateStateCheck(source) || dest == Z_NULL)
- + return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)source->state;
- +
- + /* allocate space */
- + copy = (struct inflate_state FAR *)
- + ZALLOC(source, 1, sizeof(struct inflate_state));
- + if (copy == Z_NULL) return Z_MEM_ERROR;
- + window = Z_NULL;
- + if (state->window != Z_NULL) {
- + window = (unsigned char FAR *)
- + ZALLOC(source, 1U << state->wbits, sizeof(unsigned char));
- + if (window == Z_NULL) {
- + ZFREE(source, copy);
- + return Z_MEM_ERROR;
- + }
- + }
- +
- + /* copy state */
- + zmemcpy((voidpf)dest, (voidpf)source, sizeof(z_stream));
- + zmemcpy((voidpf)copy, (voidpf)state, sizeof(struct inflate_state));
- + copy->strm = dest;
- + if (state->lencode >= state->codes &&
- + state->lencode <= state->codes + ENOUGH - 1) {
- + copy->lencode = copy->codes + (state->lencode - state->codes);
- + copy->distcode = copy->codes + (state->distcode - state->codes);
- + }
- + copy->next = copy->codes + (state->next - state->codes);
- + if (window != Z_NULL) {
- + wsize = 1U << state->wbits;
- + zmemcpy(window, state->window, wsize);
- + }
- + copy->window = window;
- + dest->state = (struct internal_state FAR *)copy;
- + return Z_OK;
- +}
- +
- +int ZEXPORT inflateUndermine(strm, subvert)
- +z_streamp strm;
- +int subvert;
- +{
- + struct inflate_state FAR *state;
- +
- + if (inflateStateCheck(strm)) return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- +#ifdef INFLATE_ALLOW_INVALID_DISTANCE_TOOFAR_ARRR
- + state->sane = !subvert;
- + return Z_OK;
- +#else
- + (void)subvert;
- + state->sane = 1;
- + return Z_DATA_ERROR;
- +#endif
- +}
- +
- +int ZEXPORT inflateValidate(strm, check)
- +z_streamp strm;
- +int check;
- +{
- + struct inflate_state FAR *state;
- +
- + if (inflateStateCheck(strm)) return Z_STREAM_ERROR;
- + state = (struct inflate_state FAR *)strm->state;
- + if (check)
- + state->wrap |= 4;
- + else
- + state->wrap &= ~4;
- + return Z_OK;
- +}
- +
- +long ZEXPORT inflateMark(strm)
- +z_streamp strm;
- +{
- + struct inflate_state FAR *state;
- +
- + if (inflateStateCheck(strm))
- + return -(1L << 16);
- + state = (struct inflate_state FAR *)strm->state;
- + return (long)(((unsigned long)((long)state->back)) << 16) +
- + (state->mode == COPY ? state->length :
- + (state->mode == MATCH ? state->was - state->length : 0));
- +}
- +
- +unsigned long ZEXPORT inflateCodesUsed(strm)
- +z_streamp strm;
- +{
- + struct inflate_state FAR *state;
- + if (inflateStateCheck(strm)) return (unsigned long)-1;
- + state = (struct inflate_state FAR *)strm->state;
- + return (unsigned long)(state->next - state->codes);
- +}
- From 247147654fe5cd11cf15d8dff91440405ea57040 Mon Sep 17 00:00:00 2001
- From: Simon Hosie <simon.hosie@arm.com>
- Date: Wed, 12 Apr 2017 15:44:21 -0700
- Subject: [PATCH 2/2] Inflate using wider loads and stores
- In inflate_fast() the output pointer always has plenty of room to write. This
- means that so long as the target is capable, wide un-aligned loads and stores
- can be used to transfer several bytes at once. When the reference distance is
- too short simply unroll the data a little to increase the distance.
- Change-Id: I59854eb25d2b1e43561c8a2afaf9175bf10cf674
- ---
- contrib/arm/chunkcopy.h | 279 ++++++++++++++++++++++++++++++++++++++++++++++++
- contrib/arm/inffast.c | 96 +++++++----------
- contrib/arm/inflate.c | 22 ++--
- 3 files changed, 335 insertions(+), 62 deletions(-)
- create mode 100644 contrib/arm/chunkcopy.h
- diff --git a/contrib/arm/chunkcopy.h b/contrib/arm/chunkcopy.h
- new file mode 100644
- index 00000000..2d6fd6f9
- --- /dev/null
- +++ b/contrib/arm/chunkcopy.h
- @@ -0,0 +1,279 @@
- +/* chunkcopy.h -- fast copies and sets
- + * Copyright (C) 2017 ARM, Inc.
- + * For conditions of distribution and use, see copyright notice in zlib.h
- + */
- +
- +#ifndef CHUNKCOPY_H
- +#define CHUNKCOPY_H
- +
- +#include "zutil.h"
- +#include <arm_neon.h>
- +
- +#if __STDC_VERSION__ >= 199901L
- +#define Z_RESTRICT restrict
- +#else
- +#define Z_RESTRICT
- +#endif
- +
- +typedef uint8x16_t chunkcopy_chunk_t;
- +#define CHUNKCOPY_CHUNK_SIZE sizeof(chunkcopy_chunk_t)
- +
- +/*
- + Ask the compiler to perform a wide, unaligned load with an machine
- + instruction appropriate for the chunkcopy_chunk_t type.
- + */
- +static inline chunkcopy_chunk_t loadchunk(const unsigned char FAR *s) {
- + chunkcopy_chunk_t c;
- + __builtin_memcpy(&c, s, sizeof(c));
- + return c;
- +}
- +
- +/*
- + Ask the compiler to perform a wide, unaligned store with an machine
- + instruction appropriate for the chunkcopy_chunk_t type.
- + */
- +static inline void storechunk(unsigned char FAR *d, chunkcopy_chunk_t c) {
- + __builtin_memcpy(d, &c, sizeof(c));
- +}
- +
- +/*
- + Perform a memcpy-like operation, but assume that length is non-zero and that
- + it's OK to overwrite at least CHUNKCOPY_CHUNK_SIZE bytes of output even if
- + the length is shorter than this.
- +
- + It also guarantees that it will properly unroll the data if the distance
- + between `out` and `from` is at least CHUNKCOPY_CHUNK_SIZE, which we rely on
- + in chunkcopy_relaxed().
- +
- + Aside from better memory bus utilisation, this means that short copies
- + (CHUNKCOPY_CHUNK_SIZE bytes or fewer) will fall straight through the loop
- + without iteration, which will hopefully make the branch prediction more
- + reliable.
- + */
- +static inline unsigned char FAR *chunkcopy_core(unsigned char FAR *out,
- + const unsigned char FAR *from,
- + unsigned len) {
- + int bump = (--len % CHUNKCOPY_CHUNK_SIZE) + 1;
- + storechunk(out, loadchunk(from));
- + out += bump;
- + from += bump;
- + len /= CHUNKCOPY_CHUNK_SIZE;
- + while (len-- > 0) {
- + storechunk(out, loadchunk(from));
- + out += CHUNKCOPY_CHUNK_SIZE;
- + from += CHUNKCOPY_CHUNK_SIZE;
- + }
- + return out;
- +}
- +
- +/*
- + Like chunkcopy_core, but avoid writing beyond of legal output.
- +
- + Accepts an additional pointer to the end of safe output. A generic safe
- + copy would use (out + len), but it's normally the case that the end of the
- + output buffer is beyond the end of the current copy, and this can still be
- + exploited.
- + */
- +static inline unsigned char FAR *chunkcopy_core_safe(unsigned char FAR *out,
- + const unsigned char FAR * from,
- + unsigned len,
- + unsigned char FAR *limit) {
- + Assert(out + len <= limit, "chunk copy exceeds safety limit");
- + if (limit - out < CHUNKCOPY_CHUNK_SIZE) {
- + const unsigned char FAR * Z_RESTRICT rfrom = from;
- + if (len & 8) { __builtin_memcpy(out, rfrom, 8); out += 8; rfrom += 8; }
- + if (len & 4) { __builtin_memcpy(out, rfrom, 4); out += 4; rfrom += 4; }
- + if (len & 2) { __builtin_memcpy(out, rfrom, 2); out += 2; rfrom += 2; }
- + if (len & 1) { *out++ = *rfrom++; }
- + return out;
- + }
- + return chunkcopy_core(out, from, len);
- +}
- +
- +/*
- + Perform short copies until distance can be rewritten as being at least
- + CHUNKCOPY_CHUNK_SIZE.
- +
- + This assumes that it's OK to overwrite at least the first
- + 2*CHUNKCOPY_CHUNK_SIZE bytes of output even if the copy is shorter than
- + this. This assumption holds within inflate_fast() which starts every
- + iteration with at least 258 bytes of output space available (258 being the
- + maximum length output from a single token; see inffast.c).
- + */
- +static inline unsigned char FAR *chunkunroll_relaxed(unsigned char FAR *out,
- + unsigned FAR *dist,
- + unsigned FAR *len) {
- + const unsigned char FAR *from = out - *dist;
- + while (*dist < *len && *dist < CHUNKCOPY_CHUNK_SIZE) {
- + storechunk(out, loadchunk(from));
- + out += *dist;
- + *len -= *dist;
- + *dist += *dist;
- + }
- + return out;
- +}
- +
- +
- +static inline uint8x16_t chunkset_vld1q_dup_u8x8(const unsigned char FAR * Z_RESTRICT from) {
- +#if defined(__clang__) || defined(__aarch64__)
- + return vreinterpretq_u8_u64(vld1q_dup_u64((void *)from));
- +#else
- + /* 32-bit GCC uses an alignment hint for vld1q_dup_u64, even when given a
- + * void pointer, so here's an alternate implementation.
- + */
- + uint8x8_t h = vld1_u8(from);
- + return vcombine_u8(h, h);
- +#endif
- +}
- +
- +/*
- + Perform an overlapping copy which behaves as a memset() operation, but
- + supporting periods other than one, and assume that length is non-zero and
- + that it's OK to overwrite at least CHUNKCOPY_CHUNK_SIZE*3 bytes of output
- + even if the length is shorter than this.
- + */
- +static inline unsigned char FAR *chunkset_core(unsigned char FAR *out,
- + unsigned period,
- + unsigned len) {
- + uint8x16_t f;
- + int bump = ((len - 1) % sizeof(f)) + 1;
- +
- + switch (period) {
- + case 1:
- + f = vld1q_dup_u8(out - 1);
- + vst1q_u8(out, f);
- + out += bump;
- + len -= bump;
- + while (len > 0) {
- + vst1q_u8(out, f);
- + out += sizeof(f);
- + len -= sizeof(f);
- + }
- + return out;
- + case 2:
- + f = vreinterpretq_u8_u16(vld1q_dup_u16((void *)(out - 2)));
- + vst1q_u8(out, f);
- + out += bump;
- + len -= bump;
- + if (len > 0) {
- + f = vreinterpretq_u8_u16(vld1q_dup_u16((void *)(out - 2)));
- + do {
- + vst1q_u8(out, f);
- + out += sizeof(f);
- + len -= sizeof(f);
- + } while (len > 0);
- + }
- + return out;
- + case 4:
- + f = vreinterpretq_u8_u32(vld1q_dup_u32((void *)(out - 4)));
- + vst1q_u8(out, f);
- + out += bump;
- + len -= bump;
- + if (len > 0) {
- + f = vreinterpretq_u8_u32(vld1q_dup_u32((void *)(out - 4)));
- + do {
- + vst1q_u8(out, f);
- + out += sizeof(f);
- + len -= sizeof(f);
- + } while (len > 0);
- + }
- + return out;
- + case 8:
- + f = chunkset_vld1q_dup_u8x8(out - 8);
- + vst1q_u8(out, f);
- + out += bump;
- + len -= bump;
- + if (len > 0) {
- + f = chunkset_vld1q_dup_u8x8(out - 8);
- + do {
- + vst1q_u8(out, f);
- + out += sizeof(f);
- + len -= sizeof(f);
- + } while (len > 0);
- + }
- + return out;
- + }
- + out = chunkunroll_relaxed(out, &period, &len);
- + return chunkcopy_core(out, out - period, len);
- +}
- +
- +/*
- + Perform a memcpy-like operation, but assume that length is non-zero and that
- + it's OK to overwrite at least CHUNKCOPY_CHUNK_SIZE bytes of output even if
- + the length is shorter than this.
- +
- + Unlike chunkcopy_core() above, no guarantee is made regarding the behaviour
- + of overlapping buffers, regardless of the distance between the pointers.
- + This is reflected in the `restrict`-qualified pointers, allowing the
- + compiler to reorder loads and stores.
- + */
- +static inline unsigned char FAR *chunkcopy_relaxed(unsigned char FAR * Z_RESTRICT out,
- + const unsigned char FAR * Z_RESTRICT from,
- + unsigned len) {
- + return chunkcopy_core(out, from, len);
- +}
- +
- +/*
- + Like chunkcopy_relaxed, but avoid writing beyond of legal output.
- +
- + Unlike chunkcopy_core_safe() above, no guarantee is made regarding the
- + behaviour of overlapping buffers, regardless of the distance between the
- + pointers. This is reflected in the `restrict`-qualified pointers, allowing
- + the compiler to reorder loads and stores.
- +
- + Accepts an additional pointer to the end of safe output. A generic safe
- + copy would use (out + len), but it's normally the case that the end of the
- + output buffer is beyond the end of the current copy, and this can still be
- + exploited.
- + */
- +static inline unsigned char FAR *chunkcopy_safe(unsigned char FAR *out,
- + const unsigned char FAR * Z_RESTRICT from,
- + unsigned len,
- + unsigned char FAR *limit) {
- + Assert(out + len <= limit, "chunk copy exceeds safety limit");
- + return chunkcopy_core_safe(out, from, len, limit);
- +}
- +
- +/*
- + Perform chunky copy within the same buffer, where the source and destination
- + may potentially overlap.
- +
- + Assumes that len > 0 on entry, and that it's safe to write at least
- + CHUNKCOPY_CHUNK_SIZE*3 bytes to the output.
- + */
- +static inline unsigned char FAR *chunkcopy_lapped_relaxed(unsigned char FAR *out,
- + unsigned dist,
- + unsigned len) {
- + if (dist < len && dist < CHUNKCOPY_CHUNK_SIZE) {
- + return chunkset_core(out, dist, len);
- + }
- + return chunkcopy_core(out, out - dist, len);
- +}
- +
- +/*
- + Behave like chunkcopy_lapped_relaxed, but avoid writing beyond of legal output.
- +
- + Accepts an additional pointer to the end of safe output. A generic safe
- + copy would use (out + len), but it's normally the case that the end of the
- + output buffer is beyond the end of the current copy, and this can still be
- + exploited.
- + */
- +static inline unsigned char FAR *chunkcopy_lapped_safe(unsigned char FAR *out,
- + unsigned dist,
- + unsigned len,
- + unsigned char FAR *limit) {
- + Assert(out + len <= limit, "chunk copy exceeds safety limit");
- + if (limit - out < CHUNKCOPY_CHUNK_SIZE * 3) {
- + /* TODO: try harder to optimise this */
- + while (len-- > 0) {
- + *out = *(out - dist);
- + out++;
- + }
- + return out;
- + }
- + return chunkcopy_lapped_relaxed(out, dist, len);
- +}
- +
- +#undef Z_RESTRICT
- +
- +#endif /* CHUNKCOPY_H */
- diff --git a/contrib/arm/inffast.c b/contrib/arm/inffast.c
- index 0dbd1dbc..f7f50071 100644
- --- a/contrib/arm/inffast.c
- +++ b/contrib/arm/inffast.c
- @@ -7,6 +7,7 @@
- #include "inftrees.h"
- #include "inflate.h"
- #include "inffast.h"
- +#include "chunkcopy.h"
-
- #ifdef ASMINF
- # pragma message("Assembler code may have bugs -- use at your own risk")
- @@ -57,6 +58,7 @@ unsigned start; /* inflate()'s starting value for strm->avail_out */
- unsigned char FAR *out; /* local strm->next_out */
- unsigned char FAR *beg; /* inflate()'s initial strm->next_out */
- unsigned char FAR *end; /* while out < end, enough space available */
- + unsigned char FAR *limit; /* safety limit for chunky copies */
- #ifdef INFLATE_STRICT
- unsigned dmax; /* maximum distance from zlib header */
- #endif
- @@ -84,12 +86,13 @@ unsigned start; /* inflate()'s starting value for strm->avail_out */
- out = strm->next_out;
- beg = out - (start - strm->avail_out);
- end = out + (strm->avail_out - 257);
- + limit = out + strm->avail_out;
- #ifdef INFLATE_STRICT
- dmax = state->dmax;
- #endif
- wsize = state->wsize;
- whave = state->whave;
- - wnext = state->wnext;
- + wnext = (state->wnext == 0 && whave >= wsize) ? wsize : state->wnext;
- window = state->window;
- hold = state->hold;
- bits = state->bits;
- @@ -197,70 +200,51 @@ unsigned start; /* inflate()'s starting value for strm->avail_out */
- #endif
- }
- from = window;
- - if (wnext == 0) { /* very common case */
- - from += wsize - op;
- - if (op < len) { /* some from window */
- - len -= op;
- - do {
- - *out++ = *from++;
- - } while (--op);
- - from = out - dist; /* rest from output */
- - }
- + if (wnext >= op) { /* contiguous in window */
- + from += wnext - op;
- }
- - else if (wnext < op) { /* wrap around window */
- - from += wsize + wnext - op;
- + else { /* wrap around window */
- op -= wnext;
- + from += wsize - op;
- if (op < len) { /* some from end of window */
- len -= op;
- - do {
- - *out++ = *from++;
- - } while (--op);
- - from = window;
- - if (wnext < len) { /* some from start of window */
- - op = wnext;
- - len -= op;
- - do {
- - *out++ = *from++;
- - } while (--op);
- - from = out - dist; /* rest from output */
- - }
- + out = chunkcopy_safe(out, from, op, limit);
- + from = window; /* more from start of window */
- + op = wnext;
- + /* This (rare) case can create a situation where
- + the first chunkcopy below must be checked.
- + */
- }
- }
- - else { /* contiguous in window */
- - from += wnext - op;
- - if (op < len) { /* some from window */
- - len -= op;
- - do {
- - *out++ = *from++;
- - } while (--op);
- - from = out - dist; /* rest from output */
- - }
- - }
- - while (len > 2) {
- - *out++ = *from++;
- - *out++ = *from++;
- - *out++ = *from++;
- - len -= 3;
- - }
- - if (len) {
- - *out++ = *from++;
- - if (len > 1)
- - *out++ = *from++;
- + if (op < len) { /* still need some from output */
- + out = chunkcopy_safe(out, from, op, limit);
- + len -= op;
- + /* When dist is small the amount of data that can be
- + copied from the window is also small, and progress
- + towards the dangerous end of the output buffer is
- + also small. This means that for trivial memsets and
- + for chunkunroll_relaxed() a safety check is
- + unnecessary. However, these conditions may not be
- + entered at all, and in that case it's possible that
- + the main copy is near the end.
- + */
- + out = chunkunroll_relaxed(out, &dist, &len);
- + out = chunkcopy_safe(out, out - dist, len, limit);
- + } else {
- + /* from points to window, so there is no risk of
- + overlapping pointers requiring memset-like behaviour
- + */
- + out = chunkcopy_safe(out, from, len, limit);
- }
- }
- else {
- - from = out - dist; /* copy direct from output */
- - do { /* minimum length is three */
- - *out++ = *from++;
- - *out++ = *from++;
- - *out++ = *from++;
- - len -= 3;
- - } while (len > 2);
- - if (len) {
- - *out++ = *from++;
- - if (len > 1)
- - *out++ = *from++;
- - }
- + /* Whole reference is in range of current output. No
- + range checks are necessary because we start with room
- + for at least 258 bytes of output, so unroll and roundoff
- + operations can write beyond `out+len` so long as they
- + stay within 258 bytes of `out`.
- + */
- + out = chunkcopy_lapped_relaxed(out, dist, len);
- }
- }
- else if ((op & 64) == 0) { /* 2nd level distance code */
- diff --git a/contrib/arm/inflate.c b/contrib/arm/inflate.c
- index ac333e8c..e40322c3 100644
- --- a/contrib/arm/inflate.c
- +++ b/contrib/arm/inflate.c
- @@ -84,6 +84,7 @@
- #include "inftrees.h"
- #include "inflate.h"
- #include "inffast.h"
- +#include "contrib/arm/chunkcopy.h"
-
- #ifdef MAKEFIXED
- # ifndef BUILDFIXED
- @@ -405,10 +406,20 @@ unsigned copy;
-
- /* if it hasn't been done already, allocate space for the window */
- if (state->window == Z_NULL) {
- + unsigned wsize = 1U << state->wbits;
- state->window = (unsigned char FAR *)
- - ZALLOC(strm, 1U << state->wbits,
- + ZALLOC(strm, wsize + CHUNKCOPY_CHUNK_SIZE,
- sizeof(unsigned char));
- if (state->window == Z_NULL) return 1;
- +#ifdef INFLATE_CLEAR_UNUSED_UNDEFINED
- + /* Copies from the overflow portion of this buffer are undefined and
- + may cause analysis tools to raise a warning if we don't initialize
- + it. However, this undefined data overwrites other undefined data
- + and is subsequently either overwritten or left deliberately
- + undefined at the end of decode; so there's really no point.
- + */
- + memset(state->window + wsize, 0, CHUNKCOPY_CHUNK_SIZE);
- +#endif
- }
-
- /* if window not in use yet, initialize */
- @@ -1175,17 +1186,16 @@ int flush;
- else
- from = state->window + (state->wnext - copy);
- if (copy > state->length) copy = state->length;
- + if (copy > left) copy = left;
- + put = chunkcopy_safe(put, from, copy, put + left);
- }
- else { /* copy from output */
- - from = put - state->offset;
- copy = state->length;
- + if (copy > left) copy = left;
- + put = chunkcopy_lapped_safe(put, state->offset, copy, put + left);
- }
- - if (copy > left) copy = left;
- left -= copy;
- state->length -= copy;
- - do {
- - *put++ = *from++;
- - } while (--copy);
- if (state->length == 0) state->mode = LEN;
- break;
- case LIT:
|