Annotation of embedaddon/rsync/zlib/inffast.c, revision 1.1

1.1     ! misho       1: /* inffast.c -- fast decoding
        !             2:  * Copyright (C) 1995-2004 Mark Adler
        !             3:  * For conditions of distribution and use, see copyright notice in zlib.h
        !             4:  */
        !             5: 
        !             6: #include "zutil.h"
        !             7: #include "inftrees.h"
        !             8: #include "inflate.h"
        !             9: #include "inffast.h"
        !            10: 
        !            11: #ifndef ASMINF
        !            12: 
        !            13: /* Allow machine dependent optimization for post-increment or pre-increment.
        !            14:    Based on testing to date,
        !            15:    Pre-increment preferred for:
        !            16:    - PowerPC G3 (Adler)
        !            17:    - MIPS R5000 (Randers-Pehrson)
        !            18:    Post-increment preferred for:
        !            19:    - none
        !            20:    No measurable difference:
        !            21:    - Pentium III (Anderson)
        !            22:    - M68060 (Nikl)
        !            23:  */
        !            24: #ifdef POSTINC
        !            25: #  define OFF 0
        !            26: #  define PUP(a) *(a)++
        !            27: #else
        !            28: #  define OFF 1
        !            29: #  define PUP(a) *++(a)
        !            30: #endif
        !            31: 
        !            32: /*
        !            33:    Decode literal, length, and distance codes and write out the resulting
        !            34:    literal and match bytes until either not enough input or output is
        !            35:    available, an end-of-block is encountered, or a data error is encountered.
        !            36:    When large enough input and output buffers are supplied to inflate(), for
        !            37:    example, a 16K input buffer and a 64K output buffer, more than 95% of the
        !            38:    inflate execution time is spent in this routine.
        !            39: 
        !            40:    Entry assumptions:
        !            41: 
        !            42:         state->mode == LEN
        !            43:         strm->avail_in >= 6
        !            44:         strm->avail_out >= 258
        !            45:         start >= strm->avail_out
        !            46:         state->bits < 8
        !            47: 
        !            48:    On return, state->mode is one of:
        !            49: 
        !            50:         LEN -- ran out of enough output space or enough available input
        !            51:         TYPE -- reached end of block code, inflate() to interpret next block
        !            52:         BAD -- error in block data
        !            53: 
        !            54:    Notes:
        !            55: 
        !            56:     - The maximum input bits used by a length/distance pair is 15 bits for the
        !            57:       length code, 5 bits for the length extra, 15 bits for the distance code,
        !            58:       and 13 bits for the distance extra.  This totals 48 bits, or six bytes.
        !            59:       Therefore if strm->avail_in >= 6, then there is enough input to avoid
        !            60:       checking for available input while decoding.
        !            61: 
        !            62:     - The maximum bytes that a single length/distance pair can output is 258
        !            63:       bytes, which is the maximum length that can be coded.  inflate_fast()
        !            64:       requires strm->avail_out >= 258 for each loop to avoid checking for
        !            65:       output space.
        !            66:  */
        !            67: void inflate_fast(strm, start)
        !            68: z_streamp strm;
        !            69: unsigned start;         /* inflate()'s starting value for strm->avail_out */
        !            70: {
        !            71:     struct inflate_state FAR *state;
        !            72:     unsigned char FAR *in;      /* local strm->next_in */
        !            73:     unsigned char FAR *last;    /* while in < last, enough input available */
        !            74:     unsigned char FAR *out;     /* local strm->next_out */
        !            75:     unsigned char FAR *beg;     /* inflate()'s initial strm->next_out */
        !            76:     unsigned char FAR *end;     /* while out < end, enough space available */
        !            77: #ifdef INFLATE_STRICT
        !            78:     unsigned dmax;              /* maximum distance from zlib header */
        !            79: #endif
        !            80:     unsigned wsize;             /* window size or zero if not using window */
        !            81:     unsigned whave;             /* valid bytes in the window */
        !            82:     unsigned write;             /* window write index */
        !            83:     unsigned char FAR *window;  /* allocated sliding window, if wsize != 0 */
        !            84:     unsigned long hold;         /* local strm->hold */
        !            85:     unsigned bits;              /* local strm->bits */
        !            86:     code const FAR *lcode;      /* local strm->lencode */
        !            87:     code const FAR *dcode;      /* local strm->distcode */
        !            88:     unsigned lmask;             /* mask for first level of length codes */
        !            89:     unsigned dmask;             /* mask for first level of distance codes */
        !            90:     code this;                  /* retrieved table entry */
        !            91:     unsigned op;                /* code bits, operation, extra bits, or */
        !            92:                                 /*  window position, window bytes to copy */
        !            93:     unsigned len;               /* match length, unused bytes */
        !            94:     unsigned dist;              /* match distance */
        !            95:     unsigned char FAR *from;    /* where to copy match from */
        !            96: 
        !            97:     /* copy state to local variables */
        !            98:     state = (struct inflate_state FAR *)strm->state;
        !            99:     in = strm->next_in - OFF;
        !           100:     last = in + (strm->avail_in - 5);
        !           101:     out = strm->next_out - OFF;
        !           102:     beg = out - (start - strm->avail_out);
        !           103:     end = out + (strm->avail_out - 257);
        !           104: #ifdef INFLATE_STRICT
        !           105:     dmax = state->dmax;
        !           106: #endif
        !           107:     wsize = state->wsize;
        !           108:     whave = state->whave;
        !           109:     write = state->write;
        !           110:     window = state->window;
        !           111:     hold = state->hold;
        !           112:     bits = state->bits;
        !           113:     lcode = state->lencode;
        !           114:     dcode = state->distcode;
        !           115:     lmask = (1U << state->lenbits) - 1;
        !           116:     dmask = (1U << state->distbits) - 1;
        !           117: 
        !           118:     /* decode literals and length/distances until end-of-block or not enough
        !           119:        input data or output space */
        !           120:     do {
        !           121:         if (bits < 15) {
        !           122:             hold += (unsigned long)(PUP(in)) << bits;
        !           123:             bits += 8;
        !           124:             hold += (unsigned long)(PUP(in)) << bits;
        !           125:             bits += 8;
        !           126:         }
        !           127:         this = lcode[hold & lmask];
        !           128:       dolen:
        !           129:         op = (unsigned)(this.bits);
        !           130:         hold >>= op;
        !           131:         bits -= op;
        !           132:         op = (unsigned)(this.op);
        !           133:         if (op == 0) {                          /* literal */
        !           134:             Tracevv((stderr, this.val >= 0x20 && this.val < 0x7f ?
        !           135:                     "inflate:         literal '%c'\n" :
        !           136:                     "inflate:         literal 0x%02x\n", this.val));
        !           137:             PUP(out) = (unsigned char)(this.val);
        !           138:         }
        !           139:         else if (op & 16) {                     /* length base */
        !           140:             len = (unsigned)(this.val);
        !           141:             op &= 15;                           /* number of extra bits */
        !           142:             if (op) {
        !           143:                 if (bits < op) {
        !           144:                     hold += (unsigned long)(PUP(in)) << bits;
        !           145:                     bits += 8;
        !           146:                 }
        !           147:                 len += (unsigned)hold & ((1U << op) - 1);
        !           148:                 hold >>= op;
        !           149:                 bits -= op;
        !           150:             }
        !           151:             Tracevv((stderr, "inflate:         length %u\n", len));
        !           152:             if (bits < 15) {
        !           153:                 hold += (unsigned long)(PUP(in)) << bits;
        !           154:                 bits += 8;
        !           155:                 hold += (unsigned long)(PUP(in)) << bits;
        !           156:                 bits += 8;
        !           157:             }
        !           158:             this = dcode[hold & dmask];
        !           159:           dodist:
        !           160:             op = (unsigned)(this.bits);
        !           161:             hold >>= op;
        !           162:             bits -= op;
        !           163:             op = (unsigned)(this.op);
        !           164:             if (op & 16) {                      /* distance base */
        !           165:                 dist = (unsigned)(this.val);
        !           166:                 op &= 15;                       /* number of extra bits */
        !           167:                 if (bits < op) {
        !           168:                     hold += (unsigned long)(PUP(in)) << bits;
        !           169:                     bits += 8;
        !           170:                     if (bits < op) {
        !           171:                         hold += (unsigned long)(PUP(in)) << bits;
        !           172:                         bits += 8;
        !           173:                     }
        !           174:                 }
        !           175:                 dist += (unsigned)hold & ((1U << op) - 1);
        !           176: #ifdef INFLATE_STRICT
        !           177:                 if (dist > dmax) {
        !           178:                     strm->msg = (char *)"invalid distance too far back";
        !           179:                     state->mode = BAD;
        !           180:                     break;
        !           181:                 }
        !           182: #endif
        !           183:                 hold >>= op;
        !           184:                 bits -= op;
        !           185:                 Tracevv((stderr, "inflate:         distance %u\n", dist));
        !           186:                 op = (unsigned)(out - beg);     /* max distance in output */
        !           187:                 if (dist > op) {                /* see if copy from window */
        !           188:                     op = dist - op;             /* distance back in window */
        !           189:                     if (op > whave) {
        !           190:                         strm->msg = (char *)"invalid distance too far back";
        !           191:                         state->mode = BAD;
        !           192:                         break;
        !           193:                     }
        !           194:                     from = window - OFF;
        !           195:                     if (write == 0) {           /* very common case */
        !           196:                         from += wsize - op;
        !           197:                         if (op < len) {         /* some from window */
        !           198:                             len -= op;
        !           199:                             do {
        !           200:                                 PUP(out) = PUP(from);
        !           201:                             } while (--op);
        !           202:                             from = out - dist;  /* rest from output */
        !           203:                         }
        !           204:                     }
        !           205:                     else if (write < op) {      /* wrap around window */
        !           206:                         from += wsize + write - op;
        !           207:                         op -= write;
        !           208:                         if (op < len) {         /* some from end of window */
        !           209:                             len -= op;
        !           210:                             do {
        !           211:                                 PUP(out) = PUP(from);
        !           212:                             } while (--op);
        !           213:                             from = window - OFF;
        !           214:                             if (write < len) {  /* some from start of window */
        !           215:                                 op = write;
        !           216:                                 len -= op;
        !           217:                                 do {
        !           218:                                     PUP(out) = PUP(from);
        !           219:                                 } while (--op);
        !           220:                                 from = out - dist;      /* rest from output */
        !           221:                             }
        !           222:                         }
        !           223:                     }
        !           224:                     else {                      /* contiguous in window */
        !           225:                         from += write - op;
        !           226:                         if (op < len) {         /* some from window */
        !           227:                             len -= op;
        !           228:                             do {
        !           229:                                 PUP(out) = PUP(from);
        !           230:                             } while (--op);
        !           231:                             from = out - dist;  /* rest from output */
        !           232:                         }
        !           233:                     }
        !           234:                     while (len > 2) {
        !           235:                         PUP(out) = PUP(from);
        !           236:                         PUP(out) = PUP(from);
        !           237:                         PUP(out) = PUP(from);
        !           238:                         len -= 3;
        !           239:                     }
        !           240:                     if (len) {
        !           241:                         PUP(out) = PUP(from);
        !           242:                         if (len > 1)
        !           243:                             PUP(out) = PUP(from);
        !           244:                     }
        !           245:                 }
        !           246:                 else {
        !           247:                     from = out - dist;          /* copy direct from output */
        !           248:                     do {                        /* minimum length is three */
        !           249:                         PUP(out) = PUP(from);
        !           250:                         PUP(out) = PUP(from);
        !           251:                         PUP(out) = PUP(from);
        !           252:                         len -= 3;
        !           253:                     } while (len > 2);
        !           254:                     if (len) {
        !           255:                         PUP(out) = PUP(from);
        !           256:                         if (len > 1)
        !           257:                             PUP(out) = PUP(from);
        !           258:                     }
        !           259:                 }
        !           260:             }
        !           261:             else if ((op & 64) == 0) {          /* 2nd level distance code */
        !           262:                 this = dcode[this.val + (hold & ((1U << op) - 1))];
        !           263:                 goto dodist;
        !           264:             }
        !           265:             else {
        !           266:                 strm->msg = (char *)"invalid distance code";
        !           267:                 state->mode = BAD;
        !           268:                 break;
        !           269:             }
        !           270:         }
        !           271:         else if ((op & 64) == 0) {              /* 2nd level length code */
        !           272:             this = lcode[this.val + (hold & ((1U << op) - 1))];
        !           273:             goto dolen;
        !           274:         }
        !           275:         else if (op & 32) {                     /* end-of-block */
        !           276:             Tracevv((stderr, "inflate:         end of block\n"));
        !           277:             state->mode = TYPE;
        !           278:             break;
        !           279:         }
        !           280:         else {
        !           281:             strm->msg = (char *)"invalid literal/length code";
        !           282:             state->mode = BAD;
        !           283:             break;
        !           284:         }
        !           285:     } while (in < last && out < end);
        !           286: 
        !           287:     /* return unused bytes (on entry, bits < 8, so in won't go too far back) */
        !           288:     len = bits >> 3;
        !           289:     in -= len;
        !           290:     bits -= len << 3;
        !           291:     hold &= (1U << bits) - 1;
        !           292: 
        !           293:     /* update state and return */
        !           294:     strm->next_in = in + OFF;
        !           295:     strm->next_out = out + OFF;
        !           296:     strm->avail_in = (unsigned)(in < last ? 5 + (last - in) : 5 - (in - last));
        !           297:     strm->avail_out = (unsigned)(out < end ?
        !           298:                                  257 + (end - out) : 257 - (out - end));
        !           299:     state->hold = hold;
        !           300:     state->bits = bits;
        !           301:     return;
        !           302: }
        !           303: 
        !           304: /*
        !           305:    inflate_fast() speedups that turned out slower (on a PowerPC G3 750CXe):
        !           306:    - Using bit fields for code structure
        !           307:    - Different op definition to avoid & for extra bits (do & for table bits)
        !           308:    - Three separate decoding do-loops for direct, window, and write == 0
        !           309:    - Special case for distance > 1 copies to do overlapped load and store copy
        !           310:    - Explicit branch predictions (based on measured branch probabilities)
        !           311:    - Deferring match copy and interspersed it with decoding subsequent codes
        !           312:    - Swapping literal/length else
        !           313:    - Swapping window/direct else
        !           314:    - Larger unrolled copy loops (three is about right)
        !           315:    - Moving len -= 3 statement into middle of loop
        !           316:  */
        !           317: 
        !           318: #endif /* !ASMINF */

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>