/* inffast.c -- fast decoding
 * Copyright (C) 1995-2008, 2010, 2013 Mark Adler
 * For conditions of distribution and use, see copyright notice in zlib.h
 */

#include "zutil.h"
#include "inftrees.h"
#include "inflate.h"
#include "inffast.h"

#ifndef ASMINF

/*
   Decode literal, length, and distance codes and write out the resulting
   literal and match bytes until either not enough input or output is
   available, an end-of-block is encountered, or a data error is encountered.
   When large enough input and output buffers are supplied to inflate(), for
   example, a 16K input buffer and a 64K output buffer, more than 95% of the
   inflate execution time is spent in this routine.

   Entry assumptions:

        state->mode == LEN
        strm->avail_in >= 6
        strm->avail_out >= 258
        start >= strm->avail_out
        state->bits < 8

   On return, state->mode is one of:

        LEN -- ran out of enough output space or enough available input
        TYPE -- reached end of block code, inflate() to interpret next block
        BAD -- error in block data

   Notes:

    - The maximum input bits used by a length/distance pair is 15 bits for the
      length code, 5 bits for the length extra, 15 bits for the distance code,
      and 13 bits for the distance extra.  This totals 48 bits, or six bytes.
      Therefore if strm->avail_in >= 6, then there is enough input to avoid
      checking for available input while decoding.

    - The maximum bytes that a single length/distance pair can output is 258
      bytes, which is the maximum length that can be coded.  inflate_fast()
      requires strm->avail_out >= 258 for each loop to avoid checking for
      output space.
 */
/*
   inflate_fast() parameters:

        strm  -- stream whose next_in, avail_in, next_out, avail_out and
                 internal state are read on entry and written back on return
        start -- inflate()'s starting value for strm->avail_out; together with
                 the current strm->avail_out it locates the first output byte
                 written during this inflate() call (beg below)

   Nothing is returned.  The outcome is reported through state->mode, which
   is set to TYPE on an end-of-block code, set to BAD (with strm->msg
   pointing at a message) on invalid data, and otherwise left untouched.
 */
void ZLIB_INTERNAL inflate_fast(strm, start)
z_streamp strm;
unsigned start;         /* inflate()'s starting value for strm->avail_out */
{
    struct inflate_state FAR *state;
    z_const unsigned char FAR *in;      /* local strm->next_in */
    z_const unsigned char FAR *last;    /* have enough input while in < last */
    unsigned char FAR *out;     /* local strm->next_out */
    unsigned char FAR *beg;     /* inflate()'s initial strm->next_out */
    unsigned char FAR *end;     /* while out < end, enough space available */
#ifdef INFLATE_STRICT
    unsigned dmax;              /* maximum distance from zlib header */
#endif
    unsigned wsize;             /* window size or zero if not using window */
    unsigned whave;             /* valid bytes in the window */
    unsigned wnext;             /* window write index */
    unsigned char FAR *window;  /* allocated sliding window, if wsize != 0 */
    unsigned long hold;         /* local state->hold (bit accumulator) */
    unsigned bits;              /* local state->bits (bits held in hold) */
    code const FAR *lcode;      /* local state->lencode */
    code const FAR *dcode;      /* local state->distcode */
    unsigned lmask;             /* mask for first level of length codes */
    unsigned dmask;             /* mask for first level of distance codes */
    code here;                  /* retrieved table entry */
    unsigned op;                /* code bits, operation, extra bits, or */
                                /*  window position, window bytes to copy */
    unsigned len;               /* match length, unused bytes */
    unsigned dist;              /* match distance */
    unsigned char FAR *from;    /* where to copy match from */

    /* copy state to local variables */
    state = (struct inflate_state FAR *)strm->state;
    in = strm->next_in;
    /* the loop continues only while in < last, i.e. while more than five
       input bytes remain */
    last = in + (strm->avail_in - 5);
    out = strm->next_out;
    /* start - avail_out is the number of bytes already written during this
       inflate() call, so beg is where that output began */
    beg = out - (start - strm->avail_out);
    /* the loop continues only while out < end, i.e. while more than 257
       output bytes remain */
    end = out + (strm->avail_out - 257);
#ifdef INFLATE_STRICT
    dmax = state->dmax;
#endif
    wsize = state->wsize;
    whave = state->whave;
    wnext = state->wnext;
    window = state->window;
    hold = state->hold;
    bits = state->bits;
    lcode = state->lencode;
    dcode = state->distcode;
    lmask = (1U << state->lenbits) - 1;
    dmask = (1U << state->distbits) - 1;

    /* decode literals and length/distances until end-of-block or not enough
       input data or output space */
    do {
        /* top up to at least 15 bits before the literal/length lookup */
        if (bits < 15) {
            hold += (unsigned long)(*in++) << bits;
            bits += 8;
            hold += (unsigned long)(*in++) << bits;
            bits += 8;
        }
        here = lcode[hold & lmask];
      dolen:                    /* re-entered for a second-level table entry */
        op = (unsigned)(here.bits);
        hold >>= op;            /* drop the bits consumed by this entry */
        bits -= op;
        op = (unsigned)(here.op);
        if (op == 0) {                          /* literal */
            Tracevv((stderr, here.val >= 0x20 && here.val < 0x7f ?
                    "inflate:         literal '%c'\n" :
                    "inflate:         literal 0x%02x\n", here.val));
            *out++ = (unsigned char)(here.val);
        }
        else if (op & 16) {                     /* length base */
            len = (unsigned)(here.val);
            op &= 15;                           /* number of extra bits */
            if (op) {
                if (bits < op) {
                    hold += (unsigned long)(*in++) << bits;
                    bits += 8;
                }
                len += (unsigned)hold & ((1U << op) - 1);
                hold >>= op;
                bits -= op;
            }
            Tracevv((stderr, "inflate:         length %u\n", len));
            /* top up to at least 15 bits before the distance lookup */
            if (bits < 15) {
                hold += (unsigned long)(*in++) << bits;
                bits += 8;
                hold += (unsigned long)(*in++) << bits;
                bits += 8;
            }
            here = dcode[hold & dmask];
          dodist:               /* re-entered for a second-level table entry */
            op = (unsigned)(here.bits);
            hold >>= op;
            bits -= op;
            op = (unsigned)(here.op);
            if (op & 16) {                      /* distance base */
                dist = (unsigned)(here.val);
                op &= 15;                       /* number of extra bits */
                /* at most two more bytes are pulled in for the extra bits */
                if (bits < op) {
                    hold += (unsigned long)(*in++) << bits;
                    bits += 8;
                    if (bits < op) {
                        hold += (unsigned long)(*in++) << bits;
                        bits += 8;
                    }
                }
                dist += (unsigned)hold & ((1U << op) - 1);
#ifdef INFLATE_STRICT
                if (dist > dmax) {
                    strm->msg = (char *)"invalid distance too far back";
                    state->mode = BAD;
                    break;
                }
#endif
                hold >>= op;
                bits -= op;
                Tracevv((stderr, "inflate:         distance %u\n", dist));
                op = (unsigned)(out - beg);     /* max distance in output */
                if (dist > op) {                /* see if copy from window */
                    op = dist - op;             /* distance back in window */
                    if (op > whave) {
                        /* the match starts before the oldest valid byte in
                           the window */
                        if (state->sane) {
                            strm->msg =
                                (char *)"invalid distance too far back";
                            state->mode = BAD;
                            break;
                        }
#ifdef INFLATE_ALLOW_INVALID_DISTANCE_TOOFAR_ARRR
                        /* emit zeros for the part of the match that lies
                           before the valid window data */
                        if (len <= op - whave) {
                            do {
                                *out++ = 0;
                            } while (--len);
                            continue;
                        }
                        len -= op - whave;
                        do {
                            *out++ = 0;
                        } while (--op > whave);
                        if (op == 0) {
                            from = out - dist;
                            do {
                                *out++ = *from++;
                            } while (--len);
                            continue;
                        }
#endif
                    }
                    from = window;
                    if (wnext == 0) {           /* very common case */
                        from += wsize - op;
                        if (op < len) {         /* some from window */
                            len -= op;
                            do {
                                *out++ = *from++;
                            } while (--op);
                            from = out - dist;  /* rest from output */
                        }
                    }
                    else if (wnext < op) {      /* wrap around window */
                        from += wsize + wnext - op;
                        op -= wnext;
                        if (op < len) {         /* some from end of window */
                            len -= op;
                            do {
                                *out++ = *from++;
                            } while (--op);
                            from = window;
                            if (wnext < len) {  /* some from start of window */
                                op = wnext;
                                len -= op;
                                do {
                                    *out++ = *from++;
                                } while (--op);
                                from = out - dist;      /* rest from output */
                            }
                        }
                    }
                    else {                      /* contiguous in window */
                        from += wnext - op;
                        if (op < len) {         /* some from window */
                            len -= op;
                            do {
                                *out++ = *from++;
                            } while (--op);
                            from = out - dist;  /* rest from output */
                        }
                    }
                    /* copy whatever remains of the match, three bytes at a
                       time, then the final one or two bytes */
                    while (len > 2) {
                        *out++ = *from++;
                        *out++ = *from++;
                        *out++ = *from++;
                        len -= 3;
                    }
                    if (len) {
                        *out++ = *from++;
                        if (len > 1)
                            *out++ = *from++;
                    }
                }
                else {
                    from = out - dist;          /* copy direct from output */
                    do {                        /* minimum length is three */
                        *out++ = *from++;
                        *out++ = *from++;
                        *out++ = *from++;
                        len -= 3;
                    } while (len > 2);
                    if (len) {
                        *out++ = *from++;
                        if (len > 1)
                            *out++ = *from++;
                    }
                }
            }
            else if ((op & 64) == 0) {          /* 2nd level distance code */
                here = dcode[here.val + (hold & ((1U << op) - 1))];
                goto dodist;
            }
            else {
                strm->msg = (char *)"invalid distance code";
                state->mode = BAD;
                break;
            }
        }
        else if ((op & 64) == 0) {              /* 2nd level length code */
            here = lcode[here.val + (hold & ((1U << op) - 1))];
            goto dolen;
        }
        else if (op & 32) {                     /* end-of-block */
            Tracevv((stderr, "inflate:         end of block\n"));
            state->mode = TYPE;
            break;
        }
        else {
            strm->msg = (char *)"invalid literal/length code";
            state->mode = BAD;
            break;
        }
    } while (in < last && out < end);

    /* return unused bytes (on entry, bits < 8, so in won't go too far back) */
    len = bits >> 3;            /* whole unused bytes still held in hold */
    in -= len;
    bits -= len << 3;
    hold &= (1U << bits) - 1;   /* keep only the remaining partial byte */

    /* update state and return */
    strm->next_in = in;
    strm->next_out = out;
    /* last and end were biased by 5 and 257 above; undo that here, handling
       the case where in or out has moved past them */
    strm->avail_in = (unsigned)(in < last ? 5 + (last - in) : 5 - (in - last));
    strm->avail_out = (unsigned)(out < end ?
                                 257 + (end - out) : 257 - (out - end));
    state->hold = hold;
    state->bits = bits;
    return;
}

/*
   inflate_fast() speedups that turned out slower (on a PowerPC G3 750CXe):
   - Using bit fields for code structure
   - Different op definition to avoid & for extra bits (do & for table bits)
   - Three separate decoding do-loops for direct, window, and wnext == 0
   - Special case for distance > 1 copies to do overlapped load and store copy
   - Explicit branch predictions (based on measured branch probabilities)
   - Deferring match copy and interspersing it with decoding subsequent codes
   - Swapping literal/length else
   - Swapping window/direct else
   - Larger unrolled copy loops (three is about right)
   - Moving len -= 3 statement into middle of loop
 */

#endif /* !ASMINF */