vp3.c 93.9 KB
Newer Older
1
/*
2
 * Copyright (C) 2003-2004 the ffmpeg project
3 4 5 6 7 8 9 10 11 12 13 14 15
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
16
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17 18 19 20 21 22
 *
 */

/**
 * @file vp3.c
 * On2 VP3 Video Decoder
23 24 25 26 27 28
 *
 * VP3 Video Decoder by Mike Melanson (mike at multimedia.cx)
 * For more information about the VP3 coding process, visit:
 *   http://multimedia.cx/
 *
 * Theora decoder by Alex Beregszaszi
29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44
 */

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>

#include "common.h"
#include "avcodec.h"
#include "dsputil.h"
#include "mpegvideo.h"

#include "vp3data.h"

#define FRAGMENT_PIXELS 8

45
/*
46
 * Debugging Variables
47
 *
48 49 50
 * Define one or more of the following compile-time variables to 1 to obtain
 * elaborate information about certain aspects of the decoding process.
 *
51
 * KEYFRAMES_ONLY: set this to 1 to only see keyframes (VP3 slideshow mode)
52 53 54 55 56 57 58 59 60 61 62 63
 * DEBUG_VP3: high-level decoding flow
 * DEBUG_INIT: initialization parameters
 * DEBUG_DEQUANTIZERS: display how the dequanization tables are built
 * DEBUG_BLOCK_CODING: unpacking the superblock/macroblock/fragment coding
 * DEBUG_MODES: unpacking the coding modes for individual fragments
 * DEBUG_VECTORS: display the motion vectors
 * DEBUG_TOKEN: display exhaustive information about each DCT token
 * DEBUG_VLC: display the VLCs as they are extracted from the stream
 * DEBUG_DC_PRED: display the process of reversing DC prediction
 * DEBUG_IDCT: show every detail of the IDCT process
 */

64 65
#define KEYFRAMES_ONLY 0

A
Alex Beregszaszi 已提交
66
#define DEBUG_VP3 0
67 68 69 70 71 72 73 74 75 76 77
#define DEBUG_INIT 0
#define DEBUG_DEQUANTIZERS 0
#define DEBUG_BLOCK_CODING 0
#define DEBUG_MODES 0
#define DEBUG_VECTORS 0
#define DEBUG_TOKEN 0
#define DEBUG_VLC 0
#define DEBUG_DC_PRED 0
#define DEBUG_IDCT 0

#if DEBUG_VP3
A
Alex Beregszaszi 已提交
78
#define debug_vp3(args...) av_log(NULL, AV_LOG_DEBUG, ## args)
79 80 81 82 83
#else
static inline void debug_vp3(const char *format, ...) { }
#endif

#if DEBUG_INIT
A
Alex Beregszaszi 已提交
84
#define debug_init(args...) av_log(NULL, AV_LOG_DEBUG, ## args)
85 86 87 88 89
#else
static inline void debug_init(const char *format, ...) { }
#endif

#if DEBUG_DEQUANTIZERS
A
Alex Beregszaszi 已提交
90
#define debug_dequantizers(args...) av_log(NULL, AV_LOG_DEBUG, ## args)
91
#else
92
static inline void debug_dequantizers(const char *format, ...) { }
93 94 95
#endif

#if DEBUG_BLOCK_CODING
A
Alex Beregszaszi 已提交
96
#define debug_block_coding(args...) av_log(NULL, AV_LOG_DEBUG, ## args)
97
#else
98
static inline void debug_block_coding(const char *format, ...) { }
99 100 101
#endif

#if DEBUG_MODES
102
#define debug_modes(args...) av_log(NULL, AV_LOG_DEBUG, ## args)
103
#else
104
static inline void debug_modes(const char *format, ...) { }
105 106 107
#endif

#if DEBUG_VECTORS
A
Alex Beregszaszi 已提交
108
#define debug_vectors(args...) av_log(NULL, AV_LOG_DEBUG, ## args)
109
#else
110
static inline void debug_vectors(const char *format, ...) { }
111 112
#endif

113
#if DEBUG_TOKEN
A
Alex Beregszaszi 已提交
114
#define debug_token(args...) av_log(NULL, AV_LOG_DEBUG, ## args)
115
#else
116
static inline void debug_token(const char *format, ...) { }
117 118 119
#endif

#if DEBUG_VLC
A
Alex Beregszaszi 已提交
120
#define debug_vlc(args...) av_log(NULL, AV_LOG_DEBUG, ## args)
121
#else
122
static inline void debug_vlc(const char *format, ...) { }
123 124 125
#endif

#if DEBUG_DC_PRED
A
Alex Beregszaszi 已提交
126
#define debug_dc_pred(args...) av_log(NULL, AV_LOG_DEBUG, ## args)
127
#else
128
static inline void debug_dc_pred(const char *format, ...) { }
129 130 131
#endif

#if DEBUG_IDCT
A
Alex Beregszaszi 已提交
132
#define debug_idct(args...) av_log(NULL, AV_LOG_DEBUG, ## args)
133
#else
134
static inline void debug_idct(const char *format, ...) { }
135 136
#endif

137 138 139 140 141 142 143
typedef struct Coeff {
    struct Coeff *next;
    DCTELEM coeff;
    uint8_t index;
} Coeff;

//FIXME split things out into their own arrays
144
typedef struct Vp3Fragment {
145
    Coeff *next_coeff;
146 147 148 149
    /* address of first pixel taking into account which plane the fragment
     * lives on as well as the plane stride */
    int first_pixel;
    /* this is the macroblock that the fragment belongs to */
150 151 152 153 154
    uint16_t macroblock;
    uint8_t coding_method;
    uint8_t coeff_count;
    int8_t motion_x;
    int8_t motion_y;
155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180
} Vp3Fragment;

#define SB_NOT_CODED        0
#define SB_PARTIALLY_CODED  1
#define SB_FULLY_CODED      2

#define MODE_INTER_NO_MV      0
#define MODE_INTRA            1
#define MODE_INTER_PLUS_MV    2
#define MODE_INTER_LAST_MV    3
#define MODE_INTER_PRIOR_LAST 4
#define MODE_USING_GOLDEN     5
#define MODE_GOLDEN_MV        6
#define MODE_INTER_FOURMV     7
#define CODING_MODE_COUNT     8

/* special internal mode */
#define MODE_COPY             8

/* There are 6 preset schemes, plus a free-form scheme */
static int ModeAlphabet[7][CODING_MODE_COUNT] =
{
    /* this is the custom scheme */
    { 0, 0, 0, 0, 0, 0, 0, 0 },

    /* scheme 1: Last motion vector dominates */
181
    {    MODE_INTER_LAST_MV,    MODE_INTER_PRIOR_LAST,
182
         MODE_INTER_PLUS_MV,    MODE_INTER_NO_MV,
183
         MODE_INTRA,            MODE_USING_GOLDEN,
184 185 186
         MODE_GOLDEN_MV,        MODE_INTER_FOURMV },

    /* scheme 2 */
187
    {    MODE_INTER_LAST_MV,    MODE_INTER_PRIOR_LAST,
188
         MODE_INTER_NO_MV,      MODE_INTER_PLUS_MV,
189
         MODE_INTRA,            MODE_USING_GOLDEN,
190 191 192
         MODE_GOLDEN_MV,        MODE_INTER_FOURMV },

    /* scheme 3 */
193
    {    MODE_INTER_LAST_MV,    MODE_INTER_PLUS_MV,
194
         MODE_INTER_PRIOR_LAST, MODE_INTER_NO_MV,
195
         MODE_INTRA,            MODE_USING_GOLDEN,
196 197 198
         MODE_GOLDEN_MV,        MODE_INTER_FOURMV },

    /* scheme 4 */
199
    {    MODE_INTER_LAST_MV,    MODE_INTER_PLUS_MV,
200
         MODE_INTER_NO_MV,      MODE_INTER_PRIOR_LAST,
201
         MODE_INTRA,            MODE_USING_GOLDEN,
202 203 204
         MODE_GOLDEN_MV,        MODE_INTER_FOURMV },

    /* scheme 5: No motion vector dominates */
205
    {    MODE_INTER_NO_MV,      MODE_INTER_LAST_MV,
206
         MODE_INTER_PRIOR_LAST, MODE_INTER_PLUS_MV,
207
         MODE_INTRA,            MODE_USING_GOLDEN,
208 209 210
         MODE_GOLDEN_MV,        MODE_INTER_FOURMV },

    /* scheme 6 */
211
    {    MODE_INTER_NO_MV,      MODE_USING_GOLDEN,
212
         MODE_INTER_LAST_MV,    MODE_INTER_PRIOR_LAST,
213
         MODE_INTER_PLUS_MV,    MODE_INTRA,
214 215 216 217 218 219 220 221
         MODE_GOLDEN_MV,        MODE_INTER_FOURMV },

};

#define MIN_DEQUANT_VAL 2

typedef struct Vp3DecodeContext {
    AVCodecContext *avctx;
222
    int theora, theora_tables;
A
Alex Beregszaszi 已提交
223
    int version;
224 225 226 227 228 229
    int width, height;
    AVFrame golden_frame;
    AVFrame last_frame;
    AVFrame current_frame;
    int keyframe;
    DSPContext dsp;
230
    int flipped_image;
231

232 233
    int qis[3];
    int nqis;
234 235 236 237 238 239
    int quality_index;
    int last_quality_index;

    int superblock_count;
    int superblock_width;
    int superblock_height;
240 241 242 243
    int y_superblock_width;
    int y_superblock_height;
    int c_superblock_width;
    int c_superblock_height;
244 245 246 247 248 249 250 251 252 253 254 255 256
    int u_superblock_start;
    int v_superblock_start;
    unsigned char *superblock_coding;

    int macroblock_count;
    int macroblock_width;
    int macroblock_height;

    int fragment_count;
    int fragment_width;
    int fragment_height;

    Vp3Fragment *all_fragments;
257 258
    Coeff *coeffs;
    Coeff *next_coeff;
M
Michael Niedermayer 已提交
259
    int fragment_start[3];
260

M
Michael Niedermayer 已提交
261
    ScanTable scantable;
262

263 264
    /* tables */
    uint16_t coded_dc_scale_factor[64];
265
    uint32_t coded_ac_scale_factor[64];
266 267 268 269
    uint8_t base_matrix[384][64];
    uint8_t qr_count[2][3];
    uint8_t qr_size [2][3][64];
    uint16_t qr_base[2][3][64];
270 271 272 273 274 275 276 277 278 279 280 281 282

    /* this is a list of indices into the all_fragments array indicating
     * which of the fragments are coded */
    int *coded_fragment_list;
    int coded_fragment_list_index;
    int pixel_addresses_inited;

    VLC dc_vlc[16];
    VLC ac_vlc_1[16];
    VLC ac_vlc_2[16];
    VLC ac_vlc_3[16];
    VLC ac_vlc_4[16];

283 284 285 286 287
    VLC superblock_run_length_vlc;
    VLC fragment_run_length_vlc;
    VLC mode_code_vlc;
    VLC motion_vector_vlc;

288 289
    /* these arrays need to be on 16-byte boundaries since SSE2 operations
     * index into them */
290
    DECLARE_ALIGNED_16(int16_t, qmat[2][4][64]);        //<qmat[is_inter][plane]
291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307

    /* This table contains superblock_count * 16 entries. Each set of 16
     * numbers corresponds to the fragment indices 0..15 of the superblock.
     * An entry will be -1 to indicate that no entry corresponds to that
     * index. */
    int *superblock_fragments;

    /* This table contains superblock_count * 4 entries. Each set of 4
     * numbers corresponds to the macroblock indices 0..3 of the superblock.
     * An entry will be -1 to indicate that no entry corresponds to that
     * index. */
    int *superblock_macroblocks;

    /* This table contains macroblock_count * 6 entries. Each set of 6
     * numbers corresponds to the fragment indices 0..5 which comprise
     * the macroblock (4 Y fragments and 2 C fragments). */
    int *macroblock_fragments;
308
    /* This is an array that indicates how a particular macroblock
309
     * is coded. */
310
    unsigned char *macroblock_coding;
311

312 313 314 315 316
    int first_coded_y_fragment;
    int first_coded_c_fragment;
    int last_coded_y_fragment;
    int last_coded_c_fragment;

M
Michael Niedermayer 已提交
317
    uint8_t edge_emu_buffer[9*2048]; //FIXME dynamic alloc
M
Måns Rullgård 已提交
318
    int8_t qscale_table[2048]; //FIXME dynamic alloc (width+15)/16
319

320 321 322 323 324 325 326 327 328
    /* Huffman decode */
    int hti;
    unsigned int hbits;
    int entries;
    int huff_code_size;
    uint16_t huffman_table[80][32][2];

    uint32_t filter_limit_values[64];
    int bounding_values_array[256];
329 330
} Vp3DecodeContext;

331
static int theora_decode_tables(AVCodecContext *avctx, GetBitContext *gb);
A
Alex Beregszaszi 已提交
332

333 334 335 336 337 338 339 340
/************************************************************************
 * VP3 specific functions
 ************************************************************************/

/*
 * This function sets up all of the various blocks mappings:
 * superblocks <-> fragments, macroblocks <-> fragments,
 * superblocks <-> macroblocks
341 342
 *
 * Returns 0 is successful; returns 1 if *anything* went wrong.
343
 */
344
static int init_block_mapping(Vp3DecodeContext *s)
345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361
{
    int i, j;
    signed int hilbert_walk_mb[4];

    int current_fragment = 0;
    int current_width = 0;
    int current_height = 0;
    int right_edge = 0;
    int bottom_edge = 0;
    int superblock_row_inc = 0;
    int *hilbert = NULL;
    int mapping_index = 0;

    int current_macroblock;
    int c_fragment;

    signed char travel_width[16] = {
362
         1,  1,  0, -1,
363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400
         0,  0,  1,  0,
         1,  0,  1,  0,
         0, -1,  0,  1
    };

    signed char travel_height[16] = {
         0,  0,  1,  0,
         1,  1,  0, -1,
         0,  1,  0, -1,
        -1,  0, -1,  0
    };

    signed char travel_width_mb[4] = {
         1,  0,  1,  0
    };

    signed char travel_height_mb[4] = {
         0,  1,  0, -1
    };

    debug_vp3("  vp3: initialize block mapping tables\n");

    hilbert_walk_mb[0] = 1;
    hilbert_walk_mb[1] = s->macroblock_width;
    hilbert_walk_mb[2] = 1;
    hilbert_walk_mb[3] = -s->macroblock_width;

    /* iterate through each superblock (all planes) and map the fragments */
    for (i = 0; i < s->superblock_count; i++) {
        debug_init("    superblock %d (u starts @ %d, v starts @ %d)\n",
            i, s->u_superblock_start, s->v_superblock_start);

        /* time to re-assign the limits? */
        if (i == 0) {

            /* start of Y superblocks */
            right_edge = s->fragment_width;
            bottom_edge = s->fragment_height;
401
            current_width = -1;
402
            current_height = 0;
403
            superblock_row_inc = 3 * s->fragment_width -
404
                (s->y_superblock_width * 4 - s->fragment_width);
405 406 407 408 409 410 411 412 413

            /* the first operation for this variable is to advance by 1 */
            current_fragment = -1;

        } else if (i == s->u_superblock_start) {

            /* start of U superblocks */
            right_edge = s->fragment_width / 2;
            bottom_edge = s->fragment_height / 2;
414
            current_width = -1;
415
            current_height = 0;
416
            superblock_row_inc = 3 * (s->fragment_width / 2) -
417
                (s->c_superblock_width * 4 - s->fragment_width / 2);
418 419

            /* the first operation for this variable is to advance by 1 */
M
Michael Niedermayer 已提交
420
            current_fragment = s->fragment_start[1] - 1;
421 422 423 424 425 426

        } else if (i == s->v_superblock_start) {

            /* start of V superblocks */
            right_edge = s->fragment_width / 2;
            bottom_edge = s->fragment_height / 2;
427
            current_width = -1;
428
            current_height = 0;
429
            superblock_row_inc = 3 * (s->fragment_width / 2) -
430
                (s->c_superblock_width * 4 - s->fragment_width / 2);
431 432

            /* the first operation for this variable is to advance by 1 */
M
Michael Niedermayer 已提交
433
            current_fragment = s->fragment_start[2] - 1;
434 435 436

        }

437
        if (current_width >= right_edge - 1) {
438
            /* reset width and move to next superblock row */
439
            current_width = -1;
440 441 442 443 444 445 446 447
            current_height += 4;

            /* fragment is now at the start of a new superblock row */
            current_fragment += superblock_row_inc;
        }

        /* iterate through all 16 fragments in a superblock */
        for (j = 0; j < 16; j++) {
M
Michael Niedermayer 已提交
448
            current_fragment += travel_width[j] + right_edge * travel_height[j];
449
            current_width += travel_width[j];
450 451 452
            current_height += travel_height[j];

            /* check if the fragment is in bounds */
453
            if ((current_width < right_edge) &&
454 455
                (current_height < bottom_edge)) {
                s->superblock_fragments[mapping_index] = current_fragment;
456
                debug_init("    mapping fragment %d to superblock %d, position %d (%d/%d x %d/%d)\n",
457 458
                    s->superblock_fragments[mapping_index], i, j,
                    current_width, right_edge, current_height, bottom_edge);
459 460
            } else {
                s->superblock_fragments[mapping_index] = -1;
461
                debug_init("    superblock %d, position %d has no fragment (%d/%d x %d/%d)\n",
462 463
                    i, j,
                    current_width, right_edge, current_height, bottom_edge);
464 465 466 467 468 469 470 471 472 473
            }

            mapping_index++;
        }
    }

    /* initialize the superblock <-> macroblock mapping; iterate through
     * all of the Y plane superblocks to build this mapping */
    right_edge = s->macroblock_width;
    bottom_edge = s->macroblock_height;
474
    current_width = -1;
475
    current_height = 0;
476 477
    superblock_row_inc = s->macroblock_width -
        (s->y_superblock_width * 2 - s->macroblock_width);;
478 479 480 481 482
    hilbert = hilbert_walk_mb;
    mapping_index = 0;
    current_macroblock = -1;
    for (i = 0; i < s->u_superblock_start; i++) {

483
        if (current_width >= right_edge - 1) {
484
            /* reset width and move to next superblock row */
485
            current_width = -1;
486 487 488 489 490 491 492 493 494
            current_height += 2;

            /* macroblock is now at the start of a new superblock row */
            current_macroblock += superblock_row_inc;
        }

        /* iterate through each potential macroblock in the superblock */
        for (j = 0; j < 4; j++) {
            current_macroblock += hilbert_walk_mb[j];
495
            current_width += travel_width_mb[j];
496 497 498
            current_height += travel_height_mb[j];

            /* check if the macroblock is in bounds */
499
            if ((current_width < right_edge) &&
500 501
                (current_height < bottom_edge)) {
                s->superblock_macroblocks[mapping_index] = current_macroblock;
502 503 504
                debug_init("    mapping macroblock %d to superblock %d, position %d (%d/%d x %d/%d)\n",
                    s->superblock_macroblocks[mapping_index], i, j,
                    current_width, right_edge, current_height, bottom_edge);
505 506
            } else {
                s->superblock_macroblocks[mapping_index] = -1;
507 508 509
                debug_init("    superblock %d, position %d has no macroblock (%d/%d x %d/%d)\n",
                    i, j,
                    current_width, right_edge, current_height, bottom_edge);
510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536
            }

            mapping_index++;
        }
    }

    /* initialize the macroblock <-> fragment mapping */
    current_fragment = 0;
    current_macroblock = 0;
    mapping_index = 0;
    for (i = 0; i < s->fragment_height; i += 2) {

        for (j = 0; j < s->fragment_width; j += 2) {

            debug_init("    macroblock %d contains fragments: ", current_macroblock);
            s->all_fragments[current_fragment].macroblock = current_macroblock;
            s->macroblock_fragments[mapping_index++] = current_fragment;
            debug_init("%d ", current_fragment);

            if (j + 1 < s->fragment_width) {
                s->all_fragments[current_fragment + 1].macroblock = current_macroblock;
                s->macroblock_fragments[mapping_index++] = current_fragment + 1;
                debug_init("%d ", current_fragment + 1);
            } else
                s->macroblock_fragments[mapping_index++] = -1;

            if (i + 1 < s->fragment_height) {
537
                s->all_fragments[current_fragment + s->fragment_width].macroblock =
538
                    current_macroblock;
539
                s->macroblock_fragments[mapping_index++] =
540 541 542 543 544 545
                    current_fragment + s->fragment_width;
                debug_init("%d ", current_fragment + s->fragment_width);
            } else
                s->macroblock_fragments[mapping_index++] = -1;

            if ((j + 1 < s->fragment_width) && (i + 1 < s->fragment_height)) {
546
                s->all_fragments[current_fragment + s->fragment_width + 1].macroblock =
547
                    current_macroblock;
548
                s->macroblock_fragments[mapping_index++] =
549 550 551 552 553 554
                    current_fragment + s->fragment_width + 1;
                debug_init("%d ", current_fragment + s->fragment_width + 1);
            } else
                s->macroblock_fragments[mapping_index++] = -1;

            /* C planes */
M
Michael Niedermayer 已提交
555
            c_fragment = s->fragment_start[1] +
556
                (i * s->fragment_width / 4) + (j / 2);
557
            s->all_fragments[c_fragment].macroblock = s->macroblock_count;
558 559 560
            s->macroblock_fragments[mapping_index++] = c_fragment;
            debug_init("%d ", c_fragment);

M
Michael Niedermayer 已提交
561
            c_fragment = s->fragment_start[2] +
562
                (i * s->fragment_width / 4) + (j / 2);
563
            s->all_fragments[c_fragment].macroblock = s->macroblock_count;
564 565 566 567 568 569 570
            s->macroblock_fragments[mapping_index++] = c_fragment;
            debug_init("%d ", c_fragment);

            debug_init("\n");

            if (j + 2 <= s->fragment_width)
                current_fragment += 2;
571
            else
572 573 574 575 576 577
                current_fragment++;
            current_macroblock++;
        }

        current_fragment += s->fragment_width;
    }
578 579

    return 0;  /* successful path out */
580 581 582 583 584 585 586 587 588 589 590 591 592
}

/*
 * This function wipes out all of the fragment data.
 */
static void init_frame(Vp3DecodeContext *s, GetBitContext *gb)
{
    int i;

    /* zero out all of the fragment information */
    s->coded_fragment_list_index = 0;
    for (i = 0; i < s->fragment_count; i++) {
        s->all_fragments[i].coeff_count = 0;
593 594 595
        s->all_fragments[i].motion_x = 127;
        s->all_fragments[i].motion_y = 127;
        s->all_fragments[i].next_coeff= NULL;
596 597 598
        s->coeffs[i].index=
        s->coeffs[i].coeff=0;
        s->coeffs[i].next= NULL;
599 600 601 602
    }
}

/*
603
 * This function sets up the dequantization tables used for a particular
604 605 606 607
 * frame.
 */
static void init_dequantizer(Vp3DecodeContext *s)
{
608
    int ac_scale_factor = s->coded_ac_scale_factor[s->quality_index];
609
    int dc_scale_factor = s->coded_dc_scale_factor[s->quality_index];
610
    int i, plane, inter, qri, bmi, bmj, qistart;
611 612 613

    debug_vp3("  vp3: initializing dequantization tables\n");

614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630
    for(inter=0; inter<2; inter++){
        for(plane=0; plane<3; plane++){
            int sum=0;
            for(qri=0; qri<s->qr_count[inter][plane]; qri++){
                sum+= s->qr_size[inter][plane][qri];
                if(s->quality_index <= sum)
                    break;
            }
            qistart= sum - s->qr_size[inter][plane][qri];
            bmi= s->qr_base[inter][plane][qri  ];
            bmj= s->qr_base[inter][plane][qri+1];
            for(i=0; i<64; i++){
                int coeff= (  2*(sum    -s->quality_index)*s->base_matrix[bmi][i]
                            - 2*(qistart-s->quality_index)*s->base_matrix[bmj][i]
                            + s->qr_size[inter][plane][qri])
                           / (2*s->qr_size[inter][plane][qri]);

M
Michael Niedermayer 已提交
631
                int qmin= 8<<(inter + !i);
632 633 634 635 636
                int qscale= i ? ac_scale_factor : dc_scale_factor;

                s->qmat[inter][plane][i]= clip((qscale * coeff)/100 * 4, qmin, 4096);
            }
        }
637
    }
638

639
    memset(s->qscale_table, (FFMAX(s->qmat[0][0][1], s->qmat[0][1][1])+8)/16, 512); //FIXME finetune
640 641
}

642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663
/*
 * This function initializes the loop filter boundary limits if the frame's
 * quality index is different from the previous frame's.
 */
static void init_loop_filter(Vp3DecodeContext *s)
{
    int *bounding_values= s->bounding_values_array+127;
    int filter_limit;
    int x;

    filter_limit = s->filter_limit_values[s->quality_index];

    /* set up the bounding values */
    memset(s->bounding_values_array, 0, 256 * sizeof(int));
    for (x = 0; x < filter_limit; x++) {
        bounding_values[-x - filter_limit] = -filter_limit + x;
        bounding_values[-x] = -x;
        bounding_values[x] = x;
        bounding_values[x + filter_limit] = filter_limit - x;
    }
}

664
/*
665
 * This function unpacks all of the superblock/macroblock/fragment coding
666 667
 * information from the bitstream.
 */
668
static int unpack_superblocks(Vp3DecodeContext *s, GetBitContext *gb)
669 670 671 672 673 674
{
    int bit = 0;
    int current_superblock = 0;
    int current_run = 0;
    int decode_fully_flags = 0;
    int decode_partial_blocks = 0;
675
    int first_c_fragment_seen;
676 677 678 679 680 681 682 683 684 685 686 687 688 689 690

    int i, j;
    int current_fragment;

    debug_vp3("  vp3: unpacking superblock coding\n");

    if (s->keyframe) {

        debug_vp3("    keyframe-- all superblocks are fully coded\n");
        memset(s->superblock_coding, SB_FULLY_CODED, s->superblock_count);

    } else {

        /* unpack the list of partially-coded superblocks */
        bit = get_bits(gb, 1);
691
        /* toggle the bit because as soon as the first run length is
692 693 694
         * fetched the bit will be toggled again */
        bit ^= 1;
        while (current_superblock < s->superblock_count) {
695
            if (current_run-- == 0) {
696
                bit ^= 1;
697
                current_run = get_vlc2(gb,
698 699
                    s->superblock_run_length_vlc.table, 6, 2);
                if (current_run == 33)
700
                    current_run += get_bits(gb, 12);
701 702 703 704 705 706 707
                debug_block_coding("      setting superblocks %d..%d to %s\n",
                    current_superblock,
                    current_superblock + current_run - 1,
                    (bit) ? "partially coded" : "not coded");

                /* if any of the superblocks are not partially coded, flag
                 * a boolean to decode the list of fully-coded superblocks */
708
                if (bit == 0) {
709
                    decode_fully_flags = 1;
710
                } else {
711

712 713 714 715
                    /* make a note of the fact that there are partially coded
                     * superblocks */
                    decode_partial_blocks = 1;
                }
716
            }
717
            s->superblock_coding[current_superblock++] = bit;
718 719 720 721 722 723 724 725 726
        }

        /* unpack the list of fully coded superblocks if any of the blocks were
         * not marked as partially coded in the previous step */
        if (decode_fully_flags) {

            current_superblock = 0;
            current_run = 0;
            bit = get_bits(gb, 1);
727
            /* toggle the bit because as soon as the first run length is
728 729 730 731 732 733 734
             * fetched the bit will be toggled again */
            bit ^= 1;
            while (current_superblock < s->superblock_count) {

                /* skip any superblocks already marked as partially coded */
                if (s->superblock_coding[current_superblock] == SB_NOT_CODED) {

735
                    if (current_run-- == 0) {
736
                        bit ^= 1;
737
                        current_run = get_vlc2(gb,
738 739
                            s->superblock_run_length_vlc.table, 6, 2);
                        if (current_run == 33)
740
                            current_run += get_bits(gb, 12);
741 742 743 744 745
                    }

                    debug_block_coding("      setting superblock %d to %s\n",
                        current_superblock,
                        (bit) ? "fully coded" : "not coded");
746
                    s->superblock_coding[current_superblock] = 2*bit;
747 748 749 750 751 752 753 754 755 756 757
                }
                current_superblock++;
            }
        }

        /* if there were partial blocks, initialize bitstream for
         * unpacking fragment codings */
        if (decode_partial_blocks) {

            current_run = 0;
            bit = get_bits(gb, 1);
758
            /* toggle the bit because as soon as the first run length is
759 760 761 762 763 764 765 766
             * fetched the bit will be toggled again */
            bit ^= 1;
        }
    }

    /* figure out which fragments are coded; iterate through each
     * superblock (all planes) */
    s->coded_fragment_list_index = 0;
767
    s->next_coeff= s->coeffs + s->fragment_count;
768 769
    s->first_coded_y_fragment = s->first_coded_c_fragment = 0;
    s->last_coded_y_fragment = s->last_coded_c_fragment = -1;
770
    first_c_fragment_seen = 0;
771
    memset(s->macroblock_coding, MODE_COPY, s->macroblock_count);
772 773 774 775 776 777 778
    for (i = 0; i < s->superblock_count; i++) {

        /* iterate through all 16 fragments in a superblock */
        for (j = 0; j < 16; j++) {

            /* if the fragment is in bounds, check its coding status */
            current_fragment = s->superblock_fragments[i * 16 + j];
779
            if (current_fragment >= s->fragment_count) {
780
                av_log(s->avctx, AV_LOG_ERROR, "  vp3:unpack_superblocks(): bad fragment number (%d >= %d)\n",
781 782 783
                    current_fragment, s->fragment_count);
                return 1;
            }
784 785 786 787
            if (current_fragment != -1) {
                if (s->superblock_coding[i] == SB_NOT_CODED) {

                    /* copy all the fragments from the prior frame */
788
                    s->all_fragments[current_fragment].coding_method =
789 790 791 792 793 794
                        MODE_COPY;

                } else if (s->superblock_coding[i] == SB_PARTIALLY_CODED) {

                    /* fragment may or may not be coded; this is the case
                     * that cares about the fragment coding runs */
795
                    if (current_run-- == 0) {
796
                        bit ^= 1;
797
                        current_run = get_vlc2(gb,
798
                            s->fragment_run_length_vlc.table, 5, 2);
799 800 801
                    }

                    if (bit) {
802
                        /* default mode; actual mode will be decoded in
803
                         * the next phase */
804
                        s->all_fragments[current_fragment].coding_method =
805
                            MODE_INTER_NO_MV;
806
                        s->all_fragments[current_fragment].next_coeff= s->coeffs + current_fragment;
807
                        s->coded_fragment_list[s->coded_fragment_list_index] =
808
                            current_fragment;
M
Michael Niedermayer 已提交
809
                        if ((current_fragment >= s->fragment_start[1]) &&
810 811
                            (s->last_coded_y_fragment == -1) &&
                            (!first_c_fragment_seen)) {
812 813
                            s->first_coded_c_fragment = s->coded_fragment_list_index;
                            s->last_coded_y_fragment = s->first_coded_c_fragment - 1;
814
                            first_c_fragment_seen = 1;
815 816
                        }
                        s->coded_fragment_list_index++;
817
                        s->macroblock_coding[s->all_fragments[current_fragment].macroblock] = MODE_INTER_NO_MV;
818 819 820 821 822 823 824 825 826 827 828 829 830 831
                        debug_block_coding("      superblock %d is partially coded, fragment %d is coded\n",
                            i, current_fragment);
                    } else {
                        /* not coded; copy this fragment from the prior frame */
                        s->all_fragments[current_fragment].coding_method =
                            MODE_COPY;
                        debug_block_coding("      superblock %d is partially coded, fragment %d is not coded\n",
                            i, current_fragment);
                    }

                } else {

                    /* fragments are fully coded in this superblock; actual
                     * coding will be determined in next step */
832
                    s->all_fragments[current_fragment].coding_method =
833
                        MODE_INTER_NO_MV;
834
                    s->all_fragments[current_fragment].next_coeff= s->coeffs + current_fragment;
835
                    s->coded_fragment_list[s->coded_fragment_list_index] =
836
                        current_fragment;
M
Michael Niedermayer 已提交
837
                    if ((current_fragment >= s->fragment_start[1]) &&
838 839
                        (s->last_coded_y_fragment == -1) &&
                        (!first_c_fragment_seen)) {
840 841
                        s->first_coded_c_fragment = s->coded_fragment_list_index;
                        s->last_coded_y_fragment = s->first_coded_c_fragment - 1;
842
                        first_c_fragment_seen = 1;
843 844
                    }
                    s->coded_fragment_list_index++;
845
                    s->macroblock_coding[s->all_fragments[current_fragment].macroblock] = MODE_INTER_NO_MV;
846 847 848 849 850 851
                    debug_block_coding("      superblock %d is fully coded, fragment %d is coded\n",
                        i, current_fragment);
                }
            }
        }
    }
852

853 854
    if (!first_c_fragment_seen)
        /* only Y fragments coded in this frame */
855
        s->last_coded_y_fragment = s->coded_fragment_list_index - 1;
856
    else
857
        /* end the list of coded C fragments */
858
        s->last_coded_c_fragment = s->coded_fragment_list_index - 1;
859

860 861 862 863 864 865
    debug_block_coding("    %d total coded fragments, y: %d -> %d, c: %d -> %d\n",
        s->coded_fragment_list_index,
        s->first_coded_y_fragment,
        s->last_coded_y_fragment,
        s->first_coded_c_fragment,
        s->last_coded_c_fragment);
866 867

    return 0;
868 869 870 871 872 873
}

/*
 * This function unpacks all the coding mode data for individual macroblocks
 * from the bitstream.
 */
874
static int unpack_modes(Vp3DecodeContext *s, GetBitContext *gb)
875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899
{
    int i, j, k;
    int scheme;
    int current_macroblock;
    int current_fragment;
    int coding_mode;

    debug_vp3("  vp3: unpacking encoding modes\n");

    if (s->keyframe) {
        debug_vp3("    keyframe-- all blocks are coded as INTRA\n");

        for (i = 0; i < s->fragment_count; i++)
            s->all_fragments[i].coding_method = MODE_INTRA;

    } else {

        /* fetch the mode coding scheme for this frame */
        scheme = get_bits(gb, 3);
        debug_modes("    using mode alphabet %d\n", scheme);

        /* is it a custom coding scheme? */
        if (scheme == 0) {
            debug_modes("    custom mode alphabet ahead:\n");
            for (i = 0; i < 8; i++)
900
                ModeAlphabet[scheme][get_bits(gb, 3)] = i;
901 902 903
        }

        for (i = 0; i < 8; i++)
904
            debug_modes("      mode[%d][%d] = %d\n", scheme, i,
905 906 907 908 909 910 911 912 913
                ModeAlphabet[scheme][i]);

        /* iterate through all of the macroblocks that contain 1 or more
         * coded fragments */
        for (i = 0; i < s->u_superblock_start; i++) {

            for (j = 0; j < 4; j++) {
                current_macroblock = s->superblock_macroblocks[i * 4 + j];
                if ((current_macroblock == -1) ||
914
                    (s->macroblock_coding[current_macroblock] == MODE_COPY))
915
                    continue;
916
                if (current_macroblock >= s->macroblock_count) {
917
                    av_log(s->avctx, AV_LOG_ERROR, "  vp3:unpack_modes(): bad macroblock number (%d >= %d)\n",
918 919 920
                        current_macroblock, s->macroblock_count);
                    return 1;
                }
921 922 923 924 925

                /* mode 7 means get 3 bits for each coding mode */
                if (scheme == 7)
                    coding_mode = get_bits(gb, 3);
                else
926 927
                    coding_mode = ModeAlphabet[scheme]
                        [get_vlc2(gb, s->mode_code_vlc.table, 3, 3)];
928

929
                s->macroblock_coding[current_macroblock] = coding_mode;
930
                for (k = 0; k < 6; k++) {
931
                    current_fragment =
932
                        s->macroblock_fragments[current_macroblock * 6 + k];
933 934 935
                    if (current_fragment == -1)
                        continue;
                    if (current_fragment >= s->fragment_count) {
936
                        av_log(s->avctx, AV_LOG_ERROR, "  vp3:unpack_modes(): bad fragment number (%d >= %d)\n",
937 938 939
                            current_fragment, s->fragment_count);
                        return 1;
                    }
940
                    if (s->all_fragments[current_fragment].coding_method !=
941 942 943 944 945 946 947 948 949 950
                        MODE_COPY)
                        s->all_fragments[current_fragment].coding_method =
                            coding_mode;
                }

                debug_modes("    coding method for macroblock starting @ fragment %d = %d\n",
                    s->macroblock_fragments[current_macroblock * 6], coding_mode);
            }
        }
    }
951 952

    return 0;
953 954
}

955 956 957 958
/*
 * This function unpacks all the motion vectors for the individual
 * macroblocks from the bitstream.
 */
959
static int unpack_vectors(Vp3DecodeContext *s, GetBitContext *gb)
960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993
{
    int i, j, k;
    int coding_mode;
    int motion_x[6];
    int motion_y[6];
    int last_motion_x = 0;
    int last_motion_y = 0;
    int prior_last_motion_x = 0;
    int prior_last_motion_y = 0;
    int current_macroblock;
    int current_fragment;

    debug_vp3("  vp3: unpacking motion vectors\n");
    if (s->keyframe) {

        debug_vp3("    keyframe-- there are no motion vectors\n");

    } else {

        memset(motion_x, 0, 6 * sizeof(int));
        memset(motion_y, 0, 6 * sizeof(int));

        /* coding mode 0 is the VLC scheme; 1 is the fixed code scheme */
        coding_mode = get_bits(gb, 1);
        debug_vectors("    using %s scheme for unpacking motion vectors\n",
            (coding_mode == 0) ? "VLC" : "fixed-length");

        /* iterate through all of the macroblocks that contain 1 or more
         * coded fragments */
        for (i = 0; i < s->u_superblock_start; i++) {

            for (j = 0; j < 4; j++) {
                current_macroblock = s->superblock_macroblocks[i * 4 + j];
                if ((current_macroblock == -1) ||
994
                    (s->macroblock_coding[current_macroblock] == MODE_COPY))
995
                    continue;
996
                if (current_macroblock >= s->macroblock_count) {
997
                    av_log(s->avctx, AV_LOG_ERROR, "  vp3:unpack_vectors(): bad macroblock number (%d >= %d)\n",
998 999 1000
                        current_macroblock, s->macroblock_count);
                    return 1;
                }
1001 1002

                current_fragment = s->macroblock_fragments[current_macroblock * 6];
1003
                if (current_fragment >= s->fragment_count) {
1004
                    av_log(s->avctx, AV_LOG_ERROR, "  vp3:unpack_vectors(): bad fragment number (%d >= %d\n",
1005 1006 1007
                        current_fragment, s->fragment_count);
                    return 1;
                }
1008
                switch (s->macroblock_coding[current_macroblock]) {
1009 1010 1011 1012 1013

                case MODE_INTER_PLUS_MV:
                case MODE_GOLDEN_MV:
                    /* all 6 fragments use the same motion vector */
                    if (coding_mode == 0) {
1014 1015
                        motion_x[0] = motion_vector_table[get_vlc2(gb, s->motion_vector_vlc.table, 6, 2)];
                        motion_y[0] = motion_vector_table[get_vlc2(gb, s->motion_vector_vlc.table, 6, 2)];
1016
                    } else {
1017 1018
                        motion_x[0] = fixed_motion_vector_table[get_bits(gb, 6)];
                        motion_y[0] = fixed_motion_vector_table[get_bits(gb, 6)];
1019
                    }
1020

1021 1022 1023 1024 1025 1026
                    for (k = 1; k < 6; k++) {
                        motion_x[k] = motion_x[0];
                        motion_y[k] = motion_y[0];
                    }

                    /* vector maintenance, only on MODE_INTER_PLUS_MV */
1027
                    if (s->macroblock_coding[current_macroblock] ==
1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041
                        MODE_INTER_PLUS_MV) {
                        prior_last_motion_x = last_motion_x;
                        prior_last_motion_y = last_motion_y;
                        last_motion_x = motion_x[0];
                        last_motion_y = motion_y[0];
                    }
                    break;

                case MODE_INTER_FOURMV:
                    /* fetch 4 vectors from the bitstream, one for each
                     * Y fragment, then average for the C fragment vectors */
                    motion_x[4] = motion_y[4] = 0;
                    for (k = 0; k < 4; k++) {
                        if (coding_mode == 0) {
1042 1043
                            motion_x[k] = motion_vector_table[get_vlc2(gb, s->motion_vector_vlc.table, 6, 2)];
                            motion_y[k] = motion_vector_table[get_vlc2(gb, s->motion_vector_vlc.table, 6, 2)];
1044
                        } else {
1045 1046
                            motion_x[k] = fixed_motion_vector_table[get_bits(gb, 6)];
                            motion_y[k] = fixed_motion_vector_table[get_bits(gb, 6)];
1047 1048 1049 1050 1051
                        }
                        motion_x[4] += motion_x[k];
                        motion_y[4] += motion_y[k];
                    }

M
Michael Niedermayer 已提交
1052 1053 1054 1055
                    motion_x[5]=
                    motion_x[4]= RSHIFT(motion_x[4], 2);
                    motion_y[5]=
                    motion_y[4]= RSHIFT(motion_y[4], 2);
1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093

                    /* vector maintenance; vector[3] is treated as the
                     * last vector in this case */
                    prior_last_motion_x = last_motion_x;
                    prior_last_motion_y = last_motion_y;
                    last_motion_x = motion_x[3];
                    last_motion_y = motion_y[3];
                    break;

                case MODE_INTER_LAST_MV:
                    /* all 6 fragments use the last motion vector */
                    motion_x[0] = last_motion_x;
                    motion_y[0] = last_motion_y;
                    for (k = 1; k < 6; k++) {
                        motion_x[k] = motion_x[0];
                        motion_y[k] = motion_y[0];
                    }

                    /* no vector maintenance (last vector remains the
                     * last vector) */
                    break;

                case MODE_INTER_PRIOR_LAST:
                    /* all 6 fragments use the motion vector prior to the
                     * last motion vector */
                    motion_x[0] = prior_last_motion_x;
                    motion_y[0] = prior_last_motion_y;
                    for (k = 1; k < 6; k++) {
                        motion_x[k] = motion_x[0];
                        motion_y[k] = motion_y[0];
                    }

                    /* vector maintenance */
                    prior_last_motion_x = last_motion_x;
                    prior_last_motion_y = last_motion_y;
                    last_motion_x = motion_x[0];
                    last_motion_y = motion_y[0];
                    break;
1094 1095 1096 1097 1098 1099 1100 1101

                default:
                    /* covers intra, inter without MV, golden without MV */
                    memset(motion_x, 0, 6 * sizeof(int));
                    memset(motion_y, 0, 6 * sizeof(int));

                    /* no vector maintenance */
                    break;
1102 1103 1104 1105 1106
                }

                /* assign the motion vectors to the correct fragments */
                debug_vectors("    vectors for macroblock starting @ fragment %d (coding method %d):\n",
                    current_fragment,
1107
                    s->macroblock_coding[current_macroblock]);
1108
                for (k = 0; k < 6; k++) {
1109
                    current_fragment =
1110
                        s->macroblock_fragments[current_macroblock * 6 + k];
1111 1112 1113
                    if (current_fragment == -1)
                        continue;
                    if (current_fragment >= s->fragment_count) {
1114
                        av_log(s->avctx, AV_LOG_ERROR, "  vp3:unpack_vectors(): bad fragment number (%d >= %d)\n",
1115 1116 1117
                            current_fragment, s->fragment_count);
                        return 1;
                    }
1118
                    s->all_fragments[current_fragment].motion_x = motion_x[k];
1119
                    s->all_fragments[current_fragment].motion_y = motion_y[k];
1120 1121
                    debug_vectors("    vector %d: fragment %d = (%d, %d)\n",
                        k, current_fragment, motion_x[k], motion_y[k]);
1122 1123 1124 1125
                }
            }
        }
    }
1126 1127

    return 0;
1128 1129
}

1130
/*
1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148
 * This function is called by unpack_dct_coeffs() to extract the VLCs from
 * the bitstream. The VLCs encode tokens which are used to unpack DCT
 * data. This function unpacks all the VLCs for either the Y plane or both
 * C planes, and is called for DC coefficients or different AC coefficient
 * levels (since different coefficient types require different VLC tables.
 *
 * This function returns a residual eob run. E.g, if a particular token gave
 * instructions to EOB the next 5 fragments and there were only 2 fragments
 * left in the current fragment range, 3 would be returned so that it could
 * be passed into the next call to this same function.
 */
static int unpack_vlcs(Vp3DecodeContext *s, GetBitContext *gb,
                        VLC *table, int coeff_index,
                        int first_fragment, int last_fragment,
                        int eob_run)
{
    int i;
    int token;
1149 1150
    int zero_run = 0;
    DCTELEM coeff = 0;
1151
    Vp3Fragment *fragment;
M
Michael Niedermayer 已提交
1152
    uint8_t *perm= s->scantable.permutated;
1153
    int bits_to_get;
1154

1155
    if ((first_fragment >= s->fragment_count) ||
1156 1157
        (last_fragment >= s->fragment_count)) {

1158
        av_log(s->avctx, AV_LOG_ERROR, "  vp3:unpack_vlcs(): bad fragment number (%d -> %d ?)\n",
1159
            first_fragment, last_fragment);
1160
        return 0;
1161 1162
    }

1163
    for (i = first_fragment; i <= last_fragment; i++) {
1164 1165 1166 1167 1168 1169 1170 1171 1172 1173

        fragment = &s->all_fragments[s->coded_fragment_list[i]];
        if (fragment->coeff_count > coeff_index)
            continue;

        if (!eob_run) {
            /* decode a VLC into a token */
            token = get_vlc2(gb, table->table, 5, 3);
            debug_vlc(" token = %2d, ", token);
            /* use the token to get a zero run, a coefficient, and an eob run */
1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189
            if (token <= 6) {
                eob_run = eob_run_base[token];
                if (eob_run_get_bits[token])
                    eob_run += get_bits(gb, eob_run_get_bits[token]);
                coeff = zero_run = 0;
            } else {
                bits_to_get = coeff_get_bits[token];
                if (!bits_to_get)
                    coeff = coeff_tables[token][0];
                else
                    coeff = coeff_tables[token][get_bits(gb, bits_to_get)];

                zero_run = zero_run_base[token];
                if (zero_run_get_bits[token])
                    zero_run += get_bits(gb, zero_run_get_bits[token]);
            }
1190 1191 1192 1193
        }

        if (!eob_run) {
            fragment->coeff_count += zero_run;
1194 1195 1196 1197 1198 1199 1200
            if (fragment->coeff_count < 64){
                fragment->next_coeff->coeff= coeff;
                fragment->next_coeff->index= perm[fragment->coeff_count++]; //FIXME perm here already?
                fragment->next_coeff->next= s->next_coeff;
                s->next_coeff->next=NULL;
                fragment->next_coeff= s->next_coeff++;
            }
1201
            debug_vlc(" fragment %d coeff = %d\n",
1202
                s->coded_fragment_list[i], fragment->next_coeff[coeff_index]);
1203
        } else {
1204
            fragment->coeff_count |= 128;
1205
            debug_vlc(" fragment %d eob with %d coefficients\n",
1206
                s->coded_fragment_list[i], fragment->coeff_count&127);
1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217
            eob_run--;
        }
    }

    return eob_run;
}

/*
 * This function unpacks all of the DCT coefficient data from the
 * bitstream.
 */
1218
static int unpack_dct_coeffs(Vp3DecodeContext *s, GetBitContext *gb)
1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233
{
    int i;
    int dc_y_table;
    int dc_c_table;
    int ac_y_table;
    int ac_c_table;
    int residual_eob_run = 0;

    /* fetch the DC table indices */
    dc_y_table = get_bits(gb, 4);
    dc_c_table = get_bits(gb, 4);

    /* unpack the Y plane DC coefficients */
    debug_vp3("  vp3: unpacking Y plane DC coefficients using table %d\n",
        dc_y_table);
1234
    residual_eob_run = unpack_vlcs(s, gb, &s->dc_vlc[dc_y_table], 0,
1235
        s->first_coded_y_fragment, s->last_coded_y_fragment, residual_eob_run);
1236 1237 1238 1239 1240

    /* unpack the C plane DC coefficients */
    debug_vp3("  vp3: unpacking C plane DC coefficients using table %d\n",
        dc_c_table);
    residual_eob_run = unpack_vlcs(s, gb, &s->dc_vlc[dc_c_table], 0,
1241
        s->first_coded_c_fragment, s->last_coded_c_fragment, residual_eob_run);
1242

1243
    /* fetch the AC table indices */
1244 1245 1246
    ac_y_table = get_bits(gb, 4);
    ac_c_table = get_bits(gb, 4);

1247
    /* unpack the group 1 AC coefficients (coeffs 1-5) */
1248 1249 1250 1251
    for (i = 1; i <= 5; i++) {

        debug_vp3("  vp3: unpacking level %d Y plane AC coefficients using table %d\n",
            i, ac_y_table);
1252
        residual_eob_run = unpack_vlcs(s, gb, &s->ac_vlc_1[ac_y_table], i,
1253
            s->first_coded_y_fragment, s->last_coded_y_fragment, residual_eob_run);
1254 1255 1256

        debug_vp3("  vp3: unpacking level %d C plane AC coefficients using table %d\n",
            i, ac_c_table);
1257
        residual_eob_run = unpack_vlcs(s, gb, &s->ac_vlc_1[ac_c_table], i,
1258
            s->first_coded_c_fragment, s->last_coded_c_fragment, residual_eob_run);
1259 1260
    }

1261
    /* unpack the group 2 AC coefficients (coeffs 6-14) */
1262 1263 1264 1265
    for (i = 6; i <= 14; i++) {

        debug_vp3("  vp3: unpacking level %d Y plane AC coefficients using table %d\n",
            i, ac_y_table);
1266
        residual_eob_run = unpack_vlcs(s, gb, &s->ac_vlc_2[ac_y_table], i,
1267
            s->first_coded_y_fragment, s->last_coded_y_fragment, residual_eob_run);
1268 1269 1270

        debug_vp3("  vp3: unpacking level %d C plane AC coefficients using table %d\n",
            i, ac_c_table);
1271
        residual_eob_run = unpack_vlcs(s, gb, &s->ac_vlc_2[ac_c_table], i,
1272
            s->first_coded_c_fragment, s->last_coded_c_fragment, residual_eob_run);
1273 1274
    }

1275
    /* unpack the group 3 AC coefficients (coeffs 15-27) */
1276 1277 1278 1279
    for (i = 15; i <= 27; i++) {

        debug_vp3("  vp3: unpacking level %d Y plane AC coefficients using table %d\n",
            i, ac_y_table);
1280
        residual_eob_run = unpack_vlcs(s, gb, &s->ac_vlc_3[ac_y_table], i,
1281
            s->first_coded_y_fragment, s->last_coded_y_fragment, residual_eob_run);
1282 1283 1284

        debug_vp3("  vp3: unpacking level %d C plane AC coefficients using table %d\n",
            i, ac_c_table);
1285
        residual_eob_run = unpack_vlcs(s, gb, &s->ac_vlc_3[ac_c_table], i,
1286
            s->first_coded_c_fragment, s->last_coded_c_fragment, residual_eob_run);
1287 1288
    }

1289
    /* unpack the group 4 AC coefficients (coeffs 28-63) */
1290 1291 1292 1293
    for (i = 28; i <= 63; i++) {

        debug_vp3("  vp3: unpacking level %d Y plane AC coefficients using table %d\n",
            i, ac_y_table);
1294
        residual_eob_run = unpack_vlcs(s, gb, &s->ac_vlc_4[ac_y_table], i,
1295
            s->first_coded_y_fragment, s->last_coded_y_fragment, residual_eob_run);
1296 1297 1298

        debug_vp3("  vp3: unpacking level %d C plane AC coefficients using table %d\n",
            i, ac_c_table);
1299
        residual_eob_run = unpack_vlcs(s, gb, &s->ac_vlc_4[ac_c_table], i,
1300
            s->first_coded_c_fragment, s->last_coded_c_fragment, residual_eob_run);
1301
    }
1302 1303

    return 0;
1304 1305 1306 1307
}

/*
 * This function reverses the DC prediction for each coded fragment in
1308
 * the frame. Much of this function is adapted directly from the original
1309 1310 1311 1312 1313
 * VP3 source code.
 */
#define COMPATIBLE_FRAME(x) \
  (compatible_frame[s->all_fragments[x].coding_method] == current_frame_type)
#define FRAME_CODED(x) (s->all_fragments[x].coding_method != MODE_COPY)
1314
#define DC_COEFF(u) (s->coeffs[u].index ? 0 : s->coeffs[u].coeff) //FIXME do somethin to simplify this
1315 1316 1317 1318

static void reverse_dc_prediction(Vp3DecodeContext *s,
                                  int first_fragment,
                                  int fragment_width,
1319
                                  int fragment_height)
1320 1321 1322 1323 1324 1325 1326 1327 1328 1329
{

#define PUL 8
#define PU 4
#define PUR 2
#define PL 1

    int x, y;
    int i = first_fragment;

1330
    int predicted_dc;
1331 1332 1333 1334 1335 1336 1337

    /* DC values for the left, up-left, up, and up-right fragments */
    int vl, vul, vu, vur;

    /* indices for the left, up-left, up, and up-right fragments */
    int l, ul, u, ur;

1338
    /*
1339 1340 1341 1342 1343 1344
     * The 6 fields mean:
     *   0: up-left multiplier
     *   1: up multiplier
     *   2: up-right multiplier
     *   3: left multiplier
     */
M
Michael Niedermayer 已提交
1345 1346 1347 1348 1349 1350 1351 1352 1353 1354 1355 1356 1357 1358 1359 1360 1361
    int predictor_transform[16][4] = {
        {  0,  0,  0,  0},
        {  0,  0,  0,128},        // PL
        {  0,  0,128,  0},        // PUR
        {  0,  0, 53, 75},        // PUR|PL
        {  0,128,  0,  0},        // PU
        {  0, 64,  0, 64},        // PU|PL
        {  0,128,  0,  0},        // PU|PUR
        {  0,  0, 53, 75},        // PU|PUR|PL
        {128,  0,  0,  0},        // PUL
        {  0,  0,  0,128},        // PUL|PL
        { 64,  0, 64,  0},        // PUL|PUR
        {  0,  0, 53, 75},        // PUL|PUR|PL
        {  0,128,  0,  0},        // PUL|PU
       {-104,116,  0,116},        // PUL|PU|PL
        { 24, 80, 24,  0},        // PUL|PU|PUR
       {-104,116,  0,116}         // PUL|PU|PUR|PL
1362 1363 1364 1365 1366
    };

    /* This table shows which types of blocks can use other blocks for
     * prediction. For example, INTRA is the only mode in this table to
     * have a frame number of 0. That means INTRA blocks can only predict
1367
     * from other INTRA blocks. There are 2 golden frame coding types;
1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400
     * blocks encoding in these modes can only predict from other blocks
     * that were encoded with these 1 of these 2 modes. */
    unsigned char compatible_frame[8] = {
        1,    /* MODE_INTER_NO_MV */
        0,    /* MODE_INTRA */
        1,    /* MODE_INTER_PLUS_MV */
        1,    /* MODE_INTER_LAST_MV */
        1,    /* MODE_INTER_PRIOR_MV */
        2,    /* MODE_USING_GOLDEN */
        2,    /* MODE_GOLDEN_MV */
        1     /* MODE_INTER_FOUR_MV */
    };
    int current_frame_type;

    /* there is a last DC predictor for each of the 3 frame types */
    short last_dc[3];

    int transform = 0;

    debug_vp3("  vp3: reversing DC prediction\n");

    vul = vu = vur = vl = 0;
    last_dc[0] = last_dc[1] = last_dc[2] = 0;

    /* for each fragment row... */
    for (y = 0; y < fragment_height; y++) {

        /* for each fragment in a row... */
        for (x = 0; x < fragment_width; x++, i++) {

            /* reverse prediction if this block was coded */
            if (s->all_fragments[i].coding_method != MODE_COPY) {

1401
                current_frame_type =
1402
                    compatible_frame[s->all_fragments[i].coding_method];
M
Michael Niedermayer 已提交
1403 1404
                debug_dc_pred(" frag %d: orig DC = %d, ",
                    i, DC_COEFF(i));
1405

M
Michael Niedermayer 已提交
1406 1407 1408
                transform= 0;
                if(x){
                    l= i-1;
1409
                    vl = DC_COEFF(l);
M
Michael Niedermayer 已提交
1410 1411
                    if(FRAME_CODED(l) && COMPATIBLE_FRAME(l))
                        transform |= PL;
M
Michael Niedermayer 已提交
1412 1413 1414
                }
                if(y){
                    u= i-fragment_width;
1415
                    vu = DC_COEFF(u);
M
Michael Niedermayer 已提交
1416 1417
                    if(FRAME_CODED(u) && COMPATIBLE_FRAME(u))
                        transform |= PU;
M
Michael Niedermayer 已提交
1418 1419 1420
                    if(x){
                        ul= i-fragment_width-1;
                        vul = DC_COEFF(ul);
M
Michael Niedermayer 已提交
1421 1422
                        if(FRAME_CODED(ul) && COMPATIBLE_FRAME(ul))
                            transform |= PUL;
M
Michael Niedermayer 已提交
1423 1424 1425 1426
                    }
                    if(x + 1 < fragment_width){
                        ur= i-fragment_width+1;
                        vur = DC_COEFF(ur);
M
Michael Niedermayer 已提交
1427 1428
                        if(FRAME_CODED(ur) && COMPATIBLE_FRAME(ur))
                            transform |= PUR;
M
Michael Niedermayer 已提交
1429
                    }
1430 1431 1432 1433 1434 1435 1436 1437
                }

                debug_dc_pred("transform = %d, ", transform);

                if (transform == 0) {

                    /* if there were no fragments to predict from, use last
                     * DC saved */
1438
                    predicted_dc = last_dc[current_frame_type];
1439
                    debug_dc_pred("from last DC (%d) = %d\n",
1440
                        current_frame_type, DC_COEFF(i));
1441 1442 1443 1444 1445 1446 1447 1448 1449 1450

                } else {

                    /* apply the appropriate predictor transform */
                    predicted_dc =
                        (predictor_transform[transform][0] * vul) +
                        (predictor_transform[transform][1] * vu) +
                        (predictor_transform[transform][2] * vur) +
                        (predictor_transform[transform][3] * vl);

M
Michael Niedermayer 已提交
1451
                    predicted_dc /= 128;
1452 1453 1454 1455

                    /* check for outranging on the [ul u l] and
                     * [ul u ur l] predictors */
                    if ((transform == 13) || (transform == 15)) {
M
Michael Niedermayer 已提交
1456
                        if (ABS(predicted_dc - vu) > 128)
1457
                            predicted_dc = vu;
M
Michael Niedermayer 已提交
1458
                        else if (ABS(predicted_dc - vl) > 128)
1459
                            predicted_dc = vl;
M
Michael Niedermayer 已提交
1460
                        else if (ABS(predicted_dc - vul) > 128)
1461 1462 1463
                            predicted_dc = vul;
                    }

1464
                    debug_dc_pred("from pred DC = %d\n",
1465
                    DC_COEFF(i));
1466 1467
                }

1468 1469 1470 1471 1472 1473 1474 1475
                /* at long last, apply the predictor */
                if(s->coeffs[i].index){
                    *s->next_coeff= s->coeffs[i];
                    s->coeffs[i].index=0;
                    s->coeffs[i].coeff=0;
                    s->coeffs[i].next= s->next_coeff++;
                }
                s->coeffs[i].coeff += predicted_dc;
1476
                /* save the DC */
1477 1478 1479 1480 1481 1482 1483
                last_dc[current_frame_type] = DC_COEFF(i);
                if(DC_COEFF(i) && !(s->all_fragments[i].coeff_count&127)){
                    s->all_fragments[i].coeff_count= 129;
//                    s->all_fragments[i].next_coeff= s->next_coeff;
                    s->coeffs[i].next= s->next_coeff;
                    (s->next_coeff++)->next=NULL;
                }
1484 1485 1486 1487 1488
            }
        }
    }
}

1489 1490 1491 1492 1493 1494

static void horizontal_filter(unsigned char *first_pixel, int stride,
    int *bounding_values);
static void vertical_filter(unsigned char *first_pixel, int stride,
    int *bounding_values);

1495 1496 1497 1498 1499 1500
/*
 * Perform the final rendering for a particular slice of data.
 * The slice number ranges from 0..(macroblock_height - 1).
 */
static void render_slice(Vp3DecodeContext *s, int slice)
{
M
Michael Niedermayer 已提交
1501
    int x;
1502 1503
    int m, n;
    int16_t *dequantizer;
1504
    DECLARE_ALIGNED_16(DCTELEM, block[64]);
1505 1506 1507 1508 1509 1510 1511 1512 1513 1514
    int motion_x = 0xdeadbeef, motion_y = 0xdeadbeef;
    int motion_halfpel_index;
    uint8_t *motion_source;
    int plane;
    int current_macroblock_entry = slice * s->macroblock_width * 6;

    if (slice >= s->macroblock_height)
        return;

    for (plane = 0; plane < 3; plane++) {
M
Michael Niedermayer 已提交
1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 1525
        uint8_t *output_plane = s->current_frame.data    [plane];
        uint8_t *  last_plane = s->   last_frame.data    [plane];
        uint8_t *golden_plane = s-> golden_frame.data    [plane];
        int stride            = s->current_frame.linesize[plane];
        int plane_width       = s->width  >> !!plane;
        int plane_height      = s->height >> !!plane;
        int y =        slice *  FRAGMENT_PIXELS << !plane ;
        int slice_height = y + (FRAGMENT_PIXELS << !plane);
        int i = s->macroblock_fragments[current_macroblock_entry + plane + 3*!!plane];

        if (!s->flipped_image) stride = -stride;
1526

1527

1528 1529 1530 1531 1532 1533 1534 1535 1536 1537 1538 1539 1540 1541 1542 1543 1544 1545 1546 1547 1548
        if(ABS(stride) > 2048)
            return; //various tables are fixed size

        /* for each fragment row in the slice (both of them)... */
        for (; y < slice_height; y += 8) {

            /* for each fragment in a row... */
            for (x = 0; x < plane_width; x += 8, i++) {

                if ((i < 0) || (i >= s->fragment_count)) {
                    av_log(s->avctx, AV_LOG_ERROR, "  vp3:render_slice(): bad fragment number (%d)\n", i);
                    return;
                }

                /* transform if this block was coded */
                if ((s->all_fragments[i].coding_method != MODE_COPY) &&
                    !((s->avctx->flags & CODEC_FLAG_GRAY) && plane)) {

                    if ((s->all_fragments[i].coding_method == MODE_USING_GOLDEN) ||
                        (s->all_fragments[i].coding_method == MODE_GOLDEN_MV))
                        motion_source= golden_plane;
1549
                    else
1550 1551 1552 1553 1554 1555 1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578 1579 1580 1581 1582 1583 1584 1585 1586
                        motion_source= last_plane;

                    motion_source += s->all_fragments[i].first_pixel;
                    motion_halfpel_index = 0;

                    /* sort out the motion vector if this fragment is coded
                     * using a motion vector method */
                    if ((s->all_fragments[i].coding_method > MODE_INTRA) &&
                        (s->all_fragments[i].coding_method != MODE_USING_GOLDEN)) {
                        int src_x, src_y;
                        motion_x = s->all_fragments[i].motion_x;
                        motion_y = s->all_fragments[i].motion_y;
                        if(plane){
                            motion_x= (motion_x>>1) | (motion_x&1);
                            motion_y= (motion_y>>1) | (motion_y&1);
                        }

                        src_x= (motion_x>>1) + x;
                        src_y= (motion_y>>1) + y;
                        if ((motion_x == 127) || (motion_y == 127))
                            av_log(s->avctx, AV_LOG_ERROR, " help! got invalid motion vector! (%X, %X)\n", motion_x, motion_y);

                        motion_halfpel_index = motion_x & 0x01;
                        motion_source += (motion_x >> 1);

                        motion_halfpel_index |= (motion_y & 0x01) << 1;
                        motion_source += ((motion_y >> 1) * stride);

                        if(src_x<0 || src_y<0 || src_x + 9 >= plane_width || src_y + 9 >= plane_height){
                            uint8_t *temp= s->edge_emu_buffer;
                            if(stride<0) temp -= 9*stride;
                            else temp += 9*stride;

                            ff_emulated_edge_mc(temp, motion_source, stride, 9, 9, src_x, src_y, plane_width, plane_height);
                            motion_source= temp;
                        }
                    }
1587

1588 1589 1590 1591

                    /* first, take care of copying a block from either the
                     * previous or the golden frame */
                    if (s->all_fragments[i].coding_method != MODE_INTRA) {
1592 1593 1594
                        /* Note, it is possible to implement all MC cases with
                           put_no_rnd_pixels_l2 which would look more like the
                           VP3 source but this would be slower as
1595 1596 1597 1598 1599 1600 1601 1602 1603
                           put_no_rnd_pixels_tab is better optimzed */
                        if(motion_halfpel_index != 3){
                            s->dsp.put_no_rnd_pixels_tab[1][motion_halfpel_index](
                                output_plane + s->all_fragments[i].first_pixel,
                                motion_source, stride, 8);
                        }else{
                            int d= (motion_x ^ motion_y)>>31; // d is 0 if motion_x and _y have the same sign, else -1
                            s->dsp.put_no_rnd_pixels_l2[1](
                                output_plane + s->all_fragments[i].first_pixel,
1604 1605
                                motion_source - d,
                                motion_source + stride + 1 + d,
1606 1607
                                stride, 8);
                        }
1608
                        dequantizer = s->qmat[1][plane];
1609
                    }else{
1610
                        dequantizer = s->qmat[0][plane];
1611 1612 1613
                    }

                    /* dequantize the DCT coefficients */
1614 1615
                    debug_idct("fragment %d, coding mode %d, DC = %d, dequant = %d:\n",
                        i, s->all_fragments[i].coding_method,
1616 1617 1618 1619 1620 1621 1622 1623 1624 1625 1626 1627 1628 1629 1630 1631 1632 1633 1634
                        DC_COEFF(i), dequantizer[0]);

                    if(s->avctx->idct_algo==FF_IDCT_VP3){
                        Coeff *coeff= s->coeffs + i;
                        memset(block, 0, sizeof(block));
                        while(coeff->next){
                            block[coeff->index]= coeff->coeff * dequantizer[coeff->index];
                            coeff= coeff->next;
                        }
                    }else{
                        Coeff *coeff= s->coeffs + i;
                        memset(block, 0, sizeof(block));
                        while(coeff->next){
                            block[coeff->index]= (coeff->coeff * dequantizer[coeff->index] + 2)>>2;
                            coeff= coeff->next;
                        }
                    }

                    /* invert DCT and place (or add) in final output */
1635

1636 1637 1638 1639 1640 1641 1642 1643 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654
                    if (s->all_fragments[i].coding_method == MODE_INTRA) {
                        if(s->avctx->idct_algo!=FF_IDCT_VP3)
                            block[0] += 128<<3;
                        s->dsp.idct_put(
                            output_plane + s->all_fragments[i].first_pixel,
                            stride,
                            block);
                    } else {
                        s->dsp.idct_add(
                            output_plane + s->all_fragments[i].first_pixel,
                            stride,
                            block);
                    }

                    debug_idct("block after idct_%s():\n",
                        (s->all_fragments[i].coding_method == MODE_INTRA)?
                        "put" : "add");
                    for (m = 0; m < 8; m++) {
                        for (n = 0; n < 8; n++) {
1655
                            debug_idct(" %3d", *(output_plane +
1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 1666 1667 1668 1669 1670
                                s->all_fragments[i].first_pixel + (m * stride + n)));
                        }
                        debug_idct("\n");
                    }
                    debug_idct("\n");

                } else {

                    /* copy directly from the previous frame */
                    s->dsp.put_pixels_tab[1][0](
                        output_plane + s->all_fragments[i].first_pixel,
                        last_plane + s->all_fragments[i].first_pixel,
                        stride, 8);

                }
1671
#if 0
1672 1673 1674 1675 1676 1677 1678
                /* perform the left edge filter if:
                 *   - the fragment is not on the left column
                 *   - the fragment is coded in this frame
                 *   - the fragment is not coded in this frame but the left
                 *     fragment is coded in this frame (this is done instead
                 *     of a right edge filter when rendering the left fragment
                 *     since this fragment is not available yet) */
1679
                if ((x > 0) &&
1680 1681 1682
                    ((s->all_fragments[i].coding_method != MODE_COPY) ||
                     ((s->all_fragments[i].coding_method == MODE_COPY) &&
                      (s->all_fragments[i - 1].coding_method != MODE_COPY)) )) {
1683
                    horizontal_filter(
1684
                        output_plane + s->all_fragments[i].first_pixel + 7*stride,
M
Michael Niedermayer 已提交
1685
                        -stride, s->bounding_values_array + 127);
1686 1687
                }

1688 1689 1690 1691 1692 1693 1694
                /* perform the top edge filter if:
                 *   - the fragment is not on the top row
                 *   - the fragment is coded in this frame
                 *   - the fragment is not coded in this frame but the above
                 *     fragment is coded in this frame (this is done instead
                 *     of a bottom edge filter when rendering the above
                 *     fragment since this fragment is not available yet) */
1695
                if ((y > 0) &&
1696 1697 1698
                    ((s->all_fragments[i].coding_method != MODE_COPY) ||
                     ((s->all_fragments[i].coding_method == MODE_COPY) &&
                      (s->all_fragments[i - fragment_width].coding_method != MODE_COPY)) )) {
1699
                    vertical_filter(
1700
                        output_plane + s->all_fragments[i].first_pixel - stride,
M
Michael Niedermayer 已提交
1701
                        -stride, s->bounding_values_array + 127);
1702
                }
1703
#endif
1704 1705 1706 1707 1708 1709 1710
            }
        }
    }

     /* this looks like a good place for slice dispatch... */
     /* algorithm:
      *   if (slice == s->macroblock_height - 1)
1711 1712 1713
      *     dispatch (both last slice & 2nd-to-last slice);
      *   else if (slice > 0)
      *     dispatch (slice - 1);
1714 1715 1716 1717 1718
      */

    emms_c();
}

1719 1720 1721
static void horizontal_filter(unsigned char *first_pixel, int stride,
    int *bounding_values)
{
1722
    unsigned char *end;
1723 1724
    int filter_value;

M
Michael Niedermayer 已提交
1725
    for (end= first_pixel + 8*stride; first_pixel != end; first_pixel += stride) {
1726
        filter_value =
1727 1728
            (first_pixel[-2] - first_pixel[ 1])
         +3*(first_pixel[ 0] - first_pixel[-1]);
1729
        filter_value = bounding_values[(filter_value + 4) >> 3];
1730 1731
        first_pixel[-1] = clip_uint8(first_pixel[-1] + filter_value);
        first_pixel[ 0] = clip_uint8(first_pixel[ 0] - filter_value);
1732 1733 1734 1735 1736 1737
    }
}

static void vertical_filter(unsigned char *first_pixel, int stride,
    int *bounding_values)
{
1738
    unsigned char *end;
1739
    int filter_value;
1740
    const int nstride= -stride;
1741

1742
    for (end= first_pixel + 8; first_pixel < end; first_pixel++) {
1743
        filter_value =
1744 1745
            (first_pixel[2 * nstride] - first_pixel[ stride])
         +3*(first_pixel[0          ] - first_pixel[nstride]);
1746
        filter_value = bounding_values[(filter_value + 4) >> 3];
1747
        first_pixel[nstride] = clip_uint8(first_pixel[nstride] + filter_value);
1748
        first_pixel[0] = clip_uint8(first_pixel[0] - filter_value);
1749 1750 1751 1752 1753
    }
}

static void apply_loop_filter(Vp3DecodeContext *s)
{
M
Michael Niedermayer 已提交
1754 1755
    int plane;
    int x, y;
1756
    int *bounding_values= s->bounding_values_array+127;
1757

1758
#if 0
1759
    int bounding_values_array[256];
1760 1761 1762 1763 1764 1765 1766
    int filter_limit;

    /* find the right loop limit value */
    for (x = 63; x >= 0; x--) {
        if (vp31_ac_scale_factor[x] >= s->quality_index)
            break;
    }
1767
    filter_limit = vp31_filter_limit_values[s->quality_index];
1768 1769

    /* set up the bounding values */
1770
    memset(bounding_values_array, 0, 256 * sizeof(int));
1771 1772 1773 1774 1775 1776
    for (x = 0; x < filter_limit; x++) {
        bounding_values[-x - filter_limit] = -filter_limit + x;
        bounding_values[-x] = -x;
        bounding_values[x] = x;
        bounding_values[x + filter_limit] = filter_limit - x;
    }
1777
#endif
1778 1779

    for (plane = 0; plane < 3; plane++) {
M
Michael Niedermayer 已提交
1780 1781 1782 1783 1784
        int width           = s->fragment_width  >> !!plane;
        int height          = s->fragment_height >> !!plane;
        int fragment        = s->fragment_start        [plane];
        int stride          = s->current_frame.linesize[plane];
        uint8_t *plane_data = s->current_frame.data    [plane];
M
Michael Niedermayer 已提交
1785
        if (!s->flipped_image) stride = -stride;
1786 1787

        for (y = 0; y < height; y++) {
1788

1789
            for (x = 0; x < width; x++) {
M
Michael Niedermayer 已提交
1790
START_TIMER
1791 1792 1793 1794
                /* do not perform left edge filter for left columns frags */
                if ((x > 0) &&
                    (s->all_fragments[fragment].coding_method != MODE_COPY)) {
                    horizontal_filter(
M
Michael Niedermayer 已提交
1795
                        plane_data + s->all_fragments[fragment].first_pixel,
1796 1797 1798 1799 1800 1801 1802
                        stride, bounding_values);
                }

                /* do not perform top edge filter for top row fragments */
                if ((y > 0) &&
                    (s->all_fragments[fragment].coding_method != MODE_COPY)) {
                    vertical_filter(
M
Michael Niedermayer 已提交
1803
                        plane_data + s->all_fragments[fragment].first_pixel,
1804 1805 1806 1807 1808 1809 1810 1811 1812 1813
                        stride, bounding_values);
                }

                /* do not perform right edge filter for right column
                 * fragments or if right fragment neighbor is also coded
                 * in this frame (it will be filtered in next iteration) */
                if ((x < width - 1) &&
                    (s->all_fragments[fragment].coding_method != MODE_COPY) &&
                    (s->all_fragments[fragment + 1].coding_method == MODE_COPY)) {
                    horizontal_filter(
M
Michael Niedermayer 已提交
1814
                        plane_data + s->all_fragments[fragment + 1].first_pixel,
1815 1816 1817 1818 1819 1820 1821 1822 1823 1824
                        stride, bounding_values);
                }

                /* do not perform bottom edge filter for bottom row
                 * fragments or if bottom fragment neighbor is also coded
                 * in this frame (it will be filtered in the next row) */
                if ((y < height - 1) &&
                    (s->all_fragments[fragment].coding_method != MODE_COPY) &&
                    (s->all_fragments[fragment + width].coding_method == MODE_COPY)) {
                    vertical_filter(
M
Michael Niedermayer 已提交
1825
                        plane_data + s->all_fragments[fragment + width].first_pixel,
1826 1827 1828 1829
                        stride, bounding_values);
                }

                fragment++;
M
Michael Niedermayer 已提交
1830
STOP_TIMER("loop filter")
1831 1832 1833
            }
        }
    }
1834 1835
}

1836
/*
1837 1838 1839 1840
 * This function computes the first pixel addresses for each fragment.
 * This function needs to be invoked after the first frame is allocated
 * so that it has access to the plane strides.
 */
1841
static void vp3_calculate_pixel_addresses(Vp3DecodeContext *s)
1842 1843 1844 1845 1846 1847 1848 1849 1850
{

    int i, x, y;

    /* figure out the first pixel addresses for each of the fragments */
    /* Y plane */
    i = 0;
    for (y = s->fragment_height; y > 0; y--) {
        for (x = 0; x < s->fragment_width; x++) {
1851
            s->all_fragments[i++].first_pixel =
1852 1853 1854
                s->golden_frame.linesize[0] * y * FRAGMENT_PIXELS -
                    s->golden_frame.linesize[0] +
                    x * FRAGMENT_PIXELS;
1855
            debug_init("  fragment %d, first pixel @ %d\n",
1856 1857 1858 1859 1860
                i-1, s->all_fragments[i-1].first_pixel);
        }
    }

    /* U plane */
M
Michael Niedermayer 已提交
1861
    i = s->fragment_start[1];
1862 1863
    for (y = s->fragment_height / 2; y > 0; y--) {
        for (x = 0; x < s->fragment_width / 2; x++) {
1864
            s->all_fragments[i++].first_pixel =
1865 1866 1867
                s->golden_frame.linesize[1] * y * FRAGMENT_PIXELS -
                    s->golden_frame.linesize[1] +
                    x * FRAGMENT_PIXELS;
1868
            debug_init("  fragment %d, first pixel @ %d\n",
1869 1870 1871 1872 1873
                i-1, s->all_fragments[i-1].first_pixel);
        }
    }

    /* V plane */
M
Michael Niedermayer 已提交
1874
    i = s->fragment_start[2];
1875 1876
    for (y = s->fragment_height / 2; y > 0; y--) {
        for (x = 0; x < s->fragment_width / 2; x++) {
1877
            s->all_fragments[i++].first_pixel =
1878 1879 1880
                s->golden_frame.linesize[2] * y * FRAGMENT_PIXELS -
                    s->golden_frame.linesize[2] +
                    x * FRAGMENT_PIXELS;
1881
            debug_init("  fragment %d, first pixel @ %d\n",
1882 1883 1884 1885 1886
                i-1, s->all_fragments[i-1].first_pixel);
        }
    }
}

1887
/* FIXME: this should be merged with the above! */
1888
static void theora_calculate_pixel_addresses(Vp3DecodeContext *s)
1889 1890 1891 1892 1893 1894 1895 1896 1897
{

    int i, x, y;

    /* figure out the first pixel addresses for each of the fragments */
    /* Y plane */
    i = 0;
    for (y = 1; y <= s->fragment_height; y++) {
        for (x = 0; x < s->fragment_width; x++) {
1898
            s->all_fragments[i++].first_pixel =
1899 1900 1901
                s->golden_frame.linesize[0] * y * FRAGMENT_PIXELS -
                    s->golden_frame.linesize[0] +
                    x * FRAGMENT_PIXELS;
1902
            debug_init("  fragment %d, first pixel @ %d\n",
1903 1904 1905 1906 1907
                i-1, s->all_fragments[i-1].first_pixel);
        }
    }

    /* U plane */
M
Michael Niedermayer 已提交
1908
    i = s->fragment_start[1];
1909 1910
    for (y = 1; y <= s->fragment_height / 2; y++) {
        for (x = 0; x < s->fragment_width / 2; x++) {
1911
            s->all_fragments[i++].first_pixel =
1912 1913 1914
                s->golden_frame.linesize[1] * y * FRAGMENT_PIXELS -
                    s->golden_frame.linesize[1] +
                    x * FRAGMENT_PIXELS;
1915
            debug_init("  fragment %d, first pixel @ %d\n",
1916 1917 1918 1919 1920
                i-1, s->all_fragments[i-1].first_pixel);
        }
    }

    /* V plane */
M
Michael Niedermayer 已提交
1921
    i = s->fragment_start[2];
1922 1923
    for (y = 1; y <= s->fragment_height / 2; y++) {
        for (x = 0; x < s->fragment_width / 2; x++) {
1924
            s->all_fragments[i++].first_pixel =
1925 1926 1927
                s->golden_frame.linesize[2] * y * FRAGMENT_PIXELS -
                    s->golden_frame.linesize[2] +
                    x * FRAGMENT_PIXELS;
1928
            debug_init("  fragment %d, first pixel @ %d\n",
1929 1930 1931 1932 1933
                i-1, s->all_fragments[i-1].first_pixel);
        }
    }
}

1934 1935 1936 1937 1938 1939
/*
 * This is the ffmpeg/libavcodec API init function.
 */
static int vp3_decode_init(AVCodecContext *avctx)
{
    Vp3DecodeContext *s = avctx->priv_data;
1940
    int i, inter, plane;
1941 1942 1943 1944
    int c_width;
    int c_height;
    int y_superblock_count;
    int c_superblock_count;
1945

A
Alex Beregszaszi 已提交
1946
    if (avctx->codec_tag == MKTAG('V','P','3','0'))
1947
        s->version = 0;
A
Alex Beregszaszi 已提交
1948
    else
1949
        s->version = 1;
A
Alex Beregszaszi 已提交
1950

1951
    s->avctx = avctx;
1952 1953
    s->width = (avctx->width + 15) & 0xFFFFFFF0;
    s->height = (avctx->height + 15) & 0xFFFFFFF0;
1954 1955
    avctx->pix_fmt = PIX_FMT_YUV420P;
    avctx->has_b_frames = 0;
1956 1957
    if(avctx->idct_algo==FF_IDCT_AUTO)
        avctx->idct_algo=FF_IDCT_VP3;
1958
    dsputil_init(&s->dsp, avctx);
1959

M
Michael Niedermayer 已提交
1960
    ff_init_scantable(s->dsp.idct_permutation, &s->scantable, ff_zigzag_direct);
1961 1962 1963 1964 1965

    /* initialize to an impossible value which will force a recalculation
     * in the first frame decode */
    s->quality_index = -1;

1966 1967 1968 1969 1970 1971 1972 1973 1974 1975 1976 1977 1978 1979
    s->y_superblock_width = (s->width + 31) / 32;
    s->y_superblock_height = (s->height + 31) / 32;
    y_superblock_count = s->y_superblock_width * s->y_superblock_height;

    /* work out the dimensions for the C planes */
    c_width = s->width / 2;
    c_height = s->height / 2;
    s->c_superblock_width = (c_width + 31) / 32;
    s->c_superblock_height = (c_height + 31) / 32;
    c_superblock_count = s->c_superblock_width * s->c_superblock_height;

    s->superblock_count = y_superblock_count + (c_superblock_count * 2);
    s->u_superblock_start = y_superblock_count;
    s->v_superblock_start = s->u_superblock_start + c_superblock_count;
1980 1981 1982 1983 1984 1985 1986 1987 1988 1989 1990
    s->superblock_coding = av_malloc(s->superblock_count);

    s->macroblock_width = (s->width + 15) / 16;
    s->macroblock_height = (s->height + 15) / 16;
    s->macroblock_count = s->macroblock_width * s->macroblock_height;

    s->fragment_width = s->width / FRAGMENT_PIXELS;
    s->fragment_height = s->height / FRAGMENT_PIXELS;

    /* fragment count covers all 8x8 blocks for all 3 planes */
    s->fragment_count = s->fragment_width * s->fragment_height * 3 / 2;
M
Michael Niedermayer 已提交
1991 1992
    s->fragment_start[1] = s->fragment_width * s->fragment_height;
    s->fragment_start[2] = s->fragment_width * s->fragment_height * 5 / 4;
1993

1994 1995 1996 1997 1998 1999
    debug_init("  Y plane: %d x %d\n", s->width, s->height);
    debug_init("  C plane: %d x %d\n", c_width, c_height);
    debug_init("  Y superblocks: %d x %d, %d total\n",
        s->y_superblock_width, s->y_superblock_height, y_superblock_count);
    debug_init("  C superblocks: %d x %d, %d total\n",
        s->c_superblock_width, s->c_superblock_height, c_superblock_count);
2000
    debug_init("  total superblocks = %d, U starts @ %d, V starts @ %d\n",
2001
        s->superblock_count, s->u_superblock_start, s->v_superblock_start);
2002 2003 2004 2005 2006 2007
    debug_init("  macroblocks: %d x %d, %d total\n",
        s->macroblock_width, s->macroblock_height, s->macroblock_count);
    debug_init("  %d fragments, %d x %d, u starts @ %d, v starts @ %d\n",
        s->fragment_count,
        s->fragment_width,
        s->fragment_height,
M
Michael Niedermayer 已提交
2008 2009
        s->fragment_start[1],
        s->fragment_start[2]);
2010 2011

    s->all_fragments = av_malloc(s->fragment_count * sizeof(Vp3Fragment));
2012
    s->coeffs = av_malloc(s->fragment_count * sizeof(Coeff) * 65);
2013 2014 2015
    s->coded_fragment_list = av_malloc(s->fragment_count * sizeof(int));
    s->pixel_addresses_inited = 0;

2016 2017
    if (!s->theora_tables)
    {
M
cleanup  
Michael Niedermayer 已提交
2018
        for (i = 0; i < 64; i++) {
2019 2020
            s->coded_dc_scale_factor[i] = vp31_dc_scale_factor[i];
            s->coded_ac_scale_factor[i] = vp31_ac_scale_factor[i];
2021 2022 2023
            s->base_matrix[0][i] = vp31_intra_y_dequant[i];
            s->base_matrix[1][i] = vp31_intra_c_dequant[i];
            s->base_matrix[2][i] = vp31_inter_dequant[i];
2024
            s->filter_limit_values[i] = vp31_filter_limit_values[i];
M
cleanup  
Michael Niedermayer 已提交
2025
        }
2026

2027 2028 2029 2030 2031 2032 2033 2034 2035
        for(inter=0; inter<2; inter++){
            for(plane=0; plane<3; plane++){
                s->qr_count[inter][plane]= 1;
                s->qr_size [inter][plane][0]= 63;
                s->qr_base [inter][plane][0]=
                s->qr_base [inter][plane][1]= 2*inter + (!!plane)*!inter;
            }
        }

2036 2037 2038 2039 2040 2041 2042 2043 2044 2045 2046 2047 2048 2049 2050 2051 2052 2053 2054 2055 2056 2057 2058 2059 2060 2061 2062 2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073 2074 2075 2076 2077 2078 2079 2080 2081 2082 2083 2084 2085 2086 2087 2088 2089 2090 2091
        /* init VLC tables */
        for (i = 0; i < 16; i++) {

            /* DC histograms */
            init_vlc(&s->dc_vlc[i], 5, 32,
                &dc_bias[i][0][1], 4, 2,
                &dc_bias[i][0][0], 4, 2, 0);

            /* group 1 AC histograms */
            init_vlc(&s->ac_vlc_1[i], 5, 32,
                &ac_bias_0[i][0][1], 4, 2,
                &ac_bias_0[i][0][0], 4, 2, 0);

            /* group 2 AC histograms */
            init_vlc(&s->ac_vlc_2[i], 5, 32,
                &ac_bias_1[i][0][1], 4, 2,
                &ac_bias_1[i][0][0], 4, 2, 0);

            /* group 3 AC histograms */
            init_vlc(&s->ac_vlc_3[i], 5, 32,
                &ac_bias_2[i][0][1], 4, 2,
                &ac_bias_2[i][0][0], 4, 2, 0);

            /* group 4 AC histograms */
            init_vlc(&s->ac_vlc_4[i], 5, 32,
                &ac_bias_3[i][0][1], 4, 2,
                &ac_bias_3[i][0][0], 4, 2, 0);
        }
    } else {
        for (i = 0; i < 16; i++) {

            /* DC histograms */
            init_vlc(&s->dc_vlc[i], 5, 32,
                &s->huffman_table[i][0][1], 4, 2,
                &s->huffman_table[i][0][0], 4, 2, 0);

            /* group 1 AC histograms */
            init_vlc(&s->ac_vlc_1[i], 5, 32,
                &s->huffman_table[i+16][0][1], 4, 2,
                &s->huffman_table[i+16][0][0], 4, 2, 0);

            /* group 2 AC histograms */
            init_vlc(&s->ac_vlc_2[i], 5, 32,
                &s->huffman_table[i+16*2][0][1], 4, 2,
                &s->huffman_table[i+16*2][0][0], 4, 2, 0);

            /* group 3 AC histograms */
            init_vlc(&s->ac_vlc_3[i], 5, 32,
                &s->huffman_table[i+16*3][0][1], 4, 2,
                &s->huffman_table[i+16*3][0][0], 4, 2, 0);

            /* group 4 AC histograms */
            init_vlc(&s->ac_vlc_4[i], 5, 32,
                &s->huffman_table[i+16*4][0][1], 4, 2,
                &s->huffman_table[i+16*4][0][0], 4, 2, 0);
        }
2092 2093
    }

2094 2095 2096 2097
    init_vlc(&s->superblock_run_length_vlc, 6, 34,
        &superblock_run_length_vlc_table[0][1], 4, 2,
        &superblock_run_length_vlc_table[0][0], 4, 2, 0);

2098
    init_vlc(&s->fragment_run_length_vlc, 5, 30,
2099 2100 2101 2102 2103 2104 2105 2106 2107 2108 2109
        &fragment_run_length_vlc_table[0][1], 4, 2,
        &fragment_run_length_vlc_table[0][0], 4, 2, 0);

    init_vlc(&s->mode_code_vlc, 3, 8,
        &mode_code_vlc_table[0][1], 2, 1,
        &mode_code_vlc_table[0][0], 2, 1, 0);

    init_vlc(&s->motion_vector_vlc, 6, 63,
        &motion_vector_vlc_table[0][1], 2, 1,
        &motion_vector_vlc_table[0][0], 2, 1, 0);

2110 2111 2112 2113
    /* work out the block mapping tables */
    s->superblock_fragments = av_malloc(s->superblock_count * 16 * sizeof(int));
    s->superblock_macroblocks = av_malloc(s->superblock_count * 4 * sizeof(int));
    s->macroblock_fragments = av_malloc(s->macroblock_count * 6 * sizeof(int));
2114
    s->macroblock_coding = av_malloc(s->macroblock_count + 1);
2115 2116
    init_block_mapping(s);

2117 2118 2119 2120
    for (i = 0; i < 3; i++) {
        s->current_frame.data[i] = NULL;
        s->last_frame.data[i] = NULL;
        s->golden_frame.data[i] = NULL;
2121 2122
    }

2123 2124 2125 2126 2127 2128
    return 0;
}

/*
 * This is the ffmpeg/libavcodec API frame decode function.
 */
2129
static int vp3_decode_frame(AVCodecContext *avctx,
2130 2131 2132 2133 2134 2135
                            void *data, int *data_size,
                            uint8_t *buf, int buf_size)
{
    Vp3DecodeContext *s = avctx->priv_data;
    GetBitContext gb;
    static int counter = 0;
2136
    int i;
2137 2138

    init_get_bits(&gb, buf, buf_size * 8);
2139

2140 2141
    if (s->theora && get_bits1(&gb))
    {
2142
#if 1
2143 2144
        av_log(avctx, AV_LOG_ERROR, "Header packet passed to frame decoder, skipping\n");
        return -1;
2145
#else
2146 2147 2148 2149 2150 2151 2152
        int ptype = get_bits(&gb, 7);

        skip_bits(&gb, 6*8); /* "theora" */

        switch(ptype)
        {
            case 1:
2153
                theora_decode_comments(avctx, &gb);
2154 2155
                break;
            case 2:
2156
                theora_decode_tables(avctx, &gb);
2157 2158 2159 2160 2161 2162
                    init_dequantizer(s);
                break;
            default:
                av_log(avctx, AV_LOG_ERROR, "Unknown Theora config packet: %d\n", ptype);
        }
        return buf_size;
2163
#endif
2164
    }
A
Alex Beregszaszi 已提交
2165 2166 2167

    s->keyframe = !get_bits1(&gb);
    if (!s->theora)
2168
        skip_bits(&gb, 1);
A
Alex Beregszaszi 已提交
2169
    s->last_quality_index = s->quality_index;
2170 2171 2172 2173 2174 2175 2176

    s->nqis=0;
    do{
        s->qis[s->nqis++]= get_bits(&gb, 6);
    } while(s->theora >= 0x030200 && s->nqis<3 && get_bits1(&gb));

    s->quality_index= s->qis[0];
2177

2178
    if (s->avctx->debug & FF_DEBUG_PICT_INFO)
2179 2180
        av_log(s->avctx, AV_LOG_INFO, " VP3 %sframe #%d: Q index = %d\n",
            s->keyframe?"key":"", counter, s->quality_index);
2181 2182
    counter++;

2183
    if (s->quality_index != s->last_quality_index) {
2184
        init_dequantizer(s);
2185 2186
        init_loop_filter(s);
    }
2187

2188
    if (s->keyframe) {
2189 2190 2191 2192 2193 2194 2195 2196 2197 2198 2199 2200 2201 2202 2203 2204 2205
        if (!s->theora)
        {
            skip_bits(&gb, 4); /* width code */
            skip_bits(&gb, 4); /* height code */
            if (s->version)
            {
                s->version = get_bits(&gb, 5);
                if (counter == 1)
                    av_log(s->avctx, AV_LOG_DEBUG, "VP version: %d\n", s->version);
            }
        }
        if (s->version || s->theora)
        {
                if (get_bits1(&gb))
                    av_log(s->avctx, AV_LOG_ERROR, "Warning, unsupported keyframe coding type?!\n");
            skip_bits(&gb, 2); /* reserved? */
        }
A
Alex Beregszaszi 已提交
2206

2207 2208 2209
        if (s->last_frame.data[0] == s->golden_frame.data[0]) {
            if (s->golden_frame.data[0])
                avctx->release_buffer(avctx, &s->golden_frame);
2210
            s->last_frame= s->golden_frame; /* ensure that we catch any access to this released frame */
2211 2212 2213 2214 2215 2216
        } else {
            if (s->golden_frame.data[0])
                avctx->release_buffer(avctx, &s->golden_frame);
            if (s->last_frame.data[0])
                avctx->release_buffer(avctx, &s->last_frame);
        }
2217

2218
        s->golden_frame.reference = 3;
2219
        if(avctx->get_buffer(avctx, &s->golden_frame) < 0) {
2220
            av_log(s->avctx, AV_LOG_ERROR, "vp3: get_buffer() failed\n");
2221 2222 2223 2224
            return -1;
        }

        /* golden frame is also the current frame */
M
Michael Niedermayer 已提交
2225
        s->current_frame= s->golden_frame;
2226 2227 2228

        /* time to figure out pixel addresses? */
        if (!s->pixel_addresses_inited)
2229 2230 2231 2232 2233
        {
            if (!s->flipped_image)
                vp3_calculate_pixel_addresses(s);
            else
                theora_calculate_pixel_addresses(s);
2234
            s->pixel_addresses_inited = 1;
2235
        }
2236 2237
    } else {
        /* allocate a new current frame */
2238
        s->current_frame.reference = 3;
2239 2240 2241 2242
        if (!s->pixel_addresses_inited) {
            av_log(s->avctx, AV_LOG_ERROR, "vp3: first frame not a keyframe\n");
            return -1;
        }
2243
        if(avctx->get_buffer(avctx, &s->current_frame) < 0) {
2244
            av_log(s->avctx, AV_LOG_ERROR, "vp3: get_buffer() failed\n");
2245 2246 2247 2248
            return -1;
        }
    }

M
Michael Niedermayer 已提交
2249 2250 2251
    s->current_frame.qscale_table= s->qscale_table; //FIXME allocate individual tables per AVFrame
    s->current_frame.qstride= 0;

M
Michael Niedermayer 已提交
2252
    {START_TIMER
2253
    init_frame(s, &gb);
M
Michael Niedermayer 已提交
2254
    STOP_TIMER("init_frame")}
2255

2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266 2267 2268
#if KEYFRAMES_ONLY
if (!s->keyframe) {

    memcpy(s->current_frame.data[0], s->golden_frame.data[0],
        s->current_frame.linesize[0] * s->height);
    memcpy(s->current_frame.data[1], s->golden_frame.data[1],
        s->current_frame.linesize[1] * s->height / 2);
    memcpy(s->current_frame.data[2], s->golden_frame.data[2],
        s->current_frame.linesize[2] * s->height / 2);

} else {
#endif

M
Michael Niedermayer 已提交
2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281 2282 2283 2284 2285 2286 2287 2288 2289
    {START_TIMER
    if (unpack_superblocks(s, &gb)){
        av_log(s->avctx, AV_LOG_ERROR, "error in unpack_superblocks\n");
        return -1;
    }
    STOP_TIMER("unpack_superblocks")}
    {START_TIMER
    if (unpack_modes(s, &gb)){
        av_log(s->avctx, AV_LOG_ERROR, "error in unpack_modes\n");
        return -1;
    }
    STOP_TIMER("unpack_modes")}
    {START_TIMER
    if (unpack_vectors(s, &gb)){
        av_log(s->avctx, AV_LOG_ERROR, "error in unpack_vectors\n");
        return -1;
    }
    STOP_TIMER("unpack_vectors")}
    {START_TIMER
    if (unpack_dct_coeffs(s, &gb)){
        av_log(s->avctx, AV_LOG_ERROR, "error in unpack_dct_coeffs\n");
2290 2291
        return -1;
    }
M
Michael Niedermayer 已提交
2292 2293
    STOP_TIMER("unpack_dct_coeffs")}
    {START_TIMER
2294 2295

    reverse_dc_prediction(s, 0, s->fragment_width, s->fragment_height);
2296
    if ((avctx->flags & CODEC_FLAG_GRAY) == 0) {
M
Michael Niedermayer 已提交
2297
        reverse_dc_prediction(s, s->fragment_start[1],
2298
            s->fragment_width / 2, s->fragment_height / 2);
M
Michael Niedermayer 已提交
2299
        reverse_dc_prediction(s, s->fragment_start[2],
2300
            s->fragment_width / 2, s->fragment_height / 2);
2301 2302 2303 2304 2305 2306 2307
    }
    STOP_TIMER("reverse_dc_prediction")}
    {START_TIMER

    for (i = 0; i < s->macroblock_height; i++)
        render_slice(s, i);
    STOP_TIMER("render_fragments")}
2308

M
Michael Niedermayer 已提交
2309
    {START_TIMER
2310
    apply_loop_filter(s);
M
Michael Niedermayer 已提交
2311
    STOP_TIMER("apply_loop_filter")}
2312 2313 2314 2315
#if KEYFRAMES_ONLY
}
#endif

2316 2317 2318
    *data_size=sizeof(AVFrame);
    *(AVFrame*)data= s->current_frame;

2319 2320 2321 2322 2323
    /* release the last frame, if it is allocated and if it is not the
     * golden frame */
    if ((s->last_frame.data[0]) &&
        (s->last_frame.data[0] != s->golden_frame.data[0]))
        avctx->release_buffer(avctx, &s->last_frame);
2324

2325
    /* shuffle frames (last = current) */
M
Michael Niedermayer 已提交
2326
    s->last_frame= s->current_frame;
2327
    s->current_frame.data[0]= NULL; /* ensure that we catch any access to this released frame */
2328 2329 2330 2331 2332 2333 2334 2335 2336 2337 2338 2339

    return buf_size;
}

/*
 * This is the ffmpeg/libavcodec API module cleanup function.
 */
static int vp3_decode_end(AVCodecContext *avctx)
{
    Vp3DecodeContext *s = avctx->priv_data;

    av_free(s->all_fragments);
2340
    av_free(s->coeffs);
2341 2342 2343 2344
    av_free(s->coded_fragment_list);
    av_free(s->superblock_fragments);
    av_free(s->superblock_macroblocks);
    av_free(s->macroblock_fragments);
2345
    av_free(s->macroblock_coding);
2346

2347
    /* release all frames */
2348
    if (s->golden_frame.data[0] && s->golden_frame.data[0] != s->last_frame.data[0])
2349 2350 2351 2352 2353
        avctx->release_buffer(avctx, &s->golden_frame);
    if (s->last_frame.data[0])
        avctx->release_buffer(avctx, &s->last_frame);
    /* no need to release the current_frame since it will always be pointing
     * to the same frame as either the golden or last frame */
2354 2355 2356 2357

    return 0;
}

2358 2359 2360 2361 2362 2363 2364 2365 2366 2367 2368 2369 2370 2371 2372 2373 2374 2375 2376 2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389
static int read_huffman_tree(AVCodecContext *avctx, GetBitContext *gb)
{
    Vp3DecodeContext *s = avctx->priv_data;

    if (get_bits(gb, 1)) {
        int token;
        if (s->entries >= 32) { /* overflow */
            av_log(avctx, AV_LOG_ERROR, "huffman tree overflow\n");
            return -1;
        }
        token = get_bits(gb, 5);
        //av_log(avctx, AV_LOG_DEBUG, "hti %d hbits %x token %d entry : %d size %d\n", s->hti, s->hbits, token, s->entries, s->huff_code_size);
        s->huffman_table[s->hti][token][0] = s->hbits;
        s->huffman_table[s->hti][token][1] = s->huff_code_size;
        s->entries++;
    }
    else {
        if (s->huff_code_size >= 32) {/* overflow */
            av_log(avctx, AV_LOG_ERROR, "huffman tree overflow\n");
            return -1;
        }
        s->huff_code_size++;
        s->hbits <<= 1;
        read_huffman_tree(avctx, gb);
        s->hbits |= 1;
        read_huffman_tree(avctx, gb);
        s->hbits >>= 1;
        s->huff_code_size--;
    }
    return 0;
}

2390
static int theora_decode_header(AVCodecContext *avctx, GetBitContext *gb)
2391 2392
{
    Vp3DecodeContext *s = avctx->priv_data;
2393

2394
    s->theora = get_bits_long(gb, 24);
M
cleanup  
Michael Niedermayer 已提交
2395
    av_log(avctx, AV_LOG_INFO, "Theora bitstream version %X\n", s->theora);
2396

M
Matthieu Castet 已提交
2397
    /* 3.2.0 aka alpha3 has the same frame orientation as original vp3 */
2398
    /* but previous versions have the image flipped relative to vp3 */
M
Matthieu Castet 已提交
2399
    if (s->theora < 0x030200)
2400
    {
2401
        s->flipped_image = 1;
2402 2403
        av_log(avctx, AV_LOG_DEBUG, "Old (<alpha3) Theora bitstream, flipped image\n");
    }
2404

2405 2406
    s->width = get_bits(gb, 16) << 4;
    s->height = get_bits(gb, 16) << 4;
2407

2408
    if(avcodec_check_dimensions(avctx, s->width, s->height)){
2409
        av_log(avctx, AV_LOG_ERROR, "Invalid dimensions (%dx%d)\n", s->width, s->height);
2410 2411 2412
        s->width= s->height= 0;
        return -1;
    }
2413 2414 2415

    if (s->theora >= 0x030400)
    {
2416
        skip_bits(gb, 32); /* total number of superblocks in a frame */
2417
        // fixme, the next field is 36bits long
2418 2419 2420
        skip_bits(gb, 32); /* total number of blocks in a frame */
        skip_bits(gb, 4); /* total number of blocks in a frame */
        skip_bits(gb, 32); /* total number of macroblocks in a frame */
2421

2422 2423
        skip_bits(gb, 24); /* frame width */
        skip_bits(gb, 24); /* frame height */
2424 2425 2426
    }
    else
    {
2427 2428
        skip_bits(gb, 24); /* frame width */
        skip_bits(gb, 24); /* frame height */
2429
    }
2430

2431
  if (s->theora >= 0x030200) {
2432 2433
    skip_bits(gb, 8); /* offset x */
    skip_bits(gb, 8); /* offset y */
2434
  }
2435

2436 2437 2438 2439
    skip_bits(gb, 32); /* fps numerator */
    skip_bits(gb, 32); /* fps denumerator */
    skip_bits(gb, 24); /* aspect numerator */
    skip_bits(gb, 24); /* aspect denumerator */
2440

M
Matthieu Castet 已提交
2441
    if (s->theora < 0x030200)
2442 2443
        skip_bits(gb, 5); /* keyframe frequency force */
    skip_bits(gb, 8); /* colorspace */
2444
    if (s->theora >= 0x030400)
2445 2446
        skip_bits(gb, 2); /* pixel format: 420,res,422,444 */
    skip_bits(gb, 24); /* bitrate */
2447

2448
    skip_bits(gb, 6); /* quality hint */
2449

M
Matthieu Castet 已提交
2450
    if (s->theora >= 0x030200)
2451
    {
2452
        skip_bits(gb, 5); /* keyframe frequency force */
2453

2454
        if (s->theora < 0x030400)
2455
            skip_bits(gb, 5); /* spare bits */
2456
    }
2457

2458
//    align_get_bits(gb);
2459

2460 2461 2462 2463 2464 2465
    avctx->width = s->width;
    avctx->height = s->height;

    return 0;
}

2466
static int theora_decode_tables(AVCodecContext *avctx, GetBitContext *gb)
2467 2468
{
    Vp3DecodeContext *s = avctx->priv_data;
2469
    int i, n, matrices, inter, plane;
M
Matthieu Castet 已提交
2470 2471

    if (s->theora >= 0x030200) {
2472
        n = get_bits(gb, 3);
2473
        /* loop filter limit values table */
M
Matthieu Castet 已提交
2474
        for (i = 0; i < 64; i++)
2475
            s->filter_limit_values[i] = get_bits(gb, n);
M
Matthieu Castet 已提交
2476
    }
2477

M
Matthieu Castet 已提交
2478
    if (s->theora >= 0x030200)
2479
        n = get_bits(gb, 4) + 1;
M
Matthieu Castet 已提交
2480 2481
    else
        n = 16;
2482 2483
    /* quality threshold table */
    for (i = 0; i < 64; i++)
2484
        s->coded_ac_scale_factor[i] = get_bits(gb, n);
2485

M
Matthieu Castet 已提交
2486
    if (s->theora >= 0x030200)
2487
        n = get_bits(gb, 4) + 1;
M
Matthieu Castet 已提交
2488 2489
    else
        n = 16;
2490 2491
    /* dc scale factor table */
    for (i = 0; i < 64; i++)
2492
        s->coded_dc_scale_factor[i] = get_bits(gb, n);
2493

M
Matthieu Castet 已提交
2494
    if (s->theora >= 0x030200)
2495
        matrices = get_bits(gb, 9) + 1;
M
Matthieu Castet 已提交
2496
    else
2497
        matrices = 3;
2498

2499 2500 2501 2502
    if(matrices > 384){
        av_log(avctx, AV_LOG_ERROR, "invalid number of base matrixes\n");
        return -1;
    }
A
Alex Beregszaszi 已提交
2503

2504
    for(n=0; n<matrices; n++){
2505
        for (i = 0; i < 64; i++)
2506 2507
            s->base_matrix[n][i]= get_bits(gb, 8);
    }
2508

2509 2510 2511 2512
    for (inter = 0; inter <= 1; inter++) {
        for (plane = 0; plane <= 2; plane++) {
            int newqr= 1;
            if (inter || plane > 0)
2513
                newqr = get_bits(gb, 1);
2514
            if (!newqr) {
2515 2516 2517 2518 2519 2520 2521 2522 2523 2524 2525 2526 2527
                int qtj, plj;
                if(inter && get_bits(gb, 1)){
                    qtj = 0;
                    plj = plane;
                }else{
                    qtj= (3*inter + plane - 1) / 3;
                    plj= (plane + 2) % 3;
                }
                s->qr_count[inter][plane]= s->qr_count[qtj][plj];
                memcpy(s->qr_size[inter][plane], s->qr_size[qtj][plj], sizeof(s->qr_size[0][0]));
                memcpy(s->qr_base[inter][plane], s->qr_base[qtj][plj], sizeof(s->qr_base[0][0]));
            } else {
                int qri= 0;
2528
                int qi = 0;
2529 2530 2531 2532 2533 2534 2535 2536 2537 2538 2539 2540 2541

                for(;;){
                    i= get_bits(gb, av_log2(matrices-1)+1);
                    if(i>= matrices){
                        av_log(avctx, AV_LOG_ERROR, "invalid base matrix index\n");
                        return -1;
                    }
                    s->qr_base[inter][plane][qri]= i;
                    if(qi >= 63)
                        break;
                    i = get_bits(gb, av_log2(63-qi)+1) + 1;
                    s->qr_size[inter][plane][qri++]= i;
                    qi += i;
2542
                }
2543

2544
                if (qi > 63) {
2545
                    av_log(avctx, AV_LOG_ERROR, "invalid qi %d > 63\n", qi);
2546 2547
                    return -1;
                }
2548
                s->qr_count[inter][plane]= qri;
2549 2550 2551 2552
            }
        }
    }

2553
    /* Huffman tables */
2554 2555 2556
    for (s->hti = 0; s->hti < 80; s->hti++) {
        s->entries = 0;
        s->huff_code_size = 1;
2557
        if (!get_bits(gb, 1)) {
2558
            s->hbits = 0;
2559
            read_huffman_tree(avctx, gb);
2560
            s->hbits = 1;
2561
            read_huffman_tree(avctx, gb);
2562 2563
        }
    }
2564

2565
    s->theora_tables = 1;
2566

2567 2568 2569 2570 2571 2572 2573 2574
    return 0;
}

static int theora_decode_init(AVCodecContext *avctx)
{
    Vp3DecodeContext *s = avctx->priv_data;
    GetBitContext gb;
    int ptype;
2575 2576
    uint8_t *p= avctx->extradata;
    int op_bytes, i;
2577

2578 2579 2580
    s->theora = 1;

    if (!avctx->extradata_size)
2581 2582
    {
        av_log(avctx, AV_LOG_ERROR, "Missing extradata!\n");
2583
        return -1;
2584
    }
2585

2586 2587 2588 2589 2590 2591
  for(i=0;i<3;i++) {
    op_bytes = *(p++)<<8;
    op_bytes += *(p++);

    init_get_bits(&gb, p, op_bytes);
    p += op_bytes;
2592 2593 2594

    ptype = get_bits(&gb, 8);
    debug_vp3("Theora headerpacket type: %x\n", ptype);
2595

2596 2597 2598
     if (!(ptype & 0x80))
     {
        av_log(avctx, AV_LOG_ERROR, "Invalid extradata!\n");
2599
//        return -1;
2600
     }
2601 2602

    // FIXME: check for this aswell
2603
    skip_bits(&gb, 6*8); /* "theora" */
2604

2605 2606 2607
    switch(ptype)
    {
        case 0x80:
2608
            theora_decode_header(avctx, &gb);
2609 2610
                break;
        case 0x81:
2611
// FIXME: is this needed? it breaks sometimes
2612 2613 2614
//            theora_decode_comments(avctx, gb);
            break;
        case 0x82:
2615
            theora_decode_tables(avctx, &gb);
2616 2617 2618 2619
            break;
        default:
            av_log(avctx, AV_LOG_ERROR, "Unknown Theora config packet: %d\n", ptype&~0x80);
            break;
2620
    }
2621 2622
    if(8*op_bytes != get_bits_count(&gb))
        av_log(avctx, AV_LOG_ERROR, "%d bits left in packet %X\n", 8*op_bytes - get_bits_count(&gb), ptype);
2623 2624
    if (s->theora < 0x030200)
        break;
2625
  }
2626

M
Matthieu Castet 已提交
2627
    vp3_decode_init(avctx);
2628 2629 2630
    return 0;
}

2631 2632 2633 2634 2635 2636 2637 2638 2639 2640 2641 2642
AVCodec vp3_decoder = {
    "vp3",
    CODEC_TYPE_VIDEO,
    CODEC_ID_VP3,
    sizeof(Vp3DecodeContext),
    vp3_decode_init,
    NULL,
    vp3_decode_end,
    vp3_decode_frame,
    0,
    NULL
};
2643

2644
#ifndef CONFIG_LIBTHEORA
2645 2646 2647 2648 2649 2650 2651 2652 2653 2654 2655 2656
AVCodec theora_decoder = {
    "theora",
    CODEC_TYPE_VIDEO,
    CODEC_ID_THEORA,
    sizeof(Vp3DecodeContext),
    theora_decode_init,
    NULL,
    vp3_decode_end,
    vp3_decode_frame,
    0,
    NULL
};
2657
#endif