/*
 * The simplest mpeg encoder (well, it was the simplest!)
 * Copyright (c) 2000,2001 Fabrice Bellard
 * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at>
 *
 * 4MV & hq & B-frame encoding stuff by Michael Niedermayer <michaelni@gmx.at>
 *
 * This file is part of Libav.
 *
 * Libav is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * Libav is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with Libav; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * The simplest mpeg encoder (well, it was the simplest!).
 */

30
#include "libavutil/intmath.h"
31
#include "libavutil/imgutils.h"
F
Fabrice Bellard 已提交
32 33
#include "avcodec.h"
#include "dsputil.h"
34
#include "internal.h"
F
Fabrice Bellard 已提交
35
#include "mpegvideo.h"
B
Benoit Fouet 已提交
36
#include "mpegvideo_common.h"
37
#include "mjpegenc.h"
38
#include "msmpeg4.h"
M
Michael Niedermayer 已提交
39
#include "faandct.h"
40
#include "xvmc_internal.h"
41
#include <limits.h>
F
Fabrice Bellard 已提交
42

43 44
//#undef NDEBUG
//#include <assert.h>
45

46
static void dct_unquantize_mpeg1_intra_c(MpegEncContext *s,
47
                                   DCTELEM *block, int n, int qscale);
48
static void dct_unquantize_mpeg1_inter_c(MpegEncContext *s,
49
                                   DCTELEM *block, int n, int qscale);
50 51
static void dct_unquantize_mpeg2_intra_c(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale);
52 53
static void dct_unquantize_mpeg2_intra_bitexact(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale);
54 55
static void dct_unquantize_mpeg2_inter_c(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale);
56
static void dct_unquantize_h263_intra_c(MpegEncContext *s,
57
                                  DCTELEM *block, int n, int qscale);
58
static void dct_unquantize_h263_inter_c(MpegEncContext *s,
59
                                  DCTELEM *block, int n, int qscale);
M
Michael Niedermayer 已提交
60

F
Fabrice Bellard 已提交
61 62 63 64 65 66

/* enable all paranoid tests for rounding, overflows, etc... */
//#define PARANOID

//#define DEBUG

67

M
Michael Niedermayer 已提交
68 69 70 71 72
/* Identity mapping: entry i holds the value i for every index 0..31. */
static const uint8_t ff_default_chroma_qscale_table[32] = {
     0,  1,  2,  3,  4,  5,  6,  7,
     8,  9, 10, 11, 12, 13, 14, 15,
    16, 17, 18, 19, 20, 21, 22, 23,
    24, 25, 26, 27, 28, 29, 30, 31,
};

73 74 75 76 77 78 79 80
/* 128-entry table in which every entry is 8. */
const uint8_t ff_mpeg1_dc_scale_table[128] = {
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
};

81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104
/* 128-entry table in which every entry is 4. */
static const uint8_t mpeg2_dc_scale_table1[128] = {
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
};

/* 128-entry table in which every entry is 2. */
static const uint8_t mpeg2_dc_scale_table2[128] = {
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
};

/* 128-entry table in which every entry is 1. */
static const uint8_t mpeg2_dc_scale_table3[128] = {
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
};

105
const uint8_t * const ff_mpeg2_dc_scale_table[4]={
106 107 108 109 110 111
    ff_mpeg1_dc_scale_table,
    mpeg2_dc_scale_table1,
    mpeg2_dc_scale_table2,
    mpeg2_dc_scale_table3,
};

112
const enum PixelFormat ff_pixfmt_list_420[] = {
113 114 115 116 117
    PIX_FMT_YUV420P,
    PIX_FMT_NONE
};

const enum PixelFormat ff_hwaccel_pixfmt_list_420[] = {
L
Laurent Aimar 已提交
118
    PIX_FMT_DXVA2_VLD,
119
    PIX_FMT_VAAPI_VLD,
120 121 122
    PIX_FMT_YUV420P,
    PIX_FMT_NONE
};
123

M
Michael Niedermayer 已提交
124 125 126
/**
 * Search [p, end) for a 00 00 01 start code prefix.
 *
 * @param p     first byte to examine; must not be past end
 * @param end   one past the last byte of the buffer
 * @param state rolling 32-bit window of the most recent bytes; read on entry
 *              so a prefix split across two calls is still detected, and
 *              updated before every return except the empty-input one
 * @return end if the input is empty, otherwise a pointer just past the last
 *         byte that was folded into *state
 */
const uint8_t *ff_find_start_code(const uint8_t * restrict p, const uint8_t *end, uint32_t * restrict state){
    int n;

    assert(p<=end);
    if(p>=end)
        return end;

    /* Push the first three bytes through *state one at a time. When the
     * shifted window equals 0x100 the three bytes before the one just
     * consumed were 00 00 01. */
    for(n=0; n<3; n++){
        const uint32_t shifted= *state << 8;
        *state= shifted + *(p++);
        if(shifted == 0x100 || p==end)
            return p;
    }

    /* From here p[-1], p[-2] and p[-3] all lie inside the buffer. Each
     * branch advances by the largest step that cannot skip a 00 00 01. */
    while(p<end){
        if(p[-1] > 1){
            p+= 3;
        }else if(p[-2]){
            p+= 2;
        }else if(p[-3]|(p[-1]-1)){
            p++;
        }else{
            /* p[-3..-1] == 00 00 01: step onto the byte after the prefix */
            p++;
            break;
        }
    }

    /* The stride above may overshoot end; clamp, then reload the window
     * with the last four bytes (big-endian). */
    p= FFMIN(p, end)-4;
    *state= AV_RB32(p);

    return p+4;
}

154
/* init common dct for both encoder and decoder */
155
av_cold int ff_dct_common_init(MpegEncContext *s)
F
Fabrice Bellard 已提交
156
{
157 158 159 160 161
    s->dct_unquantize_h263_intra = dct_unquantize_h263_intra_c;
    s->dct_unquantize_h263_inter = dct_unquantize_h263_inter_c;
    s->dct_unquantize_mpeg1_intra = dct_unquantize_mpeg1_intra_c;
    s->dct_unquantize_mpeg1_inter = dct_unquantize_mpeg1_inter_c;
    s->dct_unquantize_mpeg2_intra = dct_unquantize_mpeg2_intra_c;
162 163
    if(s->flags & CODEC_FLAG_BITEXACT)
        s->dct_unquantize_mpeg2_intra = dct_unquantize_mpeg2_intra_bitexact;
164
    s->dct_unquantize_mpeg2_inter = dct_unquantize_mpeg2_inter_c;
165

166
#if   HAVE_MMX
167
    MPV_common_init_mmx(s);
168
#elif ARCH_ALPHA
169
    MPV_common_init_axp(s);
170
#elif CONFIG_MLIB
171
    MPV_common_init_mlib(s);
172
#elif HAVE_MMI
173
    MPV_common_init_mmi(s);
174
#elif ARCH_ARM
M
Måns Rullgård 已提交
175
    MPV_common_init_arm(s);
176
#elif HAVE_ALTIVEC
177
    MPV_common_init_altivec(s);
178
#elif ARCH_BFIN
179 180
    MPV_common_init_bfin(s);
#endif
181

182
    /* load & permutate scantables
183
       note: only wmv uses different ones
184
    */
M
Michael Niedermayer 已提交
185 186 187 188 189 190 191
    if(s->alternate_scan){
        ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable  , ff_alternate_vertical_scan);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable  , ff_alternate_vertical_scan);
    }else{
        ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable  , ff_zigzag_direct);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable  , ff_zigzag_direct);
    }
M
Michael Niedermayer 已提交
192 193
    ff_init_scantable(s->dsp.idct_permutation, &s->intra_h_scantable, ff_alternate_horizontal_scan);
    ff_init_scantable(s->dsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
194

195 196 197
    return 0;
}

198
/**
 * Copy *src into *dst by struct assignment and mark the destination as
 * FF_BUFFER_TYPE_COPY. Every pointer member is copied as-is.
 */
void ff_copy_picture(Picture *dst, Picture *src)
{
    *dst      = *src;
    dst->type = FF_BUFFER_TYPE_COPY;
}

203
/**
 * Release a frame buffer: hand the picture back through the codec context's
 * release_buffer() callback, then free its hwaccel private data.
 */
static void free_frame_buffer(MpegEncContext *s, Picture *pic)
{
    AVFrame *frame = (AVFrame*)pic;

    s->avctx->release_buffer(s->avctx, frame);
    av_freep(&pic->hwaccel_picture_private);
}

/**
 * Allocate a frame buffer through the codec context's get_buffer() callback.
 *
 * When a hwaccel with a non-zero priv_data_size is active, its zeroed
 * per-picture private data is allocated first. The result of get_buffer()
 * is then checked, and the strides must match those already recorded in the
 * context (if any) and be equal for both chroma planes.
 *
 * @return 0 on success, -1 on failure
 */
static int alloc_frame_buffer(MpegEncContext *s, Picture *pic)
{
    int ret;

    if (s->avctx->hwaccel) {
        const int priv_size = s->avctx->hwaccel->priv_data_size;

        assert(!pic->hwaccel_picture_private);
        if (priv_size) {
            pic->hwaccel_picture_private = av_mallocz(priv_size);
            if (!pic->hwaccel_picture_private) {
                av_log(s->avctx, AV_LOG_ERROR, "alloc_frame_buffer() failed (hwaccel private data allocation)\n");
                return -1;
            }
        }
    }

    ret = s->avctx->get_buffer(s->avctx, (AVFrame*)pic);

    /* the callback must also have filled in age, type and data[0] */
    if (ret < 0 || !pic->age || !pic->type || !pic->data[0]) {
        av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed (%d %d %d %p)\n", ret, pic->age, pic->type, pic->data[0]);
        av_freep(&pic->hwaccel_picture_private);
        return -1;
    }

    /* a zero s->linesize means no stride has been recorded yet */
    if (s->linesize) {
        if (s->linesize != pic->linesize[0] || s->uvlinesize != pic->linesize[1]) {
            av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed (stride changed)\n");
            free_frame_buffer(s, pic);
            return -1;
        }
    }

    if (pic->linesize[1] != pic->linesize[2]) {
        av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed (uv stride mismatch)\n");
        free_frame_buffer(s, pic);
        return -1;
    }

    return 0;
}

M
cleanup  
Michael Niedermayer 已提交
253
/**
M
Michael Niedermayer 已提交
254 255
 * allocates a Picture
 * The pixels are allocated/set by calling get_buffer() if shared=0
M
cleanup  
Michael Niedermayer 已提交
256
 */
257
int ff_alloc_picture(MpegEncContext *s, Picture *pic, int shared){
D
Diego Biurrun 已提交
258
    const int big_mb_num= s->mb_stride*(s->mb_height+1) + 1; //the +1 is needed so memset(,,stride*height) does not sig11
259
    const int mb_array_size= s->mb_stride*s->mb_height;
260 261
    const int b8_array_size= s->b8_stride*s->mb_height*2;
    const int b4_array_size= s->b4_stride*s->mb_height*4;
M
Michael Niedermayer 已提交
262
    int i;
D
Daniel Kristjansson 已提交
263
    int r= -1;
264

M
Michael Niedermayer 已提交
265 266 267 268 269 270
    if(shared){
        assert(pic->data[0]);
        assert(pic->type == 0 || pic->type == FF_BUFFER_TYPE_SHARED);
        pic->type= FF_BUFFER_TYPE_SHARED;
    }else{
        assert(!pic->data[0]);
271

272
        if (alloc_frame_buffer(s, pic) < 0)
M
Michael Niedermayer 已提交
273 274 275 276
            return -1;

        s->linesize  = pic->linesize[0];
        s->uvlinesize= pic->linesize[1];
M
cleanup  
Michael Niedermayer 已提交
277
    }
278

M
Michael Niedermayer 已提交
279
    if(pic->qscale_table==NULL){
280
        if (s->encoding) {
281 282 283
            FF_ALLOCZ_OR_GOTO(s->avctx, pic->mb_var   , mb_array_size * sizeof(int16_t)  , fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, pic->mc_mb_var, mb_array_size * sizeof(int16_t)  , fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, pic->mb_mean  , mb_array_size * sizeof(int8_t )  , fail)
M
Michael Niedermayer 已提交
284
        }
M
cleanup  
Michael Niedermayer 已提交
285

286 287 288
        FF_ALLOCZ_OR_GOTO(s->avctx, pic->mbskip_table , mb_array_size * sizeof(uint8_t)+2, fail) //the +2 is for the slice end check
        FF_ALLOCZ_OR_GOTO(s->avctx, pic->qscale_table , mb_array_size * sizeof(uint8_t)  , fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, pic->mb_type_base , (big_mb_num + s->mb_stride) * sizeof(uint32_t), fail)
289
        pic->mb_type= pic->mb_type_base + 2*s->mb_stride+1;
M
Michael Niedermayer 已提交
290 291
        if(s->out_format == FMT_H264){
            for(i=0; i<2; i++){
292
                FF_ALLOCZ_OR_GOTO(s->avctx, pic->motion_val_base[i], 2 * (b4_array_size+4)  * sizeof(int16_t), fail)
M
Michael Niedermayer 已提交
293
                pic->motion_val[i]= pic->motion_val_base[i]+4;
294
                FF_ALLOCZ_OR_GOTO(s->avctx, pic->ref_index[i], 4*mb_array_size * sizeof(uint8_t), fail)
295
            }
M
Michael Niedermayer 已提交
296
            pic->motion_subsample_log2= 2;
297
        }else if(s->out_format == FMT_H263 || s->encoding || (s->avctx->debug&FF_DEBUG_MV) || (s->avctx->debug_mv)){
298
            for(i=0; i<2; i++){
299
                FF_ALLOCZ_OR_GOTO(s->avctx, pic->motion_val_base[i], 2 * (b8_array_size+4) * sizeof(int16_t), fail)
M
Michael Niedermayer 已提交
300
                pic->motion_val[i]= pic->motion_val_base[i]+4;
301
                FF_ALLOCZ_OR_GOTO(s->avctx, pic->ref_index[i], 4*mb_array_size * sizeof(uint8_t), fail)
M
Michael Niedermayer 已提交
302
            }
M
Michael Niedermayer 已提交
303
            pic->motion_subsample_log2= 3;
M
Michael Niedermayer 已提交
304
        }
305
        if(s->avctx->debug&FF_DEBUG_DCT_COEFF) {
306
            FF_ALLOCZ_OR_GOTO(s->avctx, pic->dct_coeff, 64 * mb_array_size * sizeof(DCTELEM)*6, fail)
307
        }
308
        pic->qstride= s->mb_stride;
309
        FF_ALLOCZ_OR_GOTO(s->avctx, pic->pan_scan , 1 * sizeof(AVPanScan), fail)
M
Michael Niedermayer 已提交
310
    }
M
Michael Niedermayer 已提交
311

D
Diego Biurrun 已提交
312 313
    /* It might be nicer if the application would keep track of these
     * but it would require an API change. */
314
    memmove(s->prev_pict_types+1, s->prev_pict_types, PREV_PICT_TYPES_BUFFER_SIZE-1);
315 316
    s->prev_pict_types[0]= s->dropable ? AV_PICTURE_TYPE_B : s->pict_type;
    if(pic->age < PREV_PICT_TYPES_BUFFER_SIZE && s->prev_pict_types[pic->age] == AV_PICTURE_TYPE_B)
D
Diego Biurrun 已提交
317
        pic->age= INT_MAX; // Skipped MBs in B-frames are quite rare in MPEG-1/2 and it is a bit tricky to skip them anyway.
318

M
cleanup  
Michael Niedermayer 已提交
319
    return 0;
320
fail: //for the FF_ALLOCZ_OR_GOTO macro
D
Daniel Kristjansson 已提交
321
    if(r>=0)
322
        free_frame_buffer(s, pic);
M
cleanup  
Michael Niedermayer 已提交
323 324 325
    return -1;
}

M
Michael Niedermayer 已提交
326 327 328
/**
 * deallocates a picture
 */
M
cleanup  
Michael Niedermayer 已提交
329 330
static void free_picture(MpegEncContext *s, Picture *pic){
    int i;
M
Michael Niedermayer 已提交
331 332

    if(pic->data[0] && pic->type!=FF_BUFFER_TYPE_SHARED){
333
        free_frame_buffer(s, pic);
M
Michael Niedermayer 已提交
334 335
    }

M
cleanup  
Michael Niedermayer 已提交
336 337 338 339 340
    av_freep(&pic->mb_var);
    av_freep(&pic->mc_mb_var);
    av_freep(&pic->mb_mean);
    av_freep(&pic->mbskip_table);
    av_freep(&pic->qscale_table);
M
Michael Niedermayer 已提交
341
    av_freep(&pic->mb_type_base);
342
    av_freep(&pic->dct_coeff);
343
    av_freep(&pic->pan_scan);
M
Michael Niedermayer 已提交
344 345
    pic->mb_type= NULL;
    for(i=0; i<2; i++){
346
        av_freep(&pic->motion_val_base[i]);
M
Michael Niedermayer 已提交
347 348
        av_freep(&pic->ref_index[i]);
    }
349

350
    if(pic->type == FF_BUFFER_TYPE_SHARED){
M
Michael Niedermayer 已提交
351 352 353 354
        for(i=0; i<4; i++){
            pic->base[i]=
            pic->data[i]= NULL;
        }
355
        pic->type= 0;
M
cleanup  
Michael Niedermayer 已提交
356 357 358
    }
}

359
/**
 * Allocate the scratch buffers held separately by each thread context
 * (edge emulation buffer, ME scratchpad, block storage and, depending on
 * mode, ME maps, noise-reduction sums and AC prediction values).
 *
 * @param s    context to set up
 * @param base not used by this function
 * @return 0 on success, -1 on allocation failure; nothing is freed here on
 *         failure, cleanup is left to MPV_common_end()
 */
static int init_duplicate_context(MpegEncContext *s, MpegEncContext *base)
{
    int n;

    // edge emu needs blocksize + filter length - 1 (=17x17 for halfpel / 21x21 for h264)
    FF_ALLOCZ_OR_GOTO(s->avctx, s->allocated_edge_emu_buffer, (s->width+64)*2*21*2, fail); //(width + edge + align)*interlaced*MBsize*tolerance
    /* the usable pointer starts halfway into the allocation */
    s->edge_emu_buffer = s->allocated_edge_emu_buffer + (s->width+64)*2*21;

    //FIXME should be linesize instead of s->width*2 but that is not known before get_buffer()
    FF_ALLOCZ_OR_GOTO(s->avctx, s->me.scratchpad, (s->width+64)*4*16*2*sizeof(uint8_t), fail);
    /* all of these alias the one scratchpad allocation */
    s->me.temp         = s->me.scratchpad;
    s->rd_scratchpad   = s->me.scratchpad;
    s->b_scratchpad    = s->me.scratchpad;
    s->obmc_scratchpad = s->me.scratchpad + 16;

    if (s->encoding) {
        FF_ALLOCZ_OR_GOTO(s->avctx, s->me.map      , ME_MAP_SIZE*sizeof(uint32_t), fail);
        FF_ALLOCZ_OR_GOTO(s->avctx, s->me.score_map, ME_MAP_SIZE*sizeof(uint32_t), fail);
        if (s->avctx->noise_reduction) {
            FF_ALLOCZ_OR_GOTO(s->avctx, s->dct_error_sum, 2 * 64 * sizeof(int), fail);
        }
    }

    FF_ALLOCZ_OR_GOTO(s->avctx, s->blocks, 64*12*2 * sizeof(DCTELEM), fail);
    s->block = s->blocks[0];
    for (n = 0; n < 12; n++)
        s->pblocks[n] = &s->block[n];

    if (s->out_format == FMT_H263) {
        const int y_size  = s->b8_stride * (2 * s->mb_height + 1);
        const int c_size  = s->mb_stride * (s->mb_height + 1);
        const int yc_size = y_size + 2 * c_size;

        /* ac values */
        FF_ALLOCZ_OR_GOTO(s->avctx, s->ac_val_base, yc_size * sizeof(int16_t) * 16, fail);
        s->ac_val[0] = s->ac_val_base + s->b8_stride + 1;
        s->ac_val[1] = s->ac_val_base + y_size + s->mb_stride + 1;
        s->ac_val[2] = s->ac_val[1] + c_size;
    }

    return 0;
fail:
    return -1; //free() through MPV_common_end()
}

/**
 * Free the buffers allocated by init_duplicate_context() and clear every
 * pointer that aliased them. A NULL context is accepted and ignored.
 */
static void free_duplicate_context(MpegEncContext *s)
{
    if (!s)
        return;

    av_freep(&s->allocated_edge_emu_buffer);
    s->edge_emu_buffer = NULL;

    av_freep(&s->me.scratchpad);
    /* these all pointed into the scratchpad just freed */
    s->me.temp         = NULL;
    s->rd_scratchpad   = NULL;
    s->b_scratchpad    = NULL;
    s->obmc_scratchpad = NULL;

    av_freep(&s->dct_error_sum);
    av_freep(&s->me.map);
    av_freep(&s->me.score_map);
    av_freep(&s->blocks);
    av_freep(&s->ac_val_base);
    s->block = NULL;
}

/**
 * Copy the fields listed below from src to bak; all other members of bak
 * are left untouched. Used by ff_update_duplicate_context() to carry these
 * fields across a whole-struct copy.
 */
static void backup_duplicate_context(MpegEncContext *bak, MpegEncContext *src)
{
#define KEEP(field) bak->field = src->field
    /* scratch buffers and the pointers into them */
    KEEP(allocated_edge_emu_buffer);
    KEEP(edge_emu_buffer);
    KEEP(me.scratchpad);
    KEEP(me.temp);
    KEEP(rd_scratchpad);
    KEEP(b_scratchpad);
    KEEP(obmc_scratchpad);
    KEEP(me.map);
    KEEP(me.score_map);
    KEEP(blocks);
    KEEP(block);
    /* macroblock row range and remaining state */
    KEEP(start_mb_y);
    KEEP(end_mb_y);
    KEEP(me.map_generation);
    KEEP(pb);
    KEEP(dct_error_sum);
    KEEP(dct_count[0]);
    KEEP(dct_count[1]);
    KEEP(ac_val_base);
    KEEP(ac_val[0]);
    KEEP(ac_val[1]);
    KEEP(ac_val[2]);
#undef KEEP
}

447
/**
 * Overwrite dst with a byte copy of src while preserving the fields of dst
 * that backup_duplicate_context() lists, then re-point dst->pblocks at
 * dst's own block storage.
 */
void ff_update_duplicate_context(MpegEncContext *dst, MpegEncContext *src)
{
    MpegEncContext saved;
    int n;

    //FIXME copy only needed parts
    backup_duplicate_context(&saved, dst);   /* stash dst's own fields */
    memcpy(dst, src, sizeof(MpegEncContext));
    backup_duplicate_context(dst, &saved);   /* and put them back */

    /* pblocks was copied from src and still points at src's blocks */
    for (n = 0; n < 12; n++)
        dst->pblocks[n] = &dst->block[n];
    /* timing note kept from the original: about 10k cycles / 0.01 sec for
     * 1000frames on 1ghz with 2 threads */
}

M
Michael Niedermayer 已提交
461 462 463 464
/**
 * sets the given MpegEncContext to common defaults (same for encoding and decoding).
 * the changed fields will not depend upon the prior state of the MpegEncContext.
 */
B
Benoit Fouet 已提交
465
void MPV_common_defaults(MpegEncContext *s){
M
Michael Niedermayer 已提交
466 467 468 469 470 471 472 473 474 475 476 477
    s->y_dc_scale_table=
    s->c_dc_scale_table= ff_mpeg1_dc_scale_table;
    s->chroma_qscale_table= ff_default_chroma_qscale_table;
    s->progressive_frame= 1;
    s->progressive_sequence= 1;
    s->picture_structure= PICT_FRAME;

    s->coded_picture_number = 0;
    s->picture_number = 0;
    s->input_picture_number = 0;

    s->picture_in_gop_number = 0;
478 479 480

    s->f_code = 1;
    s->b_code = 1;
M
Michael Niedermayer 已提交
481 482 483 484 485 486 487 488 489 490
}

/**
 * Set the given MpegEncContext to defaults for decoding.
 * The changed fields will not depend upon the prior state of the MpegEncContext.
 * At present this only forwards to MPV_common_defaults().
 */
void MPV_decode_defaults(MpegEncContext *s){
    MPV_common_defaults(s);
}

491
/**
M
Michael Niedermayer 已提交
492 493 494
 * init common structure for both encoder and decoder.
 * this assumes that some variables like width/height are already set
 */
495
av_cold int MPV_common_init(MpegEncContext *s)
496
{
497
    int y_size, c_size, yc_size, i, mb_array_size, mv_table_size, x, y, threads;
498

499 500
    if(s->codec_id == CODEC_ID_MPEG2VIDEO && !s->progressive_sequence)
        s->mb_height = (s->height + 31) / 32 * 2;
501
    else if (s->codec_id != CODEC_ID_H264)
B
Baptiste Coudurier 已提交
502
        s->mb_height = (s->height + 15) / 16;
L
Loren Merritt 已提交
503

504 505 506 507 508
    if(s->avctx->pix_fmt == PIX_FMT_NONE){
        av_log(s->avctx, AV_LOG_ERROR, "decoding to PIX_FMT_NONE is not supported.\n");
        return -1;
    }

L
Loren Merritt 已提交
509
    if(s->avctx->thread_count > MAX_THREADS || (s->avctx->thread_count > s->mb_height && s->mb_height)){
M
10l  
Michael Niedermayer 已提交
510 511 512 513
        av_log(s->avctx, AV_LOG_ERROR, "too many threads\n");
        return -1;
    }

514
    if((s->width || s->height) && av_image_check_size(s->width, s->height, 0, s->avctx))
515 516
        return -1;

517
    dsputil_init(&s->dsp, s->avctx);
518
    ff_dct_common_init(s);
519

520
    s->flags= s->avctx->flags;
521
    s->flags2= s->avctx->flags2;
522

523
    if (s->width && s->height) {
R
Ronald S. Bultje 已提交
524 525 526 527 528 529
        s->mb_width  = (s->width  + 15) / 16;
        s->mb_stride = s->mb_width + 1;
        s->b8_stride = s->mb_width*2 + 1;
        s->b4_stride = s->mb_width*4 + 1;
        mb_array_size= s->mb_height * s->mb_stride;
        mv_table_size= (s->mb_height+2) * s->mb_stride + 1;
530

R
Ronald S. Bultje 已提交
531 532 533
        /* set chroma shifts */
        avcodec_get_chroma_sub_sample(s->avctx->pix_fmt,&(s->chroma_x_shift),
                                      &(s->chroma_y_shift) );
534

R
Ronald S. Bultje 已提交
535 536 537
        /* set default edge pos, will be overriden in decode_header if needed */
        s->h_edge_pos= s->mb_width*16;
        s->v_edge_pos= s->mb_height*16;
538

R
Ronald S. Bultje 已提交
539
        s->mb_num = s->mb_width * s->mb_height;
540

R
Ronald S. Bultje 已提交
541 542 543 544 545 546
        s->block_wrap[0]=
        s->block_wrap[1]=
        s->block_wrap[2]=
        s->block_wrap[3]= s->b8_stride;
        s->block_wrap[4]=
        s->block_wrap[5]= s->mb_stride;
547

R
Ronald S. Bultje 已提交
548 549 550
        y_size = s->b8_stride * (2 * s->mb_height + 1);
        c_size = s->mb_stride * (s->mb_height + 1);
        yc_size = y_size + 2 * c_size;
551

R
Ronald S. Bultje 已提交
552 553
        /* convert fourcc to upper case */
        s->codec_tag = ff_toupper4(s->avctx->codec_tag);
554

R
Ronald S. Bultje 已提交
555
        s->stream_codec_tag = ff_toupper4(s->avctx->stream_codec_tag);
556

R
Ronald S. Bultje 已提交
557
        s->avctx->coded_frame= (AVFrame*)&s->current_picture;
558

R
Ronald S. Bultje 已提交
559 560 561 562 563
        FF_ALLOCZ_OR_GOTO(s->avctx, s->mb_index2xy, (s->mb_num+1)*sizeof(int), fail) //error ressilience code looks cleaner with this
        for(y=0; y<s->mb_height; y++){
            for(x=0; x<s->mb_width; x++){
                s->mb_index2xy[ x + y*s->mb_width ] = x + y*s->mb_stride;
            }
564
        }
R
Ronald S. Bultje 已提交
565
        s->mb_index2xy[ s->mb_height*s->mb_width ] = (s->mb_height-1)*s->mb_stride + s->mb_width; //FIXME really needed?
566

R
Ronald S. Bultje 已提交
567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585
        if (s->encoding) {
            /* Allocate MV tables */
            FF_ALLOCZ_OR_GOTO(s->avctx, s->p_mv_table_base            , mv_table_size * 2 * sizeof(int16_t), fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, s->b_forw_mv_table_base       , mv_table_size * 2 * sizeof(int16_t), fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, s->b_back_mv_table_base       , mv_table_size * 2 * sizeof(int16_t), fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, s->b_bidir_forw_mv_table_base , mv_table_size * 2 * sizeof(int16_t), fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, s->b_bidir_back_mv_table_base , mv_table_size * 2 * sizeof(int16_t), fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, s->b_direct_mv_table_base     , mv_table_size * 2 * sizeof(int16_t), fail)
            s->p_mv_table           = s->p_mv_table_base            + s->mb_stride + 1;
            s->b_forw_mv_table      = s->b_forw_mv_table_base       + s->mb_stride + 1;
            s->b_back_mv_table      = s->b_back_mv_table_base       + s->mb_stride + 1;
            s->b_bidir_forw_mv_table= s->b_bidir_forw_mv_table_base + s->mb_stride + 1;
            s->b_bidir_back_mv_table= s->b_bidir_back_mv_table_base + s->mb_stride + 1;
            s->b_direct_mv_table    = s->b_direct_mv_table_base     + s->mb_stride + 1;

            if(s->msmpeg4_version){
                FF_ALLOCZ_OR_GOTO(s->avctx, s->ac_stats, 2*2*(MAX_LEVEL+1)*(MAX_RUN+1)*2*sizeof(int), fail);
            }
            FF_ALLOCZ_OR_GOTO(s->avctx, s->avctx->stats_out, 256, fail);
586

R
Ronald S. Bultje 已提交
587 588
            /* Allocate MB type table */
            FF_ALLOCZ_OR_GOTO(s->avctx, s->mb_type  , mb_array_size * sizeof(uint16_t), fail) //needed for encoding
589

R
Ronald S. Bultje 已提交
590
            FF_ALLOCZ_OR_GOTO(s->avctx, s->lambda_table, mb_array_size * sizeof(int), fail)
591

R
Ronald S. Bultje 已提交
592 593 594 595 596 597
            FF_ALLOCZ_OR_GOTO(s->avctx, s->q_intra_matrix  , 64*32   * sizeof(int), fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, s->q_inter_matrix  , 64*32   * sizeof(int), fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, s->q_intra_matrix16, 64*32*2 * sizeof(uint16_t), fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, s->q_inter_matrix16, 64*32*2 * sizeof(uint16_t), fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, s->input_picture, MAX_PICTURE_COUNT * sizeof(Picture*), fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, s->reordered_input_picture, MAX_PICTURE_COUNT * sizeof(Picture*), fail)
598

R
Ronald S. Bultje 已提交
599 600 601
            if(s->avctx->noise_reduction){
                FF_ALLOCZ_OR_GOTO(s->avctx, s->dct_offset, 2 * 64 * sizeof(uint16_t), fail)
            }
602
        }
603
    }
604

605
    FF_ALLOCZ_OR_GOTO(s->avctx, s->picture, MAX_PICTURE_COUNT * sizeof(Picture), fail)
606 607 608
    for(i = 0; i < MAX_PICTURE_COUNT; i++) {
        avcodec_get_frame_defaults((AVFrame *)&s->picture[i]);
    }
609

610
    if (s->width && s->height) {
R
Ronald S. Bultje 已提交
611
        FF_ALLOCZ_OR_GOTO(s->avctx, s->error_status_table, mb_array_size*sizeof(uint8_t), fail)
612

R
Ronald S. Bultje 已提交
613 614
        if(s->codec_id==CODEC_ID_MPEG4 || (s->flags & CODEC_FLAG_INTERLACED_ME)){
            /* interlaced direct mode decoding tables */
M
Michael Niedermayer 已提交
615 616 617 618
            for(i=0; i<2; i++){
                int j, k;
                for(j=0; j<2; j++){
                    for(k=0; k<2; k++){
619 620
                        FF_ALLOCZ_OR_GOTO(s->avctx,    s->b_field_mv_table_base[i][j][k], mv_table_size * 2 * sizeof(int16_t), fail)
                        s->b_field_mv_table[i][j][k] = s->b_field_mv_table_base[i][j][k] + s->mb_stride + 1;
M
Michael Niedermayer 已提交
621
                    }
622 623 624
                    FF_ALLOCZ_OR_GOTO(s->avctx, s->b_field_select_table [i][j], mb_array_size * 2 * sizeof(uint8_t), fail)
                    FF_ALLOCZ_OR_GOTO(s->avctx, s->p_field_mv_table_base[i][j], mv_table_size * 2 * sizeof(int16_t), fail)
                    s->p_field_mv_table[i][j] = s->p_field_mv_table_base[i][j]+ s->mb_stride + 1;
M
Michael Niedermayer 已提交
625
                }
626
                FF_ALLOCZ_OR_GOTO(s->avctx, s->p_field_select_table[i], mb_array_size * 2 * sizeof(uint8_t), fail)
M
Michael Niedermayer 已提交
627
            }
R
Ronald S. Bultje 已提交
628 629 630 631 632 633 634 635 636 637
        }
        if (s->out_format == FMT_H263) {
            /* cbp values */
            FF_ALLOCZ_OR_GOTO(s->avctx, s->coded_block_base, y_size, fail);
            s->coded_block= s->coded_block_base + s->b8_stride + 1;

            /* cbp, ac_pred, pred_dir */
            FF_ALLOCZ_OR_GOTO(s->avctx, s->cbp_table     , mb_array_size * sizeof(uint8_t), fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, s->pred_dir_table, mb_array_size * sizeof(uint8_t), fail)
        }
638

R
Ronald S. Bultje 已提交
639 640 641 642 643 644 645 646 647 648
        if (s->h263_pred || s->h263_plus || !s->encoding) {
            /* dc values */
            //MN: we need these for error resilience of intra-frames
            FF_ALLOCZ_OR_GOTO(s->avctx, s->dc_val_base, yc_size * sizeof(int16_t), fail);
            s->dc_val[0] = s->dc_val_base + s->b8_stride + 1;
            s->dc_val[1] = s->dc_val_base + y_size + s->mb_stride + 1;
            s->dc_val[2] = s->dc_val[1] + c_size;
            for(i=0;i<yc_size;i++)
                s->dc_val_base[i] = 1024;
        }
649

R
Ronald S. Bultje 已提交
650 651 652
        /* which mb is a intra block */
        FF_ALLOCZ_OR_GOTO(s->avctx, s->mbintra_table, mb_array_size, fail);
        memset(s->mbintra_table, 1, mb_array_size);
653

R
Ronald S. Bultje 已提交
654 655 656 657
        /* init macroblock skip table */
        FF_ALLOCZ_OR_GOTO(s->avctx, s->mbskip_table, mb_array_size+2, fail);
        //Note the +1 is for a quicker mpeg4 slice_end detection
        FF_ALLOCZ_OR_GOTO(s->avctx, s->prev_pict_types, PREV_PICT_TYPES_BUFFER_SIZE, fail);
658

R
Ronald S. Bultje 已提交
659 660 661 662 663 664
        s->parse_context.state= -1;
        if((s->avctx->debug&(FF_DEBUG_VIS_QP|FF_DEBUG_VIS_MB_TYPE)) || (s->avctx->debug_mv)){
            s->visualization_buffer[0] = av_malloc((s->mb_width*16 + 2*EDGE_WIDTH) * s->mb_height*16 + 2*EDGE_WIDTH);
            s->visualization_buffer[1] = av_malloc((s->mb_width*16 + 2*EDGE_WIDTH) * s->mb_height*16 + 2*EDGE_WIDTH);
            s->visualization_buffer[2] = av_malloc((s->mb_width*16 + 2*EDGE_WIDTH) * s->mb_height*16 + 2*EDGE_WIDTH);
        }
665
    }
666

F
Fabrice Bellard 已提交
667
    s->context_initialized = 1;
668

669
    if (s->width && s->height) {
R
Ronald S. Bultje 已提交
670 671
        s->thread_context[0]= s;
        threads = s->avctx->thread_count;
672

R
Ronald S. Bultje 已提交
673 674 675 676
        for(i=1; i<threads; i++){
            s->thread_context[i]= av_malloc(sizeof(MpegEncContext));
            memcpy(s->thread_context[i], s, sizeof(MpegEncContext));
        }
677

R
Ronald S. Bultje 已提交
678 679 680 681 682 683
        for(i=0; i<threads; i++){
            if(init_duplicate_context(s->thread_context[i], s) < 0)
                goto fail;
            s->thread_context[i]->start_mb_y= (s->mb_height*(i  ) + s->avctx->thread_count/2) / s->avctx->thread_count;
            s->thread_context[i]->end_mb_y  = (s->mb_height*(i+1) + s->avctx->thread_count/2) / s->avctx->thread_count;
        }
684 685
    }

F
Fabrice Bellard 已提交
686 687
    return 0;
 fail:
688
    MPV_common_end(s);
F
Fabrice Bellard 已提交
689 690 691 692 693 694
    return -1;
}

/* free common structure for both encoder and decoder */
void MPV_common_end(MpegEncContext *s)
{
M
Michael Niedermayer 已提交
695
    int i, j, k;
F
Fabrice Bellard 已提交
696

697 698 699 700 701 702 703
    for(i=0; i<s->avctx->thread_count; i++){
        free_duplicate_context(s->thread_context[i]);
    }
    for(i=1; i<s->avctx->thread_count; i++){
        av_freep(&s->thread_context[i]);
    }

704 705 706
    av_freep(&s->parse_context.buffer);
    s->parse_context.buffer_size=0;

707
    av_freep(&s->mb_type);
708 709 710 711 712 713 714 715 716 717 718 719
    av_freep(&s->p_mv_table_base);
    av_freep(&s->b_forw_mv_table_base);
    av_freep(&s->b_back_mv_table_base);
    av_freep(&s->b_bidir_forw_mv_table_base);
    av_freep(&s->b_bidir_back_mv_table_base);
    av_freep(&s->b_direct_mv_table_base);
    s->p_mv_table= NULL;
    s->b_forw_mv_table= NULL;
    s->b_back_mv_table= NULL;
    s->b_bidir_forw_mv_table= NULL;
    s->b_bidir_back_mv_table= NULL;
    s->b_direct_mv_table= NULL;
M
Michael Niedermayer 已提交
720 721 722 723 724 725 726 727 728 729 730 731
    for(i=0; i<2; i++){
        for(j=0; j<2; j++){
            for(k=0; k<2; k++){
                av_freep(&s->b_field_mv_table_base[i][j][k]);
                s->b_field_mv_table[i][j][k]=NULL;
            }
            av_freep(&s->b_field_select_table[i][j]);
            av_freep(&s->p_field_mv_table_base[i][j]);
            s->p_field_mv_table[i][j]=NULL;
        }
        av_freep(&s->p_field_select_table[i]);
    }
732

733 734
    av_freep(&s->dc_val_base);
    av_freep(&s->coded_block_base);
735
    av_freep(&s->mbintra_table);
736 737
    av_freep(&s->cbp_table);
    av_freep(&s->pred_dir_table);
738

739
    av_freep(&s->mbskip_table);
740
    av_freep(&s->prev_pict_types);
741
    av_freep(&s->bitstream_buffer);
742 743
    s->allocated_bitstream_buffer_size=0;

M
Michael Niedermayer 已提交
744
    av_freep(&s->avctx->stats_out);
745
    av_freep(&s->ac_stats);
746
    av_freep(&s->error_status_table);
747
    av_freep(&s->mb_index2xy);
748
    av_freep(&s->lambda_table);
749 750
    av_freep(&s->q_intra_matrix);
    av_freep(&s->q_inter_matrix);
751 752
    av_freep(&s->q_intra_matrix16);
    av_freep(&s->q_inter_matrix16);
753 754
    av_freep(&s->input_picture);
    av_freep(&s->reordered_input_picture);
755
    av_freep(&s->dct_offset);
M
cleanup  
Michael Niedermayer 已提交
756

M
Michael Niedermayer 已提交
757 758 759 760
    if(s->picture){
        for(i=0; i<MAX_PICTURE_COUNT; i++){
            free_picture(s, &s->picture[i]);
        }
F
Fabrice Bellard 已提交
761
    }
762
    av_freep(&s->picture);
F
Fabrice Bellard 已提交
763
    s->context_initialized = 0;
764 765 766
    s->last_picture_ptr=
    s->next_picture_ptr=
    s->current_picture_ptr= NULL;
M
Michael Niedermayer 已提交
767
    s->linesize= s->uvlinesize= 0;
768

769
    for(i=0; i<3; i++)
770
        av_freep(&s->visualization_buffer[i]);
M
Michael Niedermayer 已提交
771 772

    avcodec_default_free_buffers(s->avctx);
F
Fabrice Bellard 已提交
773 774
}

775
/**
 * Build the max_level[], max_run[] and index_run[] lookup tables of a
 * run-level table, once for the "not last" codes and once for the "last"
 * codes.
 *
 * @param rl           run-level table; table_run, table_level, last and n
 *                     are read, max_level/max_run/index_run are filled in
 * @param static_store optional backing storage for the generated tables.
 *                     When NULL, each table is allocated with av_malloc().
 *                     When non-NULL and rl->max_level[0] is already set,
 *                     the function returns without doing anything.
 */
void init_rl(RLTable *rl, uint8_t static_store[2][2*MAX_RUN + MAX_LEVEL + 3])
{
    int8_t  level_max[MAX_RUN + 1], run_max[MAX_LEVEL + 1];
    uint8_t first_index[MAX_RUN + 1];
    int last;

    /* A statically stored table only needs to be initialized once. */
    if (static_store && rl->max_level[0])
        return;

    for (last = 0; last < 2; last++) {
        /* Codes [0, rl->last) are the "not last" ones, [rl->last, rl->n)
         * the "last" ones. */
        const int start = last ? rl->last : 0;
        const int end   = last ? rl->n    : rl->last;
        int i;

        memset(level_max,   0,     sizeof(level_max));
        memset(run_max,     0,     sizeof(run_max));
        /* rl->n marks "no code seen yet for this run". */
        memset(first_index, rl->n, sizeof(first_index));

        for (i = start; i < end; i++) {
            const int run   = rl->table_run[i];
            const int level = rl->table_level[i];

            if (first_index[run] == rl->n)
                first_index[run] = i;
            if (level > level_max[run])
                level_max[run] = level;
            if (run > run_max[level])
                run_max[level] = run;
        }

        /* Layout inside static_store[last]: max_level at offset 0, max_run
         * at MAX_RUN + 1, index_run at MAX_RUN + MAX_LEVEL + 2. */
        rl->max_level[last] = static_store ? (void *)static_store[last]
                                           : av_malloc(MAX_RUN + 1);
        memcpy(rl->max_level[last], level_max, MAX_RUN + 1);

        rl->max_run[last] = static_store ? (void *)(static_store[last] + MAX_RUN + 1)
                                         : av_malloc(MAX_LEVEL + 1);
        memcpy(rl->max_run[last], run_max, MAX_LEVEL + 1);

        rl->index_run[last] = static_store ? (void *)(static_store[last] + MAX_RUN + MAX_LEVEL + 2)
                                           : av_malloc(MAX_RUN + 1);
        memcpy(rl->index_run[last], first_index, MAX_RUN + 1);
    }
}

826
/**
 * Fill rl->rl_vlc[q][] for every q in 0..31 from the entries of
 * rl->vlc.table, storing len, level and run for each entry.
 *
 * For regular codes the level is table_level * qmul + qadd, where
 * qmul = 2*q and qadd = (q-1)|1, except for q == 0 which uses qmul = 1 and
 * qadd = 0.
 */
void init_vlc_rl(RLTable *rl)
{
    int q;

    for (q = 0; q < 32; q++) {
        const int qmul = q ? q * 2       : 1;
        const int qadd = q ? (q - 1) | 1 : 0;
        int i;

        for (i = 0; i < rl->vlc.table_size; i++) {
            const int code = rl->vlc.table[i][0];
            const int len  = rl->vlc.table[i][1];
            int run, level;

            if (len == 0) {
                /* illegal code */
                run   = 66;
                level = MAX_LEVEL;
            } else if (len < 0) {
                /* more bits needed */
                run   = 0;
                level = code;
            } else if (code == rl->n) {
                /* escape */
                run   = 66;
                level = 0;
            } else {
                run   = rl->table_run[code] + 1;
                level = rl->table_level[code] * qmul + qadd;
                /* codes at or beyond rl->last get 192 added to run */
                if (code >= rl->last)
                    run += 192;
            }

            rl->rl_vlc[q][i].len   = len;
            rl->rl_vlc[q][i].level = level;
            rl->rl_vlc[q][i].run   = run;
        }
    }
}

M
Michael Niedermayer 已提交
866
/**
 * Find a slot of s->picture[] whose data[0] is NULL.
 *
 * @param s      codec context
 * @param shared if non-zero, only slots with type == 0 qualify; otherwise
 *               slots with type != 0 are preferred and any free slot is
 *               taken as a fallback
 * @return index of the slot; the function aborts instead of returning when
 *         no slot is free
 */
int ff_find_unused_picture(MpegEncContext *s, int shared)
{
    int idx;

    if (shared) {
        for (idx = 0; idx < MAX_PICTURE_COUNT; idx++) {
            if (!s->picture[idx].data[0] && s->picture[idx].type == 0)
                return idx;
        }
    } else {
        /* first pass: free slots that already carry a type (FIXME) */
        for (idx = 0; idx < MAX_PICTURE_COUNT; idx++) {
            if (!s->picture[idx].data[0] && s->picture[idx].type != 0)
                return idx;
        }
        /* second pass: any free slot */
        for (idx = 0; idx < MAX_PICTURE_COUNT; idx++) {
            if (!s->picture[idx].data[0])
                return idx;
        }
    }

    av_log(s->avctx, AV_LOG_FATAL, "Internal error, picture buffer overflow\n");
    /* We could return -1, but the codec would crash trying to draw into a
     * non-existing frame anyway; aborting here is safer than waiting for a
     * random crash. The return value would never be useful either: an
     * encoder must only allocate as much as the specification allows, which
     * is unrelated to how much libavcodec could allocate (MAX_PICTURE_COUNT
     * is always large enough for valid streams). A decoder has to check
     * stream validity and remove frames if too many reference frames are
     * around; waiting for "OOM" is not correct at all. Similarly, missing
     * reference frames have to be replaced by interpolated/MC frames;
     * anything else is a bug in the codec.
     */
    abort();
    return -1; /* not reached */
}

898 899 900 901 902 903 904 905 906 907
/**
 * Recompute s->dct_offset[][] from the accumulated DCT error sums, for the
 * inter (index 0) and intra (index 1) statistics alike.
 *
 * When a counter has grown past 1<<16, the counter and all 64 of its error
 * sums are halved before the offsets are derived.
 */
static void update_noise_reduction(MpegEncContext *s)
{
    int intra;

    for (intra = 0; intra < 2; intra++) {
        int coef;

        if (s->dct_count[intra] > (1 << 16)) {
            for (coef = 0; coef < 64; coef++)
                s->dct_error_sum[intra][coef] >>= 1;
            s->dct_count[intra] >>= 1;
        }

        /* offset = (noise_reduction * count + sum/2) / (sum + 1);
         * the +1 keeps the divisor non-zero for an empty sum. */
        for (coef = 0; coef < 64; coef++) {
            s->dct_offset[intra][coef] =
                (s->avctx->noise_reduction * s->dct_count[intra] + s->dct_error_sum[intra][coef]/2)
                / (s->dct_error_sum[intra][coef]+1);
        }
    }
}

M
Michael Niedermayer 已提交
915 916 917
/**
 * generic function for encode/decode called after coding/decoding the header and before a frame is coded/decoded
 */
918
int MPV_frame_start(MpegEncContext *s, AVCodecContext *avctx)
F
Fabrice Bellard 已提交
919
{
M
Michael Niedermayer 已提交
920
    int i;
921
    Picture *pic;
922
    s->mb_skipped = 0;
M
Michael Niedermayer 已提交
923

M
Michael Niedermayer 已提交
924
    assert(s->last_picture_ptr==NULL || s->out_format != FMT_H264 || s->codec_id == CODEC_ID_SVQ3);
M
Michael Niedermayer 已提交
925

M
cleanup  
Michael Niedermayer 已提交
926
    /* mark&release old frames */
927
    if (s->pict_type != AV_PICTURE_TYPE_B && s->last_picture_ptr && s->last_picture_ptr != s->next_picture_ptr && s->last_picture_ptr->data[0]) {
928
      if(s->out_format != FMT_H264 || s->codec_id == CODEC_ID_SVQ3){
929
          free_frame_buffer(s, s->last_picture_ptr);
M
cleanup  
Michael Niedermayer 已提交
930 931 932 933 934

        /* release forgotten pictures */
        /* if(mpeg124/h263) */
        if(!s->encoding){
            for(i=0; i<MAX_PICTURE_COUNT; i++){
M
Michael Niedermayer 已提交
935
                if(s->picture[i].data[0] && &s->picture[i] != s->next_picture_ptr && s->picture[i].reference){
936
                    av_log(avctx, AV_LOG_ERROR, "releasing zombie picture\n");
937
                    free_frame_buffer(s, &s->picture[i]);
M
cleanup  
Michael Niedermayer 已提交
938 939
                }
            }
940
        }
941
      }
942
    }
943

944
    if(!s->encoding){
D
Diego Biurrun 已提交
945
        /* release non reference frames */
M
Michael Niedermayer 已提交
946 947
        for(i=0; i<MAX_PICTURE_COUNT; i++){
            if(s->picture[i].data[0] && !s->picture[i].reference /*&& s->picture[i].type!=FF_BUFFER_TYPE_SHARED*/){
948
                free_frame_buffer(s, &s->picture[i]);
M
Michael Niedermayer 已提交
949 950 951
            }
        }

M
Michael Niedermayer 已提交
952
        if(s->current_picture_ptr && s->current_picture_ptr->data[0]==NULL)
953
            pic= s->current_picture_ptr; //we already have a unused image (maybe it was set before reading the header)
M
Michael Niedermayer 已提交
954 955
        else{
            i= ff_find_unused_picture(s, 0);
956
            pic= &s->picture[i];
M
Michael Niedermayer 已提交
957 958
        }

959 960 961 962
        pic->reference= 0;
        if (!s->dropable){
            if (s->codec_id == CODEC_ID_H264)
                pic->reference = s->picture_structure;
963
            else if (s->pict_type != AV_PICTURE_TYPE_B)
964 965
                pic->reference = 3;
        }
M
Michael Niedermayer 已提交
966

M
Michael Niedermayer 已提交
967
        pic->coded_picture_number= s->coded_picture_number++;
968

969
        if(ff_alloc_picture(s, pic, 0) < 0)
970
            return -1;
971

972
        s->current_picture_ptr= pic;
973
        //FIXME use only the vars from current_pic
974
        s->current_picture_ptr->top_field_first= s->top_field_first;
975
        if(s->codec_id == CODEC_ID_MPEG1VIDEO || s->codec_id == CODEC_ID_MPEG2VIDEO) {
976
            if(s->picture_structure != PICT_FRAME)
977
                s->current_picture_ptr->top_field_first= (s->picture_structure == PICT_TOP_FIELD) == s->first_field;
978
        }
979
        s->current_picture_ptr->interlaced_frame= !s->progressive_frame && !s->progressive_sequence;
M
cleanup  
Michael Niedermayer 已提交
980
    }
981

M
Michael Niedermayer 已提交
982
    s->current_picture_ptr->pict_type= s->pict_type;
983
//    if(s->flags && CODEC_FLAG_QSCALE)
984
  //      s->current_picture_ptr->quality= s->new_picture_ptr->quality;
985
    s->current_picture_ptr->key_frame= s->pict_type == AV_PICTURE_TYPE_I;
M
Michael Niedermayer 已提交
986

987
    ff_copy_picture(&s->current_picture, s->current_picture_ptr);
988

989
    if (s->pict_type != AV_PICTURE_TYPE_B) {
M
Michael Niedermayer 已提交
990
        s->last_picture_ptr= s->next_picture_ptr;
991 992
        if(!s->dropable)
            s->next_picture_ptr= s->current_picture_ptr;
F
Fabrice Bellard 已提交
993
    }
994
/*    av_log(s->avctx, AV_LOG_DEBUG, "L%p N%p C%p L%p N%p C%p type:%d drop:%d\n", s->last_picture_ptr, s->next_picture_ptr,s->current_picture_ptr,
995 996
        s->last_picture_ptr    ? s->last_picture_ptr->data[0] : NULL,
        s->next_picture_ptr    ? s->next_picture_ptr->data[0] : NULL,
997 998
        s->current_picture_ptr ? s->current_picture_ptr->data[0] : NULL,
        s->pict_type, s->dropable);*/
999

1000
    if(s->codec_id != CODEC_ID_H264){
1001 1002 1003 1004 1005 1006 1007
        if((s->last_picture_ptr==NULL || s->last_picture_ptr->data[0]==NULL) &&
           (s->pict_type!=AV_PICTURE_TYPE_I || s->picture_structure != PICT_FRAME)){
            if (s->pict_type != AV_PICTURE_TYPE_I)
                av_log(avctx, AV_LOG_ERROR, "warning: first frame is no keyframe\n");
            else if (s->picture_structure != PICT_FRAME)
                av_log(avctx, AV_LOG_INFO, "allocate dummy last picture for field based first keyframe\n");

1008 1009 1010 1011 1012 1013
            /* Allocate a dummy frame */
            i= ff_find_unused_picture(s, 0);
            s->last_picture_ptr= &s->picture[i];
            if(ff_alloc_picture(s, s->last_picture_ptr, 0) < 0)
                return -1;
        }
1014
        if((s->next_picture_ptr==NULL || s->next_picture_ptr->data[0]==NULL) && s->pict_type==AV_PICTURE_TYPE_B){
1015 1016 1017 1018 1019 1020 1021 1022
            /* Allocate a dummy frame */
            i= ff_find_unused_picture(s, 0);
            s->next_picture_ptr= &s->picture[i];
            if(ff_alloc_picture(s, s->next_picture_ptr, 0) < 0)
                return -1;
        }
    }

1023 1024
    if(s->last_picture_ptr) ff_copy_picture(&s->last_picture, s->last_picture_ptr);
    if(s->next_picture_ptr) ff_copy_picture(&s->next_picture, s->next_picture_ptr);
1025

1026
    assert(s->pict_type == AV_PICTURE_TYPE_I || (s->last_picture_ptr && s->last_picture_ptr->data[0]));
1027

1028
    if(s->picture_structure!=PICT_FRAME && s->out_format != FMT_H264){
M
Michael Niedermayer 已提交
1029 1030 1031 1032
        int i;
        for(i=0; i<4; i++){
            if(s->picture_structure == PICT_BOTTOM_FIELD){
                 s->current_picture.data[i] += s->current_picture.linesize[i];
1033
            }
M
Michael Niedermayer 已提交
1034 1035 1036 1037 1038
            s->current_picture.linesize[i] *= 2;
            s->last_picture.linesize[i] *=2;
            s->next_picture.linesize[i] *=2;
        }
    }
1039

1040
    s->error_recognition= avctx->error_recognition;
1041

D
Diego Biurrun 已提交
1042
    /* set dequantizer, we can't do it during init as it might change for mpeg4
D
Diego Biurrun 已提交
1043
       and we can't do it in the header decode as init is not called for mpeg4 there yet */
1044 1045 1046
    if(s->mpeg_quant || s->codec_id == CODEC_ID_MPEG2VIDEO){
        s->dct_unquantize_intra = s->dct_unquantize_mpeg2_intra;
        s->dct_unquantize_inter = s->dct_unquantize_mpeg2_inter;
M
Maarten Daniels 已提交
1047
    }else if(s->out_format == FMT_H263 || s->out_format == FMT_H261){
1048 1049 1050 1051 1052 1053
        s->dct_unquantize_intra = s->dct_unquantize_h263_intra;
        s->dct_unquantize_inter = s->dct_unquantize_h263_inter;
    }else{
        s->dct_unquantize_intra = s->dct_unquantize_mpeg1_intra;
        s->dct_unquantize_inter = s->dct_unquantize_mpeg1_inter;
    }
1054

1055 1056 1057 1058 1059
    if(s->dct_error_sum){
        assert(s->avctx->noise_reduction && s->encoding);

        update_noise_reduction(s);
    }
1060

1061
    if(CONFIG_MPEG_XVMC_DECODER && s->avctx->xvmc_acceleration)
1062
        return ff_xvmc_field_start(s, avctx);
1063

1064
    return 0;
F
Fabrice Bellard 已提交
1065
}
1066

F
Fabrice Bellard 已提交
1067 1068 1069
/**
 * Generic per-frame teardown for encoders and decoders, called after a
 * frame has been coded/decoded.
 *
 * Finishes the XvMC field or draws the picture edges, records the picture
 * type and quality of the frame just processed, releases non-reference
 * frames when encoding and publishes the current picture as
 * avctx->coded_frame.
 */
void MPV_frame_end(MpegEncContext *s)
{
    int i;

    if (CONFIG_MPEG_XVMC_DECODER && s->avctx->xvmc_acceleration) {
        /* just to make sure that all data is rendered */
        ff_xvmc_field_end(s);
    } else if (!s->avctx->hwaccel &&
               !(s->avctx->codec->capabilities & CODEC_CAP_HWACCEL_VDPAU) &&
               s->unrestricted_mv &&
               s->current_picture.reference &&
               !s->intra_only &&
               !(s->flags & CODEC_FLAG_EMU_EDGE)) {
        /* draw edges for correct motion prediction if outside */
        s->dsp.draw_edges(s->current_picture.data[0], s->linesize,
                          s->h_edge_pos, s->v_edge_pos,
                          EDGE_WIDTH, EDGE_TOP | EDGE_BOTTOM);
        /* both chroma planes use half the position and edge width */
        for (i = 1; i <= 2; i++) {
            s->dsp.draw_edges(s->current_picture.data[i], s->uvlinesize,
                              s->h_edge_pos >> 1, s->v_edge_pos >> 1,
                              EDGE_WIDTH / 2, EDGE_TOP | EDGE_BOTTOM);
        }
    }
    emms_c();

    s->last_pict_type                = s->pict_type;
    s->last_lambda_for[s->pict_type] = s->current_picture_ptr->quality;
    if (s->pict_type != AV_PICTURE_TYPE_B)
        s->last_non_b_pict_type = s->pict_type;

    if (s->encoding) {
        /* release non-reference frames */
        for (i = 0; i < MAX_PICTURE_COUNT; i++) {
            if (s->picture[i].data[0] && !s->picture[i].reference)
                free_frame_buffer(s, &s->picture[i]);
        }
    }

    s->avctx->coded_frame = (AVFrame*)s->current_picture_ptr;
}

1126 1127 1128 1129 1130 1131 1132 1133
/**
 * draws an line from (ex, ey) -> (sx, sy).
 * @param w width of the image
 * @param h height of the image
 * @param stride stride/linesize of the image
 * @param color color of the arrow
 */
static void draw_line(uint8_t *buf, int sx, int sy, int ex, int ey, int w, int h, int stride, int color){
M
SWAP  
Michael Niedermayer 已提交
1134
    int x, y, fr, f;
1135

1136 1137 1138 1139
    sx= av_clip(sx, 0, w-1);
    sy= av_clip(sy, 0, h-1);
    ex= av_clip(ex, 0, w-1);
    ey= av_clip(ey, 0, h-1);
1140

1141
    buf[sy*stride + sx]+= color;
1142

D
Diego Biurrun 已提交
1143
    if(FFABS(ex - sx) > FFABS(ey - sy)){
1144
        if(sx > ex){
D
Diego Biurrun 已提交
1145 1146
            FFSWAP(int, sx, ex);
            FFSWAP(int, sy, ey);
1147 1148 1149 1150 1151
        }
        buf+= sx + sy*stride;
        ex-= sx;
        f= ((ey-sy)<<16)/ex;
        for(x= 0; x <= ex; x++){
1152 1153 1154 1155
            y = (x*f)>>16;
            fr= (x*f)&0xFFFF;
            buf[ y   *stride + x]+= (color*(0x10000-fr))>>16;
            buf[(y+1)*stride + x]+= (color*         fr )>>16;
1156 1157 1158
        }
    }else{
        if(sy > ey){
D
Diego Biurrun 已提交
1159 1160
            FFSWAP(int, sx, ex);
            FFSWAP(int, sy, ey);
1161 1162 1163 1164 1165 1166
        }
        buf+= sx + sy*stride;
        ey-= sy;
        if(ey) f= ((ex-sx)<<16)/ey;
        else   f= 0;
        for(y= 0; y <= ey; y++){
1167 1168
            x = (y*f)>>16;
            fr= (y*f)&0xFFFF;
M
Fix ;;  
Michael Niedermayer 已提交
1169 1170
            buf[y*stride + x  ]+= (color*(0x10000-fr))>>16;
            buf[y*stride + x+1]+= (color*         fr )>>16;
1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181
        }
    }
}

/**
 * Draw an arrow from (ex, ey) to (sx, sy): the shaft joins the two points
 * and, when they are more than 3 pixels apart, two short head strokes are
 * drawn starting at (sx, sy).
 *
 * @param buf    top-left pixel of the plane to draw into
 * @param sx     x coordinate of the arrow tip
 * @param sy     y coordinate of the arrow tip
 * @param ex     x coordinate of the arrow tail
 * @param ey     y coordinate of the arrow tail
 * @param w      width of the image
 * @param h      height of the image
 * @param stride stride/linesize of the image
 * @param color  color of the arrow
 */
static void draw_arrow(uint8_t *buf, int sx, int sy, int ex, int ey, int w, int h, int stride, int color)
{
    int dx, dy;

    /* Allow the end points to lie up to 100 pixels outside the image;
     * draw_line() does the final clipping. */
    sx = av_clip(sx, -100, w + 100);
    sy = av_clip(sy, -100, h + 100);
    ex = av_clip(ex, -100, w + 100);
    ey = av_clip(ey, -100, h + 100);

    dx = ex - sx;
    dy = ey - sy;

    if (dx*dx + dy*dy > 3*3) {
        /* (head_x, head_y) is built from dx+dy and dy-dx and then scaled by
         * 3*16 over length, where length = ff_sqrt((hx^2 + hy^2) << 8). */
        int head_x =  dx + dy;
        int head_y = -dx + dy;
        int length = ff_sqrt((head_x*head_x + head_y*head_y) << 8);

        /* FIXME subpixel accuracy */
        head_x = ROUNDED_DIV((head_x*3) << 4, length);
        head_y = ROUNDED_DIV((head_y*3) << 4, length);

        draw_line(buf, sx, sy, sx + head_x, sy + head_y, w, h, stride, color);
        draw_line(buf, sx, sy, sx - head_y, sy + head_x, w, h, stride, color);
    }

    draw_line(buf, sx, sy, ex, ey, w, h, stride, color);
}

1208 1209 1210
/**
 * Print debugging info for the given picture.
 */
1211
void ff_print_debug_info(MpegEncContext *s, AVFrame *pict){
1212

1213
    if(s->avctx->hwaccel || !pict || !pict->mb_type) return;
1214 1215 1216

    if(s->avctx->debug&(FF_DEBUG_SKIP | FF_DEBUG_QP | FF_DEBUG_MB_TYPE)){
        int x,y;
1217

1218 1219
        av_log(s->avctx,AV_LOG_DEBUG,"New frame, type: ");
        switch (pict->pict_type) {
1220 1221 1222 1223 1224 1225
            case AV_PICTURE_TYPE_I: av_log(s->avctx,AV_LOG_DEBUG,"I\n"); break;
            case AV_PICTURE_TYPE_P: av_log(s->avctx,AV_LOG_DEBUG,"P\n"); break;
            case AV_PICTURE_TYPE_B: av_log(s->avctx,AV_LOG_DEBUG,"B\n"); break;
            case AV_PICTURE_TYPE_S: av_log(s->avctx,AV_LOG_DEBUG,"S\n"); break;
            case AV_PICTURE_TYPE_SI: av_log(s->avctx,AV_LOG_DEBUG,"SI\n"); break;
            case AV_PICTURE_TYPE_SP: av_log(s->avctx,AV_LOG_DEBUG,"SP\n"); break;
1226
        }
1227 1228 1229 1230 1231
        for(y=0; y<s->mb_height; y++){
            for(x=0; x<s->mb_width; x++){
                if(s->avctx->debug&FF_DEBUG_SKIP){
                    int count= s->mbskip_table[x + y*s->mb_stride];
                    if(count>9) count=9;
1232
                    av_log(s->avctx, AV_LOG_DEBUG, "%1d", count);
1233 1234
                }
                if(s->avctx->debug&FF_DEBUG_QP){
1235
                    av_log(s->avctx, AV_LOG_DEBUG, "%2d", pict->qscale_table[x + y*s->mb_stride]);
1236 1237 1238 1239 1240
                }
                if(s->avctx->debug&FF_DEBUG_MB_TYPE){
                    int mb_type= pict->mb_type[x + y*s->mb_stride];
                    //Type & MV direction
                    if(IS_PCM(mb_type))
1241
                        av_log(s->avctx, AV_LOG_DEBUG, "P");
1242
                    else if(IS_INTRA(mb_type) && IS_ACPRED(mb_type))
1243
                        av_log(s->avctx, AV_LOG_DEBUG, "A");
1244
                    else if(IS_INTRA4x4(mb_type))
1245
                        av_log(s->avctx, AV_LOG_DEBUG, "i");
1246
                    else if(IS_INTRA16x16(mb_type))
1247
                        av_log(s->avctx, AV_LOG_DEBUG, "I");
1248
                    else if(IS_DIRECT(mb_type) && IS_SKIP(mb_type))
1249
                        av_log(s->avctx, AV_LOG_DEBUG, "d");
1250
                    else if(IS_DIRECT(mb_type))
1251
                        av_log(s->avctx, AV_LOG_DEBUG, "D");
1252
                    else if(IS_GMC(mb_type) && IS_SKIP(mb_type))
1253
                        av_log(s->avctx, AV_LOG_DEBUG, "g");
1254
                    else if(IS_GMC(mb_type))
1255
                        av_log(s->avctx, AV_LOG_DEBUG, "G");
1256
                    else if(IS_SKIP(mb_type))
1257
                        av_log(s->avctx, AV_LOG_DEBUG, "S");
1258
                    else if(!USES_LIST(mb_type, 1))
1259
                        av_log(s->avctx, AV_LOG_DEBUG, ">");
1260
                    else if(!USES_LIST(mb_type, 0))
1261
                        av_log(s->avctx, AV_LOG_DEBUG, "<");
1262 1263
                    else{
                        assert(USES_LIST(mb_type, 0) && USES_LIST(mb_type, 1));
1264
                        av_log(s->avctx, AV_LOG_DEBUG, "X");
1265
                    }
1266

1267 1268
                    //segmentation
                    if(IS_8X8(mb_type))
1269
                        av_log(s->avctx, AV_LOG_DEBUG, "+");
1270
                    else if(IS_16X8(mb_type))
1271
                        av_log(s->avctx, AV_LOG_DEBUG, "-");
1272
                    else if(IS_8X16(mb_type))
1273
                        av_log(s->avctx, AV_LOG_DEBUG, "|");
1274
                    else if(IS_INTRA(mb_type) || IS_16X16(mb_type))
1275
                        av_log(s->avctx, AV_LOG_DEBUG, " ");
1276
                    else
1277
                        av_log(s->avctx, AV_LOG_DEBUG, "?");
1278 1279


1280
                    if(IS_INTERLACED(mb_type))
1281
                        av_log(s->avctx, AV_LOG_DEBUG, "=");
1282
                    else
1283
                        av_log(s->avctx, AV_LOG_DEBUG, " ");
1284
                }
1285
//                av_log(s->avctx, AV_LOG_DEBUG, " ");
1286
            }
1287
            av_log(s->avctx, AV_LOG_DEBUG, "\n");
1288 1289
        }
    }
1290

1291
    if((s->avctx->debug&(FF_DEBUG_VIS_QP|FF_DEBUG_VIS_MB_TYPE)) || (s->avctx->debug_mv)){
1292 1293
        const int shift= 1 + s->quarter_sample;
        int mb_y;
1294 1295
        uint8_t *ptr;
        int i;
1296
        int h_chroma_shift, v_chroma_shift, block_height;
1297 1298
        const int width = s->avctx->width;
        const int height= s->avctx->height;
1299
        const int mv_sample_log2= 4 - pict->motion_subsample_log2;
1300
        const int mv_stride= (s->mb_width << mv_sample_log2) + (s->codec_id == CODEC_ID_H264 ? 0 : 1);
M
100000l  
Michael Niedermayer 已提交
1301
        s->low_delay=0; //needed to see the vectors without trashing the buffers
1302

1303
        avcodec_get_chroma_sub_sample(s->avctx->pix_fmt, &h_chroma_shift, &v_chroma_shift);
1304
        for(i=0; i<3; i++){
1305
            memcpy(s->visualization_buffer[i], pict->data[i], (i==0) ? pict->linesize[i]*height:pict->linesize[i]*height >> v_chroma_shift);
1306 1307 1308 1309
            pict->data[i]= s->visualization_buffer[i];
        }
        pict->type= FF_BUFFER_TYPE_COPY;
        ptr= pict->data[0];
1310
        block_height = 16>>v_chroma_shift;
1311 1312 1313 1314 1315

        for(mb_y=0; mb_y<s->mb_height; mb_y++){
            int mb_x;
            for(mb_x=0; mb_x<s->mb_width; mb_x++){
                const int mb_index= mb_x + mb_y*s->mb_stride;
1316 1317 1318
                if((s->avctx->debug_mv) && pict->motion_val){
                  int type;
                  for(type=0; type<3; type++){
1319
                    int direction = 0;
1320
                    switch (type) {
1321
                      case 0: if ((!(s->avctx->debug_mv&FF_DEBUG_VIS_MV_P_FOR)) || (pict->pict_type!=AV_PICTURE_TYPE_P))
1322 1323 1324
                                continue;
                              direction = 0;
                              break;
1325
                      case 1: if ((!(s->avctx->debug_mv&FF_DEBUG_VIS_MV_B_FOR)) || (pict->pict_type!=AV_PICTURE_TYPE_B))
1326 1327 1328
                                continue;
                              direction = 0;
                              break;
1329
                      case 2: if ((!(s->avctx->debug_mv&FF_DEBUG_VIS_MV_B_BACK)) || (pict->pict_type!=AV_PICTURE_TYPE_B))
1330 1331 1332 1333
                                continue;
                              direction = 1;
                              break;
                    }
1334 1335 1336
                    if(!USES_LIST(pict->mb_type[mb_index], direction))
                        continue;

1337 1338 1339
                    if(IS_8X8(pict->mb_type[mb_index])){
                      int i;
                      for(i=0; i<4; i++){
1340 1341
                        int sx= mb_x*16 + 4 + 8*(i&1);
                        int sy= mb_y*16 + 4 + 8*(i>>1);
1342
                        int xy= (mb_x*2 + (i&1) + (mb_y*2 + (i>>1))*mv_stride) << (mv_sample_log2-1);
1343 1344
                        int mx= (pict->motion_val[direction][xy][0]>>shift) + sx;
                        int my= (pict->motion_val[direction][xy][1]>>shift) + sy;
1345
                        draw_arrow(ptr, sx, sy, mx, my, width, height, s->linesize, 100);
1346 1347 1348 1349
                      }
                    }else if(IS_16X8(pict->mb_type[mb_index])){
                      int i;
                      for(i=0; i<2; i++){
1350 1351
                        int sx=mb_x*16 + 8;
                        int sy=mb_y*16 + 4 + 8*i;
1352
                        int xy= (mb_x*2 + (mb_y*2 + i)*mv_stride) << (mv_sample_log2-1);
1353 1354
                        int mx=(pict->motion_val[direction][xy][0]>>shift);
                        int my=(pict->motion_val[direction][xy][1]>>shift);
1355

1356 1357
                        if(IS_INTERLACED(pict->mb_type[mb_index]))
                            my*=2;
1358

1359 1360 1361 1362 1363 1364 1365
                        draw_arrow(ptr, sx, sy, mx+sx, my+sy, width, height, s->linesize, 100);
                      }
                    }else if(IS_8X16(pict->mb_type[mb_index])){
                      int i;
                      for(i=0; i<2; i++){
                        int sx=mb_x*16 + 4 + 8*i;
                        int sy=mb_y*16 + 8;
1366
                        int xy= (mb_x*2 + i + mb_y*2*mv_stride) << (mv_sample_log2-1);
1367 1368
                        int mx=(pict->motion_val[direction][xy][0]>>shift);
                        int my=(pict->motion_val[direction][xy][1]>>shift);
1369

1370 1371
                        if(IS_INTERLACED(pict->mb_type[mb_index]))
                            my*=2;
1372

1373
                        draw_arrow(ptr, sx, sy, mx+sx, my+sy, width, height, s->linesize, 100);
1374 1375 1376 1377
                      }
                    }else{
                      int sx= mb_x*16 + 8;
                      int sy= mb_y*16 + 8;
1378
                      int xy= (mb_x + mb_y*mv_stride) << mv_sample_log2;
1379 1380
                      int mx= (pict->motion_val[direction][xy][0]>>shift) + sx;
                      int my= (pict->motion_val[direction][xy][1]>>shift) + sy;
1381
                      draw_arrow(ptr, sx, sy, mx, my, width, height, s->linesize, 100);
1382
                    }
1383
                  }
M
Michael Niedermayer 已提交
1384 1385 1386 1387
                }
                if((s->avctx->debug&FF_DEBUG_VIS_QP) && pict->motion_val){
                    uint64_t c= (pict->qscale_table[mb_index]*128/31) * 0x0101010101010101ULL;
                    int y;
1388 1389 1390
                    for(y=0; y<block_height; y++){
                        *(uint64_t*)(pict->data[1] + 8*mb_x + (block_height*mb_y + y)*pict->linesize[1])= c;
                        *(uint64_t*)(pict->data[2] + 8*mb_x + (block_height*mb_y + y)*pict->linesize[2])= c;
M
Michael Niedermayer 已提交
1391 1392 1393 1394 1395 1396 1397 1398 1399 1400
                    }
                }
                if((s->avctx->debug&FF_DEBUG_VIS_MB_TYPE) && pict->motion_val){
                    int mb_type= pict->mb_type[mb_index];
                    uint64_t u,v;
                    int y;
#define COLOR(theta, r)\
u= (int)(128 + r*cos(theta*3.141592/180));\
v= (int)(128 + r*sin(theta*3.141592/180));

1401

M
Michael Niedermayer 已提交
1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425 1426 1427 1428 1429
                    u=v=128;
                    if(IS_PCM(mb_type)){
                        COLOR(120,48)
                    }else if((IS_INTRA(mb_type) && IS_ACPRED(mb_type)) || IS_INTRA16x16(mb_type)){
                        COLOR(30,48)
                    }else if(IS_INTRA4x4(mb_type)){
                        COLOR(90,48)
                    }else if(IS_DIRECT(mb_type) && IS_SKIP(mb_type)){
//                        COLOR(120,48)
                    }else if(IS_DIRECT(mb_type)){
                        COLOR(150,48)
                    }else if(IS_GMC(mb_type) && IS_SKIP(mb_type)){
                        COLOR(170,48)
                    }else if(IS_GMC(mb_type)){
                        COLOR(190,48)
                    }else if(IS_SKIP(mb_type)){
//                        COLOR(180,48)
                    }else if(!USES_LIST(mb_type, 1)){
                        COLOR(240,48)
                    }else if(!USES_LIST(mb_type, 0)){
                        COLOR(0,48)
                    }else{
                        assert(USES_LIST(mb_type, 0) && USES_LIST(mb_type, 1));
                        COLOR(300,48)
                    }

                    u*= 0x0101010101010101ULL;
                    v*= 0x0101010101010101ULL;
1430 1431 1432
                    for(y=0; y<block_height; y++){
                        *(uint64_t*)(pict->data[1] + 8*mb_x + (block_height*mb_y + y)*pict->linesize[1])= u;
                        *(uint64_t*)(pict->data[2] + 8*mb_x + (block_height*mb_y + y)*pict->linesize[2])= v;
M
Michael Niedermayer 已提交
1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443
                    }

                    //segmentation
                    if(IS_8X8(mb_type) || IS_16X8(mb_type)){
                        *(uint64_t*)(pict->data[0] + 16*mb_x + 0 + (16*mb_y + 8)*pict->linesize[0])^= 0x8080808080808080ULL;
                        *(uint64_t*)(pict->data[0] + 16*mb_x + 8 + (16*mb_y + 8)*pict->linesize[0])^= 0x8080808080808080ULL;
                    }
                    if(IS_8X8(mb_type) || IS_8X16(mb_type)){
                        for(y=0; y<16; y++)
                            pict->data[0][16*mb_x + 8 + (16*mb_y + y)*pict->linesize[0]]^= 0x80;
                    }
1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458
                    if(IS_8X8(mb_type) && mv_sample_log2 >= 2){
                        int dm= 1 << (mv_sample_log2-2);
                        for(i=0; i<4; i++){
                            int sx= mb_x*16 + 8*(i&1);
                            int sy= mb_y*16 + 8*(i>>1);
                            int xy= (mb_x*2 + (i&1) + (mb_y*2 + (i>>1))*mv_stride) << (mv_sample_log2-1);
                            //FIXME bidir
                            int32_t *mv = (int32_t*)&pict->motion_val[0][xy];
                            if(mv[0] != mv[dm] || mv[dm*mv_stride] != mv[dm*(mv_stride+1)])
                                for(y=0; y<8; y++)
                                    pict->data[0][sx + 4 + (sy + y)*pict->linesize[0]]^= 0x80;
                            if(mv[0] != mv[dm*mv_stride] || mv[dm] != mv[dm*(mv_stride+1)])
                                *(uint64_t*)(pict->data[0] + sx + (sy + 4)*pict->linesize[0])^= 0x8080808080808080ULL;
                        }
                    }
1459

M
Michael Niedermayer 已提交
1460 1461 1462
                    if(IS_INTERLACED(mb_type) && s->codec_id == CODEC_ID_H264){
                        // hmm
                    }
1463 1464 1465 1466 1467
                }
                s->mbskip_table[mb_index]=0;
            }
        }
    }
1468 1469
}

1470
/**
 * Motion-compensate a single block of one plane in lowres mode.
 *
 * The motion vector is split into an integer part (motion >> (lowres+1)),
 * which is added to src_x/src_y, and a fractional part (the low lowres+1
 * bits), which is rescaled and handed to the interpolation function.
 *
 * @param s            context; reads avctx->lowres, quarter_sample, linesize,
 *                     edge_emu_buffer and dsp.emulated_edge_mc
 * @param dest         destination pointer
 * @param src          start of the reference plane
 * @param field_based  shift applied to the vertical edge position and to the
 *                     height/row passed to the edge emulation
 * @param field_select if nonzero, the source is advanced by one s->linesize
 * @param src_x        horizontal block position before the vector is applied
 * @param src_y        vertical block position before the vector is applied
 * @param width        unused in this function
 * @param height       unused in this function
 * @param stride       line stride used for addressing src and for pix_op
 * @param h_edge_pos   horizontal edge position used for the bounds check
 * @param v_edge_pos   vertical edge position used for the bounds check
 * @param w            block width used in the bounds check / edge emulation
 * @param h            block height (rows processed by pix_op)
 * @param pix_op       table of interpolation functions, indexed by
 *                     FFMIN(lowres, 2)
 * @param motion_x     horizontal motion vector component
 * @param motion_y     vertical motion vector component
 * @return 1 if the block was read through the edge emulation buffer,
 *         0 otherwise
 */
static inline int hpel_motion_lowres(MpegEncContext *s,
                                  uint8_t *dest, uint8_t *src,
                                  int field_based, int field_select,
                                  int src_x, int src_y,
                                  int width, int height, int stride,
                                  int h_edge_pos, int v_edge_pos,
                                  int w, int h, h264_chroma_mc_func *pix_op,
                                  int motion_x, int motion_y)
{
    const int lowres= s->avctx->lowres;
    const int op_index= FFMIN(lowres, 2);
    const int s_mask= (2<<lowres)-1;
    int emu=0;
    int sx, sy;

    if(s->quarter_sample){
        motion_x/=2;
        motion_y/=2;
    }

    /* fractional part of the vector, integer part goes into src_x/src_y */
    sx= motion_x & s_mask;
    sy= motion_y & s_mask;
    src_x += motion_x >> (lowres+1);
    src_y += motion_y >> (lowres+1);

    src += src_y * stride + src_x;

    /* one extra column/row is needed whenever the fractional part is
       nonzero, hence the (!!sx) / (!!sy) terms */
    if(   (unsigned)src_x > h_edge_pos                 - (!!sx) - w
       || (unsigned)src_y >(v_edge_pos >> field_based) - (!!sy) - h){
        s->dsp.emulated_edge_mc(s->edge_emu_buffer, src, s->linesize, w+1, (h+1)<<field_based,
                            src_x, src_y<<field_based, h_edge_pos, v_edge_pos);
        src= s->edge_emu_buffer;
        emu=1;
    }

    /* rescale the fraction from lowres+1 bits to 3 bits (0..7) */
    sx= (sx << 2) >> lowres;
    sy= (sy << 2) >> lowres;
    if(field_select)
        src += s->linesize;
    pix_op[op_index](dest, src, stride, h, sx, sy);
    return emu;
}

F
Fabrice Bellard 已提交
1513
/* apply one mpeg motion vector to the three components */
B
Benoit Fouet 已提交
1514
static av_always_inline void mpeg_motion_lowres(MpegEncContext *s,
1515
                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
1516
                               int field_based, int bottom_field, int field_select,
B
Benoit Fouet 已提交
1517
                               uint8_t **ref_picture, h264_chroma_mc_func *pix_op,
1518
                               int motion_x, int motion_y, int h, int mb_y)
F
Fabrice Bellard 已提交
1519
{
1520
    uint8_t *ptr_y, *ptr_cb, *ptr_cr;
B
Benoit Fouet 已提交
1521 1522
    int mx, my, src_x, src_y, uvsrc_x, uvsrc_y, uvlinesize, linesize, sx, sy, uvsx, uvsy;
    const int lowres= s->avctx->lowres;
1523
    const int op_index= FFMIN(lowres, 2);
B
Benoit Fouet 已提交
1524 1525 1526 1527
    const int block_s= 8>>lowres;
    const int s_mask= (2<<lowres)-1;
    const int h_edge_pos = s->h_edge_pos >> lowres;
    const int v_edge_pos = s->v_edge_pos >> lowres;
1528
    linesize   = s->current_picture.linesize[0] << field_based;
M
Michael Niedermayer 已提交
1529
    uvlinesize = s->current_picture.linesize[1] << field_based;
1530

1531
    if(s->quarter_sample){ //FIXME obviously not perfect but qpel will not work in lowres anyway
B
Benoit Fouet 已提交
1532 1533 1534 1535 1536 1537 1538 1539 1540 1541 1542
        motion_x/=2;
        motion_y/=2;
    }

    if(field_based){
        motion_y += (bottom_field - field_select)*((1<<lowres)-1);
    }

    sx= motion_x & s_mask;
    sy= motion_y & s_mask;
    src_x = s->mb_x*2*block_s               + (motion_x >> (lowres+1));
1543
    src_y =(   mb_y*2*block_s>>field_based) + (motion_y >> (lowres+1));
1544

M
Michael Niedermayer 已提交
1545
    if (s->out_format == FMT_H263) {
M
Michael Niedermayer 已提交
1546 1547
        uvsx = ((motion_x>>1) & s_mask) | (sx&1);
        uvsy = ((motion_y>>1) & s_mask) | (sy&1);
M
Michael Niedermayer 已提交
1548 1549 1550 1551 1552 1553 1554 1555
        uvsrc_x = src_x>>1;
        uvsrc_y = src_y>>1;
    }else if(s->out_format == FMT_H261){//even chroma mv's are full pel in H261
        mx = motion_x / 4;
        my = motion_y / 4;
        uvsx = (2*mx) & s_mask;
        uvsy = (2*my) & s_mask;
        uvsrc_x = s->mb_x*block_s               + (mx >> lowres);
1556
        uvsrc_y =    mb_y*block_s               + (my >> lowres);
M
Michael Niedermayer 已提交
1557 1558 1559 1560 1561 1562
    } else {
        mx = motion_x / 2;
        my = motion_y / 2;
        uvsx = mx & s_mask;
        uvsy = my & s_mask;
        uvsrc_x = s->mb_x*block_s               + (mx >> (lowres+1));
1563
        uvsrc_y =(   mb_y*block_s>>field_based) + (my >> (lowres+1));
M
Michael Niedermayer 已提交
1564 1565 1566 1567 1568 1569 1570 1571
    }

    ptr_y  = ref_picture[0] + src_y * linesize + src_x;
    ptr_cb = ref_picture[1] + uvsrc_y * uvlinesize + uvsrc_x;
    ptr_cr = ref_picture[2] + uvsrc_y * uvlinesize + uvsrc_x;

    if(   (unsigned)src_x > h_edge_pos                 - (!!sx) - 2*block_s
       || (unsigned)src_y >(v_edge_pos >> field_based) - (!!sy) - h){
1572
            s->dsp.emulated_edge_mc(s->edge_emu_buffer, ptr_y, s->linesize, 17, 17+field_based,
M
Michael Niedermayer 已提交
1573 1574
                             src_x, src_y<<field_based, h_edge_pos, v_edge_pos);
            ptr_y = s->edge_emu_buffer;
1575
            if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
M
Michael Niedermayer 已提交
1576
                uint8_t *uvbuf= s->edge_emu_buffer+18*s->linesize;
1577
                s->dsp.emulated_edge_mc(uvbuf  , ptr_cb, s->uvlinesize, 9, 9+field_based,
M
Michael Niedermayer 已提交
1578
                                 uvsrc_x, uvsrc_y<<field_based, h_edge_pos>>1, v_edge_pos>>1);
1579
                s->dsp.emulated_edge_mc(uvbuf+16, ptr_cr, s->uvlinesize, 9, 9+field_based,
M
Michael Niedermayer 已提交
1580 1581 1582 1583 1584 1585
                                 uvsrc_x, uvsrc_y<<field_based, h_edge_pos>>1, v_edge_pos>>1);
                ptr_cb= uvbuf;
                ptr_cr= uvbuf+16;
            }
    }

1586 1587 1588 1589 1590 1591 1592 1593 1594 1595 1596 1597
    if(bottom_field){ //FIXME use this for field pix too instead of the obnoxious hack which changes picture.data
        dest_y += s->linesize;
        dest_cb+= s->uvlinesize;
        dest_cr+= s->uvlinesize;
    }

    if(field_select){
        ptr_y += s->linesize;
        ptr_cb+= s->uvlinesize;
        ptr_cr+= s->uvlinesize;
    }

1598 1599
    sx= (sx << 2) >> lowres;
    sy= (sy << 2) >> lowres;
M
Michael Niedermayer 已提交
1600
    pix_op[lowres-1](dest_y, ptr_y, linesize, h, sx, sy);
1601

1602
    if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
1603 1604 1605 1606
        uvsx= (uvsx << 2) >> lowres;
        uvsy= (uvsy << 2) >> lowres;
        pix_op[op_index](dest_cb, ptr_cb, uvlinesize, h >> s->chroma_y_shift, uvsx, uvsy);
        pix_op[op_index](dest_cr, ptr_cr, uvlinesize, h >> s->chroma_y_shift, uvsx, uvsy);
M
Michael Niedermayer 已提交
1607
    }
M
Michael Niedermayer 已提交
1608
    //FIXME h261 lowres loop filter
M
Michael Niedermayer 已提交
1609 1610
}

M
Michael Niedermayer 已提交
1611 1612 1613 1614 1615 1616
/**
 * Motion-compensate both chroma blocks of a 4MV macroblock in lowres mode.
 *
 * @param s           context
 * @param dest_cb     chroma cb/u destination pointer
 * @param dest_cr     chroma cr/v destination pointer
 * @param ref_picture array[3] of pointers to the planes of the reference;
 *                    only entries 1 and 2 are read here
 * @param pix_op      table of interpolation functions, indexed by
 *                    FFMIN(lowres, 2)
 * @param mx          horizontal vector input; it is passed through
 *                    ff_h263_round_chroma() before use
 * @param my          vertical vector input, treated like mx
 *
 * The bounds check (and therefore edge emulation) is only performed when
 * CODEC_FLAG_EMU_EDGE is set in s->flags.
 */
static inline void chroma_4mv_motion_lowres(MpegEncContext *s,
                                     uint8_t *dest_cb, uint8_t *dest_cr,
                                     uint8_t **ref_picture,
                                     h264_chroma_mc_func *pix_op,
                                     int mx, int my){
    const int lowres= s->avctx->lowres;
    const int op_index= FFMIN(lowres, 2);
    const int block_s= 8>>lowres;
    const int s_mask= (2<<lowres)-1;
    const int h_edge_pos = s->h_edge_pos >> (lowres+1);
    const int v_edge_pos = s->v_edge_pos >> (lowres+1);
    int emu=0, src_x, src_y, offset, sx, sy;
    uint8_t *ptr;

    if(s->quarter_sample){
        mx/=2;
        my/=2;
    }

    /* In case of 8X8, we construct a single chroma motion vector
       with a special rounding */
    mx= ff_h263_round_chroma(mx);
    my= ff_h263_round_chroma(my);

    /* fractional part in sx/sy, integer part folded into src_x/src_y */
    sx= mx & s_mask;
    sy= my & s_mask;
    src_x = s->mb_x*block_s + (mx >> (lowres+1));
    src_y = s->mb_y*block_s + (my >> (lowres+1));

    /* the same offset is used for both chroma planes */
    offset = src_y * s->uvlinesize + src_x;
    ptr = ref_picture[1] + offset;
    if(s->flags&CODEC_FLAG_EMU_EDGE){
        if(   (unsigned)src_x > h_edge_pos - (!!sx) - block_s
           || (unsigned)src_y > v_edge_pos - (!!sy) - block_s){
            s->dsp.emulated_edge_mc(s->edge_emu_buffer, ptr, s->uvlinesize, 9, 9, src_x, src_y, h_edge_pos, v_edge_pos);
            ptr= s->edge_emu_buffer;
            emu=1;
        }
    }
    /* rescale the fraction from lowres+1 bits to 3 bits (0..7) */
    sx= (sx << 2) >> lowres;
    sy= (sy << 2) >> lowres;
    pix_op[op_index](dest_cb, ptr, s->uvlinesize, block_s, sx, sy);

    /* cr reuses the emulation decision made for cb */
    ptr = ref_picture[2] + offset;
    if(emu){
        s->dsp.emulated_edge_mc(s->edge_emu_buffer, ptr, s->uvlinesize, 9, 9, src_x, src_y, h_edge_pos, v_edge_pos);
        ptr= s->edge_emu_buffer;
    }
    pix_op[op_index](dest_cr, ptr, s->uvlinesize, block_s, sx, sy);
}

M
doxy  
Michael Niedermayer 已提交
1662
/**
D
Diego Biurrun 已提交
1663
 * motion compensation of a single macroblock
M
doxy  
Michael Niedermayer 已提交
1664 1665 1666 1667 1668 1669
 * @param s context
 * @param dest_y luma destination pointer
 * @param dest_cb chroma cb/u destination pointer
 * @param dest_cr chroma cr/v destination pointer
 * @param dir direction (0->forward, 1->backward)
 * @param ref_picture array[3] of pointers to the 3 planes of the reference picture
1670
 * @param pix_op halfpel motion compensation function (average or put normally)
M
doxy  
Michael Niedermayer 已提交
1671 1672
 * the motion vectors are taken from s->mv and the MV type from s->mv_type
 */
B
Benoit Fouet 已提交
1673
static inline void MPV_motion_lowres(MpegEncContext *s,
1674
                              uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
1675
                              int dir, uint8_t **ref_picture,
B
Benoit Fouet 已提交
1676
                              h264_chroma_mc_func *pix_op)
F
Fabrice Bellard 已提交
1677
{
B
Benoit Fouet 已提交
1678
    int mx, my;
F
Fabrice Bellard 已提交
1679
    int mb_x, mb_y, i;
B
Benoit Fouet 已提交
1680 1681
    const int lowres= s->avctx->lowres;
    const int block_s= 8>>lowres;
F
Fabrice Bellard 已提交
1682 1683 1684 1685 1686 1687

    mb_x = s->mb_x;
    mb_y = s->mb_y;

    switch(s->mv_type) {
    case MV_TYPE_16X16:
B
Benoit Fouet 已提交
1688 1689 1690
        mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
                    0, 0, 0,
                    ref_picture, pix_op,
1691
                    s->mv[dir][0][0], s->mv[dir][0][1], 2*block_s, mb_y);
F
Fabrice Bellard 已提交
1692 1693
        break;
    case MV_TYPE_8X8:
M
Michael Niedermayer 已提交
1694 1695 1696
        mx = 0;
        my = 0;
            for(i=0;i<4;i++) {
B
Benoit Fouet 已提交
1697
                hpel_motion_lowres(s, dest_y + ((i & 1) + (i >> 1) * s->linesize)*block_s,
1698
                            ref_picture[0], 0, 0,
B
Benoit Fouet 已提交
1699
                            (2*mb_x + (i & 1))*block_s, (2*mb_y + (i >>1))*block_s,
M
Michael Niedermayer 已提交
1700
                            s->width, s->height, s->linesize,
B
Benoit Fouet 已提交
1701 1702
                            s->h_edge_pos >> lowres, s->v_edge_pos >> lowres,
                            block_s, block_s, pix_op,
M
Michael Niedermayer 已提交
1703
                            s->mv[dir][i][0], s->mv[dir][i][1]);
M
Michael Niedermayer 已提交
1704 1705 1706

                mx += s->mv[dir][i][0];
                my += s->mv[dir][i][1];
M
Michael Niedermayer 已提交
1707
            }
M
Michael Niedermayer 已提交
1708

1709
        if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY))
B
Benoit Fouet 已提交
1710
            chroma_4mv_motion_lowres(s, dest_cb, dest_cr, ref_picture, pix_op, mx, my);
F
Fabrice Bellard 已提交
1711 1712 1713
        break;
    case MV_TYPE_FIELD:
        if (s->picture_structure == PICT_FRAME) {
B
Benoit Fouet 已提交
1714 1715 1716 1717
            /* top field */
            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
                        1, 0, s->field_select[dir][0],
                        ref_picture, pix_op,
1718
                        s->mv[dir][0][0], s->mv[dir][0][1], block_s, mb_y);
B
Benoit Fouet 已提交
1719 1720 1721 1722
            /* bottom field */
            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
                        1, 1, s->field_select[dir][1],
                        ref_picture, pix_op,
1723
                        s->mv[dir][1][0], s->mv[dir][1][1], block_s, mb_y);
F
Fabrice Bellard 已提交
1724
        } else {
1725
            if(s->picture_structure != s->field_select[dir][0] + 1 && s->pict_type != AV_PICTURE_TYPE_B && !s->first_field){
1726
                ref_picture= s->current_picture_ptr->data;
1727
            }
F
Fabrice Bellard 已提交
1728

B
Benoit Fouet 已提交
1729
            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
1730 1731
                        0, 0, s->field_select[dir][0],
                        ref_picture, pix_op,
1732
                        s->mv[dir][0][0], s->mv[dir][0][1], 2*block_s, mb_y>>1);
F
Fabrice Bellard 已提交
1733
        }
1734
        break;
M
Michael Niedermayer 已提交
1735 1736 1737
    case MV_TYPE_16X8:
        for(i=0; i<2; i++){
            uint8_t ** ref2picture;
1738

1739
            if(s->picture_structure == s->field_select[dir][i] + 1 || s->pict_type == AV_PICTURE_TYPE_B || s->first_field){
1740 1741
                ref2picture= ref_picture;
            }else{
1742
                ref2picture= s->current_picture_ptr->data;
1743
            }
1744

B
Benoit Fouet 已提交
1745
            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
M
Michael Niedermayer 已提交
1746
                        0, 0, s->field_select[dir][i],
1747
                        ref2picture, pix_op,
1748
                        s->mv[dir][i][0], s->mv[dir][i][1] + 2*block_s*i, block_s, mb_y>>1);
1749

B
Benoit Fouet 已提交
1750 1751 1752
            dest_y += 2*block_s*s->linesize;
            dest_cb+= (2*block_s>>s->chroma_y_shift)*s->uvlinesize;
            dest_cr+= (2*block_s>>s->chroma_y_shift)*s->uvlinesize;
1753
        }
F
Fabrice Bellard 已提交
1754
        break;
1755 1756
    case MV_TYPE_DMV:
        if(s->picture_structure == PICT_FRAME){
M
Michael Niedermayer 已提交
1757 1758 1759
            for(i=0; i<2; i++){
                int j;
                for(j=0; j<2; j++){
B
Benoit Fouet 已提交
1760
                    mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
M
Michael Niedermayer 已提交
1761 1762
                                1, j, j^i,
                                ref_picture, pix_op,
1763
                                s->mv[dir][2*i + j][0], s->mv[dir][2*i + j][1], block_s, mb_y);
M
Michael Niedermayer 已提交
1764
                }
B
Benoit Fouet 已提交
1765
                pix_op = s->dsp.avg_h264_chroma_pixels_tab;
M
Michael Niedermayer 已提交
1766
            }
1767
        }else{
M
Michael Niedermayer 已提交
1768
            for(i=0; i<2; i++){
B
Benoit Fouet 已提交
1769
                mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
M
Michael Niedermayer 已提交
1770 1771
                            0, 0, s->picture_structure != i+1,
                            ref_picture, pix_op,
1772
                            s->mv[dir][2*i][0],s->mv[dir][2*i][1],2*block_s, mb_y>>1);
1773

M
Michael Niedermayer 已提交
1774
                // after put we make avg of the same block
B
Benoit Fouet 已提交
1775
                pix_op = s->dsp.avg_h264_chroma_pixels_tab;
1776

M
Michael Niedermayer 已提交
1777 1778
                //opposite parity is always in the same frame if this is second field
                if(!s->first_field){
1779
                    ref_picture = s->current_picture_ptr->data;
M
Michael Niedermayer 已提交
1780
                }
1781
            }
1782 1783
        }
    break;
M
Michael Niedermayer 已提交
1784
    default: assert(0);
F
Fabrice Bellard 已提交
1785 1786 1787
    }
}

B
Benoit Fouet 已提交
1788 1789 1790
/**
 * put block[] to dest[]
 *
 * Runs the intra dequantizer on the block and then writes the IDCT result
 * to dest via s->dsp.idct_put.
 *
 * @param s         context
 * @param block     coefficient block, dequantized in place
 * @param i         block index passed to the dequantizer
 * @param dest      destination pointer
 * @param line_size destination line size
 * @param qscale    quantizer scale passed to the dequantizer
 */
static inline void put_dct(MpegEncContext *s,
                           DCTELEM *block, int i, uint8_t *dest, int line_size, int qscale)
{
    s->dct_unquantize_intra(s, block, i, qscale);
    s->dsp.idct_put (dest, line_size, block);
}
1795

B
Benoit Fouet 已提交
1796 1797 1798 1799 1800 1801 1802 1803
/**
 * add block[] to dest[]
 *
 * No dequantization is done here. The block is skipped entirely when
 * s->block_last_index[i] is negative.
 *
 * @param s         context
 * @param block     coefficient block
 * @param i         block index, used to look up s->block_last_index
 * @param dest      destination pointer
 * @param line_size destination line size
 */
static inline void add_dct(MpegEncContext *s,
                           DCTELEM *block, int i, uint8_t *dest, int line_size)
{
    if (s->block_last_index[i] >= 0) {
        s->dsp.idct_add (dest, line_size, block);
    }
}
1804

1805
static inline void add_dequant_dct(MpegEncContext *s,
M
Michael Niedermayer 已提交
1806
                           DCTELEM *block, int i, uint8_t *dest, int line_size, int qscale)
M
Michael Niedermayer 已提交
1807
{
F
Fabrice Bellard 已提交
1808
    if (s->block_last_index[i] >= 0) {
1809
        s->dct_unquantize_inter(s, block, i, qscale);
1810

1811
        s->dsp.idct_add (dest, line_size, block);
F
Fabrice Bellard 已提交
1812 1813 1814
    }
}

1815 1816 1817 1818 1819
/**
 * cleans dc, ac, coded_block for the current non intra MB
 *
 * For the macroblock at (s->mb_x, s->mb_y) this resets the four luma and
 * two chroma DC entries to 1024, zeroes the corresponding AC entries,
 * clears the four coded_block entries when s->msmpeg4_version >= 3, and
 * finally clears the macroblock's mbintra_table flag.
 *
 * @param s context; s->block_index[0] must already point at the
 *          macroblock's top-left luma block
 */
void ff_clean_intra_table_entries(MpegEncContext *s)
{
    int wrap = s->b8_stride;
    int xy = s->block_index[0];

    /* luma: 2x2 blocks, second row is one b8_stride further */
    s->dc_val[0][xy           ] =
    s->dc_val[0][xy + 1       ] =
    s->dc_val[0][xy     + wrap] =
    s->dc_val[0][xy + 1 + wrap] = 1024;
    /* ac pred */
    /* 32 values per row: presumably entries xy and xy+1, 16 values each */
    memset(s->ac_val[0][xy       ], 0, 32 * sizeof(int16_t));
    memset(s->ac_val[0][xy + wrap], 0, 32 * sizeof(int16_t));
    if (s->msmpeg4_version>=3) {
        s->coded_block[xy           ] =
        s->coded_block[xy + 1       ] =
        s->coded_block[xy     + wrap] =
        s->coded_block[xy + 1 + wrap] = 0;
    }
    /* chroma */
    /* chroma tables are indexed per macroblock, so switch to mb_stride */
    wrap = s->mb_stride;
    xy = s->mb_x + s->mb_y * wrap;
    s->dc_val[1][xy] =
    s->dc_val[2][xy] = 1024;
    /* ac pred */
    memset(s->ac_val[1][xy], 0, 16 * sizeof(int16_t));
    memset(s->ac_val[2][xy], 0, 16 * sizeof(int16_t));

    s->mbintra_table[xy]= 0;
}

F
Fabrice Bellard 已提交
1848 1849 1850 1851 1852 1853 1854 1855 1856 1857
/* generic function called after a macroblock has been parsed by the
   decoder or after it has been encoded by the encoder.

   Important variables used:
   s->mb_intra : true if intra macroblock
   s->mv_dir   : motion vector direction
   s->mv_type  : motion vector type
   s->mv       : motion vector
   s->interlaced_dct : true if interlaced dct used (mpeg2)
 */
1858 1859
static av_always_inline
void MPV_decode_mb_internal(MpegEncContext *s, DCTELEM block[12][64],
K
Keiji Costantini 已提交
1860
                            int lowres_flag, int is_mpeg12)
F
Fabrice Bellard 已提交
1861
{
1862
    const int mb_xy = s->mb_y * s->mb_stride + s->mb_x;
1863
    if(CONFIG_MPEG_XVMC_DECODER && s->avctx->xvmc_acceleration){
1864
        ff_xvmc_decode_mb(s);//xvmc uses pblocks
I
Ivan Kalvachev 已提交
1865 1866
        return;
    }
F
Fabrice Bellard 已提交
1867

1868 1869 1870 1871 1872 1873 1874 1875 1876
    if(s->avctx->debug&FF_DEBUG_DCT_COEFF) {
       /* save DCT coefficients */
       int i,j;
       DCTELEM *dct = &s->current_picture.dct_coeff[mb_xy*64*6];
       for(i=0; i<6; i++)
           for(j=0; j<64; j++)
               *dct++ = block[i][s->dsp.idct_permutation[j]];
    }

M
cleanup  
Michael Niedermayer 已提交
1877
    s->current_picture.qscale_table[mb_xy]= s->qscale;
1878

F
Fabrice Bellard 已提交
1879 1880
    /* update DC predictors for P macroblocks */
    if (!s->mb_intra) {
K
Keiji Costantini 已提交
1881
        if (!is_mpeg12 && (s->h263_pred || s->h263_aic)) {
M
Michael Niedermayer 已提交
1882
            if(s->mbintra_table[mb_xy])
1883
                ff_clean_intra_table_entries(s);
F
Fabrice Bellard 已提交
1884
        } else {
1885 1886
            s->last_dc[0] =
            s->last_dc[1] =
F
Fabrice Bellard 已提交
1887 1888 1889
            s->last_dc[2] = 128 << s->intra_dc_precision;
        }
    }
K
Keiji Costantini 已提交
1890
    else if (!is_mpeg12 && (s->h263_pred || s->h263_aic))
M
Michael Niedermayer 已提交
1891
        s->mbintra_table[mb_xy]=1;
1892

1893
    if ((s->flags&CODEC_FLAG_PSNR) || !(s->encoding && (s->intra_only || s->pict_type==AV_PICTURE_TYPE_B) && s->avctx->mb_decision != FF_MB_DECISION_RD)) { //FIXME precalc
1894
        uint8_t *dest_y, *dest_cb, *dest_cr;
M
Michael Niedermayer 已提交
1895
        int dct_linesize, dct_offset;
M
Michael Niedermayer 已提交
1896 1897
        op_pixels_func (*op_pix)[4];
        qpel_mc_func (*op_qpix)[16];
1898
        const int linesize= s->current_picture.linesize[0]; //not s->linesize as this would be wrong for field pics
M
Michael Niedermayer 已提交
1899
        const int uvlinesize= s->current_picture.linesize[1];
1900
        const int readable= s->pict_type != AV_PICTURE_TYPE_B || s->encoding || s->avctx->draw_horiz_band || lowres_flag;
M
Michael Niedermayer 已提交
1901
        const int block_size= lowres_flag ? 8>>s->avctx->lowres : 8;
1902

M
cleanup  
Michael Niedermayer 已提交
1903 1904 1905
        /* avoid copy if macroblock skipped in last frame too */
        /* skip only during decoding as we might trash the buffers during encoding a bit */
        if(!s->encoding){
1906
            uint8_t *mbskip_ptr = &s->mbskip_table[mb_xy];
M
cleanup  
Michael Niedermayer 已提交
1907
            const int age= s->current_picture.age;
M
Michael Niedermayer 已提交
1908

M
cleanup  
Michael Niedermayer 已提交
1909 1910
            assert(age);

1911 1912
            if (s->mb_skipped) {
                s->mb_skipped= 0;
1913
                assert(s->pict_type!=AV_PICTURE_TYPE_I);
1914

1915
                (*mbskip_ptr) ++; /* indicate that this time we skipped it */
M
Michael Niedermayer 已提交
1916 1917
                if(*mbskip_ptr >99) *mbskip_ptr= 99;

M
cleanup  
Michael Niedermayer 已提交
1918
                /* if previous was skipped too, then nothing to do !  */
1919 1920
                if (*mbskip_ptr >= age && s->current_picture.reference){
                    return;
M
cleanup  
Michael Niedermayer 已提交
1921
                }
1922 1923 1924 1925
            } else if(!s->current_picture.reference){
                (*mbskip_ptr) ++; /* increase counter so the age can be compared cleanly */
                if(*mbskip_ptr >99) *mbskip_ptr= 99;
            } else{
1926 1927
                *mbskip_ptr = 0; /* not skipped */
            }
M
Michael Niedermayer 已提交
1928
        }
1929

1930
        dct_linesize = linesize << s->interlaced_dct;
M
Michael Niedermayer 已提交
1931
        dct_offset =(s->interlaced_dct)? linesize : linesize*block_size;
1932

1933 1934 1935 1936 1937
        if(readable){
            dest_y=  s->dest[0];
            dest_cb= s->dest[1];
            dest_cr= s->dest[2];
        }else{
1938
            dest_y = s->b_scratchpad;
1939
            dest_cb= s->b_scratchpad+16*linesize;
1940
            dest_cr= s->b_scratchpad+32*linesize;
1941
        }
M
Michael Niedermayer 已提交
1942

F
Fabrice Bellard 已提交
1943 1944
        if (!s->mb_intra) {
            /* motion handling */
1945
            /* decoding or more than one mb_type (MC was already done otherwise) */
1946
            if(!s->encoding){
M
Michael Niedermayer 已提交
1947 1948
                if(lowres_flag){
                    h264_chroma_mc_func *op_pix = s->dsp.put_h264_chroma_pixels_tab;
F
Fabrice Bellard 已提交
1949

M
Michael Niedermayer 已提交
1950 1951 1952 1953 1954 1955 1956 1957
                    if (s->mv_dir & MV_DIR_FORWARD) {
                        MPV_motion_lowres(s, dest_y, dest_cb, dest_cr, 0, s->last_picture.data, op_pix);
                        op_pix = s->dsp.avg_h264_chroma_pixels_tab;
                    }
                    if (s->mv_dir & MV_DIR_BACKWARD) {
                        MPV_motion_lowres(s, dest_y, dest_cb, dest_cr, 1, s->next_picture.data, op_pix);
                    }
                }else{
1958
                    op_qpix= s->me.qpel_put;
1959
                    if ((!s->no_rounding) || s->pict_type==AV_PICTURE_TYPE_B){
M
Michael Niedermayer 已提交
1960 1961 1962 1963 1964 1965 1966
                        op_pix = s->dsp.put_pixels_tab;
                    }else{
                        op_pix = s->dsp.put_no_rnd_pixels_tab;
                    }
                    if (s->mv_dir & MV_DIR_FORWARD) {
                        MPV_motion(s, dest_y, dest_cb, dest_cr, 0, s->last_picture.data, op_pix, op_qpix);
                        op_pix = s->dsp.avg_pixels_tab;
1967
                        op_qpix= s->me.qpel_avg;
M
Michael Niedermayer 已提交
1968 1969 1970 1971
                    }
                    if (s->mv_dir & MV_DIR_BACKWARD) {
                        MPV_motion(s, dest_y, dest_cb, dest_cr, 1, s->next_picture.data, op_pix, op_qpix);
                    }
1972
                }
F
Fabrice Bellard 已提交
1973 1974
            }

M
Michael Niedermayer 已提交
1975
            /* skip dequant / idct if we are really late ;) */
M
Michael Niedermayer 已提交
1976
            if(s->avctx->skip_idct){
1977 1978
                if(  (s->avctx->skip_idct >= AVDISCARD_NONREF && s->pict_type == AV_PICTURE_TYPE_B)
                   ||(s->avctx->skip_idct >= AVDISCARD_NONKEY && s->pict_type != AV_PICTURE_TYPE_I)
M
Michael Niedermayer 已提交
1979 1980 1981
                   || s->avctx->skip_idct >= AVDISCARD_ALL)
                    goto skip_idct;
            }
M
Michael Niedermayer 已提交
1982

F
Fabrice Bellard 已提交
1983
            /* add dct residue */
M
Michael Niedermayer 已提交
1984
            if(s->encoding || !(   s->h263_msmpeg4 || s->codec_id==CODEC_ID_MPEG1VIDEO || s->codec_id==CODEC_ID_MPEG2VIDEO
1985
                                || (s->codec_id==CODEC_ID_MPEG4 && !s->mpeg_quant))){
M
Michael Niedermayer 已提交
1986 1987 1988 1989
                add_dequant_dct(s, block[0], 0, dest_y                          , dct_linesize, s->qscale);
                add_dequant_dct(s, block[1], 1, dest_y              + block_size, dct_linesize, s->qscale);
                add_dequant_dct(s, block[2], 2, dest_y + dct_offset             , dct_linesize, s->qscale);
                add_dequant_dct(s, block[3], 3, dest_y + dct_offset + block_size, dct_linesize, s->qscale);
M
Michael Niedermayer 已提交
1990

1991
                if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
1992 1993 1994 1995 1996 1997 1998 1999 2000 2001 2002
                    if (s->chroma_y_shift){
                        add_dequant_dct(s, block[4], 4, dest_cb, uvlinesize, s->chroma_qscale);
                        add_dequant_dct(s, block[5], 5, dest_cr, uvlinesize, s->chroma_qscale);
                    }else{
                        dct_linesize >>= 1;
                        dct_offset >>=1;
                        add_dequant_dct(s, block[4], 4, dest_cb,              dct_linesize, s->chroma_qscale);
                        add_dequant_dct(s, block[5], 5, dest_cr,              dct_linesize, s->chroma_qscale);
                        add_dequant_dct(s, block[6], 6, dest_cb + dct_offset, dct_linesize, s->chroma_qscale);
                        add_dequant_dct(s, block[7], 7, dest_cr + dct_offset, dct_linesize, s->chroma_qscale);
                    }
M
Michael Niedermayer 已提交
2003
                }
K
Keiji Costantini 已提交
2004
            } else if(is_mpeg12 || (s->codec_id != CODEC_ID_WMV2)){
M
Michael Niedermayer 已提交
2005 2006 2007 2008
                add_dct(s, block[0], 0, dest_y                          , dct_linesize);
                add_dct(s, block[1], 1, dest_y              + block_size, dct_linesize);
                add_dct(s, block[2], 2, dest_y + dct_offset             , dct_linesize);
                add_dct(s, block[3], 3, dest_y + dct_offset + block_size, dct_linesize);
F
Fabrice Bellard 已提交
2009

2010
                if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
2011 2012 2013 2014 2015 2016 2017 2018 2019 2020 2021 2022 2023 2024 2025 2026 2027 2028 2029 2030 2031
                    if(s->chroma_y_shift){//Chroma420
                        add_dct(s, block[4], 4, dest_cb, uvlinesize);
                        add_dct(s, block[5], 5, dest_cr, uvlinesize);
                    }else{
                        //chroma422
                        dct_linesize = uvlinesize << s->interlaced_dct;
                        dct_offset =(s->interlaced_dct)? uvlinesize : uvlinesize*8;

                        add_dct(s, block[4], 4, dest_cb, dct_linesize);
                        add_dct(s, block[5], 5, dest_cr, dct_linesize);
                        add_dct(s, block[6], 6, dest_cb+dct_offset, dct_linesize);
                        add_dct(s, block[7], 7, dest_cr+dct_offset, dct_linesize);
                        if(!s->chroma_x_shift){//Chroma444
                            add_dct(s, block[8], 8, dest_cb+8, dct_linesize);
                            add_dct(s, block[9], 9, dest_cr+8, dct_linesize);
                            add_dct(s, block[10], 10, dest_cb+8+dct_offset, dct_linesize);
                            add_dct(s, block[11], 11, dest_cr+8+dct_offset, dct_linesize);
                        }
                    }
                }//fi gray
            }
2032
            else if (CONFIG_WMV2_DECODER || CONFIG_WMV2_ENCODER) {
M
Michael Niedermayer 已提交
2033
                ff_wmv2_add_mb(s, block, dest_y, dest_cb, dest_cr);
M
Michael Niedermayer 已提交
2034
            }
F
Fabrice Bellard 已提交
2035 2036
        } else {
            /* dct only in intra block */
M
Michael Niedermayer 已提交
2037
            if(s->encoding || !(s->codec_id==CODEC_ID_MPEG1VIDEO || s->codec_id==CODEC_ID_MPEG2VIDEO)){
M
Michael Niedermayer 已提交
2038 2039 2040 2041
                put_dct(s, block[0], 0, dest_y                          , dct_linesize, s->qscale);
                put_dct(s, block[1], 1, dest_y              + block_size, dct_linesize, s->qscale);
                put_dct(s, block[2], 2, dest_y + dct_offset             , dct_linesize, s->qscale);
                put_dct(s, block[3], 3, dest_y + dct_offset + block_size, dct_linesize, s->qscale);
2042

2043
                if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
2044 2045 2046 2047 2048 2049 2050 2051 2052
                    if(s->chroma_y_shift){
                        put_dct(s, block[4], 4, dest_cb, uvlinesize, s->chroma_qscale);
                        put_dct(s, block[5], 5, dest_cr, uvlinesize, s->chroma_qscale);
                    }else{
                        dct_offset >>=1;
                        dct_linesize >>=1;
                        put_dct(s, block[4], 4, dest_cb,              dct_linesize, s->chroma_qscale);
                        put_dct(s, block[5], 5, dest_cr,              dct_linesize, s->chroma_qscale);
                        put_dct(s, block[6], 6, dest_cb + dct_offset, dct_linesize, s->chroma_qscale);
B
Benoit Fouet 已提交
2053
                        put_dct(s, block[7], 7, dest_cr + dct_offset, dct_linesize, s->chroma_qscale);
M
Michael Niedermayer 已提交
2054 2055 2056
                    }
                }
            }else{
B
Benoit Fouet 已提交
2057 2058 2059 2060
                s->dsp.idct_put(dest_y                          , dct_linesize, block[0]);
                s->dsp.idct_put(dest_y              + block_size, dct_linesize, block[1]);
                s->dsp.idct_put(dest_y + dct_offset             , dct_linesize, block[2]);
                s->dsp.idct_put(dest_y + dct_offset + block_size, dct_linesize, block[3]);
2061

2062
                if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
B
Benoit Fouet 已提交
2063 2064 2065 2066
                    if(s->chroma_y_shift){
                        s->dsp.idct_put(dest_cb, uvlinesize, block[4]);
                        s->dsp.idct_put(dest_cr, uvlinesize, block[5]);
                    }else{
2067

B
Benoit Fouet 已提交
2068 2069
                        dct_linesize = uvlinesize << s->interlaced_dct;
                        dct_offset =(s->interlaced_dct)? uvlinesize : uvlinesize*8;
2070

B
Benoit Fouet 已提交
2071 2072 2073 2074 2075 2076 2077 2078 2079 2080 2081 2082
                        s->dsp.idct_put(dest_cb,              dct_linesize, block[4]);
                        s->dsp.idct_put(dest_cr,              dct_linesize, block[5]);
                        s->dsp.idct_put(dest_cb + dct_offset, dct_linesize, block[6]);
                        s->dsp.idct_put(dest_cr + dct_offset, dct_linesize, block[7]);
                        if(!s->chroma_x_shift){//Chroma444
                            s->dsp.idct_put(dest_cb + 8,              dct_linesize, block[8]);
                            s->dsp.idct_put(dest_cr + 8,              dct_linesize, block[9]);
                            s->dsp.idct_put(dest_cb + 8 + dct_offset, dct_linesize, block[10]);
                            s->dsp.idct_put(dest_cr + 8 + dct_offset, dct_linesize, block[11]);
                        }
                    }
                }//gray
2083
            }
M
Michael Niedermayer 已提交
2084
        }
B
Benoit Fouet 已提交
2085 2086 2087 2088 2089
skip_idct:
        if(!readable){
            s->dsp.put_pixels_tab[0][0](s->dest[0], dest_y ,   linesize,16);
            s->dsp.put_pixels_tab[s->chroma_x_shift][0](s->dest[1], dest_cb, uvlinesize,16 >> s->chroma_y_shift);
            s->dsp.put_pixels_tab[s->chroma_x_shift][0](s->dest[2], dest_cr, uvlinesize,16 >> s->chroma_y_shift);
2090
        }
M
Michael Niedermayer 已提交
2091 2092 2093
    }
}

B
Benoit Fouet 已提交
2094
/**
 * Reconstruct one macroblock by dispatching to MPV_decode_mb_internal().
 *
 * The two trailing arguments of the internal routine are always passed as
 * literal constants (lowres on/off, MPEG-1/2 output format on/off),
 * presumably so the compiler can specialize each variant -- confirm against
 * the definition of MPV_decode_mb_internal(). With CONFIG_SMALL the
 * MPEG-1/2 specific variants are not instantiated.
 *
 * @param s     codec context
 * @param block coefficient blocks of the current macroblock
 */
void MPV_decode_mb(MpegEncContext *s, DCTELEM block[12][64])
{
#if !CONFIG_SMALL
    if (s->out_format == FMT_MPEG1) {
        if (s->avctx->lowres)
            MPV_decode_mb_internal(s, block, 1, 1);
        else
            MPV_decode_mb_internal(s, block, 0, 1);
        return;
    }
#endif
    if (s->avctx->lowres)
        MPV_decode_mb_internal(s, block, 1, 0);
    else
        MPV_decode_mb_internal(s, block, 0, 0);
}

B
Benoit Fouet 已提交
2105 2106 2107 2108 2109 2110 2111
/**
 * Hand a band of rows to the user supplied draw_horiz_band callback.
 *
 * Nothing happens when the callback is not set, when the band belongs to
 * the first field of a field picture and the user did not allow field
 * slices, or when the previous picture would have to be shown but none
 * exists.
 *
 * @param y first row of the band
 * @param h is the normal height, this will be reduced automatically if needed for the last row
 */
void ff_draw_horiz_band(MpegEncContext *s, int y, int h)
{
    const int field_pic = s->picture_structure != PICT_FRAME;
    const int is_b_pic  = s->pict_type == AV_PICTURE_TYPE_B;
    AVFrame *src;
    int offset[4];

    if (!s->avctx->draw_horiz_band)
        return;

    /* clip the band against the bottom of the (field) picture */
    h = FFMIN(h, (s->avctx->height >> field_pic) - y);

    if (field_pic && !(s->avctx->slice_flags & SLICE_FLAG_ALLOW_FIELD)) {
        /* field slices not allowed: skip the first field and report the
         * band in frame coordinates */
        if (s->first_field)
            return;
        h <<= 1;
        y <<= 1;
    }

    /* pick the picture that is passed to the callback */
    if (is_b_pic || s->low_delay ||
        (s->avctx->slice_flags & SLICE_FLAG_CODED_ORDER)) {
        src = (AVFrame*)s->current_picture_ptr;
    } else {
        if (!s->last_picture_ptr)
            return;
        src = (AVFrame*)s->last_picture_ptr;
    }

    if (is_b_pic && !field_pic && s->out_format != FMT_H264) {
        offset[0] = 0;
        offset[1] = 0;
        offset[2] = 0;
        offset[3] = 0;
    } else {
        offset[0] = y * s->linesize;
        offset[2] = (y >> s->chroma_y_shift) * s->uvlinesize;
        offset[1] = offset[2];
        offset[3] = 0;
    }

    emms_c();

    s->avctx->draw_horiz_band(s->avctx, src, offset,
                              y, s->picture_structure, h);
}
2148

B
Benoit Fouet 已提交
2149 2150 2151 2152
/**
 * Set up s->block_index[] and s->dest[] from s->mb_x / s->mb_y.
 *
 * Both the block indices and the destination pointers are computed for the
 * column to the left of s->mb_x (note the "- 2", "- 1" and "mb_x - 1"
 * terms).
 */
void ff_init_block_index(MpegEncContext *s) //FIXME maybe rename
{
    /* taken from the picture, not s->linesize, as that would be wrong for field pics */
    const int linesize    = s->current_picture.linesize[0];
    const int uvlinesize  = s->current_picture.linesize[1];
    const int mb_size     = 4 - s->avctx->lowres;
    const int frame_pic   = s->picture_structure == PICT_FRAME;
    /* part shared by both chroma block indices */
    const int chroma_base = s->b8_stride*s->mb_height*2 + s->mb_x - 1;

    s->block_index[0] = s->b8_stride*(s->mb_y*2    ) - 2 + s->mb_x*2;
    s->block_index[1] = s->b8_stride*(s->mb_y*2    ) - 1 + s->mb_x*2;
    s->block_index[2] = s->b8_stride*(s->mb_y*2 + 1) - 2 + s->mb_x*2;
    s->block_index[3] = s->b8_stride*(s->mb_y*2 + 1) - 1 + s->mb_x*2;
    s->block_index[4] = s->mb_stride*(s->mb_y + 1)                + chroma_base;
    s->block_index[5] = s->mb_stride*(s->mb_y + s->mb_height + 2) + chroma_base;
    //block_index is not used by mpeg2, so it is not affected by chroma_format

    s->dest[0] = s->current_picture.data[0] + ((s->mb_x - 1) << mb_size);
    s->dest[1] = s->current_picture.data[1] + ((s->mb_x - 1) << (mb_size - s->chroma_x_shift));
    s->dest[2] = s->current_picture.data[2] + ((s->mb_x - 1) << (mb_size - s->chroma_x_shift));

    /* the row offset is left out for B frame pictures when a
     * draw_horiz_band callback is installed */
    if (s->pict_type != AV_PICTURE_TYPE_B || !s->avctx->draw_horiz_band || !frame_pic) {
        int row;

        if (frame_pic) {
            row = s->mb_y;
        } else {
            /* field picture: two macroblock rows share one row of dest */
            row = s->mb_y >> 1;
        }

        s->dest[0] += row *   linesize << mb_size;
        s->dest[1] += row * uvlinesize << (mb_size - s->chroma_y_shift);
        s->dest[2] += row * uvlinesize << (mb_size - s->chroma_y_shift);

        if (!frame_pic)
            assert((s->mb_y&1) == (s->picture_structure == PICT_BOTTOM_FIELD));
    }
}
2180

B
Benoit Fouet 已提交
2181 2182 2183
/**
 * Flush the codec state stored in avctx->priv_data.
 *
 * Frees the buffers of all internally or user allocated pictures, forgets
 * the current/last/next picture pointers and resets the macroblock
 * position, the closed_gop flag, the parse context, the bitstream buffer
 * size and pp_time. Does nothing if there is no context or no picture
 * array.
 */
void ff_mpeg_flush(AVCodecContext *avctx)
{
    MpegEncContext *s = avctx->priv_data;
    int i;

    if (!s || !s->picture)
        return;

    for (i = 0; i < MAX_PICTURE_COUNT; i++) {
        /* skip pictures that do not hold a buffer */
        if (!s->picture[i].data[0])
            continue;
        /* only internal and user buffers are released here */
        if (s->picture[i].type != FF_BUFFER_TYPE_INTERNAL &&
            s->picture[i].type != FF_BUFFER_TYPE_USER)
            continue;
        free_frame_buffer(s, &s->picture[i]);
    }

    s->next_picture_ptr    = NULL;
    s->last_picture_ptr    = NULL;
    s->current_picture_ptr = NULL;

    s->mb_y       = 0;
    s->mb_x       = 0;
    s->closed_gop = 0;

    s->parse_context.state             = -1;
    s->parse_context.frame_start_found = 0;
    s->parse_context.overread          = 0;
    s->parse_context.overread_index    = 0;
    s->parse_context.index             = 0;
    s->parse_context.last_index        = 0;
    s->bitstream_buffer_size           = 0;
    s->pp_time                         = 0;
}

2208
static void dct_unquantize_mpeg1_intra_c(MpegEncContext *s,
2209
                                   DCTELEM *block, int n, int qscale)
F
Fabrice Bellard 已提交
2210
{
M
Michael Niedermayer 已提交
2211
    int i, level, nCoeffs;
2212
    const uint16_t *quant_matrix;
F
Fabrice Bellard 已提交
2213

2214
    nCoeffs= s->block_last_index[n];
2215 2216

    if (n < 4)
2217 2218 2219 2220 2221 2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233
        block[0] = block[0] * s->y_dc_scale;
    else
        block[0] = block[0] * s->c_dc_scale;
    /* XXX: only mpeg1 */
    quant_matrix = s->intra_matrix;
    for(i=1;i<=nCoeffs;i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
                level = (level - 1) | 1;
                level = -level;
            } else {
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
                level = (level - 1) | 1;
F
Fabrice Bellard 已提交
2234
            }
2235
            block[j] = level;
F
Fabrice Bellard 已提交
2236
        }
2237 2238 2239
    }
}

2240
static void dct_unquantize_mpeg1_inter_c(MpegEncContext *s,
2241 2242 2243 2244 2245 2246
                                   DCTELEM *block, int n, int qscale)
{
    int i, level, nCoeffs;
    const uint16_t *quant_matrix;

    nCoeffs= s->block_last_index[n];
2247

2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261 2262
    quant_matrix = s->inter_matrix;
    for(i=0; i<=nCoeffs; i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
                level = (level - 1) | 1;
                level = -level;
            } else {
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
                level = (level - 1) | 1;
F
Fabrice Bellard 已提交
2263
            }
2264
            block[j] = level;
F
Fabrice Bellard 已提交
2265 2266 2267
        }
    }
}
2268

2269
static void dct_unquantize_mpeg2_intra_c(MpegEncContext *s,
2270 2271 2272
                                   DCTELEM *block, int n, int qscale)
{
    int i, level, nCoeffs;
2273
    const uint16_t *quant_matrix;
2274

2275 2276
    if(s->alternate_scan) nCoeffs= 63;
    else nCoeffs= s->block_last_index[n];
2277 2278

    if (n < 4)
2279 2280 2281 2282 2283 2284 2285 2286 2287 2288 2289 2290 2291 2292 2293 2294 2295 2296 2297 2298
        block[0] = block[0] * s->y_dc_scale;
    else
        block[0] = block[0] * s->c_dc_scale;
    quant_matrix = s->intra_matrix;
    for(i=1;i<=nCoeffs;i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
                level = -level;
            } else {
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
            }
            block[j] = level;
        }
    }
}

2299 2300 2301 2302 2303 2304 2305 2306 2307 2308 2309 2310 2311 2312 2313 2314 2315 2316 2317 2318 2319 2320 2321 2322 2323 2324 2325 2326 2327 2328 2329 2330 2331
/**
 * Dequantize an intra block in place (MPEG-2 style) including mismatch
 * control.
 *
 * The DC coefficient is multiplied by y_dc_scale for blocks 0..3 and by
 * c_dc_scale for all other blocks. Every non-zero AC coefficient has its
 * magnitude multiplied by qscale and the intra matrix entry and divided by
 * 8; the sign is kept. With alternate_scan all 63 AC coefficients are
 * visited, otherwise only those up to block_last_index[n].
 *
 * Afterwards the lowest bit of block[63] is toggled if the sum of all
 * reconstructed coefficients is even. The sum has to cover the whole
 * block, so the scaled DC coefficient is part of it as well (the inter
 * variant gets this for free because its loop starts at index 0).
 *
 * @param block  coefficients, modified in place
 * @param n      index of the block inside the macroblock
 * @param qscale quantizer scale
 */
static void dct_unquantize_mpeg2_intra_bitexact(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale)
{
    int i, level, nCoeffs;
    const uint16_t *quant_matrix;
    int sum=-1; /* starting at -1 makes (sum & 1) set for an even total */

    if(s->alternate_scan) nCoeffs= 63;
    else nCoeffs= s->block_last_index[n];

    if (n < 4)
        block[0] = block[0] * s->y_dc_scale;
    else
        block[0] = block[0] * s->c_dc_scale;
    /* the DC coefficient takes part in mismatch control too */
    sum += block[0];

    quant_matrix = s->intra_matrix;
    for(i=1;i<=nCoeffs;i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
                level = -level;
            } else {
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
            }
            block[j] = level;
            sum+=level;
        }
    }
    block[63]^=sum&1;
}

2332
static void dct_unquantize_mpeg2_inter_c(MpegEncContext *s,
2333 2334 2335 2336 2337 2338 2339 2340
                                   DCTELEM *block, int n, int qscale)
{
    int i, level, nCoeffs;
    const uint16_t *quant_matrix;
    int sum=-1;

    if(s->alternate_scan) nCoeffs= 63;
    else nCoeffs= s->block_last_index[n];
2341

2342 2343 2344 2345 2346 2347 2348 2349 2350 2351 2352 2353 2354 2355 2356 2357 2358 2359 2360 2361 2362
    quant_matrix = s->inter_matrix;
    for(i=0; i<=nCoeffs; i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
                level = -level;
            } else {
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
            }
            block[j] = level;
            sum+=level;
        }
    }
    block[63]^=sum&1;
}

2363
static void dct_unquantize_h263_intra_c(MpegEncContext *s,
2364 2365 2366 2367
                                  DCTELEM *block, int n, int qscale)
{
    int i, level, qmul, qadd;
    int nCoeffs;
2368

2369
    assert(s->block_last_index[n]>=0);
2370

2371
    qmul = qscale << 1;
2372

2373
    if (!s->h263_aic) {
2374
        if (n < 4)
2375 2376 2377
            block[0] = block[0] * s->y_dc_scale;
        else
            block[0] = block[0] * s->c_dc_scale;
2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393
        qadd = (qscale - 1) | 1;
    }else{
        qadd = 0;
    }
    if(s->ac_pred)
        nCoeffs=63;
    else
        nCoeffs= s->inter_scantable.raster_end[ s->block_last_index[n] ];

    for(i=1; i<=nCoeffs; i++) {
        level = block[i];
        if (level) {
            if (level < 0) {
                level = level * qmul - qadd;
            } else {
                level = level * qmul + qadd;
2394
            }
2395
            block[i] = level;
2396 2397 2398 2399
        }
    }
}

2400
static void dct_unquantize_h263_inter_c(MpegEncContext *s,
2401 2402 2403
                                  DCTELEM *block, int n, int qscale)
{
    int i, level, qmul, qadd;
M
Michael Niedermayer 已提交
2404
    int nCoeffs;
2405

2406
    assert(s->block_last_index[n]>=0);
2407

2408 2409
    qadd = (qscale - 1) | 1;
    qmul = qscale << 1;
2410

2411
    nCoeffs= s->inter_scantable.raster_end[ s->block_last_index[n] ];
2412

2413
    for(i=0; i<=nCoeffs; i++) {
2414 2415 2416 2417 2418 2419 2420 2421 2422 2423 2424
        level = block[i];
        if (level) {
            if (level < 0) {
                level = level * qmul - qadd;
            } else {
                level = level * qmul + qadd;
            }
            block[i] = level;
        }
    }
}
F
Fabrice Bellard 已提交
2425

2426 2427 2428 2429 2430 2431 2432 2433 2434 2435 2436 2437 2438 2439 2440 2441
/**
 * Set qscale and update the variables that depend on it.
 *
 * The requested value is clamped to the range 1..31 before it is stored.
 * chroma_qscale is looked up from chroma_qscale_table; the luma DC scale
 * is looked up with the clamped qscale, the chroma DC scale with the new
 * chroma_qscale.
 *
 * @param qscale requested quantizer scale
 */
void ff_set_qscale(MpegEncContext * s, int qscale)
{
    const int clamped = qscale < 1  ? 1
                      : qscale > 31 ? 31
                      : qscale;

    s->qscale        = clamped;
    s->chroma_qscale = s->chroma_qscale_table[clamped];

    s->y_dc_scale    = s->y_dc_scale_table[clamped];
    s->c_dc_scale    = s->c_dc_scale_table[s->chroma_qscale];
}