mpegvideo.c 92.2 KB
Newer Older
F
Fabrice Bellard 已提交
1 2
/*
 * The simplest mpeg encoder (well, it was the simplest!)
3
 * Copyright (c) 2000,2001 Fabrice Bellard
4
 * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at>
F
Fabrice Bellard 已提交
5
 *
6 7
 * 4MV & hq & B-frame encoding stuff by Michael Niedermayer <michaelni@gmx.at>
 *
8
 * This file is part of Libav.
9
 *
10
 * Libav is free software; you can redistribute it and/or
F
Fabrice Bellard 已提交
11 12
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
13
 * version 2.1 of the License, or (at your option) any later version.
F
Fabrice Bellard 已提交
14
 *
15
 * Libav is distributed in the hope that it will be useful,
F
Fabrice Bellard 已提交
16
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
F
Fabrice Bellard 已提交
17 18
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
F
Fabrice Bellard 已提交
19
 *
F
Fabrice Bellard 已提交
20
 * You should have received a copy of the GNU Lesser General Public
21
 * License along with Libav; if not, write to the Free Software
22
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
F
Fabrice Bellard 已提交
23
 */
24

M
Michael Niedermayer 已提交
25
/**
26
 * @file
M
Michael Niedermayer 已提交
27
 * The simplest mpeg encoder (well, it was the simplest!).
28 29
 */

30
#include "libavutil/intmath.h"
31
#include "libavutil/imgutils.h"
F
Fabrice Bellard 已提交
32 33
#include "avcodec.h"
#include "dsputil.h"
34
#include "internal.h"
F
Fabrice Bellard 已提交
35
#include "mpegvideo.h"
B
Benoit Fouet 已提交
36
#include "mpegvideo_common.h"
37
#include "mjpegenc.h"
38
#include "msmpeg4.h"
M
Michael Niedermayer 已提交
39
#include "faandct.h"
40
#include "xvmc_internal.h"
41
#include <limits.h>
F
Fabrice Bellard 已提交
42

43 44
//#undef NDEBUG
//#include <assert.h>
45

46
static void dct_unquantize_mpeg1_intra_c(MpegEncContext *s,
47
                                   DCTELEM *block, int n, int qscale);
48
static void dct_unquantize_mpeg1_inter_c(MpegEncContext *s,
49
                                   DCTELEM *block, int n, int qscale);
50 51
static void dct_unquantize_mpeg2_intra_c(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale);
52 53
static void dct_unquantize_mpeg2_intra_bitexact(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale);
54 55
static void dct_unquantize_mpeg2_inter_c(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale);
56
static void dct_unquantize_h263_intra_c(MpegEncContext *s,
57
                                  DCTELEM *block, int n, int qscale);
58
static void dct_unquantize_h263_inter_c(MpegEncContext *s,
59
                                  DCTELEM *block, int n, int qscale);
M
Michael Niedermayer 已提交
60

F
Fabrice Bellard 已提交
61 62 63 64 65 66

/* enable all paranoid tests for rounding, overflows, etc... */
//#define PARANOID

//#define DEBUG

67

M
Michael Niedermayer 已提交
68 69 70 71 72
/* Default chroma qscale mapping: the identity, entry i holds the value i. */
static const uint8_t ff_default_chroma_qscale_table[32] = {
     0,  1,  2,  3,  4,  5,  6,  7,
     8,  9, 10, 11, 12, 13, 14, 15,
    16, 17, 18, 19, 20, 21, 22, 23,
    24, 25, 26, 27, 28, 29, 30, 31,
};

73 74 75 76 77 78 79 80
/* DC scale table holding the constant 8 in each of its 128 entries. */
const uint8_t ff_mpeg1_dc_scale_table[128] = {
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
};

81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104
/* DC scale table holding the constant 4 in each of its 128 entries. */
static const uint8_t mpeg2_dc_scale_table1[128] = {
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
};

/* DC scale table holding the constant 2 in each of its 128 entries. */
static const uint8_t mpeg2_dc_scale_table2[128] = {
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
};

/* DC scale table holding the constant 1 in each of its 128 entries. */
static const uint8_t mpeg2_dc_scale_table3[128] = {
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
};

105
const uint8_t * const ff_mpeg2_dc_scale_table[4]={
106 107 108 109 110 111
    ff_mpeg1_dc_scale_table,
    mpeg2_dc_scale_table1,
    mpeg2_dc_scale_table2,
    mpeg2_dc_scale_table3,
};

112
const enum PixelFormat ff_pixfmt_list_420[] = {
113 114 115 116 117
    PIX_FMT_YUV420P,
    PIX_FMT_NONE
};

const enum PixelFormat ff_hwaccel_pixfmt_list_420[] = {
L
Laurent Aimar 已提交
118
    PIX_FMT_DXVA2_VLD,
119
    PIX_FMT_VAAPI_VLD,
120 121 122
    PIX_FMT_YUV420P,
    PIX_FMT_NONE
};
123

M
Michael Niedermayer 已提交
124 125 126
/**
 * Scan [p, end) for the byte pattern 00 00 01 xx.
 *
 * @param p     first byte to examine
 * @param end   one past the last byte to examine
 * @param state in/out: the most recently seen bytes packed big-endian; on
 *              return it holds the four bytes that precede the returned
 *              pointer (or, if the function returned during the first three
 *              bytes, the shifted-in value)
 * @return pointer just past the byte following a 00 00 01 prefix, or a
 *         pointer clamped to end when no such pattern was found
 */
const uint8_t *ff_find_start_code(const uint8_t * restrict p, const uint8_t *end, uint32_t * restrict state)
{
    int n;

    assert(p <= end);
    if (p >= end)
        return end;

    /* Push the first (up to three) bytes through *state so that a pattern
     * straddling the previous buffer and this one is still detected. */
    for (n = 0; n < 3; n++) {
        const uint32_t shifted = *state << 8;

        *state = shifted + *p;
        p++;
        if (shifted == 0x100 || p == end)
            return p;
    }

    /* Inspect the three bytes before p and skip ahead as far as they allow. */
    while (p < end) {
        if (p[-1] > 1) {
            p += 3;
        } else if (p[-2]) {
            p += 2;
        } else if (p[-3] | (p[-1] - 1)) {
            p++;
        } else {
            /* p[-3..-1] == 00 00 01: step over the byte that follows */
            p++;
            break;
        }
    }

    /* the skipping above may have run past end; clamp before reading back */
    p = FFMIN(p, end) - 4;
    *state = AV_RB32(p);

    return p + 4;
}

154
/* init common dct for both encoder and decoder */
155
av_cold int ff_dct_common_init(MpegEncContext *s)
F
Fabrice Bellard 已提交
156
{
157 158 159 160 161
    s->dct_unquantize_h263_intra = dct_unquantize_h263_intra_c;
    s->dct_unquantize_h263_inter = dct_unquantize_h263_inter_c;
    s->dct_unquantize_mpeg1_intra = dct_unquantize_mpeg1_intra_c;
    s->dct_unquantize_mpeg1_inter = dct_unquantize_mpeg1_inter_c;
    s->dct_unquantize_mpeg2_intra = dct_unquantize_mpeg2_intra_c;
162 163
    if(s->flags & CODEC_FLAG_BITEXACT)
        s->dct_unquantize_mpeg2_intra = dct_unquantize_mpeg2_intra_bitexact;
164
    s->dct_unquantize_mpeg2_inter = dct_unquantize_mpeg2_inter_c;
165

166
#if   HAVE_MMX
167
    MPV_common_init_mmx(s);
168
#elif ARCH_ALPHA
169
    MPV_common_init_axp(s);
170
#elif CONFIG_MLIB
171
    MPV_common_init_mlib(s);
172
#elif HAVE_MMI
173
    MPV_common_init_mmi(s);
174
#elif ARCH_ARM
M
Måns Rullgård 已提交
175
    MPV_common_init_arm(s);
176
#elif HAVE_ALTIVEC
177
    MPV_common_init_altivec(s);
178
#elif ARCH_BFIN
179 180
    MPV_common_init_bfin(s);
#endif
181

182
    /* load & permutate scantables
183
       note: only wmv uses different ones
184
    */
M
Michael Niedermayer 已提交
185 186 187 188 189 190 191
    if(s->alternate_scan){
        ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable  , ff_alternate_vertical_scan);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable  , ff_alternate_vertical_scan);
    }else{
        ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable  , ff_zigzag_direct);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable  , ff_zigzag_direct);
    }
M
Michael Niedermayer 已提交
192 193
    ff_init_scantable(s->dsp.idct_permutation, &s->intra_h_scantable, ff_alternate_horizontal_scan);
    ff_init_scantable(s->dsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
194

195 196 197
    return 0;
}

198
/**
 * Copy *src into *dst by struct assignment (pointers are copied, not the
 * data they point to) and mark the copy as FF_BUFFER_TYPE_COPY.
 */
void ff_copy_picture(Picture *dst, Picture *src)
{
    *dst      = *src;
    dst->type = FF_BUFFER_TYPE_COPY;
}

203
/**
 * Release a frame buffer: hand the picture back through the codec context's
 * release_buffer() callback and free its hwaccel private data.
 */
static void free_frame_buffer(MpegEncContext *s, Picture *pic)
{
    AVFrame *frame = (AVFrame*)pic;

    s->avctx->release_buffer(s->avctx, frame);
    av_freep(&pic->hwaccel_picture_private);
}

/**
 * Allocate a frame buffer
 *
 * Allocates the hwaccel private data when a hwaccel with a non-zero
 * priv_data_size is active, obtains the buffer through get_buffer() and
 * checks the returned strides.
 *
 * @return 0 on success, -1 on failure (nothing stays allocated in that case)
 */
static int alloc_frame_buffer(MpegEncContext *s, Picture *pic)
{
    AVFrame *frame = (AVFrame*)pic;
    int ret;

    if (s->avctx->hwaccel) {
        assert(!pic->hwaccel_picture_private);
        if (s->avctx->hwaccel->priv_data_size) {
            pic->hwaccel_picture_private = av_mallocz(s->avctx->hwaccel->priv_data_size);
            if (pic->hwaccel_picture_private == NULL) {
                av_log(s->avctx, AV_LOG_ERROR, "alloc_frame_buffer() failed (hwaccel private data allocation)\n");
                return -1;
            }
        }
    }

    ret = s->avctx->get_buffer(s->avctx, frame);

    /* a usable buffer needs a non-zero age and type and a first data plane */
    if (ret < 0 || !pic->age || !pic->type || !pic->data[0]) {
        av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed (%d %d %d %p)\n", ret, pic->age, pic->type, pic->data[0]);
        av_freep(&pic->hwaccel_picture_private);
        return -1;
    }

    /* once the context has recorded a stride, later buffers must match it */
    if (s->linesize) {
        if (s->linesize != pic->linesize[0] || s->uvlinesize != pic->linesize[1]) {
            av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed (stride changed)\n");
            free_frame_buffer(s, pic);
            return -1;
        }
    }

    /* both chroma planes have to share one stride */
    if (pic->linesize[2] != pic->linesize[1]) {
        av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed (uv stride mismatch)\n");
        free_frame_buffer(s, pic);
        return -1;
    }

    return 0;
}

M
cleanup  
Michael Niedermayer 已提交
253
/**
M
Michael Niedermayer 已提交
254 255
 * allocates a Picture
 * The pixels are allocated/set by calling get_buffer() if shared=0
M
cleanup  
Michael Niedermayer 已提交
256
 */
257
int ff_alloc_picture(MpegEncContext *s, Picture *pic, int shared){
D
Diego Biurrun 已提交
258
    const int big_mb_num= s->mb_stride*(s->mb_height+1) + 1; //the +1 is needed so memset(,,stride*height) does not sig11
259
    const int mb_array_size= s->mb_stride*s->mb_height;
260 261
    const int b8_array_size= s->b8_stride*s->mb_height*2;
    const int b4_array_size= s->b4_stride*s->mb_height*4;
M
Michael Niedermayer 已提交
262
    int i;
D
Daniel Kristjansson 已提交
263
    int r= -1;
264

M
Michael Niedermayer 已提交
265 266 267 268 269 270
    if(shared){
        assert(pic->data[0]);
        assert(pic->type == 0 || pic->type == FF_BUFFER_TYPE_SHARED);
        pic->type= FF_BUFFER_TYPE_SHARED;
    }else{
        assert(!pic->data[0]);
271

272
        if (alloc_frame_buffer(s, pic) < 0)
M
Michael Niedermayer 已提交
273 274 275 276
            return -1;

        s->linesize  = pic->linesize[0];
        s->uvlinesize= pic->linesize[1];
M
cleanup  
Michael Niedermayer 已提交
277
    }
278

M
Michael Niedermayer 已提交
279
    if(pic->qscale_table==NULL){
280
        if (s->encoding) {
281 282 283
            FF_ALLOCZ_OR_GOTO(s->avctx, pic->mb_var   , mb_array_size * sizeof(int16_t)  , fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, pic->mc_mb_var, mb_array_size * sizeof(int16_t)  , fail)
            FF_ALLOCZ_OR_GOTO(s->avctx, pic->mb_mean  , mb_array_size * sizeof(int8_t )  , fail)
M
Michael Niedermayer 已提交
284
        }
M
cleanup  
Michael Niedermayer 已提交
285

286 287 288
        FF_ALLOCZ_OR_GOTO(s->avctx, pic->mbskip_table , mb_array_size * sizeof(uint8_t)+2, fail) //the +2 is for the slice end check
        FF_ALLOCZ_OR_GOTO(s->avctx, pic->qscale_table , mb_array_size * sizeof(uint8_t)  , fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, pic->mb_type_base , (big_mb_num + s->mb_stride) * sizeof(uint32_t), fail)
289
        pic->mb_type= pic->mb_type_base + 2*s->mb_stride+1;
M
Michael Niedermayer 已提交
290 291
        if(s->out_format == FMT_H264){
            for(i=0; i<2; i++){
292
                FF_ALLOCZ_OR_GOTO(s->avctx, pic->motion_val_base[i], 2 * (b4_array_size+4)  * sizeof(int16_t), fail)
M
Michael Niedermayer 已提交
293
                pic->motion_val[i]= pic->motion_val_base[i]+4;
294
                FF_ALLOCZ_OR_GOTO(s->avctx, pic->ref_index[i], 4*mb_array_size * sizeof(uint8_t), fail)
295
            }
M
Michael Niedermayer 已提交
296
            pic->motion_subsample_log2= 2;
297
        }else if(s->out_format == FMT_H263 || s->encoding || (s->avctx->debug&FF_DEBUG_MV) || (s->avctx->debug_mv)){
298
            for(i=0; i<2; i++){
299
                FF_ALLOCZ_OR_GOTO(s->avctx, pic->motion_val_base[i], 2 * (b8_array_size+4) * sizeof(int16_t), fail)
M
Michael Niedermayer 已提交
300
                pic->motion_val[i]= pic->motion_val_base[i]+4;
301
                FF_ALLOCZ_OR_GOTO(s->avctx, pic->ref_index[i], 4*mb_array_size * sizeof(uint8_t), fail)
M
Michael Niedermayer 已提交
302
            }
M
Michael Niedermayer 已提交
303
            pic->motion_subsample_log2= 3;
M
Michael Niedermayer 已提交
304
        }
305
        if(s->avctx->debug&FF_DEBUG_DCT_COEFF) {
306
            FF_ALLOCZ_OR_GOTO(s->avctx, pic->dct_coeff, 64 * mb_array_size * sizeof(DCTELEM)*6, fail)
307
        }
308
        pic->qstride= s->mb_stride;
309
        FF_ALLOCZ_OR_GOTO(s->avctx, pic->pan_scan , 1 * sizeof(AVPanScan), fail)
M
Michael Niedermayer 已提交
310
    }
M
Michael Niedermayer 已提交
311

D
Diego Biurrun 已提交
312 313
    /* It might be nicer if the application would keep track of these
     * but it would require an API change. */
314
    memmove(s->prev_pict_types+1, s->prev_pict_types, PREV_PICT_TYPES_BUFFER_SIZE-1);
315
    s->prev_pict_types[0]= s->dropable ? FF_B_TYPE : s->pict_type;
316
    if(pic->age < PREV_PICT_TYPES_BUFFER_SIZE && s->prev_pict_types[pic->age] == FF_B_TYPE)
D
Diego Biurrun 已提交
317
        pic->age= INT_MAX; // Skipped MBs in B-frames are quite rare in MPEG-1/2 and it is a bit tricky to skip them anyway.
318

M
cleanup  
Michael Niedermayer 已提交
319
    return 0;
320
fail: //for the FF_ALLOCZ_OR_GOTO macro
D
Daniel Kristjansson 已提交
321
    if(r>=0)
322
        free_frame_buffer(s, pic);
M
cleanup  
Michael Niedermayer 已提交
323 324 325
    return -1;
}

M
Michael Niedermayer 已提交
326 327 328
/**
 * deallocates a picture
 */
M
cleanup  
Michael Niedermayer 已提交
329 330
static void free_picture(MpegEncContext *s, Picture *pic){
    int i;
M
Michael Niedermayer 已提交
331 332

    if(pic->data[0] && pic->type!=FF_BUFFER_TYPE_SHARED){
333
        free_frame_buffer(s, pic);
M
Michael Niedermayer 已提交
334 335
    }

M
cleanup  
Michael Niedermayer 已提交
336 337 338 339 340
    av_freep(&pic->mb_var);
    av_freep(&pic->mc_mb_var);
    av_freep(&pic->mb_mean);
    av_freep(&pic->mbskip_table);
    av_freep(&pic->qscale_table);
M
Michael Niedermayer 已提交
341
    av_freep(&pic->mb_type_base);
342
    av_freep(&pic->dct_coeff);
343
    av_freep(&pic->pan_scan);
M
Michael Niedermayer 已提交
344 345
    pic->mb_type= NULL;
    for(i=0; i<2; i++){
346
        av_freep(&pic->motion_val_base[i]);
M
Michael Niedermayer 已提交
347 348
        av_freep(&pic->ref_index[i]);
    }
349

350
    if(pic->type == FF_BUFFER_TYPE_SHARED){
M
Michael Niedermayer 已提交
351 352 353 354
        for(i=0; i<4; i++){
            pic->base[i]=
            pic->data[i]= NULL;
        }
355
        pic->type= 0;
M
cleanup  
Michael Niedermayer 已提交
356 357 358
    }
}

359
/**
 * Allocate the buffers private to one (thread) context: edge emulation
 * buffer, scratchpads, motion estimation maps, DCT blocks and, for H.263
 * style output, the AC prediction values.
 *
 * @param s    context that receives the buffers
 * @param base unused
 * @return 0 on success, -1 on allocation failure; nothing is freed here
 */
static int init_duplicate_context(MpegEncContext *s, MpegEncContext *base)
{
    const int luma_size   = s->b8_stride * (2 * s->mb_height + 1);
    const int chroma_size = s->mb_stride * (s->mb_height + 1);
    const int total_size  = luma_size + 2 * chroma_size;
    int n;

    // edge emu needs blocksize + filter length - 1 (=17x17 for halfpel / 21x21 for h264)
    // size is (width + edge + align)*interlaced*MBsize*tolerance
    FF_ALLOCZ_OR_GOTO(s->avctx, s->allocated_edge_emu_buffer, (s->width+64)*2*21*2, fail);
    s->edge_emu_buffer = s->allocated_edge_emu_buffer + (s->width+64)*2*21;

    //FIXME should be linesize instead of s->width*2 but that is not known before get_buffer()
    FF_ALLOCZ_OR_GOTO(s->avctx, s->me.scratchpad, (s->width+64)*4*16*2*sizeof(uint8_t), fail);
    /* the remaining scratchpads all live inside me.scratchpad */
    s->obmc_scratchpad = s->me.scratchpad + 16;
    s->b_scratchpad    = s->me.scratchpad;
    s->rd_scratchpad   = s->me.scratchpad;
    s->me.temp         = s->me.scratchpad;

    if (s->encoding) {
        FF_ALLOCZ_OR_GOTO(s->avctx, s->me.map      , ME_MAP_SIZE*sizeof(uint32_t), fail);
        FF_ALLOCZ_OR_GOTO(s->avctx, s->me.score_map, ME_MAP_SIZE*sizeof(uint32_t), fail);
        if (s->avctx->noise_reduction) {
            FF_ALLOCZ_OR_GOTO(s->avctx, s->dct_error_sum, 2 * 64 * sizeof(int), fail);
        }
    }

    FF_ALLOCZ_OR_GOTO(s->avctx, s->blocks, 64*12*2 * sizeof(DCTELEM), fail);
    s->block = s->blocks[0];
    for (n = 0; n < 12; n++)
        s->pblocks[n] = &s->block[n];

    if (s->out_format == FMT_H263) {
        /* ac values */
        FF_ALLOCZ_OR_GOTO(s->avctx, s->ac_val_base, total_size * sizeof(int16_t) * 16, fail);
        s->ac_val[0] = s->ac_val_base + s->b8_stride + 1;
        s->ac_val[1] = s->ac_val_base + luma_size + s->mb_stride + 1;
        s->ac_val[2] = s->ac_val[1] + chroma_size;
    }

    return 0;

fail:
    return -1; //free() through MPV_common_end()
}

/**
 * Free the buffers allocated by init_duplicate_context() and clear the
 * pointers derived from them. A NULL context is accepted and ignored.
 */
static void free_duplicate_context(MpegEncContext *s)
{
    if (!s)
        return;

    av_freep(&s->allocated_edge_emu_buffer);
    s->edge_emu_buffer = NULL;

    av_freep(&s->me.scratchpad);
    /* these pointed into me.scratchpad */
    s->obmc_scratchpad = NULL;
    s->b_scratchpad    = NULL;
    s->rd_scratchpad   = NULL;
    s->me.temp         = NULL;

    av_freep(&s->dct_error_sum);
    av_freep(&s->me.map);
    av_freep(&s->me.score_map);
    av_freep(&s->blocks);
    av_freep(&s->ac_val_base);
    s->block = NULL;    /* pointed into blocks */
}

/**
 * Copy the per-context fields (private buffers, slice range, bit writer and
 * noise reduction statistics) from src to bak, leaving every other field of
 * bak untouched.
 */
static void backup_duplicate_context(MpegEncContext *bak, MpegEncContext *src)
{
    /* edge emulation buffer */
    bak->allocated_edge_emu_buffer = src->allocated_edge_emu_buffer;
    bak->edge_emu_buffer           = src->edge_emu_buffer;

    /* scratchpads */
    bak->me.scratchpad   = src->me.scratchpad;
    bak->me.temp         = src->me.temp;
    bak->rd_scratchpad   = src->rd_scratchpad;
    bak->b_scratchpad    = src->b_scratchpad;
    bak->obmc_scratchpad = src->obmc_scratchpad;

    /* motion estimation maps */
    bak->me.map       = src->me.map;
    bak->me.score_map = src->me.score_map;

    /* DCT blocks */
    bak->blocks = src->blocks;
    bak->block  = src->block;

    /* macroblock row range handled by this context */
    bak->start_mb_y = src->start_mb_y;
    bak->end_mb_y   = src->end_mb_y;

    bak->me.map_generation = src->me.map_generation;
    bak->pb                = src->pb;

    /* noise reduction statistics */
    bak->dct_error_sum = src->dct_error_sum;
    bak->dct_count[0]  = src->dct_count[0];
    bak->dct_count[1]  = src->dct_count[1];

    /* AC prediction values */
    bak->ac_val_base = src->ac_val_base;
    bak->ac_val[0]   = src->ac_val[0];
    bak->ac_val[1]   = src->ac_val[1];
    bak->ac_val[2]   = src->ac_val[2];
}

447
/**
 * Overwrite dst with a copy of src while keeping the fields that
 * backup_duplicate_context() saves (dst's own buffers, slice range, ...),
 * then re-point dst->pblocks at dst's own blocks.
 */
void ff_update_duplicate_context(MpegEncContext *dst, MpegEncContext *src)
{
    MpegEncContext saved;
    int n;

    //FIXME copy only needed parts
    backup_duplicate_context(&saved, dst);   /* stash dst's private fields */
    memcpy(dst, src, sizeof(*dst));
    backup_duplicate_context(dst, &saved);   /* and put them back */

    for (n = 0; n < 12; n++)
        dst->pblocks[n] = &dst->block[n];
    // timing note from the original: about 10k cycles / 0.01 sec for 1000frames on 1ghz with 2 threads
}

M
Michael Niedermayer 已提交
461 462 463 464
/**
 * sets the given MpegEncContext to common defaults (same for encoding and decoding).
 * the changed fields will not depend upon the prior state of the MpegEncContext.
 */
B
Benoit Fouet 已提交
465
void MPV_common_defaults(MpegEncContext *s){
M
Michael Niedermayer 已提交
466 467 468 469 470 471 472 473 474 475 476 477
    s->y_dc_scale_table=
    s->c_dc_scale_table= ff_mpeg1_dc_scale_table;
    s->chroma_qscale_table= ff_default_chroma_qscale_table;
    s->progressive_frame= 1;
    s->progressive_sequence= 1;
    s->picture_structure= PICT_FRAME;

    s->coded_picture_number = 0;
    s->picture_number = 0;
    s->input_picture_number = 0;

    s->picture_in_gop_number = 0;
478 479 480

    s->f_code = 1;
    s->b_code = 1;
M
Michael Niedermayer 已提交
481 482 483 484 485 486 487 488 489 490
}

/**
 * Set the given MpegEncContext to defaults for decoding. The changed fields
 * will not depend upon the prior state of the MpegEncContext.
 * Only the common defaults are applied.
 */
void MPV_decode_defaults(MpegEncContext *s)
{
    MPV_common_defaults(s);
}

491
/**
M
Michael Niedermayer 已提交
492 493 494
 * init common structure for both encoder and decoder.
 * this assumes that some variables like width/height are already set
 */
495
av_cold int MPV_common_init(MpegEncContext *s)
496
{
497
    int y_size, c_size, yc_size, i, mb_array_size, mv_table_size, x, y, threads;
498

499 500
    if(s->codec_id == CODEC_ID_MPEG2VIDEO && !s->progressive_sequence)
        s->mb_height = (s->height + 31) / 32 * 2;
501
    else if (s->codec_id != CODEC_ID_H264)
B
Baptiste Coudurier 已提交
502
        s->mb_height = (s->height + 15) / 16;
L
Loren Merritt 已提交
503

504 505 506 507 508
    if(s->avctx->pix_fmt == PIX_FMT_NONE){
        av_log(s->avctx, AV_LOG_ERROR, "decoding to PIX_FMT_NONE is not supported.\n");
        return -1;
    }

L
Loren Merritt 已提交
509
    if(s->avctx->thread_count > MAX_THREADS || (s->avctx->thread_count > s->mb_height && s->mb_height)){
M
10l  
Michael Niedermayer 已提交
510 511 512 513
        av_log(s->avctx, AV_LOG_ERROR, "too many threads\n");
        return -1;
    }

514
    if((s->width || s->height) && av_image_check_size(s->width, s->height, 0, s->avctx))
515 516
        return -1;

517
    dsputil_init(&s->dsp, s->avctx);
518
    ff_dct_common_init(s);
519

520
    s->flags= s->avctx->flags;
521
    s->flags2= s->avctx->flags2;
522

M
cleanup  
Michael Niedermayer 已提交
523
    s->mb_width  = (s->width  + 15) / 16;
524
    s->mb_stride = s->mb_width + 1;
525 526
    s->b8_stride = s->mb_width*2 + 1;
    s->b4_stride = s->mb_width*4 + 1;
527
    mb_array_size= s->mb_height * s->mb_stride;
M
Michael Niedermayer 已提交
528
    mv_table_size= (s->mb_height+2) * s->mb_stride + 1;
529

530 531 532 533
    /* set chroma shifts */
    avcodec_get_chroma_sub_sample(s->avctx->pix_fmt,&(s->chroma_x_shift),
                                                    &(s->chroma_y_shift) );

534 535 536
    /* set default edge pos, will be overriden in decode_header if needed */
    s->h_edge_pos= s->mb_width*16;
    s->v_edge_pos= s->mb_height*16;
537 538

    s->mb_num = s->mb_width * s->mb_height;
539

540 541 542
    s->block_wrap[0]=
    s->block_wrap[1]=
    s->block_wrap[2]=
543
    s->block_wrap[3]= s->b8_stride;
544
    s->block_wrap[4]=
545
    s->block_wrap[5]= s->mb_stride;
546

547 548
    y_size = s->b8_stride * (2 * s->mb_height + 1);
    c_size = s->mb_stride * (s->mb_height + 1);
549
    yc_size = y_size + 2 * c_size;
550

551
    /* convert fourcc to upper case */
552 553 554
    s->codec_tag = ff_toupper4(s->avctx->codec_tag);

    s->stream_codec_tag = ff_toupper4(s->avctx->stream_codec_tag);
555

M
Michael Niedermayer 已提交
556
    s->avctx->coded_frame= (AVFrame*)&s->current_picture;
M
cleanup  
Michael Niedermayer 已提交
557

558
    FF_ALLOCZ_OR_GOTO(s->avctx, s->mb_index2xy, (s->mb_num+1)*sizeof(int), fail) //error ressilience code looks cleaner with this
559 560 561 562 563 564
    for(y=0; y<s->mb_height; y++){
        for(x=0; x<s->mb_width; x++){
            s->mb_index2xy[ x + y*s->mb_width ] = x + y*s->mb_stride;
        }
    }
    s->mb_index2xy[ s->mb_height*s->mb_width ] = (s->mb_height-1)*s->mb_stride + s->mb_width; //FIXME really needed?
565

566
    if (s->encoding) {
567
        /* Allocate MV tables */
568 569 570 571 572 573
        FF_ALLOCZ_OR_GOTO(s->avctx, s->p_mv_table_base            , mv_table_size * 2 * sizeof(int16_t), fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, s->b_forw_mv_table_base       , mv_table_size * 2 * sizeof(int16_t), fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, s->b_back_mv_table_base       , mv_table_size * 2 * sizeof(int16_t), fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, s->b_bidir_forw_mv_table_base , mv_table_size * 2 * sizeof(int16_t), fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, s->b_bidir_back_mv_table_base , mv_table_size * 2 * sizeof(int16_t), fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, s->b_direct_mv_table_base     , mv_table_size * 2 * sizeof(int16_t), fail)
574 575 576 577 578 579
        s->p_mv_table           = s->p_mv_table_base            + s->mb_stride + 1;
        s->b_forw_mv_table      = s->b_forw_mv_table_base       + s->mb_stride + 1;
        s->b_back_mv_table      = s->b_back_mv_table_base       + s->mb_stride + 1;
        s->b_bidir_forw_mv_table= s->b_bidir_forw_mv_table_base + s->mb_stride + 1;
        s->b_bidir_back_mv_table= s->b_bidir_back_mv_table_base + s->mb_stride + 1;
        s->b_direct_mv_table    = s->b_direct_mv_table_base     + s->mb_stride + 1;
580

581
        if(s->msmpeg4_version){
582
            FF_ALLOCZ_OR_GOTO(s->avctx, s->ac_stats, 2*2*(MAX_LEVEL+1)*(MAX_RUN+1)*2*sizeof(int), fail);
583
        }
584
        FF_ALLOCZ_OR_GOTO(s->avctx, s->avctx->stats_out, 256, fail);
585 586

        /* Allocate MB type table */
587
        FF_ALLOCZ_OR_GOTO(s->avctx, s->mb_type  , mb_array_size * sizeof(uint16_t), fail) //needed for encoding
588

589
        FF_ALLOCZ_OR_GOTO(s->avctx, s->lambda_table, mb_array_size * sizeof(int), fail)
590

591 592 593 594 595 596
        FF_ALLOCZ_OR_GOTO(s->avctx, s->q_intra_matrix  , 64*32   * sizeof(int), fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, s->q_inter_matrix  , 64*32   * sizeof(int), fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, s->q_intra_matrix16, 64*32*2 * sizeof(uint16_t), fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, s->q_inter_matrix16, 64*32*2 * sizeof(uint16_t), fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, s->input_picture, MAX_PICTURE_COUNT * sizeof(Picture*), fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, s->reordered_input_picture, MAX_PICTURE_COUNT * sizeof(Picture*), fail)
597

598
        if(s->avctx->noise_reduction){
599
            FF_ALLOCZ_OR_GOTO(s->avctx, s->dct_offset, 2 * 64 * sizeof(uint16_t), fail)
600
        }
601
    }
602
    FF_ALLOCZ_OR_GOTO(s->avctx, s->picture, MAX_PICTURE_COUNT * sizeof(Picture), fail)
603 604 605
    for(i = 0; i < MAX_PICTURE_COUNT; i++) {
        avcodec_get_frame_defaults((AVFrame *)&s->picture[i]);
    }
606

607
    FF_ALLOCZ_OR_GOTO(s->avctx, s->error_status_table, mb_array_size*sizeof(uint8_t), fail)
608

M
Michael Niedermayer 已提交
609
    if(s->codec_id==CODEC_ID_MPEG4 || (s->flags & CODEC_FLAG_INTERLACED_ME)){
610
        /* interlaced direct mode decoding tables */
M
Michael Niedermayer 已提交
611 612 613 614
            for(i=0; i<2; i++){
                int j, k;
                for(j=0; j<2; j++){
                    for(k=0; k<2; k++){
615 616
                        FF_ALLOCZ_OR_GOTO(s->avctx,    s->b_field_mv_table_base[i][j][k], mv_table_size * 2 * sizeof(int16_t), fail)
                        s->b_field_mv_table[i][j][k] = s->b_field_mv_table_base[i][j][k] + s->mb_stride + 1;
M
Michael Niedermayer 已提交
617
                    }
618 619 620
                    FF_ALLOCZ_OR_GOTO(s->avctx, s->b_field_select_table [i][j], mb_array_size * 2 * sizeof(uint8_t), fail)
                    FF_ALLOCZ_OR_GOTO(s->avctx, s->p_field_mv_table_base[i][j], mv_table_size * 2 * sizeof(int16_t), fail)
                    s->p_field_mv_table[i][j] = s->p_field_mv_table_base[i][j]+ s->mb_stride + 1;
M
Michael Niedermayer 已提交
621
                }
622
                FF_ALLOCZ_OR_GOTO(s->avctx, s->p_field_select_table[i], mb_array_size * 2 * sizeof(uint8_t), fail)
M
Michael Niedermayer 已提交
623
            }
F
Fabrice Bellard 已提交
624
    }
M
Michael Niedermayer 已提交
625
    if (s->out_format == FMT_H263) {
F
Fabrice Bellard 已提交
626
        /* cbp values */
627
        FF_ALLOCZ_OR_GOTO(s->avctx, s->coded_block_base, y_size, fail);
628
        s->coded_block= s->coded_block_base + s->b8_stride + 1;
629

630
        /* cbp, ac_pred, pred_dir */
631 632
        FF_ALLOCZ_OR_GOTO(s->avctx, s->cbp_table     , mb_array_size * sizeof(uint8_t), fail)
        FF_ALLOCZ_OR_GOTO(s->avctx, s->pred_dir_table, mb_array_size * sizeof(uint8_t), fail)
633
    }
634

635 636 637
    if (s->h263_pred || s->h263_plus || !s->encoding) {
        /* dc values */
        //MN: we need these for error resilience of intra-frames
638
        FF_ALLOCZ_OR_GOTO(s->avctx, s->dc_val_base, yc_size * sizeof(int16_t), fail);
639 640
        s->dc_val[0] = s->dc_val_base + s->b8_stride + 1;
        s->dc_val[1] = s->dc_val_base + y_size + s->mb_stride + 1;
641 642
        s->dc_val[2] = s->dc_val[1] + c_size;
        for(i=0;i<yc_size;i++)
643
            s->dc_val_base[i] = 1024;
644 645
    }

646
    /* which mb is a intra block */
647
    FF_ALLOCZ_OR_GOTO(s->avctx, s->mbintra_table, mb_array_size, fail);
648
    memset(s->mbintra_table, 1, mb_array_size);
649

650
    /* init macroblock skip table */
651
    FF_ALLOCZ_OR_GOTO(s->avctx, s->mbskip_table, mb_array_size+2, fail);
652
    //Note the +1 is for a quicker mpeg4 slice_end detection
653
    FF_ALLOCZ_OR_GOTO(s->avctx, s->prev_pict_types, PREV_PICT_TYPES_BUFFER_SIZE, fail);
654

655
    s->parse_context.state= -1;
656 657
    if((s->avctx->debug&(FF_DEBUG_VIS_QP|FF_DEBUG_VIS_MB_TYPE)) || (s->avctx->debug_mv)){
       s->visualization_buffer[0] = av_malloc((s->mb_width*16 + 2*EDGE_WIDTH) * s->mb_height*16 + 2*EDGE_WIDTH);
658 659
       s->visualization_buffer[1] = av_malloc((s->mb_width*16 + 2*EDGE_WIDTH) * s->mb_height*16 + 2*EDGE_WIDTH);
       s->visualization_buffer[2] = av_malloc((s->mb_width*16 + 2*EDGE_WIDTH) * s->mb_height*16 + 2*EDGE_WIDTH);
660
    }
661

F
Fabrice Bellard 已提交
662
    s->context_initialized = 1;
663 664

    s->thread_context[0]= s;
665
    threads = s->avctx->thread_count;
666 667

    for(i=1; i<threads; i++){
668 669 670 671
        s->thread_context[i]= av_malloc(sizeof(MpegEncContext));
        memcpy(s->thread_context[i], s, sizeof(MpegEncContext));
    }

672
    for(i=0; i<threads; i++){
673 674 675 676 677 678
        if(init_duplicate_context(s->thread_context[i], s) < 0)
           goto fail;
        s->thread_context[i]->start_mb_y= (s->mb_height*(i  ) + s->avctx->thread_count/2) / s->avctx->thread_count;
        s->thread_context[i]->end_mb_y  = (s->mb_height*(i+1) + s->avctx->thread_count/2) / s->avctx->thread_count;
    }

F
Fabrice Bellard 已提交
679 680
    return 0;
 fail:
681
    MPV_common_end(s);
F
Fabrice Bellard 已提交
682 683 684 685 686 687
    return -1;
}

/* free common structure for both encoder and decoder */
void MPV_common_end(MpegEncContext *s)
{
M
Michael Niedermayer 已提交
688
    int i, j, k;
F
Fabrice Bellard 已提交
689

690 691 692 693 694 695 696
    for(i=0; i<s->avctx->thread_count; i++){
        free_duplicate_context(s->thread_context[i]);
    }
    for(i=1; i<s->avctx->thread_count; i++){
        av_freep(&s->thread_context[i]);
    }

697 698 699
    av_freep(&s->parse_context.buffer);
    s->parse_context.buffer_size=0;

700
    av_freep(&s->mb_type);
701 702 703 704 705 706 707 708 709 710 711 712
    av_freep(&s->p_mv_table_base);
    av_freep(&s->b_forw_mv_table_base);
    av_freep(&s->b_back_mv_table_base);
    av_freep(&s->b_bidir_forw_mv_table_base);
    av_freep(&s->b_bidir_back_mv_table_base);
    av_freep(&s->b_direct_mv_table_base);
    s->p_mv_table= NULL;
    s->b_forw_mv_table= NULL;
    s->b_back_mv_table= NULL;
    s->b_bidir_forw_mv_table= NULL;
    s->b_bidir_back_mv_table= NULL;
    s->b_direct_mv_table= NULL;
M
Michael Niedermayer 已提交
713 714 715 716 717 718 719 720 721 722 723 724
    for(i=0; i<2; i++){
        for(j=0; j<2; j++){
            for(k=0; k<2; k++){
                av_freep(&s->b_field_mv_table_base[i][j][k]);
                s->b_field_mv_table[i][j][k]=NULL;
            }
            av_freep(&s->b_field_select_table[i][j]);
            av_freep(&s->p_field_mv_table_base[i][j]);
            s->p_field_mv_table[i][j]=NULL;
        }
        av_freep(&s->p_field_select_table[i]);
    }
725

726 727
    av_freep(&s->dc_val_base);
    av_freep(&s->coded_block_base);
728
    av_freep(&s->mbintra_table);
729 730
    av_freep(&s->cbp_table);
    av_freep(&s->pred_dir_table);
731

732
    av_freep(&s->mbskip_table);
733
    av_freep(&s->prev_pict_types);
734
    av_freep(&s->bitstream_buffer);
735 736
    s->allocated_bitstream_buffer_size=0;

M
Michael Niedermayer 已提交
737
    av_freep(&s->avctx->stats_out);
738
    av_freep(&s->ac_stats);
739
    av_freep(&s->error_status_table);
740
    av_freep(&s->mb_index2xy);
741
    av_freep(&s->lambda_table);
742 743
    av_freep(&s->q_intra_matrix);
    av_freep(&s->q_inter_matrix);
744 745
    av_freep(&s->q_intra_matrix16);
    av_freep(&s->q_inter_matrix16);
746 747
    av_freep(&s->input_picture);
    av_freep(&s->reordered_input_picture);
748
    av_freep(&s->dct_offset);
M
cleanup  
Michael Niedermayer 已提交
749

M
Michael Niedermayer 已提交
750 751 752 753
    if(s->picture){
        for(i=0; i<MAX_PICTURE_COUNT; i++){
            free_picture(s, &s->picture[i]);
        }
F
Fabrice Bellard 已提交
754
    }
755
    av_freep(&s->picture);
F
Fabrice Bellard 已提交
756
    s->context_initialized = 0;
757 758 759
    s->last_picture_ptr=
    s->next_picture_ptr=
    s->current_picture_ptr= NULL;
M
Michael Niedermayer 已提交
760
    s->linesize= s->uvlinesize= 0;
761

762
    for(i=0; i<3; i++)
763
        av_freep(&s->visualization_buffer[i]);
M
Michael Niedermayer 已提交
764 765

    avcodec_default_free_buffers(s->avctx);
F
Fabrice Bellard 已提交
766 767
}

768
/**
 * Build the max_level[], max_run[] and index_run[] lookup tables of a
 * run/level table, once for the "not last" codes and once for the "last"
 * codes.
 *
 * @param rl           table to complete; table_run, table_level, n and last
 *                     are read, max_level/max_run/index_run are written
 * @param static_store backing storage for the generated tables, or NULL to
 *                     allocate them with av_malloc(). With static storage the
 *                     call is a no-op once rl->max_level[0] is set.
 */
void init_rl(RLTable *rl, uint8_t static_store[2][2*MAX_RUN + MAX_LEVEL + 3])
{
    int8_t  level_max[MAX_RUN + 1];
    int8_t  run_max[MAX_LEVEL + 1];
    uint8_t first_index[MAX_RUN + 1];
    int last;

    /* a static table that has already been filled needs no further work */
    if (static_store && rl->max_level[0])
        return;

    for (last = 0; last < 2; last++) {
        /* codes [0, rl->last) are "not last", [rl->last, rl->n) are "last" */
        const int first = last ? rl->last : 0;
        const int limit = last ? rl->n    : rl->last;
        int idx;

        memset(level_max,   0,     sizeof(level_max));
        memset(run_max,     0,     sizeof(run_max));
        /* rl->n marks "no code seen for this run yet" */
        memset(first_index, rl->n, sizeof(first_index));

        for (idx = first; idx < limit; idx++) {
            const int run   = rl->table_run[idx];
            const int level = rl->table_level[idx];

            if (first_index[run] == rl->n)
                first_index[run] = idx;
            if (level > level_max[run])
                level_max[run] = level;
            if (run > run_max[level])
                run_max[level] = run;
        }

        /* static layout: max_level | max_run | index_run, back to back */
        if (static_store) {
            rl->max_level[last] = static_store[last];
        } else {
            rl->max_level[last] = av_malloc(MAX_RUN + 1);
        }
        memcpy(rl->max_level[last], level_max, sizeof(level_max));

        if (static_store) {
            rl->max_run[last] = static_store[last] + MAX_RUN + 1;
        } else {
            rl->max_run[last] = av_malloc(MAX_LEVEL + 1);
        }
        memcpy(rl->max_run[last], run_max, sizeof(run_max));

        if (static_store) {
            rl->index_run[last] = static_store[last] + MAX_RUN + MAX_LEVEL + 2;
        } else {
            rl->index_run[last] = av_malloc(MAX_RUN + 1);
        }
        memcpy(rl->index_run[last], first_index, sizeof(first_index));
    }
}

819
/**
 * Fill rl->rl_vlc[q][] for the 32 values of q with (len, level, run) entries
 * derived from rl->vlc.table.
 *
 * For regular codes the level is stored as table_level * qmul + qadd, where
 * qmul = 2*q and qadd = (q-1)|1, except for q == 0 which uses qmul = 1 and
 * qadd = 0.
 */
void init_vlc_rl(RLTable *rl)
{
    int i, q;

    for (q = 0; q < 32; q++) {
        const int qmul = q ? 2 * q       : 1;
        const int qadd = q ? (q - 1) | 1 : 0;

        for (i = 0; i < rl->vlc.table_size; i++) {
            const int code = rl->vlc.table[i][0];
            const int len  = rl->vlc.table[i][1];
            int level, run;

            if (len < 0) {
                /* more bits needed */
                run   = 0;
                level = code;
            } else if (len == 0) {
                /* illegal code */
                run   = 66;
                level = MAX_LEVEL;
            } else if (code == rl->n) {
                /* escape */
                run   = 66;
                level = 0;
            } else {
                run = rl->table_run[code] + 1;
                if (code >= rl->last)
                    run += 192;
                level = rl->table_level[code] * qmul + qadd;
            }

            rl->rl_vlc[q][i].len   = len;
            rl->rl_vlc[q][i].level = level;
            rl->rl_vlc[q][i].run   = run;
        }
    }
}

M
Michael Niedermayer 已提交
859
/**
 * Find a slot of s->picture[] whose data[0] is NULL.
 *
 * @param s      context owning the picture array
 * @param shared if non-zero only slots with type == 0 are accepted; otherwise
 *               slots with a non-zero type are preferred and any slot with
 *               data[0] == NULL is used as a fallback
 * @return index of the free slot; the process is aborted if there is none
 */
int ff_find_unused_picture(MpegEncContext *s, int shared){
    int idx;

    if (!shared) {
        for (idx = 0; idx < MAX_PICTURE_COUNT; idx++) {
            if (!s->picture[idx].data[0] && s->picture[idx].type)
                return idx; //FIXME
        }
        for (idx = 0; idx < MAX_PICTURE_COUNT; idx++) {
            if (!s->picture[idx].data[0])
                return idx;
        }
    } else {
        for (idx = 0; idx < MAX_PICTURE_COUNT; idx++) {
            if (!s->picture[idx].data[0] && !s->picture[idx].type)
                return idx;
        }
    }

    av_log(s->avctx, AV_LOG_FATAL, "Internal error, picture buffer overflow\n");
    /* Returning -1 would be possible, but the codec would then crash while
     * drawing into a frame that does not exist; aborting right here is safer
     * than waiting for a random crash later.
     * The return value would not be useful anyway: an encoder must only
     * allocate as many pictures as the specification allows, which is
     * unrelated to how many libavcodec could allocate (MAX_PICTURE_COUNT is
     * always large enough for valid streams).
     * A decoder in turn has to check stream validity and drop frames when too
     * many reference frames are around; waiting for "OOM" is not correct.
     * Likewise, missing reference frames have to be replaced by
     * interpolated/MC frames; anything else is a bug in the codec.
     */
    abort();
    return -1;
}

891 892 893 894 895 896 897 898 899 900
/**
 * Recompute s->dct_offset[][] from the accumulated DCT error statistics.
 *
 * For each of the two tables (index "intra" 0 and 1): once dct_count exceeds
 * 1<<16, the count and all 64 error sums are halved; afterwards every offset
 * is set to
 *   (noise_reduction * dct_count + error_sum/2) / (error_sum + 1).
 */
static void update_noise_reduction(MpegEncContext *s){
    int intra;

    for (intra = 0; intra < 2; intra++) {
        /* decide once per table whether the statistics get halved */
        const int decay = s->dct_count[intra] > (1 << 16);
        int coef;

        if (decay)
            s->dct_count[intra] >>= 1;

        for (coef = 0; coef < 64; coef++) {
            if (decay)
                s->dct_error_sum[intra][coef] >>= 1;

            s->dct_offset[intra][coef] =
                (s->avctx->noise_reduction * s->dct_count[intra] +
                 s->dct_error_sum[intra][coef] / 2) /
                (s->dct_error_sum[intra][coef] + 1);
        }
    }
}

M
Michael Niedermayer 已提交
908 909 910
/**
 * generic function for encode/decode called after coding/decoding the header and before a frame is coded/decoded
 */
911
int MPV_frame_start(MpegEncContext *s, AVCodecContext *avctx)
F
Fabrice Bellard 已提交
912
{
M
Michael Niedermayer 已提交
913
    int i;
914
    Picture *pic;
915
    s->mb_skipped = 0;
M
Michael Niedermayer 已提交
916

M
Michael Niedermayer 已提交
917
    assert(s->last_picture_ptr==NULL || s->out_format != FMT_H264 || s->codec_id == CODEC_ID_SVQ3);
M
Michael Niedermayer 已提交
918

M
cleanup  
Michael Niedermayer 已提交
919
    /* mark&release old frames */
920
    if (s->pict_type != FF_B_TYPE && s->last_picture_ptr && s->last_picture_ptr != s->next_picture_ptr && s->last_picture_ptr->data[0]) {
921
      if(s->out_format != FMT_H264 || s->codec_id == CODEC_ID_SVQ3){
922
          free_frame_buffer(s, s->last_picture_ptr);
M
cleanup  
Michael Niedermayer 已提交
923 924 925 926 927

        /* release forgotten pictures */
        /* if(mpeg124/h263) */
        if(!s->encoding){
            for(i=0; i<MAX_PICTURE_COUNT; i++){
M
Michael Niedermayer 已提交
928
                if(s->picture[i].data[0] && &s->picture[i] != s->next_picture_ptr && s->picture[i].reference){
929
                    av_log(avctx, AV_LOG_ERROR, "releasing zombie picture\n");
930
                    free_frame_buffer(s, &s->picture[i]);
M
cleanup  
Michael Niedermayer 已提交
931 932
                }
            }
933
        }
934
      }
935
    }
936

937
    if(!s->encoding){
D
Diego Biurrun 已提交
938
        /* release non reference frames */
M
Michael Niedermayer 已提交
939 940
        for(i=0; i<MAX_PICTURE_COUNT; i++){
            if(s->picture[i].data[0] && !s->picture[i].reference /*&& s->picture[i].type!=FF_BUFFER_TYPE_SHARED*/){
941
                free_frame_buffer(s, &s->picture[i]);
M
Michael Niedermayer 已提交
942 943 944
            }
        }

M
Michael Niedermayer 已提交
945
        if(s->current_picture_ptr && s->current_picture_ptr->data[0]==NULL)
946
            pic= s->current_picture_ptr; //we already have a unused image (maybe it was set before reading the header)
M
Michael Niedermayer 已提交
947 948
        else{
            i= ff_find_unused_picture(s, 0);
949
            pic= &s->picture[i];
M
Michael Niedermayer 已提交
950 951
        }

952 953 954 955
        pic->reference= 0;
        if (!s->dropable){
            if (s->codec_id == CODEC_ID_H264)
                pic->reference = s->picture_structure;
956
            else if (s->pict_type != FF_B_TYPE)
957 958
                pic->reference = 3;
        }
M
Michael Niedermayer 已提交
959

M
Michael Niedermayer 已提交
960
        pic->coded_picture_number= s->coded_picture_number++;
961

962
        if(ff_alloc_picture(s, pic, 0) < 0)
963
            return -1;
964

965
        s->current_picture_ptr= pic;
966
        //FIXME use only the vars from current_pic
967
        s->current_picture_ptr->top_field_first= s->top_field_first;
968
        if(s->codec_id == CODEC_ID_MPEG1VIDEO || s->codec_id == CODEC_ID_MPEG2VIDEO) {
969
            if(s->picture_structure != PICT_FRAME)
970
                s->current_picture_ptr->top_field_first= (s->picture_structure == PICT_TOP_FIELD) == s->first_field;
971
        }
972
        s->current_picture_ptr->interlaced_frame= !s->progressive_frame && !s->progressive_sequence;
M
cleanup  
Michael Niedermayer 已提交
973
    }
974

M
Michael Niedermayer 已提交
975
    s->current_picture_ptr->pict_type= s->pict_type;
976
//    if(s->flags && CODEC_FLAG_QSCALE)
977
  //      s->current_picture_ptr->quality= s->new_picture_ptr->quality;
978
    s->current_picture_ptr->key_frame= s->pict_type == FF_I_TYPE;
M
Michael Niedermayer 已提交
979

980
    ff_copy_picture(&s->current_picture, s->current_picture_ptr);
981

982
    if (s->pict_type != FF_B_TYPE) {
M
Michael Niedermayer 已提交
983
        s->last_picture_ptr= s->next_picture_ptr;
984 985
        if(!s->dropable)
            s->next_picture_ptr= s->current_picture_ptr;
F
Fabrice Bellard 已提交
986
    }
987
/*    av_log(s->avctx, AV_LOG_DEBUG, "L%p N%p C%p L%p N%p C%p type:%d drop:%d\n", s->last_picture_ptr, s->next_picture_ptr,s->current_picture_ptr,
988 989
        s->last_picture_ptr    ? s->last_picture_ptr->data[0] : NULL,
        s->next_picture_ptr    ? s->next_picture_ptr->data[0] : NULL,
990 991
        s->current_picture_ptr ? s->current_picture_ptr->data[0] : NULL,
        s->pict_type, s->dropable);*/
992

993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010
    if(s->codec_id != CODEC_ID_H264){
        if((s->last_picture_ptr==NULL || s->last_picture_ptr->data[0]==NULL) && s->pict_type!=FF_I_TYPE){
            av_log(avctx, AV_LOG_ERROR, "warning: first frame is no keyframe\n");
            /* Allocate a dummy frame */
            i= ff_find_unused_picture(s, 0);
            s->last_picture_ptr= &s->picture[i];
            if(ff_alloc_picture(s, s->last_picture_ptr, 0) < 0)
                return -1;
        }
        if((s->next_picture_ptr==NULL || s->next_picture_ptr->data[0]==NULL) && s->pict_type==FF_B_TYPE){
            /* Allocate a dummy frame */
            i= ff_find_unused_picture(s, 0);
            s->next_picture_ptr= &s->picture[i];
            if(ff_alloc_picture(s, s->next_picture_ptr, 0) < 0)
                return -1;
        }
    }

1011 1012
    if(s->last_picture_ptr) ff_copy_picture(&s->last_picture, s->last_picture_ptr);
    if(s->next_picture_ptr) ff_copy_picture(&s->next_picture, s->next_picture_ptr);
1013

1014
    assert(s->pict_type == FF_I_TYPE || (s->last_picture_ptr && s->last_picture_ptr->data[0]));
1015

1016
    if(s->picture_structure!=PICT_FRAME && s->out_format != FMT_H264){
M
Michael Niedermayer 已提交
1017 1018 1019 1020
        int i;
        for(i=0; i<4; i++){
            if(s->picture_structure == PICT_BOTTOM_FIELD){
                 s->current_picture.data[i] += s->current_picture.linesize[i];
1021
            }
M
Michael Niedermayer 已提交
1022 1023 1024 1025 1026
            s->current_picture.linesize[i] *= 2;
            s->last_picture.linesize[i] *=2;
            s->next_picture.linesize[i] *=2;
        }
    }
1027

1028
    s->error_recognition= avctx->error_recognition;
1029

D
Diego Biurrun 已提交
1030
    /* set dequantizer, we can't do it during init as it might change for mpeg4
D
Diego Biurrun 已提交
1031
       and we can't do it in the header decode as init is not called for mpeg4 there yet */
1032 1033 1034
    if(s->mpeg_quant || s->codec_id == CODEC_ID_MPEG2VIDEO){
        s->dct_unquantize_intra = s->dct_unquantize_mpeg2_intra;
        s->dct_unquantize_inter = s->dct_unquantize_mpeg2_inter;
M
Maarten Daniels 已提交
1035
    }else if(s->out_format == FMT_H263 || s->out_format == FMT_H261){
1036 1037 1038 1039 1040 1041
        s->dct_unquantize_intra = s->dct_unquantize_h263_intra;
        s->dct_unquantize_inter = s->dct_unquantize_h263_inter;
    }else{
        s->dct_unquantize_intra = s->dct_unquantize_mpeg1_intra;
        s->dct_unquantize_inter = s->dct_unquantize_mpeg1_inter;
    }
1042

1043 1044 1045 1046 1047
    if(s->dct_error_sum){
        assert(s->avctx->noise_reduction && s->encoding);

        update_noise_reduction(s);
    }
1048

1049
    if(CONFIG_MPEG_XVMC_DECODER && s->avctx->xvmc_acceleration)
1050
        return ff_xvmc_field_start(s, avctx);
1051

1052
    return 0;
F
Fabrice Bellard 已提交
1053
}
1054

F
Fabrice Bellard 已提交
1055 1056 1057
/**
 * Generic function for encode/decode, called after a frame has been
 * coded/decoded.
 *
 * Ends the XvMC field or draws the picture edges, records the picture type
 * and quality of the finished frame, releases non-reference frame buffers
 * when encoding and publishes the current picture as avctx->coded_frame.
 */
void MPV_frame_end(MpegEncContext *s)
{
    int i;

    if (CONFIG_MPEG_XVMC_DECODER && s->avctx->xvmc_acceleration) {
        /* just to make sure that all data is rendered */
        ff_xvmc_field_end(s);
    } else if (!(s->avctx->hwaccel ||
                 (s->avctx->codec->capabilities & CODEC_CAP_HWACCEL_VDPAU) ||
                 !s->unrestricted_mv ||
                 !s->current_picture.reference ||
                 s->intra_only ||
                 (s->flags & CODEC_FLAG_EMU_EDGE))) {
        /* draw edge for correct motion prediction if outside;
         * plane 0 uses the full sizes, planes 1 and 2 the halved ones */
        for (i = 0; i < 3; i++) {
            const int is_chroma = i > 0;

            s->dsp.draw_edges(s->current_picture.data[i],
                              is_chroma ? s->uvlinesize : s->linesize,
                              s->h_edge_pos >> is_chroma,
                              s->v_edge_pos >> is_chroma,
                              is_chroma ? EDGE_WIDTH / 2 : EDGE_WIDTH,
                              EDGE_TOP | EDGE_BOTTOM);
        }
    }
    emms_c();

    s->last_pict_type                = s->pict_type;
    s->last_lambda_for[s->pict_type] = s->current_picture_ptr->quality;
    if (s->pict_type != FF_B_TYPE)
        s->last_non_b_pict_type = s->pict_type;

    if (s->encoding) {
        /* release non-reference frames */
        for (i = 0; i < MAX_PICTURE_COUNT; i++) {
            if (s->picture[i].data[0] && !s->picture[i].reference)
                free_frame_buffer(s, &s->picture[i]);
        }
    }

    s->avctx->coded_frame = (AVFrame*)s->current_picture_ptr;
}

1114 1115 1116 1117 1118 1119 1120 1121
/**
 * draws an line from (ex, ey) -> (sx, sy).
 * @param w width of the image
 * @param h height of the image
 * @param stride stride/linesize of the image
 * @param color color of the arrow
 */
static void draw_line(uint8_t *buf, int sx, int sy, int ex, int ey, int w, int h, int stride, int color){
M
SWAP  
Michael Niedermayer 已提交
1122
    int x, y, fr, f;
1123

1124 1125 1126 1127
    sx= av_clip(sx, 0, w-1);
    sy= av_clip(sy, 0, h-1);
    ex= av_clip(ex, 0, w-1);
    ey= av_clip(ey, 0, h-1);
1128

1129
    buf[sy*stride + sx]+= color;
1130

D
Diego Biurrun 已提交
1131
    if(FFABS(ex - sx) > FFABS(ey - sy)){
1132
        if(sx > ex){
D
Diego Biurrun 已提交
1133 1134
            FFSWAP(int, sx, ex);
            FFSWAP(int, sy, ey);
1135 1136 1137 1138 1139
        }
        buf+= sx + sy*stride;
        ex-= sx;
        f= ((ey-sy)<<16)/ex;
        for(x= 0; x <= ex; x++){
1140 1141 1142 1143
            y = (x*f)>>16;
            fr= (x*f)&0xFFFF;
            buf[ y   *stride + x]+= (color*(0x10000-fr))>>16;
            buf[(y+1)*stride + x]+= (color*         fr )>>16;
1144 1145 1146
        }
    }else{
        if(sy > ey){
D
Diego Biurrun 已提交
1147 1148
            FFSWAP(int, sx, ex);
            FFSWAP(int, sy, ey);
1149 1150 1151 1152 1153 1154
        }
        buf+= sx + sy*stride;
        ey-= sy;
        if(ey) f= ((ex-sx)<<16)/ey;
        else   f= 0;
        for(y= 0; y <= ey; y++){
1155 1156
            x = (y*f)>>16;
            fr= (y*f)&0xFFFF;
M
Fix ;;  
Michael Niedermayer 已提交
1157 1158
            buf[y*stride + x  ]+= (color*(0x10000-fr))>>16;
            buf[y*stride + x+1]+= (color*         fr )>>16;
1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169
        }
    }
}

/**
 * Draw an arrow from (ex, ey) -> (sx, sy); the arrow head is placed at
 * (sx, sy) and is only drawn when the squared length of the arrow exceeds 9.
 * @param w width of the image
 * @param h height of the image
 * @param stride stride/linesize of the image
 * @param color color of the arrow
 */
static void draw_arrow(uint8_t *buf, int sx, int sy, int ex, int ey, int w, int h, int stride, int color){
    int dx, dy;

    /* keep the coordinates within 100 pixels of the image */
    sx = av_clip(sx, -100, w + 100);
    sy = av_clip(sy, -100, h + 100);
    ex = av_clip(ex, -100, w + 100);
    ey = av_clip(ey, -100, h + 100);

    dx = ex - sx;
    dy = ey - sy;

    if (dx*dx + dy*dy > 9) {
        /* (dx, dy) rotated by 45 degrees, then scaled to a fixed length */
        int head_x = dy + dx;
        int head_y = dy - dx;
        const int norm = ff_sqrt((head_x*head_x + head_y*head_y) << 8);

        //FIXME subpixel accuracy
        head_x = ROUNDED_DIV((head_x * 3) << 4, norm);
        head_y = ROUNDED_DIV((head_y * 3) << 4, norm);

        /* the two strokes of the arrow head */
        draw_line(buf, sx, sy, sx + head_x, sy + head_y, w, h, stride, color);
        draw_line(buf, sx, sy, sx - head_y, sy + head_x, w, h, stride, color);
    }

    /* the shaft */
    draw_line(buf, sx, sy, ex, ey, w, h, stride, color);
}

1196 1197 1198
/**
 * prints debugging info for the given picture.
 */
1199
void ff_print_debug_info(MpegEncContext *s, AVFrame *pict){
1200

1201
    if(s->avctx->hwaccel || !pict || !pict->mb_type) return;
1202 1203 1204

    if(s->avctx->debug&(FF_DEBUG_SKIP | FF_DEBUG_QP | FF_DEBUG_MB_TYPE)){
        int x,y;
1205

1206 1207 1208 1209 1210 1211 1212
        av_log(s->avctx,AV_LOG_DEBUG,"New frame, type: ");
        switch (pict->pict_type) {
            case FF_I_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"I\n"); break;
            case FF_P_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"P\n"); break;
            case FF_B_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"B\n"); break;
            case FF_S_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"S\n"); break;
            case FF_SI_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"SI\n"); break;
1213
            case FF_SP_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"SP\n"); break;
1214
        }
1215 1216 1217 1218 1219
        for(y=0; y<s->mb_height; y++){
            for(x=0; x<s->mb_width; x++){
                if(s->avctx->debug&FF_DEBUG_SKIP){
                    int count= s->mbskip_table[x + y*s->mb_stride];
                    if(count>9) count=9;
1220
                    av_log(s->avctx, AV_LOG_DEBUG, "%1d", count);
1221 1222
                }
                if(s->avctx->debug&FF_DEBUG_QP){
1223
                    av_log(s->avctx, AV_LOG_DEBUG, "%2d", pict->qscale_table[x + y*s->mb_stride]);
1224 1225 1226 1227 1228
                }
                if(s->avctx->debug&FF_DEBUG_MB_TYPE){
                    int mb_type= pict->mb_type[x + y*s->mb_stride];
                    //Type & MV direction
                    if(IS_PCM(mb_type))
1229
                        av_log(s->avctx, AV_LOG_DEBUG, "P");
1230
                    else if(IS_INTRA(mb_type) && IS_ACPRED(mb_type))
1231
                        av_log(s->avctx, AV_LOG_DEBUG, "A");
1232
                    else if(IS_INTRA4x4(mb_type))
1233
                        av_log(s->avctx, AV_LOG_DEBUG, "i");
1234
                    else if(IS_INTRA16x16(mb_type))
1235
                        av_log(s->avctx, AV_LOG_DEBUG, "I");
1236
                    else if(IS_DIRECT(mb_type) && IS_SKIP(mb_type))
1237
                        av_log(s->avctx, AV_LOG_DEBUG, "d");
1238
                    else if(IS_DIRECT(mb_type))
1239
                        av_log(s->avctx, AV_LOG_DEBUG, "D");
1240
                    else if(IS_GMC(mb_type) && IS_SKIP(mb_type))
1241
                        av_log(s->avctx, AV_LOG_DEBUG, "g");
1242
                    else if(IS_GMC(mb_type))
1243
                        av_log(s->avctx, AV_LOG_DEBUG, "G");
1244
                    else if(IS_SKIP(mb_type))
1245
                        av_log(s->avctx, AV_LOG_DEBUG, "S");
1246
                    else if(!USES_LIST(mb_type, 1))
1247
                        av_log(s->avctx, AV_LOG_DEBUG, ">");
1248
                    else if(!USES_LIST(mb_type, 0))
1249
                        av_log(s->avctx, AV_LOG_DEBUG, "<");
1250 1251
                    else{
                        assert(USES_LIST(mb_type, 0) && USES_LIST(mb_type, 1));
1252
                        av_log(s->avctx, AV_LOG_DEBUG, "X");
1253
                    }
1254

1255 1256
                    //segmentation
                    if(IS_8X8(mb_type))
1257
                        av_log(s->avctx, AV_LOG_DEBUG, "+");
1258
                    else if(IS_16X8(mb_type))
1259
                        av_log(s->avctx, AV_LOG_DEBUG, "-");
1260
                    else if(IS_8X16(mb_type))
1261
                        av_log(s->avctx, AV_LOG_DEBUG, "|");
1262
                    else if(IS_INTRA(mb_type) || IS_16X16(mb_type))
1263
                        av_log(s->avctx, AV_LOG_DEBUG, " ");
1264
                    else
1265
                        av_log(s->avctx, AV_LOG_DEBUG, "?");
1266 1267


1268
                    if(IS_INTERLACED(mb_type))
1269
                        av_log(s->avctx, AV_LOG_DEBUG, "=");
1270
                    else
1271
                        av_log(s->avctx, AV_LOG_DEBUG, " ");
1272
                }
1273
//                av_log(s->avctx, AV_LOG_DEBUG, " ");
1274
            }
1275
            av_log(s->avctx, AV_LOG_DEBUG, "\n");
1276 1277
        }
    }
1278

1279
    if((s->avctx->debug&(FF_DEBUG_VIS_QP|FF_DEBUG_VIS_MB_TYPE)) || (s->avctx->debug_mv)){
1280 1281
        const int shift= 1 + s->quarter_sample;
        int mb_y;
1282 1283
        uint8_t *ptr;
        int i;
1284
        int h_chroma_shift, v_chroma_shift, block_height;
1285 1286
        const int width = s->avctx->width;
        const int height= s->avctx->height;
1287
        const int mv_sample_log2= 4 - pict->motion_subsample_log2;
1288
        const int mv_stride= (s->mb_width << mv_sample_log2) + (s->codec_id == CODEC_ID_H264 ? 0 : 1);
M
100000l  
Michael Niedermayer 已提交
1289
        s->low_delay=0; //needed to see the vectors without trashing the buffers
1290

1291
        avcodec_get_chroma_sub_sample(s->avctx->pix_fmt, &h_chroma_shift, &v_chroma_shift);
1292
        for(i=0; i<3; i++){
1293
            memcpy(s->visualization_buffer[i], pict->data[i], (i==0) ? pict->linesize[i]*height:pict->linesize[i]*height >> v_chroma_shift);
1294 1295 1296 1297
            pict->data[i]= s->visualization_buffer[i];
        }
        pict->type= FF_BUFFER_TYPE_COPY;
        ptr= pict->data[0];
1298
        block_height = 16>>v_chroma_shift;
1299 1300 1301 1302 1303

        for(mb_y=0; mb_y<s->mb_height; mb_y++){
            int mb_x;
            for(mb_x=0; mb_x<s->mb_width; mb_x++){
                const int mb_index= mb_x + mb_y*s->mb_stride;
1304 1305 1306
                if((s->avctx->debug_mv) && pict->motion_val){
                  int type;
                  for(type=0; type<3; type++){
1307
                    int direction = 0;
1308 1309 1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321
                    switch (type) {
                      case 0: if ((!(s->avctx->debug_mv&FF_DEBUG_VIS_MV_P_FOR)) || (pict->pict_type!=FF_P_TYPE))
                                continue;
                              direction = 0;
                              break;
                      case 1: if ((!(s->avctx->debug_mv&FF_DEBUG_VIS_MV_B_FOR)) || (pict->pict_type!=FF_B_TYPE))
                                continue;
                              direction = 0;
                              break;
                      case 2: if ((!(s->avctx->debug_mv&FF_DEBUG_VIS_MV_B_BACK)) || (pict->pict_type!=FF_B_TYPE))
                                continue;
                              direction = 1;
                              break;
                    }
1322 1323 1324
                    if(!USES_LIST(pict->mb_type[mb_index], direction))
                        continue;

1325 1326 1327
                    if(IS_8X8(pict->mb_type[mb_index])){
                      int i;
                      for(i=0; i<4; i++){
1328 1329
                        int sx= mb_x*16 + 4 + 8*(i&1);
                        int sy= mb_y*16 + 4 + 8*(i>>1);
1330
                        int xy= (mb_x*2 + (i&1) + (mb_y*2 + (i>>1))*mv_stride) << (mv_sample_log2-1);
1331 1332
                        int mx= (pict->motion_val[direction][xy][0]>>shift) + sx;
                        int my= (pict->motion_val[direction][xy][1]>>shift) + sy;
1333
                        draw_arrow(ptr, sx, sy, mx, my, width, height, s->linesize, 100);
1334 1335 1336 1337
                      }
                    }else if(IS_16X8(pict->mb_type[mb_index])){
                      int i;
                      for(i=0; i<2; i++){
1338 1339
                        int sx=mb_x*16 + 8;
                        int sy=mb_y*16 + 4 + 8*i;
1340
                        int xy= (mb_x*2 + (mb_y*2 + i)*mv_stride) << (mv_sample_log2-1);
1341 1342
                        int mx=(pict->motion_val[direction][xy][0]>>shift);
                        int my=(pict->motion_val[direction][xy][1]>>shift);
1343

1344 1345
                        if(IS_INTERLACED(pict->mb_type[mb_index]))
                            my*=2;
1346

1347 1348 1349 1350 1351 1352 1353
                        draw_arrow(ptr, sx, sy, mx+sx, my+sy, width, height, s->linesize, 100);
                      }
                    }else if(IS_8X16(pict->mb_type[mb_index])){
                      int i;
                      for(i=0; i<2; i++){
                        int sx=mb_x*16 + 4 + 8*i;
                        int sy=mb_y*16 + 8;
1354
                        int xy= (mb_x*2 + i + mb_y*2*mv_stride) << (mv_sample_log2-1);
1355 1356
                        int mx=(pict->motion_val[direction][xy][0]>>shift);
                        int my=(pict->motion_val[direction][xy][1]>>shift);
1357

1358 1359
                        if(IS_INTERLACED(pict->mb_type[mb_index]))
                            my*=2;
1360

1361
                        draw_arrow(ptr, sx, sy, mx+sx, my+sy, width, height, s->linesize, 100);
1362 1363 1364 1365
                      }
                    }else{
                      int sx= mb_x*16 + 8;
                      int sy= mb_y*16 + 8;
1366
                      int xy= (mb_x + mb_y*mv_stride) << mv_sample_log2;
1367 1368
                      int mx= (pict->motion_val[direction][xy][0]>>shift) + sx;
                      int my= (pict->motion_val[direction][xy][1]>>shift) + sy;
1369
                      draw_arrow(ptr, sx, sy, mx, my, width, height, s->linesize, 100);
1370
                    }
1371
                  }
M
Michael Niedermayer 已提交
1372 1373 1374 1375
                }
                if((s->avctx->debug&FF_DEBUG_VIS_QP) && pict->motion_val){
                    uint64_t c= (pict->qscale_table[mb_index]*128/31) * 0x0101010101010101ULL;
                    int y;
1376 1377 1378
                    for(y=0; y<block_height; y++){
                        *(uint64_t*)(pict->data[1] + 8*mb_x + (block_height*mb_y + y)*pict->linesize[1])= c;
                        *(uint64_t*)(pict->data[2] + 8*mb_x + (block_height*mb_y + y)*pict->linesize[2])= c;
M
Michael Niedermayer 已提交
1379 1380 1381 1382 1383 1384 1385 1386 1387 1388
                    }
                }
                if((s->avctx->debug&FF_DEBUG_VIS_MB_TYPE) && pict->motion_val){
                    int mb_type= pict->mb_type[mb_index];
                    uint64_t u,v;
                    int y;
#define COLOR(theta, r)\
u= (int)(128 + r*cos(theta*3.141592/180));\
v= (int)(128 + r*sin(theta*3.141592/180));

1389

M
Michael Niedermayer 已提交
1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 1417
                    u=v=128;
                    if(IS_PCM(mb_type)){
                        COLOR(120,48)
                    }else if((IS_INTRA(mb_type) && IS_ACPRED(mb_type)) || IS_INTRA16x16(mb_type)){
                        COLOR(30,48)
                    }else if(IS_INTRA4x4(mb_type)){
                        COLOR(90,48)
                    }else if(IS_DIRECT(mb_type) && IS_SKIP(mb_type)){
//                        COLOR(120,48)
                    }else if(IS_DIRECT(mb_type)){
                        COLOR(150,48)
                    }else if(IS_GMC(mb_type) && IS_SKIP(mb_type)){
                        COLOR(170,48)
                    }else if(IS_GMC(mb_type)){
                        COLOR(190,48)
                    }else if(IS_SKIP(mb_type)){
//                        COLOR(180,48)
                    }else if(!USES_LIST(mb_type, 1)){
                        COLOR(240,48)
                    }else if(!USES_LIST(mb_type, 0)){
                        COLOR(0,48)
                    }else{
                        assert(USES_LIST(mb_type, 0) && USES_LIST(mb_type, 1));
                        COLOR(300,48)
                    }

                    u*= 0x0101010101010101ULL;
                    v*= 0x0101010101010101ULL;
1418 1419 1420
                    for(y=0; y<block_height; y++){
                        *(uint64_t*)(pict->data[1] + 8*mb_x + (block_height*mb_y + y)*pict->linesize[1])= u;
                        *(uint64_t*)(pict->data[2] + 8*mb_x + (block_height*mb_y + y)*pict->linesize[2])= v;
M
Michael Niedermayer 已提交
1421 1422 1423 1424 1425 1426 1427 1428 1429 1430 1431
                    }

                    //segmentation
                    if(IS_8X8(mb_type) || IS_16X8(mb_type)){
                        *(uint64_t*)(pict->data[0] + 16*mb_x + 0 + (16*mb_y + 8)*pict->linesize[0])^= 0x8080808080808080ULL;
                        *(uint64_t*)(pict->data[0] + 16*mb_x + 8 + (16*mb_y + 8)*pict->linesize[0])^= 0x8080808080808080ULL;
                    }
                    if(IS_8X8(mb_type) || IS_8X16(mb_type)){
                        for(y=0; y<16; y++)
                            pict->data[0][16*mb_x + 8 + (16*mb_y + y)*pict->linesize[0]]^= 0x80;
                    }
1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446
                    if(IS_8X8(mb_type) && mv_sample_log2 >= 2){
                        int dm= 1 << (mv_sample_log2-2);
                        for(i=0; i<4; i++){
                            int sx= mb_x*16 + 8*(i&1);
                            int sy= mb_y*16 + 8*(i>>1);
                            int xy= (mb_x*2 + (i&1) + (mb_y*2 + (i>>1))*mv_stride) << (mv_sample_log2-1);
                            //FIXME bidir
                            int32_t *mv = (int32_t*)&pict->motion_val[0][xy];
                            if(mv[0] != mv[dm] || mv[dm*mv_stride] != mv[dm*(mv_stride+1)])
                                for(y=0; y<8; y++)
                                    pict->data[0][sx + 4 + (sy + y)*pict->linesize[0]]^= 0x80;
                            if(mv[0] != mv[dm*mv_stride] || mv[dm] != mv[dm*(mv_stride+1)])
                                *(uint64_t*)(pict->data[0] + sx + (sy + 4)*pict->linesize[0])^= 0x8080808080808080ULL;
                        }
                    }
1447

M
Michael Niedermayer 已提交
1448 1449 1450
                    if(IS_INTERLACED(mb_type) && s->codec_id == CODEC_ID_H264){
                        // hmm
                    }
1451 1452 1453 1454 1455
                }
                s->mbskip_table[mb_index]=0;
            }
        }
    }
1456 1457
}

1458
/**
 * Motion-compensate one w x h block of a single plane in lowres mode.
 *
 * The motion vector is split into an integer displacement
 * (motion >> (lowres+1)), which moves the source position, and a
 * fractional remainder (the low lowres+1 bits), which is rescaled and
 * passed to the interpolation function.
 *
 * @param s            context
 * @param dest         destination pointer
 * @param src          start of the reference plane
 * @param field_based  shift applied to vertical sizes/positions
 *                     (the visible caller passes 0)
 * @param field_select if non-zero, the source is advanced by one line
 * @param src_x        horizontal position of the block before displacement
 * @param src_y        vertical position of the block before displacement
 * @param width        unused
 * @param height       unused
 * @param stride       line size used for source addressing and for pix_op
 * @param h_edge_pos   horizontal limit used for the edge check
 * @param v_edge_pos   vertical limit used for the edge check
 * @param w            block width
 * @param h            block height
 * @param pix_op       table of interpolation functions, indexed by FFMIN(lowres, 2)
 * @param motion_x     horizontal motion vector component
 * @param motion_y     vertical motion vector component
 * @return 1 if the source was replaced by s->edge_emu_buffer, 0 otherwise
 */
static inline int hpel_motion_lowres(MpegEncContext *s,
                                  uint8_t *dest, uint8_t *src,
                                  int field_based, int field_select,
                                  int src_x, int src_y,
                                  int width, int height, int stride,
                                  int h_edge_pos, int v_edge_pos,
                                  int w, int h, h264_chroma_mc_func *pix_op,
                                  int motion_x, int motion_y)
{
    const int lowres= s->avctx->lowres;
    const int op_index= FFMIN(lowres, 2);
    const int s_mask= (2<<lowres)-1;
    int emu=0;
    int sx, sy;
    int max_x, max_y;

    if(s->quarter_sample){
        motion_x/=2;
        motion_y/=2;
    }

    sx= motion_x & s_mask;
    sy= motion_y & s_mask;
    src_x += motion_x >> (lowres+1);
    src_y += motion_y >> (lowres+1);

    src += src_y * stride + src_x;

    /* Largest source position that can be read without leaving the picture.
     * Clamp to 0 before the unsigned comparison: for pictures smaller than
     * the block a negative limit would otherwise convert to a huge unsigned
     * value and the edge emulation would never trigger. */
    max_x=  h_edge_pos                 - (!!sx) - w;
    max_y= (v_edge_pos >> field_based) - (!!sy) - h;
    if(max_x < 0) max_x= 0;
    if(max_y < 0) max_y= 0;

    if(   (unsigned)src_x > (unsigned)max_x
       || (unsigned)src_y > (unsigned)max_y){
        s->dsp.emulated_edge_mc(s->edge_emu_buffer, src, s->linesize, w+1, (h+1)<<field_based,
                            src_x, src_y<<field_based, h_edge_pos, v_edge_pos);
        src= s->edge_emu_buffer;
        emu=1;
    }

    /* rescale the fractional part to the 0..7 range passed to pix_op */
    sx= (sx << 2) >> lowres;
    sy= (sy << 2) >> lowres;
    if(field_select)
        src += s->linesize;
    pix_op[op_index](dest, src, stride, h, sx, sy);
    return emu;
}

F
Fabrice Bellard 已提交
1501
/* apply one mpeg motion vector to the three components */
B
Benoit Fouet 已提交
1502
static av_always_inline void mpeg_motion_lowres(MpegEncContext *s,
1503
                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
1504
                               int field_based, int bottom_field, int field_select,
B
Benoit Fouet 已提交
1505
                               uint8_t **ref_picture, h264_chroma_mc_func *pix_op,
1506
                               int motion_x, int motion_y, int h, int mb_y)
F
Fabrice Bellard 已提交
1507
{
1508
    uint8_t *ptr_y, *ptr_cb, *ptr_cr;
B
Benoit Fouet 已提交
1509 1510
    int mx, my, src_x, src_y, uvsrc_x, uvsrc_y, uvlinesize, linesize, sx, sy, uvsx, uvsy;
    const int lowres= s->avctx->lowres;
1511
    const int op_index= FFMIN(lowres, 2);
B
Benoit Fouet 已提交
1512 1513 1514 1515
    const int block_s= 8>>lowres;
    const int s_mask= (2<<lowres)-1;
    const int h_edge_pos = s->h_edge_pos >> lowres;
    const int v_edge_pos = s->v_edge_pos >> lowres;
1516
    linesize   = s->current_picture.linesize[0] << field_based;
M
Michael Niedermayer 已提交
1517
    uvlinesize = s->current_picture.linesize[1] << field_based;
1518

1519
    if(s->quarter_sample){ //FIXME obviously not perfect but qpel will not work in lowres anyway
B
Benoit Fouet 已提交
1520 1521 1522 1523 1524 1525 1526 1527 1528 1529 1530
        motion_x/=2;
        motion_y/=2;
    }

    if(field_based){
        motion_y += (bottom_field - field_select)*((1<<lowres)-1);
    }

    sx= motion_x & s_mask;
    sy= motion_y & s_mask;
    src_x = s->mb_x*2*block_s               + (motion_x >> (lowres+1));
1531
    src_y =(   mb_y*2*block_s>>field_based) + (motion_y >> (lowres+1));
1532

M
Michael Niedermayer 已提交
1533
    if (s->out_format == FMT_H263) {
M
Michael Niedermayer 已提交
1534 1535
        uvsx = ((motion_x>>1) & s_mask) | (sx&1);
        uvsy = ((motion_y>>1) & s_mask) | (sy&1);
M
Michael Niedermayer 已提交
1536 1537 1538 1539 1540 1541 1542 1543
        uvsrc_x = src_x>>1;
        uvsrc_y = src_y>>1;
    }else if(s->out_format == FMT_H261){//even chroma mv's are full pel in H261
        mx = motion_x / 4;
        my = motion_y / 4;
        uvsx = (2*mx) & s_mask;
        uvsy = (2*my) & s_mask;
        uvsrc_x = s->mb_x*block_s               + (mx >> lowres);
1544
        uvsrc_y =    mb_y*block_s               + (my >> lowres);
M
Michael Niedermayer 已提交
1545 1546 1547 1548 1549 1550
    } else {
        mx = motion_x / 2;
        my = motion_y / 2;
        uvsx = mx & s_mask;
        uvsy = my & s_mask;
        uvsrc_x = s->mb_x*block_s               + (mx >> (lowres+1));
1551
        uvsrc_y =(   mb_y*block_s>>field_based) + (my >> (lowres+1));
M
Michael Niedermayer 已提交
1552 1553 1554 1555 1556 1557 1558 1559
    }

    ptr_y  = ref_picture[0] + src_y * linesize + src_x;
    ptr_cb = ref_picture[1] + uvsrc_y * uvlinesize + uvsrc_x;
    ptr_cr = ref_picture[2] + uvsrc_y * uvlinesize + uvsrc_x;

    if(   (unsigned)src_x > h_edge_pos                 - (!!sx) - 2*block_s
       || (unsigned)src_y >(v_edge_pos >> field_based) - (!!sy) - h){
1560
            s->dsp.emulated_edge_mc(s->edge_emu_buffer, ptr_y, s->linesize, 17, 17+field_based,
M
Michael Niedermayer 已提交
1561 1562
                             src_x, src_y<<field_based, h_edge_pos, v_edge_pos);
            ptr_y = s->edge_emu_buffer;
1563
            if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
M
Michael Niedermayer 已提交
1564
                uint8_t *uvbuf= s->edge_emu_buffer+18*s->linesize;
1565
                s->dsp.emulated_edge_mc(uvbuf  , ptr_cb, s->uvlinesize, 9, 9+field_based,
M
Michael Niedermayer 已提交
1566
                                 uvsrc_x, uvsrc_y<<field_based, h_edge_pos>>1, v_edge_pos>>1);
1567
                s->dsp.emulated_edge_mc(uvbuf+16, ptr_cr, s->uvlinesize, 9, 9+field_based,
M
Michael Niedermayer 已提交
1568 1569 1570 1571 1572 1573
                                 uvsrc_x, uvsrc_y<<field_based, h_edge_pos>>1, v_edge_pos>>1);
                ptr_cb= uvbuf;
                ptr_cr= uvbuf+16;
            }
    }

1574 1575 1576 1577 1578 1579 1580 1581 1582 1583 1584 1585
    if(bottom_field){ //FIXME use this for field pix too instead of the obnoxious hack which changes picture.data
        dest_y += s->linesize;
        dest_cb+= s->uvlinesize;
        dest_cr+= s->uvlinesize;
    }

    if(field_select){
        ptr_y += s->linesize;
        ptr_cb+= s->uvlinesize;
        ptr_cr+= s->uvlinesize;
    }

1586 1587
    sx= (sx << 2) >> lowres;
    sy= (sy << 2) >> lowres;
M
Michael Niedermayer 已提交
1588
    pix_op[lowres-1](dest_y, ptr_y, linesize, h, sx, sy);
1589

1590
    if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
1591 1592 1593 1594
        uvsx= (uvsx << 2) >> lowres;
        uvsy= (uvsy << 2) >> lowres;
        pix_op[op_index](dest_cb, ptr_cb, uvlinesize, h >> s->chroma_y_shift, uvsx, uvsy);
        pix_op[op_index](dest_cr, ptr_cr, uvlinesize, h >> s->chroma_y_shift, uvsx, uvsy);
M
Michael Niedermayer 已提交
1595
    }
M
Michael Niedermayer 已提交
1596
    //FIXME h261 lowres loop filter
M
Michael Niedermayer 已提交
1597 1598
}

M
Michael Niedermayer 已提交
1599 1600 1601 1602 1603 1604
/**
 * Lowres chroma motion compensation for a macroblock coded with four
 * luma vectors.
 *
 * @param s           context
 * @param dest_cb     chroma cb/u destination pointer
 * @param dest_cr     chroma cr/v destination pointer
 * @param ref_picture array[3] of pointers to the 3 planes of the reference picture
 * @param pix_op      table of interpolation functions, indexed by FFMIN(lowres, 2)
 * @param mx          horizontal vector component (the visible caller passes
 *                    the sum of the four luma vectors)
 * @param my          vertical vector component (same convention as mx)
 */
static inline void chroma_4mv_motion_lowres(MpegEncContext *s,
                                     uint8_t *dest_cb, uint8_t *dest_cr,
                                     uint8_t **ref_picture,
                                     h264_chroma_mc_func *pix_op,
                                     int mx, int my){
    const int lowres= s->avctx->lowres;
    const int op_index= FFMIN(lowres, 2);
    const int block_s= 8>>lowres;
    const int s_mask= (2<<lowres)-1;
    const int h_edge_pos = s->h_edge_pos >> (lowres+1);
    const int v_edge_pos = s->v_edge_pos >> (lowres+1);
    int emu=0, src_x, src_y, offset, sx, sy;
    uint8_t *ptr;

    if(s->quarter_sample){
        mx/=2;
        my/=2;
    }

    /* In case of 8X8, we construct a single chroma motion vector
       with a special rounding */
    mx= ff_h263_round_chroma(mx);
    my= ff_h263_round_chroma(my);

    sx= mx & s_mask;
    sy= my & s_mask;
    src_x = s->mb_x*block_s + (mx >> (lowres+1));
    src_y = s->mb_y*block_s + (my >> (lowres+1));

    offset = src_y * s->uvlinesize + src_x;
    ptr = ref_picture[1] + offset;
    if(s->flags&CODEC_FLAG_EMU_EDGE){
        /* Clamp the limits to 0 before the unsigned comparison: a negative
         * limit (picture smaller than the block) would otherwise convert to
         * a huge unsigned value and the edge emulation would never trigger. */
        int max_x= h_edge_pos - (!!sx) - block_s;
        int max_y= v_edge_pos - (!!sy) - block_s;
        if(max_x < 0) max_x= 0;
        if(max_y < 0) max_y= 0;

        if(   (unsigned)src_x > (unsigned)max_x
           || (unsigned)src_y > (unsigned)max_y){
            s->dsp.emulated_edge_mc(s->edge_emu_buffer, ptr, s->uvlinesize, 9, 9, src_x, src_y, h_edge_pos, v_edge_pos);
            ptr= s->edge_emu_buffer;
            emu=1;
        }
    }
    /* rescale the fractional part to the 0..7 range passed to pix_op */
    sx= (sx << 2) >> lowres;
    sy= (sy << 2) >> lowres;
    pix_op[op_index](dest_cb, ptr, s->uvlinesize, block_s, sx, sy);

    /* cr uses the same offset; the emulation buffer is reused once cb is done */
    ptr = ref_picture[2] + offset;
    if(emu){
        s->dsp.emulated_edge_mc(s->edge_emu_buffer, ptr, s->uvlinesize, 9, 9, src_x, src_y, h_edge_pos, v_edge_pos);
        ptr= s->edge_emu_buffer;
    }
    pix_op[op_index](dest_cr, ptr, s->uvlinesize, block_s, sx, sy);
}

M
doxy  
Michael Niedermayer 已提交
1650
/**
D
Diego Biurrun 已提交
1651
 * motion compensation of a single macroblock
M
doxy  
Michael Niedermayer 已提交
1652 1653 1654 1655 1656 1657
 * @param s context
 * @param dest_y luma destination pointer
 * @param dest_cb chroma cb/u destination pointer
 * @param dest_cr chroma cr/v destination pointer
 * @param dir direction (0->forward, 1->backward)
 * @param ref_picture array[3] of pointers to the 3 planes of the reference picture
1658
 * @param pix_op halfpel motion compensation function (average or put normally)
M
doxy  
Michael Niedermayer 已提交
1659 1660
 * the motion vectors are taken from s->mv and the MV type from s->mv_type
 */
B
Benoit Fouet 已提交
1661
static inline void MPV_motion_lowres(MpegEncContext *s,
1662
                              uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
1663
                              int dir, uint8_t **ref_picture,
B
Benoit Fouet 已提交
1664
                              h264_chroma_mc_func *pix_op)
F
Fabrice Bellard 已提交
1665
{
B
Benoit Fouet 已提交
1666
    int mx, my;
F
Fabrice Bellard 已提交
1667
    int mb_x, mb_y, i;
B
Benoit Fouet 已提交
1668 1669
    const int lowres= s->avctx->lowres;
    const int block_s= 8>>lowres;
F
Fabrice Bellard 已提交
1670 1671 1672 1673 1674 1675

    mb_x = s->mb_x;
    mb_y = s->mb_y;

    switch(s->mv_type) {
    case MV_TYPE_16X16:
B
Benoit Fouet 已提交
1676 1677 1678
        mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
                    0, 0, 0,
                    ref_picture, pix_op,
1679
                    s->mv[dir][0][0], s->mv[dir][0][1], 2*block_s, mb_y);
F
Fabrice Bellard 已提交
1680 1681
        break;
    case MV_TYPE_8X8:
M
Michael Niedermayer 已提交
1682 1683 1684
        mx = 0;
        my = 0;
            for(i=0;i<4;i++) {
B
Benoit Fouet 已提交
1685
                hpel_motion_lowres(s, dest_y + ((i & 1) + (i >> 1) * s->linesize)*block_s,
1686
                            ref_picture[0], 0, 0,
B
Benoit Fouet 已提交
1687
                            (2*mb_x + (i & 1))*block_s, (2*mb_y + (i >>1))*block_s,
M
Michael Niedermayer 已提交
1688
                            s->width, s->height, s->linesize,
B
Benoit Fouet 已提交
1689 1690
                            s->h_edge_pos >> lowres, s->v_edge_pos >> lowres,
                            block_s, block_s, pix_op,
M
Michael Niedermayer 已提交
1691
                            s->mv[dir][i][0], s->mv[dir][i][1]);
M
Michael Niedermayer 已提交
1692 1693 1694

                mx += s->mv[dir][i][0];
                my += s->mv[dir][i][1];
M
Michael Niedermayer 已提交
1695
            }
M
Michael Niedermayer 已提交
1696

1697
        if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY))
B
Benoit Fouet 已提交
1698
            chroma_4mv_motion_lowres(s, dest_cb, dest_cr, ref_picture, pix_op, mx, my);
F
Fabrice Bellard 已提交
1699 1700 1701
        break;
    case MV_TYPE_FIELD:
        if (s->picture_structure == PICT_FRAME) {
B
Benoit Fouet 已提交
1702 1703 1704 1705
            /* top field */
            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
                        1, 0, s->field_select[dir][0],
                        ref_picture, pix_op,
1706
                        s->mv[dir][0][0], s->mv[dir][0][1], block_s, mb_y);
B
Benoit Fouet 已提交
1707 1708 1709 1710
            /* bottom field */
            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
                        1, 1, s->field_select[dir][1],
                        ref_picture, pix_op,
1711
                        s->mv[dir][1][0], s->mv[dir][1][1], block_s, mb_y);
F
Fabrice Bellard 已提交
1712
        } else {
1713
            if(s->picture_structure != s->field_select[dir][0] + 1 && s->pict_type != FF_B_TYPE && !s->first_field){
1714
                ref_picture= s->current_picture_ptr->data;
1715
            }
F
Fabrice Bellard 已提交
1716

B
Benoit Fouet 已提交
1717
            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
1718 1719
                        0, 0, s->field_select[dir][0],
                        ref_picture, pix_op,
1720
                        s->mv[dir][0][0], s->mv[dir][0][1], 2*block_s, mb_y>>1);
F
Fabrice Bellard 已提交
1721
        }
1722
        break;
M
Michael Niedermayer 已提交
1723 1724 1725
    case MV_TYPE_16X8:
        for(i=0; i<2; i++){
            uint8_t ** ref2picture;
1726

1727
            if(s->picture_structure == s->field_select[dir][i] + 1 || s->pict_type == FF_B_TYPE || s->first_field){
1728 1729
                ref2picture= ref_picture;
            }else{
1730
                ref2picture= s->current_picture_ptr->data;
1731
            }
1732

B
Benoit Fouet 已提交
1733
            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
M
Michael Niedermayer 已提交
1734
                        0, 0, s->field_select[dir][i],
1735
                        ref2picture, pix_op,
1736
                        s->mv[dir][i][0], s->mv[dir][i][1] + 2*block_s*i, block_s, mb_y>>1);
1737

B
Benoit Fouet 已提交
1738 1739 1740
            dest_y += 2*block_s*s->linesize;
            dest_cb+= (2*block_s>>s->chroma_y_shift)*s->uvlinesize;
            dest_cr+= (2*block_s>>s->chroma_y_shift)*s->uvlinesize;
1741
        }
F
Fabrice Bellard 已提交
1742
        break;
1743 1744
    case MV_TYPE_DMV:
        if(s->picture_structure == PICT_FRAME){
M
Michael Niedermayer 已提交
1745 1746 1747
            for(i=0; i<2; i++){
                int j;
                for(j=0; j<2; j++){
B
Benoit Fouet 已提交
1748
                    mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
M
Michael Niedermayer 已提交
1749 1750
                                1, j, j^i,
                                ref_picture, pix_op,
1751
                                s->mv[dir][2*i + j][0], s->mv[dir][2*i + j][1], block_s, mb_y);
M
Michael Niedermayer 已提交
1752
                }
B
Benoit Fouet 已提交
1753
                pix_op = s->dsp.avg_h264_chroma_pixels_tab;
M
Michael Niedermayer 已提交
1754
            }
1755
        }else{
M
Michael Niedermayer 已提交
1756
            for(i=0; i<2; i++){
B
Benoit Fouet 已提交
1757
                mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
M
Michael Niedermayer 已提交
1758 1759
                            0, 0, s->picture_structure != i+1,
                            ref_picture, pix_op,
1760
                            s->mv[dir][2*i][0],s->mv[dir][2*i][1],2*block_s, mb_y>>1);
1761

M
Michael Niedermayer 已提交
1762
                // after put we make avg of the same block
B
Benoit Fouet 已提交
1763
                pix_op = s->dsp.avg_h264_chroma_pixels_tab;
1764

M
Michael Niedermayer 已提交
1765 1766
                //opposite parity is always in the same frame if this is second field
                if(!s->first_field){
1767
                    ref_picture = s->current_picture_ptr->data;
M
Michael Niedermayer 已提交
1768
                }
1769
            }
1770 1771
        }
    break;
M
Michael Niedermayer 已提交
1772
    default: assert(0);
F
Fabrice Bellard 已提交
1773 1774 1775
    }
}

B
Benoit Fouet 已提交
1776 1777 1778
/**
 * Put block[] to dest[].
 *
 * The block is first dequantized in place with the context's intra
 * dequantizer, then passed to the IDCT "put" function.
 *
 * @param s         context
 * @param block     coefficients of the block; modified in place
 * @param i         block index, passed to the dequantizer
 * @param dest      destination pointer
 * @param line_size line size of the destination
 * @param qscale    quantizer scale passed to the dequantizer
 */
static inline void put_dct(MpegEncContext *s,
                           DCTELEM *block, int i, uint8_t *dest, int line_size, int qscale)
{
    s->dct_unquantize_intra(s, block, i, qscale);
    s->dsp.idct_put (dest, line_size, block);
}
1783

B
Benoit Fouet 已提交
1784 1785 1786 1787 1788 1789 1790 1791
/**
 * Add block[] to dest[].
 *
 * Nothing is done when s->block_last_index[i] is negative
 * (presumably: the block has no coded coefficients).
 *
 * @param s         context
 * @param block     coefficients of the block
 * @param i         block index
 * @param dest      destination pointer
 * @param line_size line size of the destination
 */
static inline void add_dct(MpegEncContext *s,
                           DCTELEM *block, int i, uint8_t *dest, int line_size)
{
    const int last_index = s->block_last_index[i];

    if (last_index < 0)
        return;

    s->dsp.idct_add(dest, line_size, block);
}
1792

1793
static inline void add_dequant_dct(MpegEncContext *s,
M
Michael Niedermayer 已提交
1794
                           DCTELEM *block, int i, uint8_t *dest, int line_size, int qscale)
M
Michael Niedermayer 已提交
1795
{
F
Fabrice Bellard 已提交
1796
    if (s->block_last_index[i] >= 0) {
1797
        s->dct_unquantize_inter(s, block, i, qscale);
1798

1799
        s->dsp.idct_add (dest, line_size, block);
F
Fabrice Bellard 已提交
1800 1801 1802
    }
}

1803 1804 1805 1806 1807
/**
 * Clean dc, ac and coded_block for the current non-intra MB.
 *
 * Resets the DC predictors of the current macroblock to 1024, zeroes its
 * AC prediction values, clears coded_block for msmpeg4 version >= 3 and
 * finally clears the macroblock's entry in s->mbintra_table.
 */
void ff_clean_intra_table_entries(MpegEncContext *s)
{
    int wrap = s->b8_stride;
    int xy = s->block_index[0];

    /* luma: the four blocks at xy, xy+1, xy+wrap and xy+1+wrap */
    s->dc_val[0][xy           ] =
    s->dc_val[0][xy + 1       ] =
    s->dc_val[0][xy     + wrap] =
    s->dc_val[0][xy + 1 + wrap] = 1024;
    /* ac pred */
    /* presumably each ac_val entry holds 16 int16_t, so 32 values clear the
       entries at xy and xy+1 in one call -- TODO confirm against the header */
    memset(s->ac_val[0][xy       ], 0, 32 * sizeof(int16_t));
    memset(s->ac_val[0][xy + wrap], 0, 32 * sizeof(int16_t));
    if (s->msmpeg4_version>=3) {
        s->coded_block[xy           ] =
        s->coded_block[xy + 1       ] =
        s->coded_block[xy     + wrap] =
        s->coded_block[xy + 1 + wrap] = 0;
    }
    /* chroma */
    /* from here on xy addresses the macroblock, not a luma block */
    wrap = s->mb_stride;
    xy = s->mb_x + s->mb_y * wrap;
    s->dc_val[1][xy] =
    s->dc_val[2][xy] = 1024;
    /* ac pred */
    memset(s->ac_val[1][xy], 0, 16 * sizeof(int16_t));
    memset(s->ac_val[2][xy], 0, 16 * sizeof(int16_t));

    s->mbintra_table[xy]= 0;
}

F
Fabrice Bellard 已提交
1836 1837 1838 1839 1840 1841 1842 1843 1844 1845
/* generic function called after a macroblock has been parsed by the
   decoder or after it has been encoded by the encoder.

   Important variables used:
   s->mb_intra : true if intra macroblock
   s->mv_dir   : motion vector direction
   s->mv_type  : motion vector type
   s->mv       : motion vector
   s->interlaced_dct : true if interlaced dct used (mpeg2)
 */
1846 1847
static av_always_inline
void MPV_decode_mb_internal(MpegEncContext *s, DCTELEM block[12][64],
K
Keiji Costantini 已提交
1848
                            int lowres_flag, int is_mpeg12)
F
Fabrice Bellard 已提交
1849
{
1850
    const int mb_xy = s->mb_y * s->mb_stride + s->mb_x;
1851
    if(CONFIG_MPEG_XVMC_DECODER && s->avctx->xvmc_acceleration){
1852
        ff_xvmc_decode_mb(s);//xvmc uses pblocks
I
Ivan Kalvachev 已提交
1853 1854
        return;
    }
F
Fabrice Bellard 已提交
1855

1856 1857 1858 1859 1860 1861 1862 1863 1864
    if(s->avctx->debug&FF_DEBUG_DCT_COEFF) {
       /* save DCT coefficients */
       int i,j;
       DCTELEM *dct = &s->current_picture.dct_coeff[mb_xy*64*6];
       for(i=0; i<6; i++)
           for(j=0; j<64; j++)
               *dct++ = block[i][s->dsp.idct_permutation[j]];
    }

M
cleanup  
Michael Niedermayer 已提交
1865
    s->current_picture.qscale_table[mb_xy]= s->qscale;
1866

F
Fabrice Bellard 已提交
1867 1868
    /* update DC predictors for P macroblocks */
    if (!s->mb_intra) {
K
Keiji Costantini 已提交
1869
        if (!is_mpeg12 && (s->h263_pred || s->h263_aic)) {
M
Michael Niedermayer 已提交
1870
            if(s->mbintra_table[mb_xy])
1871
                ff_clean_intra_table_entries(s);
F
Fabrice Bellard 已提交
1872
        } else {
1873 1874
            s->last_dc[0] =
            s->last_dc[1] =
F
Fabrice Bellard 已提交
1875 1876 1877
            s->last_dc[2] = 128 << s->intra_dc_precision;
        }
    }
K
Keiji Costantini 已提交
1878
    else if (!is_mpeg12 && (s->h263_pred || s->h263_aic))
M
Michael Niedermayer 已提交
1879
        s->mbintra_table[mb_xy]=1;
1880

1881
    if ((s->flags&CODEC_FLAG_PSNR) || !(s->encoding && (s->intra_only || s->pict_type==FF_B_TYPE) && s->avctx->mb_decision != FF_MB_DECISION_RD)) { //FIXME precalc
1882
        uint8_t *dest_y, *dest_cb, *dest_cr;
M
Michael Niedermayer 已提交
1883
        int dct_linesize, dct_offset;
M
Michael Niedermayer 已提交
1884 1885
        op_pixels_func (*op_pix)[4];
        qpel_mc_func (*op_qpix)[16];
1886
        const int linesize= s->current_picture.linesize[0]; //not s->linesize as this would be wrong for field pics
M
Michael Niedermayer 已提交
1887
        const int uvlinesize= s->current_picture.linesize[1];
1888
        const int readable= s->pict_type != FF_B_TYPE || s->encoding || s->avctx->draw_horiz_band || lowres_flag;
M
Michael Niedermayer 已提交
1889
        const int block_size= lowres_flag ? 8>>s->avctx->lowres : 8;
1890

M
cleanup  
Michael Niedermayer 已提交
1891 1892 1893
        /* avoid copy if macroblock skipped in last frame too */
        /* skip only during decoding as we might trash the buffers during encoding a bit */
        if(!s->encoding){
1894
            uint8_t *mbskip_ptr = &s->mbskip_table[mb_xy];
M
cleanup  
Michael Niedermayer 已提交
1895
            const int age= s->current_picture.age;
M
Michael Niedermayer 已提交
1896

M
cleanup  
Michael Niedermayer 已提交
1897 1898
            assert(age);

1899 1900
            if (s->mb_skipped) {
                s->mb_skipped= 0;
1901
                assert(s->pict_type!=FF_I_TYPE);
1902

1903
                (*mbskip_ptr) ++; /* indicate that this time we skipped it */
M
Michael Niedermayer 已提交
1904 1905
                if(*mbskip_ptr >99) *mbskip_ptr= 99;

M
cleanup  
Michael Niedermayer 已提交
1906
                /* if previous was skipped too, then nothing to do !  */
1907 1908
                if (*mbskip_ptr >= age && s->current_picture.reference){
                    return;
M
cleanup  
Michael Niedermayer 已提交
1909
                }
1910 1911 1912 1913
            } else if(!s->current_picture.reference){
                (*mbskip_ptr) ++; /* increase counter so the age can be compared cleanly */
                if(*mbskip_ptr >99) *mbskip_ptr= 99;
            } else{
1914 1915
                *mbskip_ptr = 0; /* not skipped */
            }
M
Michael Niedermayer 已提交
1916
        }
1917

1918
        dct_linesize = linesize << s->interlaced_dct;
M
Michael Niedermayer 已提交
1919
        dct_offset =(s->interlaced_dct)? linesize : linesize*block_size;
1920

1921 1922 1923 1924 1925
        if(readable){
            dest_y=  s->dest[0];
            dest_cb= s->dest[1];
            dest_cr= s->dest[2];
        }else{
1926
            dest_y = s->b_scratchpad;
1927
            dest_cb= s->b_scratchpad+16*linesize;
1928
            dest_cr= s->b_scratchpad+32*linesize;
1929
        }
M
Michael Niedermayer 已提交
1930

F
Fabrice Bellard 已提交
1931 1932
        if (!s->mb_intra) {
            /* motion handling */
1933
            /* decoding or more than one mb_type (MC was already done otherwise) */
1934
            if(!s->encoding){
M
Michael Niedermayer 已提交
1935 1936
                if(lowres_flag){
                    h264_chroma_mc_func *op_pix = s->dsp.put_h264_chroma_pixels_tab;
F
Fabrice Bellard 已提交
1937

M
Michael Niedermayer 已提交
1938 1939 1940 1941 1942 1943 1944 1945
                    if (s->mv_dir & MV_DIR_FORWARD) {
                        MPV_motion_lowres(s, dest_y, dest_cb, dest_cr, 0, s->last_picture.data, op_pix);
                        op_pix = s->dsp.avg_h264_chroma_pixels_tab;
                    }
                    if (s->mv_dir & MV_DIR_BACKWARD) {
                        MPV_motion_lowres(s, dest_y, dest_cb, dest_cr, 1, s->next_picture.data, op_pix);
                    }
                }else{
1946
                    op_qpix= s->me.qpel_put;
1947
                    if ((!s->no_rounding) || s->pict_type==FF_B_TYPE){
M
Michael Niedermayer 已提交
1948 1949 1950 1951 1952 1953 1954
                        op_pix = s->dsp.put_pixels_tab;
                    }else{
                        op_pix = s->dsp.put_no_rnd_pixels_tab;
                    }
                    if (s->mv_dir & MV_DIR_FORWARD) {
                        MPV_motion(s, dest_y, dest_cb, dest_cr, 0, s->last_picture.data, op_pix, op_qpix);
                        op_pix = s->dsp.avg_pixels_tab;
1955
                        op_qpix= s->me.qpel_avg;
M
Michael Niedermayer 已提交
1956 1957 1958 1959
                    }
                    if (s->mv_dir & MV_DIR_BACKWARD) {
                        MPV_motion(s, dest_y, dest_cb, dest_cr, 1, s->next_picture.data, op_pix, op_qpix);
                    }
1960
                }
F
Fabrice Bellard 已提交
1961 1962
            }

M
Michael Niedermayer 已提交
1963
            /* skip dequant / idct if we are really late ;) */
M
Michael Niedermayer 已提交
1964
            if(s->avctx->skip_idct){
1965 1966
                if(  (s->avctx->skip_idct >= AVDISCARD_NONREF && s->pict_type == FF_B_TYPE)
                   ||(s->avctx->skip_idct >= AVDISCARD_NONKEY && s->pict_type != FF_I_TYPE)
M
Michael Niedermayer 已提交
1967 1968 1969
                   || s->avctx->skip_idct >= AVDISCARD_ALL)
                    goto skip_idct;
            }
M
Michael Niedermayer 已提交
1970

F
Fabrice Bellard 已提交
1971
            /* add dct residue */
M
Michael Niedermayer 已提交
1972
            if(s->encoding || !(   s->h263_msmpeg4 || s->codec_id==CODEC_ID_MPEG1VIDEO || s->codec_id==CODEC_ID_MPEG2VIDEO
1973
                                || (s->codec_id==CODEC_ID_MPEG4 && !s->mpeg_quant))){
M
Michael Niedermayer 已提交
1974 1975 1976 1977
                add_dequant_dct(s, block[0], 0, dest_y                          , dct_linesize, s->qscale);
                add_dequant_dct(s, block[1], 1, dest_y              + block_size, dct_linesize, s->qscale);
                add_dequant_dct(s, block[2], 2, dest_y + dct_offset             , dct_linesize, s->qscale);
                add_dequant_dct(s, block[3], 3, dest_y + dct_offset + block_size, dct_linesize, s->qscale);
M
Michael Niedermayer 已提交
1978

1979
                if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
1980 1981 1982 1983 1984 1985 1986 1987 1988 1989 1990
                    if (s->chroma_y_shift){
                        add_dequant_dct(s, block[4], 4, dest_cb, uvlinesize, s->chroma_qscale);
                        add_dequant_dct(s, block[5], 5, dest_cr, uvlinesize, s->chroma_qscale);
                    }else{
                        dct_linesize >>= 1;
                        dct_offset >>=1;
                        add_dequant_dct(s, block[4], 4, dest_cb,              dct_linesize, s->chroma_qscale);
                        add_dequant_dct(s, block[5], 5, dest_cr,              dct_linesize, s->chroma_qscale);
                        add_dequant_dct(s, block[6], 6, dest_cb + dct_offset, dct_linesize, s->chroma_qscale);
                        add_dequant_dct(s, block[7], 7, dest_cr + dct_offset, dct_linesize, s->chroma_qscale);
                    }
M
Michael Niedermayer 已提交
1991
                }
K
Keiji Costantini 已提交
1992
            } else if(is_mpeg12 || (s->codec_id != CODEC_ID_WMV2)){
M
Michael Niedermayer 已提交
1993 1994 1995 1996
                add_dct(s, block[0], 0, dest_y                          , dct_linesize);
                add_dct(s, block[1], 1, dest_y              + block_size, dct_linesize);
                add_dct(s, block[2], 2, dest_y + dct_offset             , dct_linesize);
                add_dct(s, block[3], 3, dest_y + dct_offset + block_size, dct_linesize);
F
Fabrice Bellard 已提交
1997

1998
                if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
1999 2000 2001 2002 2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017 2018 2019
                    if(s->chroma_y_shift){//Chroma420
                        add_dct(s, block[4], 4, dest_cb, uvlinesize);
                        add_dct(s, block[5], 5, dest_cr, uvlinesize);
                    }else{
                        //chroma422
                        dct_linesize = uvlinesize << s->interlaced_dct;
                        dct_offset =(s->interlaced_dct)? uvlinesize : uvlinesize*8;

                        add_dct(s, block[4], 4, dest_cb, dct_linesize);
                        add_dct(s, block[5], 5, dest_cr, dct_linesize);
                        add_dct(s, block[6], 6, dest_cb+dct_offset, dct_linesize);
                        add_dct(s, block[7], 7, dest_cr+dct_offset, dct_linesize);
                        if(!s->chroma_x_shift){//Chroma444
                            add_dct(s, block[8], 8, dest_cb+8, dct_linesize);
                            add_dct(s, block[9], 9, dest_cr+8, dct_linesize);
                            add_dct(s, block[10], 10, dest_cb+8+dct_offset, dct_linesize);
                            add_dct(s, block[11], 11, dest_cr+8+dct_offset, dct_linesize);
                        }
                    }
                }//fi gray
            }
2020
            else if (CONFIG_WMV2_DECODER || CONFIG_WMV2_ENCODER) {
M
Michael Niedermayer 已提交
2021
                ff_wmv2_add_mb(s, block, dest_y, dest_cb, dest_cr);
M
Michael Niedermayer 已提交
2022
            }
F
Fabrice Bellard 已提交
2023 2024
        } else {
            /* dct only in intra block */
M
Michael Niedermayer 已提交
2025
            if(s->encoding || !(s->codec_id==CODEC_ID_MPEG1VIDEO || s->codec_id==CODEC_ID_MPEG2VIDEO)){
M
Michael Niedermayer 已提交
2026 2027 2028 2029
                put_dct(s, block[0], 0, dest_y                          , dct_linesize, s->qscale);
                put_dct(s, block[1], 1, dest_y              + block_size, dct_linesize, s->qscale);
                put_dct(s, block[2], 2, dest_y + dct_offset             , dct_linesize, s->qscale);
                put_dct(s, block[3], 3, dest_y + dct_offset + block_size, dct_linesize, s->qscale);
2030

2031
                if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
2032 2033 2034 2035 2036 2037 2038 2039 2040
                    if(s->chroma_y_shift){
                        put_dct(s, block[4], 4, dest_cb, uvlinesize, s->chroma_qscale);
                        put_dct(s, block[5], 5, dest_cr, uvlinesize, s->chroma_qscale);
                    }else{
                        dct_offset >>=1;
                        dct_linesize >>=1;
                        put_dct(s, block[4], 4, dest_cb,              dct_linesize, s->chroma_qscale);
                        put_dct(s, block[5], 5, dest_cr,              dct_linesize, s->chroma_qscale);
                        put_dct(s, block[6], 6, dest_cb + dct_offset, dct_linesize, s->chroma_qscale);
B
Benoit Fouet 已提交
2041
                        put_dct(s, block[7], 7, dest_cr + dct_offset, dct_linesize, s->chroma_qscale);
M
Michael Niedermayer 已提交
2042 2043 2044
                    }
                }
            }else{
B
Benoit Fouet 已提交
2045 2046 2047 2048
                s->dsp.idct_put(dest_y                          , dct_linesize, block[0]);
                s->dsp.idct_put(dest_y              + block_size, dct_linesize, block[1]);
                s->dsp.idct_put(dest_y + dct_offset             , dct_linesize, block[2]);
                s->dsp.idct_put(dest_y + dct_offset + block_size, dct_linesize, block[3]);
2049

2050
                if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){
B
Benoit Fouet 已提交
2051 2052 2053 2054
                    if(s->chroma_y_shift){
                        s->dsp.idct_put(dest_cb, uvlinesize, block[4]);
                        s->dsp.idct_put(dest_cr, uvlinesize, block[5]);
                    }else{
2055

B
Benoit Fouet 已提交
2056 2057
                        dct_linesize = uvlinesize << s->interlaced_dct;
                        dct_offset =(s->interlaced_dct)? uvlinesize : uvlinesize*8;
2058

B
Benoit Fouet 已提交
2059 2060 2061 2062 2063 2064 2065 2066 2067 2068 2069 2070
                        s->dsp.idct_put(dest_cb,              dct_linesize, block[4]);
                        s->dsp.idct_put(dest_cr,              dct_linesize, block[5]);
                        s->dsp.idct_put(dest_cb + dct_offset, dct_linesize, block[6]);
                        s->dsp.idct_put(dest_cr + dct_offset, dct_linesize, block[7]);
                        if(!s->chroma_x_shift){//Chroma444
                            s->dsp.idct_put(dest_cb + 8,              dct_linesize, block[8]);
                            s->dsp.idct_put(dest_cr + 8,              dct_linesize, block[9]);
                            s->dsp.idct_put(dest_cb + 8 + dct_offset, dct_linesize, block[10]);
                            s->dsp.idct_put(dest_cr + 8 + dct_offset, dct_linesize, block[11]);
                        }
                    }
                }//gray
2071
            }
M
Michael Niedermayer 已提交
2072
        }
B
Benoit Fouet 已提交
2073 2074 2075 2076 2077
skip_idct:
        if(!readable){
            s->dsp.put_pixels_tab[0][0](s->dest[0], dest_y ,   linesize,16);
            s->dsp.put_pixels_tab[s->chroma_x_shift][0](s->dest[1], dest_cb, uvlinesize,16 >> s->chroma_y_shift);
            s->dsp.put_pixels_tab[s->chroma_x_shift][0](s->dest[2], dest_cr, uvlinesize,16 >> s->chroma_y_shift);
2078
        }
M
Michael Niedermayer 已提交
2079 2080 2081
    }
}

B
Benoit Fouet 已提交
2082
/**
 * Hand one macroblock to MPV_decode_mb_internal().
 *
 * Every call passes literal constants for the two trailing arguments: the
 * third is 1 when s->avctx->lowres is non-zero, the fourth is 1 only when
 * CONFIG_SMALL is off and s->out_format is FMT_MPEG1.
 */
void MPV_decode_mb(MpegEncContext *s, DCTELEM block[12][64]){
#if !CONFIG_SMALL
    if (s->out_format == FMT_MPEG1) {
        if (s->avctx->lowres)
            MPV_decode_mb_internal(s, block, 1, 1);
        else
            MPV_decode_mb_internal(s, block, 0, 1);
        return;
    }
#endif
    if (s->avctx->lowres)
        MPV_decode_mb_internal(s, block, 1, 0);
    else
        MPV_decode_mb_internal(s, block, 0, 0);
}

B
Benoit Fouet 已提交
2093 2094 2095 2096 2097 2098 2099
/**
 * Call the user supplied avctx->draw_horiz_band callback, if one is set.
 *
 * @param s the codec context; nothing is done when s->avctx->draw_horiz_band
 *          is not set
 * @param y first row of the band; doubled for field pictures unless
 *          SLICE_FLAG_ALLOW_FIELD is set in avctx->slice_flags
 * @param h the normal band height; it is reduced automatically if needed
 *          for the last row
 */
void ff_draw_horiz_band(MpegEncContext *s, int y, int h){
    const int field_pic = s->picture_structure != PICT_FRAME;
    AVFrame *src;
    int offset[4] = { 0, 0, 0, 0 };
    int remaining;

    if (!s->avctx->draw_horiz_band)
        return;

    /* never report more rows than are left in the (field) picture */
    remaining = (s->avctx->height >> field_pic) - y;
    h = FFMIN(h, remaining);

    if (field_pic && !(s->avctx->slice_flags & SLICE_FLAG_ALLOW_FIELD)) {
        h <<= 1;
        y <<= 1;
        /* nothing is reported while s->first_field is set */
        if (s->first_field)
            return;
    }

    if (s->pict_type == FF_B_TYPE || s->low_delay ||
        (s->avctx->slice_flags & SLICE_FLAG_CODED_ORDER)) {
        src = (AVFrame*)s->current_picture_ptr;
    } else {
        if (!s->last_picture_ptr)
            return;
        src = (AVFrame*)s->last_picture_ptr;
    }

    /* frame B-pictures of non-H.264 formats keep all offsets at zero */
    if (s->pict_type != FF_B_TYPE || s->picture_structure != PICT_FRAME ||
        s->out_format == FMT_H264) {
        offset[0] = y * s->linesize;
        offset[2] = (y >> s->chroma_y_shift) * s->uvlinesize;
        offset[1] = offset[2];
    }

    emms_c();

    s->avctx->draw_horiz_band(s->avctx, src, offset,
                              y, s->picture_structure, h);
}
2136

B
Benoit Fouet 已提交
2137 2138 2139 2140
/**
 * Set s->block_index[0..5] and s->dest[0..2] from s->mb_x and s->mb_y.
 *
 * The horizontal part of both is computed for column s->mb_x - 1. The
 * vertical offset is added to s->dest[] unless this is a frame B-picture
 * and avctx->draw_horiz_band is set.
 */
void ff_init_block_index(MpegEncContext *s){ //FIXME maybe rename
    /* not s->linesize as this would be wrong for field pics */
    const int linesize   = s->current_picture.linesize[0];
    const int uvlinesize = s->current_picture.linesize[1];
    const int mb_size    = 4 - s->avctx->lowres;
    const int frame_pic  = s->picture_structure == PICT_FRAME;
    int mb_row;

    s->block_index[0] = s->b8_stride*(s->mb_y*2    ) - 2 + s->mb_x*2;
    s->block_index[1] = s->b8_stride*(s->mb_y*2    ) - 1 + s->mb_x*2;
    s->block_index[2] = s->b8_stride*(s->mb_y*2 + 1) - 2 + s->mb_x*2;
    s->block_index[3] = s->b8_stride*(s->mb_y*2 + 1) - 1 + s->mb_x*2;
    s->block_index[4] = s->mb_stride*(s->mb_y + 1)
                        + s->b8_stride*s->mb_height*2 + s->mb_x - 1;
    s->block_index[5] = s->mb_stride*(s->mb_y + s->mb_height + 2)
                        + s->b8_stride*s->mb_height*2 + s->mb_x - 1;
    //block_index is not used by mpeg2, so it is not affected by chroma_format

    s->dest[0] = s->current_picture.data[0] + ((s->mb_x - 1) << mb_size);
    s->dest[1] = s->current_picture.data[1] + ((s->mb_x - 1) << (mb_size - s->chroma_x_shift));
    s->dest[2] = s->current_picture.data[2] + ((s->mb_x - 1) << (mb_size - s->chroma_x_shift));

    if (s->pict_type == FF_B_TYPE && s->avctx->draw_horiz_band && frame_pic)
        return;

    /* field pictures advance by half the macroblock row number */
    mb_row = frame_pic ? s->mb_y : (s->mb_y >> 1);

    s->dest[0] += mb_row *   linesize << mb_size;
    s->dest[1] += mb_row * uvlinesize << (mb_size - s->chroma_y_shift);
    s->dest[2] += mb_row * uvlinesize << (mb_size - s->chroma_y_shift);

    if (!frame_pic)
        assert((s->mb_y&1) == (s->picture_structure == PICT_BOTTOM_FIELD));
}
2168

B
Benoit Fouet 已提交
2169 2170 2171
/**
 * Release buffered pictures and reset position and parser state.
 *
 * Does nothing when avctx->priv_data or its picture array is NULL.
 * Only pictures that have data[0] set and whose type is
 * FF_BUFFER_TYPE_INTERNAL or FF_BUFFER_TYPE_USER are passed to
 * free_frame_buffer().
 */
void ff_mpeg_flush(AVCodecContext *avctx){
    MpegEncContext *s = avctx->priv_data;
    int i;

    if (!s || !s->picture)
        return;

    for (i = 0; i < MAX_PICTURE_COUNT; i++) {
        if (!s->picture[i].data[0])
            continue;
        if (s->picture[i].type != FF_BUFFER_TYPE_INTERNAL &&
            s->picture[i].type != FF_BUFFER_TYPE_USER)
            continue;
        free_frame_buffer(s, &s->picture[i]);
    }

    s->next_picture_ptr    = NULL;
    s->last_picture_ptr    = NULL;
    s->current_picture_ptr = NULL;

    s->mb_y       = 0;
    s->mb_x       = 0;
    s->closed_gop = 0;

    s->parse_context.state             = -1;
    s->parse_context.frame_start_found = 0;
    s->parse_context.overread          = 0;
    s->parse_context.overread_index    = 0;
    s->parse_context.index             = 0;
    s->parse_context.last_index        = 0;
    s->bitstream_buffer_size           = 0;
    s->pp_time                         = 0;
}

2196
static void dct_unquantize_mpeg1_intra_c(MpegEncContext *s,
2197
                                   DCTELEM *block, int n, int qscale)
F
Fabrice Bellard 已提交
2198
{
M
Michael Niedermayer 已提交
2199
    int i, level, nCoeffs;
2200
    const uint16_t *quant_matrix;
F
Fabrice Bellard 已提交
2201

2202
    nCoeffs= s->block_last_index[n];
2203 2204

    if (n < 4)
2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221
        block[0] = block[0] * s->y_dc_scale;
    else
        block[0] = block[0] * s->c_dc_scale;
    /* XXX: only mpeg1 */
    quant_matrix = s->intra_matrix;
    for(i=1;i<=nCoeffs;i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
                level = (level - 1) | 1;
                level = -level;
            } else {
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
                level = (level - 1) | 1;
F
Fabrice Bellard 已提交
2222
            }
2223
            block[j] = level;
F
Fabrice Bellard 已提交
2224
        }
2225 2226 2227
    }
}

2228
static void dct_unquantize_mpeg1_inter_c(MpegEncContext *s,
2229 2230 2231 2232 2233 2234
                                   DCTELEM *block, int n, int qscale)
{
    int i, level, nCoeffs;
    const uint16_t *quant_matrix;

    nCoeffs= s->block_last_index[n];
2235

2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250
    quant_matrix = s->inter_matrix;
    for(i=0; i<=nCoeffs; i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
                level = (level - 1) | 1;
                level = -level;
            } else {
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
                level = (level - 1) | 1;
F
Fabrice Bellard 已提交
2251
            }
2252
            block[j] = level;
F
Fabrice Bellard 已提交
2253 2254 2255
        }
    }
}
2256

2257
static void dct_unquantize_mpeg2_intra_c(MpegEncContext *s,
2258 2259 2260
                                   DCTELEM *block, int n, int qscale)
{
    int i, level, nCoeffs;
2261
    const uint16_t *quant_matrix;
2262

2263 2264
    if(s->alternate_scan) nCoeffs= 63;
    else nCoeffs= s->block_last_index[n];
2265 2266

    if (n < 4)
2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281 2282 2283 2284 2285 2286
        block[0] = block[0] * s->y_dc_scale;
    else
        block[0] = block[0] * s->c_dc_scale;
    quant_matrix = s->intra_matrix;
    for(i=1;i<=nCoeffs;i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
                level = -level;
            } else {
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
            }
            block[j] = level;
        }
    }
}

2287 2288 2289 2290 2291 2292 2293 2294 2295 2296 2297 2298 2299 2300 2301 2302 2303 2304 2305 2306 2307 2308 2309 2310 2311 2312 2313 2314 2315 2316 2317 2318 2319
/**
 * Dequantize an intra block in place (MPEG-2 variant) and adjust block[63].
 *
 * The coefficients are handled as in the plain MPEG-2 intra case:
 * block[0] is scaled by s->y_dc_scale (n < 4) or s->c_dc_scale, and each
 * non-zero coefficient at scan positions 1..last becomes
 * (|level| * qscale * s->intra_matrix[pos]) >> 3 with its original sign.
 * In addition the dequantized values written by the loop are summed,
 * starting from -1, and the lowest bit of that sum is XORed into block[63].
 */
static void dct_unquantize_mpeg2_intra_bitexact(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale)
{
    const int last = s->alternate_scan ? 63 : s->block_last_index[n];
    const uint16_t *const matrix = s->intra_matrix;
    int parity = -1;
    int i;

    block[0] *= (n < 4) ? s->y_dc_scale : s->c_dc_scale;

    for (i = 1; i <= last; i++) {
        const int pos  = s->intra_scantable.permutated[i];
        const int coef = block[pos];
        int mag, value;

        if (!coef)
            continue;

        mag   = coef < 0 ? -coef : coef;
        mag   = (int)(mag * qscale * matrix[pos]) >> 3;
        value = coef < 0 ? -mag : mag;

        block[pos] = value;
        /* accumulate the full int value, not the stored DCTELEM */
        parity += value;
    }
    block[63] ^= parity & 1;
}

2320
static void dct_unquantize_mpeg2_inter_c(MpegEncContext *s,
2321 2322 2323 2324 2325 2326 2327 2328
                                   DCTELEM *block, int n, int qscale)
{
    int i, level, nCoeffs;
    const uint16_t *quant_matrix;
    int sum=-1;

    if(s->alternate_scan) nCoeffs= 63;
    else nCoeffs= s->block_last_index[n];
2329

2330 2331 2332 2333 2334 2335 2336 2337 2338 2339 2340 2341 2342 2343 2344 2345 2346 2347 2348 2349 2350
    quant_matrix = s->inter_matrix;
    for(i=0; i<=nCoeffs; i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
                level = -level;
            } else {
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
            }
            block[j] = level;
            sum+=level;
        }
    }
    block[63]^=sum&1;
}

2351
static void dct_unquantize_h263_intra_c(MpegEncContext *s,
2352 2353 2354 2355
                                  DCTELEM *block, int n, int qscale)
{
    int i, level, qmul, qadd;
    int nCoeffs;
2356

2357
    assert(s->block_last_index[n]>=0);
2358

2359
    qmul = qscale << 1;
2360

2361
    if (!s->h263_aic) {
2362
        if (n < 4)
2363 2364 2365
            block[0] = block[0] * s->y_dc_scale;
        else
            block[0] = block[0] * s->c_dc_scale;
2366 2367 2368 2369 2370 2371 2372 2373 2374 2375 2376 2377 2378 2379 2380 2381
        qadd = (qscale - 1) | 1;
    }else{
        qadd = 0;
    }
    if(s->ac_pred)
        nCoeffs=63;
    else
        nCoeffs= s->inter_scantable.raster_end[ s->block_last_index[n] ];

    for(i=1; i<=nCoeffs; i++) {
        level = block[i];
        if (level) {
            if (level < 0) {
                level = level * qmul - qadd;
            } else {
                level = level * qmul + qadd;
2382
            }
2383
            block[i] = level;
2384 2385 2386 2387
        }
    }
}

2388
static void dct_unquantize_h263_inter_c(MpegEncContext *s,
2389 2390 2391
                                  DCTELEM *block, int n, int qscale)
{
    int i, level, qmul, qadd;
M
Michael Niedermayer 已提交
2392
    int nCoeffs;
2393

2394
    assert(s->block_last_index[n]>=0);
2395

2396 2397
    qadd = (qscale - 1) | 1;
    qmul = qscale << 1;
2398

2399
    nCoeffs= s->inter_scantable.raster_end[ s->block_last_index[n] ];
2400

2401
    for(i=0; i<=nCoeffs; i++) {
2402 2403 2404 2405 2406 2407 2408 2409 2410 2411 2412
        level = block[i];
        if (level) {
            if (level < 0) {
                level = level * qmul - qadd;
            } else {
                level = level * qmul + qadd;
            }
            block[i] = level;
        }
    }
}
F
Fabrice Bellard 已提交
2413

2414 2415 2416 2417 2418 2419 2420 2421 2422 2423 2424 2425 2426 2427 2428 2429
/**
 * Set qscale and update the variables that depend on it.
 *
 * qscale is clamped to the range 1..31 before use. s->chroma_qscale is
 * looked up from s->chroma_qscale_table, s->y_dc_scale from
 * s->y_dc_scale_table (indexed by the clamped qscale) and s->c_dc_scale
 * from s->c_dc_scale_table (indexed by the new chroma qscale).
 */
void ff_set_qscale(MpegEncContext * s, int qscale)
{
    const int clamped = qscale < 1 ? 1 : (qscale > 31 ? 31 : qscale);

    s->qscale        = clamped;
    s->chroma_qscale = s->chroma_qscale_table[clamped];

    s->y_dc_scale = s->y_dc_scale_table[clamped];
    s->c_dc_scale = s->c_dc_scale_table[s->chroma_qscale];
}