mpegvideo.c 251.7 KB
Newer Older
F
Fabrice Bellard 已提交
1 2
/*
 * The simplest mpeg encoder (well, it was the simplest!)
F
Fabrice Bellard 已提交
3
 * Copyright (c) 2000,2001 Fabrice Bellard.
4
 * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at>
F
Fabrice Bellard 已提交
5
 *
6 7 8
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
F
Fabrice Bellard 已提交
9 10
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
11
 * version 2.1 of the License, or (at your option) any later version.
F
Fabrice Bellard 已提交
12
 *
13
 * FFmpeg is distributed in the hope that it will be useful,
F
Fabrice Bellard 已提交
14
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
F
Fabrice Bellard 已提交
15 16
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
F
Fabrice Bellard 已提交
17
 *
F
Fabrice Bellard 已提交
18
 * You should have received a copy of the GNU Lesser General Public
19
 * License along with FFmpeg; if not, write to the Free Software
20
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
M
Michael Niedermayer 已提交
21
 *
22
 * 4MV & hq & b-frame encoding stuff by Michael Niedermayer <michaelni@gmx.at>
F
Fabrice Bellard 已提交
23
 */
24

M
Michael Niedermayer 已提交
25 26 27
/**
 * @file mpegvideo.c
 * The simplest mpeg encoder (well, it was the simplest!).
28 29
 */

F
Fabrice Bellard 已提交
30 31 32
#include "avcodec.h"
#include "dsputil.h"
#include "mpegvideo.h"
33
#include "msmpeg4.h"
M
Michael Niedermayer 已提交
34
#include "faandct.h"
35
#include <limits.h>
F
Fabrice Bellard 已提交
36

37
#ifdef USE_FASTMEMCPY
38
#include "libvo/fastmemcpy.h"
39 40
#endif

41 42
//#undef NDEBUG
//#include <assert.h>
43

44
#ifdef CONFIG_ENCODERS
45
static int encode_picture(MpegEncContext *s, int picture_number);
46
#endif //CONFIG_ENCODERS
47
static void dct_unquantize_mpeg1_intra_c(MpegEncContext *s,
48
                                   DCTELEM *block, int n, int qscale);
49
static void dct_unquantize_mpeg1_inter_c(MpegEncContext *s,
50
                                   DCTELEM *block, int n, int qscale);
51 52
static void dct_unquantize_mpeg2_intra_c(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale);
53 54
static void dct_unquantize_mpeg2_intra_bitexact(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale);
55 56
static void dct_unquantize_mpeg2_inter_c(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale);
57
static void dct_unquantize_h263_intra_c(MpegEncContext *s,
58
                                  DCTELEM *block, int n, int qscale);
59
static void dct_unquantize_h263_inter_c(MpegEncContext *s,
60
                                  DCTELEM *block, int n, int qscale);
61
static void draw_edges_c(uint8_t *buf, int wrap, int width, int height, int w);
62
#ifdef CONFIG_ENCODERS
63
static int dct_quantize_c(MpegEncContext *s, DCTELEM *block, int n, int qscale, int *overflow);
M
Michael Niedermayer 已提交
64
static int dct_quantize_trellis_c(MpegEncContext *s, DCTELEM *block, int n, int qscale, int *overflow);
M
Michael Niedermayer 已提交
65
static int dct_quantize_refine(MpegEncContext *s, DCTELEM *block, int16_t *weight, DCTELEM *orig, int n, int qscale);
66
static int sse_mb(MpegEncContext *s);
M
Michael Niedermayer 已提交
67
static void  denoise_dct_c(MpegEncContext *s, DCTELEM *block);
68
#endif //CONFIG_ENCODERS
M
Michael Niedermayer 已提交
69

I
Ivan Kalvachev 已提交
70 71 72
#ifdef HAVE_XVMC
extern int  XVMC_field_start(MpegEncContext*s, AVCodecContext *avctx);
extern void XVMC_field_end(MpegEncContext *s);
73
extern void XVMC_decode_mb(MpegEncContext *s);
I
Ivan Kalvachev 已提交
74 75
#endif

76
void (*draw_edges)(uint8_t *buf, int wrap, int width, int height, int w)= draw_edges_c;
M
Michael Niedermayer 已提交
77

F
Fabrice Bellard 已提交
78 79 80 81 82 83

/* enable all paranoid tests for rounding, overflows, etc... */
//#define PARANOID

//#define DEBUG

84

F
Fabrice Bellard 已提交
85 86 87
/* for jpeg fast DCT */
#define CONST_BITS 14

88
static const uint16_t aanscales[64] = {
F
Fabrice Bellard 已提交
89 90 91 92 93 94 95
    /* precomputed values scaled up by 14 bits */
    16384, 22725, 21407, 19266, 16384, 12873,  8867,  4520,
    22725, 31521, 29692, 26722, 22725, 17855, 12299,  6270,
    21407, 29692, 27969, 25172, 21407, 16819, 11585,  5906,
    19266, 26722, 25172, 22654, 19266, 15137, 10426,  5315,
    16384, 22725, 21407, 19266, 16384, 12873,  8867,  4520,
    12873, 17855, 16819, 15137, 12873, 10114,  6967,  3552,
M
Michael Niedermayer 已提交
96 97
    8867 , 12299, 11585, 10426,  8867,  6967,  4799,  2446,
    4520 ,  6270,  5906,  5315,  4520,  3552,  2446,  1247
F
Fabrice Bellard 已提交
98 99
};

100
static const uint8_t h263_chroma_roundtab[16] = {
101
//  0  1  2  3  4  5  6  7  8  9 10 11 12 13 14 15
F
Fabrice Bellard 已提交
102 103 104
    0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2,
};

M
Michael Niedermayer 已提交
105 106 107 108 109
static const uint8_t ff_default_chroma_qscale_table[32]={
//  0  1  2  3  4  5  6  7  8  9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31
    0, 1, 2, 3, 4, 5, 6, 7, 8, 9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31
};

110
#ifdef CONFIG_ENCODERS
111
static uint8_t default_mv_penalty[MAX_FCODE+1][MAX_MV*2+1];
112
static uint8_t default_fcode_tab[MAX_MV*2+1];
113

M
Michael Niedermayer 已提交
114 115
enum PixelFormat ff_yuv420p_list[2]= {PIX_FMT_YUV420P, -1};

116
static void convert_matrix(DSPContext *dsp, int (*qmat)[64], uint16_t (*qmat16)[2][64],
117
                           const uint16_t *quant_matrix, int bias, int qmin, int qmax, int intra)
F
Fabrice Bellard 已提交
118
{
119
    int qscale;
120
    int shift=0;
121

122
    for(qscale=qmin; qscale<=qmax; qscale++){
123
        int i;
124
        if (dsp->fdct == ff_jpeg_fdct_islow
125
#ifdef FAAN_POSTSCALE
126
            || dsp->fdct == ff_faandct
127 128
#endif
            ) {
129
            for(i=0;i<64;i++) {
130
                const int j= dsp->idct_permutation[i];
131 132 133 134
                /* 16 <= qscale * quant_matrix[i] <= 7905 */
                /* 19952         <= aanscales[i] * qscale * quant_matrix[i]           <= 249205026 */
                /* (1<<36)/19952 >= (1<<36)/(aanscales[i] * qscale * quant_matrix[i]) >= (1<<36)/249205026 */
                /* 3444240       >= (1<<36)/(aanscales[i] * qscale * quant_matrix[i]) >= 275 */
135

136
                qmat[qscale][i] = (int)((UINT64_C(1) << QMAT_SHIFT) /
137 138
                                (qscale * quant_matrix[j]));
            }
139
        } else if (dsp->fdct == fdct_ifast
140
#ifndef FAAN_POSTSCALE
141
                   || dsp->fdct == ff_faandct
142 143
#endif
                   ) {
144
            for(i=0;i<64;i++) {
145
                const int j= dsp->idct_permutation[i];
146 147 148 149
                /* 16 <= qscale * quant_matrix[i] <= 7905 */
                /* 19952         <= aanscales[i] * qscale * quant_matrix[i]           <= 249205026 */
                /* (1<<36)/19952 >= (1<<36)/(aanscales[i] * qscale * quant_matrix[i]) >= (1<<36)/249205026 */
                /* 3444240       >= (1<<36)/(aanscales[i] * qscale * quant_matrix[i]) >= 275 */
150

151
                qmat[qscale][i] = (int)((UINT64_C(1) << (QMAT_SHIFT + 14)) /
152 153 154 155
                                (aanscales[i] * qscale * quant_matrix[j]));
            }
        } else {
            for(i=0;i<64;i++) {
156
                const int j= dsp->idct_permutation[i];
157 158 159 160 161
                /* We can safely suppose that 16 <= quant_matrix[i] <= 255
                   So 16           <= qscale * quant_matrix[i]             <= 7905
                   so (1<<19) / 16 >= (1<<19) / (qscale * quant_matrix[i]) >= (1<<19) / 7905
                   so 32768        >= (1<<19) / (qscale * quant_matrix[i]) >= 67
                */
162
                qmat[qscale][i] = (int)((UINT64_C(1) << QMAT_SHIFT) / (qscale * quant_matrix[j]));
M
Michael Niedermayer 已提交
163
//                qmat  [qscale][i] = (1 << QMAT_SHIFT_MMX) / (qscale * quant_matrix[i]);
164
                qmat16[qscale][0][i] = (1 << QMAT_SHIFT_MMX) / (qscale * quant_matrix[j]);
165

166 167
                if(qmat16[qscale][0][i]==0 || qmat16[qscale][0][i]==128*256) qmat16[qscale][0][i]=128*256-1;
                qmat16[qscale][1][i]= ROUNDED_DIV(bias<<(16-QUANT_BIAS_SHIFT), qmat16[qscale][0][i]);
168
            }
F
Fabrice Bellard 已提交
169
        }
170

171
        for(i=intra; i<64; i++){
172 173 174 175 176 177 178 179
            int64_t max= 8191;
            if (dsp->fdct == fdct_ifast
#ifndef FAAN_POSTSCALE
                   || dsp->fdct == ff_faandct
#endif
                   ) {
                max= (8191LL*aanscales[i]) >> 14;
            }
180
            while(((max * qmat[qscale][i]) >> shift) > INT_MAX){
181 182 183 184 185
                shift++;
            }
        }
    }
    if(shift){
M
Michel Bardiaux 已提交
186
        av_log(NULL, AV_LOG_INFO, "Warning, QMAT_SHIFT is larger than %d, overflows possible\n", QMAT_SHIFT - shift);
F
Fabrice Bellard 已提交
187 188
    }
}
189 190 191

static inline void update_qscale(MpegEncContext *s){
    s->qscale= (s->lambda*139 + FF_LAMBDA_SCALE*64) >> (FF_LAMBDA_SHIFT + 7);
192
    s->qscale= av_clip(s->qscale, s->avctx->qmin, s->avctx->qmax);
193

194 195
    s->lambda2= (s->lambda*s->lambda + FF_LAMBDA_SCALE/2) >> FF_LAMBDA_SHIFT;
}
196 197
#endif //CONFIG_ENCODERS

M
Michael Niedermayer 已提交
198
void ff_init_scantable(uint8_t *permutation, ScanTable *st, const uint8_t *src_scantable){
199 200
    int i;
    int end;
201

M
Michael Niedermayer 已提交
202
    st->scantable= src_scantable;
203 204 205 206

    for(i=0; i<64; i++){
        int j;
        j = src_scantable[i];
M
Michael Niedermayer 已提交
207
        st->permutated[i] = permutation[j];
208 209 210
#ifdef ARCH_POWERPC
        st->inverse[j] = i;
#endif
211
    }
212

213 214 215 216 217 218 219 220 221
    end=-1;
    for(i=0; i<64; i++){
        int j;
        j = st->permutated[i];
        if(j>end) end=j;
        st->raster_end[i]= end;
    }
}

222
#ifdef CONFIG_ENCODERS
M
Måns Rullgård 已提交
223
void ff_write_quant_matrix(PutBitContext *pb, uint16_t *matrix){
224 225 226 227 228 229 230 231 232 233
    int i;

    if(matrix){
        put_bits(pb, 1, 1);
        for(i=0;i<64;i++) {
            put_bits(pb, 8, matrix[ ff_zigzag_direct[i] ]);
        }
    }else
        put_bits(pb, 1, 0);
}
234
#endif //CONFIG_ENCODERS
235

M
Michael Niedermayer 已提交
236 237 238
const uint8_t *ff_find_start_code(const uint8_t * restrict p, const uint8_t *end, uint32_t * restrict state){
    int i;

M
Michael Niedermayer 已提交
239 240 241 242
    assert(p<=end);
    if(p>=end)
        return end;

M
Michael Niedermayer 已提交
243 244 245 246 247 248 249 250
    for(i=0; i<3; i++){
        uint32_t tmp= *state << 8;
        *state= tmp + *(p++);
        if(tmp == 0x100 || p==end)
            return p;
    }

    while(p<end){
M
Michael Niedermayer 已提交
251 252 253
        if     (p[-1] > 1      ) p+= 3;
        else if(p[-2]          ) p+= 2;
        else if(p[-3]|(p[-1]-1)) p++;
M
Michael Niedermayer 已提交
254 255 256 257 258 259
        else{
            p++;
            break;
        }
    }

M
Michael Niedermayer 已提交
260
    p= FFMIN(p, end)-4;
M
Michael Niedermayer 已提交
261 262 263 264 265
    *state=  be2me_32(unaligned32(p));

    return p+4;
}

266 267
/* init common dct for both encoder and decoder */
int DCT_common_init(MpegEncContext *s)
F
Fabrice Bellard 已提交
268
{
269 270 271 272 273
    s->dct_unquantize_h263_intra = dct_unquantize_h263_intra_c;
    s->dct_unquantize_h263_inter = dct_unquantize_h263_inter_c;
    s->dct_unquantize_mpeg1_intra = dct_unquantize_mpeg1_intra_c;
    s->dct_unquantize_mpeg1_inter = dct_unquantize_mpeg1_inter_c;
    s->dct_unquantize_mpeg2_intra = dct_unquantize_mpeg2_intra_c;
274 275
    if(s->flags & CODEC_FLAG_BITEXACT)
        s->dct_unquantize_mpeg2_intra = dct_unquantize_mpeg2_intra_bitexact;
276
    s->dct_unquantize_mpeg2_inter = dct_unquantize_mpeg2_inter_c;
277

278
#ifdef CONFIG_ENCODERS
279
    s->dct_quantize= dct_quantize_c;
M
Michael Niedermayer 已提交
280
    s->denoise_dct= denoise_dct_c;
281
#endif //CONFIG_ENCODERS
282

283
#ifdef HAVE_MMX
284
    MPV_common_init_mmx(s);
285 286 287
#endif
#ifdef ARCH_ALPHA
    MPV_common_init_axp(s);
N
Nick Kurshev 已提交
288
#endif
289 290 291
#ifdef HAVE_MLIB
    MPV_common_init_mlib(s);
#endif
292 293 294
#ifdef HAVE_MMI
    MPV_common_init_mmi(s);
#endif
295
#ifdef ARCH_ARMV4L
296
    MPV_common_init_armv4l(s);
297
#endif
298 299 300
#ifdef ARCH_POWERPC
    MPV_common_init_ppc(s);
#endif
301

302
#ifdef CONFIG_ENCODERS
303 304
    s->fast_dct_quantize= s->dct_quantize;

M
Michael Niedermayer 已提交
305 306 307 308
    if(s->flags&CODEC_FLAG_TRELLIS_QUANT){
        s->dct_quantize= dct_quantize_trellis_c; //move before MPV_common_init_*
    }

309 310
#endif //CONFIG_ENCODERS

311
    /* load & permutate scantables
312
       note: only wmv uses different ones
313
    */
M
Michael Niedermayer 已提交
314 315 316 317 318 319 320
    if(s->alternate_scan){
        ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable  , ff_alternate_vertical_scan);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable  , ff_alternate_vertical_scan);
    }else{
        ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable  , ff_zigzag_direct);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable  , ff_zigzag_direct);
    }
M
Michael Niedermayer 已提交
321 322
    ff_init_scantable(s->dsp.idct_permutation, &s->intra_h_scantable, ff_alternate_horizontal_scan);
    ff_init_scantable(s->dsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
323

324 325 326
    return 0;
}

327 328 329 330 331
static void copy_picture(Picture *dst, Picture *src){
    *dst = *src;
    dst->type= FF_BUFFER_TYPE_COPY;
}

332
#ifdef CONFIG_ENCODERS
333 334 335
static void copy_picture_attributes(MpegEncContext *s, AVFrame *dst, AVFrame *src){
    int i;

336 337 338 339 340 341 342 343
    dst->pict_type              = src->pict_type;
    dst->quality                = src->quality;
    dst->coded_picture_number   = src->coded_picture_number;
    dst->display_picture_number = src->display_picture_number;
//    dst->reference              = src->reference;
    dst->pts                    = src->pts;
    dst->interlaced_frame       = src->interlaced_frame;
    dst->top_field_first        = src->top_field_first;
344

345 346 347 348 349 350 351
    if(s->avctx->me_threshold){
        if(!src->motion_val[0])
            av_log(s->avctx, AV_LOG_ERROR, "AVFrame.motion_val not set!\n");
        if(!src->mb_type)
            av_log(s->avctx, AV_LOG_ERROR, "AVFrame.mb_type not set!\n");
        if(!src->ref_index[0])
            av_log(s->avctx, AV_LOG_ERROR, "AVFrame.ref_index not set!\n");
352
        if(src->motion_subsample_log2 != dst->motion_subsample_log2)
353
            av_log(s->avctx, AV_LOG_ERROR, "AVFrame.motion_subsample_log2 doesn't match! (%d!=%d)\n",
354
            src->motion_subsample_log2, dst->motion_subsample_log2);
355 356

        memcpy(dst->mb_type, src->mb_type, s->mb_stride * s->mb_height * sizeof(dst->mb_type[0]));
357

358
        for(i=0; i<2; i++){
359 360 361
            int stride= ((16*s->mb_width )>>src->motion_subsample_log2) + 1;
            int height= ((16*s->mb_height)>>src->motion_subsample_log2);

362 363 364 365
            if(src->motion_val[i] && src->motion_val[i] != dst->motion_val[i]){
                memcpy(dst->motion_val[i], src->motion_val[i], 2*stride*height*sizeof(int16_t));
            }
            if(src->ref_index[i] && src->ref_index[i] != dst->ref_index[i]){
366
                memcpy(dst->ref_index[i], src->ref_index[i], s->b8_stride*2*s->mb_height*sizeof(int8_t));
367
            }
368 369
        }
    }
370
}
371
#endif
372

M
cleanup  
Michael Niedermayer 已提交
373
/**
M
Michael Niedermayer 已提交
374 375
 * allocates a Picture
 * The pixels are allocated/set by calling get_buffer() if shared=0
M
cleanup  
Michael Niedermayer 已提交
376
 */
M
Michael Niedermayer 已提交
377
static int alloc_picture(MpegEncContext *s, Picture *pic, int shared){
378 379
    const int big_mb_num= s->mb_stride*(s->mb_height+1) + 1; //the +1 is needed so memset(,,stride*height) doesnt sig11
    const int mb_array_size= s->mb_stride*s->mb_height;
380 381
    const int b8_array_size= s->b8_stride*s->mb_height*2;
    const int b4_array_size= s->b4_stride*s->mb_height*4;
M
Michael Niedermayer 已提交
382
    int i;
383

M
Michael Niedermayer 已提交
384 385 386 387 388 389
    if(shared){
        assert(pic->data[0]);
        assert(pic->type == 0 || pic->type == FF_BUFFER_TYPE_SHARED);
        pic->type= FF_BUFFER_TYPE_SHARED;
    }else{
        int r;
390

M
Michael Niedermayer 已提交
391
        assert(!pic->data[0]);
392

M
Michael Niedermayer 已提交
393
        r= s->avctx->get_buffer(s->avctx, (AVFrame*)pic);
394

M
Michael Niedermayer 已提交
395
        if(r<0 || !pic->age || !pic->type || !pic->data[0]){
396
            av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed (%d %d %d %p)\n", r, pic->age, pic->type, pic->data[0]);
M
Michael Niedermayer 已提交
397 398 399 400
            return -1;
        }

        if(s->linesize && (s->linesize != pic->linesize[0] || s->uvlinesize != pic->linesize[1])){
401
            av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed (stride changed)\n");
M
Michael Niedermayer 已提交
402 403 404 405
            return -1;
        }

        if(pic->linesize[1] != pic->linesize[2]){
D
Diego Biurrun 已提交
406
            av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed (uv stride mismatch)\n");
M
Michael Niedermayer 已提交
407 408 409 410 411
            return -1;
        }

        s->linesize  = pic->linesize[0];
        s->uvlinesize= pic->linesize[1];
M
cleanup  
Michael Niedermayer 已提交
412
    }
413

M
Michael Niedermayer 已提交
414
    if(pic->qscale_table==NULL){
415
        if (s->encoding) {
416 417 418
            CHECKED_ALLOCZ(pic->mb_var   , mb_array_size * sizeof(int16_t))
            CHECKED_ALLOCZ(pic->mc_mb_var, mb_array_size * sizeof(int16_t))
            CHECKED_ALLOCZ(pic->mb_mean  , mb_array_size * sizeof(int8_t))
M
Michael Niedermayer 已提交
419
        }
M
cleanup  
Michael Niedermayer 已提交
420

421
        CHECKED_ALLOCZ(pic->mbskip_table , mb_array_size * sizeof(uint8_t)+2) //the +2 is for the slice end check
422
        CHECKED_ALLOCZ(pic->qscale_table , mb_array_size * sizeof(uint8_t))
423
        CHECKED_ALLOCZ(pic->mb_type_base , big_mb_num    * sizeof(uint32_t))
424
        pic->mb_type= pic->mb_type_base + s->mb_stride+1;
M
Michael Niedermayer 已提交
425 426
        if(s->out_format == FMT_H264){
            for(i=0; i<2; i++){
M
Michael Niedermayer 已提交
427 428
                CHECKED_ALLOCZ(pic->motion_val_base[i], 2 * (b4_array_size+4)  * sizeof(int16_t))
                pic->motion_val[i]= pic->motion_val_base[i]+4;
429
                CHECKED_ALLOCZ(pic->ref_index[i], b8_array_size * sizeof(uint8_t))
430
            }
M
Michael Niedermayer 已提交
431
            pic->motion_subsample_log2= 2;
432
        }else if(s->out_format == FMT_H263 || s->encoding || (s->avctx->debug&FF_DEBUG_MV) || (s->avctx->debug_mv)){
433
            for(i=0; i<2; i++){
M
Michael Niedermayer 已提交
434 435
                CHECKED_ALLOCZ(pic->motion_val_base[i], 2 * (b8_array_size+4) * sizeof(int16_t))
                pic->motion_val[i]= pic->motion_val_base[i]+4;
436
                CHECKED_ALLOCZ(pic->ref_index[i], b8_array_size * sizeof(uint8_t))
M
Michael Niedermayer 已提交
437
            }
M
Michael Niedermayer 已提交
438
            pic->motion_subsample_log2= 3;
M
Michael Niedermayer 已提交
439
        }
440 441 442
        if(s->avctx->debug&FF_DEBUG_DCT_COEFF) {
            CHECKED_ALLOCZ(pic->dct_coeff, 64 * mb_array_size * sizeof(DCTELEM)*6)
        }
443
        pic->qstride= s->mb_stride;
444
        CHECKED_ALLOCZ(pic->pan_scan , 1 * sizeof(AVPanScan))
M
Michael Niedermayer 已提交
445
    }
M
Michael Niedermayer 已提交
446

447 448 449 450
    //it might be nicer if the application would keep track of these but it would require a API change
    memmove(s->prev_pict_types+1, s->prev_pict_types, PREV_PICT_TYPES_BUFFER_SIZE-1);
    s->prev_pict_types[0]= s->pict_type;
    if(pic->age < PREV_PICT_TYPES_BUFFER_SIZE && s->prev_pict_types[pic->age] == B_TYPE)
451
        pic->age= INT_MAX; // skipped MBs in b frames are quite rare in mpeg1/2 and its a bit tricky to skip them anyway
452

M
cleanup  
Michael Niedermayer 已提交
453 454 455 456 457
    return 0;
fail: //for the CHECKED_ALLOCZ macro
    return -1;
}

M
Michael Niedermayer 已提交
458 459 460
/**
 * deallocates a picture
 */
M
cleanup  
Michael Niedermayer 已提交
461 462
static void free_picture(MpegEncContext *s, Picture *pic){
    int i;
M
Michael Niedermayer 已提交
463 464

    if(pic->data[0] && pic->type!=FF_BUFFER_TYPE_SHARED){
M
Michael Niedermayer 已提交
465
        s->avctx->release_buffer(s->avctx, (AVFrame*)pic);
M
Michael Niedermayer 已提交
466 467
    }

M
cleanup  
Michael Niedermayer 已提交
468 469 470 471 472
    av_freep(&pic->mb_var);
    av_freep(&pic->mc_mb_var);
    av_freep(&pic->mb_mean);
    av_freep(&pic->mbskip_table);
    av_freep(&pic->qscale_table);
M
Michael Niedermayer 已提交
473
    av_freep(&pic->mb_type_base);
474
    av_freep(&pic->dct_coeff);
475
    av_freep(&pic->pan_scan);
M
Michael Niedermayer 已提交
476 477
    pic->mb_type= NULL;
    for(i=0; i<2; i++){
478
        av_freep(&pic->motion_val_base[i]);
M
Michael Niedermayer 已提交
479 480
        av_freep(&pic->ref_index[i]);
    }
481

482
    if(pic->type == FF_BUFFER_TYPE_SHARED){
M
Michael Niedermayer 已提交
483 484 485 486
        for(i=0; i<4; i++){
            pic->base[i]=
            pic->data[i]= NULL;
        }
487
        pic->type= 0;
M
cleanup  
Michael Niedermayer 已提交
488 489 490
    }
}

491 492 493
static int init_duplicate_context(MpegEncContext *s, MpegEncContext *base){
    int i;

494
    // edge emu needs blocksize + filter length - 1 (=17x17 for halfpel / 21x21 for h264)
L
Loren Merritt 已提交
495 496
    CHECKED_ALLOCZ(s->allocated_edge_emu_buffer, (s->width+64)*2*21*2); //(width + edge + align)*interlaced*MBsize*tolerance
    s->edge_emu_buffer= s->allocated_edge_emu_buffer + (s->width+64)*2*21;
497 498

     //FIXME should be linesize instead of s->width*2 but that isnt known before get_buffer()
499
    CHECKED_ALLOCZ(s->me.scratchpad,  (s->width+64)*4*16*2*sizeof(uint8_t))
500 501 502 503 504 505 506 507 508
    s->rd_scratchpad=   s->me.scratchpad;
    s->b_scratchpad=    s->me.scratchpad;
    s->obmc_scratchpad= s->me.scratchpad + 16;
    if (s->encoding) {
        CHECKED_ALLOCZ(s->me.map      , ME_MAP_SIZE*sizeof(uint32_t))
        CHECKED_ALLOCZ(s->me.score_map, ME_MAP_SIZE*sizeof(uint32_t))
        if(s->avctx->noise_reduction){
            CHECKED_ALLOCZ(s->dct_error_sum, 2 * 64 * sizeof(int))
        }
509
    }
510
    CHECKED_ALLOCZ(s->blocks, 64*12*2 * sizeof(DCTELEM))
511 512 513 514 515 516 517 518 519 520 521 522 523 524 525
    s->block= s->blocks[0];

    for(i=0;i<12;i++){
        s->pblocks[i] = (short *)(&s->block[i]);
    }
    return 0;
fail:
    return -1; //free() through MPV_common_end()
}

static void free_duplicate_context(MpegEncContext *s){
    if(s==NULL) return;

    av_freep(&s->allocated_edge_emu_buffer); s->edge_emu_buffer= NULL;
    av_freep(&s->me.scratchpad);
526 527
    s->rd_scratchpad=
    s->b_scratchpad=
528
    s->obmc_scratchpad= NULL;
529

530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553
    av_freep(&s->dct_error_sum);
    av_freep(&s->me.map);
    av_freep(&s->me.score_map);
    av_freep(&s->blocks);
    s->block= NULL;
}

static void backup_duplicate_context(MpegEncContext *bak, MpegEncContext *src){
#define COPY(a) bak->a= src->a
    COPY(allocated_edge_emu_buffer);
    COPY(edge_emu_buffer);
    COPY(me.scratchpad);
    COPY(rd_scratchpad);
    COPY(b_scratchpad);
    COPY(obmc_scratchpad);
    COPY(me.map);
    COPY(me.score_map);
    COPY(blocks);
    COPY(block);
    COPY(start_mb_y);
    COPY(end_mb_y);
    COPY(me.map_generation);
    COPY(pb);
    COPY(dct_error_sum);
554 555
    COPY(dct_count[0]);
    COPY(dct_count[1]);
556 557 558
#undef COPY
}

559
void ff_update_duplicate_context(MpegEncContext *dst, MpegEncContext *src){
560
    MpegEncContext bak;
561
    int i;
562 563 564 565 566
    //FIXME copy only needed parts
//START_TIMER
    backup_duplicate_context(&bak, dst);
    memcpy(dst, src, sizeof(MpegEncContext));
    backup_duplicate_context(dst, &bak);
567 568 569
    for(i=0;i<12;i++){
        dst->pblocks[i] = (short *)(&dst->block[i]);
    }
570 571 572
//STOP_TIMER("update_duplicate_context") //about 10k cycles / 0.01 sec for 1000frames on 1ghz with 2 threads
}

573
#ifdef CONFIG_ENCODERS
574 575 576 577 578 579 580 581 582 583 584
static void update_duplicate_context_after_me(MpegEncContext *dst, MpegEncContext *src){
#define COPY(a) dst->a= src->a
    COPY(pict_type);
    COPY(current_picture);
    COPY(f_code);
    COPY(b_code);
    COPY(qscale);
    COPY(lambda);
    COPY(lambda2);
    COPY(picture_in_gop_number);
    COPY(gop_picture_number);
D
Diego Biurrun 已提交
585 586 587
    COPY(frame_pred_frame_dct); //FIXME don't set in encode_header
    COPY(progressive_frame); //FIXME don't set in encode_header
    COPY(partitioned_frame); //FIXME don't set in encode_header
588 589
#undef COPY
}
590
#endif
591

M
Michael Niedermayer 已提交
592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608
/**
 * sets the given MpegEncContext to common defaults (same for encoding and decoding).
 * the changed fields will not depend upon the prior state of the MpegEncContext.
 */
static void MPV_common_defaults(MpegEncContext *s){
    s->y_dc_scale_table=
    s->c_dc_scale_table= ff_mpeg1_dc_scale_table;
    s->chroma_qscale_table= ff_default_chroma_qscale_table;
    s->progressive_frame= 1;
    s->progressive_sequence= 1;
    s->picture_structure= PICT_FRAME;

    s->coded_picture_number = 0;
    s->picture_number = 0;
    s->input_picture_number = 0;

    s->picture_in_gop_number = 0;
609 610 611

    s->f_code = 1;
    s->b_code = 1;
M
Michael Niedermayer 已提交
612 613 614 615 616 617 618 619 620 621 622 623 624 625
}

/**
 * sets the given MpegEncContext to defaults for decoding.
 * the changed fields will not depend upon the prior state of the MpegEncContext.
 */
void MPV_decode_defaults(MpegEncContext *s){
    MPV_common_defaults(s);
}

/**
 * sets the given MpegEncContext to defaults for encoding.
 * the changed fields will not depend upon the prior state of the MpegEncContext.
 */
626 627

#ifdef CONFIG_ENCODERS
628
static void MPV_encode_defaults(MpegEncContext *s){
M
Michael Niedermayer 已提交
629
    int i;
M
Michael Niedermayer 已提交
630
    MPV_common_defaults(s);
631

M
Michael Niedermayer 已提交
632 633
    for(i=-16; i<16; i++){
        default_fcode_tab[i + MAX_MV]= 1;
M
Michael Niedermayer 已提交
634 635 636 637
    }
    s->me.mv_penalty= default_mv_penalty;
    s->fcode_tab= default_fcode_tab;
}
638
#endif //CONFIG_ENCODERS
M
Michael Niedermayer 已提交
639

640
/**
M
Michael Niedermayer 已提交
641 642 643
 * init common structure for both encoder and decoder.
 * this assumes that some variables like width/height are already set
 */
644 645
int MPV_common_init(MpegEncContext *s)
{
M
Michael Niedermayer 已提交
646
    int y_size, c_size, yc_size, i, mb_array_size, mv_table_size, x, y;
647

L
Loren Merritt 已提交
648 649 650
    s->mb_height = (s->height + 15) / 16;

    if(s->avctx->thread_count > MAX_THREADS || (s->avctx->thread_count > s->mb_height && s->mb_height)){
M
10l  
Michael Niedermayer 已提交
651 652 653 654
        av_log(s->avctx, AV_LOG_ERROR, "too many threads\n");
        return -1;
    }

655 656 657
    if((s->width || s->height) && avcodec_check_dimensions(s->avctx, s->width, s->height))
        return -1;

658
    dsputil_init(&s->dsp, s->avctx);
659
    DCT_common_init(s);
660

661
    s->flags= s->avctx->flags;
662
    s->flags2= s->avctx->flags2;
663

M
cleanup  
Michael Niedermayer 已提交
664
    s->mb_width  = (s->width  + 15) / 16;
665
    s->mb_stride = s->mb_width + 1;
666 667
    s->b8_stride = s->mb_width*2 + 1;
    s->b4_stride = s->mb_width*4 + 1;
668
    mb_array_size= s->mb_height * s->mb_stride;
M
Michael Niedermayer 已提交
669
    mv_table_size= (s->mb_height+2) * s->mb_stride + 1;
670

671 672 673 674
    /* set chroma shifts */
    avcodec_get_chroma_sub_sample(s->avctx->pix_fmt,&(s->chroma_x_shift),
                                                    &(s->chroma_y_shift) );

675 676 677
    /* set default edge pos, will be overriden in decode_header if needed */
    s->h_edge_pos= s->mb_width*16;
    s->v_edge_pos= s->mb_height*16;
678 679

    s->mb_num = s->mb_width * s->mb_height;
680

681 682 683
    s->block_wrap[0]=
    s->block_wrap[1]=
    s->block_wrap[2]=
684
    s->block_wrap[3]= s->b8_stride;
685
    s->block_wrap[4]=
686
    s->block_wrap[5]= s->mb_stride;
687

688 689
    y_size = s->b8_stride * (2 * s->mb_height + 1);
    c_size = s->mb_stride * (s->mb_height + 1);
690
    yc_size = y_size + 2 * c_size;
691

692
    /* convert fourcc to upper case */
693
    s->codec_tag=          toupper( s->avctx->codec_tag     &0xFF)
694
                        + (toupper((s->avctx->codec_tag>>8 )&0xFF)<<8 )
695
                        + (toupper((s->avctx->codec_tag>>16)&0xFF)<<16)
696
                        + (toupper((s->avctx->codec_tag>>24)&0xFF)<<24);
697

698
    s->stream_codec_tag=          toupper( s->avctx->stream_codec_tag     &0xFF)
699
                               + (toupper((s->avctx->stream_codec_tag>>8 )&0xFF)<<8 )
700
                               + (toupper((s->avctx->stream_codec_tag>>16)&0xFF)<<16)
701 702
                               + (toupper((s->avctx->stream_codec_tag>>24)&0xFF)<<24);

M
Michael Niedermayer 已提交
703
    s->avctx->coded_frame= (AVFrame*)&s->current_picture;
M
cleanup  
Michael Niedermayer 已提交
704

705 706 707 708 709 710 711
    CHECKED_ALLOCZ(s->mb_index2xy, (s->mb_num+1)*sizeof(int)) //error ressilience code looks cleaner with this
    for(y=0; y<s->mb_height; y++){
        for(x=0; x<s->mb_width; x++){
            s->mb_index2xy[ x + y*s->mb_width ] = x + y*s->mb_stride;
        }
    }
    s->mb_index2xy[ s->mb_height*s->mb_width ] = (s->mb_height-1)*s->mb_stride + s->mb_width; //FIXME really needed?
712

713
    if (s->encoding) {
714
        /* Allocate MV tables */
715 716 717 718 719 720 721 722 723 724 725 726
        CHECKED_ALLOCZ(s->p_mv_table_base            , mv_table_size * 2 * sizeof(int16_t))
        CHECKED_ALLOCZ(s->b_forw_mv_table_base       , mv_table_size * 2 * sizeof(int16_t))
        CHECKED_ALLOCZ(s->b_back_mv_table_base       , mv_table_size * 2 * sizeof(int16_t))
        CHECKED_ALLOCZ(s->b_bidir_forw_mv_table_base , mv_table_size * 2 * sizeof(int16_t))
        CHECKED_ALLOCZ(s->b_bidir_back_mv_table_base , mv_table_size * 2 * sizeof(int16_t))
        CHECKED_ALLOCZ(s->b_direct_mv_table_base     , mv_table_size * 2 * sizeof(int16_t))
        s->p_mv_table           = s->p_mv_table_base            + s->mb_stride + 1;
        s->b_forw_mv_table      = s->b_forw_mv_table_base       + s->mb_stride + 1;
        s->b_back_mv_table      = s->b_back_mv_table_base       + s->mb_stride + 1;
        s->b_bidir_forw_mv_table= s->b_bidir_forw_mv_table_base + s->mb_stride + 1;
        s->b_bidir_back_mv_table= s->b_bidir_back_mv_table_base + s->mb_stride + 1;
        s->b_direct_mv_table    = s->b_direct_mv_table_base     + s->mb_stride + 1;
727

728 729 730
        if(s->msmpeg4_version){
            CHECKED_ALLOCZ(s->ac_stats, 2*2*(MAX_LEVEL+1)*(MAX_RUN+1)*2*sizeof(int));
        }
M
Michael Niedermayer 已提交
731
        CHECKED_ALLOCZ(s->avctx->stats_out, 256);
732 733

        /* Allocate MB type table */
M
Michael Niedermayer 已提交
734
        CHECKED_ALLOCZ(s->mb_type  , mb_array_size * sizeof(uint16_t)) //needed for encoding
735

736
        CHECKED_ALLOCZ(s->lambda_table, mb_array_size * sizeof(int))
737

738 739
        CHECKED_ALLOCZ(s->q_intra_matrix, 64*32 * sizeof(int))
        CHECKED_ALLOCZ(s->q_inter_matrix, 64*32 * sizeof(int))
740 741
        CHECKED_ALLOCZ(s->q_intra_matrix16, 64*32*2 * sizeof(uint16_t))
        CHECKED_ALLOCZ(s->q_inter_matrix16, 64*32*2 * sizeof(uint16_t))
742 743
        CHECKED_ALLOCZ(s->input_picture, MAX_PICTURE_COUNT * sizeof(Picture*))
        CHECKED_ALLOCZ(s->reordered_input_picture, MAX_PICTURE_COUNT * sizeof(Picture*))
744

745 746 747
        if(s->avctx->noise_reduction){
            CHECKED_ALLOCZ(s->dct_offset, 2 * 64 * sizeof(uint16_t))
        }
748
    }
749 750
    CHECKED_ALLOCZ(s->picture, MAX_PICTURE_COUNT * sizeof(Picture))

751
    CHECKED_ALLOCZ(s->error_status_table, mb_array_size*sizeof(uint8_t))
752

M
Michael Niedermayer 已提交
753
    if(s->codec_id==CODEC_ID_MPEG4 || (s->flags & CODEC_FLAG_INTERLACED_ME)){
754
        /* interlaced direct mode decoding tables */
M
Michael Niedermayer 已提交
755 756 757 758 759 760 761 762 763 764 765 766 767
            for(i=0; i<2; i++){
                int j, k;
                for(j=0; j<2; j++){
                    for(k=0; k<2; k++){
                        CHECKED_ALLOCZ(s->b_field_mv_table_base[i][j][k]     , mv_table_size * 2 * sizeof(int16_t))
                        s->b_field_mv_table[i][j][k]    = s->b_field_mv_table_base[i][j][k]     + s->mb_stride + 1;
                    }
                    CHECKED_ALLOCZ(s->b_field_select_table[i][j]     , mb_array_size * 2 * sizeof(uint8_t))
                    CHECKED_ALLOCZ(s->p_field_mv_table_base[i][j]     , mv_table_size * 2 * sizeof(int16_t))
                    s->p_field_mv_table[i][j]    = s->p_field_mv_table_base[i][j]     + s->mb_stride + 1;
                }
                CHECKED_ALLOCZ(s->p_field_select_table[i]      , mb_array_size * 2 * sizeof(uint8_t))
            }
F
Fabrice Bellard 已提交
768
    }
M
Michael Niedermayer 已提交
769
    if (s->out_format == FMT_H263) {
F
Fabrice Bellard 已提交
770
        /* ac values */
771 772 773
        CHECKED_ALLOCZ(s->ac_val_base, yc_size * sizeof(int16_t) * 16);
        s->ac_val[0] = s->ac_val_base + s->b8_stride + 1;
        s->ac_val[1] = s->ac_val_base + y_size + s->mb_stride + 1;
F
Fabrice Bellard 已提交
774
        s->ac_val[2] = s->ac_val[1] + c_size;
775

F
Fabrice Bellard 已提交
776
        /* cbp values */
777 778
        CHECKED_ALLOCZ(s->coded_block_base, y_size);
        s->coded_block= s->coded_block_base + s->b8_stride + 1;
779

780
        /* cbp, ac_pred, pred_dir */
781 782
        CHECKED_ALLOCZ(s->cbp_table  , mb_array_size * sizeof(uint8_t))
        CHECKED_ALLOCZ(s->pred_dir_table, mb_array_size * sizeof(uint8_t))
783
    }
784

785 786 787
    if (s->h263_pred || s->h263_plus || !s->encoding) {
        /* dc values */
        //MN: we need these for error resilience of intra-frames
788 789 790
        CHECKED_ALLOCZ(s->dc_val_base, yc_size * sizeof(int16_t));
        s->dc_val[0] = s->dc_val_base + s->b8_stride + 1;
        s->dc_val[1] = s->dc_val_base + y_size + s->mb_stride + 1;
791 792
        s->dc_val[2] = s->dc_val[1] + c_size;
        for(i=0;i<yc_size;i++)
793
            s->dc_val_base[i] = 1024;
794 795
    }

796
    /* which mb is a intra block */
797 798
    CHECKED_ALLOCZ(s->mbintra_table, mb_array_size);
    memset(s->mbintra_table, 1, mb_array_size);
799

800
    /* init macroblock skip table */
801
    CHECKED_ALLOCZ(s->mbskip_table, mb_array_size+2);
802
    //Note the +1 is for a quicker mpeg4 slice_end detection
803
    CHECKED_ALLOCZ(s->prev_pict_types, PREV_PICT_TYPES_BUFFER_SIZE);
804

805
    s->parse_context.state= -1;
806 807 808 809 810
    if((s->avctx->debug&(FF_DEBUG_VIS_QP|FF_DEBUG_VIS_MB_TYPE)) || (s->avctx->debug_mv)){
       s->visualization_buffer[0] = av_malloc((s->mb_width*16 + 2*EDGE_WIDTH) * s->mb_height*16 + 2*EDGE_WIDTH);
       s->visualization_buffer[1] = av_malloc((s->mb_width*8 + EDGE_WIDTH) * s->mb_height*8 + EDGE_WIDTH);
       s->visualization_buffer[2] = av_malloc((s->mb_width*8 + EDGE_WIDTH) * s->mb_height*8 + EDGE_WIDTH);
    }
811

F
Fabrice Bellard 已提交
812
    s->context_initialized = 1;
813 814 815 816 817 818 819 820 821 822 823 824 825 826

    s->thread_context[0]= s;
    for(i=1; i<s->avctx->thread_count; i++){
        s->thread_context[i]= av_malloc(sizeof(MpegEncContext));
        memcpy(s->thread_context[i], s, sizeof(MpegEncContext));
    }

    for(i=0; i<s->avctx->thread_count; i++){
        if(init_duplicate_context(s->thread_context[i], s) < 0)
           goto fail;
        s->thread_context[i]->start_mb_y= (s->mb_height*(i  ) + s->avctx->thread_count/2) / s->avctx->thread_count;
        s->thread_context[i]->end_mb_y  = (s->mb_height*(i+1) + s->avctx->thread_count/2) / s->avctx->thread_count;
    }

F
Fabrice Bellard 已提交
827 828
    return 0;
 fail:
829
    MPV_common_end(s);
F
Fabrice Bellard 已提交
830 831 832 833 834 835
    return -1;
}

/* init common structure for both encoder and decoder */
void MPV_common_end(MpegEncContext *s)
{
M
Michael Niedermayer 已提交
836
    int i, j, k;
F
Fabrice Bellard 已提交
837

838 839 840 841 842 843 844
    for(i=0; i<s->avctx->thread_count; i++){
        free_duplicate_context(s->thread_context[i]);
    }
    for(i=1; i<s->avctx->thread_count; i++){
        av_freep(&s->thread_context[i]);
    }

845 846 847
    av_freep(&s->parse_context.buffer);
    s->parse_context.buffer_size=0;

848
    av_freep(&s->mb_type);
849 850 851 852 853 854 855 856 857 858 859 860
    av_freep(&s->p_mv_table_base);
    av_freep(&s->b_forw_mv_table_base);
    av_freep(&s->b_back_mv_table_base);
    av_freep(&s->b_bidir_forw_mv_table_base);
    av_freep(&s->b_bidir_back_mv_table_base);
    av_freep(&s->b_direct_mv_table_base);
    s->p_mv_table= NULL;
    s->b_forw_mv_table= NULL;
    s->b_back_mv_table= NULL;
    s->b_bidir_forw_mv_table= NULL;
    s->b_bidir_back_mv_table= NULL;
    s->b_direct_mv_table= NULL;
M
Michael Niedermayer 已提交
861 862 863 864 865 866 867 868 869 870 871 872
    for(i=0; i<2; i++){
        for(j=0; j<2; j++){
            for(k=0; k<2; k++){
                av_freep(&s->b_field_mv_table_base[i][j][k]);
                s->b_field_mv_table[i][j][k]=NULL;
            }
            av_freep(&s->b_field_select_table[i][j]);
            av_freep(&s->p_field_mv_table_base[i][j]);
            s->p_field_mv_table[i][j]=NULL;
        }
        av_freep(&s->p_field_select_table[i]);
    }
873

874 875 876
    av_freep(&s->dc_val_base);
    av_freep(&s->ac_val_base);
    av_freep(&s->coded_block_base);
877
    av_freep(&s->mbintra_table);
878 879
    av_freep(&s->cbp_table);
    av_freep(&s->pred_dir_table);
880

881
    av_freep(&s->mbskip_table);
882
    av_freep(&s->prev_pict_types);
883
    av_freep(&s->bitstream_buffer);
884 885
    s->allocated_bitstream_buffer_size=0;

M
Michael Niedermayer 已提交
886
    av_freep(&s->avctx->stats_out);
887
    av_freep(&s->ac_stats);
888
    av_freep(&s->error_status_table);
889
    av_freep(&s->mb_index2xy);
890
    av_freep(&s->lambda_table);
891 892
    av_freep(&s->q_intra_matrix);
    av_freep(&s->q_inter_matrix);
893 894
    av_freep(&s->q_intra_matrix16);
    av_freep(&s->q_inter_matrix16);
895 896
    av_freep(&s->input_picture);
    av_freep(&s->reordered_input_picture);
897
    av_freep(&s->dct_offset);
M
cleanup  
Michael Niedermayer 已提交
898

M
Michael Niedermayer 已提交
899 900 901 902
    if(s->picture){
        for(i=0; i<MAX_PICTURE_COUNT; i++){
            free_picture(s, &s->picture[i]);
        }
F
Fabrice Bellard 已提交
903
    }
904
    av_freep(&s->picture);
F
Fabrice Bellard 已提交
905
    s->context_initialized = 0;
906 907 908
    s->last_picture_ptr=
    s->next_picture_ptr=
    s->current_picture_ptr= NULL;
M
Michael Niedermayer 已提交
909
    s->linesize= s->uvlinesize= 0;
910

911
    for(i=0; i<3; i++)
912
        av_freep(&s->visualization_buffer[i]);
M
Michael Niedermayer 已提交
913 914

    avcodec_default_free_buffers(s->avctx);
F
Fabrice Bellard 已提交
915 916
}

917 918
#ifdef CONFIG_ENCODERS

F
Fabrice Bellard 已提交
919 920 921 922
/* init video encoder */
int MPV_encode_init(AVCodecContext *avctx)
{
    MpegEncContext *s = avctx->priv_data;
923
    int i;
924
    int chroma_h_shift, chroma_v_shift;
925

M
Michael Niedermayer 已提交
926
    MPV_encode_defaults(s);
927

928 929 930 931 932 933 934 935 936
    switch (avctx->codec_id) {
    case CODEC_ID_MPEG2VIDEO:
        if(avctx->pix_fmt != PIX_FMT_YUV420P && avctx->pix_fmt != PIX_FMT_YUV422P){
            av_log(avctx, AV_LOG_ERROR, "only YUV420 and YUV422 are supported\n");
            return -1;
        }
        break;
    case CODEC_ID_LJPEG:
    case CODEC_ID_MJPEG:
B
Baptiste Coudurier 已提交
937 938
        if(avctx->pix_fmt != PIX_FMT_YUVJ420P && avctx->pix_fmt != PIX_FMT_YUVJ422P &&
           ((avctx->pix_fmt != PIX_FMT_YUV420P && avctx->pix_fmt != PIX_FMT_YUV422P) || avctx->strict_std_compliance>FF_COMPLIANCE_INOFFICIAL)){
M
Michael Niedermayer 已提交
939 940 941
            av_log(avctx, AV_LOG_ERROR, "colorspace not supported in jpeg\n");
            return -1;
        }
942 943 944 945
        break;
    default:
        if(avctx->pix_fmt != PIX_FMT_YUV420P){
            av_log(avctx, AV_LOG_ERROR, "only YUV420 is supported\n");
M
Michael Niedermayer 已提交
946 947 948
            return -1;
        }
    }
949

950 951 952 953 954 955 956 957 958 959 960 961
    switch (avctx->pix_fmt) {
    case PIX_FMT_YUVJ422P:
    case PIX_FMT_YUV422P:
        s->chroma_format = CHROMA_422;
        break;
    case PIX_FMT_YUVJ420P:
    case PIX_FMT_YUV420P:
    default:
        s->chroma_format = CHROMA_420;
        break;
    }

F
Fabrice Bellard 已提交
962 963 964
    s->bit_rate = avctx->bit_rate;
    s->width = avctx->width;
    s->height = avctx->height;
965
    if(avctx->gop_size > 600 && avctx->strict_std_compliance>FF_COMPLIANCE_EXPERIMENTAL){
966
        av_log(avctx, AV_LOG_ERROR, "Warning keyframe interval too large! reducing it ...\n");
967 968
        avctx->gop_size=600;
    }
F
Fabrice Bellard 已提交
969
    s->gop_size = avctx->gop_size;
970
    s->avctx = avctx;
971
    s->flags= avctx->flags;
972
    s->flags2= avctx->flags2;
973
    s->max_b_frames= avctx->max_b_frames;
974
    s->codec_id= avctx->codec->id;
975 976 977 978
    s->luma_elim_threshold  = avctx->luma_elim_threshold;
    s->chroma_elim_threshold= avctx->chroma_elim_threshold;
    s->strict_std_compliance= avctx->strict_std_compliance;
    s->data_partitioning= avctx->flags & CODEC_FLAG_PART;
M
Michael Niedermayer 已提交
979
    s->quarter_sample= (avctx->flags & CODEC_FLAG_QPEL)!=0;
980
    s->mpeg_quant= avctx->mpeg_quant;
M
Michael Niedermayer 已提交
981
    s->rtp_mode= !!avctx->rtp_payload_size;
982
    s->intra_dc_precision= avctx->intra_dc_precision;
983
    s->user_specified_pts = AV_NOPTS_VALUE;
984

F
Fabrice Bellard 已提交
985 986 987 988 989 990
    if (s->gop_size <= 1) {
        s->intra_only = 1;
        s->gop_size = 12;
    } else {
        s->intra_only = 0;
    }
991

M
Michael Niedermayer 已提交
992
    s->me_method = avctx->me_method;
993

994
    /* Fixed QSCALE */
M
Michael Niedermayer 已提交
995
    s->fixed_qscale = !!(avctx->flags & CODEC_FLAG_QSCALE);
996

997
    s->adaptive_quant= (   s->avctx->lumi_masking
998
                        || s->avctx->dark_masking
999
                        || s->avctx->temporal_cplx_masking
1000
                        || s->avctx->spatial_cplx_masking
1001
                        || s->avctx->p_masking
1002
                        || s->avctx->border_masking
1003
                        || (s->flags&CODEC_FLAG_QP_RD))
1004
                       && !s->fixed_qscale;
1005

M
Michael Niedermayer 已提交
1006 1007 1008
    s->obmc= !!(s->flags & CODEC_FLAG_OBMC);
    s->loop_filter= !!(s->flags & CODEC_FLAG_LOOP_FILTER);
    s->alternate_scan= !!(s->flags & CODEC_FLAG_ALT_SCAN);
1009
    s->intra_vlc_format= !!(s->flags2 & CODEC_FLAG2_INTRA_VLC);
1010
    s->q_scale_type= !!(s->flags2 & CODEC_FLAG2_NON_LINEAR_QUANT);
1011

M
Michael Niedermayer 已提交
1012 1013 1014
    if(avctx->rc_max_rate && !avctx->rc_buffer_size){
        av_log(avctx, AV_LOG_ERROR, "a vbv buffer size is needed, for encoding with a maximum bitrate\n");
        return -1;
1015
    }
M
Michael Niedermayer 已提交
1016 1017

    if(avctx->rc_min_rate && avctx->rc_max_rate != avctx->rc_min_rate){
1018
        av_log(avctx, AV_LOG_INFO, "Warning min_rate > 0 but min_rate != max_rate isn't recommended!\n");
1019
    }
1020

M
Michael Niedermayer 已提交
1021 1022 1023 1024
    if(avctx->rc_min_rate && avctx->rc_min_rate > avctx->bit_rate){
        av_log(avctx, AV_LOG_INFO, "bitrate below min bitrate\n");
        return -1;
    }
1025

M
Michael Niedermayer 已提交
1026 1027 1028 1029
    if(avctx->rc_max_rate && avctx->rc_max_rate < avctx->bit_rate){
        av_log(avctx, AV_LOG_INFO, "bitrate above max bitrate\n");
        return -1;
    }
1030 1031

    if(   s->avctx->rc_max_rate && s->avctx->rc_min_rate == s->avctx->rc_max_rate
1032 1033
       && (s->codec_id == CODEC_ID_MPEG1VIDEO || s->codec_id == CODEC_ID_MPEG2VIDEO)
       && 90000LL * (avctx->rc_buffer_size-1) > s->avctx->rc_max_rate*0xFFFFLL){
1034

1035 1036
        av_log(avctx, AV_LOG_INFO, "Warning vbv_delay will be set to 0xFFFF (=VBR) as the specified vbv buffer is too large for the given bitrate!\n");
    }
1037 1038

    if((s->flags & CODEC_FLAG_4MV) && s->codec_id != CODEC_ID_MPEG4
1039
       && s->codec_id != CODEC_ID_H263 && s->codec_id != CODEC_ID_H263P && s->codec_id != CODEC_ID_FLV1){
1040
        av_log(avctx, AV_LOG_ERROR, "4MV not supported by codec\n");
1041 1042
        return -1;
    }
1043

M
Michael Niedermayer 已提交
1044
    if(s->obmc && s->avctx->mb_decision != FF_MB_DECISION_SIMPLE){
1045
        av_log(avctx, AV_LOG_ERROR, "OBMC is only supported with simple mb decision\n");
M
Michael Niedermayer 已提交
1046 1047
        return -1;
    }
1048

M
Michael Niedermayer 已提交
1049 1050 1051 1052
    if(s->obmc && s->codec_id != CODEC_ID_H263 && s->codec_id != CODEC_ID_H263P){
        av_log(avctx, AV_LOG_ERROR, "OBMC is only supported with H263(+)\n");
        return -1;
    }
1053

1054
    if(s->quarter_sample && s->codec_id != CODEC_ID_MPEG4){
1055
        av_log(avctx, AV_LOG_ERROR, "qpel not supported by codec\n");
1056 1057 1058 1059
        return -1;
    }

    if(s->data_partitioning && s->codec_id != CODEC_ID_MPEG4){
1060
        av_log(avctx, AV_LOG_ERROR, "data partitioning not supported by codec\n");
1061 1062
        return -1;
    }
1063

M
Michael Niedermayer 已提交
1064
    if(s->max_b_frames && s->codec_id != CODEC_ID_MPEG4 && s->codec_id != CODEC_ID_MPEG1VIDEO && s->codec_id != CODEC_ID_MPEG2VIDEO){
1065
        av_log(avctx, AV_LOG_ERROR, "b frames not supported by codec\n");
1066 1067
        return -1;
    }
M
Michael Niedermayer 已提交
1068

1069
    if((s->flags & (CODEC_FLAG_INTERLACED_DCT|CODEC_FLAG_INTERLACED_ME|CODEC_FLAG_ALT_SCAN))
M
Michael Niedermayer 已提交
1070 1071 1072 1073
       && s->codec_id != CODEC_ID_MPEG4 && s->codec_id != CODEC_ID_MPEG2VIDEO){
        av_log(avctx, AV_LOG_ERROR, "interlacing not supported by codec\n");
        return -1;
    }
1074

1075
    if(s->mpeg_quant && s->codec_id != CODEC_ID_MPEG4){ //FIXME mpeg2 uses that too
1076
        av_log(avctx, AV_LOG_ERROR, "mpeg2 style quantization not supported by codec\n");
1077 1078
        return -1;
    }
1079

1080
    if((s->flags & CODEC_FLAG_CBP_RD) && !(s->flags & CODEC_FLAG_TRELLIS_QUANT)){
1081
        av_log(avctx, AV_LOG_ERROR, "CBP RD needs trellis quant\n");
1082 1083 1084
        return -1;
    }

M
Michael Niedermayer 已提交
1085 1086 1087 1088
    if((s->flags & CODEC_FLAG_QP_RD) && s->avctx->mb_decision != FF_MB_DECISION_RD){
        av_log(avctx, AV_LOG_ERROR, "QP RD needs mbd=2\n");
        return -1;
    }
1089

1090
    if(s->avctx->scenechange_threshold < 1000000000 && (s->flags & CODEC_FLAG_CLOSED_GOP)){
1091
        av_log(avctx, AV_LOG_ERROR, "closed gop with scene change detection arent supported yet, set threshold to 1000000000\n");
1092 1093
        return -1;
    }
1094

1095 1096 1097 1098 1099
    if((s->flags2 & CODEC_FLAG2_INTRA_VLC) && s->codec_id != CODEC_ID_MPEG2VIDEO){
        av_log(avctx, AV_LOG_ERROR, "intra vlc table not supported by codec\n");
        return -1;
    }

1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110
    if(s->flags & CODEC_FLAG_LOW_DELAY){
        if (s->codec_id != CODEC_ID_MPEG2VIDEO && s->codec_id != CODEC_ID_MPEG1VIDEO){
            av_log(avctx, AV_LOG_ERROR, "low delay forcing is only available for mpeg1/2\n");
            return -1;
        }
        if (s->max_b_frames != 0){
            av_log(avctx, AV_LOG_ERROR, "b frames cannot be used with low delay\n");
            return -1;
        }
    }

1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121
    if(s->q_scale_type == 1){
        if(s->codec_id != CODEC_ID_MPEG2VIDEO){
            av_log(avctx, AV_LOG_ERROR, "non linear quant is only available for mpeg2\n");
            return -1;
        }
        if(avctx->qmax > 12){
            av_log(avctx, AV_LOG_ERROR, "non linear quant only supports qmax <= 12 currently\n");
            return -1;
        }
    }

1122 1123
    if(s->avctx->thread_count > 1 && s->codec_id != CODEC_ID_MPEG4
       && s->codec_id != CODEC_ID_MPEG1VIDEO && s->codec_id != CODEC_ID_MPEG2VIDEO
1124 1125 1126 1127
       && (s->codec_id != CODEC_ID_H263P || !(s->flags & CODEC_FLAG_H263P_SLICE_STRUCT))){
        av_log(avctx, AV_LOG_ERROR, "multi threaded encoding not supported by codec\n");
        return -1;
    }
1128

1129 1130
    if(s->avctx->thread_count > 1)
        s->rtp_mode= 1;
M
Michael Niedermayer 已提交
1131

1132
    if(!avctx->time_base.den || !avctx->time_base.num){
M
Michael Niedermayer 已提交
1133 1134 1135
        av_log(avctx, AV_LOG_ERROR, "framerate not set\n");
        return -1;
    }
1136

1137 1138 1139 1140 1141 1142 1143 1144 1145
    i= (INT_MAX/2+128)>>8;
    if(avctx->me_threshold >= i){
        av_log(avctx, AV_LOG_ERROR, "me_threshold too large, max is %d\n", i - 1);
        return -1;
    }
    if(avctx->mb_threshold >= i){
        av_log(avctx, AV_LOG_ERROR, "mb_threshold too large, max is %d\n", i - 1);
        return -1;
    }
1146

1147
    if(avctx->b_frame_strategy && (avctx->flags&CODEC_FLAG_PASS2)){
1148 1149
        av_log(avctx, AV_LOG_INFO, "notice: b_frame_strategy only affects the first pass\n");
        avctx->b_frame_strategy = 0;
1150 1151
    }

1152
    i= ff_gcd(avctx->time_base.den, avctx->time_base.num);
M
Michael Niedermayer 已提交
1153 1154
    if(i > 1){
        av_log(avctx, AV_LOG_INFO, "removing common factors from framerate\n");
1155 1156
        avctx->time_base.den /= i;
        avctx->time_base.num /= i;
M
Michael Niedermayer 已提交
1157 1158
//        return -1;
    }
1159

1160 1161 1162
    if(s->codec_id==CODEC_ID_MJPEG){
        s->intra_quant_bias= 1<<(QUANT_BIAS_SHIFT-1); //(a + x/2)/x
        s->inter_quant_bias= 0;
M
Michael Niedermayer 已提交
1163
    }else if(s->mpeg_quant || s->codec_id==CODEC_ID_MPEG1VIDEO || s->codec_id==CODEC_ID_MPEG2VIDEO){
1164 1165 1166 1167 1168 1169
        s->intra_quant_bias= 3<<(QUANT_BIAS_SHIFT-3); //(a + x*3/8)/x
        s->inter_quant_bias= 0;
    }else{
        s->intra_quant_bias=0;
        s->inter_quant_bias=-(1<<(QUANT_BIAS_SHIFT-2)); //(a - x/4)/x
    }
1170

1171 1172 1173 1174
    if(avctx->intra_quant_bias != FF_DEFAULT_QUANT_BIAS)
        s->intra_quant_bias= avctx->intra_quant_bias;
    if(avctx->inter_quant_bias != FF_DEFAULT_QUANT_BIAS)
        s->inter_quant_bias= avctx->inter_quant_bias;
1175

1176 1177
    avcodec_get_chroma_sub_sample(avctx->pix_fmt, &chroma_h_shift, &chroma_v_shift);

1178
    if(avctx->codec_id == CODEC_ID_MPEG4 && s->avctx->time_base.den > (1<<16)-1){
1179
        av_log(avctx, AV_LOG_ERROR, "timebase not supported by mpeg 4 standard\n");
1180
        return -1;
1181 1182
    }
    s->time_increment_bits = av_log2(s->avctx->time_base.den - 1) + 1;
1183

F
Fabrice Bellard 已提交
1184 1185 1186
    switch(avctx->codec->id) {
    case CODEC_ID_MPEG1VIDEO:
        s->out_format = FMT_MPEG1;
1187
        s->low_delay= !!(s->flags & CODEC_FLAG_LOW_DELAY);
1188
        avctx->delay= s->low_delay ? 0 : (s->max_b_frames + 1);
F
Fabrice Bellard 已提交
1189
        break;
M
Michael Niedermayer 已提交
1190 1191
    case CODEC_ID_MPEG2VIDEO:
        s->out_format = FMT_MPEG1;
1192
        s->low_delay= !!(s->flags & CODEC_FLAG_LOW_DELAY);
M
Michael Niedermayer 已提交
1193
        avctx->delay= s->low_delay ? 0 : (s->max_b_frames + 1);
M
Michael Niedermayer 已提交
1194
        s->rtp_mode= 1;
M
Michael Niedermayer 已提交
1195
        break;
1196
    case CODEC_ID_LJPEG:
F
Fabrice Bellard 已提交
1197 1198 1199
    case CODEC_ID_MJPEG:
        s->out_format = FMT_MJPEG;
        s->intra_only = 1; /* force intra only for jpeg */
B
Baptiste Coudurier 已提交
1200 1201 1202 1203 1204 1205
        s->mjpeg_vsample[0] = 2;
        s->mjpeg_vsample[1] = 2>>chroma_v_shift;
        s->mjpeg_vsample[2] = 2>>chroma_v_shift;
        s->mjpeg_hsample[0] = 2;
        s->mjpeg_hsample[1] = 2>>chroma_h_shift;
        s->mjpeg_hsample[2] = 2>>chroma_h_shift;
1206
        if (!(ENABLE_MJPEG_ENCODER || ENABLE_LJPEG_ENCODER) || mjpeg_init(s) < 0)
F
Fabrice Bellard 已提交
1207
            return -1;
M
Michael Niedermayer 已提交
1208
        avctx->delay=0;
M
Michael Niedermayer 已提交
1209
        s->low_delay=1;
F
Fabrice Bellard 已提交
1210
        break;
1211
    case CODEC_ID_H261:
1212
        if (!ENABLE_H261_ENCODER)  return -1;
1213 1214 1215 1216
        if (ff_h261_get_picture_format(s->width, s->height) < 0) {
            av_log(avctx, AV_LOG_ERROR, "The specified picture size of %dx%d is not valid for the H.261 codec.\nValid sizes are 176x144, 352x288\n", s->width, s->height);
            return -1;
        }
1217 1218 1219 1220
        s->out_format = FMT_H261;
        avctx->delay=0;
        s->low_delay=1;
        break;
F
Fabrice Bellard 已提交
1221
    case CODEC_ID_H263:
1222
        if (h263_get_picture_format(s->width, s->height) == 7) {
1223
            av_log(avctx, AV_LOG_INFO, "The specified picture size of %dx%d is not valid for the H.263 codec.\nValid sizes are 128x96, 176x144, 352x288, 704x576, and 1408x1152. Try H.263+.\n", s->width, s->height);
F
Fabrice Bellard 已提交
1224
            return -1;
1225
        }
F
Fabrice Bellard 已提交
1226
        s->out_format = FMT_H263;
1227
        s->obmc= (avctx->flags & CODEC_FLAG_OBMC) ? 1:0;
M
Michael Niedermayer 已提交
1228
        avctx->delay=0;
M
Michael Niedermayer 已提交
1229
        s->low_delay=1;
F
Fabrice Bellard 已提交
1230 1231 1232 1233
        break;
    case CODEC_ID_H263P:
        s->out_format = FMT_H263;
        s->h263_plus = 1;
1234
        /* Fx */
M
Michael Niedermayer 已提交
1235
        s->umvplus = (avctx->flags & CODEC_FLAG_H263P_UMV) ? 1:0;
1236
        s->h263_aic= (avctx->flags & CODEC_FLAG_AC_PRED) ? 1:0;
1237 1238 1239 1240 1241
        s->modified_quant= s->h263_aic;
        s->alt_inter_vlc= (avctx->flags & CODEC_FLAG_H263P_AIV) ? 1:0;
        s->obmc= (avctx->flags & CODEC_FLAG_OBMC) ? 1:0;
        s->loop_filter= (avctx->flags & CODEC_FLAG_LOOP_FILTER) ? 1:0;
        s->unrestricted_mv= s->obmc || s->loop_filter || s->umvplus;
M
Michael Niedermayer 已提交
1242
        s->h263_slice_structured= (s->flags & CODEC_FLAG_H263P_SLICE_STRUCT) ? 1:0;
M
Michael Niedermayer 已提交
1243

1244
        /* /Fx */
1245
        /* These are just to be sure */
M
Michael Niedermayer 已提交
1246
        avctx->delay=0;
M
Michael Niedermayer 已提交
1247
        s->low_delay=1;
F
Fabrice Bellard 已提交
1248
        break;
1249 1250 1251 1252 1253 1254 1255 1256
    case CODEC_ID_FLV1:
        s->out_format = FMT_H263;
        s->h263_flv = 2; /* format = 1; 11-bit codes */
        s->unrestricted_mv = 1;
        s->rtp_mode=0; /* don't allow GOB */
        avctx->delay=0;
        s->low_delay=1;
        break;
F
Fabrice Bellard 已提交
1257 1258
    case CODEC_ID_RV10:
        s->out_format = FMT_H263;
M
Michael Niedermayer 已提交
1259
        avctx->delay=0;
M
Michael Niedermayer 已提交
1260
        s->low_delay=1;
F
Fabrice Bellard 已提交
1261
        break;
M
Michael Niedermayer 已提交
1262 1263 1264 1265 1266 1267 1268 1269 1270 1271
    case CODEC_ID_RV20:
        s->out_format = FMT_H263;
        avctx->delay=0;
        s->low_delay=1;
        s->modified_quant=1;
        s->h263_aic=1;
        s->h263_plus=1;
        s->loop_filter=1;
        s->unrestricted_mv= s->obmc || s->loop_filter || s->umvplus;
        break;
F
Fabrice Bellard 已提交
1272
    case CODEC_ID_MPEG4:
F
Fabrice Bellard 已提交
1273 1274 1275
        s->out_format = FMT_H263;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
M
Michael Niedermayer 已提交
1276
        s->low_delay= s->max_b_frames ? 0 : 1;
1277
        avctx->delay= s->low_delay ? 0 : (s->max_b_frames + 1);
F
Fabrice Bellard 已提交
1278
        break;
1279
    case CODEC_ID_MSMPEG4V1:
F
Fabrice Bellard 已提交
1280 1281 1282 1283
        s->out_format = FMT_H263;
        s->h263_msmpeg4 = 1;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
1284
        s->msmpeg4_version= 1;
M
Michael Niedermayer 已提交
1285
        avctx->delay=0;
M
Michael Niedermayer 已提交
1286
        s->low_delay=1;
1287 1288 1289 1290 1291 1292 1293
        break;
    case CODEC_ID_MSMPEG4V2:
        s->out_format = FMT_H263;
        s->h263_msmpeg4 = 1;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
        s->msmpeg4_version= 2;
M
Michael Niedermayer 已提交
1294
        avctx->delay=0;
M
Michael Niedermayer 已提交
1295
        s->low_delay=1;
1296 1297 1298 1299 1300 1301 1302
        break;
    case CODEC_ID_MSMPEG4V3:
        s->out_format = FMT_H263;
        s->h263_msmpeg4 = 1;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
        s->msmpeg4_version= 3;
M
Michael Niedermayer 已提交
1303
        s->flipflop_rounding=1;
M
Michael Niedermayer 已提交
1304
        avctx->delay=0;
M
Michael Niedermayer 已提交
1305
        s->low_delay=1;
F
Fabrice Bellard 已提交
1306
        break;
M
Michael Niedermayer 已提交
1307 1308 1309 1310 1311 1312
    case CODEC_ID_WMV1:
        s->out_format = FMT_H263;
        s->h263_msmpeg4 = 1;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
        s->msmpeg4_version= 4;
M
Michael Niedermayer 已提交
1313
        s->flipflop_rounding=1;
M
Michael Niedermayer 已提交
1314
        avctx->delay=0;
M
Michael Niedermayer 已提交
1315
        s->low_delay=1;
M
Michael Niedermayer 已提交
1316 1317 1318 1319 1320 1321 1322
        break;
    case CODEC_ID_WMV2:
        s->out_format = FMT_H263;
        s->h263_msmpeg4 = 1;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
        s->msmpeg4_version= 5;
M
Michael Niedermayer 已提交
1323
        s->flipflop_rounding=1;
M
Michael Niedermayer 已提交
1324
        avctx->delay=0;
M
Michael Niedermayer 已提交
1325
        s->low_delay=1;
M
Michael Niedermayer 已提交
1326
        break;
F
Fabrice Bellard 已提交
1327 1328 1329
    default:
        return -1;
    }
1330

1331
    avctx->has_b_frames= !s->low_delay;
1332

1333 1334
    s->encoding = 1;

F
Fabrice Bellard 已提交
1335 1336 1337
    /* init */
    if (MPV_common_init(s) < 0)
        return -1;
M
Michael Niedermayer 已提交
1338 1339 1340

    if(s->modified_quant)
        s->chroma_qscale_table= ff_h263_chroma_qscale_table;
1341
    s->progressive_frame=
M
Michael Niedermayer 已提交
1342
    s->progressive_sequence= !(avctx->flags & (CODEC_FLAG_INTERLACED_DCT|CODEC_FLAG_INTERLACED_ME|CODEC_FLAG_ALT_SCAN));
1343
    s->quant_precision=5;
1344

1345
    ff_set_cmp(&s->dsp, s->dsp.ildct_cmp, s->avctx->ildct_cmp);
1346
    ff_set_cmp(&s->dsp, s->dsp.frame_skip_cmp, s->avctx->frame_skip_cmp);
1347

1348
    if (ENABLE_H261_ENCODER && s->out_format == FMT_H261)
1349
        ff_h261_encode_init(s);
1350 1351
    if (s->out_format == FMT_H263)
        h263_encode_init(s);
1352
    if (ENABLE_MSMPEG4_ENCODER && s->msmpeg4_version)
1353
        ff_msmpeg4_encode_init(s);
M
Michael Niedermayer 已提交
1354 1355
    if (s->out_format == FMT_MPEG1)
        ff_mpeg1_encode_init(s);
1356

M
Michael Niedermayer 已提交
1357
    /* init q matrix */
1358
    for(i=0;i<64;i++) {
1359
        int j= s->dsp.idct_permutation[i];
1360
        if(s->codec_id==CODEC_ID_MPEG4 && s->mpeg_quant){
1361 1362
            s->intra_matrix[j] = ff_mpeg4_default_intra_matrix[i];
            s->inter_matrix[j] = ff_mpeg4_default_non_intra_matrix[i];
1363
        }else if(s->out_format == FMT_H263 || s->out_format == FMT_H261){
1364 1365
            s->intra_matrix[j] =
            s->inter_matrix[j] = ff_mpeg1_default_non_intra_matrix[i];
M
Michael Niedermayer 已提交
1366
        }else
M
Michael Niedermayer 已提交
1367
        { /* mpeg1/2 */
1368 1369
            s->intra_matrix[j] = ff_mpeg1_default_intra_matrix[i];
            s->inter_matrix[j] = ff_mpeg1_default_non_intra_matrix[i];
1370
        }
1371 1372 1373 1374
        if(s->avctx->intra_matrix)
            s->intra_matrix[j] = s->avctx->intra_matrix[i];
        if(s->avctx->inter_matrix)
            s->inter_matrix[j] = s->avctx->inter_matrix[i];
1375 1376 1377
    }

    /* precompute matrix */
1378
    /* for mjpeg, we do include qscale in the matrix */
1379
    if (s->out_format != FMT_MJPEG) {
1380
        convert_matrix(&s->dsp, s->q_intra_matrix, s->q_intra_matrix16,
1381
                       s->intra_matrix, s->intra_quant_bias, avctx->qmin, 31, 1);
1382
        convert_matrix(&s->dsp, s->q_inter_matrix, s->q_inter_matrix16,
1383
                       s->inter_matrix, s->inter_quant_bias, avctx->qmin, 31, 0);
1384 1385
    }

1386 1387
    if(ff_rate_control_init(s) < 0)
        return -1;
1388

F
Fabrice Bellard 已提交
1389 1390 1391 1392 1393 1394 1395
    return 0;
}

int MPV_encode_end(AVCodecContext *avctx)
{
    MpegEncContext *s = avctx->priv_data;

1396 1397
    ff_rate_control_uninit(s);

F
Fabrice Bellard 已提交
1398
    MPV_common_end(s);
1399
    if ((ENABLE_MJPEG_ENCODER || ENABLE_LJPEG_ENCODER) && s->out_format == FMT_MJPEG)
F
Fabrice Bellard 已提交
1400
        mjpeg_close(s);
1401

1402
    av_freep(&avctx->extradata);
1403

F
Fabrice Bellard 已提交
1404 1405 1406
    return 0;
}

1407 1408
#endif //CONFIG_ENCODERS

1409
void init_rl(RLTable *rl, uint8_t static_store[2][2*MAX_RUN + MAX_LEVEL + 3])
M
Michael Niedermayer 已提交
1410
{
1411 1412
    int8_t max_level[MAX_RUN+1], max_run[MAX_LEVEL+1];
    uint8_t index_run[MAX_RUN+1];
M
Michael Niedermayer 已提交
1413 1414
    int last, run, level, start, end, i;

1415
    /* If table is static, we can quit if rl->max_level[0] is not NULL */
1416
    if(static_store && rl->max_level[0])
1417 1418
        return;

M
Michael Niedermayer 已提交
1419 1420 1421 1422 1423 1424 1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441
    /* compute max_level[], max_run[] and index_run[] */
    for(last=0;last<2;last++) {
        if (last == 0) {
            start = 0;
            end = rl->last;
        } else {
            start = rl->last;
            end = rl->n;
        }

        memset(max_level, 0, MAX_RUN + 1);
        memset(max_run, 0, MAX_LEVEL + 1);
        memset(index_run, rl->n, MAX_RUN + 1);
        for(i=start;i<end;i++) {
            run = rl->table_run[i];
            level = rl->table_level[i];
            if (index_run[run] == rl->n)
                index_run[run] = i;
            if (level > max_level[run])
                max_level[run] = level;
            if (run > max_run[level])
                max_run[level] = run;
        }
1442 1443
        if(static_store)
            rl->max_level[last] = static_store[last];
1444 1445
        else
            rl->max_level[last] = av_malloc(MAX_RUN + 1);
M
Michael Niedermayer 已提交
1446
        memcpy(rl->max_level[last], max_level, MAX_RUN + 1);
1447 1448
        if(static_store)
            rl->max_run[last] = static_store[last] + MAX_RUN + 1;
1449 1450
        else
            rl->max_run[last] = av_malloc(MAX_LEVEL + 1);
M
Michael Niedermayer 已提交
1451
        memcpy(rl->max_run[last], max_run, MAX_LEVEL + 1);
1452 1453
        if(static_store)
            rl->index_run[last] = static_store[last] + MAX_RUN + MAX_LEVEL + 2;
1454 1455
        else
            rl->index_run[last] = av_malloc(MAX_RUN + 1);
M
Michael Niedermayer 已提交
1456 1457 1458 1459
        memcpy(rl->index_run[last], index_run, MAX_RUN + 1);
    }
}

F
Fabrice Bellard 已提交
1460
/* draw the edges of width 'w' of an image of size width, height */
1461
//FIXME check that this is ok for mpeg4 interlaced
1462
static void draw_edges_c(uint8_t *buf, int wrap, int width, int height, int w)
F
Fabrice Bellard 已提交
1463
{
1464
    uint8_t *ptr, *last_line;
F
Fabrice Bellard 已提交
1465 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488
    int i;

    last_line = buf + (height - 1) * wrap;
    for(i=0;i<w;i++) {
        /* top and bottom */
        memcpy(buf - (i + 1) * wrap, buf, width);
        memcpy(last_line + (i + 1) * wrap, last_line, width);
    }
    /* left and right */
    ptr = buf;
    for(i=0;i<height;i++) {
        memset(ptr - w, ptr[0], w);
        memset(ptr + width, ptr[width-1], w);
        ptr += wrap;
    }
    /* corners */
    for(i=0;i<w;i++) {
        memset(buf - (i + 1) * wrap - w, buf[0], w); /* top left */
        memset(buf - (i + 1) * wrap + width, buf[width-1], w); /* top right */
        memset(last_line + (i + 1) * wrap - w, last_line[0], w); /* top left */
        memset(last_line + (i + 1) * wrap + width, last_line[width-1], w); /* top right */
    }
}

M
Michael Niedermayer 已提交
1489
int ff_find_unused_picture(MpegEncContext *s, int shared){
M
Michael Niedermayer 已提交
1490
    int i;
1491

M
Michael Niedermayer 已提交
1492 1493
    if(shared){
        for(i=0; i<MAX_PICTURE_COUNT; i++){
M
Michael Niedermayer 已提交
1494
            if(s->picture[i].data[0]==NULL && s->picture[i].type==0) return i;
M
Michael Niedermayer 已提交
1495 1496 1497
        }
    }else{
        for(i=0; i<MAX_PICTURE_COUNT; i++){
M
Michael Niedermayer 已提交
1498
            if(s->picture[i].data[0]==NULL && s->picture[i].type!=0) return i; //FIXME
M
Michael Niedermayer 已提交
1499 1500
        }
        for(i=0; i<MAX_PICTURE_COUNT; i++){
M
Michael Niedermayer 已提交
1501
            if(s->picture[i].data[0]==NULL) return i;
M
Michael Niedermayer 已提交
1502 1503 1504
        }
    }

M
Michael Niedermayer 已提交
1505 1506
    assert(0);
    return -1;
M
Michael Niedermayer 已提交
1507 1508
}

1509 1510 1511 1512 1513 1514 1515 1516 1517 1518
static void update_noise_reduction(MpegEncContext *s){
    int intra, i;

    for(intra=0; intra<2; intra++){
        if(s->dct_count[intra] > (1<<16)){
            for(i=0; i<64; i++){
                s->dct_error_sum[intra][i] >>=1;
            }
            s->dct_count[intra] >>= 1;
        }
1519

1520 1521 1522 1523 1524 1525
        for(i=0; i<64; i++){
            s->dct_offset[intra][i]= (s->avctx->noise_reduction * s->dct_count[intra] + s->dct_error_sum[intra][i]/2) / (s->dct_error_sum[intra][i]+1);
        }
    }
}

M
Michael Niedermayer 已提交
1526 1527 1528
/**
 * generic function for encode/decode called after coding/decoding the header and before a frame is coded/decoded
 */
1529
int MPV_frame_start(MpegEncContext *s, AVCodecContext *avctx)
F
Fabrice Bellard 已提交
1530
{
M
Michael Niedermayer 已提交
1531
    int i;
M
Michael Niedermayer 已提交
1532
    AVFrame *pic;
1533
    s->mb_skipped = 0;
M
Michael Niedermayer 已提交
1534

M
Michael Niedermayer 已提交
1535
    assert(s->last_picture_ptr==NULL || s->out_format != FMT_H264 || s->codec_id == CODEC_ID_SVQ3);
M
Michael Niedermayer 已提交
1536

M
cleanup  
Michael Niedermayer 已提交
1537
    /* mark&release old frames */
1538
    if (s->pict_type != B_TYPE && s->last_picture_ptr && s->last_picture_ptr != s->next_picture_ptr && s->last_picture_ptr->data[0]) {
1539
      if(s->out_format != FMT_H264 || s->codec_id == CODEC_ID_SVQ3){
M
Michael Niedermayer 已提交
1540
        avctx->release_buffer(avctx, (AVFrame*)s->last_picture_ptr);
M
cleanup  
Michael Niedermayer 已提交
1541 1542 1543 1544 1545

        /* release forgotten pictures */
        /* if(mpeg124/h263) */
        if(!s->encoding){
            for(i=0; i<MAX_PICTURE_COUNT; i++){
M
Michael Niedermayer 已提交
1546
                if(s->picture[i].data[0] && &s->picture[i] != s->next_picture_ptr && s->picture[i].reference){
1547
                    av_log(avctx, AV_LOG_ERROR, "releasing zombie picture\n");
1548
                    avctx->release_buffer(avctx, (AVFrame*)&s->picture[i]);
M
cleanup  
Michael Niedermayer 已提交
1549 1550
                }
            }
1551
        }
1552
      }
1553
    }
1554 1555
alloc:
    if(!s->encoding){
D
Diego Biurrun 已提交
1556
        /* release non reference frames */
M
Michael Niedermayer 已提交
1557 1558 1559 1560 1561 1562
        for(i=0; i<MAX_PICTURE_COUNT; i++){
            if(s->picture[i].data[0] && !s->picture[i].reference /*&& s->picture[i].type!=FF_BUFFER_TYPE_SHARED*/){
                s->avctx->release_buffer(s->avctx, (AVFrame*)&s->picture[i]);
            }
        }

M
Michael Niedermayer 已提交
1563 1564 1565 1566 1567 1568 1569
        if(s->current_picture_ptr && s->current_picture_ptr->data[0]==NULL)
            pic= (AVFrame*)s->current_picture_ptr; //we allready have a unused image (maybe it was set before reading the header)
        else{
            i= ff_find_unused_picture(s, 0);
            pic= (AVFrame*)&s->picture[i];
        }

1570 1571
        pic->reference= (s->pict_type != B_TYPE || s->codec_id == CODEC_ID_H264)
                        && !s->dropable ? 3 : 0;
M
Michael Niedermayer 已提交
1572

M
Michael Niedermayer 已提交
1573
        pic->coded_picture_number= s->coded_picture_number++;
1574

1575 1576
        if( alloc_picture(s, (Picture*)pic, 0) < 0)
            return -1;
1577

M
Michael Niedermayer 已提交
1578
        s->current_picture_ptr= (Picture*)pic;
1579
        s->current_picture_ptr->top_field_first= s->top_field_first; //FIXME use only the vars from current_pic
1580
        s->current_picture_ptr->interlaced_frame= !s->progressive_frame && !s->progressive_sequence;
M
cleanup  
Michael Niedermayer 已提交
1581
    }
1582

M
Michael Niedermayer 已提交
1583
    s->current_picture_ptr->pict_type= s->pict_type;
1584
//    if(s->flags && CODEC_FLAG_QSCALE)
1585
  //      s->current_picture_ptr->quality= s->new_picture_ptr->quality;
1586
    s->current_picture_ptr->key_frame= s->pict_type == I_TYPE;
M
Michael Niedermayer 已提交
1587

1588
    copy_picture(&s->current_picture, s->current_picture_ptr);
1589

M
cleanup  
Michael Niedermayer 已提交
1590
    if (s->pict_type != B_TYPE) {
M
Michael Niedermayer 已提交
1591
        s->last_picture_ptr= s->next_picture_ptr;
1592 1593
        if(!s->dropable)
            s->next_picture_ptr= s->current_picture_ptr;
F
Fabrice Bellard 已提交
1594
    }
1595
/*    av_log(s->avctx, AV_LOG_DEBUG, "L%p N%p C%p L%p N%p C%p type:%d drop:%d\n", s->last_picture_ptr, s->next_picture_ptr,s->current_picture_ptr,
1596 1597
        s->last_picture_ptr    ? s->last_picture_ptr->data[0] : NULL,
        s->next_picture_ptr    ? s->next_picture_ptr->data[0] : NULL,
1598 1599
        s->current_picture_ptr ? s->current_picture_ptr->data[0] : NULL,
        s->pict_type, s->dropable);*/
1600

1601 1602
    if(s->last_picture_ptr) copy_picture(&s->last_picture, s->last_picture_ptr);
    if(s->next_picture_ptr) copy_picture(&s->next_picture, s->next_picture_ptr);
1603

1604
    if(s->pict_type != I_TYPE && (s->last_picture_ptr==NULL || s->last_picture_ptr->data[0]==NULL) && !s->dropable){
1605
        av_log(avctx, AV_LOG_ERROR, "warning: first frame is no keyframe\n");
D
Diego Biurrun 已提交
1606
        assert(s->pict_type != B_TYPE); //these should have been dropped if we don't have a reference
1607 1608 1609 1610 1611
        goto alloc;
    }

    assert(s->pict_type == I_TYPE || (s->last_picture_ptr && s->last_picture_ptr->data[0]));

M
Michael Niedermayer 已提交
1612 1613 1614 1615 1616
    if(s->picture_structure!=PICT_FRAME){
        int i;
        for(i=0; i<4; i++){
            if(s->picture_structure == PICT_BOTTOM_FIELD){
                 s->current_picture.data[i] += s->current_picture.linesize[i];
1617
            }
M
Michael Niedermayer 已提交
1618 1619 1620 1621 1622
            s->current_picture.linesize[i] *= 2;
            s->last_picture.linesize[i] *=2;
            s->next_picture.linesize[i] *=2;
        }
    }
1623

1624 1625 1626
    s->hurry_up= s->avctx->hurry_up;
    s->error_resilience= avctx->error_resilience;

D
Diego Biurrun 已提交
1627 1628
    /* set dequantizer, we can't do it during init as it might change for mpeg4
       and we can't do it in the header decode as init isnt called for mpeg4 there yet */
1629 1630 1631
    if(s->mpeg_quant || s->codec_id == CODEC_ID_MPEG2VIDEO){
        s->dct_unquantize_intra = s->dct_unquantize_mpeg2_intra;
        s->dct_unquantize_inter = s->dct_unquantize_mpeg2_inter;
M
Maarten Daniels 已提交
1632
    }else if(s->out_format == FMT_H263 || s->out_format == FMT_H261){
1633 1634 1635 1636 1637 1638
        s->dct_unquantize_intra = s->dct_unquantize_h263_intra;
        s->dct_unquantize_inter = s->dct_unquantize_h263_inter;
    }else{
        s->dct_unquantize_intra = s->dct_unquantize_mpeg1_intra;
        s->dct_unquantize_inter = s->dct_unquantize_mpeg1_inter;
    }
1639

1640 1641 1642 1643 1644
    if(s->dct_error_sum){
        assert(s->avctx->noise_reduction && s->encoding);

        update_noise_reduction(s);
    }
1645

I
Ivan Kalvachev 已提交
1646 1647 1648 1649
#ifdef HAVE_XVMC
    if(s->avctx->xvmc_acceleration)
        return XVMC_field_start(s, avctx);
#endif
1650
    return 0;
F
Fabrice Bellard 已提交
1651
}
1652

F
Fabrice Bellard 已提交
1653 1654 1655
/* generic function for encode/decode called after a frame has been coded/decoded */
void MPV_frame_end(MpegEncContext *s)
{
M
cleanup  
Michael Niedermayer 已提交
1656
    int i;
F
Fabrice Bellard 已提交
1657
    /* draw edge for correct motion prediction if outside */
I
Ivan Kalvachev 已提交
1658 1659 1660 1661 1662 1663
#ifdef HAVE_XVMC
//just to make sure that all data is rendered.
    if(s->avctx->xvmc_acceleration){
        XVMC_field_end(s);
    }else
#endif
1664
    if(s->unrestricted_mv && s->current_picture.reference && !s->intra_only && !(s->flags&CODEC_FLAG_EMU_EDGE)) {
M
cleanup  
Michael Niedermayer 已提交
1665 1666 1667
            draw_edges(s->current_picture.data[0], s->linesize  , s->h_edge_pos   , s->v_edge_pos   , EDGE_WIDTH  );
            draw_edges(s->current_picture.data[1], s->uvlinesize, s->h_edge_pos>>1, s->v_edge_pos>>1, EDGE_WIDTH/2);
            draw_edges(s->current_picture.data[2], s->uvlinesize, s->h_edge_pos>>1, s->v_edge_pos>>1, EDGE_WIDTH/2);
F
Fabrice Bellard 已提交
1668
    }
M
Michael Niedermayer 已提交
1669
    emms_c();
1670

M
Michael Niedermayer 已提交
1671
    s->last_pict_type    = s->pict_type;
1672
    s->last_lambda_for[s->pict_type]= s->current_picture_ptr->quality;
1673 1674 1675
    if(s->pict_type!=B_TYPE){
        s->last_non_b_pict_type= s->pict_type;
    }
M
Michael Niedermayer 已提交
1676 1677
#if 0
        /* copy back current_picture variables */
M
cleanup  
Michael Niedermayer 已提交
1678 1679 1680 1681
    for(i=0; i<MAX_PICTURE_COUNT; i++){
        if(s->picture[i].data[0] == s->current_picture.data[0]){
            s->picture[i]= s->current_picture;
            break;
1682
        }
M
cleanup  
Michael Niedermayer 已提交
1683 1684
    }
    assert(i<MAX_PICTURE_COUNT);
1685
#endif
M
cleanup  
Michael Niedermayer 已提交
1686

M
Michael Niedermayer 已提交
1687
    if(s->encoding){
D
Diego Biurrun 已提交
1688
        /* release non-reference frames */
M
Michael Niedermayer 已提交
1689 1690 1691 1692 1693
        for(i=0; i<MAX_PICTURE_COUNT; i++){
            if(s->picture[i].data[0] && !s->picture[i].reference /*&& s->picture[i].type!=FF_BUFFER_TYPE_SHARED*/){
                s->avctx->release_buffer(s->avctx, (AVFrame*)&s->picture[i]);
            }
        }
M
cleanup  
Michael Niedermayer 已提交
1694
    }
M
Michael Niedermayer 已提交
1695 1696 1697 1698 1699 1700
    // clear copies, to avoid confusion
#if 0
    memset(&s->last_picture, 0, sizeof(Picture));
    memset(&s->next_picture, 0, sizeof(Picture));
    memset(&s->current_picture, 0, sizeof(Picture));
#endif
M
Michael Niedermayer 已提交
1701
    s->avctx->coded_frame= (AVFrame*)s->current_picture_ptr;
F
Fabrice Bellard 已提交
1702 1703
}

1704 1705 1706 1707 1708 1709 1710 1711
/**
 * draws an line from (ex, ey) -> (sx, sy).
 * @param w width of the image
 * @param h height of the image
 * @param stride stride/linesize of the image
 * @param color color of the arrow
 */
static void draw_line(uint8_t *buf, int sx, int sy, int ex, int ey, int w, int h, int stride, int color){
M
SWAP  
Michael Niedermayer 已提交
1712
    int x, y, fr, f;
1713

1714 1715 1716 1717
    sx= av_clip(sx, 0, w-1);
    sy= av_clip(sy, 0, h-1);
    ex= av_clip(ex, 0, w-1);
    ey= av_clip(ey, 0, h-1);
1718

1719
    buf[sy*stride + sx]+= color;
1720

D
Diego Biurrun 已提交
1721
    if(FFABS(ex - sx) > FFABS(ey - sy)){
1722
        if(sx > ex){
D
Diego Biurrun 已提交
1723 1724
            FFSWAP(int, sx, ex);
            FFSWAP(int, sy, ey);
1725 1726 1727 1728 1729
        }
        buf+= sx + sy*stride;
        ex-= sx;
        f= ((ey-sy)<<16)/ex;
        for(x= 0; x <= ex; x++){
1730 1731 1732 1733
            y = (x*f)>>16;
            fr= (x*f)&0xFFFF;
            buf[ y   *stride + x]+= (color*(0x10000-fr))>>16;
            buf[(y+1)*stride + x]+= (color*         fr )>>16;
1734 1735 1736
        }
    }else{
        if(sy > ey){
D
Diego Biurrun 已提交
1737 1738
            FFSWAP(int, sx, ex);
            FFSWAP(int, sy, ey);
1739 1740 1741 1742 1743 1744
        }
        buf+= sx + sy*stride;
        ey-= sy;
        if(ey) f= ((ex-sx)<<16)/ey;
        else   f= 0;
        for(y= 0; y <= ey; y++){
1745 1746 1747 1748
            x = (y*f)>>16;
            fr= (y*f)&0xFFFF;
            buf[y*stride + x  ]+= (color*(0x10000-fr))>>16;;
            buf[y*stride + x+1]+= (color*         fr )>>16;;
1749 1750 1751 1752 1753 1754 1755 1756 1757 1758 1759
        }
    }
}

/**
 * draws an arrow from (ex, ey) -> (sx, sy).
 * @param w width of the image
 * @param h height of the image
 * @param stride stride/linesize of the image
 * @param color color of the arrow
 */
1760
static void draw_arrow(uint8_t *buf, int sx, int sy, int ex, int ey, int w, int h, int stride, int color){
1761 1762
    int dx,dy;

1763 1764 1765 1766
    sx= av_clip(sx, -100, w+100);
    sy= av_clip(sy, -100, h+100);
    ex= av_clip(ex, -100, w+100);
    ey= av_clip(ey, -100, h+100);
1767

1768 1769
    dx= ex - sx;
    dy= ey - sy;
1770

1771 1772 1773 1774
    if(dx*dx + dy*dy > 3*3){
        int rx=  dx + dy;
        int ry= -dx + dy;
        int length= ff_sqrt((rx*rx + ry*ry)<<8);
1775

1776 1777 1778
        //FIXME subpixel accuracy
        rx= ROUNDED_DIV(rx*3<<4, length);
        ry= ROUNDED_DIV(ry*3<<4, length);
1779

1780 1781 1782 1783 1784 1785
        draw_line(buf, sx, sy, sx + rx, sy + ry, w, h, stride, color);
        draw_line(buf, sx, sy, sx - ry, sy + rx, w, h, stride, color);
    }
    draw_line(buf, sx, sy, ex, ey, w, h, stride, color);
}

1786 1787 1788
/**
 * prints debuging info for the given picture.
 */
1789
void ff_print_debug_info(MpegEncContext *s, AVFrame *pict){
1790 1791 1792 1793 1794

    if(!pict || !pict->mb_type) return;

    if(s->avctx->debug&(FF_DEBUG_SKIP | FF_DEBUG_QP | FF_DEBUG_MB_TYPE)){
        int x,y;
1795

1796 1797 1798 1799 1800 1801 1802
        av_log(s->avctx,AV_LOG_DEBUG,"New frame, type: ");
        switch (pict->pict_type) {
            case FF_I_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"I\n"); break;
            case FF_P_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"P\n"); break;
            case FF_B_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"B\n"); break;
            case FF_S_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"S\n"); break;
            case FF_SI_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"SI\n"); break;
1803
            case FF_SP_TYPE: av_log(s->avctx,AV_LOG_DEBUG,"SP\n"); break;
1804
        }
1805 1806 1807 1808 1809
        for(y=0; y<s->mb_height; y++){
            for(x=0; x<s->mb_width; x++){
                if(s->avctx->debug&FF_DEBUG_SKIP){
                    int count= s->mbskip_table[x + y*s->mb_stride];
                    if(count>9) count=9;
1810
                    av_log(s->avctx, AV_LOG_DEBUG, "%1d", count);
1811 1812
                }
                if(s->avctx->debug&FF_DEBUG_QP){
1813
                    av_log(s->avctx, AV_LOG_DEBUG, "%2d", pict->qscale_table[x + y*s->mb_stride]);
1814 1815 1816 1817 1818
                }
                if(s->avctx->debug&FF_DEBUG_MB_TYPE){
                    int mb_type= pict->mb_type[x + y*s->mb_stride];
                    //Type & MV direction
                    if(IS_PCM(mb_type))
1819
                        av_log(s->avctx, AV_LOG_DEBUG, "P");
1820
                    else if(IS_INTRA(mb_type) && IS_ACPRED(mb_type))
1821
                        av_log(s->avctx, AV_LOG_DEBUG, "A");
1822
                    else if(IS_INTRA4x4(mb_type))
1823
                        av_log(s->avctx, AV_LOG_DEBUG, "i");
1824
                    else if(IS_INTRA16x16(mb_type))
1825
                        av_log(s->avctx, AV_LOG_DEBUG, "I");
1826
                    else if(IS_DIRECT(mb_type) && IS_SKIP(mb_type))
1827
                        av_log(s->avctx, AV_LOG_DEBUG, "d");
1828
                    else if(IS_DIRECT(mb_type))
1829
                        av_log(s->avctx, AV_LOG_DEBUG, "D");
1830
                    else if(IS_GMC(mb_type) && IS_SKIP(mb_type))
1831
                        av_log(s->avctx, AV_LOG_DEBUG, "g");
1832
                    else if(IS_GMC(mb_type))
1833
                        av_log(s->avctx, AV_LOG_DEBUG, "G");
1834
                    else if(IS_SKIP(mb_type))
1835
                        av_log(s->avctx, AV_LOG_DEBUG, "S");
1836
                    else if(!USES_LIST(mb_type, 1))
1837
                        av_log(s->avctx, AV_LOG_DEBUG, ">");
1838
                    else if(!USES_LIST(mb_type, 0))
1839
                        av_log(s->avctx, AV_LOG_DEBUG, "<");
1840 1841
                    else{
                        assert(USES_LIST(mb_type, 0) && USES_LIST(mb_type, 1));
1842
                        av_log(s->avctx, AV_LOG_DEBUG, "X");
1843
                    }
1844

1845 1846
                    //segmentation
                    if(IS_8X8(mb_type))
1847
                        av_log(s->avctx, AV_LOG_DEBUG, "+");
1848
                    else if(IS_16X8(mb_type))
1849
                        av_log(s->avctx, AV_LOG_DEBUG, "-");
1850
                    else if(IS_8X16(mb_type))
1851
                        av_log(s->avctx, AV_LOG_DEBUG, "|");
1852
                    else if(IS_INTRA(mb_type) || IS_16X16(mb_type))
1853
                        av_log(s->avctx, AV_LOG_DEBUG, " ");
1854
                    else
1855
                        av_log(s->avctx, AV_LOG_DEBUG, "?");
1856 1857


1858
                    if(IS_INTERLACED(mb_type) && s->codec_id == CODEC_ID_H264)
1859
                        av_log(s->avctx, AV_LOG_DEBUG, "=");
1860
                    else
1861
                        av_log(s->avctx, AV_LOG_DEBUG, " ");
1862
                }
1863
//                av_log(s->avctx, AV_LOG_DEBUG, " ");
1864
            }
1865
            av_log(s->avctx, AV_LOG_DEBUG, "\n");
1866 1867
        }
    }
1868

1869
    if((s->avctx->debug&(FF_DEBUG_VIS_QP|FF_DEBUG_VIS_MB_TYPE)) || (s->avctx->debug_mv)){
1870 1871
        const int shift= 1 + s->quarter_sample;
        int mb_y;
1872 1873
        uint8_t *ptr;
        int i;
1874
        int h_chroma_shift, v_chroma_shift;
1875 1876
        const int width = s->avctx->width;
        const int height= s->avctx->height;
1877
        const int mv_sample_log2= 4 - pict->motion_subsample_log2;
1878
        const int mv_stride= (s->mb_width << mv_sample_log2) + (s->codec_id == CODEC_ID_H264 ? 0 : 1);
M
100000l  
Michael Niedermayer 已提交
1879
        s->low_delay=0; //needed to see the vectors without trashing the buffers
1880

1881
        avcodec_get_chroma_sub_sample(s->avctx->pix_fmt, &h_chroma_shift, &v_chroma_shift);
1882
        for(i=0; i<3; i++){
1883
            memcpy(s->visualization_buffer[i], pict->data[i], (i==0) ? pict->linesize[i]*height:pict->linesize[i]*height >> v_chroma_shift);
1884 1885 1886 1887
            pict->data[i]= s->visualization_buffer[i];
        }
        pict->type= FF_BUFFER_TYPE_COPY;
        ptr= pict->data[0];
1888 1889 1890 1891 1892

        for(mb_y=0; mb_y<s->mb_height; mb_y++){
            int mb_x;
            for(mb_x=0; mb_x<s->mb_width; mb_x++){
                const int mb_index= mb_x + mb_y*s->mb_stride;
1893 1894 1895
                if((s->avctx->debug_mv) && pict->motion_val){
                  int type;
                  for(type=0; type<3; type++){
1896
                    int direction = 0;
1897 1898 1899 1900 1901 1902 1903 1904 1905 1906 1907 1908 1909 1910
                    switch (type) {
                      case 0: if ((!(s->avctx->debug_mv&FF_DEBUG_VIS_MV_P_FOR)) || (pict->pict_type!=FF_P_TYPE))
                                continue;
                              direction = 0;
                              break;
                      case 1: if ((!(s->avctx->debug_mv&FF_DEBUG_VIS_MV_B_FOR)) || (pict->pict_type!=FF_B_TYPE))
                                continue;
                              direction = 0;
                              break;
                      case 2: if ((!(s->avctx->debug_mv&FF_DEBUG_VIS_MV_B_BACK)) || (pict->pict_type!=FF_B_TYPE))
                                continue;
                              direction = 1;
                              break;
                    }
1911 1912 1913
                    if(!USES_LIST(pict->mb_type[mb_index], direction))
                        continue;

1914 1915 1916
                    if(IS_8X8(pict->mb_type[mb_index])){
                      int i;
                      for(i=0; i<4; i++){
1917 1918
                        int sx= mb_x*16 + 4 + 8*(i&1);
                        int sy= mb_y*16 + 4 + 8*(i>>1);
1919
                        int xy= (mb_x*2 + (i&1) + (mb_y*2 + (i>>1))*mv_stride) << (mv_sample_log2-1);
1920 1921
                        int mx= (pict->motion_val[direction][xy][0]>>shift) + sx;
                        int my= (pict->motion_val[direction][xy][1]>>shift) + sy;
1922
                        draw_arrow(ptr, sx, sy, mx, my, width, height, s->linesize, 100);
1923 1924 1925 1926
                      }
                    }else if(IS_16X8(pict->mb_type[mb_index])){
                      int i;
                      for(i=0; i<2; i++){
1927 1928
                        int sx=mb_x*16 + 8;
                        int sy=mb_y*16 + 4 + 8*i;
1929
                        int xy= (mb_x*2 + (mb_y*2 + i)*mv_stride) << (mv_sample_log2-1);
1930 1931
                        int mx=(pict->motion_val[direction][xy][0]>>shift);
                        int my=(pict->motion_val[direction][xy][1]>>shift);
1932

1933 1934
                        if(IS_INTERLACED(pict->mb_type[mb_index]))
                            my*=2;
1935

1936 1937 1938 1939 1940 1941 1942
                        draw_arrow(ptr, sx, sy, mx+sx, my+sy, width, height, s->linesize, 100);
                      }
                    }else if(IS_8X16(pict->mb_type[mb_index])){
                      int i;
                      for(i=0; i<2; i++){
                        int sx=mb_x*16 + 4 + 8*i;
                        int sy=mb_y*16 + 8;
1943
                        int xy= (mb_x*2 + i + mb_y*2*mv_stride) << (mv_sample_log2-1);
1944 1945
                        int mx=(pict->motion_val[direction][xy][0]>>shift);
                        int my=(pict->motion_val[direction][xy][1]>>shift);
1946

1947 1948
                        if(IS_INTERLACED(pict->mb_type[mb_index]))
                            my*=2;
1949

1950
                        draw_arrow(ptr, sx, sy, mx+sx, my+sy, width, height, s->linesize, 100);
1951 1952 1953 1954
                      }
                    }else{
                      int sx= mb_x*16 + 8;
                      int sy= mb_y*16 + 8;
1955
                      int xy= (mb_x + mb_y*mv_stride) << mv_sample_log2;
1956 1957
                      int mx= (pict->motion_val[direction][xy][0]>>shift) + sx;
                      int my= (pict->motion_val[direction][xy][1]>>shift) + sy;
1958
                      draw_arrow(ptr, sx, sy, mx, my, width, height, s->linesize, 100);
1959
                    }
1960
                  }
M
Michael Niedermayer 已提交
1961 1962 1963 1964 1965 1966 1967 1968 1969 1970 1971 1972 1973 1974 1975 1976 1977
                }
                if((s->avctx->debug&FF_DEBUG_VIS_QP) && pict->motion_val){
                    uint64_t c= (pict->qscale_table[mb_index]*128/31) * 0x0101010101010101ULL;
                    int y;
                    for(y=0; y<8; y++){
                        *(uint64_t*)(pict->data[1] + 8*mb_x + (8*mb_y + y)*pict->linesize[1])= c;
                        *(uint64_t*)(pict->data[2] + 8*mb_x + (8*mb_y + y)*pict->linesize[2])= c;
                    }
                }
                if((s->avctx->debug&FF_DEBUG_VIS_MB_TYPE) && pict->motion_val){
                    int mb_type= pict->mb_type[mb_index];
                    uint64_t u,v;
                    int y;
#define COLOR(theta, r)\
u= (int)(128 + r*cos(theta*3.141592/180));\
v= (int)(128 + r*sin(theta*3.141592/180));

1978

M
Michael Niedermayer 已提交
1979 1980 1981 1982 1983 1984 1985 1986 1987 1988 1989 1990 1991 1992 1993 1994 1995 1996 1997 1998 1999 2000 2001 2002 2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017 2018 2019 2020
                    u=v=128;
                    if(IS_PCM(mb_type)){
                        COLOR(120,48)
                    }else if((IS_INTRA(mb_type) && IS_ACPRED(mb_type)) || IS_INTRA16x16(mb_type)){
                        COLOR(30,48)
                    }else if(IS_INTRA4x4(mb_type)){
                        COLOR(90,48)
                    }else if(IS_DIRECT(mb_type) && IS_SKIP(mb_type)){
//                        COLOR(120,48)
                    }else if(IS_DIRECT(mb_type)){
                        COLOR(150,48)
                    }else if(IS_GMC(mb_type) && IS_SKIP(mb_type)){
                        COLOR(170,48)
                    }else if(IS_GMC(mb_type)){
                        COLOR(190,48)
                    }else if(IS_SKIP(mb_type)){
//                        COLOR(180,48)
                    }else if(!USES_LIST(mb_type, 1)){
                        COLOR(240,48)
                    }else if(!USES_LIST(mb_type, 0)){
                        COLOR(0,48)
                    }else{
                        assert(USES_LIST(mb_type, 0) && USES_LIST(mb_type, 1));
                        COLOR(300,48)
                    }

                    u*= 0x0101010101010101ULL;
                    v*= 0x0101010101010101ULL;
                    for(y=0; y<8; y++){
                        *(uint64_t*)(pict->data[1] + 8*mb_x + (8*mb_y + y)*pict->linesize[1])= u;
                        *(uint64_t*)(pict->data[2] + 8*mb_x + (8*mb_y + y)*pict->linesize[2])= v;
                    }

                    //segmentation
                    if(IS_8X8(mb_type) || IS_16X8(mb_type)){
                        *(uint64_t*)(pict->data[0] + 16*mb_x + 0 + (16*mb_y + 8)*pict->linesize[0])^= 0x8080808080808080ULL;
                        *(uint64_t*)(pict->data[0] + 16*mb_x + 8 + (16*mb_y + 8)*pict->linesize[0])^= 0x8080808080808080ULL;
                    }
                    if(IS_8X8(mb_type) || IS_8X16(mb_type)){
                        for(y=0; y<16; y++)
                            pict->data[0][16*mb_x + 8 + (16*mb_y + y)*pict->linesize[0]]^= 0x80;
                    }
2021 2022 2023 2024 2025 2026 2027 2028 2029 2030 2031 2032 2033 2034 2035
                    if(IS_8X8(mb_type) && mv_sample_log2 >= 2){
                        int dm= 1 << (mv_sample_log2-2);
                        for(i=0; i<4; i++){
                            int sx= mb_x*16 + 8*(i&1);
                            int sy= mb_y*16 + 8*(i>>1);
                            int xy= (mb_x*2 + (i&1) + (mb_y*2 + (i>>1))*mv_stride) << (mv_sample_log2-1);
                            //FIXME bidir
                            int32_t *mv = (int32_t*)&pict->motion_val[0][xy];
                            if(mv[0] != mv[dm] || mv[dm*mv_stride] != mv[dm*(mv_stride+1)])
                                for(y=0; y<8; y++)
                                    pict->data[0][sx + 4 + (sy + y)*pict->linesize[0]]^= 0x80;
                            if(mv[0] != mv[dm*mv_stride] || mv[dm] != mv[dm*(mv_stride+1)])
                                *(uint64_t*)(pict->data[0] + sx + (sy + 4)*pict->linesize[0])^= 0x8080808080808080ULL;
                        }
                    }
2036

M
Michael Niedermayer 已提交
2037 2038 2039
                    if(IS_INTERLACED(mb_type) && s->codec_id == CODEC_ID_H264){
                        // hmm
                    }
2040 2041 2042 2043 2044
                }
                s->mbskip_table[mb_index]=0;
            }
        }
    }
2045 2046
}

2047 2048
#ifdef CONFIG_ENCODERS

M
Michael Niedermayer 已提交
2049 2050 2051
static int get_sae(uint8_t *src, int ref, int stride){
    int x,y;
    int acc=0;
2052

M
Michael Niedermayer 已提交
2053 2054
    for(y=0; y<16; y++){
        for(x=0; x<16; x++){
D
Diego Biurrun 已提交
2055
            acc+= FFABS(src[x+y*stride] - ref);
M
Michael Niedermayer 已提交
2056 2057
        }
    }
2058

M
Michael Niedermayer 已提交
2059 2060 2061 2062 2063 2064
    return acc;
}

static int get_intra_count(MpegEncContext *s, uint8_t *src, uint8_t *ref, int stride){
    int x, y, w, h;
    int acc=0;
2065

M
Michael Niedermayer 已提交
2066 2067
    w= s->width &~15;
    h= s->height&~15;
2068

M
Michael Niedermayer 已提交
2069 2070 2071
    for(y=0; y<h; y+=16){
        for(x=0; x<w; x+=16){
            int offset= x + y*stride;
M
Michael Niedermayer 已提交
2072
            int sad = s->dsp.sad[0](NULL, src + offset, ref + offset, stride, 16);
M
Michael Niedermayer 已提交
2073 2074
            int mean= (s->dsp.pix_sum(src + offset, stride) + 128)>>8;
            int sae = get_sae(src + offset, mean, stride);
2075

M
Michael Niedermayer 已提交
2076 2077 2078 2079 2080 2081
            acc+= sae + 500 < sad;
        }
    }
    return acc;
}

M
Michael Niedermayer 已提交
2082

M
Michael Niedermayer 已提交
2083
static int load_input_picture(MpegEncContext *s, AVFrame *pic_arg){
2084
    AVFrame *pic=NULL;
2085
    int64_t pts;
M
Michael Niedermayer 已提交
2086
    int i;
M
cleanup  
Michael Niedermayer 已提交
2087
    const int encoding_delay= s->max_b_frames;
M
Michael Niedermayer 已提交
2088
    int direct=1;
2089

2090
    if(pic_arg){
2091 2092 2093
        pts= pic_arg->pts;
        pic_arg->display_picture_number= s->input_picture_number++;

2094
        if(pts != AV_NOPTS_VALUE){
2095
            if(s->user_specified_pts != AV_NOPTS_VALUE){
2096 2097
                int64_t time= pts;
                int64_t last= s->user_specified_pts;
2098 2099

                if(time <= last){
2100
                    av_log(s->avctx, AV_LOG_ERROR, "Error, Invalid timestamp=%"PRId64", last=%"PRId64"\n", pts, s->user_specified_pts);
2101 2102 2103
                    return -1;
                }
            }
2104
            s->user_specified_pts= pts;
2105 2106
        }else{
            if(s->user_specified_pts != AV_NOPTS_VALUE){
2107
                s->user_specified_pts=
2108
                pts= s->user_specified_pts + 1;
2109
                av_log(s->avctx, AV_LOG_INFO, "Warning: AVFrame.pts=? trying to guess (%"PRId64")\n", pts);
2110
            }else{
2111
                pts= pic_arg->display_picture_number;
2112 2113 2114 2115
            }
        }
    }

2116
  if(pic_arg){
M
Michael Niedermayer 已提交
2117 2118 2119 2120
    if(encoding_delay && !(s->flags&CODEC_FLAG_INPUT_PRESERVED)) direct=0;
    if(pic_arg->linesize[0] != s->linesize) direct=0;
    if(pic_arg->linesize[1] != s->uvlinesize) direct=0;
    if(pic_arg->linesize[2] != s->uvlinesize) direct=0;
2121

2122
//    av_log(AV_LOG_DEBUG, "%d %d %d %d\n",pic_arg->linesize[0], pic_arg->linesize[1], s->linesize, s->uvlinesize);
2123

M
Michael Niedermayer 已提交
2124
    if(direct){
M
Michael Niedermayer 已提交
2125
        i= ff_find_unused_picture(s, 1);
M
cleanup  
Michael Niedermayer 已提交
2126

M
Michael Niedermayer 已提交
2127
        pic= (AVFrame*)&s->picture[i];
M
Michael Niedermayer 已提交
2128
        pic->reference= 3;
2129

M
Michael Niedermayer 已提交
2130 2131 2132 2133 2134 2135
        for(i=0; i<4; i++){
            pic->data[i]= pic_arg->data[i];
            pic->linesize[i]= pic_arg->linesize[i];
        }
        alloc_picture(s, (Picture*)pic, 1);
    }else{
M
Michael Niedermayer 已提交
2136
        i= ff_find_unused_picture(s, 0);
M
cleanup  
Michael Niedermayer 已提交
2137

M
Michael Niedermayer 已提交
2138
        pic= (AVFrame*)&s->picture[i];
M
Michael Niedermayer 已提交
2139
        pic->reference= 3;
M
cleanup  
Michael Niedermayer 已提交
2140

M
Michael Niedermayer 已提交
2141 2142
        alloc_picture(s, (Picture*)pic, 0);

M
Michael Niedermayer 已提交
2143 2144 2145
        if(   pic->data[0] + INPLACE_OFFSET == pic_arg->data[0]
           && pic->data[1] + INPLACE_OFFSET == pic_arg->data[1]
           && pic->data[2] + INPLACE_OFFSET == pic_arg->data[2]){
M
cleanup  
Michael Niedermayer 已提交
2146
       // empty
M
Michael Niedermayer 已提交
2147 2148 2149
        }else{
            int h_chroma_shift, v_chroma_shift;
            avcodec_get_chroma_sub_sample(s->avctx->pix_fmt, &h_chroma_shift, &v_chroma_shift);
2150

M
Michael Niedermayer 已提交
2151 2152 2153 2154 2155 2156 2157 2158
            for(i=0; i<3; i++){
                int src_stride= pic_arg->linesize[i];
                int dst_stride= i ? s->uvlinesize : s->linesize;
                int h_shift= i ? h_chroma_shift : 0;
                int v_shift= i ? v_chroma_shift : 0;
                int w= s->width >>h_shift;
                int h= s->height>>v_shift;
                uint8_t *src= pic_arg->data[i];
2159 2160 2161 2162
                uint8_t *dst= pic->data[i];

                if(!s->avctx->rc_buffer_size)
                    dst +=INPLACE_OFFSET;
2163

M
Michael Niedermayer 已提交
2164 2165 2166 2167 2168 2169 2170 2171
                if(src_stride==dst_stride)
                    memcpy(dst, src, src_stride*h);
                else{
                    while(h--){
                        memcpy(dst, src, w);
                        dst += dst_stride;
                        src += src_stride;
                    }
M
cleanup  
Michael Niedermayer 已提交
2172
                }
2173
            }
M
cleanup  
Michael Niedermayer 已提交
2174 2175
        }
    }
2176
    copy_picture_attributes(s, pic, pic_arg);
2177
    pic->pts= pts; //we set this here to avoid modifiying pic_arg
2178
  }
2179

M
Michael Niedermayer 已提交
2180 2181 2182
    /* shift buffer entries */
    for(i=1; i<MAX_PICTURE_COUNT /*s->encoding_delay+1*/; i++)
        s->input_picture[i-1]= s->input_picture[i];
2183

M
Michael Niedermayer 已提交
2184
    s->input_picture[encoding_delay]= (Picture*)pic;
M
cleanup  
Michael Niedermayer 已提交
2185 2186 2187

    return 0;
}
2188

M
Michael Niedermayer 已提交
2189 2190 2191
static int skip_check(MpegEncContext *s, Picture *p, Picture *ref){
    int x, y, plane;
    int score=0;
2192
    int64_t score64=0;
M
Michael Niedermayer 已提交
2193 2194 2195 2196 2197 2198

    for(plane=0; plane<3; plane++){
        const int stride= p->linesize[plane];
        const int bw= plane ? 1 : 2;
        for(y=0; y<s->mb_height*bw; y++){
            for(x=0; x<s->mb_width*bw; x++){
M
Michael Niedermayer 已提交
2199 2200
                int off= p->type == FF_BUFFER_TYPE_SHARED ? 0: 16;
                int v= s->dsp.frame_skip_cmp[1](s, p->data[plane] + 8*(x + y*stride)+off, ref->data[plane] + 8*(x + y*stride), stride, 8);
2201

2202 2203
                switch(s->avctx->frame_skip_exp){
                    case 0: score= FFMAX(score, v); break;
D
Diego Biurrun 已提交
2204
                    case 1: score+= FFABS(v);break;
2205
                    case 2: score+= v*v;break;
D
Diego Biurrun 已提交
2206
                    case 3: score64+= FFABS(v*v*(int64_t)v);break;
2207 2208
                    case 4: score64+= v*v*(int64_t)(v*v);break;
                }
M
Michael Niedermayer 已提交
2209 2210 2211
            }
        }
    }
2212

2213
    if(score) score64= score;
M
Michael Niedermayer 已提交
2214

2215
    if(score64 < s->avctx->frame_skip_threshold)
M
Michael Niedermayer 已提交
2216
        return 1;
2217
    if(score64 < ((s->avctx->frame_skip_factor * (int64_t)s->lambda)>>8))
M
Michael Niedermayer 已提交
2218 2219 2220 2221
        return 1;
    return 0;
}

M
Michael Niedermayer 已提交
2222 2223 2224 2225
static int estimate_best_b_count(MpegEncContext *s){
    AVCodec *codec= avcodec_find_encoder(s->avctx->codec_id);
    AVCodecContext *c= avcodec_alloc_context();
    AVFrame input[FF_MAX_B_FRAMES+2];
2226
    const int scale= s->avctx->brd_scale;
M
Michael Niedermayer 已提交
2227
    int i, j, out_size, p_lambda, b_lambda, lambda2;
2228
    int outbuf_size= s->width * s->height; //FIXME
M
Michael Niedermayer 已提交
2229 2230 2231
    uint8_t *outbuf= av_malloc(outbuf_size);
    int64_t best_rd= INT64_MAX;
    int best_b_count= -1;
M
Michael Niedermayer 已提交
2232

2233 2234
    assert(scale>=0 && scale <=3);

M
Michael Niedermayer 已提交
2235 2236
//    emms_c();
    p_lambda= s->last_lambda_for[P_TYPE]; //s->next_picture_ptr->quality;
D
Diego Biurrun 已提交
2237
    b_lambda= s->last_lambda_for[B_TYPE]; //p_lambda *FFABS(s->avctx->b_quant_factor) + s->avctx->b_quant_offset;
M
Michael Niedermayer 已提交
2238 2239
    if(!b_lambda) b_lambda= p_lambda; //FIXME we should do this somewhere else
    lambda2= (b_lambda*b_lambda + (1<<FF_LAMBDA_SHIFT)/2 ) >> FF_LAMBDA_SHIFT;
M
Michael Niedermayer 已提交
2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258

    c->width = s->width >> scale;
    c->height= s->height>> scale;
    c->flags= CODEC_FLAG_QSCALE | CODEC_FLAG_PSNR | CODEC_FLAG_INPUT_PRESERVED /*| CODEC_FLAG_EMU_EDGE*/;
    c->flags|= s->avctx->flags & CODEC_FLAG_QPEL;
    c->mb_decision= s->avctx->mb_decision;
    c->me_cmp= s->avctx->me_cmp;
    c->mb_cmp= s->avctx->mb_cmp;
    c->me_sub_cmp= s->avctx->me_sub_cmp;
    c->pix_fmt = PIX_FMT_YUV420P;
    c->time_base= s->avctx->time_base;
    c->max_b_frames= s->max_b_frames;

    if (avcodec_open(c, codec) < 0)
        return -1;

    for(i=0; i<s->max_b_frames+2; i++){
        int ysize= c->width*c->height;
        int csize= (c->width/2)*(c->height/2);
M
Michael Niedermayer 已提交
2259 2260
        Picture pre_input, *pre_input_ptr= i ? s->input_picture[i-1] : s->next_picture_ptr;

M
Michael Niedermayer 已提交
2261 2262 2263 2264 2265 2266 2267 2268
        avcodec_get_frame_defaults(&input[i]);
        input[i].data[0]= av_malloc(ysize + 2*csize);
        input[i].data[1]= input[i].data[0] + ysize;
        input[i].data[2]= input[i].data[1] + csize;
        input[i].linesize[0]= c->width;
        input[i].linesize[1]=
        input[i].linesize[2]= c->width/2;

2269 2270 2271 2272 2273 2274 2275 2276 2277
        if(pre_input_ptr && (!i || s->input_picture[i-1])) {
            pre_input= *pre_input_ptr;

            if(pre_input.type != FF_BUFFER_TYPE_SHARED && i) {
                pre_input.data[0]+=INPLACE_OFFSET;
                pre_input.data[1]+=INPLACE_OFFSET;
                pre_input.data[2]+=INPLACE_OFFSET;
            }

2278 2279 2280 2281
            s->dsp.shrink[scale](input[i].data[0], input[i].linesize[0], pre_input.data[0], pre_input.linesize[0], c->width, c->height);
            s->dsp.shrink[scale](input[i].data[1], input[i].linesize[1], pre_input.data[1], pre_input.linesize[1], c->width>>1, c->height>>1);
            s->dsp.shrink[scale](input[i].data[2], input[i].linesize[2], pre_input.data[2], pre_input.linesize[2], c->width>>1, c->height>>1);
        }
M
Michael Niedermayer 已提交
2282 2283 2284 2285 2286 2287 2288 2289 2290 2291 2292
    }

    for(j=0; j<s->max_b_frames+1; j++){
        int64_t rd=0;

        if(!s->input_picture[j])
            break;

        c->error[0]= c->error[1]= c->error[2]= 0;

        input[0].pict_type= I_TYPE;
M
Michael Niedermayer 已提交
2293
        input[0].quality= 1 * FF_QP2LAMBDA;
M
Michael Niedermayer 已提交
2294
        out_size = avcodec_encode_video(c, outbuf, outbuf_size, &input[0]);
M
Michael Niedermayer 已提交
2295
//        rd += (out_size * lambda2) >> FF_LAMBDA_SHIFT;
M
Michael Niedermayer 已提交
2296 2297 2298 2299 2300

        for(i=0; i<s->max_b_frames+1; i++){
            int is_p= i % (j+1) == j || i==s->max_b_frames;

            input[i+1].pict_type= is_p ? P_TYPE : B_TYPE;
M
Michael Niedermayer 已提交
2301
            input[i+1].quality= is_p ? p_lambda : b_lambda;
M
Michael Niedermayer 已提交
2302
            out_size = avcodec_encode_video(c, outbuf, outbuf_size, &input[i+1]);
M
Michael Niedermayer 已提交
2303
            rd += (out_size * lambda2) >> (FF_LAMBDA_SHIFT - 3);
M
Michael Niedermayer 已提交
2304 2305 2306 2307 2308
        }

        /* get the delayed frames */
        while(out_size){
            out_size = avcodec_encode_video(c, outbuf, outbuf_size, NULL);
M
Michael Niedermayer 已提交
2309
            rd += (out_size * lambda2) >> (FF_LAMBDA_SHIFT - 3);
M
Michael Niedermayer 已提交
2310 2311 2312 2313 2314 2315 2316 2317 2318 2319 2320 2321 2322 2323 2324 2325 2326 2327 2328 2329 2330
        }

        rd += c->error[0] + c->error[1] + c->error[2];

        if(rd < best_rd){
            best_rd= rd;
            best_b_count= j;
        }
    }

    av_freep(&outbuf);
    avcodec_close(c);
    av_freep(&c);

    for(i=0; i<s->max_b_frames+2; i++){
        av_freep(&input[i].data[0]);
    }

    return best_b_count;
}

M
cleanup  
Michael Niedermayer 已提交
2331 2332
static void select_input_picture(MpegEncContext *s){
    int i;
M
Michael Niedermayer 已提交
2333

M
cleanup  
Michael Niedermayer 已提交
2334 2335 2336 2337
    for(i=1; i<MAX_PICTURE_COUNT; i++)
        s->reordered_input_picture[i-1]= s->reordered_input_picture[i];
    s->reordered_input_picture[MAX_PICTURE_COUNT-1]= NULL;

D
Diego Biurrun 已提交
2338
    /* set next picture type & ordering */
M
cleanup  
Michael Niedermayer 已提交
2339
    if(s->reordered_input_picture[0]==NULL && s->input_picture[0]){
M
Michael Niedermayer 已提交
2340
        if(/*s->picture_in_gop_number >= s->gop_size ||*/ s->next_picture_ptr==NULL || s->intra_only){
M
Michael Niedermayer 已提交
2341 2342
            s->reordered_input_picture[0]= s->input_picture[0];
            s->reordered_input_picture[0]->pict_type= I_TYPE;
M
Michael Niedermayer 已提交
2343
            s->reordered_input_picture[0]->coded_picture_number= s->coded_picture_number++;
M
Michael Niedermayer 已提交
2344 2345
        }else{
            int b_frames;
M
Michael Niedermayer 已提交
2346 2347

            if(s->avctx->frame_skip_threshold || s->avctx->frame_skip_factor){
M
Michael Niedermayer 已提交
2348 2349
                if(s->picture_in_gop_number < s->gop_size && skip_check(s, s->input_picture[0], s->next_picture_ptr)){
                //FIXME check that te gop check above is +-1 correct
2350
//av_log(NULL, AV_LOG_DEBUG, "skip %p %"PRId64"\n", s->input_picture[0]->data[0], s->input_picture[0]->pts);
2351

M
Michael Niedermayer 已提交
2352 2353 2354
                    if(s->input_picture[0]->type == FF_BUFFER_TYPE_SHARED){
                        for(i=0; i<4; i++)
                            s->input_picture[0]->data[i]= NULL;
2355
                        s->input_picture[0]->type= 0;
M
Michael Niedermayer 已提交
2356
                    }else{
2357
                        assert(   s->input_picture[0]->type==FF_BUFFER_TYPE_USER
M
Michael Niedermayer 已提交
2358
                               || s->input_picture[0]->type==FF_BUFFER_TYPE_INTERNAL);
2359

M
Michael Niedermayer 已提交
2360 2361
                        s->avctx->release_buffer(s->avctx, (AVFrame*)s->input_picture[0]);
                    }
2362

M
Michael Niedermayer 已提交
2363 2364
                    emms_c();
                    ff_vbv_update(s, 0);
M
Michael Niedermayer 已提交
2365 2366 2367 2368 2369

                    goto no_output_pic;
                }
            }

M
Michael Niedermayer 已提交
2370 2371 2372
            if(s->flags&CODEC_FLAG_PASS2){
                for(i=0; i<s->max_b_frames+1; i++){
                    int pict_num= s->input_picture[0]->display_picture_number + i;
2373

2374
                    if(pict_num >= s->rc_context.num_entries)
2375
                        break;
2376
                    if(!s->input_picture[i]){
2377
                        s->rc_context.entry[pict_num-1].new_pict_type = P_TYPE;
2378 2379
                        break;
                    }
2380

2381
                    s->input_picture[i]->pict_type=
2382
                        s->rc_context.entry[pict_num].new_pict_type;
M
Michael Niedermayer 已提交
2383 2384
                }
            }
M
Michael Niedermayer 已提交
2385

2386
            if(s->avctx->b_frame_strategy==0){
M
Michael Niedermayer 已提交
2387
                b_frames= s->max_b_frames;
2388
                while(b_frames && !s->input_picture[b_frames]) b_frames--;
M
cleanup  
Michael Niedermayer 已提交
2389
            }else if(s->avctx->b_frame_strategy==1){
M
Michael Niedermayer 已提交
2390
                for(i=1; i<s->max_b_frames+1; i++){
2391
                    if(s->input_picture[i] && s->input_picture[i]->b_frame_score==0){
2392 2393
                        s->input_picture[i]->b_frame_score=
                            get_intra_count(s, s->input_picture[i  ]->data[0],
M
Michael Niedermayer 已提交
2394
                                               s->input_picture[i-1]->data[0], s->linesize) + 1;
M
Michael Niedermayer 已提交
2395 2396
                    }
                }
2397
                for(i=0; i<s->max_b_frames+1; i++){
2398
                    if(s->input_picture[i]==NULL || s->input_picture[i]->b_frame_score - 1 > s->mb_num/s->avctx->b_sensitivity) break;
M
Michael Niedermayer 已提交
2399
                }
2400

M
Michael Niedermayer 已提交
2401
                b_frames= FFMAX(0, i-1);
2402

M
Michael Niedermayer 已提交
2403 2404 2405 2406
                /* reset scores */
                for(i=0; i<b_frames+1; i++){
                    s->input_picture[i]->b_frame_score=0;
                }
M
Michael Niedermayer 已提交
2407 2408
            }else if(s->avctx->b_frame_strategy==2){
                b_frames= estimate_best_b_count(s);
M
Michael Niedermayer 已提交
2409
            }else{
2410
                av_log(s->avctx, AV_LOG_ERROR, "illegal b frame strategy\n");
M
Michael Niedermayer 已提交
2411
                b_frames=0;
2412
            }
M
Michael Niedermayer 已提交
2413 2414 2415 2416

            emms_c();
//static int b_count=0;
//b_count+= b_frames;
2417
//av_log(s->avctx, AV_LOG_DEBUG, "b_frames: %d\n", b_count);
2418 2419 2420 2421 2422 2423 2424

            for(i= b_frames - 1; i>=0; i--){
                int type= s->input_picture[i]->pict_type;
                if(type && type != B_TYPE)
                    b_frames= i;
            }
            if(s->input_picture[b_frames]->pict_type == B_TYPE && b_frames == s->max_b_frames){
2425
                av_log(s->avctx, AV_LOG_ERROR, "warning, too many b frames in a row\n");
2426 2427
            }

2428
            if(s->picture_in_gop_number + b_frames >= s->gop_size){
2429 2430 2431
              if((s->flags2 & CODEC_FLAG2_STRICT_GOP) && s->gop_size > s->picture_in_gop_number){
                    b_frames= s->gop_size - s->picture_in_gop_number - 1;
              }else{
2432 2433 2434
                if(s->flags & CODEC_FLAG_CLOSED_GOP)
                    b_frames=0;
                s->input_picture[b_frames]->pict_type= I_TYPE;
2435
              }
2436
            }
2437

2438 2439 2440 2441 2442
            if(   (s->flags & CODEC_FLAG_CLOSED_GOP)
               && b_frames
               && s->input_picture[b_frames]->pict_type== I_TYPE)
                b_frames--;

M
Michael Niedermayer 已提交
2443
            s->reordered_input_picture[0]= s->input_picture[b_frames];
2444
            if(s->reordered_input_picture[0]->pict_type != I_TYPE)
M
Michael Niedermayer 已提交
2445
                s->reordered_input_picture[0]->pict_type= P_TYPE;
M
Michael Niedermayer 已提交
2446
            s->reordered_input_picture[0]->coded_picture_number= s->coded_picture_number++;
M
Michael Niedermayer 已提交
2447 2448 2449
            for(i=0; i<b_frames; i++){
                s->reordered_input_picture[i+1]= s->input_picture[i];
                s->reordered_input_picture[i+1]->pict_type= B_TYPE;
M
Michael Niedermayer 已提交
2450
                s->reordered_input_picture[i+1]->coded_picture_number= s->coded_picture_number++;
2451 2452 2453
            }
        }
    }
M
Michael Niedermayer 已提交
2454
no_output_pic:
M
cleanup  
Michael Niedermayer 已提交
2455
    if(s->reordered_input_picture[0]){
M
Michael Niedermayer 已提交
2456
        s->reordered_input_picture[0]->reference= s->reordered_input_picture[0]->pict_type!=B_TYPE ? 3 : 0;
M
Michael Niedermayer 已提交
2457

2458
        copy_picture(&s->new_picture, s->reordered_input_picture[0]);
M
Michael Niedermayer 已提交
2459

2460
        if(s->reordered_input_picture[0]->type == FF_BUFFER_TYPE_SHARED || s->avctx->rc_buffer_size){
D
Diego Biurrun 已提交
2461
            // input is a shared pix, so we can't modifiy it -> alloc a new one & ensure that the shared one is reuseable
2462

M
Michael Niedermayer 已提交
2463
            int i= ff_find_unused_picture(s, 0);
M
Michael Niedermayer 已提交
2464 2465
            Picture *pic= &s->picture[i];

2466 2467 2468
            pic->reference              = s->reordered_input_picture[0]->reference;
            alloc_picture(s, pic, 0);

M
Michael Niedermayer 已提交
2469
            /* mark us unused / free shared pic */
2470 2471
            if(s->reordered_input_picture[0]->type == FF_BUFFER_TYPE_INTERNAL)
                s->avctx->release_buffer(s->avctx, (AVFrame*)s->reordered_input_picture[0]);
M
Michael Niedermayer 已提交
2472 2473 2474
            for(i=0; i<4; i++)
                s->reordered_input_picture[0]->data[i]= NULL;
            s->reordered_input_picture[0]->type= 0;
2475

2476 2477
            copy_picture_attributes(s, (AVFrame*)pic, (AVFrame*)s->reordered_input_picture[0]);

M
Michael Niedermayer 已提交
2478
            s->current_picture_ptr= pic;
M
Michael Niedermayer 已提交
2479
        }else{
M
Michael Niedermayer 已提交
2480 2481
            // input is not a shared pix -> reuse buffer for current_pix

2482
            assert(   s->reordered_input_picture[0]->type==FF_BUFFER_TYPE_USER
M
Michael Niedermayer 已提交
2483
                   || s->reordered_input_picture[0]->type==FF_BUFFER_TYPE_INTERNAL);
2484

M
Michael Niedermayer 已提交
2485
            s->current_picture_ptr= s->reordered_input_picture[0];
M
Michael Niedermayer 已提交
2486
            for(i=0; i<4; i++){
M
Michael Niedermayer 已提交
2487
                s->new_picture.data[i]+= INPLACE_OFFSET;
M
Michael Niedermayer 已提交
2488
            }
M
cleanup  
Michael Niedermayer 已提交
2489
        }
2490
        copy_picture(&s->current_picture, s->current_picture_ptr);
2491

M
cleanup  
Michael Niedermayer 已提交
2492 2493 2494 2495
        s->picture_number= s->new_picture.display_picture_number;
//printf("dpn:%d\n", s->picture_number);
    }else{
       memset(&s->new_picture, 0, sizeof(Picture));
2496 2497 2498
    }
}

F
Fabrice Bellard 已提交
2499 2500 2501 2502
int MPV_encode_picture(AVCodecContext *avctx,
                       unsigned char *buf, int buf_size, void *data)
{
    MpegEncContext *s = avctx->priv_data;
M
Michael Niedermayer 已提交
2503
    AVFrame *pic_arg = data;
2504
    int i, stuffing_count;
F
Fabrice Bellard 已提交
2505

2506
    for(i=0; i<avctx->thread_count; i++){
M
Michael Niedermayer 已提交
2507 2508
        int start_y= s->thread_context[i]->start_mb_y;
        int   end_y= s->thread_context[i]->  end_mb_y;
2509
        int h= s->mb_height;
2510 2511
        uint8_t *start= buf + (size_t)(((int64_t) buf_size)*start_y/h);
        uint8_t *end  = buf + (size_t)(((int64_t) buf_size)*  end_y/h);
2512 2513 2514

        init_put_bits(&s->thread_context[i]->pb, start, end - start);
    }
F
Fabrice Bellard 已提交
2515

M
cleanup  
Michael Niedermayer 已提交
2516
    s->picture_in_gop_number++;
F
Fabrice Bellard 已提交
2517

2518 2519
    if(load_input_picture(s, pic_arg) < 0)
        return -1;
2520

M
cleanup  
Michael Niedermayer 已提交
2521
    select_input_picture(s);
2522

2523
    /* output? */
M
cleanup  
Michael Niedermayer 已提交
2524 2525 2526 2527
    if(s->new_picture.data[0]){
        s->pict_type= s->new_picture.pict_type;
//emms_c();
//printf("qs:%f %f %d\n", s->new_picture.quality, s->current_picture.quality, s->qscale);
2528
        MPV_frame_start(s, avctx);
2529
vbv_retry:
2530 2531
        if (encode_picture(s, s->picture_number) < 0)
            return -1;
2532

J
Juanjo 已提交
2533
        avctx->real_pict_num  = s->picture_number;
2534 2535 2536 2537 2538 2539
        avctx->header_bits = s->header_bits;
        avctx->mv_bits     = s->mv_bits;
        avctx->misc_bits   = s->misc_bits;
        avctx->i_tex_bits  = s->i_tex_bits;
        avctx->p_tex_bits  = s->p_tex_bits;
        avctx->i_count     = s->i_count;
2540
        avctx->p_count     = s->mb_num - s->i_count - s->skip_count; //FIXME f/b_count in avctx
2541 2542 2543 2544
        avctx->skip_count  = s->skip_count;

        MPV_frame_end(s);

2545
        if (ENABLE_MJPEG_ENCODER && s->out_format == FMT_MJPEG)
2546
            mjpeg_picture_trailer(s);
2547

2548 2549 2550 2551
        if(avctx->rc_buffer_size){
            RateControlContext *rcc= &s->rc_context;
            int max_size= rcc->buffer_index/3;

2552
            if(put_bits_count(&s->pb) > max_size && s->lambda < s->avctx->lmax){
M
Michael Niedermayer 已提交
2553
                s->next_lambda= FFMAX(s->lambda+1, s->lambda*(s->qscale+1) / s->qscale);
2554 2555
                if(s->adaptive_quant){
                    int i;
M
Michael Niedermayer 已提交
2556
                    for(i=0; i<s->mb_height*s->mb_stride; i++)
2557 2558
                        s->lambda_table[i]= FFMAX(s->lambda_table[i]+1, s->lambda_table[i]*(s->qscale+1) / s->qscale);
                }
2559 2560 2561 2562 2563
                s->mb_skipped = 0;        //done in MPV_frame_start()
                if(s->pict_type==P_TYPE){ //done in encode_picture() so we must undo it
                    if(s->flipflop_rounding || s->codec_id == CODEC_ID_H263P || s->codec_id == CODEC_ID_MPEG4)
                        s->no_rounding ^= 1;
                }
M
Michael Niedermayer 已提交
2564 2565 2566 2567
                if(s->pict_type!=B_TYPE){
                    s->time_base= s->last_time_base;
                    s->last_non_b_time= s->time - s->pp_time;
                }
2568 2569 2570 2571 2572 2573 2574 2575 2576 2577 2578
//                av_log(NULL, AV_LOG_ERROR, "R:%d ", s->next_lambda);
                for(i=0; i<avctx->thread_count; i++){
                    PutBitContext *pb= &s->thread_context[i]->pb;
                    init_put_bits(pb, pb->buf, pb->buf_end - pb->buf);
                }
                goto vbv_retry;
            }

            assert(s->avctx->rc_max_rate);
        }

2579 2580
        if(s->flags&CODEC_FLAG_PASS1)
            ff_write_pass1_stats(s);
M
Michael Niedermayer 已提交
2581 2582

        for(i=0; i<4; i++){
2583
            s->current_picture_ptr->error[i]= s->current_picture.error[i];
M
Michael Niedermayer 已提交
2584 2585
            avctx->error[i] += s->current_picture_ptr->error[i];
        }
2586

2587 2588
        if(s->flags&CODEC_FLAG_PASS1)
            assert(avctx->header_bits + avctx->mv_bits + avctx->misc_bits + avctx->i_tex_bits + avctx->p_tex_bits == put_bits_count(&s->pb));
2589
        flush_put_bits(&s->pb);
2590
        s->frame_bits  = put_bits_count(&s->pb);
M
Michael Niedermayer 已提交
2591

M
Michael Niedermayer 已提交
2592 2593
        stuffing_count= ff_vbv_update(s, s->frame_bits);
        if(stuffing_count){
2594 2595 2596 2597 2598
            if(s->pb.buf_end - s->pb.buf - (put_bits_count(&s->pb)>>3) < stuffing_count + 50){
                av_log(s->avctx, AV_LOG_ERROR, "stuffing too large\n");
                return -1;
            }

M
Michael Niedermayer 已提交
2599 2600 2601 2602 2603 2604 2605 2606 2607 2608 2609 2610 2611 2612 2613 2614 2615 2616 2617
            switch(s->codec_id){
            case CODEC_ID_MPEG1VIDEO:
            case CODEC_ID_MPEG2VIDEO:
                while(stuffing_count--){
                    put_bits(&s->pb, 8, 0);
                }
            break;
            case CODEC_ID_MPEG4:
                put_bits(&s->pb, 16, 0);
                put_bits(&s->pb, 16, 0x1C3);
                stuffing_count -= 4;
                while(stuffing_count--){
                    put_bits(&s->pb, 8, 0xFF);
                }
            break;
            default:
                av_log(s->avctx, AV_LOG_ERROR, "vbv buffer overflow\n");
            }
            flush_put_bits(&s->pb);
2618
            s->frame_bits  = put_bits_count(&s->pb);
M
Michael Niedermayer 已提交
2619
        }
M
Michael Niedermayer 已提交
2620

2621
        /* update mpeg1/2 vbv_delay for CBR */
2622 2623
        if(s->avctx->rc_max_rate && s->avctx->rc_min_rate == s->avctx->rc_max_rate && s->out_format == FMT_MPEG1
           && 90000LL * (avctx->rc_buffer_size-1) <= s->avctx->rc_max_rate*0xFFFFLL){
M
Michael Niedermayer 已提交
2624
            int vbv_delay;
M
Michael Niedermayer 已提交
2625

M
Michael Niedermayer 已提交
2626
            assert(s->repeat_first_field==0);
2627

M
Michael Niedermayer 已提交
2628 2629 2630 2631 2632 2633 2634 2635 2636 2637 2638 2639 2640 2641
            vbv_delay= lrintf(90000 * s->rc_context.buffer_index / s->avctx->rc_max_rate);
            assert(vbv_delay < 0xFFFF);

            s->vbv_delay_ptr[0] &= 0xF8;
            s->vbv_delay_ptr[0] |= vbv_delay>>13;
            s->vbv_delay_ptr[1]  = vbv_delay>>5;
            s->vbv_delay_ptr[2] &= 0x07;
            s->vbv_delay_ptr[2] |= vbv_delay<<3;
        }
        s->total_bits += s->frame_bits;
        avctx->frame_bits  = s->frame_bits;
    }else{
        assert((pbBufPtr(&s->pb) == s->pb.buf));
        s->frame_bits=0;
M
Michael Niedermayer 已提交
2642
    }
M
Michael Niedermayer 已提交
2643
    assert((s->frame_bits&7)==0);
2644

2645
    return s->frame_bits/8;
F
Fabrice Bellard 已提交
2646 2647
}

2648 2649
#endif //CONFIG_ENCODERS

M
Michael Niedermayer 已提交
2650
static inline void gmc1_motion(MpegEncContext *s,
2651
                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
2652
                               uint8_t **ref_picture)
M
Michael Niedermayer 已提交
2653
{
2654
    uint8_t *ptr;
M
Michael Niedermayer 已提交
2655
    int offset, src_x, src_y, linesize, uvlinesize;
M
Michael Niedermayer 已提交
2656
    int motion_x, motion_y;
M
Michael Niedermayer 已提交
2657
    int emu=0;
M
Michael Niedermayer 已提交
2658 2659 2660 2661 2662 2663 2664

    motion_x= s->sprite_offset[0][0];
    motion_y= s->sprite_offset[0][1];
    src_x = s->mb_x * 16 + (motion_x >> (s->sprite_warping_accuracy+1));
    src_y = s->mb_y * 16 + (motion_y >> (s->sprite_warping_accuracy+1));
    motion_x<<=(3-s->sprite_warping_accuracy);
    motion_y<<=(3-s->sprite_warping_accuracy);
2665
    src_x = av_clip(src_x, -16, s->width);
M
Michael Niedermayer 已提交
2666 2667
    if (src_x == s->width)
        motion_x =0;
2668
    src_y = av_clip(src_y, -16, s->height);
M
Michael Niedermayer 已提交
2669 2670
    if (src_y == s->height)
        motion_y =0;
2671

M
Michael Niedermayer 已提交
2672
    linesize = s->linesize;
M
Michael Niedermayer 已提交
2673
    uvlinesize = s->uvlinesize;
2674

2675
    ptr = ref_picture[0] + (src_y * linesize) + src_x;
M
Michael Niedermayer 已提交
2676

M
Michael Niedermayer 已提交
2677
    if(s->flags&CODEC_FLAG_EMU_EDGE){
2678 2679
        if(   (unsigned)src_x >= s->h_edge_pos - 17
           || (unsigned)src_y >= s->v_edge_pos - 17){
2680
            ff_emulated_edge_mc(s->edge_emu_buffer, ptr, linesize, 17, 17, src_x, src_y, s->h_edge_pos, s->v_edge_pos);
M
Michael Niedermayer 已提交
2681 2682 2683
            ptr= s->edge_emu_buffer;
        }
    }
2684

2685
    if((motion_x|motion_y)&7){
2686 2687
        s->dsp.gmc1(dest_y  , ptr  , linesize, 16, motion_x&15, motion_y&15, 128 - s->no_rounding);
        s->dsp.gmc1(dest_y+8, ptr+8, linesize, 16, motion_x&15, motion_y&15, 128 - s->no_rounding);
2688 2689
    }else{
        int dxy;
2690

2691 2692
        dxy= ((motion_x>>3)&1) | ((motion_y>>2)&2);
        if (s->no_rounding){
2693
            s->dsp.put_no_rnd_pixels_tab[0][dxy](dest_y, ptr, linesize, 16);
2694
        }else{
2695 2696
            s->dsp.put_pixels_tab       [0][dxy](dest_y, ptr, linesize, 16);
        }
2697
    }
2698

2699
    if(s->flags&CODEC_FLAG_GRAY) return;
M
Michael Niedermayer 已提交
2700 2701 2702 2703 2704 2705 2706

    motion_x= s->sprite_offset[1][0];
    motion_y= s->sprite_offset[1][1];
    src_x = s->mb_x * 8 + (motion_x >> (s->sprite_warping_accuracy+1));
    src_y = s->mb_y * 8 + (motion_y >> (s->sprite_warping_accuracy+1));
    motion_x<<=(3-s->sprite_warping_accuracy);
    motion_y<<=(3-s->sprite_warping_accuracy);
2707
    src_x = av_clip(src_x, -8, s->width>>1);
M
Michael Niedermayer 已提交
2708 2709
    if (src_x == s->width>>1)
        motion_x =0;
2710
    src_y = av_clip(src_y, -8, s->height>>1);
M
Michael Niedermayer 已提交
2711 2712 2713
    if (src_y == s->height>>1)
        motion_y =0;

2714
    offset = (src_y * uvlinesize) + src_x;
M
Michael Niedermayer 已提交
2715
    ptr = ref_picture[1] + offset;
2716
    if(s->flags&CODEC_FLAG_EMU_EDGE){
2717 2718
        if(   (unsigned)src_x >= (s->h_edge_pos>>1) - 9
           || (unsigned)src_y >= (s->v_edge_pos>>1) - 9){
2719
            ff_emulated_edge_mc(s->edge_emu_buffer, ptr, uvlinesize, 9, 9, src_x, src_y, s->h_edge_pos>>1, s->v_edge_pos>>1);
2720 2721 2722
            ptr= s->edge_emu_buffer;
            emu=1;
        }
M
Michael Niedermayer 已提交
2723
    }
2724
    s->dsp.gmc1(dest_cb, ptr, uvlinesize, 8, motion_x&15, motion_y&15, 128 - s->no_rounding);
2725

M
Michael Niedermayer 已提交
2726
    ptr = ref_picture[2] + offset;
M
Michael Niedermayer 已提交
2727
    if(emu){
2728
        ff_emulated_edge_mc(s->edge_emu_buffer, ptr, uvlinesize, 9, 9, src_x, src_y, s->h_edge_pos>>1, s->v_edge_pos>>1);
M
Michael Niedermayer 已提交
2729 2730
        ptr= s->edge_emu_buffer;
    }
2731
    s->dsp.gmc1(dest_cr, ptr, uvlinesize, 8, motion_x&15, motion_y&15, 128 - s->no_rounding);
2732

M
Michael Niedermayer 已提交
2733 2734 2735
    return;
}

2736
static inline void gmc_motion(MpegEncContext *s,
2737
                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
2738
                               uint8_t **ref_picture)
2739
{
2740
    uint8_t *ptr;
2741 2742 2743 2744 2745 2746 2747
    int linesize, uvlinesize;
    const int a= s->sprite_warping_accuracy;
    int ox, oy;

    linesize = s->linesize;
    uvlinesize = s->uvlinesize;

2748
    ptr = ref_picture[0];
2749 2750 2751 2752

    ox= s->sprite_offset[0][0] + s->sprite_delta[0][0]*s->mb_x*16 + s->sprite_delta[0][1]*s->mb_y*16;
    oy= s->sprite_offset[0][1] + s->sprite_delta[1][0]*s->mb_x*16 + s->sprite_delta[1][1]*s->mb_y*16;

2753
    s->dsp.gmc(dest_y, ptr, linesize, 16,
2754 2755
           ox,
           oy,
2756
           s->sprite_delta[0][0], s->sprite_delta[0][1],
2757
           s->sprite_delta[1][0], s->sprite_delta[1][1],
2758 2759
           a+1, (1<<(2*a+1)) - s->no_rounding,
           s->h_edge_pos, s->v_edge_pos);
2760
    s->dsp.gmc(dest_y+8, ptr, linesize, 16,
2761 2762
           ox + s->sprite_delta[0][0]*8,
           oy + s->sprite_delta[1][0]*8,
2763
           s->sprite_delta[0][0], s->sprite_delta[0][1],
2764
           s->sprite_delta[1][0], s->sprite_delta[1][1],
2765 2766 2767 2768 2769 2770 2771 2772
           a+1, (1<<(2*a+1)) - s->no_rounding,
           s->h_edge_pos, s->v_edge_pos);

    if(s->flags&CODEC_FLAG_GRAY) return;

    ox= s->sprite_offset[1][0] + s->sprite_delta[0][0]*s->mb_x*8 + s->sprite_delta[0][1]*s->mb_y*8;
    oy= s->sprite_offset[1][1] + s->sprite_delta[1][0]*s->mb_x*8 + s->sprite_delta[1][1]*s->mb_y*8;

2773
    ptr = ref_picture[1];
2774
    s->dsp.gmc(dest_cb, ptr, uvlinesize, 8,
2775 2776
           ox,
           oy,
2777
           s->sprite_delta[0][0], s->sprite_delta[0][1],
2778
           s->sprite_delta[1][0], s->sprite_delta[1][1],
2779 2780
           a+1, (1<<(2*a+1)) - s->no_rounding,
           s->h_edge_pos>>1, s->v_edge_pos>>1);
2781

2782
    ptr = ref_picture[2];
2783
    s->dsp.gmc(dest_cr, ptr, uvlinesize, 8,
2784 2785
           ox,
           oy,
2786
           s->sprite_delta[0][0], s->sprite_delta[0][1],
2787
           s->sprite_delta[1][0], s->sprite_delta[1][1],
2788 2789 2790 2791
           a+1, (1<<(2*a+1)) - s->no_rounding,
           s->h_edge_pos>>1, s->v_edge_pos>>1);
}

2792 2793 2794 2795 2796 2797 2798 2799 2800 2801 2802 2803
/**
 * Copies a rectangular area of samples to a temporary buffer and replicates the boarder samples.
 * @param buf destination buffer
 * @param src source buffer
 * @param linesize number of bytes between 2 vertically adjacent samples in both the source and destination buffers
 * @param block_w width of block
 * @param block_h height of block
 * @param src_x x coordinate of the top left sample of the block in the source buffer
 * @param src_y y coordinate of the top left sample of the block in the source buffer
 * @param w width of the source buffer
 * @param h height of the source buffer
 */
2804
void ff_emulated_edge_mc(uint8_t *buf, uint8_t *src, int linesize, int block_w, int block_h,
2805 2806 2807
                                    int src_x, int src_y, int w, int h){
    int x, y;
    int start_y, start_x, end_y, end_x;
2808

2809 2810 2811
    if(src_y>= h){
        src+= (h-1-src_y)*linesize;
        src_y=h-1;
M
Michael Niedermayer 已提交
2812 2813 2814
    }else if(src_y<=-block_h){
        src+= (1-block_h-src_y)*linesize;
        src_y=1-block_h;
2815 2816 2817 2818
    }
    if(src_x>= w){
        src+= (w-1-src_x);
        src_x=w-1;
M
Michael Niedermayer 已提交
2819 2820 2821
    }else if(src_x<=-block_w){
        src+= (1-block_w-src_x);
        src_x=1-block_w;
2822 2823
    }

M
Michael Niedermayer 已提交
2824 2825 2826 2827
    start_y= FFMAX(0, -src_y);
    start_x= FFMAX(0, -src_x);
    end_y= FFMIN(block_h, h-src_y);
    end_x= FFMIN(block_w, w-src_x);
M
Michael Niedermayer 已提交
2828

2829 2830 2831 2832 2833 2834 2835 2836 2837 2838 2839 2840 2841 2842 2843 2844 2845 2846 2847 2848
    // copy existing part
    for(y=start_y; y<end_y; y++){
        for(x=start_x; x<end_x; x++){
            buf[x + y*linesize]= src[x + y*linesize];
        }
    }

    //top
    for(y=0; y<start_y; y++){
        for(x=start_x; x<end_x; x++){
            buf[x + y*linesize]= buf[x + start_y*linesize];
        }
    }

    //bottom
    for(y=end_y; y<block_h; y++){
        for(x=start_x; x<end_x; x++){
            buf[x + y*linesize]= buf[x + (end_y-1)*linesize];
        }
    }
2849

2850 2851 2852 2853 2854
    for(y=0; y<block_h; y++){
       //left
        for(x=0; x<start_x; x++){
            buf[x + y*linesize]= buf[start_x + y*linesize];
        }
2855

2856 2857 2858 2859 2860 2861 2862
       //right
        for(x=end_x; x<block_w; x++){
            buf[x + y*linesize]= buf[end_x - 1 + y*linesize];
        }
    }
}

2863
static inline int hpel_motion(MpegEncContext *s,
2864 2865
                                  uint8_t *dest, uint8_t *src,
                                  int field_based, int field_select,
M
Michael Niedermayer 已提交
2866 2867 2868 2869 2870 2871 2872 2873 2874 2875 2876 2877
                                  int src_x, int src_y,
                                  int width, int height, int stride,
                                  int h_edge_pos, int v_edge_pos,
                                  int w, int h, op_pixels_func *pix_op,
                                  int motion_x, int motion_y)
{
    int dxy;
    int emu=0;

    dxy = ((motion_y & 1) << 1) | (motion_x & 1);
    src_x += motion_x >> 1;
    src_y += motion_y >> 1;
2878

M
Michael Niedermayer 已提交
2879
    /* WARNING: do no forget half pels */
2880
    src_x = av_clip(src_x, -16, width); //FIXME unneeded for emu?
M
Michael Niedermayer 已提交
2881 2882
    if (src_x == width)
        dxy &= ~1;
2883
    src_y = av_clip(src_y, -16, height);
M
Michael Niedermayer 已提交
2884 2885 2886 2887 2888 2889 2890
    if (src_y == height)
        dxy &= ~2;
    src += src_y * stride + src_x;

    if(s->unrestricted_mv && (s->flags&CODEC_FLAG_EMU_EDGE)){
        if(   (unsigned)src_x > h_edge_pos - (motion_x&1) - w
           || (unsigned)src_y > v_edge_pos - (motion_y&1) - h){
2891 2892
            ff_emulated_edge_mc(s->edge_emu_buffer, src, s->linesize, w+1, (h+1)<<field_based,
                             src_x, src_y<<field_based, h_edge_pos, s->v_edge_pos);
M
Michael Niedermayer 已提交
2893 2894 2895 2896
            src= s->edge_emu_buffer;
            emu=1;
        }
    }
2897 2898
    if(field_select)
        src += s->linesize;
M
Michael Niedermayer 已提交
2899 2900 2901
    pix_op[dxy](dest, src, stride, h);
    return emu;
}
2902

2903
static inline int hpel_motion_lowres(MpegEncContext *s,
M
Michael Niedermayer 已提交
2904 2905 2906 2907 2908 2909 2910 2911 2912 2913 2914 2915 2916 2917 2918 2919 2920 2921 2922 2923 2924 2925
                                  uint8_t *dest, uint8_t *src,
                                  int field_based, int field_select,
                                  int src_x, int src_y,
                                  int width, int height, int stride,
                                  int h_edge_pos, int v_edge_pos,
                                  int w, int h, h264_chroma_mc_func *pix_op,
                                  int motion_x, int motion_y)
{
    const int lowres= s->avctx->lowres;
    const int s_mask= (2<<lowres)-1;
    int emu=0;
    int sx, sy;

    if(s->quarter_sample){
        motion_x/=2;
        motion_y/=2;
    }

    sx= motion_x & s_mask;
    sy= motion_y & s_mask;
    src_x += motion_x >> (lowres+1);
    src_y += motion_y >> (lowres+1);
2926

M
Michael Niedermayer 已提交
2927 2928 2929 2930 2931 2932 2933 2934 2935 2936 2937 2938 2939 2940 2941 2942 2943 2944
    src += src_y * stride + src_x;

    if(   (unsigned)src_x > h_edge_pos                 - (!!sx) - w
       || (unsigned)src_y >(v_edge_pos >> field_based) - (!!sy) - h){
        ff_emulated_edge_mc(s->edge_emu_buffer, src, s->linesize, w+1, (h+1)<<field_based,
                            src_x, src_y<<field_based, h_edge_pos, v_edge_pos);
        src= s->edge_emu_buffer;
        emu=1;
    }

    sx <<= 2 - lowres;
    sy <<= 2 - lowres;
    if(field_select)
        src += s->linesize;
    pix_op[lowres](dest, src, stride, h, sx, sy);
    return emu;
}

F
Fabrice Bellard 已提交
2945
/* apply one mpeg motion vector to the three components */
2946
static av_always_inline void mpeg_motion(MpegEncContext *s,
2947
                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
2948 2949
                               int field_based, int bottom_field, int field_select,
                               uint8_t **ref_picture, op_pixels_func (*pix_op)[4],
F
Fabrice Bellard 已提交
2950 2951
                               int motion_x, int motion_y, int h)
{
2952 2953
    uint8_t *ptr_y, *ptr_cb, *ptr_cr;
    int dxy, uvdxy, mx, my, src_x, src_y, uvsrc_x, uvsrc_y, v_edge_pos, uvlinesize, linesize;
2954 2955

#if 0
M
Michael Niedermayer 已提交
2956 2957 2958 2959 2960
if(s->quarter_sample)
{
    motion_x>>=1;
    motion_y>>=1;
}
M
Michael Niedermayer 已提交
2961
#endif
M
Michael Niedermayer 已提交
2962

2963
    v_edge_pos = s->v_edge_pos >> field_based;
2964
    linesize   = s->current_picture.linesize[0] << field_based;
M
Michael Niedermayer 已提交
2965
    uvlinesize = s->current_picture.linesize[1] << field_based;
2966

2967 2968
    dxy = ((motion_y & 1) << 1) | (motion_x & 1);
    src_x = s->mb_x* 16               + (motion_x >> 1);
2969
    src_y =(s->mb_y<<(4-field_based)) + (motion_y >> 1);
M
Michael Niedermayer 已提交
2970

F
Fabrice Bellard 已提交
2971
    if (s->out_format == FMT_H263) {
2972 2973 2974 2975 2976
        if((s->workaround_bugs & FF_BUG_HPEL_CHROMA) && field_based){
            mx = (motion_x>>1)|(motion_x&1);
            my = motion_y >>1;
            uvdxy = ((my & 1) << 1) | (mx & 1);
            uvsrc_x = s->mb_x* 8               + (mx >> 1);
2977
            uvsrc_y = (s->mb_y<<(3-field_based)) + (my >> 1);
2978 2979 2980 2981 2982
        }else{
            uvdxy = dxy | (motion_y & 2) | ((motion_x & 2) >> 1);
            uvsrc_x = src_x>>1;
            uvsrc_y = src_y>>1;
        }
2983 2984 2985 2986 2987 2988
    }else if(s->out_format == FMT_H261){//even chroma mv's are full pel in H261
        mx = motion_x / 4;
        my = motion_y / 4;
        uvdxy = 0;
        uvsrc_x = s->mb_x*8 + mx;
        uvsrc_y = s->mb_y*8 + my;
F
Fabrice Bellard 已提交
2989
    } else {
2990 2991 2992 2993 2994 2995 2996 2997 2998 2999 3000 3001 3002 3003 3004 3005 3006 3007 3008 3009
        if(s->chroma_y_shift){
            mx = motion_x / 2;
            my = motion_y / 2;
            uvdxy = ((my & 1) << 1) | (mx & 1);
            uvsrc_x = s->mb_x* 8               + (mx >> 1);
            uvsrc_y = (s->mb_y<<(3-field_based)) + (my >> 1);
        } else {
            if(s->chroma_x_shift){
            //Chroma422
                mx = motion_x / 2;
                uvdxy = ((motion_y & 1) << 1) | (mx & 1);
                uvsrc_x = s->mb_x* 8           + (mx >> 1);
                uvsrc_y = src_y;
            } else {
            //Chroma444
                uvdxy = dxy;
                uvsrc_x = src_x;
                uvsrc_y = src_y;
            }
        }
F
Fabrice Bellard 已提交
3010
    }
3011 3012 3013 3014 3015 3016 3017

    ptr_y  = ref_picture[0] + src_y * linesize + src_x;
    ptr_cb = ref_picture[1] + uvsrc_y * uvlinesize + uvsrc_x;
    ptr_cr = ref_picture[2] + uvsrc_y * uvlinesize + uvsrc_x;

    if(   (unsigned)src_x > s->h_edge_pos - (motion_x&1) - 16
       || (unsigned)src_y >    v_edge_pos - (motion_y&1) - h){
3018 3019 3020 3021 3022
            if(s->codec_id == CODEC_ID_MPEG2VIDEO ||
               s->codec_id == CODEC_ID_MPEG1VIDEO){
                av_log(s->avctx,AV_LOG_DEBUG,"MPEG motion vector out of boundary\n");
                return ;
            }
3023 3024 3025 3026
            ff_emulated_edge_mc(s->edge_emu_buffer, ptr_y, s->linesize, 17, 17+field_based,
                             src_x, src_y<<field_based, s->h_edge_pos, s->v_edge_pos);
            ptr_y = s->edge_emu_buffer;
            if(!(s->flags&CODEC_FLAG_GRAY)){
M
10l  
Michael Niedermayer 已提交
3027
                uint8_t *uvbuf= s->edge_emu_buffer+18*s->linesize;
3028
                ff_emulated_edge_mc(uvbuf  , ptr_cb, s->uvlinesize, 9, 9+field_based,
3029
                                 uvsrc_x, uvsrc_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
3030
                ff_emulated_edge_mc(uvbuf+16, ptr_cr, s->uvlinesize, 9, 9+field_based,
3031 3032 3033 3034
                                 uvsrc_x, uvsrc_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
                ptr_cb= uvbuf;
                ptr_cr= uvbuf+16;
            }
3035 3036
    }

3037 3038 3039 3040 3041 3042 3043 3044 3045 3046 3047 3048 3049
    if(bottom_field){ //FIXME use this for field pix too instead of the obnoxious hack which changes picture.data
        dest_y += s->linesize;
        dest_cb+= s->uvlinesize;
        dest_cr+= s->uvlinesize;
    }

    if(field_select){
        ptr_y += s->linesize;
        ptr_cb+= s->uvlinesize;
        ptr_cr+= s->uvlinesize;
    }

    pix_op[0][dxy](dest_y, ptr_y, linesize, h);
3050

3051
    if(!(s->flags&CODEC_FLAG_GRAY)){
3052 3053
        pix_op[s->chroma_x_shift][uvdxy](dest_cb, ptr_cb, uvlinesize, h >> s->chroma_y_shift);
        pix_op[s->chroma_x_shift][uvdxy](dest_cr, ptr_cr, uvlinesize, h >> s->chroma_y_shift);
3054
    }
3055
    if((ENABLE_H261_ENCODER || ENABLE_H261_DECODER) && s->out_format == FMT_H261){
M
Michael Niedermayer 已提交
3056 3057
        ff_h261_loop_filter(s);
    }
F
Fabrice Bellard 已提交
3058
}
M
Michael Niedermayer 已提交
3059 3060

/* apply one mpeg motion vector to the three components */
3061
static av_always_inline void mpeg_motion_lowres(MpegEncContext *s,
M
Michael Niedermayer 已提交
3062 3063 3064 3065 3066 3067 3068 3069 3070 3071 3072 3073 3074 3075 3076
                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
                               int field_based, int bottom_field, int field_select,
                               uint8_t **ref_picture, h264_chroma_mc_func *pix_op,
                               int motion_x, int motion_y, int h)
{
    uint8_t *ptr_y, *ptr_cb, *ptr_cr;
    int mx, my, src_x, src_y, uvsrc_x, uvsrc_y, uvlinesize, linesize, sx, sy, uvsx, uvsy;
    const int lowres= s->avctx->lowres;
    const int block_s= 8>>lowres;
    const int s_mask= (2<<lowres)-1;
    const int h_edge_pos = s->h_edge_pos >> lowres;
    const int v_edge_pos = s->v_edge_pos >> lowres;
    linesize   = s->current_picture.linesize[0] << field_based;
    uvlinesize = s->current_picture.linesize[1] << field_based;

3077 3078 3079 3080
    if(s->quarter_sample){ //FIXME obviously not perfect but qpel wont work in lowres anyway
        motion_x/=2;
        motion_y/=2;
    }
3081

3082 3083 3084 3085
    if(field_based){
        motion_y += (bottom_field - field_select)*((1<<lowres)-1);
    }

M
Michael Niedermayer 已提交
3086 3087 3088
    sx= motion_x & s_mask;
    sy= motion_y & s_mask;
    src_x = s->mb_x*2*block_s               + (motion_x >> (lowres+1));
3089
    src_y =(s->mb_y*2*block_s>>field_based) + (motion_y >> (lowres+1));
3090

M
Michael Niedermayer 已提交
3091
    if (s->out_format == FMT_H263) {
M
Michael Niedermayer 已提交
3092 3093
        uvsx = ((motion_x>>1) & s_mask) | (sx&1);
        uvsy = ((motion_y>>1) & s_mask) | (sy&1);
M
Michael Niedermayer 已提交
3094 3095 3096 3097 3098 3099 3100 3101 3102 3103 3104 3105 3106 3107 3108
        uvsrc_x = src_x>>1;
        uvsrc_y = src_y>>1;
    }else if(s->out_format == FMT_H261){//even chroma mv's are full pel in H261
        mx = motion_x / 4;
        my = motion_y / 4;
        uvsx = (2*mx) & s_mask;
        uvsy = (2*my) & s_mask;
        uvsrc_x = s->mb_x*block_s               + (mx >> lowres);
        uvsrc_y = s->mb_y*block_s               + (my >> lowres);
    } else {
        mx = motion_x / 2;
        my = motion_y / 2;
        uvsx = mx & s_mask;
        uvsy = my & s_mask;
        uvsrc_x = s->mb_x*block_s               + (mx >> (lowres+1));
3109
        uvsrc_y =(s->mb_y*block_s>>field_based) + (my >> (lowres+1));
M
Michael Niedermayer 已提交
3110 3111 3112 3113 3114 3115 3116 3117 3118 3119 3120 3121 3122
    }

    ptr_y  = ref_picture[0] + src_y * linesize + src_x;
    ptr_cb = ref_picture[1] + uvsrc_y * uvlinesize + uvsrc_x;
    ptr_cr = ref_picture[2] + uvsrc_y * uvlinesize + uvsrc_x;

    if(   (unsigned)src_x > h_edge_pos                 - (!!sx) - 2*block_s
       || (unsigned)src_y >(v_edge_pos >> field_based) - (!!sy) - h){
            ff_emulated_edge_mc(s->edge_emu_buffer, ptr_y, s->linesize, 17, 17+field_based,
                             src_x, src_y<<field_based, h_edge_pos, v_edge_pos);
            ptr_y = s->edge_emu_buffer;
            if(!(s->flags&CODEC_FLAG_GRAY)){
                uint8_t *uvbuf= s->edge_emu_buffer+18*s->linesize;
3123
                ff_emulated_edge_mc(uvbuf  , ptr_cb, s->uvlinesize, 9, 9+field_based,
M
Michael Niedermayer 已提交
3124
                                 uvsrc_x, uvsrc_y<<field_based, h_edge_pos>>1, v_edge_pos>>1);
3125
                ff_emulated_edge_mc(uvbuf+16, ptr_cr, s->uvlinesize, 9, 9+field_based,
M
Michael Niedermayer 已提交
3126 3127 3128 3129 3130 3131
                                 uvsrc_x, uvsrc_y<<field_based, h_edge_pos>>1, v_edge_pos>>1);
                ptr_cb= uvbuf;
                ptr_cr= uvbuf+16;
            }
    }

3132 3133 3134 3135 3136 3137 3138 3139 3140 3141 3142 3143
    if(bottom_field){ //FIXME use this for field pix too instead of the obnoxious hack which changes picture.data
        dest_y += s->linesize;
        dest_cb+= s->uvlinesize;
        dest_cr+= s->uvlinesize;
    }

    if(field_select){
        ptr_y += s->linesize;
        ptr_cb+= s->uvlinesize;
        ptr_cr+= s->uvlinesize;
    }

M
Michael Niedermayer 已提交
3144 3145 3146
    sx <<= 2 - lowres;
    sy <<= 2 - lowres;
    pix_op[lowres-1](dest_y, ptr_y, linesize, h, sx, sy);
3147

M
Michael Niedermayer 已提交
3148 3149 3150 3151 3152 3153
    if(!(s->flags&CODEC_FLAG_GRAY)){
        uvsx <<= 2 - lowres;
        uvsy <<= 2 - lowres;
        pix_op[lowres](dest_cb, ptr_cb, uvlinesize, h >> s->chroma_y_shift, uvsx, uvsy);
        pix_op[lowres](dest_cr, ptr_cr, uvlinesize, h >> s->chroma_y_shift, uvsx, uvsy);
    }
M
Michael Niedermayer 已提交
3154
    //FIXME h261 lowres loop filter
M
Michael Niedermayer 已提交
3155 3156
}

M
Michael Niedermayer 已提交
3157 3158 3159 3160 3161 3162 3163 3164 3165 3166 3167 3168 3169 3170 3171
//FIXME move to dsputil, avg variant, 16x16 version
static inline void put_obmc(uint8_t *dst, uint8_t *src[5], int stride){
    int x;
    uint8_t * const top   = src[1];
    uint8_t * const left  = src[2];
    uint8_t * const mid   = src[0];
    uint8_t * const right = src[3];
    uint8_t * const bottom= src[4];
#define OBMC_FILTER(x, t, l, m, r, b)\
    dst[x]= (t*top[x] + l*left[x] + m*mid[x] + r*right[x] + b*bottom[x] + 4)>>3
#define OBMC_FILTER4(x, t, l, m, r, b)\
    OBMC_FILTER(x         , t, l, m, r, b);\
    OBMC_FILTER(x+1       , t, l, m, r, b);\
    OBMC_FILTER(x  +stride, t, l, m, r, b);\
    OBMC_FILTER(x+1+stride, t, l, m, r, b);
3172

M
Michael Niedermayer 已提交
3173 3174 3175 3176 3177 3178 3179 3180 3181 3182 3183 3184 3185 3186 3187 3188 3189 3190 3191 3192 3193 3194 3195 3196 3197 3198 3199 3200 3201 3202 3203 3204 3205 3206 3207 3208 3209 3210 3211 3212 3213 3214 3215 3216 3217 3218
    x=0;
    OBMC_FILTER (x  , 2, 2, 4, 0, 0);
    OBMC_FILTER (x+1, 2, 1, 5, 0, 0);
    OBMC_FILTER4(x+2, 2, 1, 5, 0, 0);
    OBMC_FILTER4(x+4, 2, 0, 5, 1, 0);
    OBMC_FILTER (x+6, 2, 0, 5, 1, 0);
    OBMC_FILTER (x+7, 2, 0, 4, 2, 0);
    x+= stride;
    OBMC_FILTER (x  , 1, 2, 5, 0, 0);
    OBMC_FILTER (x+1, 1, 2, 5, 0, 0);
    OBMC_FILTER (x+6, 1, 0, 5, 2, 0);
    OBMC_FILTER (x+7, 1, 0, 5, 2, 0);
    x+= stride;
    OBMC_FILTER4(x  , 1, 2, 5, 0, 0);
    OBMC_FILTER4(x+2, 1, 1, 6, 0, 0);
    OBMC_FILTER4(x+4, 1, 0, 6, 1, 0);
    OBMC_FILTER4(x+6, 1, 0, 5, 2, 0);
    x+= 2*stride;
    OBMC_FILTER4(x  , 0, 2, 5, 0, 1);
    OBMC_FILTER4(x+2, 0, 1, 6, 0, 1);
    OBMC_FILTER4(x+4, 0, 0, 6, 1, 1);
    OBMC_FILTER4(x+6, 0, 0, 5, 2, 1);
    x+= 2*stride;
    OBMC_FILTER (x  , 0, 2, 5, 0, 1);
    OBMC_FILTER (x+1, 0, 2, 5, 0, 1);
    OBMC_FILTER4(x+2, 0, 1, 5, 0, 2);
    OBMC_FILTER4(x+4, 0, 0, 5, 1, 2);
    OBMC_FILTER (x+6, 0, 0, 5, 2, 1);
    OBMC_FILTER (x+7, 0, 0, 5, 2, 1);
    x+= stride;
    OBMC_FILTER (x  , 0, 2, 4, 0, 2);
    OBMC_FILTER (x+1, 0, 1, 5, 0, 2);
    OBMC_FILTER (x+6, 0, 0, 5, 1, 2);
    OBMC_FILTER (x+7, 0, 0, 4, 2, 2);
}

/* obmc for 1 8x8 luma block */
static inline void obmc_motion(MpegEncContext *s,
                               uint8_t *dest, uint8_t *src,
                               int src_x, int src_y,
                               op_pixels_func *pix_op,
                               int16_t mv[5][2]/* mid top left right bottom*/)
#define MID    0
{
    int i;
    uint8_t *ptr[5];
3219

M
Michael Niedermayer 已提交
3220
    assert(s->quarter_sample==0);
3221

M
Michael Niedermayer 已提交
3222 3223 3224 3225
    for(i=0; i<5; i++){
        if(i && mv[i][0]==mv[MID][0] && mv[i][1]==mv[MID][1]){
            ptr[i]= ptr[MID];
        }else{
3226
            ptr[i]= s->obmc_scratchpad + 8*(i&1) + s->linesize*8*(i>>1);
3227
            hpel_motion(s, ptr[i], src, 0, 0,
M
Michael Niedermayer 已提交
3228 3229 3230 3231 3232 3233 3234 3235
                        src_x, src_y,
                        s->width, s->height, s->linesize,
                        s->h_edge_pos, s->v_edge_pos,
                        8, 8, pix_op,
                        mv[i][0], mv[i][1]);
        }
    }

3236
    put_obmc(dest, ptr, s->linesize);
M
Michael Niedermayer 已提交
3237
}
F
Fabrice Bellard 已提交
3238

M
Michael Niedermayer 已提交
3239
static inline void qpel_motion(MpegEncContext *s,
3240
                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
3241 3242
                               int field_based, int bottom_field, int field_select,
                               uint8_t **ref_picture, op_pixels_func (*pix_op)[4],
M
Michael Niedermayer 已提交
3243
                               qpel_mc_func (*qpix_op)[16],
M
Michael Niedermayer 已提交
3244 3245
                               int motion_x, int motion_y, int h)
{
3246 3247
    uint8_t *ptr_y, *ptr_cb, *ptr_cr;
    int dxy, uvdxy, mx, my, src_x, src_y, uvsrc_x, uvsrc_y, v_edge_pos, linesize, uvlinesize;
3248

M
Michael Niedermayer 已提交
3249
    dxy = ((motion_y & 3) << 2) | (motion_x & 3);
3250
    src_x = s->mb_x *  16                 + (motion_x >> 2);
M
Michael Niedermayer 已提交
3251 3252
    src_y = s->mb_y * (16 >> field_based) + (motion_y >> 2);

3253
    v_edge_pos = s->v_edge_pos >> field_based;
M
Michael Niedermayer 已提交
3254
    linesize = s->linesize << field_based;
3255
    uvlinesize = s->uvlinesize << field_based;
3256

3257 3258 3259
    if(field_based){
        mx= motion_x/2;
        my= motion_y>>1;
M
Michael Niedermayer 已提交
3260 3261 3262 3263
    }else if(s->workaround_bugs&FF_BUG_QPEL_CHROMA2){
        static const int rtab[8]= {0,0,1,1,0,0,0,1};
        mx= (motion_x>>1) + rtab[motion_x&7];
        my= (motion_y>>1) + rtab[motion_y&7];
M
Michael Niedermayer 已提交
3264
    }else if(s->workaround_bugs&FF_BUG_QPEL_CHROMA){
3265 3266 3267 3268 3269 3270 3271 3272
        mx= (motion_x>>1)|(motion_x&1);
        my= (motion_y>>1)|(motion_y&1);
    }else{
        mx= motion_x/2;
        my= motion_y/2;
    }
    mx= (mx>>1)|(mx&1);
    my= (my>>1)|(my&1);
M
Michael Niedermayer 已提交
3273

3274
    uvdxy= (mx&1) | ((my&1)<<1);
3275 3276
    mx>>=1;
    my>>=1;
M
Michael Niedermayer 已提交
3277

3278 3279 3280 3281 3282 3283 3284
    uvsrc_x = s->mb_x *  8                 + mx;
    uvsrc_y = s->mb_y * (8 >> field_based) + my;

    ptr_y  = ref_picture[0] +   src_y *   linesize +   src_x;
    ptr_cb = ref_picture[1] + uvsrc_y * uvlinesize + uvsrc_x;
    ptr_cr = ref_picture[2] + uvsrc_y * uvlinesize + uvsrc_x;

3285
    if(   (unsigned)src_x > s->h_edge_pos - (motion_x&3) - 16
3286
       || (unsigned)src_y >    v_edge_pos - (motion_y&3) - h  ){
3287
        ff_emulated_edge_mc(s->edge_emu_buffer, ptr_y, s->linesize, 17, 17+field_based,
3288 3289 3290
                         src_x, src_y<<field_based, s->h_edge_pos, s->v_edge_pos);
        ptr_y= s->edge_emu_buffer;
        if(!(s->flags&CODEC_FLAG_GRAY)){
M
10l  
Michael Niedermayer 已提交
3291
            uint8_t *uvbuf= s->edge_emu_buffer + 18*s->linesize;
3292
            ff_emulated_edge_mc(uvbuf, ptr_cb, s->uvlinesize, 9, 9 + field_based,
3293
                             uvsrc_x, uvsrc_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
3294
            ff_emulated_edge_mc(uvbuf + 16, ptr_cr, s->uvlinesize, 9, 9 + field_based,
3295 3296 3297 3298 3299
                             uvsrc_x, uvsrc_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
            ptr_cb= uvbuf;
            ptr_cr= uvbuf + 16;
        }
    }
M
Michael Niedermayer 已提交
3300

3301 3302 3303 3304 3305 3306 3307 3308 3309 3310 3311 3312 3313 3314 3315 3316 3317 3318
    if(!field_based)
        qpix_op[0][dxy](dest_y, ptr_y, linesize);
    else{
        if(bottom_field){
            dest_y += s->linesize;
            dest_cb+= s->uvlinesize;
            dest_cr+= s->uvlinesize;
        }

        if(field_select){
            ptr_y  += s->linesize;
            ptr_cb += s->uvlinesize;
            ptr_cr += s->uvlinesize;
        }
        //damn interlaced mode
        //FIXME boundary mirroring is not exactly correct here
        qpix_op[1][dxy](dest_y  , ptr_y  , linesize);
        qpix_op[1][dxy](dest_y+8, ptr_y+8, linesize);
M
Michael Niedermayer 已提交
3319
    }
3320 3321 3322
    if(!(s->flags&CODEC_FLAG_GRAY)){
        pix_op[1][uvdxy](dest_cr, ptr_cr, uvlinesize, h >> 1);
        pix_op[1][uvdxy](dest_cb, ptr_cb, uvlinesize, h >> 1);
M
Michael Niedermayer 已提交
3323
    }
M
Michael Niedermayer 已提交
3324 3325
}

3326 3327 3328 3329 3330 3331 3332 3333
inline int ff_h263_round_chroma(int x){
    if (x >= 0)
        return  (h263_chroma_roundtab[x & 0xf] + ((x >> 3) & ~1));
    else {
        x = -x;
        return -(h263_chroma_roundtab[x & 0xf] + ((x >> 3) & ~1));
    }
}
M
Michael Niedermayer 已提交
3334

M
Michael Niedermayer 已提交
3335 3336 3337 3338 3339 3340 3341 3342 3343 3344
/**
 * h263 chorma 4mv motion compensation.
 */
static inline void chroma_4mv_motion(MpegEncContext *s,
                                     uint8_t *dest_cb, uint8_t *dest_cr,
                                     uint8_t **ref_picture,
                                     op_pixels_func *pix_op,
                                     int mx, int my){
    int dxy, emu=0, src_x, src_y, offset;
    uint8_t *ptr;
3345

M
Michael Niedermayer 已提交
3346 3347 3348 3349
    /* In case of 8X8, we construct a single chroma motion vector
       with a special rounding */
    mx= ff_h263_round_chroma(mx);
    my= ff_h263_round_chroma(my);
3350

M
Michael Niedermayer 已提交
3351 3352 3353 3354 3355 3356
    dxy = ((my & 1) << 1) | (mx & 1);
    mx >>= 1;
    my >>= 1;

    src_x = s->mb_x * 8 + mx;
    src_y = s->mb_y * 8 + my;
3357
    src_x = av_clip(src_x, -8, s->width/2);
M
Michael Niedermayer 已提交
3358 3359
    if (src_x == s->width/2)
        dxy &= ~1;
3360
    src_y = av_clip(src_y, -8, s->height/2);
M
Michael Niedermayer 已提交
3361 3362
    if (src_y == s->height/2)
        dxy &= ~2;
3363

M
Michael Niedermayer 已提交
3364 3365 3366 3367 3368 3369 3370 3371 3372 3373 3374 3375 3376 3377 3378 3379 3380 3381 3382 3383
    offset = (src_y * (s->uvlinesize)) + src_x;
    ptr = ref_picture[1] + offset;
    if(s->flags&CODEC_FLAG_EMU_EDGE){
        if(   (unsigned)src_x > (s->h_edge_pos>>1) - (dxy &1) - 8
           || (unsigned)src_y > (s->v_edge_pos>>1) - (dxy>>1) - 8){
            ff_emulated_edge_mc(s->edge_emu_buffer, ptr, s->uvlinesize, 9, 9, src_x, src_y, s->h_edge_pos>>1, s->v_edge_pos>>1);
            ptr= s->edge_emu_buffer;
            emu=1;
        }
    }
    pix_op[dxy](dest_cb, ptr, s->uvlinesize, 8);

    ptr = ref_picture[2] + offset;
    if(emu){
        ff_emulated_edge_mc(s->edge_emu_buffer, ptr, s->uvlinesize, 9, 9, src_x, src_y, s->h_edge_pos>>1, s->v_edge_pos>>1);
        ptr= s->edge_emu_buffer;
    }
    pix_op[dxy](dest_cr, ptr, s->uvlinesize, 8);
}

M
Michael Niedermayer 已提交
3384 3385 3386 3387 3388 3389 3390 3391 3392 3393 3394 3395
static inline void chroma_4mv_motion_lowres(MpegEncContext *s,
                                     uint8_t *dest_cb, uint8_t *dest_cr,
                                     uint8_t **ref_picture,
                                     h264_chroma_mc_func *pix_op,
                                     int mx, int my){
    const int lowres= s->avctx->lowres;
    const int block_s= 8>>lowres;
    const int s_mask= (2<<lowres)-1;
    const int h_edge_pos = s->h_edge_pos >> (lowres+1);
    const int v_edge_pos = s->v_edge_pos >> (lowres+1);
    int emu=0, src_x, src_y, offset, sx, sy;
    uint8_t *ptr;
3396

M
Michael Niedermayer 已提交
3397 3398 3399 3400 3401 3402 3403 3404 3405
    if(s->quarter_sample){
        mx/=2;
        my/=2;
    }

    /* In case of 8X8, we construct a single chroma motion vector
       with a special rounding */
    mx= ff_h263_round_chroma(mx);
    my= ff_h263_round_chroma(my);
3406

M
Michael Niedermayer 已提交
3407 3408 3409 3410
    sx= mx & s_mask;
    sy= my & s_mask;
    src_x = s->mb_x*block_s + (mx >> (lowres+1));
    src_y = s->mb_y*block_s + (my >> (lowres+1));
3411

M
Michael Niedermayer 已提交
3412 3413 3414 3415 3416 3417 3418 3419 3420
    offset = src_y * s->uvlinesize + src_x;
    ptr = ref_picture[1] + offset;
    if(s->flags&CODEC_FLAG_EMU_EDGE){
        if(   (unsigned)src_x > h_edge_pos - (!!sx) - block_s
           || (unsigned)src_y > v_edge_pos - (!!sy) - block_s){
            ff_emulated_edge_mc(s->edge_emu_buffer, ptr, s->uvlinesize, 9, 9, src_x, src_y, h_edge_pos, v_edge_pos);
            ptr= s->edge_emu_buffer;
            emu=1;
        }
3421
    }
M
Michael Niedermayer 已提交
3422 3423 3424
    sx <<= 2 - lowres;
    sy <<= 2 - lowres;
    pix_op[lowres](dest_cb, ptr, s->uvlinesize, block_s, sx, sy);
3425

M
Michael Niedermayer 已提交
3426 3427 3428 3429 3430 3431 3432 3433
    ptr = ref_picture[2] + offset;
    if(emu){
        ff_emulated_edge_mc(s->edge_emu_buffer, ptr, s->uvlinesize, 9, 9, src_x, src_y, h_edge_pos, v_edge_pos);
        ptr= s->edge_emu_buffer;
    }
    pix_op[lowres](dest_cr, ptr, s->uvlinesize, block_s, sx, sy);
}

3434 3435 3436 3437 3438 3439 3440 3441 3442 3443 3444 3445
static inline void prefetch_motion(MpegEncContext *s, uint8_t **pix, int dir){
    /* fetch pixels for estimated mv 4 macroblocks ahead
     * optimized for 64byte cache lines */
    const int shift = s->quarter_sample ? 2 : 1;
    const int mx= (s->mv[dir][0][0]>>shift) + 16*s->mb_x + 8;
    const int my= (s->mv[dir][0][1]>>shift) + 16*s->mb_y;
    int off= mx + (my + (s->mb_x&3)*4)*s->linesize + 64;
    s->dsp.prefetch(pix[0]+off, s->linesize, 4);
    off= (mx>>1) + ((my>>1) + (s->mb_x&7))*s->uvlinesize + 64;
    s->dsp.prefetch(pix[1]+off, pix[2]-pix[1], 2);
}

M
doxy  
Michael Niedermayer 已提交
3446
/**
D
Diego Biurrun 已提交
3447
 * motion compensation of a single macroblock
M
doxy  
Michael Niedermayer 已提交
3448 3449 3450 3451 3452 3453 3454 3455 3456 3457
 * @param s context
 * @param dest_y luma destination pointer
 * @param dest_cb chroma cb/u destination pointer
 * @param dest_cr chroma cr/v destination pointer
 * @param dir direction (0->forward, 1->backward)
 * @param ref_picture array[3] of pointers to the 3 planes of the reference picture
 * @param pic_op halfpel motion compensation function (average or put normally)
 * @param pic_op qpel motion compensation function (average or put normally)
 * the motion vectors are taken from s->mv and the MV type from s->mv_type
 */
3458
static inline void MPV_motion(MpegEncContext *s,
3459
                              uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
3460
                              int dir, uint8_t **ref_picture,
M
Michael Niedermayer 已提交
3461
                              op_pixels_func (*pix_op)[4], qpel_mc_func (*qpix_op)[16])
F
Fabrice Bellard 已提交
3462
{
M
Michael Niedermayer 已提交
3463
    int dxy, mx, my, src_x, src_y, motion_x, motion_y;
F
Fabrice Bellard 已提交
3464
    int mb_x, mb_y, i;
3465
    uint8_t *ptr, *dest;
F
Fabrice Bellard 已提交
3466 3467 3468 3469

    mb_x = s->mb_x;
    mb_y = s->mb_y;

3470 3471
    prefetch_motion(s, ref_picture, dir);

3472
    if(s->obmc && s->pict_type != B_TYPE){
M
Michael Niedermayer 已提交
3473 3474
        int16_t mv_cache[4][4][2];
        const int xy= s->mb_x + s->mb_y*s->mb_stride;
3475 3476
        const int mot_stride= s->b8_stride;
        const int mot_xy= mb_x*2 + mb_y*2*mot_stride;
M
Michael Niedermayer 已提交
3477

3478
        assert(!s->mb_skipped);
3479

3480 3481 3482
        memcpy(mv_cache[1][1], s->current_picture.motion_val[0][mot_xy           ], sizeof(int16_t)*4);
        memcpy(mv_cache[2][1], s->current_picture.motion_val[0][mot_xy+mot_stride], sizeof(int16_t)*4);
        memcpy(mv_cache[3][1], s->current_picture.motion_val[0][mot_xy+mot_stride], sizeof(int16_t)*4);
M
Michael Niedermayer 已提交
3483 3484 3485 3486

        if(mb_y==0 || IS_INTRA(s->current_picture.mb_type[xy-s->mb_stride])){
            memcpy(mv_cache[0][1], mv_cache[1][1], sizeof(int16_t)*4);
        }else{
3487
            memcpy(mv_cache[0][1], s->current_picture.motion_val[0][mot_xy-mot_stride], sizeof(int16_t)*4);
M
Michael Niedermayer 已提交
3488 3489 3490 3491 3492 3493
        }

        if(mb_x==0 || IS_INTRA(s->current_picture.mb_type[xy-1])){
            *(int32_t*)mv_cache[1][0]= *(int32_t*)mv_cache[1][1];
            *(int32_t*)mv_cache[2][0]= *(int32_t*)mv_cache[2][1];
        }else{
3494 3495
            *(int32_t*)mv_cache[1][0]= *(int32_t*)s->current_picture.motion_val[0][mot_xy-1];
            *(int32_t*)mv_cache[2][0]= *(int32_t*)s->current_picture.motion_val[0][mot_xy-1+mot_stride];
M
Michael Niedermayer 已提交
3496 3497 3498 3499 3500 3501
        }

        if(mb_x+1>=s->mb_width || IS_INTRA(s->current_picture.mb_type[xy+1])){
            *(int32_t*)mv_cache[1][3]= *(int32_t*)mv_cache[1][2];
            *(int32_t*)mv_cache[2][3]= *(int32_t*)mv_cache[2][2];
        }else{
3502 3503
            *(int32_t*)mv_cache[1][3]= *(int32_t*)s->current_picture.motion_val[0][mot_xy+2];
            *(int32_t*)mv_cache[2][3]= *(int32_t*)s->current_picture.motion_val[0][mot_xy+2+mot_stride];
M
Michael Niedermayer 已提交
3504
        }
3505

M
Michael Niedermayer 已提交
3506 3507 3508 3509 3510 3511 3512 3513 3514 3515 3516 3517 3518 3519 3520 3521 3522 3523 3524 3525 3526 3527 3528 3529 3530 3531
        mx = 0;
        my = 0;
        for(i=0;i<4;i++) {
            const int x= (i&1)+1;
            const int y= (i>>1)+1;
            int16_t mv[5][2]= {
                {mv_cache[y][x  ][0], mv_cache[y][x  ][1]},
                {mv_cache[y-1][x][0], mv_cache[y-1][x][1]},
                {mv_cache[y][x-1][0], mv_cache[y][x-1][1]},
                {mv_cache[y][x+1][0], mv_cache[y][x+1][1]},
                {mv_cache[y+1][x][0], mv_cache[y+1][x][1]}};
            //FIXME cleanup
            obmc_motion(s, dest_y + ((i & 1) * 8) + (i >> 1) * 8 * s->linesize,
                        ref_picture[0],
                        mb_x * 16 + (i & 1) * 8, mb_y * 16 + (i >>1) * 8,
                        pix_op[1],
                        mv);

            mx += mv[0][0];
            my += mv[0][1];
        }
        if(!(s->flags&CODEC_FLAG_GRAY))
            chroma_4mv_motion(s, dest_cb, dest_cr, ref_picture, pix_op[1], mx, my);

        return;
    }
3532

F
Fabrice Bellard 已提交
3533 3534
    switch(s->mv_type) {
    case MV_TYPE_16X16:
M
Michael Niedermayer 已提交
3535
        if(s->mcsel){
3536
            if(s->real_sprite_warping_points==1){
3537 3538
                gmc1_motion(s, dest_y, dest_cb, dest_cr,
                            ref_picture);
3539
            }else{
3540 3541
                gmc_motion(s, dest_y, dest_cb, dest_cr,
                            ref_picture);
3542
            }
M
Michael Niedermayer 已提交
3543
        }else if(s->quarter_sample){
3544
            qpel_motion(s, dest_y, dest_cb, dest_cr,
3545 3546
                        0, 0, 0,
                        ref_picture, pix_op, qpix_op,
M
Michael Niedermayer 已提交
3547
                        s->mv[dir][0][0], s->mv[dir][0][1], 16);
3548
        }else if(ENABLE_WMV2 && s->mspel){
M
Michael Niedermayer 已提交
3549 3550 3551
            ff_mspel_motion(s, dest_y, dest_cb, dest_cr,
                        ref_picture, pix_op,
                        s->mv[dir][0][0], s->mv[dir][0][1], 16);
M
Michael Niedermayer 已提交
3552 3553
        }else
        {
3554
            mpeg_motion(s, dest_y, dest_cb, dest_cr,
3555 3556
                        0, 0, 0,
                        ref_picture, pix_op,
M
Michael Niedermayer 已提交
3557
                        s->mv[dir][0][0], s->mv[dir][0][1], 16);
3558
        }
F
Fabrice Bellard 已提交
3559 3560
        break;
    case MV_TYPE_8X8:
M
Michael Niedermayer 已提交
3561 3562 3563 3564 3565 3566 3567 3568 3569 3570
        mx = 0;
        my = 0;
        if(s->quarter_sample){
            for(i=0;i<4;i++) {
                motion_x = s->mv[dir][i][0];
                motion_y = s->mv[dir][i][1];

                dxy = ((motion_y & 3) << 2) | (motion_x & 3);
                src_x = mb_x * 16 + (motion_x >> 2) + (i & 1) * 8;
                src_y = mb_y * 16 + (motion_y >> 2) + (i >>1) * 8;
3571

M
Michael Niedermayer 已提交
3572
                /* WARNING: do no forget half pels */
3573
                src_x = av_clip(src_x, -16, s->width);
M
Michael Niedermayer 已提交
3574 3575
                if (src_x == s->width)
                    dxy &= ~3;
3576
                src_y = av_clip(src_y, -16, s->height);
M
Michael Niedermayer 已提交
3577 3578
                if (src_y == s->height)
                    dxy &= ~12;
3579

M
Michael Niedermayer 已提交
3580 3581
                ptr = ref_picture[0] + (src_y * s->linesize) + (src_x);
                if(s->flags&CODEC_FLAG_EMU_EDGE){
3582
                    if(   (unsigned)src_x > s->h_edge_pos - (motion_x&3) - 8
3583
                       || (unsigned)src_y > s->v_edge_pos - (motion_y&3) - 8 ){
3584
                        ff_emulated_edge_mc(s->edge_emu_buffer, ptr, s->linesize, 9, 9, src_x, src_y, s->h_edge_pos, s->v_edge_pos);
M
Michael Niedermayer 已提交
3585 3586 3587 3588 3589 3590 3591 3592 3593 3594 3595
                        ptr= s->edge_emu_buffer;
                    }
                }
                dest = dest_y + ((i & 1) * 8) + (i >> 1) * 8 * s->linesize;
                qpix_op[1][dxy](dest, ptr, s->linesize);

                mx += s->mv[dir][i][0]/2;
                my += s->mv[dir][i][1]/2;
            }
        }else{
            for(i=0;i<4;i++) {
M
Michael Niedermayer 已提交
3596
                hpel_motion(s, dest_y + ((i & 1) * 8) + (i >> 1) * 8 * s->linesize,
3597
                            ref_picture[0], 0, 0,
M
Michael Niedermayer 已提交
3598 3599 3600 3601 3602
                            mb_x * 16 + (i & 1) * 8, mb_y * 16 + (i >>1) * 8,
                            s->width, s->height, s->linesize,
                            s->h_edge_pos, s->v_edge_pos,
                            8, 8, pix_op[1],
                            s->mv[dir][i][0], s->mv[dir][i][1]);
M
Michael Niedermayer 已提交
3603 3604 3605

                mx += s->mv[dir][i][0];
                my += s->mv[dir][i][1];
M
Michael Niedermayer 已提交
3606
            }
F
Fabrice Bellard 已提交
3607
        }
M
Michael Niedermayer 已提交
3608

M
Michael Niedermayer 已提交
3609 3610
        if(!(s->flags&CODEC_FLAG_GRAY))
            chroma_4mv_motion(s, dest_cb, dest_cr, ref_picture, pix_op[1], mx, my);
F
Fabrice Bellard 已提交
3611 3612 3613
        break;
    case MV_TYPE_FIELD:
        if (s->picture_structure == PICT_FRAME) {
3614
            if(s->quarter_sample){
M
Michael Niedermayer 已提交
3615 3616 3617 3618 3619 3620
                for(i=0; i<2; i++){
                    qpel_motion(s, dest_y, dest_cb, dest_cr,
                                1, i, s->field_select[dir][i],
                                ref_picture, pix_op, qpix_op,
                                s->mv[dir][i][0], s->mv[dir][i][1], 8);
                }
3621
            }else{
3622
                /* top field */
3623 3624 3625
                mpeg_motion(s, dest_y, dest_cb, dest_cr,
                            1, 0, s->field_select[dir][0],
                            ref_picture, pix_op,
3626 3627
                            s->mv[dir][0][0], s->mv[dir][0][1], 8);
                /* bottom field */
3628 3629 3630
                mpeg_motion(s, dest_y, dest_cb, dest_cr,
                            1, 1, s->field_select[dir][1],
                            ref_picture, pix_op,
3631 3632
                            s->mv[dir][1][0], s->mv[dir][1][1], 8);
            }
F
Fabrice Bellard 已提交
3633
        } else {
3634 3635
            if(s->picture_structure != s->field_select[dir][0] + 1 && s->pict_type != B_TYPE && !s->first_field){
                ref_picture= s->current_picture_ptr->data;
3636
            }
F
Fabrice Bellard 已提交
3637

3638 3639 3640
            mpeg_motion(s, dest_y, dest_cb, dest_cr,
                        0, 0, s->field_select[dir][0],
                        ref_picture, pix_op,
3641
                        s->mv[dir][0][0], s->mv[dir][0][1], 16);
F
Fabrice Bellard 已提交
3642
        }
3643
        break;
M
Michael Niedermayer 已提交
3644 3645 3646
    case MV_TYPE_16X8:
        for(i=0; i<2; i++){
            uint8_t ** ref2picture;
3647

M
Michael Niedermayer 已提交
3648
            if(s->picture_structure == s->field_select[dir][i] + 1 || s->pict_type == B_TYPE || s->first_field){
3649 3650
                ref2picture= ref_picture;
            }else{
3651
                ref2picture= s->current_picture_ptr->data;
3652
            }
3653

3654
            mpeg_motion(s, dest_y, dest_cb, dest_cr,
M
Michael Niedermayer 已提交
3655
                        0, 0, s->field_select[dir][i],
3656
                        ref2picture, pix_op,
M
Michael Niedermayer 已提交
3657
                        s->mv[dir][i][0], s->mv[dir][i][1] + 16*i, 8);
3658

M
Michael Niedermayer 已提交
3659
            dest_y += 16*s->linesize;
3660 3661
            dest_cb+= (16>>s->chroma_y_shift)*s->uvlinesize;
            dest_cr+= (16>>s->chroma_y_shift)*s->uvlinesize;
3662
        }
F
Fabrice Bellard 已提交
3663
        break;
3664 3665
    case MV_TYPE_DMV:
        if(s->picture_structure == PICT_FRAME){
M
Michael Niedermayer 已提交
3666 3667 3668 3669 3670 3671 3672 3673
            for(i=0; i<2; i++){
                int j;
                for(j=0; j<2; j++){
                    mpeg_motion(s, dest_y, dest_cb, dest_cr,
                                1, j, j^i,
                                ref_picture, pix_op,
                                s->mv[dir][2*i + j][0], s->mv[dir][2*i + j][1], 8);
                }
3674
                pix_op = s->dsp.avg_pixels_tab;
M
Michael Niedermayer 已提交
3675
            }
3676
        }else{
M
Michael Niedermayer 已提交
3677
            for(i=0; i<2; i++){
3678
                mpeg_motion(s, dest_y, dest_cb, dest_cr,
M
Michael Niedermayer 已提交
3679 3680 3681
                            0, 0, s->picture_structure != i+1,
                            ref_picture, pix_op,
                            s->mv[dir][2*i][0],s->mv[dir][2*i][1],16);
3682

M
Michael Niedermayer 已提交
3683
                // after put we make avg of the same block
3684
                pix_op=s->dsp.avg_pixels_tab;
3685

M
Michael Niedermayer 已提交
3686 3687
                //opposite parity is always in the same frame if this is second field
                if(!s->first_field){
3688
                    ref_picture = s->current_picture_ptr->data;
M
Michael Niedermayer 已提交
3689
                }
3690
            }
3691 3692
        }
    break;
M
Michael Niedermayer 已提交
3693
    default: assert(0);
F
Fabrice Bellard 已提交
3694 3695 3696
    }
}

M
Michael Niedermayer 已提交
3697
/**
D
Diego Biurrun 已提交
3698
 * motion compensation of a single macroblock
M
Michael Niedermayer 已提交
3699 3700 3701 3702 3703 3704 3705 3706 3707
 * @param s context
 * @param dest_y luma destination pointer
 * @param dest_cb chroma cb/u destination pointer
 * @param dest_cr chroma cr/v destination pointer
 * @param dir direction (0->forward, 1->backward)
 * @param ref_picture array[3] of pointers to the 3 planes of the reference picture
 * @param pic_op halfpel motion compensation function (average or put normally)
 * the motion vectors are taken from s->mv and the MV type from s->mv_type
 */
3708
static inline void MPV_motion_lowres(MpegEncContext *s,
M
Michael Niedermayer 已提交
3709
                              uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
3710
                              int dir, uint8_t **ref_picture,
M
Michael Niedermayer 已提交
3711 3712
                              h264_chroma_mc_func *pix_op)
{
M
Michael Niedermayer 已提交
3713
    int mx, my;
3714 3715
    int mb_x, mb_y, i;
    const int lowres= s->avctx->lowres;
3716
    const int block_s= 8>>lowres;
3717 3718 3719 3720 3721 3722

    mb_x = s->mb_x;
    mb_y = s->mb_y;

    switch(s->mv_type) {
    case MV_TYPE_16X16:
3723
        mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
3724 3725 3726 3727
                    0, 0, 0,
                    ref_picture, pix_op,
                    s->mv[dir][0][0], s->mv[dir][0][1], 2*block_s);
        break;
M
Michael Niedermayer 已提交
3728
    case MV_TYPE_8X8:
3729 3730 3731
        mx = 0;
        my = 0;
            for(i=0;i<4;i++) {
M
Michael Niedermayer 已提交
3732
                hpel_motion_lowres(s, dest_y + ((i & 1) + (i >> 1) * s->linesize)*block_s,
3733
                            ref_picture[0], 0, 0,
M
Michael Niedermayer 已提交
3734
                            (2*mb_x + (i & 1))*block_s, (2*mb_y + (i >>1))*block_s,
3735
                            s->width, s->height, s->linesize,
M
Michael Niedermayer 已提交
3736 3737
                            s->h_edge_pos >> lowres, s->v_edge_pos >> lowres,
                            block_s, block_s, pix_op,
3738 3739 3740 3741 3742 3743 3744
                            s->mv[dir][i][0], s->mv[dir][i][1]);

                mx += s->mv[dir][i][0];
                my += s->mv[dir][i][1];
            }

        if(!(s->flags&CODEC_FLAG_GRAY))
M
Michael Niedermayer 已提交
3745 3746
            chroma_4mv_motion_lowres(s, dest_cb, dest_cr, ref_picture, pix_op, mx, my);
        break;
3747 3748
    case MV_TYPE_FIELD:
        if (s->picture_structure == PICT_FRAME) {
3749
            /* top field */
3750 3751 3752 3753 3754 3755 3756 3757 3758 3759 3760 3761
            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
                        1, 0, s->field_select[dir][0],
                        ref_picture, pix_op,
                        s->mv[dir][0][0], s->mv[dir][0][1], block_s);
            /* bottom field */
            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
                        1, 1, s->field_select[dir][1],
                        ref_picture, pix_op,
                        s->mv[dir][1][0], s->mv[dir][1][1], block_s);
        } else {
            if(s->picture_structure != s->field_select[dir][0] + 1 && s->pict_type != B_TYPE && !s->first_field){
                ref_picture= s->current_picture_ptr->data;
3762
            }
3763 3764 3765 3766 3767 3768 3769 3770 3771 3772 3773 3774 3775 3776 3777

            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
                        0, 0, s->field_select[dir][0],
                        ref_picture, pix_op,
                        s->mv[dir][0][0], s->mv[dir][0][1], 2*block_s);
        }
        break;
    case MV_TYPE_16X8:
        for(i=0; i<2; i++){
            uint8_t ** ref2picture;

            if(s->picture_structure == s->field_select[dir][i] + 1 || s->pict_type == B_TYPE || s->first_field){
                ref2picture= ref_picture;
            }else{
                ref2picture= s->current_picture_ptr->data;
3778
            }
3779

3780
            mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
3781 3782 3783
                        0, 0, s->field_select[dir][i],
                        ref2picture, pix_op,
                        s->mv[dir][i][0], s->mv[dir][i][1] + 2*block_s*i, block_s);
3784

3785 3786 3787
            dest_y += 2*block_s*s->linesize;
            dest_cb+= (2*block_s>>s->chroma_y_shift)*s->uvlinesize;
            dest_cr+= (2*block_s>>s->chroma_y_shift)*s->uvlinesize;
3788
        }
3789 3790 3791 3792 3793 3794 3795 3796 3797 3798 3799 3800 3801 3802 3803
        break;
    case MV_TYPE_DMV:
        if(s->picture_structure == PICT_FRAME){
            for(i=0; i<2; i++){
                int j;
                for(j=0; j<2; j++){
                    mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
                                1, j, j^i,
                                ref_picture, pix_op,
                                s->mv[dir][2*i + j][0], s->mv[dir][2*i + j][1], block_s);
                }
                pix_op = s->dsp.avg_h264_chroma_pixels_tab;
            }
        }else{
            for(i=0; i<2; i++){
3804
                mpeg_motion_lowres(s, dest_y, dest_cb, dest_cr,
3805 3806 3807 3808 3809 3810 3811 3812 3813
                            0, 0, s->picture_structure != i+1,
                            ref_picture, pix_op,
                            s->mv[dir][2*i][0],s->mv[dir][2*i][1],2*block_s);

                // after put we make avg of the same block
                pix_op = s->dsp.avg_h264_chroma_pixels_tab;

                //opposite parity is always in the same frame if this is second field
                if(!s->first_field){
3814
                    ref_picture = s->current_picture_ptr->data;
3815 3816 3817 3818 3819 3820
                }
            }
        }
    break;
    default: assert(0);
    }
M
Michael Niedermayer 已提交
3821
}
F
Fabrice Bellard 已提交
3822 3823

/* put block[] to dest[] */
3824
static inline void put_dct(MpegEncContext *s,
3825
                           DCTELEM *block, int i, uint8_t *dest, int line_size, int qscale)
F
Fabrice Bellard 已提交
3826
{
3827
    s->dct_unquantize_intra(s, block, i, qscale);
3828
    s->dsp.idct_put (dest, line_size, block);
F
Fabrice Bellard 已提交
3829 3830 3831
}

/* add block[] to dest[] */
3832
static inline void add_dct(MpegEncContext *s,
3833
                           DCTELEM *block, int i, uint8_t *dest, int line_size)
F
Fabrice Bellard 已提交
3834
{
M
Michael Niedermayer 已提交
3835
    if (s->block_last_index[i] >= 0) {
3836
        s->dsp.idct_add (dest, line_size, block);
M
Michael Niedermayer 已提交
3837 3838
    }
}
3839

3840
static inline void add_dequant_dct(MpegEncContext *s,
M
Michael Niedermayer 已提交
3841
                           DCTELEM *block, int i, uint8_t *dest, int line_size, int qscale)
M
Michael Niedermayer 已提交
3842
{
F
Fabrice Bellard 已提交
3843
    if (s->block_last_index[i] >= 0) {
3844
        s->dct_unquantize_inter(s, block, i, qscale);
3845

3846
        s->dsp.idct_add (dest, line_size, block);
F
Fabrice Bellard 已提交
3847 3848 3849
    }
}

3850 3851 3852 3853 3854
/**
 * cleans dc, ac, coded_block for the current non intra MB
 */
void ff_clean_intra_table_entries(MpegEncContext *s)
{
3855
    int wrap = s->b8_stride;
3856
    int xy = s->block_index[0];
3857 3858 3859

    s->dc_val[0][xy           ] =
    s->dc_val[0][xy + 1       ] =
3860 3861 3862
    s->dc_val[0][xy     + wrap] =
    s->dc_val[0][xy + 1 + wrap] = 1024;
    /* ac pred */
3863 3864
    memset(s->ac_val[0][xy       ], 0, 32 * sizeof(int16_t));
    memset(s->ac_val[0][xy + wrap], 0, 32 * sizeof(int16_t));
3865 3866 3867 3868 3869 3870 3871
    if (s->msmpeg4_version>=3) {
        s->coded_block[xy           ] =
        s->coded_block[xy + 1       ] =
        s->coded_block[xy     + wrap] =
        s->coded_block[xy + 1 + wrap] = 0;
    }
    /* chroma */
3872 3873
    wrap = s->mb_stride;
    xy = s->mb_x + s->mb_y * wrap;
3874 3875 3876
    s->dc_val[1][xy] =
    s->dc_val[2][xy] = 1024;
    /* ac pred */
3877 3878
    memset(s->ac_val[1][xy], 0, 16 * sizeof(int16_t));
    memset(s->ac_val[2][xy], 0, 16 * sizeof(int16_t));
3879

3880
    s->mbintra_table[xy]= 0;
3881 3882
}

F
Fabrice Bellard 已提交
3883 3884 3885 3886 3887 3888 3889 3890 3891 3892
/* generic function called after a macroblock has been parsed by the
   decoder or after it has been encoded by the encoder.

   Important variables used:
   s->mb_intra : true if intra macroblock
   s->mv_dir   : motion vector direction
   s->mv_type  : motion vector type
   s->mv       : motion vector
   s->interlaced_dct : true if interlaced dct used (mpeg2)
 */
3893
static av_always_inline void MPV_decode_mb_internal(MpegEncContext *s, DCTELEM block[12][64], int lowres_flag)
F
Fabrice Bellard 已提交
3894
{
3895
    int mb_x, mb_y;
3896
    const int mb_xy = s->mb_y * s->mb_stride + s->mb_x;
I
Ivan Kalvachev 已提交
3897 3898
#ifdef HAVE_XVMC
    if(s->avctx->xvmc_acceleration){
3899
        XVMC_decode_mb(s);//xvmc uses pblocks
I
Ivan Kalvachev 已提交
3900 3901 3902
        return;
    }
#endif
F
Fabrice Bellard 已提交
3903 3904 3905 3906

    mb_x = s->mb_x;
    mb_y = s->mb_y;

3907 3908 3909 3910 3911 3912 3913 3914 3915
    if(s->avctx->debug&FF_DEBUG_DCT_COEFF) {
       /* save DCT coefficients */
       int i,j;
       DCTELEM *dct = &s->current_picture.dct_coeff[mb_xy*64*6];
       for(i=0; i<6; i++)
           for(j=0; j<64; j++)
               *dct++ = block[i][s->dsp.idct_permutation[j]];
    }

M
cleanup  
Michael Niedermayer 已提交
3916
    s->current_picture.qscale_table[mb_xy]= s->qscale;
3917

F
Fabrice Bellard 已提交
3918 3919
    /* update DC predictors for P macroblocks */
    if (!s->mb_intra) {
3920
        if (s->h263_pred || s->h263_aic) {
M
Michael Niedermayer 已提交
3921
            if(s->mbintra_table[mb_xy])
3922
                ff_clean_intra_table_entries(s);
F
Fabrice Bellard 已提交
3923
        } else {
3924 3925
            s->last_dc[0] =
            s->last_dc[1] =
F
Fabrice Bellard 已提交
3926 3927 3928
            s->last_dc[2] = 128 << s->intra_dc_precision;
        }
    }
3929
    else if (s->h263_pred || s->h263_aic)
M
Michael Niedermayer 已提交
3930
        s->mbintra_table[mb_xy]=1;
3931

3932
    if ((s->flags&CODEC_FLAG_PSNR) || !(s->encoding && (s->intra_only || s->pict_type==B_TYPE) && s->avctx->mb_decision != FF_MB_DECISION_RD)) { //FIXME precalc
3933
        uint8_t *dest_y, *dest_cb, *dest_cr;
M
Michael Niedermayer 已提交
3934
        int dct_linesize, dct_offset;
M
Michael Niedermayer 已提交
3935 3936
        op_pixels_func (*op_pix)[4];
        qpel_mc_func (*op_qpix)[16];
3937
        const int linesize= s->current_picture.linesize[0]; //not s->linesize as this would be wrong for field pics
M
Michael Niedermayer 已提交
3938
        const int uvlinesize= s->current_picture.linesize[1];
M
Michael Niedermayer 已提交
3939 3940
        const int readable= s->pict_type != B_TYPE || s->encoding || s->avctx->draw_horiz_band || lowres_flag;
        const int block_size= lowres_flag ? 8>>s->avctx->lowres : 8;
3941

M
cleanup  
Michael Niedermayer 已提交
3942 3943 3944
        /* avoid copy if macroblock skipped in last frame too */
        /* skip only during decoding as we might trash the buffers during encoding a bit */
        if(!s->encoding){
3945
            uint8_t *mbskip_ptr = &s->mbskip_table[mb_xy];
M
cleanup  
Michael Niedermayer 已提交
3946
            const int age= s->current_picture.age;
M
Michael Niedermayer 已提交
3947

M
cleanup  
Michael Niedermayer 已提交
3948 3949
            assert(age);

3950 3951
            if (s->mb_skipped) {
                s->mb_skipped= 0;
M
cleanup  
Michael Niedermayer 已提交
3952
                assert(s->pict_type!=I_TYPE);
3953

3954
                (*mbskip_ptr) ++; /* indicate that this time we skipped it */
M
Michael Niedermayer 已提交
3955 3956
                if(*mbskip_ptr >99) *mbskip_ptr= 99;

M
cleanup  
Michael Niedermayer 已提交
3957
                /* if previous was skipped too, then nothing to do !  */
3958 3959
                if (*mbskip_ptr >= age && s->current_picture.reference){
                    return;
M
cleanup  
Michael Niedermayer 已提交
3960
                }
3961 3962 3963 3964
            } else if(!s->current_picture.reference){
                (*mbskip_ptr) ++; /* increase counter so the age can be compared cleanly */
                if(*mbskip_ptr >99) *mbskip_ptr= 99;
            } else{
3965 3966
                *mbskip_ptr = 0; /* not skipped */
            }
M
Michael Niedermayer 已提交
3967
        }
3968

3969
        dct_linesize = linesize << s->interlaced_dct;
M
Michael Niedermayer 已提交
3970
        dct_offset =(s->interlaced_dct)? linesize : linesize*block_size;
3971

3972 3973 3974 3975 3976
        if(readable){
            dest_y=  s->dest[0];
            dest_cb= s->dest[1];
            dest_cr= s->dest[2];
        }else{
3977
            dest_y = s->b_scratchpad;
3978
            dest_cb= s->b_scratchpad+16*linesize;
3979
            dest_cr= s->b_scratchpad+32*linesize;
3980
        }
M
Michael Niedermayer 已提交
3981

F
Fabrice Bellard 已提交
3982 3983
        if (!s->mb_intra) {
            /* motion handling */
3984
            /* decoding or more than one mb_type (MC was already done otherwise) */
3985
            if(!s->encoding){
M
Michael Niedermayer 已提交
3986 3987
                if(lowres_flag){
                    h264_chroma_mc_func *op_pix = s->dsp.put_h264_chroma_pixels_tab;
F
Fabrice Bellard 已提交
3988

M
Michael Niedermayer 已提交
3989 3990 3991 3992 3993 3994 3995 3996
                    if (s->mv_dir & MV_DIR_FORWARD) {
                        MPV_motion_lowres(s, dest_y, dest_cb, dest_cr, 0, s->last_picture.data, op_pix);
                        op_pix = s->dsp.avg_h264_chroma_pixels_tab;
                    }
                    if (s->mv_dir & MV_DIR_BACKWARD) {
                        MPV_motion_lowres(s, dest_y, dest_cb, dest_cr, 1, s->next_picture.data, op_pix);
                    }
                }else{
3997
                    op_qpix= s->me.qpel_put;
3998
                    if ((!s->no_rounding) || s->pict_type==B_TYPE){
M
Michael Niedermayer 已提交
3999 4000 4001 4002 4003 4004 4005
                        op_pix = s->dsp.put_pixels_tab;
                    }else{
                        op_pix = s->dsp.put_no_rnd_pixels_tab;
                    }
                    if (s->mv_dir & MV_DIR_FORWARD) {
                        MPV_motion(s, dest_y, dest_cb, dest_cr, 0, s->last_picture.data, op_pix, op_qpix);
                        op_pix = s->dsp.avg_pixels_tab;
4006
                        op_qpix= s->me.qpel_avg;
M
Michael Niedermayer 已提交
4007 4008 4009 4010
                    }
                    if (s->mv_dir & MV_DIR_BACKWARD) {
                        MPV_motion(s, dest_y, dest_cb, dest_cr, 1, s->next_picture.data, op_pix, op_qpix);
                    }
4011
                }
F
Fabrice Bellard 已提交
4012 4013
            }

M
Michael Niedermayer 已提交
4014
            /* skip dequant / idct if we are really late ;) */
M
Michael Niedermayer 已提交
4015 4016 4017 4018 4019 4020 4021
            if(s->hurry_up>1) goto skip_idct;
            if(s->avctx->skip_idct){
                if(  (s->avctx->skip_idct >= AVDISCARD_NONREF && s->pict_type == B_TYPE)
                   ||(s->avctx->skip_idct >= AVDISCARD_NONKEY && s->pict_type != I_TYPE)
                   || s->avctx->skip_idct >= AVDISCARD_ALL)
                    goto skip_idct;
            }
M
Michael Niedermayer 已提交
4022

F
Fabrice Bellard 已提交
4023
            /* add dct residue */
M
Michael Niedermayer 已提交
4024
            if(s->encoding || !(   s->h263_msmpeg4 || s->codec_id==CODEC_ID_MPEG1VIDEO || s->codec_id==CODEC_ID_MPEG2VIDEO
4025
                                || (s->codec_id==CODEC_ID_MPEG4 && !s->mpeg_quant))){
M
Michael Niedermayer 已提交
4026 4027 4028 4029
                add_dequant_dct(s, block[0], 0, dest_y                          , dct_linesize, s->qscale);
                add_dequant_dct(s, block[1], 1, dest_y              + block_size, dct_linesize, s->qscale);
                add_dequant_dct(s, block[2], 2, dest_y + dct_offset             , dct_linesize, s->qscale);
                add_dequant_dct(s, block[3], 3, dest_y + dct_offset + block_size, dct_linesize, s->qscale);
M
Michael Niedermayer 已提交
4030

M
Michael Niedermayer 已提交
4031
                if(!(s->flags&CODEC_FLAG_GRAY)){
4032 4033 4034 4035 4036 4037 4038 4039 4040 4041 4042
                    if (s->chroma_y_shift){
                        add_dequant_dct(s, block[4], 4, dest_cb, uvlinesize, s->chroma_qscale);
                        add_dequant_dct(s, block[5], 5, dest_cr, uvlinesize, s->chroma_qscale);
                    }else{
                        dct_linesize >>= 1;
                        dct_offset >>=1;
                        add_dequant_dct(s, block[4], 4, dest_cb,              dct_linesize, s->chroma_qscale);
                        add_dequant_dct(s, block[5], 5, dest_cr,              dct_linesize, s->chroma_qscale);
                        add_dequant_dct(s, block[6], 6, dest_cb + dct_offset, dct_linesize, s->chroma_qscale);
                        add_dequant_dct(s, block[7], 7, dest_cr + dct_offset, dct_linesize, s->chroma_qscale);
                    }
M
Michael Niedermayer 已提交
4043
                }
M
Michael Niedermayer 已提交
4044
            } else if(s->codec_id != CODEC_ID_WMV2){
M
Michael Niedermayer 已提交
4045 4046 4047 4048
                add_dct(s, block[0], 0, dest_y                          , dct_linesize);
                add_dct(s, block[1], 1, dest_y              + block_size, dct_linesize);
                add_dct(s, block[2], 2, dest_y + dct_offset             , dct_linesize);
                add_dct(s, block[3], 3, dest_y + dct_offset + block_size, dct_linesize);
F
Fabrice Bellard 已提交
4049

M
Michael Niedermayer 已提交
4050
                if(!(s->flags&CODEC_FLAG_GRAY)){
4051 4052 4053 4054 4055 4056 4057 4058 4059 4060 4061 4062 4063 4064 4065 4066 4067 4068 4069 4070 4071
                    if(s->chroma_y_shift){//Chroma420
                        add_dct(s, block[4], 4, dest_cb, uvlinesize);
                        add_dct(s, block[5], 5, dest_cr, uvlinesize);
                    }else{
                        //chroma422
                        dct_linesize = uvlinesize << s->interlaced_dct;
                        dct_offset =(s->interlaced_dct)? uvlinesize : uvlinesize*8;

                        add_dct(s, block[4], 4, dest_cb, dct_linesize);
                        add_dct(s, block[5], 5, dest_cr, dct_linesize);
                        add_dct(s, block[6], 6, dest_cb+dct_offset, dct_linesize);
                        add_dct(s, block[7], 7, dest_cr+dct_offset, dct_linesize);
                        if(!s->chroma_x_shift){//Chroma444
                            add_dct(s, block[8], 8, dest_cb+8, dct_linesize);
                            add_dct(s, block[9], 9, dest_cr+8, dct_linesize);
                            add_dct(s, block[10], 10, dest_cb+8+dct_offset, dct_linesize);
                            add_dct(s, block[11], 11, dest_cr+8+dct_offset, dct_linesize);
                        }
                    }
                }//fi gray
            }
4072
            else if (ENABLE_WMV2) {
M
Michael Niedermayer 已提交
4073
                ff_wmv2_add_mb(s, block, dest_y, dest_cb, dest_cr);
M
Michael Niedermayer 已提交
4074
            }
F
Fabrice Bellard 已提交
4075 4076
        } else {
            /* dct only in intra block */
M
Michael Niedermayer 已提交
4077
            if(s->encoding || !(s->codec_id==CODEC_ID_MPEG1VIDEO || s->codec_id==CODEC_ID_MPEG2VIDEO)){
M
Michael Niedermayer 已提交
4078 4079 4080 4081
                put_dct(s, block[0], 0, dest_y                          , dct_linesize, s->qscale);
                put_dct(s, block[1], 1, dest_y              + block_size, dct_linesize, s->qscale);
                put_dct(s, block[2], 2, dest_y + dct_offset             , dct_linesize, s->qscale);
                put_dct(s, block[3], 3, dest_y + dct_offset + block_size, dct_linesize, s->qscale);
4082 4083

                if(!(s->flags&CODEC_FLAG_GRAY)){
4084 4085 4086 4087 4088 4089 4090 4091 4092 4093 4094
                    if(s->chroma_y_shift){
                        put_dct(s, block[4], 4, dest_cb, uvlinesize, s->chroma_qscale);
                        put_dct(s, block[5], 5, dest_cr, uvlinesize, s->chroma_qscale);
                    }else{
                        dct_offset >>=1;
                        dct_linesize >>=1;
                        put_dct(s, block[4], 4, dest_cb,              dct_linesize, s->chroma_qscale);
                        put_dct(s, block[5], 5, dest_cr,              dct_linesize, s->chroma_qscale);
                        put_dct(s, block[6], 6, dest_cb + dct_offset, dct_linesize, s->chroma_qscale);
                        put_dct(s, block[7], 7, dest_cr + dct_offset, dct_linesize, s->chroma_qscale);
                    }
4095 4096
                }
            }else{
M
Michael Niedermayer 已提交
4097 4098 4099 4100
                s->dsp.idct_put(dest_y                          , dct_linesize, block[0]);
                s->dsp.idct_put(dest_y              + block_size, dct_linesize, block[1]);
                s->dsp.idct_put(dest_y + dct_offset             , dct_linesize, block[2]);
                s->dsp.idct_put(dest_y + dct_offset + block_size, dct_linesize, block[3]);
4101 4102

                if(!(s->flags&CODEC_FLAG_GRAY)){
4103 4104 4105 4106 4107 4108 4109 4110 4111 4112 4113 4114 4115 4116 4117 4118 4119 4120 4121 4122
                    if(s->chroma_y_shift){
                        s->dsp.idct_put(dest_cb, uvlinesize, block[4]);
                        s->dsp.idct_put(dest_cr, uvlinesize, block[5]);
                    }else{

                        dct_linesize = uvlinesize << s->interlaced_dct;
                        dct_offset =(s->interlaced_dct)? uvlinesize : uvlinesize*8;

                        s->dsp.idct_put(dest_cb,              dct_linesize, block[4]);
                        s->dsp.idct_put(dest_cr,              dct_linesize, block[5]);
                        s->dsp.idct_put(dest_cb + dct_offset, dct_linesize, block[6]);
                        s->dsp.idct_put(dest_cr + dct_offset, dct_linesize, block[7]);
                        if(!s->chroma_x_shift){//Chroma444
                            s->dsp.idct_put(dest_cb + 8,              dct_linesize, block[8]);
                            s->dsp.idct_put(dest_cr + 8,              dct_linesize, block[9]);
                            s->dsp.idct_put(dest_cb + 8 + dct_offset, dct_linesize, block[10]);
                            s->dsp.idct_put(dest_cr + 8 + dct_offset, dct_linesize, block[11]);
                        }
                    }
                }//gray
M
Michael Niedermayer 已提交
4123
            }
F
Fabrice Bellard 已提交
4124
        }
M
Michael Niedermayer 已提交
4125
skip_idct:
4126 4127
        if(!readable){
            s->dsp.put_pixels_tab[0][0](s->dest[0], dest_y ,   linesize,16);
4128 4129
            s->dsp.put_pixels_tab[s->chroma_x_shift][0](s->dest[1], dest_cb, uvlinesize,16 >> s->chroma_y_shift);
            s->dsp.put_pixels_tab[s->chroma_x_shift][0](s->dest[2], dest_cr, uvlinesize,16 >> s->chroma_y_shift);
4130
        }
F
Fabrice Bellard 已提交
4131 4132 4133
    }
}

M
Michael Niedermayer 已提交
4134 4135 4136 4137 4138
void MPV_decode_mb(MpegEncContext *s, DCTELEM block[12][64]){
    if(s->avctx->lowres) MPV_decode_mb_internal(s, block, 1);
    else                  MPV_decode_mb_internal(s, block, 0);
}

4139 4140
#ifdef CONFIG_ENCODERS

4141
static inline void dct_single_coeff_elimination(MpegEncContext *s, int n, int threshold)
4142 4143 4144 4145 4146 4147 4148 4149 4150 4151 4152 4153 4154 4155 4156
{
    static const char tab[64]=
        {3,2,2,1,1,1,1,1,
         1,1,1,1,1,1,1,1,
         1,1,1,1,1,1,1,1,
         0,0,0,0,0,0,0,0,
         0,0,0,0,0,0,0,0,
         0,0,0,0,0,0,0,0,
         0,0,0,0,0,0,0,0,
         0,0,0,0,0,0,0,0};
    int score=0;
    int run=0;
    int i;
    DCTELEM *block= s->block[n];
    const int last_index= s->block_last_index[n];
4157
    int skip_dc;
4158

4159 4160 4161
    if(threshold<0){
        skip_dc=0;
        threshold= -threshold;
4162 4163
    }else
        skip_dc=1;
4164

4165 4166 4167 4168
    /* are all which we could set to zero are allready zero? */
    if(last_index<=skip_dc - 1) return;

    for(i=0; i<=last_index; i++){
4169
        const int j = s->intra_scantable.permutated[i];
D
Diego Biurrun 已提交
4170
        const int level = FFABS(block[j]);
4171 4172 4173 4174 4175 4176 4177 4178 4179 4180 4181 4182
        if(level==1){
            if(skip_dc && i==0) continue;
            score+= tab[run];
            run=0;
        }else if(level>1){
            return;
        }else{
            run++;
        }
    }
    if(score >= threshold) return;
    for(i=skip_dc; i<=last_index; i++){
4183
        const int j = s->intra_scantable.permutated[i];
4184 4185 4186 4187 4188 4189
        block[j]=0;
    }
    if(block[0]) s->block_last_index[n]= 0;
    else         s->block_last_index[n]= -1;
}

4190 4191 4192 4193 4194
static inline void clip_coeffs(MpegEncContext *s, DCTELEM *block, int last_index)
{
    int i;
    const int maxlevel= s->max_qcoeff;
    const int minlevel= s->min_qcoeff;
4195
    int overflow=0;
4196

4197 4198 4199 4200
    if(s->mb_intra){
        i=1; //skip clipping of intra dc
    }else
        i=0;
4201

4202 4203
    for(;i<=last_index; i++){
        const int j= s->intra_scantable.permutated[i];
4204
        int level = block[j];
4205

4206 4207 4208 4209 4210 4211 4212
        if     (level>maxlevel){
            level=maxlevel;
            overflow++;
        }else if(level<minlevel){
            level=minlevel;
            overflow++;
        }
4213

M
cleanup  
Michael Niedermayer 已提交
4214
        block[j]= level;
4215
    }
4216

4217
    if(overflow && s->avctx->mb_decision == FF_MB_DECISION_SIMPLE)
4218
        av_log(s->avctx, AV_LOG_INFO, "warning, clipping %d dct coefficients to %d..%d\n", overflow, minlevel, maxlevel);
4219 4220
}

4221 4222
#endif //CONFIG_ENCODERS

4223 4224 4225 4226 4227
/**
 *
 * @param h is the normal height, this will be reduced automatically if needed for the last row
 */
void ff_draw_horiz_band(MpegEncContext *s, int y, int h){
M
Michael Niedermayer 已提交
4228
    if (s->avctx->draw_horiz_band) {
4229
        AVFrame *src;
M
Michael Niedermayer 已提交
4230
        int offset[4];
4231

4232 4233 4234 4235 4236 4237
        if(s->picture_structure != PICT_FRAME){
            h <<= 1;
            y <<= 1;
            if(s->first_field  && !(s->avctx->slice_flags&SLICE_FLAG_ALLOW_FIELD)) return;
        }

4238
        h= FFMIN(h, s->avctx->height - y);
4239

4240
        if(s->pict_type==B_TYPE || s->low_delay || (s->avctx->slice_flags&SLICE_FLAG_CODED_ORDER))
4241 4242 4243 4244 4245
            src= (AVFrame*)s->current_picture_ptr;
        else if(s->last_picture_ptr)
            src= (AVFrame*)s->last_picture_ptr;
        else
            return;
4246

M
Michael Niedermayer 已提交
4247
        if(s->pict_type==B_TYPE && s->picture_structure == PICT_FRAME && s->out_format != FMT_H264){
M
Michael Niedermayer 已提交
4248 4249 4250 4251 4252 4253
            offset[0]=
            offset[1]=
            offset[2]=
            offset[3]= 0;
        }else{
            offset[0]= y * s->linesize;;
4254
            offset[1]=
4255
            offset[2]= (y >> s->chroma_y_shift) * s->uvlinesize;
M
Michael Niedermayer 已提交
4256
            offset[3]= 0;
4257
        }
M
Michael Niedermayer 已提交
4258

M
cleanup  
Michael Niedermayer 已提交
4259 4260
        emms_c();

4261 4262
        s->avctx->draw_horiz_band(s->avctx, src, offset,
                                  y, s->picture_structure, h);
4263 4264 4265
    }
}

4266
void ff_init_block_index(MpegEncContext *s){ //FIXME maybe rename
D
Diego Biurrun 已提交
4267
    const int linesize= s->current_picture.linesize[0]; //not s->linesize as this would be wrong for field pics
4268
    const int uvlinesize= s->current_picture.linesize[1];
M
Michael Niedermayer 已提交
4269
    const int mb_size= 4 - s->avctx->lowres;
4270

4271 4272 4273 4274 4275 4276
    s->block_index[0]= s->b8_stride*(s->mb_y*2    ) - 2 + s->mb_x*2;
    s->block_index[1]= s->b8_stride*(s->mb_y*2    ) - 1 + s->mb_x*2;
    s->block_index[2]= s->b8_stride*(s->mb_y*2 + 1) - 2 + s->mb_x*2;
    s->block_index[3]= s->b8_stride*(s->mb_y*2 + 1) - 1 + s->mb_x*2;
    s->block_index[4]= s->mb_stride*(s->mb_y + 1)                + s->b8_stride*s->mb_height*2 + s->mb_x - 1;
    s->block_index[5]= s->mb_stride*(s->mb_y + s->mb_height + 2) + s->b8_stride*s->mb_height*2 + s->mb_x - 1;
4277 4278
    //block_index is not used by mpeg2, so it is not affected by chroma_format

M
Michael Niedermayer 已提交
4279 4280 4281
    s->dest[0] = s->current_picture.data[0] + ((s->mb_x - 1) << mb_size);
    s->dest[1] = s->current_picture.data[1] + ((s->mb_x - 1) << (mb_size - s->chroma_x_shift));
    s->dest[2] = s->current_picture.data[2] + ((s->mb_x - 1) << (mb_size - s->chroma_x_shift));
M
Michael Niedermayer 已提交
4282

4283 4284
    if(!(s->pict_type==B_TYPE && s->avctx->draw_horiz_band && s->picture_structure==PICT_FRAME))
    {
M
Michael Niedermayer 已提交
4285 4286 4287
        s->dest[0] += s->mb_y *   linesize << mb_size;
        s->dest[1] += s->mb_y * uvlinesize << (mb_size - s->chroma_y_shift);
        s->dest[2] += s->mb_y * uvlinesize << (mb_size - s->chroma_y_shift);
4288
    }
4289 4290
}

4291 4292
#ifdef CONFIG_ENCODERS

M
Michael Niedermayer 已提交
4293 4294 4295 4296 4297 4298 4299 4300 4301 4302 4303 4304 4305 4306 4307 4308 4309 4310 4311 4312 4313 4314 4315
static void get_vissual_weight(int16_t *weight, uint8_t *ptr, int stride){
    int x, y;
//FIXME optimize
    for(y=0; y<8; y++){
        for(x=0; x<8; x++){
            int x2, y2;
            int sum=0;
            int sqr=0;
            int count=0;

            for(y2= FFMAX(y-1, 0); y2 < FFMIN(8, y+2); y2++){
                for(x2= FFMAX(x-1, 0); x2 < FFMIN(8, x+2); x2++){
                    int v= ptr[x2 + y2*stride];
                    sum += v;
                    sqr += v*v;
                    count++;
                }
            }
            weight[x + 8*y]= (36*ff_sqrt(count*sqr - sum*sum)) / count;
        }
    }
}

4316
static av_always_inline void encode_mb_internal(MpegEncContext *s, int motion_x, int motion_y, int mb_block_height, int mb_block_count)
F
Fabrice Bellard 已提交
4317
{
4318 4319
    int16_t weight[8][64];
    DCTELEM orig[8][64];
4320 4321 4322
    const int mb_x= s->mb_x;
    const int mb_y= s->mb_y;
    int i;
4323
    int skip_dct[8];
4324
    int dct_offset   = s->linesize*8; //default for progressive frames
M
Michael Niedermayer 已提交
4325 4326
    uint8_t *ptr_y, *ptr_cb, *ptr_cr;
    int wrap_y, wrap_c;
4327

M
skiprd  
Michael Niedermayer 已提交
4328
    for(i=0; i<mb_block_count; i++) skip_dct[i]=s->skipdct;
4329

4330
    if(s->adaptive_quant){
4331 4332
        const int last_qp= s->qscale;
        const int mb_xy= mb_x + mb_y*s->mb_stride;
4333

4334 4335
        s->lambda= s->lambda_table[mb_xy];
        update_qscale(s);
4336

4337
        if(!(s->flags&CODEC_FLAG_QP_RD)){
4338
            s->qscale= s->current_picture_ptr->qscale_table[mb_xy];
4339
            s->dquant= s->qscale - last_qp;
4340

4341
            if(s->out_format==FMT_H263){
4342
                s->dquant= av_clip(s->dquant, -2, 2);
4343 4344

                if(s->codec_id==CODEC_ID_MPEG4){
4345 4346
                    if(!s->mb_intra){
                        if(s->pict_type == B_TYPE){
A
Aurelien Jacobs 已提交
4347
                            if(s->dquant&1 || s->mv_dir&MV_DIRECT)
4348 4349 4350 4351 4352
                                s->dquant= 0;
                        }
                        if(s->mv_type==MV_TYPE_8X8)
                            s->dquant=0;
                    }
4353
                }
4354 4355
            }
        }
M
cleanup  
Michael Niedermayer 已提交
4356
        ff_set_qscale(s, last_qp + s->dquant);
M
Michael Niedermayer 已提交
4357 4358
    }else if(s->flags&CODEC_FLAG_QP_RD)
        ff_set_qscale(s, s->qscale + s->dquant);
4359

M
Michael Niedermayer 已提交
4360 4361 4362
    wrap_y = s->linesize;
    wrap_c = s->uvlinesize;
    ptr_y = s->new_picture.data[0] + (mb_y * 16 * wrap_y) + mb_x * 16;
4363 4364
    ptr_cb = s->new_picture.data[1] + (mb_y * mb_block_height * wrap_c) + mb_x * 8;
    ptr_cr = s->new_picture.data[2] + (mb_y * mb_block_height * wrap_c) + mb_x * 8;
M
Michael Niedermayer 已提交
4365 4366

    if(mb_x*16+16 > s->width || mb_y*16+16 > s->height){
4367 4368 4369
        uint8_t *ebuf= s->edge_emu_buffer + 32;
        ff_emulated_edge_mc(ebuf            , ptr_y , wrap_y,16,16,mb_x*16,mb_y*16, s->width   , s->height);
        ptr_y= ebuf;
4370
        ff_emulated_edge_mc(ebuf+18*wrap_y  , ptr_cb, wrap_c, 8, mb_block_height, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
4371
        ptr_cb= ebuf+18*wrap_y;
4372
        ff_emulated_edge_mc(ebuf+18*wrap_y+8, ptr_cr, wrap_c, 8, mb_block_height, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
4373
        ptr_cr= ebuf+18*wrap_y+8;
M
Michael Niedermayer 已提交
4374 4375
    }

4376
    if (s->mb_intra) {
4377 4378
        if(s->flags&CODEC_FLAG_INTERLACED_DCT){
            int progressive_score, interlaced_score;
M
Michael Niedermayer 已提交
4379

4380
            s->interlaced_dct=0;
4381
            progressive_score= s->dsp.ildct_cmp[4](s, ptr_y           , NULL, wrap_y, 8)
M
Michael Niedermayer 已提交
4382
                              +s->dsp.ildct_cmp[4](s, ptr_y + wrap_y*8, NULL, wrap_y, 8) - 400;
4383 4384

            if(progressive_score > 0){
4385
                interlaced_score = s->dsp.ildct_cmp[4](s, ptr_y           , NULL, wrap_y*2, 8)
M
Michael Niedermayer 已提交
4386
                                  +s->dsp.ildct_cmp[4](s, ptr_y + wrap_y  , NULL, wrap_y*2, 8);
4387 4388
                if(progressive_score > interlaced_score){
                    s->interlaced_dct=1;
4389

4390 4391
                    dct_offset= wrap_y;
                    wrap_y<<=1;
4392 4393
                    if (s->chroma_format == CHROMA_422)
                        wrap_c<<=1;
4394 4395
                }
            }
4396
        }
4397

4398
        s->dsp.get_pixels(s->block[0], ptr_y                 , wrap_y);
M
Michael Niedermayer 已提交
4399 4400 4401
        s->dsp.get_pixels(s->block[1], ptr_y              + 8, wrap_y);
        s->dsp.get_pixels(s->block[2], ptr_y + dct_offset    , wrap_y);
        s->dsp.get_pixels(s->block[3], ptr_y + dct_offset + 8, wrap_y);
4402

M
Michael Niedermayer 已提交
4403 4404 4405 4406
        if(s->flags&CODEC_FLAG_GRAY){
            skip_dct[4]= 1;
            skip_dct[5]= 1;
        }else{
4407
            s->dsp.get_pixels(s->block[4], ptr_cb, wrap_c);
M
Michael Niedermayer 已提交
4408
            s->dsp.get_pixels(s->block[5], ptr_cr, wrap_c);
4409 4410 4411 4412
            if(!s->chroma_y_shift){ /* 422 */
                s->dsp.get_pixels(s->block[6], ptr_cb + (dct_offset>>1), wrap_c);
                s->dsp.get_pixels(s->block[7], ptr_cr + (dct_offset>>1), wrap_c);
            }
M
Michael Niedermayer 已提交
4413
        }
4414
    }else{
M
Michael Niedermayer 已提交
4415 4416
        op_pixels_func (*op_pix)[4];
        qpel_mc_func (*op_qpix)[16];
4417
        uint8_t *dest_y, *dest_cb, *dest_cr;
4418

4419 4420 4421
        dest_y  = s->dest[0];
        dest_cb = s->dest[1];
        dest_cr = s->dest[2];
4422

4423
        if ((!s->no_rounding) || s->pict_type==B_TYPE){
4424
            op_pix = s->dsp.put_pixels_tab;
4425
            op_qpix= s->dsp.put_qpel_pixels_tab;
M
Michael Niedermayer 已提交
4426
        }else{
4427 4428
            op_pix = s->dsp.put_no_rnd_pixels_tab;
            op_qpix= s->dsp.put_no_rnd_qpel_pixels_tab;
4429 4430 4431
        }

        if (s->mv_dir & MV_DIR_FORWARD) {
M
cleanup  
Michael Niedermayer 已提交
4432
            MPV_motion(s, dest_y, dest_cb, dest_cr, 0, s->last_picture.data, op_pix, op_qpix);
4433 4434
            op_pix = s->dsp.avg_pixels_tab;
            op_qpix= s->dsp.avg_qpel_pixels_tab;
4435 4436
        }
        if (s->mv_dir & MV_DIR_BACKWARD) {
M
cleanup  
Michael Niedermayer 已提交
4437
            MPV_motion(s, dest_y, dest_cb, dest_cr, 1, s->next_picture.data, op_pix, op_qpix);
4438
        }
4439

4440 4441
        if(s->flags&CODEC_FLAG_INTERLACED_DCT){
            int progressive_score, interlaced_score;
4442 4443

            s->interlaced_dct=0;
4444
            progressive_score= s->dsp.ildct_cmp[0](s, dest_y           , ptr_y           , wrap_y, 8)
4445
                              +s->dsp.ildct_cmp[0](s, dest_y + wrap_y*8, ptr_y + wrap_y*8, wrap_y, 8) - 400;
4446

4447 4448 4449
            if(s->avctx->ildct_cmp == FF_CMP_VSSE) progressive_score -= 400;

            if(progressive_score>0){
4450
                interlaced_score = s->dsp.ildct_cmp[0](s, dest_y           , ptr_y           , wrap_y*2, 8)
4451
                                  +s->dsp.ildct_cmp[0](s, dest_y + wrap_y  , ptr_y + wrap_y  , wrap_y*2, 8);
4452

4453 4454
                if(progressive_score > interlaced_score){
                    s->interlaced_dct=1;
4455

4456 4457
                    dct_offset= wrap_y;
                    wrap_y<<=1;
4458 4459
                    if (s->chroma_format == CHROMA_422)
                        wrap_c<<=1;
4460 4461
                }
            }
4462
        }
4463

4464
        s->dsp.diff_pixels(s->block[0], ptr_y                 , dest_y                 , wrap_y);
4465 4466 4467
        s->dsp.diff_pixels(s->block[1], ptr_y              + 8, dest_y              + 8, wrap_y);
        s->dsp.diff_pixels(s->block[2], ptr_y + dct_offset    , dest_y + dct_offset    , wrap_y);
        s->dsp.diff_pixels(s->block[3], ptr_y + dct_offset + 8, dest_y + dct_offset + 8, wrap_y);
4468

M
Michael Niedermayer 已提交
4469 4470 4471 4472
        if(s->flags&CODEC_FLAG_GRAY){
            skip_dct[4]= 1;
            skip_dct[5]= 1;
        }else{
4473 4474
            s->dsp.diff_pixels(s->block[4], ptr_cb, dest_cb, wrap_c);
            s->dsp.diff_pixels(s->block[5], ptr_cr, dest_cr, wrap_c);
4475 4476 4477 4478
            if(!s->chroma_y_shift){ /* 422 */
                s->dsp.diff_pixels(s->block[6], ptr_cb + (dct_offset>>1), dest_cb + (dct_offset>>1), wrap_c);
                s->dsp.diff_pixels(s->block[7], ptr_cr + (dct_offset>>1), dest_cr + (dct_offset>>1), wrap_c);
            }
M
Michael Niedermayer 已提交
4479
        }
4480
        /* pre quantization */
4481
        if(s->current_picture.mc_mb_var[s->mb_stride*mb_y+ mb_x]<2*s->qscale*s->qscale){
4482
            //FIXME optimize
4483
            if(s->dsp.sad[1](NULL, ptr_y               , dest_y               , wrap_y, 8) < 20*s->qscale) skip_dct[0]= 1;
M
Michael Niedermayer 已提交
4484 4485 4486 4487 4488
            if(s->dsp.sad[1](NULL, ptr_y            + 8, dest_y            + 8, wrap_y, 8) < 20*s->qscale) skip_dct[1]= 1;
            if(s->dsp.sad[1](NULL, ptr_y +dct_offset   , dest_y +dct_offset   , wrap_y, 8) < 20*s->qscale) skip_dct[2]= 1;
            if(s->dsp.sad[1](NULL, ptr_y +dct_offset+ 8, dest_y +dct_offset+ 8, wrap_y, 8) < 20*s->qscale) skip_dct[3]= 1;
            if(s->dsp.sad[1](NULL, ptr_cb              , dest_cb              , wrap_c, 8) < 20*s->qscale) skip_dct[4]= 1;
            if(s->dsp.sad[1](NULL, ptr_cr              , dest_cr              , wrap_c, 8) < 20*s->qscale) skip_dct[5]= 1;
4489 4490 4491 4492
            if(!s->chroma_y_shift){ /* 422 */
                if(s->dsp.sad[1](NULL, ptr_cb +(dct_offset>>1), dest_cb +(dct_offset>>1), wrap_c, 8) < 20*s->qscale) skip_dct[6]= 1;
                if(s->dsp.sad[1](NULL, ptr_cr +(dct_offset>>1), dest_cr +(dct_offset>>1), wrap_c, 8) < 20*s->qscale) skip_dct[7]= 1;
            }
4493
        }
M
Michael Niedermayer 已提交
4494
    }
4495

M
Michael Niedermayer 已提交
4496 4497 4498 4499 4500 4501 4502
    if(s->avctx->quantizer_noise_shaping){
        if(!skip_dct[0]) get_vissual_weight(weight[0], ptr_y                 , wrap_y);
        if(!skip_dct[1]) get_vissual_weight(weight[1], ptr_y              + 8, wrap_y);
        if(!skip_dct[2]) get_vissual_weight(weight[2], ptr_y + dct_offset    , wrap_y);
        if(!skip_dct[3]) get_vissual_weight(weight[3], ptr_y + dct_offset + 8, wrap_y);
        if(!skip_dct[4]) get_vissual_weight(weight[4], ptr_cb                , wrap_c);
        if(!skip_dct[5]) get_vissual_weight(weight[5], ptr_cr                , wrap_c);
4503 4504 4505 4506 4507
        if(!s->chroma_y_shift){ /* 422 */
            if(!skip_dct[6]) get_vissual_weight(weight[6], ptr_cb + (dct_offset>>1), wrap_c);
            if(!skip_dct[7]) get_vissual_weight(weight[7], ptr_cr + (dct_offset>>1), wrap_c);
        }
        memcpy(orig[0], s->block[0], sizeof(DCTELEM)*64*mb_block_count);
4508
    }
4509

4510
    /* DCT & quantize */
M
Michael Niedermayer 已提交
4511 4512
    assert(s->out_format!=FMT_MJPEG || s->qscale==8);
    {
4513
        for(i=0;i<mb_block_count;i++) {
4514 4515
            if(!skip_dct[i]){
                int overflow;
4516
                s->block_last_index[i] = s->dct_quantize(s, s->block[i], i, s->qscale, &overflow);
4517
            // FIXME we could decide to change to quantizer instead of clipping
4518 4519
            // JS: I don't think that would be a good idea it could lower quality instead
            //     of improve it. Just INTRADC clipping deserves changes in quantizer
4520 4521 4522
                if (overflow) clip_coeffs(s, s->block[i], s->block_last_index[i]);
            }else
                s->block_last_index[i]= -1;
4523
        }
M
Michael Niedermayer 已提交
4524
        if(s->avctx->quantizer_noise_shaping){
4525
            for(i=0;i<mb_block_count;i++) {
M
Michael Niedermayer 已提交
4526 4527 4528 4529 4530
                if(!skip_dct[i]){
                    s->block_last_index[i] = dct_quantize_refine(s, s->block[i], weight[i], orig[i], i, s->qscale);
                }
            }
        }
4531

4532 4533
        if(s->luma_elim_threshold && !s->mb_intra)
            for(i=0; i<4; i++)
4534
                dct_single_coeff_elimination(s, i, s->luma_elim_threshold);
4535
        if(s->chroma_elim_threshold && !s->mb_intra)
4536
            for(i=4; i<mb_block_count; i++)
4537
                dct_single_coeff_elimination(s, i, s->chroma_elim_threshold);
4538 4539

        if(s->flags & CODEC_FLAG_CBP_RD){
4540
            for(i=0;i<mb_block_count;i++) {
4541 4542 4543 4544
                if(s->block_last_index[i] == -1)
                    s->coded_score[i]= INT_MAX/256;
            }
        }
4545 4546
    }

M
Michael Niedermayer 已提交
4547 4548 4549 4550
    if((s->flags&CODEC_FLAG_GRAY) && s->mb_intra){
        s->block_last_index[4]=
        s->block_last_index[5]= 0;
        s->block[4][0]=
M
bugs  
Michael Niedermayer 已提交
4551
        s->block[5][0]= (1024 + s->c_dc_scale/2)/ s->c_dc_scale;
M
Michael Niedermayer 已提交
4552 4553
    }

M
Michael Niedermayer 已提交
4554 4555
    //non c quantize code returns incorrect block_last_index FIXME
    if(s->alternate_scan && s->dct_quantize != dct_quantize_c){
4556
        for(i=0; i<mb_block_count; i++){
M
Michael Niedermayer 已提交
4557 4558 4559 4560 4561 4562 4563 4564 4565 4566
            int j;
            if(s->block_last_index[i]>0){
                for(j=63; j>0; j--){
                    if(s->block[i][ s->intra_scantable.permutated[j] ]) break;
                }
                s->block_last_index[i]= j;
            }
        }
    }

4567
    /* huffman encode */
M
Michael Niedermayer 已提交
4568 4569
    switch(s->codec_id){ //FIXME funct ptr could be slightly faster
    case CODEC_ID_MPEG1VIDEO:
M
Michael Niedermayer 已提交
4570
    case CODEC_ID_MPEG2VIDEO:
M
Michael Niedermayer 已提交
4571 4572 4573 4574 4575 4576
        mpeg1_encode_mb(s, s->block, motion_x, motion_y); break;
    case CODEC_ID_MPEG4:
        mpeg4_encode_mb(s, s->block, motion_x, motion_y); break;
    case CODEC_ID_MSMPEG4V2:
    case CODEC_ID_MSMPEG4V3:
    case CODEC_ID_WMV1:
4577
        if (ENABLE_MSMPEG4_ENCODER)
A
Aurelien Jacobs 已提交
4578 4579
            msmpeg4_encode_mb(s, s->block, motion_x, motion_y);
        break;
M
Michael Niedermayer 已提交
4580
    case CODEC_ID_WMV2:
4581
        if (ENABLE_WMV2_ENCODER)
A
Aurelien Jacobs 已提交
4582 4583
            ff_wmv2_encode_mb(s, s->block, motion_x, motion_y);
        break;
4584
    case CODEC_ID_H261:
4585
        if (ENABLE_H261_ENCODER)
A
Aurelien Jacobs 已提交
4586 4587
            ff_h261_encode_mb(s, s->block, motion_x, motion_y);
        break;
M
Michael Niedermayer 已提交
4588 4589
    case CODEC_ID_H263:
    case CODEC_ID_H263P:
4590
    case CODEC_ID_FLV1:
M
Michael Niedermayer 已提交
4591
    case CODEC_ID_RV10:
M
Michael Niedermayer 已提交
4592
    case CODEC_ID_RV20:
M
Michael Niedermayer 已提交
4593
        h263_encode_mb(s, s->block, motion_x, motion_y); break;
M
Michael Niedermayer 已提交
4594
    case CODEC_ID_MJPEG:
4595
        if (ENABLE_MJPEG_ENCODER)
A
Aurelien Jacobs 已提交
4596 4597
            mjpeg_encode_mb(s, s->block);
        break;
M
Michael Niedermayer 已提交
4598 4599
    default:
        assert(0);
4600 4601 4602
    }
}

4603
static av_always_inline void encode_mb(MpegEncContext *s, int motion_x, int motion_y)
4604 4605 4606 4607 4608
{
    if (s->chroma_format == CHROMA_420) encode_mb_internal(s, motion_x, motion_y,  8, 6);
    else                                encode_mb_internal(s, motion_x, motion_y, 16, 8);
}

4609 4610
#endif //CONFIG_ENCODERS

M
Michael Niedermayer 已提交
4611 4612 4613
void ff_mpeg_flush(AVCodecContext *avctx){
    int i;
    MpegEncContext *s = avctx->priv_data;
4614 4615

    if(s==NULL || s->picture==NULL)
4616
        return;
4617

M
Michael Niedermayer 已提交
4618 4619 4620 4621 4622
    for(i=0; i<MAX_PICTURE_COUNT; i++){
       if(s->picture[i].data[0] && (   s->picture[i].type == FF_BUFFER_TYPE_INTERNAL
                                    || s->picture[i].type == FF_BUFFER_TYPE_USER))
        avctx->release_buffer(avctx, (AVFrame*)&s->picture[i]);
    }
M
Michael Niedermayer 已提交
4623
    s->current_picture_ptr = s->last_picture_ptr = s->next_picture_ptr = NULL;
4624

M
Michael Niedermayer 已提交
4625
    s->mb_x= s->mb_y= 0;
4626

4627 4628 4629 4630 4631 4632
    s->parse_context.state= -1;
    s->parse_context.frame_start_found= 0;
    s->parse_context.overread= 0;
    s->parse_context.overread_index= 0;
    s->parse_context.index= 0;
    s->parse_context.last_index= 0;
4633
    s->bitstream_buffer_size=0;
4634
    s->pp_time=0;
M
Michael Niedermayer 已提交
4635 4636
}

4637
#ifdef CONFIG_ENCODERS
4638
void ff_copy_bits(PutBitContext *pb, uint8_t *src, int length)
4639
{
4640
    const uint16_t *srcw= (uint16_t*)src;
4641
    int words= length>>4;
4642 4643 4644
    int bits= length&15;
    int i;

4645
    if(length==0) return;
4646

4647 4648 4649 4650
    if(words < 16){
        for(i=0; i<words; i++) put_bits(pb, 16, be2me_16(srcw[i]));
    }else if(put_bits_count(pb)&7){
        for(i=0; i<words; i++) put_bits(pb, 16, be2me_16(srcw[i]));
4651
    }else{
4652 4653
        for(i=0; put_bits_count(pb)&31; i++)
            put_bits(pb, 8, src[i]);
4654
        flush_put_bits(pb);
4655 4656
        memcpy(pbBufPtr(pb), src+i, 2*words-i);
        skip_put_bytes(pb, 2*words-i);
4657
    }
4658

4659
    put_bits(pb, bits, be2me_16(srcw[words])>>(16-bits));
4660 4661
}

4662
static inline void copy_context_before_encode(MpegEncContext *d, MpegEncContext *s, int type){
4663 4664 4665 4666 4667
    int i;

    memcpy(d->last_mv, s->last_mv, 2*2*2*sizeof(int)); //FIXME is memcpy faster then a loop?

    /* mpeg1 */
4668
    d->mb_skip_run= s->mb_skip_run;
4669 4670
    for(i=0; i<3; i++)
        d->last_dc[i]= s->last_dc[i];
4671

4672 4673 4674 4675 4676
    /* statistics */
    d->mv_bits= s->mv_bits;
    d->i_tex_bits= s->i_tex_bits;
    d->p_tex_bits= s->p_tex_bits;
    d->i_count= s->i_count;
4677 4678
    d->f_count= s->f_count;
    d->b_count= s->b_count;
4679 4680
    d->skip_count= s->skip_count;
    d->misc_bits= s->misc_bits;
4681
    d->last_bits= 0;
4682

4683
    d->mb_skipped= 0;
M
Michael Niedermayer 已提交
4684
    d->qscale= s->qscale;
4685
    d->dquant= s->dquant;
4686 4687
}

4688
static inline void copy_context_after_encode(MpegEncContext *d, MpegEncContext *s, int type){
4689 4690
    int i;

4691
    memcpy(d->mv, s->mv, 2*4*2*sizeof(int));
4692
    memcpy(d->last_mv, s->last_mv, 2*2*2*sizeof(int)); //FIXME is memcpy faster then a loop?
4693

4694
    /* mpeg1 */
4695
    d->mb_skip_run= s->mb_skip_run;
4696 4697
    for(i=0; i<3; i++)
        d->last_dc[i]= s->last_dc[i];
4698

4699 4700 4701 4702 4703
    /* statistics */
    d->mv_bits= s->mv_bits;
    d->i_tex_bits= s->i_tex_bits;
    d->p_tex_bits= s->p_tex_bits;
    d->i_count= s->i_count;
4704 4705
    d->f_count= s->f_count;
    d->b_count= s->b_count;
4706 4707 4708 4709
    d->skip_count= s->skip_count;
    d->misc_bits= s->misc_bits;

    d->mb_intra= s->mb_intra;
4710
    d->mb_skipped= s->mb_skipped;
4711 4712 4713
    d->mv_type= s->mv_type;
    d->mv_dir= s->mv_dir;
    d->pb= s->pb;
4714 4715 4716 4717
    if(s->data_partitioning){
        d->pb2= s->pb2;
        d->tex_pb= s->tex_pb;
    }
4718
    d->block= s->block;
4719
    for(i=0; i<8; i++)
4720
        d->block_last_index[i]= s->block_last_index[i];
4721
    d->interlaced_dct= s->interlaced_dct;
M
Michael Niedermayer 已提交
4722
    d->qscale= s->qscale;
4723 4724
}

4725
static inline void encode_mb_hq(MpegEncContext *s, MpegEncContext *backup, MpegEncContext *best, int type,
4726 4727 4728
                           PutBitContext pb[2], PutBitContext pb2[2], PutBitContext tex_pb[2],
                           int *dmin, int *next_block, int motion_x, int motion_y)
{
4729 4730
    int score;
    uint8_t *dest_backup[3];
4731

4732 4733 4734 4735 4736 4737 4738 4739
    copy_context_before_encode(s, backup, type);

    s->block= s->blocks[*next_block];
    s->pb= pb[*next_block];
    if(s->data_partitioning){
        s->pb2   = pb2   [*next_block];
        s->tex_pb= tex_pb[*next_block];
    }
4740

4741 4742
    if(*next_block){
        memcpy(dest_backup, s->dest, sizeof(s->dest));
4743 4744 4745 4746
        s->dest[0] = s->rd_scratchpad;
        s->dest[1] = s->rd_scratchpad + 16*s->linesize;
        s->dest[2] = s->rd_scratchpad + 16*s->linesize + 8;
        assert(s->linesize >= 32); //FIXME
4747
    }
4748 4749

    encode_mb(s, motion_x, motion_y);
4750

4751
    score= put_bits_count(&s->pb);
4752
    if(s->data_partitioning){
4753 4754
        score+= put_bits_count(&s->pb2);
        score+= put_bits_count(&s->tex_pb);
4755
    }
4756

4757 4758
    if(s->avctx->mb_decision == FF_MB_DECISION_RD){
        MPV_decode_mb(s, s->block);
4759

4760 4761
        score *= s->lambda2;
        score += sse_mb(s) << FF_LAMBDA_SHIFT;
4762
    }
4763

4764 4765 4766 4767 4768 4769
    if(*next_block){
        memcpy(s->dest, dest_backup, sizeof(s->dest));
    }

    if(score<*dmin){
        *dmin= score;
4770 4771 4772 4773 4774
        *next_block^=1;

        copy_context_after_encode(best, s, type);
    }
}
4775

4776
static int sse(MpegEncContext *s, uint8_t *src1, uint8_t *src2, int w, int h, int stride){
M
Måns Rullgård 已提交
4777
    uint32_t *sq = ff_squareTbl + 256;
4778 4779
    int acc=0;
    int x,y;
4780 4781

    if(w==16 && h==16)
M
Michael Niedermayer 已提交
4782
        return s->dsp.sse[0](NULL, src1, src2, stride, 16);
M
Michael Niedermayer 已提交
4783
    else if(w==8 && h==8)
M
Michael Niedermayer 已提交
4784
        return s->dsp.sse[1](NULL, src1, src2, stride, 8);
4785

4786 4787 4788
    for(y=0; y<h; y++){
        for(x=0; x<w; x++){
            acc+= sq[src1[x + y*stride] - src2[x + y*stride]];
4789
        }
4790
    }
4791

M
Michael Niedermayer 已提交
4792
    assert(acc>=0);
4793

4794 4795
    return acc;
}
4796

4797 4798 4799 4800 4801 4802 4803 4804
static int sse_mb(MpegEncContext *s){
    int w= 16;
    int h= 16;

    if(s->mb_x*16 + 16 > s->width ) w= s->width - s->mb_x*16;
    if(s->mb_y*16 + 16 > s->height) h= s->height- s->mb_y*16;

    if(w==16 && h==16)
4805
      if(s->avctx->mb_cmp == FF_CMP_NSSE){
M
Michael Niedermayer 已提交
4806 4807 4808
        return  s->dsp.nsse[0](s, s->new_picture.data[0] + s->mb_x*16 + s->mb_y*s->linesize*16, s->dest[0], s->linesize, 16)
               +s->dsp.nsse[1](s, s->new_picture.data[1] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,s->dest[1], s->uvlinesize, 8)
               +s->dsp.nsse[1](s, s->new_picture.data[2] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,s->dest[2], s->uvlinesize, 8);
4809
      }else{
M
Michael Niedermayer 已提交
4810 4811 4812
        return  s->dsp.sse[0](NULL, s->new_picture.data[0] + s->mb_x*16 + s->mb_y*s->linesize*16, s->dest[0], s->linesize, 16)
               +s->dsp.sse[1](NULL, s->new_picture.data[1] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,s->dest[1], s->uvlinesize, 8)
               +s->dsp.sse[1](NULL, s->new_picture.data[2] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,s->dest[2], s->uvlinesize, 8);
4813
      }
4814 4815 4816 4817 4818 4819
    else
        return  sse(s, s->new_picture.data[0] + s->mb_x*16 + s->mb_y*s->linesize*16, s->dest[0], w, h, s->linesize)
               +sse(s, s->new_picture.data[1] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,s->dest[1], w>>1, h>>1, s->uvlinesize)
               +sse(s, s->new_picture.data[2] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,s->dest[2], w>>1, h>>1, s->uvlinesize);
}

4820 4821 4822
static int pre_estimate_motion_thread(AVCodecContext *c, void *arg){
    MpegEncContext *s= arg;

4823

4824 4825 4826 4827 4828 4829 4830 4831 4832
    s->me.pre_pass=1;
    s->me.dia_size= s->avctx->pre_dia_size;
    s->first_slice_line=1;
    for(s->mb_y= s->end_mb_y-1; s->mb_y >= s->start_mb_y; s->mb_y--) {
        for(s->mb_x=s->mb_width-1; s->mb_x >=0 ;s->mb_x--) {
            ff_pre_estimate_p_frame_motion(s, s->mb_x, s->mb_y);
        }
        s->first_slice_line=0;
    }
4833

4834
    s->me.pre_pass=0;
4835

4836 4837 4838 4839 4840 4841
    return 0;
}

static int estimate_motion_thread(AVCodecContext *c, void *arg){
    MpegEncContext *s= arg;

4842 4843
    ff_check_alignment();

4844 4845 4846 4847 4848 4849 4850 4851 4852 4853
    s->me.dia_size= s->avctx->dia_size;
    s->first_slice_line=1;
    for(s->mb_y= s->start_mb_y; s->mb_y < s->end_mb_y; s->mb_y++) {
        s->mb_x=0; //for block init below
        ff_init_block_index(s);
        for(s->mb_x=0; s->mb_x < s->mb_width; s->mb_x++) {
            s->block_index[0]+=2;
            s->block_index[1]+=2;
            s->block_index[2]+=2;
            s->block_index[3]+=2;
4854

4855 4856 4857 4858 4859 4860 4861 4862 4863 4864 4865
            /* compute motion vector & mb_type and store in context */
            if(s->pict_type==B_TYPE)
                ff_estimate_b_frame_motion(s, s->mb_x, s->mb_y);
            else
                ff_estimate_p_frame_motion(s, s->mb_x, s->mb_y);
        }
        s->first_slice_line=0;
    }
    return 0;
}

4866 4867 4868 4869
static int mb_var_thread(AVCodecContext *c, void *arg){
    MpegEncContext *s= arg;
    int mb_x, mb_y;

4870 4871
    ff_check_alignment();

4872 4873 4874 4875 4876 4877 4878
    for(mb_y=s->start_mb_y; mb_y < s->end_mb_y; mb_y++) {
        for(mb_x=0; mb_x < s->mb_width; mb_x++) {
            int xx = mb_x * 16;
            int yy = mb_y * 16;
            uint8_t *pix = s->new_picture.data[0] + (yy * s->linesize) + xx;
            int varc;
            int sum = s->dsp.pix_sum(pix, s->linesize);
4879

4880 4881 4882 4883
            varc = (s->dsp.pix_norm1(pix, s->linesize) - (((unsigned)(sum*sum))>>8) + 500 + 128)>>8;

            s->current_picture.mb_var [s->mb_stride * mb_y + mb_x] = varc;
            s->current_picture.mb_mean[s->mb_stride * mb_y + mb_x] = (sum+128)>>8;
4884
            s->me.mb_var_sum_temp    += varc;
4885 4886
        }
    }
4887
    return 0;
4888 4889
}

4890 4891 4892 4893 4894
static void write_slice_end(MpegEncContext *s){
    if(s->codec_id==CODEC_ID_MPEG4){
        if(s->partitioned_frame){
            ff_mpeg4_merge_partitions(s);
        }
4895

4896
        ff_mpeg4_stuffing(&s->pb);
4897
    }else if(ENABLE_MJPEG_ENCODER && s->out_format == FMT_MJPEG){
4898 4899 4900 4901 4902
        ff_mjpeg_stuffing(&s->pb);
    }

    align_put_bits(&s->pb);
    flush_put_bits(&s->pb);
4903

4904 4905
    if((s->flags&CODEC_FLAG_PASS1) && !s->partitioned_frame)
        s->misc_bits+= get_bits_diff(s);
4906 4907 4908 4909
}

static int encode_thread(AVCodecContext *c, void *arg){
    MpegEncContext *s= arg;
M
Michael Niedermayer 已提交
4910
    int mb_x, mb_y, pdif = 0;
M
Michael Niedermayer 已提交
4911
    int i, j;
4912
    MpegEncContext best_s, backup_s;
4913 4914 4915
    uint8_t bit_buf[2][MAX_MB_BYTES];
    uint8_t bit_buf2[2][MAX_MB_BYTES];
    uint8_t bit_buf_tex[2][MAX_MB_BYTES];
4916
    PutBitContext pb[2], pb2[2], tex_pb[2];
4917
//printf("%d->%d\n", s->resync_mb_y, s->end_mb_y);
4918

4919 4920
    ff_check_alignment();

4921
    for(i=0; i<2; i++){
4922 4923 4924
        init_put_bits(&pb    [i], bit_buf    [i], MAX_MB_BYTES);
        init_put_bits(&pb2   [i], bit_buf2   [i], MAX_MB_BYTES);
        init_put_bits(&tex_pb[i], bit_buf_tex[i], MAX_MB_BYTES);
4925
    }
F
Fabrice Bellard 已提交
4926

4927 4928 4929 4930 4931 4932 4933 4934 4935
    s->last_bits= put_bits_count(&s->pb);
    s->mv_bits=0;
    s->misc_bits=0;
    s->i_tex_bits=0;
    s->p_tex_bits=0;
    s->i_count=0;
    s->f_count=0;
    s->b_count=0;
    s->skip_count=0;
4936

4937 4938 4939
    for(i=0; i<3; i++){
        /* init last dc values */
        /* note: quant matrix value (8) is implied here */
4940
        s->last_dc[i] = 128 << s->intra_dc_precision;
4941

4942
        s->current_picture.error[i] = 0;
M
Michael Niedermayer 已提交
4943
    }
4944 4945
    s->mb_skip_run = 0;
    memset(s->last_mv, 0, sizeof(s->last_mv));
4946

4947
    s->last_mv_dir = 0;
M
Michael Niedermayer 已提交
4948

4949 4950 4951 4952 4953 4954 4955 4956 4957 4958
    switch(s->codec_id){
    case CODEC_ID_H263:
    case CODEC_ID_H263P:
    case CODEC_ID_FLV1:
        s->gob_index = ff_h263_get_gob_height(s);
        break;
    case CODEC_ID_MPEG4:
        if(s->partitioned_frame)
            ff_mpeg4_init_partitions(s);
        break;
4959
    }
4960

4961
    s->resync_mb_x=0;
4962
    s->resync_mb_y=0;
4963 4964 4965 4966 4967 4968
    s->first_slice_line = 1;
    s->ptr_lastgob = s->pb.buf;
    for(mb_y= s->start_mb_y; mb_y < s->end_mb_y; mb_y++) {
//    printf("row %d at %X\n", s->mb_y, (int)s);
        s->mb_x=0;
        s->mb_y= mb_y;
M
cleanup  
Michael Niedermayer 已提交
4969

4970 4971
        ff_set_qscale(s, s->qscale);
        ff_init_block_index(s);
4972

4973
        for(mb_x=0; mb_x < s->mb_width; mb_x++) {
4974
            int xy= mb_y*s->mb_stride + mb_x; // removed const, H261 needs to adjust this
4975 4976 4977 4978
            int mb_type= s->mb_type[xy];
//            int d;
            int dmin= INT_MAX;
            int dir;
M
Michael Niedermayer 已提交
4979

4980 4981 4982 4983 4984 4985 4986 4987 4988 4989 4990 4991
            if(s->pb.buf_end - s->pb.buf - (put_bits_count(&s->pb)>>3) < MAX_MB_BYTES){
                av_log(s->avctx, AV_LOG_ERROR, "encoded frame too large\n");
                return -1;
            }
            if(s->data_partitioning){
                if(   s->pb2   .buf_end - s->pb2   .buf - (put_bits_count(&s->    pb2)>>3) < MAX_MB_BYTES
                   || s->tex_pb.buf_end - s->tex_pb.buf - (put_bits_count(&s->tex_pb )>>3) < MAX_MB_BYTES){
                    av_log(s->avctx, AV_LOG_ERROR, "encoded frame too large\n");
                    return -1;
                }
            }

4992
            s->mb_x = mb_x;
4993
            s->mb_y = mb_y;  // moved into loop, can get changed by H.261
4994 4995
            ff_update_block_index(s);

4996
            if(ENABLE_H261_ENCODER && s->codec_id == CODEC_ID_H261){
4997 4998
                ff_h261_reorder_mb_index(s);
                xy= s->mb_y*s->mb_stride + s->mb_x;
M
Maarten Daniels 已提交
4999
                mb_type= s->mb_type[xy];
5000 5001
            }

5002 5003 5004
            /* write gob / video packet header  */
            if(s->rtp_mode){
                int current_packet_size, is_gob_start;
5005

5006
                current_packet_size= ((put_bits_count(&s->pb)+7)>>3) - (s->ptr_lastgob - s->pb.buf);
5007 5008 5009

                is_gob_start= s->avctx->rtp_payload_size && current_packet_size >= s->avctx->rtp_payload_size && mb_y + mb_x>0;

5010
                if(s->start_mb_y == mb_y && mb_y > 0 && mb_x==0) is_gob_start=1;
5011

5012 5013 5014 5015 5016 5017 5018 5019 5020 5021 5022
                switch(s->codec_id){
                case CODEC_ID_H263:
                case CODEC_ID_H263P:
                    if(!s->h263_slice_structured)
                        if(s->mb_x || s->mb_y%s->gob_index) is_gob_start=0;
                    break;
                case CODEC_ID_MPEG2VIDEO:
                    if(s->mb_x==0 && s->mb_y!=0) is_gob_start=1;
                case CODEC_ID_MPEG1VIDEO:
                    if(s->mb_skip_run) is_gob_start=0;
                    break;
M
Michael Niedermayer 已提交
5023
                }
5024

5025 5026 5027
                if(is_gob_start){
                    if(s->start_mb_y != mb_y || mb_x!=0){
                        write_slice_end(s);
5028

5029 5030
                        if(s->codec_id==CODEC_ID_MPEG4 && s->partitioned_frame){
                            ff_mpeg4_init_partitions(s);
M
Michael Niedermayer 已提交
5031 5032
                        }
                    }
5033

5034
                    assert((put_bits_count(&s->pb)&7) == 0);
M
Michael Niedermayer 已提交
5035
                    current_packet_size= pbBufPtr(&s->pb) - s->ptr_lastgob;
5036

5037
                    if(s->avctx->error_rate && s->resync_mb_x + s->resync_mb_y > 0){
5038
                        int r= put_bits_count(&s->pb)/8 + s->picture_number + 16 + s->mb_x + s->mb_y;
5039 5040 5041 5042 5043 5044 5045 5046 5047
                        int d= 100 / s->avctx->error_rate;
                        if(r % d == 0){
                            current_packet_size=0;
#ifndef ALT_BITSTREAM_WRITER
                            s->pb.buf_ptr= s->ptr_lastgob;
#endif
                            assert(pbBufPtr(&s->pb) == s->ptr_lastgob);
                        }
                    }
5048 5049 5050 5051 5052

                    if (s->avctx->rtp_callback){
                        int number_mb = (mb_y - s->resync_mb_y)*s->mb_width + mb_x - s->resync_mb_x;
                        s->avctx->rtp_callback(s->avctx, s->ptr_lastgob, current_packet_size, number_mb);
                    }
5053

M
Michael Niedermayer 已提交
5054 5055
                    switch(s->codec_id){
                    case CODEC_ID_MPEG4:
5056 5057
                        ff_mpeg4_encode_video_packet_header(s);
                        ff_mpeg4_clean_buffers(s);
M
Michael Niedermayer 已提交
5058 5059 5060
                    break;
                    case CODEC_ID_MPEG1VIDEO:
                    case CODEC_ID_MPEG2VIDEO:
5061 5062
                        ff_mpeg1_encode_slice_header(s);
                        ff_mpeg1_clean_buffers(s);
M
Michael Niedermayer 已提交
5063 5064 5065
                    break;
                    case CODEC_ID_H263:
                    case CODEC_ID_H263P:
5066
                        h263_encode_gob_header(s, mb_y);
M
Michael Niedermayer 已提交
5067
                    break;
M
Michael Niedermayer 已提交
5068 5069
                    }

M
Michael Niedermayer 已提交
5070
                    if(s->flags&CODEC_FLAG_PASS1){
5071
                        int bits= put_bits_count(&s->pb);
M
Michael Niedermayer 已提交
5072 5073 5074
                        s->misc_bits+= bits - s->last_bits;
                        s->last_bits= bits;
                    }
5075

M
Michael Niedermayer 已提交
5076
                    s->ptr_lastgob += current_packet_size;
5077 5078 5079 5080
                    s->first_slice_line=1;
                    s->resync_mb_x=mb_x;
                    s->resync_mb_y=mb_y;
                }
5081
            }
5082

5083 5084
            if(  (s->resync_mb_x   == s->mb_x)
               && s->resync_mb_y+1 == s->mb_y){
5085
                s->first_slice_line=0;
5086 5087
            }

5088
            s->mb_skipped=0;
5089
            s->dquant=0; //only for QP_RD
5090

M
Michael Niedermayer 已提交
5091
            if(mb_type & (mb_type-1) || (s->flags & CODEC_FLAG_QP_RD)){ // more than 1 MB type possible or CODEC_FLAG_QP_RD
5092
                int next_block=0;
5093
                int pb_bits_count, pb2_bits_count, tex_pb_bits_count;
5094 5095

                copy_context_before_encode(&backup_s, s, -1);
5096 5097
                backup_s.pb= s->pb;
                best_s.data_partitioning= s->data_partitioning;
5098
                best_s.partitioned_frame= s->partitioned_frame;
5099 5100 5101 5102
                if(s->data_partitioning){
                    backup_s.pb2= s->pb2;
                    backup_s.tex_pb= s->tex_pb;
                }
5103

M
Michael Niedermayer 已提交
5104
                if(mb_type&CANDIDATE_MB_TYPE_INTER){
5105
                    s->mv_dir = MV_DIR_FORWARD;
M
Michael Niedermayer 已提交
5106
                    s->mv_type = MV_TYPE_16X16;
5107
                    s->mb_intra= 0;
5108 5109
                    s->mv[0][0][0] = s->p_mv_table[xy][0];
                    s->mv[0][0][1] = s->p_mv_table[xy][1];
5110
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_INTER, pb, pb2, tex_pb,
5111
                                 &dmin, &next_block, s->mv[0][0][0], s->mv[0][0][1]);
5112
                }
5113
                if(mb_type&CANDIDATE_MB_TYPE_INTER_I){
M
Michael Niedermayer 已提交
5114 5115 5116 5117 5118 5119 5120 5121
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mv_type = MV_TYPE_FIELD;
                    s->mb_intra= 0;
                    for(i=0; i<2; i++){
                        j= s->field_select[0][i] = s->p_field_select_table[i][xy];
                        s->mv[0][i][0] = s->p_field_mv_table[i][j][xy][0];
                        s->mv[0][i][1] = s->p_field_mv_table[i][j][xy][1];
                    }
5122
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_INTER_I, pb, pb2, tex_pb,
M
Michael Niedermayer 已提交
5123 5124
                                 &dmin, &next_block, 0, 0);
                }
5125
                if(mb_type&CANDIDATE_MB_TYPE_SKIPPED){
5126 5127 5128 5129 5130
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mv_type = MV_TYPE_16X16;
                    s->mb_intra= 0;
                    s->mv[0][0][0] = 0;
                    s->mv[0][0][1] = 0;
5131
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_SKIPPED, pb, pb2, tex_pb,
5132
                                 &dmin, &next_block, s->mv[0][0][0], s->mv[0][0][1]);
F
Fabrice Bellard 已提交
5133
                }
5134
                if(mb_type&CANDIDATE_MB_TYPE_INTER4V){
5135
                    s->mv_dir = MV_DIR_FORWARD;
M
Michael Niedermayer 已提交
5136 5137 5138
                    s->mv_type = MV_TYPE_8X8;
                    s->mb_intra= 0;
                    for(i=0; i<4; i++){
5139 5140
                        s->mv[0][i][0] = s->current_picture.motion_val[0][s->block_index[i]][0];
                        s->mv[0][i][1] = s->current_picture.motion_val[0][s->block_index[i]][1];
M
Michael Niedermayer 已提交
5141
                    }
5142
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_INTER4V, pb, pb2, tex_pb,
5143
                                 &dmin, &next_block, 0, 0);
5144
                }
M
Michael Niedermayer 已提交
5145
                if(mb_type&CANDIDATE_MB_TYPE_FORWARD){
5146 5147 5148 5149 5150
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mv_type = MV_TYPE_16X16;
                    s->mb_intra= 0;
                    s->mv[0][0][0] = s->b_forw_mv_table[xy][0];
                    s->mv[0][0][1] = s->b_forw_mv_table[xy][1];
5151
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_FORWARD, pb, pb2, tex_pb,
5152
                                 &dmin, &next_block, s->mv[0][0][0], s->mv[0][0][1]);
5153
                }
M
Michael Niedermayer 已提交
5154
                if(mb_type&CANDIDATE_MB_TYPE_BACKWARD){
5155 5156 5157 5158 5159
                    s->mv_dir = MV_DIR_BACKWARD;
                    s->mv_type = MV_TYPE_16X16;
                    s->mb_intra= 0;
                    s->mv[1][0][0] = s->b_back_mv_table[xy][0];
                    s->mv[1][0][1] = s->b_back_mv_table[xy][1];
5160
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_BACKWARD, pb, pb2, tex_pb,
5161
                                 &dmin, &next_block, s->mv[1][0][0], s->mv[1][0][1]);
5162
                }
M
Michael Niedermayer 已提交
5163
                if(mb_type&CANDIDATE_MB_TYPE_BIDIR){
5164 5165 5166 5167 5168 5169 5170
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
                    s->mv_type = MV_TYPE_16X16;
                    s->mb_intra= 0;
                    s->mv[0][0][0] = s->b_bidir_forw_mv_table[xy][0];
                    s->mv[0][0][1] = s->b_bidir_forw_mv_table[xy][1];
                    s->mv[1][0][0] = s->b_bidir_back_mv_table[xy][0];
                    s->mv[1][0][1] = s->b_bidir_back_mv_table[xy][1];
5171
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_BIDIR, pb, pb2, tex_pb,
5172
                                 &dmin, &next_block, 0, 0);
5173
                }
5174
                if(mb_type&CANDIDATE_MB_TYPE_FORWARD_I){
M
Michael Niedermayer 已提交
5175 5176 5177 5178 5179 5180 5181 5182
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mv_type = MV_TYPE_FIELD;
                    s->mb_intra= 0;
                    for(i=0; i<2; i++){
                        j= s->field_select[0][i] = s->b_field_select_table[0][i][xy];
                        s->mv[0][i][0] = s->b_field_mv_table[0][i][j][xy][0];
                        s->mv[0][i][1] = s->b_field_mv_table[0][i][j][xy][1];
                    }
5183
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_FORWARD_I, pb, pb2, tex_pb,
M
Michael Niedermayer 已提交
5184 5185
                                 &dmin, &next_block, 0, 0);
                }
5186
                if(mb_type&CANDIDATE_MB_TYPE_BACKWARD_I){
M
Michael Niedermayer 已提交
5187 5188 5189 5190 5191 5192 5193 5194
                    s->mv_dir = MV_DIR_BACKWARD;
                    s->mv_type = MV_TYPE_FIELD;
                    s->mb_intra= 0;
                    for(i=0; i<2; i++){
                        j= s->field_select[1][i] = s->b_field_select_table[1][i][xy];
                        s->mv[1][i][0] = s->b_field_mv_table[1][i][j][xy][0];
                        s->mv[1][i][1] = s->b_field_mv_table[1][i][j][xy][1];
                    }
5195
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_BACKWARD_I, pb, pb2, tex_pb,
M
Michael Niedermayer 已提交
5196 5197
                                 &dmin, &next_block, 0, 0);
                }
5198
                if(mb_type&CANDIDATE_MB_TYPE_BIDIR_I){
M
Michael Niedermayer 已提交
5199 5200 5201 5202 5203 5204 5205 5206 5207 5208
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
                    s->mv_type = MV_TYPE_FIELD;
                    s->mb_intra= 0;
                    for(dir=0; dir<2; dir++){
                        for(i=0; i<2; i++){
                            j= s->field_select[dir][i] = s->b_field_select_table[dir][i][xy];
                            s->mv[dir][i][0] = s->b_field_mv_table[dir][i][j][xy][0];
                            s->mv[dir][i][1] = s->b_field_mv_table[dir][i][j][xy][1];
                        }
                    }
5209
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_BIDIR_I, pb, pb2, tex_pb,
M
Michael Niedermayer 已提交
5210 5211 5212
                                 &dmin, &next_block, 0, 0);
                }
                if(mb_type&CANDIDATE_MB_TYPE_INTRA){
5213
                    s->mv_dir = 0;
M
Michael Niedermayer 已提交
5214
                    s->mv_type = MV_TYPE_16X16;
5215 5216 5217
                    s->mb_intra= 1;
                    s->mv[0][0][0] = 0;
                    s->mv[0][0][1] = 0;
5218
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_INTRA, pb, pb2, tex_pb,
5219
                                 &dmin, &next_block, 0, 0);
5220 5221 5222 5223 5224 5225
                    if(s->h263_pred || s->h263_aic){
                        if(best_s.mb_intra)
                            s->mbintra_table[mb_x + mb_y*s->mb_stride]=1;
                        else
                            ff_clean_intra_table_entries(s); //old mode?
                    }
M
Michael Niedermayer 已提交
5226
                }
5227

5228 5229
                if((s->flags & CODEC_FLAG_QP_RD) && dmin < INT_MAX){
                    if(best_s.mv_type==MV_TYPE_16X16){ //FIXME move 4mv after QPRD
5230
                        const int last_qp= backup_s.qscale;
M
Michael Niedermayer 已提交
5231
                        int qpi, qp, dc[6];
5232
                        DCTELEM ac[6][16];
M
Michael Niedermayer 已提交
5233
                        const int mvdir= (best_s.mv_dir&MV_DIR_BACKWARD) ? 1 : 0;
5234
                        static const int dquant_tab[4]={-1,1,-2,2};
5235

5236 5237 5238 5239 5240 5241 5242 5243 5244 5245
                        assert(backup_s.dquant == 0);

                        //FIXME intra
                        s->mv_dir= best_s.mv_dir;
                        s->mv_type = MV_TYPE_16X16;
                        s->mb_intra= best_s.mb_intra;
                        s->mv[0][0][0] = best_s.mv[0][0][0];
                        s->mv[0][0][1] = best_s.mv[0][0][1];
                        s->mv[1][0][0] = best_s.mv[1][0][0];
                        s->mv[1][0][1] = best_s.mv[1][0][1];
5246

5247
                        qpi = s->pict_type == B_TYPE ? 2 : 0;
M
Michael Niedermayer 已提交
5248 5249
                        for(; qpi<4; qpi++){
                            int dquant= dquant_tab[qpi];
5250 5251
                            qp= last_qp + dquant;
                            if(qp < s->avctx->qmin || qp > s->avctx->qmax)
5252
                                continue;
5253
                            backup_s.dquant= dquant;
M
Michael Niedermayer 已提交
5254
                            if(s->mb_intra && s->dc_val[0]){
5255 5256 5257 5258
                                for(i=0; i<6; i++){
                                    dc[i]= s->dc_val[0][ s->block_index[i] ];
                                    memcpy(ac[i], s->ac_val[0][s->block_index[i]], sizeof(DCTELEM)*16);
                                }
5259
                            }
5260

5261
                            encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_INTER /* wrong but unused */, pb, pb2, tex_pb,
M
Michael Niedermayer 已提交
5262
                                         &dmin, &next_block, s->mv[mvdir][0][0], s->mv[mvdir][0][1]);
5263
                            if(best_s.qscale != qp){
M
Michael Niedermayer 已提交
5264
                                if(s->mb_intra && s->dc_val[0]){
5265 5266 5267 5268
                                    for(i=0; i<6; i++){
                                        s->dc_val[0][ s->block_index[i] ]= dc[i];
                                        memcpy(s->ac_val[0][s->block_index[i]], ac[i], sizeof(DCTELEM)*16);
                                    }
5269 5270 5271 5272 5273
                                }
                            }
                        }
                    }
                }
5274 5275 5276 5277 5278 5279 5280 5281 5282 5283 5284
                if(mb_type&CANDIDATE_MB_TYPE_DIRECT){
                    int mx= s->b_direct_mv_table[xy][0];
                    int my= s->b_direct_mv_table[xy][1];

                    backup_s.dquant = 0;
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD | MV_DIRECT;
                    s->mb_intra= 0;
                    ff_mpeg4_set_direct_mv(s, mx, my);
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_DIRECT, pb, pb2, tex_pb,
                                 &dmin, &next_block, mx, my);
                }
5285 5286 5287 5288 5289 5290 5291 5292
                if(mb_type&CANDIDATE_MB_TYPE_DIRECT0){
                    backup_s.dquant = 0;
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD | MV_DIRECT;
                    s->mb_intra= 0;
                    ff_mpeg4_set_direct_mv(s, 0, 0);
                    encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_DIRECT, pb, pb2, tex_pb,
                                 &dmin, &next_block, 0, 0);
                }
M
skiprd  
Michael Niedermayer 已提交
5293 5294 5295 5296 5297 5298 5299 5300 5301 5302 5303 5304 5305 5306 5307 5308 5309 5310 5311 5312 5313 5314 5315 5316 5317 5318 5319 5320 5321 5322 5323 5324 5325
                if(!best_s.mb_intra && s->flags2&CODEC_FLAG2_SKIP_RD){
                    int coded=0;
                    for(i=0; i<6; i++)
                        coded |= s->block_last_index[i];
                    if(coded){
                        int mx,my;
                        memcpy(s->mv, best_s.mv, sizeof(s->mv));
                        if(best_s.mv_dir & MV_DIRECT){
                            mx=my=0; //FIXME find the one we actually used
                            ff_mpeg4_set_direct_mv(s, mx, my);
                        }else if(best_s.mv_dir&MV_DIR_BACKWARD){
                            mx= s->mv[1][0][0];
                            my= s->mv[1][0][1];
                        }else{
                            mx= s->mv[0][0][0];
                            my= s->mv[0][0][1];
                        }

                        s->mv_dir= best_s.mv_dir;
                        s->mv_type = best_s.mv_type;
                        s->mb_intra= 0;
/*                        s->mv[0][0][0] = best_s.mv[0][0][0];
                        s->mv[0][0][1] = best_s.mv[0][0][1];
                        s->mv[1][0][0] = best_s.mv[1][0][0];
                        s->mv[1][0][1] = best_s.mv[1][0][1];*/
                        backup_s.dquant= 0;
                        s->skipdct=1;
                        encode_mb_hq(s, &backup_s, &best_s, CANDIDATE_MB_TYPE_INTER /* wrong but unused */, pb, pb2, tex_pb,
                                        &dmin, &next_block, mx, my);
                        s->skipdct=0;
                    }
                }

5326
                s->current_picture.qscale_table[xy]= best_s.qscale;
5327

5328
                copy_context_after_encode(s, &best_s, -1);
5329

5330
                pb_bits_count= put_bits_count(&s->pb);
5331 5332 5333
                flush_put_bits(&s->pb);
                ff_copy_bits(&backup_s.pb, bit_buf[next_block^1], pb_bits_count);
                s->pb= backup_s.pb;
5334

5335
                if(s->data_partitioning){
5336
                    pb2_bits_count= put_bits_count(&s->pb2);
5337 5338 5339
                    flush_put_bits(&s->pb2);
                    ff_copy_bits(&backup_s.pb2, bit_buf2[next_block^1], pb2_bits_count);
                    s->pb2= backup_s.pb2;
5340

5341
                    tex_pb_bits_count= put_bits_count(&s->tex_pb);
5342 5343 5344 5345
                    flush_put_bits(&s->tex_pb);
                    ff_copy_bits(&backup_s.tex_pb, bit_buf_tex[next_block^1], tex_pb_bits_count);
                    s->tex_pb= backup_s.tex_pb;
                }
5346
                s->last_bits= put_bits_count(&s->pb);
5347

5348 5349
                if (s->out_format == FMT_H263 && s->pict_type!=B_TYPE)
                    ff_h263_update_motion_val(s);
5350

5351 5352 5353 5354
                if(next_block==0){ //FIXME 16 vs linesize16
                    s->dsp.put_pixels_tab[0][0](s->dest[0], s->rd_scratchpad                     , s->linesize  ,16);
                    s->dsp.put_pixels_tab[1][0](s->dest[1], s->rd_scratchpad + 16*s->linesize    , s->uvlinesize, 8);
                    s->dsp.put_pixels_tab[1][0](s->dest[2], s->rd_scratchpad + 16*s->linesize + 8, s->uvlinesize, 8);
5355 5356 5357 5358
                }

                if(s->avctx->mb_decision == FF_MB_DECISION_BITS)
                    MPV_decode_mb(s, s->block);
F
Fabrice Bellard 已提交
5359
            } else {
5360
                int motion_x = 0, motion_y = 0;
5361
                s->mv_type=MV_TYPE_16X16;
5362
                // only one MB-Type possible
5363

5364
                switch(mb_type){
M
Michael Niedermayer 已提交
5365
                case CANDIDATE_MB_TYPE_INTRA:
5366
                    s->mv_dir = 0;
5367
                    s->mb_intra= 1;
5368 5369
                    motion_x= s->mv[0][0][0] = 0;
                    motion_y= s->mv[0][0][1] = 0;
5370
                    break;
M
Michael Niedermayer 已提交
5371
                case CANDIDATE_MB_TYPE_INTER:
5372 5373 5374 5375
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mb_intra= 0;
                    motion_x= s->mv[0][0][0] = s->p_mv_table[xy][0];
                    motion_y= s->mv[0][0][1] = s->p_mv_table[xy][1];
5376
                    break;
M
Michael Niedermayer 已提交
5377 5378 5379 5380 5381 5382 5383 5384 5385 5386 5387
                case CANDIDATE_MB_TYPE_INTER_I:
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mv_type = MV_TYPE_FIELD;
                    s->mb_intra= 0;
                    for(i=0; i<2; i++){
                        j= s->field_select[0][i] = s->p_field_select_table[i][xy];
                        s->mv[0][i][0] = s->p_field_mv_table[i][j][xy][0];
                        s->mv[0][i][1] = s->p_field_mv_table[i][j][xy][1];
                    }
                    break;
                case CANDIDATE_MB_TYPE_INTER4V:
5388 5389 5390 5391
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mv_type = MV_TYPE_8X8;
                    s->mb_intra= 0;
                    for(i=0; i<4; i++){
5392 5393
                        s->mv[0][i][0] = s->current_picture.motion_val[0][s->block_index[i]][0];
                        s->mv[0][i][1] = s->current_picture.motion_val[0][s->block_index[i]][1];
5394 5395
                    }
                    break;
M
Michael Niedermayer 已提交
5396
                case CANDIDATE_MB_TYPE_DIRECT:
5397 5398
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD | MV_DIRECT;
                    s->mb_intra= 0;
5399 5400
                    motion_x=s->b_direct_mv_table[xy][0];
                    motion_y=s->b_direct_mv_table[xy][1];
M
Michael Niedermayer 已提交
5401
                    ff_mpeg4_set_direct_mv(s, motion_x, motion_y);
5402
                    break;
M
10l  
Michael Niedermayer 已提交
5403 5404 5405 5406 5407
                case CANDIDATE_MB_TYPE_DIRECT0:
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD | MV_DIRECT;
                    s->mb_intra= 0;
                    ff_mpeg4_set_direct_mv(s, 0, 0);
                    break;
M
Michael Niedermayer 已提交
5408
                case CANDIDATE_MB_TYPE_BIDIR:
5409
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
5410
                    s->mb_intra= 0;
5411 5412 5413 5414
                    s->mv[0][0][0] = s->b_bidir_forw_mv_table[xy][0];
                    s->mv[0][0][1] = s->b_bidir_forw_mv_table[xy][1];
                    s->mv[1][0][0] = s->b_bidir_back_mv_table[xy][0];
                    s->mv[1][0][1] = s->b_bidir_back_mv_table[xy][1];
5415
                    break;
M
Michael Niedermayer 已提交
5416
                case CANDIDATE_MB_TYPE_BACKWARD:
5417 5418 5419 5420
                    s->mv_dir = MV_DIR_BACKWARD;
                    s->mb_intra= 0;
                    motion_x= s->mv[1][0][0] = s->b_back_mv_table[xy][0];
                    motion_y= s->mv[1][0][1] = s->b_back_mv_table[xy][1];
5421
                    break;
M
Michael Niedermayer 已提交
5422
                case CANDIDATE_MB_TYPE_FORWARD:
5423 5424 5425 5426 5427
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mb_intra= 0;
                    motion_x= s->mv[0][0][0] = s->b_forw_mv_table[xy][0];
                    motion_y= s->mv[0][0][1] = s->b_forw_mv_table[xy][1];
//                    printf(" %d %d ", motion_x, motion_y);
5428
                    break;
M
Michael Niedermayer 已提交
5429 5430 5431 5432 5433 5434 5435 5436 5437 5438 5439 5440 5441 5442 5443 5444 5445 5446 5447 5448 5449 5450 5451 5452 5453 5454 5455 5456 5457 5458 5459 5460
                case CANDIDATE_MB_TYPE_FORWARD_I:
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mv_type = MV_TYPE_FIELD;
                    s->mb_intra= 0;
                    for(i=0; i<2; i++){
                        j= s->field_select[0][i] = s->b_field_select_table[0][i][xy];
                        s->mv[0][i][0] = s->b_field_mv_table[0][i][j][xy][0];
                        s->mv[0][i][1] = s->b_field_mv_table[0][i][j][xy][1];
                    }
                    break;
                case CANDIDATE_MB_TYPE_BACKWARD_I:
                    s->mv_dir = MV_DIR_BACKWARD;
                    s->mv_type = MV_TYPE_FIELD;
                    s->mb_intra= 0;
                    for(i=0; i<2; i++){
                        j= s->field_select[1][i] = s->b_field_select_table[1][i][xy];
                        s->mv[1][i][0] = s->b_field_mv_table[1][i][j][xy][0];
                        s->mv[1][i][1] = s->b_field_mv_table[1][i][j][xy][1];
                    }
                    break;
                case CANDIDATE_MB_TYPE_BIDIR_I:
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
                    s->mv_type = MV_TYPE_FIELD;
                    s->mb_intra= 0;
                    for(dir=0; dir<2; dir++){
                        for(i=0; i<2; i++){
                            j= s->field_select[dir][i] = s->b_field_select_table[dir][i][xy];
                            s->mv[dir][i][0] = s->b_field_mv_table[dir][i][j][xy][0];
                            s->mv[dir][i][1] = s->b_field_mv_table[dir][i][j][xy][1];
                        }
                    }
                    break;
5461
                default:
5462
                    av_log(s->avctx, AV_LOG_ERROR, "illegal MB type\n");
5463
                }
5464

5465
                encode_mb(s, motion_x, motion_y);
5466

5467
                // RAL: Update last macroblock type
5468
                s->last_mv_dir = s->mv_dir;
5469

5470 5471
                if (s->out_format == FMT_H263 && s->pict_type!=B_TYPE)
                    ff_h263_update_motion_val(s);
5472

5473
                MPV_decode_mb(s, s->block);
F
Fabrice Bellard 已提交
5474
            }
5475

5476 5477 5478 5479 5480
            /* clean the MV table in IPS frames for direct mode in B frames */
            if(s->mb_intra /* && I,P,S_TYPE */){
                s->p_mv_table[xy][0]=0;
                s->p_mv_table[xy][1]=0;
            }
5481

5482 5483 5484 5485 5486 5487
            if(s->flags&CODEC_FLAG_PSNR){
                int w= 16;
                int h= 16;

                if(s->mb_x*16 + 16 > s->width ) w= s->width - s->mb_x*16;
                if(s->mb_y*16 + 16 > s->height) h= s->height- s->mb_y*16;
M
Michael Niedermayer 已提交
5488

5489
                s->current_picture.error[0] += sse(
5490 5491
                    s, s->new_picture.data[0] + s->mb_x*16 + s->mb_y*s->linesize*16,
                    s->dest[0], w, h, s->linesize);
5492
                s->current_picture.error[1] += sse(
5493 5494
                    s, s->new_picture.data[1] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,
                    s->dest[1], w>>1, h>>1, s->uvlinesize);
5495
                s->current_picture.error[2] += sse(
5496 5497
                    s, s->new_picture    .data[2] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,
                    s->dest[2], w>>1, h>>1, s->uvlinesize);
5498
            }
M
Maarten Daniels 已提交
5499 5500 5501 5502
            if(s->loop_filter){
                if(s->out_format == FMT_H263)
                    ff_h263_loop_filter(s);
            }
5503
//printf("MB %d %d bits\n", s->mb_x+s->mb_y*s->mb_stride, put_bits_count(&s->pb));
F
Fabrice Bellard 已提交
5504 5505
        }
    }
5506

5507
    //not beautiful here but we must write it before flushing so it has to be here
5508
    if (ENABLE_MSMPEG4_ENCODER && s->msmpeg4_version && s->msmpeg4_version<4 && s->pict_type == I_TYPE)
M
Michael Niedermayer 已提交
5509
        msmpeg4_encode_ext_header(s);
5510

5511 5512
    write_slice_end(s);

5513
    /* Send the last GOB if RTP */
M
Michael Niedermayer 已提交
5514
    if (s->avctx->rtp_callback) {
5515
        int number_mb = (mb_y - s->resync_mb_y)*s->mb_width - s->resync_mb_x;
5516
        pdif = pbBufPtr(&s->pb) - s->ptr_lastgob;
5517
        /* Call the RTP callback to send the last GOB */
5518
        emms_c();
5519
        s->avctx->rtp_callback(s->avctx, s->ptr_lastgob, pdif, number_mb);
5520
    }
5521 5522 5523 5524 5525 5526

    return 0;
}

#define MERGE(field) dst->field += src->field; src->field=0
static void merge_context_after_me(MpegEncContext *dst, MpegEncContext *src){
5527 5528 5529
    MERGE(me.scene_change_score);
    MERGE(me.mc_mb_var_sum_temp);
    MERGE(me.mb_var_sum_temp);
5530 5531 5532 5533 5534 5535 5536 5537 5538 5539 5540 5541 5542 5543 5544 5545 5546
}

static void merge_context_after_encode(MpegEncContext *dst, MpegEncContext *src){
    int i;

    MERGE(dct_count[0]); //note, the other dct vars are not part of the context
    MERGE(dct_count[1]);
    MERGE(mv_bits);
    MERGE(i_tex_bits);
    MERGE(p_tex_bits);
    MERGE(i_count);
    MERGE(f_count);
    MERGE(b_count);
    MERGE(skip_count);
    MERGE(misc_bits);
    MERGE(error_count);
    MERGE(padding_bug_score);
5547 5548 5549
    MERGE(current_picture.error[0]);
    MERGE(current_picture.error[1]);
    MERGE(current_picture.error[2]);
5550 5551 5552 5553 5554 5555 5556

    if(dst->avctx->noise_reduction){
        for(i=0; i<64; i++){
            MERGE(dct_error_sum[0][i]);
            MERGE(dct_error_sum[1][i]);
        }
    }
5557

5558 5559 5560 5561 5562 5563
    assert(put_bits_count(&src->pb) % 8 ==0);
    assert(put_bits_count(&dst->pb) % 8 ==0);
    ff_copy_bits(&dst->pb, src->pb.buf, put_bits_count(&src->pb));
    flush_put_bits(&dst->pb);
}

5564
static int estimate_qp(MpegEncContext *s, int dry_run){
5565 5566 5567 5568 5569
    if (s->next_lambda){
        s->current_picture_ptr->quality=
        s->current_picture.quality = s->next_lambda;
        if(!dry_run) s->next_lambda= 0;
    } else if (!s->fixed_qscale) {
5570 5571
        s->current_picture_ptr->quality=
        s->current_picture.quality = ff_rate_estimate_qscale(s, dry_run);
5572 5573 5574
        if (s->current_picture.quality < 0)
            return -1;
    }
5575 5576 5577 5578 5579 5580 5581 5582 5583 5584 5585 5586 5587 5588 5589 5590 5591 5592 5593

    if(s->adaptive_quant){
        switch(s->codec_id){
        case CODEC_ID_MPEG4:
            ff_clean_mpeg4_qscales(s);
            break;
        case CODEC_ID_H263:
        case CODEC_ID_H263P:
        case CODEC_ID_FLV1:
            ff_clean_h263_qscales(s);
            break;
        }

        s->lambda= s->lambda_table[0];
        //FIXME broken
    }else
        s->lambda= s->current_picture.quality;
//printf("%d %d\n", s->avctx->global_quality, s->current_picture.quality);
    update_qscale(s);
5594
    return 0;
5595 5596
}

5597
static int encode_picture(MpegEncContext *s, int picture_number)
5598
{
5599
    int i;
5600 5601 5602
    int bits;

    s->picture_number = picture_number;
5603

5604
    /* Reset the average MB variance */
5605 5606
    s->me.mb_var_sum_temp    =
    s->me.mc_mb_var_sum_temp = 0;
5607 5608 5609 5610

    /* we need to initialize some time vars before we can encode b-frames */
    // RAL: Condition added for MPEG1VIDEO
    if (s->codec_id == CODEC_ID_MPEG1VIDEO || s->codec_id == CODEC_ID_MPEG2VIDEO || (s->h263_pred && !s->h263_msmpeg4))
5611
        ff_set_mpeg4_time(s, s->picture_number);  //FIXME rename and use has_b_frames or similar
5612

5613
    s->me.scene_change_score=0;
5614

5615
//    s->lambda= s->current_picture_ptr->quality; //FIXME qscale / ... stuff for ME ratedistoration
5616

5617 5618 5619 5620 5621
    if(s->pict_type==I_TYPE){
        if(s->msmpeg4_version >= 3) s->no_rounding=1;
        else                        s->no_rounding=0;
    }else if(s->pict_type!=B_TYPE){
        if(s->flipflop_rounding || s->codec_id == CODEC_ID_H263P || s->codec_id == CODEC_ID_MPEG4)
5622
            s->no_rounding ^= 1;
5623
    }
5624

5625
    if(s->flags & CODEC_FLAG_PASS2){
5626 5627
        if (estimate_qp(s,1) < 0)
            return -1;
5628 5629
        ff_get_2pass_fcode(s);
    }else if(!(s->flags & CODEC_FLAG_QSCALE)){
5630
        if(s->pict_type==B_TYPE)
5631
            s->lambda= s->last_lambda_for[s->pict_type];
5632
        else
5633
            s->lambda= s->last_lambda_for[s->last_non_b_pict_type];
5634 5635
        update_qscale(s);
    }
5636

5637
    s->mb_intra=0; //for the rate distortion & bit compare functions
5638
    for(i=1; i<s->avctx->thread_count; i++){
5639
        ff_update_duplicate_context(s->thread_context[i], s);
5640
    }
5641 5642 5643

    ff_init_me(s);

5644 5645
    /* Estimate motion for every MB */
    if(s->pict_type != I_TYPE){
5646
        s->lambda = (s->lambda * s->avctx->me_penalty_compensation + 128)>>8;
5647
        s->lambda2= (s->lambda2* (int64_t)s->avctx->me_penalty_compensation + 128)>>8;
5648
        if(s->pict_type != B_TYPE && s->avctx->me_threshold==0){
5649 5650 5651 5652 5653 5654 5655 5656 5657 5658
            if((s->avctx->pre_me && s->last_non_b_pict_type==I_TYPE) || s->avctx->pre_me==2){
                s->avctx->execute(s->avctx, pre_estimate_motion_thread, (void**)&(s->thread_context[0]), NULL, s->avctx->thread_count);
            }
        }

        s->avctx->execute(s->avctx, estimate_motion_thread, (void**)&(s->thread_context[0]), NULL, s->avctx->thread_count);
    }else /* if(s->pict_type == I_TYPE) */{
        /* I-Frame */
        for(i=0; i<s->mb_stride*s->mb_height; i++)
            s->mb_type[i]= CANDIDATE_MB_TYPE_INTRA;
5659

5660 5661
        if(!s->fixed_qscale){
            /* finding spatial complexity for I-frame rate control */
5662
            s->avctx->execute(s->avctx, mb_var_thread, (void**)&(s->thread_context[0]), NULL, s->avctx->thread_count);
5663 5664
        }
    }
5665 5666 5667
    for(i=1; i<s->avctx->thread_count; i++){
        merge_context_after_me(s, s->thread_context[i]);
    }
5668 5669
    s->current_picture.mc_mb_var_sum= s->current_picture_ptr->mc_mb_var_sum= s->me.mc_mb_var_sum_temp;
    s->current_picture.   mb_var_sum= s->current_picture_ptr->   mb_var_sum= s->me.   mb_var_sum_temp;
5670 5671
    emms_c();

5672
    if(s->me.scene_change_score > s->avctx->scenechange_threshold && s->pict_type == P_TYPE){
5673 5674 5675 5676 5677 5678 5679 5680 5681 5682 5683 5684 5685 5686 5687 5688
        s->pict_type= I_TYPE;
        for(i=0; i<s->mb_stride*s->mb_height; i++)
            s->mb_type[i]= CANDIDATE_MB_TYPE_INTRA;
//printf("Scene change detected, encoding as I Frame %d %d\n", s->current_picture.mb_var_sum, s->current_picture.mc_mb_var_sum);
    }

    if(!s->umvplus){
        if(s->pict_type==P_TYPE || s->pict_type==S_TYPE) {
            s->f_code= ff_get_best_fcode(s, s->p_mv_table, CANDIDATE_MB_TYPE_INTER);

            if(s->flags & CODEC_FLAG_INTERLACED_ME){
                int a,b;
                a= ff_get_best_fcode(s, s->p_field_mv_table[0][0], CANDIDATE_MB_TYPE_INTER_I); //FIXME field_select
                b= ff_get_best_fcode(s, s->p_field_mv_table[1][1], CANDIDATE_MB_TYPE_INTER_I);
                s->f_code= FFMAX(s->f_code, FFMAX(a,b));
            }
5689

5690 5691 5692
            ff_fix_long_p_mvs(s);
            ff_fix_long_mvs(s, NULL, 0, s->p_mv_table, s->f_code, CANDIDATE_MB_TYPE_INTER, 0);
            if(s->flags & CODEC_FLAG_INTERLACED_ME){
5693
                int j;
5694 5695
                for(i=0; i<2; i++){
                    for(j=0; j<2; j++)
5696
                        ff_fix_long_mvs(s, s->p_field_select_table[i], j,
5697 5698 5699 5700 5701 5702 5703 5704 5705 5706 5707 5708 5709 5710 5711 5712 5713 5714 5715 5716 5717
                                        s->p_field_mv_table[i][j], s->f_code, CANDIDATE_MB_TYPE_INTER_I, 0);
                }
            }
        }

        if(s->pict_type==B_TYPE){
            int a, b;

            a = ff_get_best_fcode(s, s->b_forw_mv_table, CANDIDATE_MB_TYPE_FORWARD);
            b = ff_get_best_fcode(s, s->b_bidir_forw_mv_table, CANDIDATE_MB_TYPE_BIDIR);
            s->f_code = FFMAX(a, b);

            a = ff_get_best_fcode(s, s->b_back_mv_table, CANDIDATE_MB_TYPE_BACKWARD);
            b = ff_get_best_fcode(s, s->b_bidir_back_mv_table, CANDIDATE_MB_TYPE_BIDIR);
            s->b_code = FFMAX(a, b);

            ff_fix_long_mvs(s, NULL, 0, s->b_forw_mv_table, s->f_code, CANDIDATE_MB_TYPE_FORWARD, 1);
            ff_fix_long_mvs(s, NULL, 0, s->b_back_mv_table, s->b_code, CANDIDATE_MB_TYPE_BACKWARD, 1);
            ff_fix_long_mvs(s, NULL, 0, s->b_bidir_forw_mv_table, s->f_code, CANDIDATE_MB_TYPE_BIDIR, 1);
            ff_fix_long_mvs(s, NULL, 0, s->b_bidir_back_mv_table, s->b_code, CANDIDATE_MB_TYPE_BIDIR, 1);
            if(s->flags & CODEC_FLAG_INTERLACED_ME){
5718
                int dir, j;
5719 5720 5721
                for(dir=0; dir<2; dir++){
                    for(i=0; i<2; i++){
                        for(j=0; j<2; j++){
5722
                            int type= dir ? (CANDIDATE_MB_TYPE_BACKWARD_I|CANDIDATE_MB_TYPE_BIDIR_I)
5723
                                          : (CANDIDATE_MB_TYPE_FORWARD_I |CANDIDATE_MB_TYPE_BIDIR_I);
5724
                            ff_fix_long_mvs(s, s->b_field_select_table[dir][i], j,
5725 5726 5727 5728 5729 5730 5731 5732
                                            s->b_field_mv_table[dir][i][j], dir ? s->b_code : s->f_code, type, 1);
                        }
                    }
                }
            }
        }
    }

5733 5734
    if (estimate_qp(s, 0) < 0)
        return -1;
5735 5736

    if(s->qscale < 3 && s->max_qcoeff<=128 && s->pict_type==I_TYPE && !(s->flags & CODEC_FLAG_QSCALE))
5737
        s->qscale= 3; //reduce clipping problems
5738

5739 5740 5741 5742 5743 5744
    if (s->out_format == FMT_MJPEG) {
        /* for mjpeg, we do include qscale in the matrix */
        s->intra_matrix[0] = ff_mpeg1_default_intra_matrix[0];
        for(i=1;i<64;i++){
            int j= s->dsp.idct_permutation[i];

5745
            s->intra_matrix[j] = av_clip_uint8((ff_mpeg1_default_intra_matrix[i] * s->qscale) >> 3);
5746
        }
5747
        convert_matrix(&s->dsp, s->q_intra_matrix, s->q_intra_matrix16,
5748
                       s->intra_matrix, s->intra_quant_bias, 8, 8, 1);
5749 5750
        s->qscale= 8;
    }
5751

5752
    //FIXME var duplication
5753
    s->current_picture_ptr->key_frame=
5754
    s->current_picture.key_frame= s->pict_type == I_TYPE; //FIXME pic_ptr
5755
    s->current_picture_ptr->pict_type=
5756 5757 5758 5759 5760 5761 5762 5763
    s->current_picture.pict_type= s->pict_type;

    if(s->current_picture.key_frame)
        s->picture_in_gop_number=0;

    s->last_bits= put_bits_count(&s->pb);
    switch(s->out_format) {
    case FMT_MJPEG:
5764
        if (ENABLE_MJPEG_ENCODER)
A
Aurelien Jacobs 已提交
5765
            mjpeg_picture_header(s);
5766
        break;
5767
    case FMT_H261:
5768
        if (ENABLE_H261_ENCODER)
A
Aurelien Jacobs 已提交
5769
            ff_h261_encode_picture_header(s, picture_number);
5770
        break;
5771
    case FMT_H263:
5772
        if (ENABLE_WMV2_ENCODER && s->codec_id == CODEC_ID_WMV2)
5773
            ff_wmv2_encode_picture_header(s, picture_number);
5774
        else if (ENABLE_MSMPEG4_ENCODER && s->h263_msmpeg4)
5775 5776 5777
            msmpeg4_encode_picture_header(s, picture_number);
        else if (s->h263_pred)
            mpeg4_encode_picture_header(s, picture_number);
5778
        else if (ENABLE_RV10_ENCODER && s->codec_id == CODEC_ID_RV10)
5779
            rv10_encode_picture_header(s, picture_number);
5780
        else if (ENABLE_RV20_ENCODER && s->codec_id == CODEC_ID_RV20)
M
Michael Niedermayer 已提交
5781
            rv20_encode_picture_header(s, picture_number);
5782 5783 5784 5785 5786 5787 5788 5789 5790 5791 5792 5793 5794 5795 5796
        else if (s->codec_id == CODEC_ID_FLV1)
            ff_flv_encode_picture_header(s, picture_number);
        else
            h263_encode_picture_header(s, picture_number);
        break;
    case FMT_MPEG1:
        mpeg1_encode_picture_header(s, picture_number);
        break;
    case FMT_H264:
        break;
    default:
        assert(0);
    }
    bits= put_bits_count(&s->pb);
    s->header_bits= bits - s->last_bits;
5797

5798 5799 5800 5801 5802 5803 5804 5805
    for(i=1; i<s->avctx->thread_count; i++){
        update_duplicate_context_after_me(s->thread_context[i], s);
    }
    s->avctx->execute(s->avctx, encode_thread, (void**)&(s->thread_context[0]), NULL, s->avctx->thread_count);
    for(i=1; i<s->avctx->thread_count; i++){
        merge_context_after_encode(s, s->thread_context[i]);
    }
    emms_c();
5806
    return 0;
F
Fabrice Bellard 已提交
5807 5808
}

M
Michael Niedermayer 已提交
5809
static void  denoise_dct_c(MpegEncContext *s, DCTELEM *block){
5810 5811 5812
    const int intra= s->mb_intra;
    int i;

5813 5814
    s->dct_count[intra]++;

5815 5816 5817 5818 5819 5820 5821 5822 5823 5824 5825 5826 5827 5828 5829 5830 5831 5832
    for(i=0; i<64; i++){
        int level= block[i];

        if(level){
            if(level>0){
                s->dct_error_sum[intra][i] += level;
                level -= s->dct_offset[intra][i];
                if(level<0) level=0;
            }else{
                s->dct_error_sum[intra][i] -= level;
                level += s->dct_offset[intra][i];
                if(level>0) level=0;
            }
            block[i]= level;
        }
    }
}

5833
static int dct_quantize_trellis_c(MpegEncContext *s,
M
Michael Niedermayer 已提交
5834 5835 5836
                        DCTELEM *block, int n,
                        int qscale, int *overflow){
    const int *qmat;
5837
    const uint8_t *scantable= s->intra_scantable.scantable;
5838
    const uint8_t *perm_scantable= s->intra_scantable.permutated;
M
Michael Niedermayer 已提交
5839 5840 5841 5842 5843 5844
    int max=0;
    unsigned int threshold1, threshold2;
    int bias=0;
    int run_tab[65];
    int level_tab[65];
    int score_tab[65];
5845 5846
    int survivor[65];
    int survivor_count;
5847 5848 5849
    int last_run=0;
    int last_level=0;
    int last_score= 0;
5850
    int last_i;
5851
    int coeff[2][64];
M
Michael Niedermayer 已提交
5852
    int coeff_count[64];
5853
    int qmul, qadd, start_i, last_non_zero, i, dc;
M
Michael Niedermayer 已提交
5854 5855 5856
    const int esc_length= s->ac_esc_length;
    uint8_t * length;
    uint8_t * last_length;
5857
    const int lambda= s->lambda2 >> (FF_LAMBDA_SHIFT - 6);
5858

5859
    s->dsp.fdct (block);
5860

5861
    if(s->dct_error_sum)
M
Michael Niedermayer 已提交
5862
        s->denoise_dct(s, block);
M
Michael Niedermayer 已提交
5863 5864
    qmul= qscale*16;
    qadd= ((qscale-1)|1)*8;
5865

M
Michael Niedermayer 已提交
5866 5867 5868 5869 5870 5871 5872 5873 5874 5875 5876 5877 5878
    if (s->mb_intra) {
        int q;
        if (!s->h263_aic) {
            if (n < 4)
                q = s->y_dc_scale;
            else
                q = s->c_dc_scale;
            q = q << 3;
        } else{
            /* For AIC we skip quant/dequant of INTRADC */
            q = 1 << 3;
            qadd=0;
        }
5879

M
Michael Niedermayer 已提交
5880 5881 5882 5883 5884
        /* note: block[0] is assumed to be positive */
        block[0] = (block[0] + (q >> 1)) / q;
        start_i = 1;
        last_non_zero = 0;
        qmat = s->q_intra_matrix[qscale];
5885
        if(s->mpeg_quant || s->out_format == FMT_MPEG1)
M
Michael Niedermayer 已提交
5886 5887 5888 5889 5890 5891 5892 5893 5894 5895
            bias= 1<<(QMAT_SHIFT-1);
        length     = s->intra_ac_vlc_length;
        last_length= s->intra_ac_vlc_last_length;
    } else {
        start_i = 0;
        last_non_zero = -1;
        qmat = s->q_inter_matrix[qscale];
        length     = s->inter_ac_vlc_length;
        last_length= s->inter_ac_vlc_last_length;
    }
5896
    last_i= start_i;
M
Michael Niedermayer 已提交
5897 5898 5899

    threshold1= (1<<QMAT_SHIFT) - bias - 1;
    threshold2= (threshold1<<1);
5900

5901 5902 5903 5904 5905 5906 5907 5908 5909 5910 5911
    for(i=63; i>=start_i; i--) {
        const int j = scantable[i];
        int level = block[j] * qmat[j];

        if(((unsigned)(level+threshold1))>threshold2){
            last_non_zero = i;
            break;
        }
    }

    for(i=start_i; i<=last_non_zero; i++) {
M
Michael Niedermayer 已提交
5912
        const int j = scantable[i];
5913
        int level = block[j] * qmat[j];
M
Michael Niedermayer 已提交
5914 5915 5916 5917 5918 5919

//        if(   bias+level >= (1<<(QMAT_SHIFT - 3))
//           || bias-level >= (1<<(QMAT_SHIFT - 3))){
        if(((unsigned)(level+threshold1))>threshold2){
            if(level>0){
                level= (bias + level)>>QMAT_SHIFT;
5920 5921
                coeff[0][i]= level;
                coeff[1][i]= level-1;
5922
//                coeff[2][k]= level-2;
M
Michael Niedermayer 已提交
5923 5924
            }else{
                level= (bias - level)>>QMAT_SHIFT;
5925 5926
                coeff[0][i]= -level;
                coeff[1][i]= -level+1;
5927
//                coeff[2][k]= -level+2;
M
Michael Niedermayer 已提交
5928
            }
5929 5930
            coeff_count[i]= FFMIN(level, 2);
            assert(coeff_count[i]);
M
Michael Niedermayer 已提交
5931 5932
            max |=level;
        }else{
5933 5934
            coeff[0][i]= (level>>31)|1;
            coeff_count[i]= 1;
M
Michael Niedermayer 已提交
5935 5936
        }
    }
5937

5938
    *overflow= s->max_qcoeff < max; //overflow might have happened
5939

M
Michael Niedermayer 已提交
5940 5941 5942 5943 5944
    if(last_non_zero < start_i){
        memset(block + start_i, 0, (64-start_i)*sizeof(DCTELEM));
        return last_non_zero;
    }

5945 5946 5947
    score_tab[start_i]= 0;
    survivor[0]= start_i;
    survivor_count= 1;
5948

5949 5950
    for(i=start_i; i<=last_non_zero; i++){
        int level_index, j;
D
Diego Biurrun 已提交
5951
        const int dct_coeff= FFABS(block[ scantable[i] ]);
M
Michael Niedermayer 已提交
5952
        const int zero_distoration= dct_coeff*dct_coeff;
5953
        int best_score=256*256*256*120;
M
Michael Niedermayer 已提交
5954 5955 5956
        for(level_index=0; level_index < coeff_count[i]; level_index++){
            int distoration;
            int level= coeff[level_index][i];
D
Diego Biurrun 已提交
5957
            const int alevel= FFABS(level);
M
Michael Niedermayer 已提交
5958
            int unquant_coeff;
5959

M
Michael Niedermayer 已提交
5960 5961 5962
            assert(level);

            if(s->out_format == FMT_H263){
M
cleanup  
Michael Niedermayer 已提交
5963
                unquant_coeff= alevel*qmul + qadd;
5964
            }else{ //MPEG1
5965
                j= s->dsp.idct_permutation[ scantable[i] ]; //FIXME optimize
5966
                if(s->mb_intra){
M
cleanup  
Michael Niedermayer 已提交
5967
                        unquant_coeff = (int)(  alevel  * qscale * s->intra_matrix[j]) >> 3;
5968 5969
                        unquant_coeff =   (unquant_coeff - 1) | 1;
                }else{
M
cleanup  
Michael Niedermayer 已提交
5970
                        unquant_coeff = (((  alevel  << 1) + 1) * qscale * ((int) s->inter_matrix[j])) >> 4;
5971 5972 5973 5974
                        unquant_coeff =   (unquant_coeff - 1) | 1;
                }
                unquant_coeff<<= 3;
            }
5975

5976
            distoration= (unquant_coeff - dct_coeff) * (unquant_coeff - dct_coeff) - zero_distoration;
M
Michael Niedermayer 已提交
5977 5978
            level+=64;
            if((level&(~127)) == 0){
5979 5980
                for(j=survivor_count-1; j>=0; j--){
                    int run= i - survivor[j];
5981
                    int score= distoration + length[UNI_AC_ENC_INDEX(run, level)]*lambda;
M
Michael Niedermayer 已提交
5982
                    score += score_tab[i-run];
5983

M
Michael Niedermayer 已提交
5984
                    if(score < best_score){
5985
                        best_score= score;
M
Michael Niedermayer 已提交
5986 5987 5988 5989 5990 5991
                        run_tab[i+1]= run;
                        level_tab[i+1]= level-64;
                    }
                }

                if(s->out_format == FMT_H263){
5992 5993
                    for(j=survivor_count-1; j>=0; j--){
                        int run= i - survivor[j];
5994
                        int score= distoration + last_length[UNI_AC_ENC_INDEX(run, level)]*lambda;
M
Michael Niedermayer 已提交
5995
                        score += score_tab[i-run];
5996 5997 5998 5999 6000
                        if(score < last_score){
                            last_score= score;
                            last_run= run;
                            last_level= level-64;
                            last_i= i+1;
M
Michael Niedermayer 已提交
6001 6002 6003 6004 6005
                        }
                    }
                }
            }else{
                distoration += esc_length*lambda;
6006 6007
                for(j=survivor_count-1; j>=0; j--){
                    int run= i - survivor[j];
M
Michael Niedermayer 已提交
6008
                    int score= distoration + score_tab[i-run];
6009

M
Michael Niedermayer 已提交
6010
                    if(score < best_score){
6011
                        best_score= score;
M
Michael Niedermayer 已提交
6012 6013 6014 6015 6016 6017
                        run_tab[i+1]= run;
                        level_tab[i+1]= level-64;
                    }
                }

                if(s->out_format == FMT_H263){
6018 6019
                  for(j=survivor_count-1; j>=0; j--){
                        int run= i - survivor[j];
M
Michael Niedermayer 已提交
6020
                        int score= distoration + score_tab[i-run];
6021 6022 6023 6024 6025
                        if(score < last_score){
                            last_score= score;
                            last_run= run;
                            last_level= level-64;
                            last_i= i+1;
M
Michael Niedermayer 已提交
6026 6027 6028 6029 6030
                        }
                    }
                }
            }
        }
6031

6032 6033
        score_tab[i+1]= best_score;

6034
        //Note: there is a vlc code in mpeg4 which is 1 bit shorter then another one with a shorter run and the same level
6035 6036 6037 6038 6039 6040 6041 6042 6043 6044
        if(last_non_zero <= 27){
            for(; survivor_count; survivor_count--){
                if(score_tab[ survivor[survivor_count-1] ] <= best_score)
                    break;
            }
        }else{
            for(; survivor_count; survivor_count--){
                if(score_tab[ survivor[survivor_count-1] ] <= best_score + lambda)
                    break;
            }
6045
        }
6046 6047

        survivor[ survivor_count++ ]= i+1;
M
Michael Niedermayer 已提交
6048
    }
6049

M
Michael Niedermayer 已提交
6050
    if(s->out_format != FMT_H263){
6051
        last_score= 256*256*256*120;
6052
        for(i= survivor[0]; i<=last_non_zero + 1; i++){
6053
            int score= score_tab[i];
6054 6055
            if(i) score += lambda*2; //FIXME exacter?

6056 6057 6058 6059 6060 6061
            if(score < last_score){
                last_score= score;
                last_i= i;
                last_level= level_tab[i];
                last_run= run_tab[i];
            }
M
Michael Niedermayer 已提交
6062 6063
        }
    }
6064

6065
    s->coded_score[n] = last_score;
6066

D
Diego Biurrun 已提交
6067
    dc= FFABS(block[0]);
6068
    last_non_zero= last_i - 1;
M
Michael Niedermayer 已提交
6069
    memset(block + start_i, 0, (64-start_i)*sizeof(DCTELEM));
6070

M
Michael Niedermayer 已提交
6071 6072
    if(last_non_zero < start_i)
        return last_non_zero;
6073

6074 6075 6076
    if(last_non_zero == 0 && start_i == 0){
        int best_level= 0;
        int best_score= dc * dc;
6077

6078
        for(i=0; i<coeff_count[0]; i++){
6079
            int level= coeff[i][0];
D
Diego Biurrun 已提交
6080
            int alevel= FFABS(level);
M
cleanup  
Michael Niedermayer 已提交
6081
            int unquant_coeff, score, distortion;
6082 6083

            if(s->out_format == FMT_H263){
M
cleanup  
Michael Niedermayer 已提交
6084
                    unquant_coeff= (alevel*qmul + qadd)>>3;
6085
            }else{ //MPEG1
M
cleanup  
Michael Niedermayer 已提交
6086 6087
                    unquant_coeff = (((  alevel  << 1) + 1) * qscale * ((int) s->inter_matrix[0])) >> 4;
                    unquant_coeff =   (unquant_coeff - 1) | 1;
6088 6089 6090 6091
            }
            unquant_coeff = (unquant_coeff + 4) >> 3;
            unquant_coeff<<= 3 + 3;

M
cleanup  
Michael Niedermayer 已提交
6092
            distortion= (unquant_coeff - dc) * (unquant_coeff - dc);
6093
            level+=64;
M
cleanup  
Michael Niedermayer 已提交
6094 6095
            if((level&(~127)) == 0) score= distortion + last_length[UNI_AC_ENC_INDEX(0, level)]*lambda;
            else                    score= distortion + esc_length*lambda;
6096

6097 6098
            if(score < best_score){
                best_score= score;
6099
                best_level= level - 64;
6100 6101 6102
            }
        }
        block[0]= best_level;
6103 6104 6105
        s->coded_score[n] = best_score - dc*dc;
        if(best_level == 0) return -1;
        else                return last_non_zero;
6106
    }
6107

6108 6109
    i= last_i;
    assert(last_level);
6110 6111

    block[ perm_scantable[last_non_zero] ]= last_level;
6112
    i -= last_run + 1;
6113

6114 6115
    for(; i>start_i; i -= run_tab[i] + 1){
        block[ perm_scantable[i-1] ]= level_tab[i];
M
Michael Niedermayer 已提交
6116 6117 6118 6119 6120
    }

    return last_non_zero;
}

M
Michael Niedermayer 已提交
6121 6122 6123 6124 6125 6126 6127 6128 6129 6130 6131 6132 6133 6134 6135 6136 6137 6138 6139 6140 6141 6142 6143 6144 6145 6146
//#define REFINE_STATS 1
static int16_t basis[64][64];

static void build_basis(uint8_t *perm){
    int i, j, x, y;
    emms_c();
    for(i=0; i<8; i++){
        for(j=0; j<8; j++){
            for(y=0; y<8; y++){
                for(x=0; x<8; x++){
                    double s= 0.25*(1<<BASIS_SHIFT);
                    int index= 8*i + j;
                    int perm_index= perm[index];
                    if(i==0) s*= sqrt(0.5);
                    if(j==0) s*= sqrt(0.5);
                    basis[perm_index][8*x + y]= lrintf(s * cos((M_PI/8.0)*i*(x+0.5)) * cos((M_PI/8.0)*j*(y+0.5)));
                }
            }
        }
    }
}

static int dct_quantize_refine(MpegEncContext *s, //FIXME breaks denoise?
                        DCTELEM *block, int16_t *weight, DCTELEM *orig,
                        int n, int qscale){
    int16_t rem[64];
6147
    DECLARE_ALIGNED_16(DCTELEM, d1[64]);
M
Michael Niedermayer 已提交
6148 6149 6150 6151 6152 6153 6154 6155 6156 6157 6158 6159
    const int *qmat;
    const uint8_t *scantable= s->intra_scantable.scantable;
    const uint8_t *perm_scantable= s->intra_scantable.permutated;
//    unsigned int threshold1, threshold2;
//    int bias=0;
    int run_tab[65];
    int prev_run=0;
    int prev_level=0;
    int qmul, qadd, start_i, last_non_zero, i, dc;
    uint8_t * length;
    uint8_t * last_length;
    int lambda;
6160
    int rle_index, run, q = 1, sum; //q is only used when s->mb_intra is true
M
Michael Niedermayer 已提交
6161 6162 6163 6164 6165 6166 6167 6168 6169 6170 6171 6172
#ifdef REFINE_STATS
static int count=0;
static int after_last=0;
static int to_zero=0;
static int from_zero=0;
static int raise=0;
static int lower=0;
static int messed_sign=0;
#endif

    if(basis[0][0] == 0)
        build_basis(s->dsp.idct_permutation);
6173

M
Michael Niedermayer 已提交
6174 6175 6176 6177 6178 6179 6180 6181 6182 6183 6184 6185 6186 6187 6188 6189 6190 6191 6192 6193 6194 6195 6196 6197 6198 6199 6200 6201 6202 6203 6204 6205 6206 6207 6208
    qmul= qscale*2;
    qadd= (qscale-1)|1;
    if (s->mb_intra) {
        if (!s->h263_aic) {
            if (n < 4)
                q = s->y_dc_scale;
            else
                q = s->c_dc_scale;
        } else{
            /* For AIC we skip quant/dequant of INTRADC */
            q = 1;
            qadd=0;
        }
        q <<= RECON_SHIFT-3;
        /* note: block[0] is assumed to be positive */
        dc= block[0]*q;
//        block[0] = (block[0] + (q >> 1)) / q;
        start_i = 1;
        qmat = s->q_intra_matrix[qscale];
//        if(s->mpeg_quant || s->out_format == FMT_MPEG1)
//            bias= 1<<(QMAT_SHIFT-1);
        length     = s->intra_ac_vlc_length;
        last_length= s->intra_ac_vlc_last_length;
    } else {
        dc= 0;
        start_i = 0;
        qmat = s->q_inter_matrix[qscale];
        length     = s->inter_ac_vlc_length;
        last_length= s->inter_ac_vlc_last_length;
    }
    last_non_zero = s->block_last_index[n];

#ifdef REFINE_STATS
{START_TIMER
#endif
6209 6210
    dc += (1<<(RECON_SHIFT-1));
    for(i=0; i<64; i++){
6211
        rem[i]= dc - (orig[i]<<RECON_SHIFT); //FIXME  use orig dirrectly instead of copying to rem[]
M
Michael Niedermayer 已提交
6212 6213 6214 6215 6216 6217 6218 6219 6220 6221
    }
#ifdef REFINE_STATS
STOP_TIMER("memset rem[]")}
#endif
    sum=0;
    for(i=0; i<64; i++){
        int one= 36;
        int qns=4;
        int w;

D
Diego Biurrun 已提交
6222
        w= FFABS(weight[i]) + qns*one;
M
Michael Niedermayer 已提交
6223 6224 6225 6226
        w= 15 + (48*qns*one + w/2)/w; // 16 .. 63

        weight[i] = w;
//        w=weight[i] = (63*qns + (w/2)) / w;
6227

M
Michael Niedermayer 已提交
6228 6229 6230 6231 6232 6233 6234 6235 6236 6237 6238 6239 6240 6241
        assert(w>0);
        assert(w<(1<<6));
        sum += w*w;
    }
    lambda= sum*(uint64_t)s->lambda2 >> (FF_LAMBDA_SHIFT - 6 + 6 + 6 + 6);
#ifdef REFINE_STATS
{START_TIMER
#endif
    run=0;
    rle_index=0;
    for(i=start_i; i<=last_non_zero; i++){
        int j= perm_scantable[i];
        const int level= block[j];
        int coeff;
6242

M
Michael Niedermayer 已提交
6243 6244 6245 6246 6247 6248
        if(level){
            if(level<0) coeff= qmul*level - qadd;
            else        coeff= qmul*level + qadd;
            run_tab[rle_index++]=run;
            run=0;

6249
            s->dsp.add_8x8basis(rem, basis[j], coeff);
M
Michael Niedermayer 已提交
6250 6251 6252 6253 6254 6255 6256 6257 6258 6259 6260 6261 6262
        }else{
            run++;
        }
    }
#ifdef REFINE_STATS
if(last_non_zero>0){
STOP_TIMER("init rem[]")
}
}

{START_TIMER
#endif
    for(;;){
6263
        int best_score=s->dsp.try_8x8basis(rem, weight, basis[0], 0);
M
Michael Niedermayer 已提交
6264 6265
        int best_coeff=0;
        int best_change=0;
6266
        int run2, best_unquant_change=0, analyze_gradient;
M
Michael Niedermayer 已提交
6267 6268 6269
#ifdef REFINE_STATS
{START_TIMER
#endif
6270 6271 6272 6273 6274 6275 6276 6277
        analyze_gradient = last_non_zero > 2 || s->avctx->quantizer_noise_shaping >= 3;

        if(analyze_gradient){
#ifdef REFINE_STATS
{START_TIMER
#endif
            for(i=0; i<64; i++){
                int w= weight[i];
6278

6279 6280 6281 6282 6283 6284 6285 6286 6287 6288 6289 6290
                d1[i] = (rem[i]*w*w + (1<<(RECON_SHIFT+12-1)))>>(RECON_SHIFT+12);
            }
#ifdef REFINE_STATS
STOP_TIMER("rem*w*w")}
{START_TIMER
#endif
            s->dsp.fdct(d1);
#ifdef REFINE_STATS
STOP_TIMER("dct")}
#endif
        }

M
Michael Niedermayer 已提交
6291 6292 6293 6294 6295
        if(start_i){
            const int level= block[0];
            int change, old_coeff;

            assert(s->mb_intra);
6296

M
Michael Niedermayer 已提交
6297
            old_coeff= q*level;
6298

M
Michael Niedermayer 已提交
6299 6300 6301
            for(change=-1; change<=1; change+=2){
                int new_level= level + change;
                int score, new_coeff;
6302

M
Michael Niedermayer 已提交
6303 6304 6305 6306
                new_coeff= q*new_level;
                if(new_coeff >= 2048 || new_coeff < 0)
                    continue;

6307
                score= s->dsp.try_8x8basis(rem, weight, basis[0], new_coeff - old_coeff);
M
Michael Niedermayer 已提交
6308 6309 6310 6311 6312 6313 6314 6315
                if(score<best_score){
                    best_score= score;
                    best_coeff= 0;
                    best_change= change;
                    best_unquant_change= new_coeff - old_coeff;
                }
            }
        }
6316

M
Michael Niedermayer 已提交
6317 6318 6319 6320 6321 6322 6323 6324 6325 6326 6327 6328 6329 6330 6331 6332 6333 6334 6335 6336 6337 6338 6339
        run=0;
        rle_index=0;
        run2= run_tab[rle_index++];
        prev_level=0;
        prev_run=0;

        for(i=start_i; i<64; i++){
            int j= perm_scantable[i];
            const int level= block[j];
            int change, old_coeff;

            if(s->avctx->quantizer_noise_shaping < 3 && i > last_non_zero + 1)
                break;

            if(level){
                if(level<0) old_coeff= qmul*level - qadd;
                else        old_coeff= qmul*level + qadd;
                run2= run_tab[rle_index++]; //FIXME ! maybe after last
            }else{
                old_coeff=0;
                run2--;
                assert(run2>=0 || i >= last_non_zero );
            }
6340

M
Michael Niedermayer 已提交
6341 6342 6343
            for(change=-1; change<=1; change+=2){
                int new_level= level + change;
                int score, new_coeff, unquant_change;
6344

M
Michael Niedermayer 已提交
6345
                score=0;
D
Diego Biurrun 已提交
6346
                if(s->avctx->quantizer_noise_shaping < 2 && FFABS(new_level) > FFABS(level))
M
Michael Niedermayer 已提交
6347 6348 6349 6350 6351 6352 6353 6354
                   continue;

                if(new_level){
                    if(new_level<0) new_coeff= qmul*new_level - qadd;
                    else            new_coeff= qmul*new_level + qadd;
                    if(new_coeff >= 2048 || new_coeff <= -2048)
                        continue;
                    //FIXME check for overflow
6355

M
Michael Niedermayer 已提交
6356 6357 6358 6359 6360 6361 6362 6363 6364 6365
                    if(level){
                        if(level < 63 && level > -63){
                            if(i < last_non_zero)
                                score +=   length[UNI_AC_ENC_INDEX(run, new_level+64)]
                                         - length[UNI_AC_ENC_INDEX(run, level+64)];
                            else
                                score +=   last_length[UNI_AC_ENC_INDEX(run, new_level+64)]
                                         - last_length[UNI_AC_ENC_INDEX(run, level+64)];
                        }
                    }else{
D
Diego Biurrun 已提交
6366
                        assert(FFABS(new_level)==1);
6367

6368 6369 6370 6371 6372 6373
                        if(analyze_gradient){
                            int g= d1[ scantable[i] ];
                            if(g && (g^new_level) >= 0)
                                continue;
                        }

M
Michael Niedermayer 已提交
6374 6375 6376
                        if(i < last_non_zero){
                            int next_i= i + run2 + 1;
                            int next_level= block[ perm_scantable[next_i] ] + 64;
6377

M
Michael Niedermayer 已提交
6378 6379 6380 6381 6382 6383 6384 6385 6386 6387 6388 6389 6390 6391 6392 6393 6394 6395 6396 6397 6398
                            if(next_level&(~127))
                                next_level= 0;

                            if(next_i < last_non_zero)
                                score +=   length[UNI_AC_ENC_INDEX(run, 65)]
                                         + length[UNI_AC_ENC_INDEX(run2, next_level)]
                                         - length[UNI_AC_ENC_INDEX(run + run2 + 1, next_level)];
                            else
                                score +=  length[UNI_AC_ENC_INDEX(run, 65)]
                                        + last_length[UNI_AC_ENC_INDEX(run2, next_level)]
                                        - last_length[UNI_AC_ENC_INDEX(run + run2 + 1, next_level)];
                        }else{
                            score += last_length[UNI_AC_ENC_INDEX(run, 65)];
                            if(prev_level){
                                score +=  length[UNI_AC_ENC_INDEX(prev_run, prev_level)]
                                        - last_length[UNI_AC_ENC_INDEX(prev_run, prev_level)];
                            }
                        }
                    }
                }else{
                    new_coeff=0;
D
Diego Biurrun 已提交
6399
                    assert(FFABS(level)==1);
M
Michael Niedermayer 已提交
6400 6401 6402 6403

                    if(i < last_non_zero){
                        int next_i= i + run2 + 1;
                        int next_level= block[ perm_scantable[next_i] ] + 64;
6404

M
Michael Niedermayer 已提交
6405 6406 6407 6408 6409 6410 6411 6412 6413 6414 6415 6416 6417 6418 6419 6420 6421 6422 6423
                        if(next_level&(~127))
                            next_level= 0;

                        if(next_i < last_non_zero)
                            score +=   length[UNI_AC_ENC_INDEX(run + run2 + 1, next_level)]
                                     - length[UNI_AC_ENC_INDEX(run2, next_level)]
                                     - length[UNI_AC_ENC_INDEX(run, 65)];
                        else
                            score +=   last_length[UNI_AC_ENC_INDEX(run + run2 + 1, next_level)]
                                     - last_length[UNI_AC_ENC_INDEX(run2, next_level)]
                                     - length[UNI_AC_ENC_INDEX(run, 65)];
                    }else{
                        score += -last_length[UNI_AC_ENC_INDEX(run, 65)];
                        if(prev_level){
                            score +=  last_length[UNI_AC_ENC_INDEX(prev_run, prev_level)]
                                    - length[UNI_AC_ENC_INDEX(prev_run, prev_level)];
                        }
                    }
                }
6424

M
Michael Niedermayer 已提交
6425 6426 6427 6428
                score *= lambda;

                unquant_change= new_coeff - old_coeff;
                assert((score < 100*lambda && score > -100*lambda) || lambda==0);
6429

6430
                score+= s->dsp.try_8x8basis(rem, weight, basis[j], unquant_change);
M
Michael Niedermayer 已提交
6431 6432 6433 6434 6435 6436 6437 6438 6439 6440 6441 6442 6443 6444 6445 6446 6447 6448 6449 6450 6451 6452 6453
                if(score<best_score){
                    best_score= score;
                    best_coeff= i;
                    best_change= change;
                    best_unquant_change= unquant_change;
                }
            }
            if(level){
                prev_level= level + 64;
                if(prev_level&(~127))
                    prev_level= 0;
                prev_run= run;
                run=0;
            }else{
                run++;
            }
        }
#ifdef REFINE_STATS
STOP_TIMER("iterative step")}
#endif

        if(best_change){
            int j= perm_scantable[ best_coeff ];
6454

M
Michael Niedermayer 已提交
6455
            block[j] += best_change;
6456

M
Michael Niedermayer 已提交
6457 6458 6459 6460 6461 6462 6463 6464 6465 6466
            if(best_coeff > last_non_zero){
                last_non_zero= best_coeff;
                assert(block[j]);
#ifdef REFINE_STATS
after_last++;
#endif
            }else{
#ifdef REFINE_STATS
if(block[j]){
    if(block[j] - best_change){
D
Diego Biurrun 已提交
6467
        if(FFABS(block[j]) > FFABS(block[j] - best_change)){
M
Michael Niedermayer 已提交
6468 6469 6470 6471 6472 6473 6474 6475 6476 6477 6478 6479 6480 6481 6482 6483 6484 6485 6486 6487 6488 6489 6490 6491 6492 6493 6494
            raise++;
        }else{
            lower++;
        }
    }else{
        from_zero++;
    }
}else{
    to_zero++;
}
#endif
                for(; last_non_zero>=start_i; last_non_zero--){
                    if(block[perm_scantable[last_non_zero]])
                        break;
                }
            }
#ifdef REFINE_STATS
count++;
if(256*256*256*64 % count == 0){
    printf("after_last:%d to_zero:%d from_zero:%d raise:%d lower:%d sign:%d xyp:%d/%d/%d\n", after_last, to_zero, from_zero, raise, lower, messed_sign, s->mb_x, s->mb_y, s->picture_number);
}
#endif
            run=0;
            rle_index=0;
            for(i=start_i; i<=last_non_zero; i++){
                int j= perm_scantable[i];
                const int level= block[j];
6495

M
Michael Niedermayer 已提交
6496 6497 6498 6499 6500 6501 6502
                 if(level){
                     run_tab[rle_index++]=run;
                     run=0;
                 }else{
                     run++;
                 }
            }
6503

6504
            s->dsp.add_8x8basis(rem, basis[j], best_unquant_change);
M
Michael Niedermayer 已提交
6505 6506 6507 6508 6509 6510 6511 6512 6513 6514 6515 6516 6517 6518
        }else{
            break;
        }
    }
#ifdef REFINE_STATS
if(last_non_zero>0){
STOP_TIMER("iterative search")
}
}
#endif

    return last_non_zero;
}

6519
static int dct_quantize_c(MpegEncContext *s,
F
Fabrice Bellard 已提交
6520
                        DCTELEM *block, int n,
6521
                        int qscale, int *overflow)
F
Fabrice Bellard 已提交
6522
{
6523
    int i, j, level, last_non_zero, q, start_i;
F
Fabrice Bellard 已提交
6524
    const int *qmat;
6525
    const uint8_t *scantable= s->intra_scantable.scantable;
6526 6527 6528
    int bias;
    int max=0;
    unsigned int threshold1, threshold2;
6529

6530
    s->dsp.fdct (block);
F
Fabrice Bellard 已提交
6531

6532
    if(s->dct_error_sum)
M
Michael Niedermayer 已提交
6533
        s->denoise_dct(s, block);
6534

F
Fabrice Bellard 已提交
6535
    if (s->mb_intra) {
6536 6537 6538 6539 6540 6541 6542 6543 6544
        if (!s->h263_aic) {
            if (n < 4)
                q = s->y_dc_scale;
            else
                q = s->c_dc_scale;
            q = q << 3;
        } else
            /* For AIC we skip quant/dequant of INTRADC */
            q = 1 << 3;
6545

F
Fabrice Bellard 已提交
6546 6547
        /* note: block[0] is assumed to be positive */
        block[0] = (block[0] + (q >> 1)) / q;
6548
        start_i = 1;
F
Fabrice Bellard 已提交
6549
        last_non_zero = 0;
6550
        qmat = s->q_intra_matrix[qscale];
M
Michael Niedermayer 已提交
6551
        bias= s->intra_quant_bias<<(QMAT_SHIFT - QUANT_BIAS_SHIFT);
F
Fabrice Bellard 已提交
6552
    } else {
6553
        start_i = 0;
F
Fabrice Bellard 已提交
6554
        last_non_zero = -1;
6555
        qmat = s->q_inter_matrix[qscale];
M
Michael Niedermayer 已提交
6556
        bias= s->inter_quant_bias<<(QMAT_SHIFT - QUANT_BIAS_SHIFT);
F
Fabrice Bellard 已提交
6557
    }
M
Michael Niedermayer 已提交
6558 6559
    threshold1= (1<<QMAT_SHIFT) - bias - 1;
    threshold2= (threshold1<<1);
6560 6561 6562
    for(i=63;i>=start_i;i--) {
        j = scantable[i];
        level = block[j] * qmat[j];
F
Fabrice Bellard 已提交
6563

6564 6565 6566 6567 6568 6569 6570 6571
        if(((unsigned)(level+threshold1))>threshold2){
            last_non_zero = i;
            break;
        }else{
            block[j]=0;
        }
    }
    for(i=start_i; i<=last_non_zero; i++) {
M
Michael Niedermayer 已提交
6572
        j = scantable[i];
6573
        level = block[j] * qmat[j];
F
Fabrice Bellard 已提交
6574

M
Michael Niedermayer 已提交
6575 6576
//        if(   bias+level >= (1<<QMAT_SHIFT)
//           || bias-level >= (1<<QMAT_SHIFT)){
6577 6578
        if(((unsigned)(level+threshold1))>threshold2){
            if(level>0){
M
Michael Niedermayer 已提交
6579
                level= (bias + level)>>QMAT_SHIFT;
6580 6581
                block[j]= level;
            }else{
M
Michael Niedermayer 已提交
6582
                level= (bias - level)>>QMAT_SHIFT;
6583 6584 6585 6586 6587
                block[j]= -level;
            }
            max |=level;
        }else{
            block[j]=0;
F
Fabrice Bellard 已提交
6588 6589
        }
    }
6590
    *overflow= s->max_qcoeff < max; //overflow might have happened
6591

M
Michael Niedermayer 已提交
6592
    /* we need this permutation so that we correct the IDCT, we only permute the !=0 elements */
6593
    if (s->dsp.idct_permutation_type != FF_NO_IDCT_PERM)
6594
        ff_block_permute(block, s->dsp.idct_permutation, scantable, last_non_zero);
M
Michael Niedermayer 已提交
6595

F
Fabrice Bellard 已提交
6596 6597 6598
    return last_non_zero;
}

6599 6600
#endif //CONFIG_ENCODERS

6601
static void dct_unquantize_mpeg1_intra_c(MpegEncContext *s,
6602
                                   DCTELEM *block, int n, int qscale)
F
Fabrice Bellard 已提交
6603
{
M
Michael Niedermayer 已提交
6604
    int i, level, nCoeffs;
6605
    const uint16_t *quant_matrix;
F
Fabrice Bellard 已提交
6606

6607
    nCoeffs= s->block_last_index[n];
6608 6609

    if (n < 4)
6610 6611 6612 6613 6614 6615 6616 6617 6618 6619 6620 6621 6622 6623 6624 6625 6626
        block[0] = block[0] * s->y_dc_scale;
    else
        block[0] = block[0] * s->c_dc_scale;
    /* XXX: only mpeg1 */
    quant_matrix = s->intra_matrix;
    for(i=1;i<=nCoeffs;i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
                level = (level - 1) | 1;
                level = -level;
            } else {
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
                level = (level - 1) | 1;
F
Fabrice Bellard 已提交
6627
            }
6628
            block[j] = level;
F
Fabrice Bellard 已提交
6629
        }
6630 6631 6632
    }
}

6633
static void dct_unquantize_mpeg1_inter_c(MpegEncContext *s,
6634 6635 6636 6637 6638 6639
                                   DCTELEM *block, int n, int qscale)
{
    int i, level, nCoeffs;
    const uint16_t *quant_matrix;

    nCoeffs= s->block_last_index[n];
6640

6641 6642 6643 6644 6645 6646 6647 6648 6649 6650 6651 6652 6653 6654 6655
    quant_matrix = s->inter_matrix;
    for(i=0; i<=nCoeffs; i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
                level = (level - 1) | 1;
                level = -level;
            } else {
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
                level = (level - 1) | 1;
F
Fabrice Bellard 已提交
6656
            }
6657
            block[j] = level;
F
Fabrice Bellard 已提交
6658 6659 6660
        }
    }
}
6661

6662
static void dct_unquantize_mpeg2_intra_c(MpegEncContext *s,
6663 6664 6665
                                   DCTELEM *block, int n, int qscale)
{
    int i, level, nCoeffs;
6666
    const uint16_t *quant_matrix;
6667

6668 6669
    if(s->alternate_scan) nCoeffs= 63;
    else nCoeffs= s->block_last_index[n];
6670 6671

    if (n < 4)
6672 6673 6674 6675 6676 6677 6678 6679 6680 6681 6682 6683 6684 6685 6686 6687 6688 6689 6690 6691
        block[0] = block[0] * s->y_dc_scale;
    else
        block[0] = block[0] * s->c_dc_scale;
    quant_matrix = s->intra_matrix;
    for(i=1;i<=nCoeffs;i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
                level = -level;
            } else {
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
            }
            block[j] = level;
        }
    }
}

6692 6693 6694 6695 6696 6697 6698 6699 6700 6701 6702 6703 6704 6705 6706 6707 6708 6709 6710 6711 6712 6713 6714 6715 6716 6717 6718 6719 6720 6721 6722 6723 6724
static void dct_unquantize_mpeg2_intra_bitexact(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale)
{
    int i, level, nCoeffs;
    const uint16_t *quant_matrix;
    int sum=-1;

    if(s->alternate_scan) nCoeffs= 63;
    else nCoeffs= s->block_last_index[n];

    if (n < 4)
        block[0] = block[0] * s->y_dc_scale;
    else
        block[0] = block[0] * s->c_dc_scale;
    quant_matrix = s->intra_matrix;
    for(i=1;i<=nCoeffs;i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
                level = -level;
            } else {
                level = (int)(level * qscale * quant_matrix[j]) >> 3;
            }
            block[j] = level;
            sum+=level;
        }
    }
    block[63]^=sum&1;
}

6725
static void dct_unquantize_mpeg2_inter_c(MpegEncContext *s,
6726 6727 6728 6729 6730 6731 6732 6733
                                   DCTELEM *block, int n, int qscale)
{
    int i, level, nCoeffs;
    const uint16_t *quant_matrix;
    int sum=-1;

    if(s->alternate_scan) nCoeffs= 63;
    else nCoeffs= s->block_last_index[n];
6734

6735 6736 6737 6738 6739 6740 6741 6742 6743 6744 6745 6746 6747 6748 6749 6750 6751 6752 6753 6754 6755
    quant_matrix = s->inter_matrix;
    for(i=0; i<=nCoeffs; i++) {
        int j= s->intra_scantable.permutated[i];
        level = block[j];
        if (level) {
            if (level < 0) {
                level = -level;
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
                level = -level;
            } else {
                level = (((level << 1) + 1) * qscale *
                         ((int) (quant_matrix[j]))) >> 4;
            }
            block[j] = level;
            sum+=level;
        }
    }
    block[63]^=sum&1;
}

6756
static void dct_unquantize_h263_intra_c(MpegEncContext *s,
6757 6758 6759 6760
                                  DCTELEM *block, int n, int qscale)
{
    int i, level, qmul, qadd;
    int nCoeffs;
6761

6762
    assert(s->block_last_index[n]>=0);
6763

6764
    qmul = qscale << 1;
6765

6766
    if (!s->h263_aic) {
6767
        if (n < 4)
6768 6769 6770
            block[0] = block[0] * s->y_dc_scale;
        else
            block[0] = block[0] * s->c_dc_scale;
6771 6772 6773 6774 6775 6776 6777 6778 6779 6780 6781 6782 6783 6784 6785 6786
        qadd = (qscale - 1) | 1;
    }else{
        qadd = 0;
    }
    if(s->ac_pred)
        nCoeffs=63;
    else
        nCoeffs= s->inter_scantable.raster_end[ s->block_last_index[n] ];

    for(i=1; i<=nCoeffs; i++) {
        level = block[i];
        if (level) {
            if (level < 0) {
                level = level * qmul - qadd;
            } else {
                level = level * qmul + qadd;
6787
            }
6788
            block[i] = level;
6789 6790 6791 6792
        }
    }
}

6793
static void dct_unquantize_h263_inter_c(MpegEncContext *s,
6794 6795 6796
                                  DCTELEM *block, int n, int qscale)
{
    int i, level, qmul, qadd;
M
Michael Niedermayer 已提交
6797
    int nCoeffs;
6798

6799
    assert(s->block_last_index[n]>=0);
6800

6801 6802
    qadd = (qscale - 1) | 1;
    qmul = qscale << 1;
6803

6804
    nCoeffs= s->inter_scantable.raster_end[ s->block_last_index[n] ];
6805

6806
    for(i=0; i<=nCoeffs; i++) {
6807 6808 6809 6810 6811 6812 6813 6814 6815 6816 6817
        level = block[i];
        if (level) {
            if (level < 0) {
                level = level * qmul - qadd;
            } else {
                level = level * qmul + qadd;
            }
            block[i] = level;
        }
    }
}
F
Fabrice Bellard 已提交
6818

6819
#ifdef CONFIG_ENCODERS
F
Fabrice Bellard 已提交
6820 6821 6822 6823 6824 6825 6826 6827
AVCodec h263_encoder = {
    "h263",
    CODEC_TYPE_VIDEO,
    CODEC_ID_H263,
    sizeof(MpegEncContext),
    MPV_encode_init,
    MPV_encode_picture,
    MPV_encode_end,
M
Michael Niedermayer 已提交
6828
    .pix_fmts= (enum PixelFormat[]){PIX_FMT_YUV420P, -1},
F
Fabrice Bellard 已提交
6829 6830 6831 6832 6833 6834 6835 6836 6837 6838
};

AVCodec h263p_encoder = {
    "h263p",
    CODEC_TYPE_VIDEO,
    CODEC_ID_H263P,
    sizeof(MpegEncContext),
    MPV_encode_init,
    MPV_encode_picture,
    MPV_encode_end,
M
Michael Niedermayer 已提交
6839
    .pix_fmts= (enum PixelFormat[]){PIX_FMT_YUV420P, -1},
F
Fabrice Bellard 已提交
6840 6841
};

6842 6843 6844 6845 6846 6847 6848 6849
AVCodec flv_encoder = {
    "flv",
    CODEC_TYPE_VIDEO,
    CODEC_ID_FLV1,
    sizeof(MpegEncContext),
    MPV_encode_init,
    MPV_encode_picture,
    MPV_encode_end,
M
Michael Niedermayer 已提交
6850
    .pix_fmts= (enum PixelFormat[]){PIX_FMT_YUV420P, -1},
6851 6852
};

F
Fabrice Bellard 已提交
6853 6854 6855 6856 6857 6858 6859 6860
AVCodec rv10_encoder = {
    "rv10",
    CODEC_TYPE_VIDEO,
    CODEC_ID_RV10,
    sizeof(MpegEncContext),
    MPV_encode_init,
    MPV_encode_picture,
    MPV_encode_end,
M
Michael Niedermayer 已提交
6861
    .pix_fmts= (enum PixelFormat[]){PIX_FMT_YUV420P, -1},
F
Fabrice Bellard 已提交
6862 6863
};

M
Michael Niedermayer 已提交
6864 6865 6866 6867 6868 6869 6870 6871
AVCodec rv20_encoder = {
    "rv20",
    CODEC_TYPE_VIDEO,
    CODEC_ID_RV20,
    sizeof(MpegEncContext),
    MPV_encode_init,
    MPV_encode_picture,
    MPV_encode_end,
M
Michael Niedermayer 已提交
6872
    .pix_fmts= (enum PixelFormat[]){PIX_FMT_YUV420P, -1},
M
Michael Niedermayer 已提交
6873 6874
};

F
Fabrice Bellard 已提交
6875 6876
AVCodec mpeg4_encoder = {
    "mpeg4",
F
Fabrice Bellard 已提交
6877
    CODEC_TYPE_VIDEO,
F
Fabrice Bellard 已提交
6878
    CODEC_ID_MPEG4,
F
Fabrice Bellard 已提交
6879 6880 6881 6882
    sizeof(MpegEncContext),
    MPV_encode_init,
    MPV_encode_picture,
    MPV_encode_end,
M
Michael Niedermayer 已提交
6883
    .pix_fmts= (enum PixelFormat[]){PIX_FMT_YUV420P, -1},
6884
    .capabilities= CODEC_CAP_DELAY,
F
Fabrice Bellard 已提交
6885 6886
};

6887 6888 6889 6890 6891 6892 6893 6894
AVCodec msmpeg4v1_encoder = {
    "msmpeg4v1",
    CODEC_TYPE_VIDEO,
    CODEC_ID_MSMPEG4V1,
    sizeof(MpegEncContext),
    MPV_encode_init,
    MPV_encode_picture,
    MPV_encode_end,
M
Michael Niedermayer 已提交
6895
    .pix_fmts= (enum PixelFormat[]){PIX_FMT_YUV420P, -1},
6896 6897 6898 6899 6900 6901 6902 6903 6904 6905
};

AVCodec msmpeg4v2_encoder = {
    "msmpeg4v2",
    CODEC_TYPE_VIDEO,
    CODEC_ID_MSMPEG4V2,
    sizeof(MpegEncContext),
    MPV_encode_init,
    MPV_encode_picture,
    MPV_encode_end,
M
Michael Niedermayer 已提交
6906
    .pix_fmts= (enum PixelFormat[]){PIX_FMT_YUV420P, -1},
6907 6908 6909
};

AVCodec msmpeg4v3_encoder = {
F
Fabrice Bellard 已提交
6910 6911
    "msmpeg4",
    CODEC_TYPE_VIDEO,
6912
    CODEC_ID_MSMPEG4V3,
F
Fabrice Bellard 已提交
6913 6914 6915 6916
    sizeof(MpegEncContext),
    MPV_encode_init,
    MPV_encode_picture,
    MPV_encode_end,
M
Michael Niedermayer 已提交
6917
    .pix_fmts= (enum PixelFormat[]){PIX_FMT_YUV420P, -1},
F
Fabrice Bellard 已提交
6918
};
M
Michael Niedermayer 已提交
6919 6920 6921 6922 6923 6924 6925 6926 6927

AVCodec wmv1_encoder = {
    "wmv1",
    CODEC_TYPE_VIDEO,
    CODEC_ID_WMV1,
    sizeof(MpegEncContext),
    MPV_encode_init,
    MPV_encode_picture,
    MPV_encode_end,
M
Michael Niedermayer 已提交
6928
    .pix_fmts= (enum PixelFormat[]){PIX_FMT_YUV420P, -1},
M
Michael Niedermayer 已提交
6929 6930
};

6931
#ifdef CONFIG_MJPEG_ENCODER
M
Michael Niedermayer 已提交
6932 6933 6934 6935 6936 6937 6938 6939
AVCodec mjpeg_encoder = {
    "mjpeg",
    CODEC_TYPE_VIDEO,
    CODEC_ID_MJPEG,
    sizeof(MpegEncContext),
    MPV_encode_init,
    MPV_encode_picture,
    MPV_encode_end,
B
Baptiste Coudurier 已提交
6940
    .pix_fmts= (enum PixelFormat[]){PIX_FMT_YUVJ420P, PIX_FMT_YUVJ422P, -1},
M
Michael Niedermayer 已提交
6941
};
6942
#endif
6943 6944

#endif //CONFIG_ENCODERS