mpegvideo.c 138.2 KB
Newer Older
F
Fabrice Bellard 已提交
1 2
/*
 * The simplest mpeg encoder (well, it was the simplest!)
F
Fabrice Bellard 已提交
3
 * Copyright (c) 2000,2001 Fabrice Bellard.
F
Fabrice Bellard 已提交
4
 *
F
Fabrice Bellard 已提交
5 6 7 8
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
F
Fabrice Bellard 已提交
9
 *
F
Fabrice Bellard 已提交
10
 * This library is distributed in the hope that it will be useful,
F
Fabrice Bellard 已提交
11
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
F
Fabrice Bellard 已提交
12 13
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
F
Fabrice Bellard 已提交
14
 *
F
Fabrice Bellard 已提交
15 16 17
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
M
Michael Niedermayer 已提交
18
 *
19
 * 4MV & hq & b-frame encoding stuff by Michael Niedermayer <michaelni@gmx.at>
F
Fabrice Bellard 已提交
20
 */
21
 
M
Michael Niedermayer 已提交
22 23 24 25 26
/**
 * @file mpegvideo.c
 * The simplest mpeg encoder (well, it was the simplest!).
 */ 
 
27
#include <ctype.h>
28
#include <limits.h>
F
Fabrice Bellard 已提交
29 30 31 32
#include "avcodec.h"
#include "dsputil.h"
#include "mpegvideo.h"

33 34 35 36
#ifdef USE_FASTMEMCPY
#include "fastmemcpy.h"
#endif

37 38 39
//#undef NDEBUG
//#include <assert.h>

40
#ifdef CONFIG_ENCODERS
41
static void encode_picture(MpegEncContext *s, int picture_number);
42
#endif //CONFIG_ENCODERS
43 44
static void dct_unquantize_mpeg1_c(MpegEncContext *s, 
                                   DCTELEM *block, int n, int qscale);
45 46
static void dct_unquantize_mpeg2_c(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale);
47 48
static void dct_unquantize_h263_c(MpegEncContext *s, 
                                  DCTELEM *block, int n, int qscale);
49
static void draw_edges_c(uint8_t *buf, int wrap, int width, int height, int w);
50
#ifdef CONFIG_ENCODERS
51
static int dct_quantize_c(MpegEncContext *s, DCTELEM *block, int n, int qscale, int *overflow);
M
Michael Niedermayer 已提交
52
static int dct_quantize_trellis_c(MpegEncContext *s, DCTELEM *block, int n, int qscale, int *overflow);
53
#endif //CONFIG_ENCODERS
M
Michael Niedermayer 已提交
54

55
void (*draw_edges)(uint8_t *buf, int wrap, int width, int height, int w)= draw_edges_c;
M
Michael Niedermayer 已提交
56

F
Fabrice Bellard 已提交
57 58 59 60 61 62

/* enable all paranoid tests for rounding, overflows, etc... */
//#define PARANOID

//#define DEBUG

63

F
Fabrice Bellard 已提交
64 65 66
/* for jpeg fast DCT */
#define CONST_BITS 14

67
/*
 * Per-coefficient scale factors for the fast jpeg forward DCT; they are
 * divided out in the fdct_ifast branch of convert_matrix().
 * The 8x8 table is symmetric and stored in raster order.
 */
static const uint16_t aanscales[64] = {
    /* precomputed values scaled up by 14 bits */
    16384, 22725, 21407, 19266, 16384, 12873,  8867,  4520,
    22725, 31521, 29692, 26722, 22725, 17855, 12299,  6270,
    21407, 29692, 27969, 25172, 21407, 16819, 11585,  5906,
    19266, 26722, 25172, 22654, 19266, 15137, 10426,  5315,
    16384, 22725, 21407, 19266, 16384, 12873,  8867,  4520,
    12873, 17855, 16819, 15137, 12873, 10114,  6967,  3552,
     8867, 12299, 11585, 10426,  8867,  6967,  4799,  2446,
     4520,  6270,  5906,  5315,  4520,  3552,  2446,  1247
};

79
/*
 * Rounding table with 16 entries, indexed 0..15.
 * NOTE(review): presumably used to round chroma motion vectors derived from
 * luma vectors; the users of this table are outside this part of the file.
 */
static const uint8_t h263_chroma_roundtab[16] = {
//  0  1  2  3  4  5  6  7  8  9 10 11 12 13 14 15
    0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2,
};

84
#ifdef CONFIG_ENCODERS
85 86
static uint16_t (*default_mv_penalty)[MAX_MV*2+1]=NULL;
static uint8_t default_fcode_tab[MAX_MV*2+1];
87

M
Michael Niedermayer 已提交
88 89
enum PixelFormat ff_yuv420p_list[2]= {PIX_FMT_YUV420P, -1};

90
/**
 * Precomputes the reciprocal quantization tables for every qscale in
 * [qmin, qmax].
 *
 * Which tables are written depends on the forward DCT in s->dsp.fdct:
 *  - ff_jpeg_fdct_islow: only qmat, reciprocal of qscale * quant_matrix
 *  - fdct_ifast:         only qmat, additionally divided by aanscales[]
 *  - anything else:      qmat, qmat16 and qmat16_bias
 *
 * @param s            context, provides dsp.fdct and dsp.idct_permutation
 * @param qmat         [qscale][64] 32 bit reciprocals (QMAT_SHIFT fixed point)
 * @param qmat16       [qscale][64] 16 bit reciprocals (QMAT_SHIFT_MMX fixed point)
 * @param qmat16_bias  [qscale][64] bias<<(16-QUANT_BIAS_SHIFT) divided (rounded)
 *                     by the matching qmat16 entry
 * @param quant_matrix 64 entry quantization matrix, read through idct_permutation
 * @param bias         quantizer bias
 * @param qmin         first qscale to compute
 * @param qmax         last qscale to compute (inclusive)
 */
static void convert_matrix(MpegEncContext *s, int (*qmat)[64], uint16_t (*qmat16)[64], uint16_t (*qmat16_bias)[64],
                           const uint16_t *quant_matrix, int bias, int qmin, int qmax)
{
    int qscale;

    for(qscale=qmin; qscale<=qmax; qscale++){
        int i;
        if (s->dsp.fdct == ff_jpeg_fdct_islow) {
            for(i=0;i<64;i++) {
                const int j= s->dsp.idct_permutation[i];
                /* no aanscales factor in this branch, only
                   qscale * quant_matrix[j] is divided out */
                qmat[qscale][i] = (int)((uint64_t_C(1) << QMAT_SHIFT) / 
                                (qscale * quant_matrix[j]));
            }
        } else if (s->dsp.fdct == fdct_ifast) {
            for(i=0;i<64;i++) {
                const int j= s->dsp.idct_permutation[i];
                /* 16 <= qscale * quant_matrix[i] <= 7905 */
                /* 19952         <= aanscales[i] * qscale * quant_matrix[i]           <= 249205026 */
                /* (1<<36)/19952 >= (1<<36)/(aanscales[i] * qscale * quant_matrix[i]) >= (1<<36)/249205026 */
                /* 3444240       >= (1<<36)/(aanscales[i] * qscale * quant_matrix[i]) >= 275 */

                /* aanscales[] is scaled up by CONST_BITS, compensate for that */
                qmat[qscale][i] = (int)((uint64_t_C(1) << (QMAT_SHIFT + CONST_BITS)) / 
                                (aanscales[i] * qscale * quant_matrix[j]));
            }
        } else {
            for(i=0;i<64;i++) {
                const int j= s->dsp.idct_permutation[i];
                /* We can safely suppose that 16 <= quant_matrix[i] <= 255
                   So 16           <= qscale * quant_matrix[i]             <= 7905
                   so (1<<19) / 16 >= (1<<19) / (qscale * quant_matrix[i]) >= (1<<19) / 7905
                   so 32768        >= (1<<19) / (qscale * quant_matrix[i]) >= 67
                */
                qmat[qscale][i] = (int)((uint64_t_C(1) << QMAT_SHIFT) / (qscale * quant_matrix[j]));
//                qmat  [qscale][i] = (1 << QMAT_SHIFT_MMX) / (qscale * quant_matrix[i]);
                qmat16[qscale][i] = (1 << QMAT_SHIFT_MMX) / (qscale * quant_matrix[j]);

                /* keep the 16 bit reciprocal non-zero and below 128*256 */
                if(qmat16[qscale][i]==0 || qmat16[qscale][i]==128*256) qmat16[qscale][i]=128*256-1;
                qmat16_bias[qscale][i]= ROUNDED_DIV(bias<<(16-QUANT_BIAS_SHIFT), qmat16[qscale][i]);
            }
        }
    }
}
137 138
#endif //CONFIG_ENCODERS

139 140 141 142 143 144 145 146 147
// move into common.c perhaps
/*
 * Allocates size bytes with av_mallocz() and stores the pointer in p.
 * If the allocation fails, the error is reported with perror() and control
 * jumps to the label "fail", which the function using the macro has to
 * provide.
 * The expansion is a bare { } block, so an invocation compiles with or
 * without a trailing semicolon; both forms are used in this file.
 */
#define CHECKED_ALLOCZ(p, size)\
{\
    p= av_mallocz(size);\
    if(p==NULL){\
        perror("malloc");\
        goto fail;\
    }\
}
148

149
/**
 * Fills a ScanTable from a source scan order.
 *
 * @param s             context, provides dsp.idct_permutation
 * @param st            table to fill: scantable, permutated, raster_end
 *                      (and inverse when ARCH_POWERPC is defined)
 * @param src_scantable 64 entry scan order; the pointer itself is stored in
 *                      st->scantable, so it has to stay valid
 */
void ff_init_scantable(MpegEncContext *s, ScanTable *st, const uint8_t *src_scantable){
    int pos;
    int highest= -1;

    st->scantable= src_scantable;

    /* first pass: run every scan position through the idct permutation */
    for(pos=0; pos<64; pos++){
        const int coeff= src_scantable[pos];

        st->permutated[pos]= s->dsp.idct_permutation[coeff];
#ifdef ARCH_POWERPC
        st->inverse[coeff]= pos;
#endif
    }

    /* second pass: raster_end[pos] is the largest permutated index seen
       in scan positions 0..pos */
    for(pos=0; pos<64; pos++){
        const int permuted= st->permutated[pos];

        if(highest < permuted)
            highest= permuted;
        st->raster_end[pos]= highest;
    }
}

173 174
/**
 * Initializes the DCT related parts of the context that encoder and decoder
 * share: the (un)quantizer function pointers, the permutated scantables and
 * the default picture structure.
 *
 * @return always 0
 */
int DCT_common_init(MpegEncContext *s)
{
    /* start with the C implementations from this file */
    s->dct_unquantize_mpeg1 = dct_unquantize_mpeg1_c;
    s->dct_unquantize_mpeg2 = dct_unquantize_mpeg2_c;
    s->dct_unquantize_h263  = dct_unquantize_h263_c;

#ifdef CONFIG_ENCODERS
    s->dct_quantize= dct_quantize_c;
#endif

    /* architecture specific init hooks, one per enabled platform */
#ifdef HAVE_MMX
    MPV_common_init_mmx(s);
#endif
#ifdef ARCH_ALPHA
    MPV_common_init_axp(s);
#endif
#ifdef HAVE_MLIB
    MPV_common_init_mlib(s);
#endif
#ifdef HAVE_MMI
    MPV_common_init_mmi(s);
#endif
#ifdef ARCH_ARMV4L
    MPV_common_init_armv4l(s);
#endif
#ifdef ARCH_POWERPC
    MPV_common_init_ppc(s);
#endif

#ifdef CONFIG_ENCODERS
    /* whatever quantizer is selected at this point is kept as the fast one,
       the trellis quantizer may then replace the default */
    s->fast_dct_quantize= s->dct_quantize;

    if(s->flags&CODEC_FLAG_TRELLIS_QUANT)
        s->dct_quantize= dct_quantize_trellis_c; //move before MPV_common_init_*
#endif //CONFIG_ENCODERS

    /* load & permutate scantables
       note: only wmv uses different ones
    */
    ff_init_scantable(s, &s->inter_scantable  , ff_zigzag_direct);
    ff_init_scantable(s, &s->intra_scantable  , ff_zigzag_direct);
    ff_init_scantable(s, &s->intra_h_scantable, ff_alternate_horizontal_scan);
    ff_init_scantable(s, &s->intra_v_scantable, ff_alternate_vertical_scan);

    s->picture_structure= PICT_FRAME;

    return 0;
}

M
cleanup  
Michael Niedermayer 已提交
225
/**
M
Michael Niedermayer 已提交
226 227
 * allocates a Picture
 * The pixels are allocated/set by calling get_buffer() if shared=0
M
cleanup  
Michael Niedermayer 已提交
228
 */
M
Michael Niedermayer 已提交
229 230 231 232 233 234 235 236 237 238 239
static int alloc_picture(MpegEncContext *s, Picture *pic, int shared){
    
    if(shared){
        assert(pic->data[0]);
        assert(pic->type == 0 || pic->type == FF_BUFFER_TYPE_SHARED);
        pic->type= FF_BUFFER_TYPE_SHARED;
    }else{
        int r;
        
        assert(!pic->data[0]);
        
M
Michael Niedermayer 已提交
240
        r= s->avctx->get_buffer(s->avctx, (AVFrame*)pic);
M
Michael Niedermayer 已提交
241 242
        
        if(r<0 || !pic->age || !pic->type || !pic->data[0]){
243
            fprintf(stderr, "get_buffer() failed (%d %d %d %p)\n", r, pic->age, pic->type, pic->data[0]);
M
Michael Niedermayer 已提交
244 245 246 247 248 249 250 251 252 253 254 255 256 257 258
            return -1;
        }

        if(s->linesize && (s->linesize != pic->linesize[0] || s->uvlinesize != pic->linesize[1])){
            fprintf(stderr, "get_buffer() failed (stride changed)\n");
            return -1;
        }

        if(pic->linesize[1] != pic->linesize[2]){
            fprintf(stderr, "get_buffer() failed (uv stride missmatch)\n");
            return -1;
        }

        s->linesize  = pic->linesize[0];
        s->uvlinesize= pic->linesize[1];
M
cleanup  
Michael Niedermayer 已提交
259
    }
M
Michael Niedermayer 已提交
260 261 262
    
    if(pic->qscale_table==NULL){
        if (s->encoding) {        
263 264 265
            CHECKED_ALLOCZ(pic->mb_var   , s->mb_num * sizeof(int16_t))
            CHECKED_ALLOCZ(pic->mc_mb_var, s->mb_num * sizeof(int16_t))
            CHECKED_ALLOCZ(pic->mb_mean  , s->mb_num * sizeof(int8_t))
266
            CHECKED_ALLOCZ(pic->mb_cmp_score, s->mb_num * sizeof(int32_t))
M
Michael Niedermayer 已提交
267
        }
M
cleanup  
Michael Niedermayer 已提交
268

269 270
        CHECKED_ALLOCZ(pic->mbskip_table , s->mb_num * sizeof(uint8_t)+1) //the +1 is for the slice end check
        CHECKED_ALLOCZ(pic->qscale_table , s->mb_num * sizeof(uint8_t))
M
Michael Niedermayer 已提交
271 272
        pic->qstride= s->mb_width;
    }
M
cleanup  
Michael Niedermayer 已提交
273
    
274 275 276 277 278 279
    //it might be nicer if the application would keep track of these but it would require a API change
    memmove(s->prev_pict_types+1, s->prev_pict_types, PREV_PICT_TYPES_BUFFER_SIZE-1);
    s->prev_pict_types[0]= s->pict_type;
    if(pic->age < PREV_PICT_TYPES_BUFFER_SIZE && s->prev_pict_types[pic->age] == B_TYPE)
        pic->age= INT_MAX; // skiped MBs in b frames are quite rare in mpeg1/2 and its a bit tricky to skip them anyway
    
M
cleanup  
Michael Niedermayer 已提交
280 281 282 283 284
    return 0;
fail: //for the CHECKED_ALLOCZ macro
    return -1;
}

M
Michael Niedermayer 已提交
285 286 287
/**
 * deallocates a picture
 */
M
cleanup  
Michael Niedermayer 已提交
288 289
static void free_picture(MpegEncContext *s, Picture *pic){
    int i;
M
Michael Niedermayer 已提交
290 291

    if(pic->data[0] && pic->type!=FF_BUFFER_TYPE_SHARED){
M
Michael Niedermayer 已提交
292
        s->avctx->release_buffer(s->avctx, (AVFrame*)pic);
M
Michael Niedermayer 已提交
293 294
    }

M
cleanup  
Michael Niedermayer 已提交
295 296 297
    av_freep(&pic->mb_var);
    av_freep(&pic->mc_mb_var);
    av_freep(&pic->mb_mean);
298
    av_freep(&pic->mb_cmp_score);
M
cleanup  
Michael Niedermayer 已提交
299 300 301
    av_freep(&pic->mbskip_table);
    av_freep(&pic->qscale_table);
    
M
Michael Niedermayer 已提交
302
    if(pic->type == FF_BUFFER_TYPE_INTERNAL){
M
cleanup  
Michael Niedermayer 已提交
303 304 305 306 307
        for(i=0; i<4; i++){
            av_freep(&pic->base[i]);
            pic->data[i]= NULL;
        }
        av_freep(&pic->opaque);
M
Michael Niedermayer 已提交
308 309 310 311 312 313 314
        pic->type= 0;
    }else if(pic->type == FF_BUFFER_TYPE_SHARED){
        for(i=0; i<4; i++){
            pic->base[i]=
            pic->data[i]= NULL;
        }
        pic->type= 0;        
M
cleanup  
Michael Niedermayer 已提交
315 316 317
    }
}

318 319 320
/**
 * init common structure for both encoder and decoder
 *
 * Derives the macroblock geometry from s->width / s->height and allocates
 * the tables that depend on it. s->avctx, s->width, s->height, s->encoding,
 * s->codec_id and s->out_format are read, so they have to be set by the
 * caller.
 *
 * @return 0 on success, -1 if an allocation failed; in that case everything
 *         allocated so far has been freed again with MPV_common_end()
 */
int MPV_common_init(MpegEncContext *s)
{
    int y_size, c_size, yc_size, i;

    /* copy the flags first, DCT_common_init() tests s->flags */
    s->flags= s->avctx->flags;

    dsputil_init(&s->dsp, s->avctx);
    DCT_common_init(s);

    s->mb_width  = (s->width  + 15) / 16;
    s->mb_height = (s->height + 15) / 16;

    /* set default edge pos, will be overriden in decode_header if needed */
    s->h_edge_pos= s->mb_width*16;
    s->v_edge_pos= s->mb_height*16;

    s->mb_num = s->mb_width * s->mb_height;

    y_size = (2 * s->mb_width + 2) * (2 * s->mb_height + 2);
    c_size = (s->mb_width + 2) * (s->mb_height + 2);
    yc_size = y_size + 2 * c_size;

    /* convert fourcc to upper case
       (unsigned arithmetic, a byte >= 0x80 must not be shifted into the sign bit) */
    s->avctx->codec_tag=   (unsigned)toupper( s->avctx->codec_tag     &0xFF)
                        + ((unsigned)toupper((s->avctx->codec_tag>>8 )&0xFF)<<8 )
                        + ((unsigned)toupper((s->avctx->codec_tag>>16)&0xFF)<<16)
                        + ((unsigned)toupper((s->avctx->codec_tag>>24)&0xFF)<<24);

    CHECKED_ALLOCZ(s->allocated_edge_emu_buffer, (s->width+64)*2*17*2); //(width + edge + align)*interlaced*MBsize*tolerance
    s->edge_emu_buffer= s->allocated_edge_emu_buffer + (s->width+64)*2*17;

    s->avctx->coded_frame= (AVFrame*)&s->current_picture;

    if (s->encoding) {
        int mv_table_size= (s->mb_width+2)*(s->mb_height+2);

        /* Allocate MV tables */
        CHECKED_ALLOCZ(s->p_mv_table            , mv_table_size * 2 * sizeof(int16_t))
        CHECKED_ALLOCZ(s->b_forw_mv_table       , mv_table_size * 2 * sizeof(int16_t))
        CHECKED_ALLOCZ(s->b_back_mv_table       , mv_table_size * 2 * sizeof(int16_t))
        CHECKED_ALLOCZ(s->b_bidir_forw_mv_table , mv_table_size * 2 * sizeof(int16_t))
        CHECKED_ALLOCZ(s->b_bidir_back_mv_table , mv_table_size * 2 * sizeof(int16_t))
        CHECKED_ALLOCZ(s->b_direct_mv_table     , mv_table_size * 2 * sizeof(int16_t))

        //FIXME should be linesize instead of s->width*2 but that isnt known before get_buffer()
        CHECKED_ALLOCZ(s->me.scratchpad,  s->width*2*16*3*sizeof(uint8_t))

        CHECKED_ALLOCZ(s->me.map      , ME_MAP_SIZE*sizeof(uint32_t))
        CHECKED_ALLOCZ(s->me.score_map, ME_MAP_SIZE*sizeof(uint32_t))

        if(s->codec_id==CODEC_ID_MPEG4){
            CHECKED_ALLOCZ(s->tex_pb_buffer, PB_BUFFER_SIZE);
            CHECKED_ALLOCZ(   s->pb2_buffer, PB_BUFFER_SIZE);
        }

        if(s->msmpeg4_version){
            CHECKED_ALLOCZ(s->ac_stats, 2*2*(MAX_LEVEL+1)*(MAX_RUN+1)*2*sizeof(int));
        }
        CHECKED_ALLOCZ(s->avctx->stats_out, 256);
    }

    CHECKED_ALLOCZ(s->error_status_table, s->mb_num*sizeof(uint8_t))

    if (s->out_format == FMT_H263 || s->encoding) {
        /* Allocate MB type table */
        CHECKED_ALLOCZ(s->mb_type  , s->mb_num * sizeof(uint8_t))

        /* MV prediction, one vector (2 components) per entry of the luma block grid */
        CHECKED_ALLOCZ(s->motion_val, y_size * 2 * sizeof(int16_t));
    }

    if(s->codec_id==CODEC_ID_MPEG4){
        /* interlaced direct mode decoding tables */
        CHECKED_ALLOCZ(s->field_mv_table, s->mb_num*2*2 * sizeof(int16_t))
        CHECKED_ALLOCZ(s->field_select_table, s->mb_num*2* sizeof(int8_t))
    }
    /* 4mv b frame decoding table */
    //note this is needed for h263 without b frames too (segfault on damaged streams otherwise)
    CHECKED_ALLOCZ(s->co_located_type_table, s->mb_num * sizeof(uint8_t))
    if (s->out_format == FMT_H263) {
        /* ac values, one allocation shared by the three planes */
        CHECKED_ALLOCZ(s->ac_val[0], yc_size * sizeof(int16_t) * 16);
        s->ac_val[1] = s->ac_val[0] + y_size;
        s->ac_val[2] = s->ac_val[1] + c_size;

        /* cbp values */
        CHECKED_ALLOCZ(s->coded_block, y_size);

        /* divx501 bitstream reorder buffer */
        CHECKED_ALLOCZ(s->bitstream_buffer, BITSTREAM_BUFFER_SIZE);

        /* cbp, ac_pred, pred_dir */
        CHECKED_ALLOCZ(s->cbp_table  , s->mb_num * sizeof(uint8_t))
        CHECKED_ALLOCZ(s->pred_dir_table, s->mb_num * sizeof(uint8_t))
    }

    if (s->h263_pred || s->h263_plus || !s->encoding) {
        /* dc values, one allocation shared by the three planes */
        //MN: we need these for error resilience of intra-frames
        CHECKED_ALLOCZ(s->dc_val[0], yc_size * sizeof(int16_t));
        s->dc_val[1] = s->dc_val[0] + y_size;
        s->dc_val[2] = s->dc_val[1] + c_size;
        for(i=0;i<yc_size;i++)
            s->dc_val[0][i] = 1024;
    }

    /* which mb is a intra block */
    CHECKED_ALLOCZ(s->mbintra_table, s->mb_num);
    memset(s->mbintra_table, 1, s->mb_num);

    /* default structure is frame */
    s->picture_structure = PICT_FRAME;

    /* init macroblock skip table */
    CHECKED_ALLOCZ(s->mbskip_table, s->mb_num+1);
    //Note the +1 is for a quicker mpeg4 slice_end detection
    CHECKED_ALLOCZ(s->prev_pict_types, PREV_PICT_TYPES_BUFFER_SIZE);

    s->block= s->blocks[0];

    s->parse_context.state= -1;

    s->context_initialized = 1;
    return 0;
 fail:
    MPV_common_end(s);
    return -1;
}

450 451 452

//extern int sads;

F
Fabrice Bellard 已提交
453 454 455 456 457
/**
 * free common structure for both encoder and decoder
 *
 * Frees everything MPV_common_init() allocated plus all pictures and marks
 * the context as uninitialized. Fields that were never allocated are fine,
 * MPV_common_init() calls this on a partially initialized context.
 */
void MPV_common_end(MpegEncContext *s)
{
    int i;

    av_freep(&s->mb_type);
    av_freep(&s->p_mv_table);
    av_freep(&s->b_forw_mv_table);
    av_freep(&s->b_back_mv_table);
    av_freep(&s->b_bidir_forw_mv_table);
    av_freep(&s->b_bidir_back_mv_table);
    av_freep(&s->b_direct_mv_table);
    av_freep(&s->motion_val);
    /* dc_val[1..2] and ac_val[1..2] point into the [0] allocation,
       do not leave them dangling */
    av_freep(&s->dc_val[0]);
    s->dc_val[1]= s->dc_val[2]= NULL;
    av_freep(&s->ac_val[0]);
    s->ac_val[1]= s->ac_val[2]= NULL;
    av_freep(&s->coded_block);
    av_freep(&s->mbintra_table);
    av_freep(&s->cbp_table);
    av_freep(&s->pred_dir_table);
    av_freep(&s->me.scratchpad);
    av_freep(&s->me.map);
    av_freep(&s->me.score_map);

    av_freep(&s->mbskip_table);
    av_freep(&s->prev_pict_types);
    av_freep(&s->bitstream_buffer);
    av_freep(&s->tex_pb_buffer);
    av_freep(&s->pb2_buffer);
    av_freep(&s->allocated_edge_emu_buffer); s->edge_emu_buffer= NULL;
    av_freep(&s->co_located_type_table);
    av_freep(&s->field_mv_table);
    av_freep(&s->field_select_table);
    av_freep(&s->avctx->stats_out);
    av_freep(&s->ac_stats);
    av_freep(&s->error_status_table);

    for(i=0; i<MAX_PICTURE_COUNT; i++){
        free_picture(s, &s->picture[i]);
    }
    s->context_initialized = 0;
}

495 496
#ifdef CONFIG_ENCODERS

F
Fabrice Bellard 已提交
497 498 499 500
/**
 * init video encoder
 *
 * Copies the user settings from avctx into the MpegEncContext, selects the
 * output format for the codec id, sets up the shared default tables,
 * initializes the common context, the codec specific encoders, the default
 * quantization matrices and the rate control.
 *
 * @param avctx codec context; avctx->priv_data is the MpegEncContext
 * @return 0 on success, -1 on failure (unsupported codec or picture size,
 *         failed allocation, failed rate control init)
 */
int MPV_encode_init(AVCodecContext *avctx)
{
    MpegEncContext *s = avctx->priv_data;
    int i;

    avctx->pix_fmt = PIX_FMT_YUV420P;

    s->bit_rate = avctx->bit_rate;
    s->bit_rate_tolerance = avctx->bit_rate_tolerance;
    s->frame_rate = avctx->frame_rate;
    s->width = avctx->width;
    s->height = avctx->height;
    if(avctx->gop_size > 600){
        fprintf(stderr, "Warning keyframe interval too large! reducing it ...\n");
        avctx->gop_size=600;
    }
    s->gop_size = avctx->gop_size;
    s->rtp_mode = avctx->rtp_mode;
    s->rtp_payload_size = avctx->rtp_payload_size;
    if (avctx->rtp_callback)
        s->rtp_callback = avctx->rtp_callback;
    s->qmin= avctx->qmin;
    s->qmax= avctx->qmax;
    s->max_qdiff= avctx->max_qdiff;
    s->qcompress= avctx->qcompress;
    s->qblur= avctx->qblur;
    s->avctx = avctx;
    s->flags= avctx->flags;
    s->max_b_frames= avctx->max_b_frames;
    s->b_frame_strategy= avctx->b_frame_strategy;
    s->codec_id= avctx->codec->id;
    s->luma_elim_threshold  = avctx->luma_elim_threshold;
    s->chroma_elim_threshold= avctx->chroma_elim_threshold;
    s->strict_std_compliance= avctx->strict_std_compliance;
    s->data_partitioning= avctx->flags & CODEC_FLAG_PART;
    s->quarter_sample= (avctx->flags & CODEC_FLAG_QPEL)!=0;
    s->mpeg_quant= avctx->mpeg_quant;

    /* a gop size of at most 1 means intra only */
    if (s->gop_size <= 1) {
        s->intra_only = 1;
        s->gop_size = 12;
    } else {
        s->intra_only = 0;
    }

    s->me_method = avctx->me_method;

    /* Fixed QSCALE */
    s->fixed_qscale = (avctx->flags & CODEC_FLAG_QSCALE);

    s->adaptive_quant= (   s->avctx->lumi_masking
                        || s->avctx->dark_masking
                        || s->avctx->temporal_cplx_masking
                        || s->avctx->spatial_cplx_masking
                        || s->avctx->p_masking)
                       && !s->fixed_qscale;

    s->progressive_sequence= !(avctx->flags & CODEC_FLAG_INTERLACED_DCT);

    switch(avctx->codec->id) {
    case CODEC_ID_MPEG1VIDEO:
        s->out_format = FMT_MPEG1;
        avctx->delay=0; //FIXME not sure, should check the spec
        break;
    case CODEC_ID_MJPEG:
        s->out_format = FMT_MJPEG;
        s->intra_only = 1; /* force intra only for jpeg */
        s->mjpeg_write_tables = 1; /* write all tables */
        s->mjpeg_data_only_frames = 0; /* write all the needed headers */
        s->mjpeg_vsample[0] = 2; /* set up default sampling factors */
        s->mjpeg_vsample[1] = 1; /* the only currently supported values */
        s->mjpeg_vsample[2] = 1;
        s->mjpeg_hsample[0] = 2;
        s->mjpeg_hsample[1] = 1;
        s->mjpeg_hsample[2] = 1;
        if (mjpeg_init(s) < 0)
            return -1;
        avctx->delay=0;
        s->low_delay=1;
        break;
#ifdef CONFIG_RISKY
    case CODEC_ID_H263:
        if (h263_get_picture_format(s->width, s->height) == 7) {
            /* stderr like the other diagnostics of this function */
            fprintf(stderr, "Input picture size isn't suitable for h263 codec! try h263+\n");
            return -1;
        }
        s->out_format = FMT_H263;
        avctx->delay=0;
        s->low_delay=1;
        break;
    case CODEC_ID_H263P:
        s->out_format = FMT_H263;
        s->h263_plus = 1;
        /* Fx */
        s->unrestricted_mv=(avctx->flags & CODEC_FLAG_H263P_UMV) ? 1:0;
        s->h263_aic= (avctx->flags & CODEC_FLAG_H263P_AIC) ? 1:0;
        /* /Fx */
        /* These are just to be sure */
        s->umvplus = 1;
        avctx->delay=0;
        s->low_delay=1;
        break;
    case CODEC_ID_RV10:
        s->out_format = FMT_H263;
        s->h263_rv10 = 1;
        avctx->delay=0;
        s->low_delay=1;
        break;
    case CODEC_ID_MPEG4:
        s->out_format = FMT_H263;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
        s->low_delay= s->max_b_frames ? 0 : 1;
        avctx->delay= s->low_delay ? 0 : (s->max_b_frames + 1);
        break;
    case CODEC_ID_MSMPEG4V1:
        s->out_format = FMT_H263;
        s->h263_msmpeg4 = 1;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
        s->msmpeg4_version= 1;
        avctx->delay=0;
        s->low_delay=1;
        break;
    case CODEC_ID_MSMPEG4V2:
        s->out_format = FMT_H263;
        s->h263_msmpeg4 = 1;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
        s->msmpeg4_version= 2;
        avctx->delay=0;
        s->low_delay=1;
        break;
    case CODEC_ID_MSMPEG4V3:
        s->out_format = FMT_H263;
        s->h263_msmpeg4 = 1;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
        s->msmpeg4_version= 3;
        avctx->delay=0;
        s->low_delay=1;
        break;
    case CODEC_ID_WMV1:
        s->out_format = FMT_H263;
        s->h263_msmpeg4 = 1;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
        s->msmpeg4_version= 4;
        avctx->delay=0;
        s->low_delay=1;
        break;
    case CODEC_ID_WMV2:
        s->out_format = FMT_H263;
        s->h263_msmpeg4 = 1;
        s->h263_pred = 1;
        s->unrestricted_mv = 1;
        s->msmpeg4_version= 5;
        avctx->delay=0;
        s->low_delay=1;
        break;
#endif
    default:
        return -1;
    }

    { /* set up some safe defaults, some codecs might override them later */
        static int done=0;
        if(!done){
            /* av_mallocz() returns zeroed memory, no extra memset needed */
            default_mv_penalty= av_mallocz( sizeof(uint16_t)*(MAX_FCODE+1)*(2*MAX_MV+1) );
            if(default_mv_penalty==NULL){
                perror("malloc");
                goto fail;
            }
            memset(default_fcode_tab , 0, sizeof(uint8_t)*(2*MAX_MV+1));

            for(i=-16; i<16; i++){
                default_fcode_tab[i + MAX_MV]= 1;
            }
            /* only now, a failed allocation has to be retried by the next call */
            done=1;
        }
    }
    s->me.mv_penalty= default_mv_penalty;
    s->fcode_tab= default_fcode_tab;
    s->y_dc_scale_table=
    s->c_dc_scale_table= ff_mpeg1_dc_scale_table;

    /* dont use mv_penalty table for crap MV as it would be confused */
    //FIXME remove after fixing / removing old ME
    if (s->me_method < ME_EPZS) s->me.mv_penalty = default_mv_penalty;

    s->encoding = 1;

    /* init, MPV_common_init() cleans up after itself on failure */
    if (MPV_common_init(s) < 0)
        goto fail;

    ff_init_me(s);

#ifdef CONFIG_ENCODERS
#ifdef CONFIG_RISKY
    if (s->out_format == FMT_H263)
        h263_encode_init(s);
    if(s->msmpeg4_version)
        ff_msmpeg4_encode_init(s);
#endif
    if (s->out_format == FMT_MPEG1)
        ff_mpeg1_encode_init(s);
#endif

    /* init default q matrix */
    for(i=0;i<64;i++) {
        int j= s->dsp.idct_permutation[i];
#ifdef CONFIG_RISKY
        if(s->codec_id==CODEC_ID_MPEG4 && s->mpeg_quant){
            s->intra_matrix[j] = ff_mpeg4_default_intra_matrix[i];
            s->inter_matrix[j] = ff_mpeg4_default_non_intra_matrix[i];
        }else if(s->out_format == FMT_H263){
            s->intra_matrix[j] =
            s->inter_matrix[j] = ff_mpeg1_default_non_intra_matrix[i];
        }else
#endif
        { /* mpeg1 */
            s->intra_matrix[j] = ff_mpeg1_default_intra_matrix[i];
            s->inter_matrix[j] = ff_mpeg1_default_non_intra_matrix[i];
        }
    }

    /* precompute matrix */
    /* for mjpeg, we do include qscale in the matrix */
    if (s->out_format != FMT_MJPEG) {
        convert_matrix(s, s->q_intra_matrix, s->q_intra_matrix16, s->q_intra_matrix16_bias,
                       s->intra_matrix, s->intra_quant_bias, 1, 31);
        convert_matrix(s, s->q_inter_matrix, s->q_inter_matrix16, s->q_inter_matrix16_bias,
                       s->inter_matrix, s->inter_quant_bias, 1, 31);
    }

    if(ff_rate_control_init(s) < 0){
        /* undo MPV_common_init(), nothing else would free its tables */
        MPV_common_end(s);
        goto fail;
    }

    s->picture_number = 0;
    s->picture_in_gop_number = 0;
    s->fake_picture_number = 0;
    /* motion detector init */
    s->f_code = 1;
    s->b_code = 1;

    return 0;

fail:
    /* only reached after the codec switch: mirror MPV_encode_end() and
       close what mjpeg_init() set up */
    if (s->out_format == FMT_MJPEG)
        mjpeg_close(s);
    return -1;
}

/**
 * Shuts the video encoder down: rate control first, then the common
 * context and, for the MJPEG output format, the mjpeg state.
 *
 * @param avctx codec context; avctx->priv_data is the MpegEncContext
 * @return always 0
 */
int MPV_encode_end(AVCodecContext *avctx)
{
    MpegEncContext *enc = avctx->priv_data;

#ifdef STATS
    print_stats();
#endif

    ff_rate_control_uninit(enc);
    MPV_common_end(enc);

    if (enc->out_format == FMT_MJPEG) {
        mjpeg_close(enc);
    }

    return 0;
}

763 764
#endif //CONFIG_ENCODERS

M
Michael Niedermayer 已提交
765 766
/**
 * Build the per-run / per-level lookup tables of a run-level table.
 * For each value of 'last' (0 and 1) three heap arrays are allocated with
 * av_malloc() and stored in rl:
 *   max_level[last][run]  largest level found for that run,
 *   max_run[last][level]  largest run found for that level,
 *   index_run[last][run]  index of the first entry with that run
 *                         (rl->n when no entry has it).
 * Entries [0, rl->last) are used for last==0 and [rl->last, rl->n) for last==1.
 */
void init_rl(RLTable *rl)
{
    int8_t  level_max[MAX_RUN + 1];
    int8_t  run_max[MAX_LEVEL + 1];
    uint8_t first_index[MAX_RUN + 1];
    int last;

    for (last = 0; last < 2; last++) {
        const int first = last ? rl->last : 0;
        const int stop  = last ? rl->n    : rl->last;
        int idx;

        /* reset the scratch tables; rl->n marks "run not seen yet" */
        memset(level_max,   0,     MAX_RUN + 1);
        memset(run_max,     0,     MAX_LEVEL + 1);
        memset(first_index, rl->n, MAX_RUN + 1);

        for (idx = first; idx < stop; idx++) {
            const int run   = rl->table_run[idx];
            const int level = rl->table_level[idx];

            if (first_index[run] == rl->n)
                first_index[run] = idx;
            if (level > level_max[run])
                level_max[run] = level;
            if (run > run_max[level])
                run_max[level] = run;
        }

        /* publish heap copies of the scratch tables */
        rl->max_level[last] = av_malloc(MAX_RUN + 1);
        memcpy(rl->max_level[last], level_max, MAX_RUN + 1);
        rl->max_run[last] = av_malloc(MAX_LEVEL + 1);
        memcpy(rl->max_run[last], run_max, MAX_LEVEL + 1);
        rl->index_run[last] = av_malloc(MAX_RUN + 1);
        memcpy(rl->index_run[last], first_index, MAX_RUN + 1);
    }
}

F
Fabrice Bellard 已提交
803
/* Replicate the border pixels of an image of size width x height outwards
   by 'w' pixels on every side. 'buf' points at the top left pixel and
   'wrap' is the distance in bytes between two consecutive lines. */
//FIXME check that this is ok for mpeg4 interlaced
static void draw_edges_c(uint8_t *buf, int wrap, int width, int height, int w)
{
    uint8_t *const bottom = buf + (height - 1) * wrap;
    uint8_t *row;
    int n;

    /* lines above the first line and below the last line */
    for (n = 1; n <= w; n++) {
        memcpy(buf    - n * wrap, buf,    width);
        memcpy(bottom + n * wrap, bottom, width);
    }

    /* columns left of the first pixel and right of the last pixel */
    row = buf;
    for (n = 0; n < height; n++) {
        memset(row - w,     row[0],         w);
        memset(row + width, row[width - 1], w);
        row += wrap;
    }

    /* the four w x w corners take the value of the nearest image corner */
    for (n = 1; n <= w; n++) {
        uint8_t *const above = buf    - n * wrap;
        uint8_t *const below = bottom + n * wrap;

        memset(above - w,     buf[0],            w); /* top left */
        memset(above + width, buf[width - 1],    w); /* top right */
        memset(below - w,     bottom[0],         w); /* bottom left */
        memset(below + width, bottom[width - 1], w); /* bottom right */
    }
}

M
Michael Niedermayer 已提交
832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851
/**
 * Find a free slot (data[0]==NULL) in s->picture[].
 * @param shared if non-zero only slots whose type field is 0 are accepted;
 *               otherwise a free slot with a non-zero type is preferred and
 *               any free slot is used as fallback
 * @return index of the chosen slot; asserts that one exists
 */
static int find_unused_picture(MpegEncContext *s, int shared){
    int i;
    
    if(shared){
        for(i=0; i<MAX_PICTURE_COUNT; i++){
            if(s->picture[i].data[0]==NULL && s->picture[i].type==0) break;
        }
    }else{
        /* return right away: falling through to the fallback search below
           would restart at 0 and throw the preferred slot away */
        for(i=0; i<MAX_PICTURE_COUNT; i++){
            if(s->picture[i].data[0]==NULL && s->picture[i].type!=0) return i;
        }
        for(i=0; i<MAX_PICTURE_COUNT; i++){
            if(s->picture[i].data[0]==NULL) break;
        }
    }

    assert(i<MAX_PICTURE_COUNT);
    return i;
}

F
Fabrice Bellard 已提交
852
/* generic function for encode/decode called before a frame is coded/decoded */
853
int MPV_frame_start(MpegEncContext *s, AVCodecContext *avctx)
F
Fabrice Bellard 已提交
854
{
M
Michael Niedermayer 已提交
855
    int i;
M
Michael Niedermayer 已提交
856
    AVFrame *pic;
F
Fabrice Bellard 已提交
857

858
    s->mb_skiped = 0;
M
cleanup  
Michael Niedermayer 已提交
859 860 861 862
    
    /* mark&release old frames */
    if (s->pict_type != B_TYPE && s->last_picture.data[0]) {
        for(i=0; i<MAX_PICTURE_COUNT; i++){
M
Michael Niedermayer 已提交
863
//printf("%8X %d %d %X %X\n", s->picture[i].data[0], s->picture[i].type, i, s->next_picture.data[0], s->last_picture.data[0]);
M
cleanup  
Michael Niedermayer 已提交
864 865
            if(s->picture[i].data[0] == s->last_picture.data[0]){
//                s->picture[i].reference=0;
M
Michael Niedermayer 已提交
866
                avctx->release_buffer(avctx, (AVFrame*)&s->picture[i]);
M
cleanup  
Michael Niedermayer 已提交
867 868 869 870 871 872 873 874 875 876 877
                break;
            }    
        }
        assert(i<MAX_PICTURE_COUNT);

        /* release forgotten pictures */
        /* if(mpeg124/h263) */
        if(!s->encoding){
            for(i=0; i<MAX_PICTURE_COUNT; i++){
                if(s->picture[i].data[0] && s->picture[i].data[0] != s->next_picture.data[0] && s->picture[i].reference){
                    fprintf(stderr, "releasing zombie picture\n");
M
Michael Niedermayer 已提交
878
                    avctx->release_buffer(avctx, (AVFrame*)&s->picture[i]);                
M
cleanup  
Michael Niedermayer 已提交
879 880
                }
            }
881
        }
882
    }
883 884
alloc:
    if(!s->encoding){
M
Michael Niedermayer 已提交
885
        i= find_unused_picture(s, 0);
M
cleanup  
Michael Niedermayer 已提交
886
    
M
Michael Niedermayer 已提交
887
        pic= (AVFrame*)&s->picture[i];
M
cleanup  
Michael Niedermayer 已提交
888 889 890
        pic->reference= s->pict_type != B_TYPE;
        pic->coded_picture_number= s->current_picture.coded_picture_number+1;
        
M
Michael Niedermayer 已提交
891
        alloc_picture(s, (Picture*)pic, 0);
892

M
cleanup  
Michael Niedermayer 已提交
893 894
        s->current_picture= s->picture[i];
    }
895

M
cleanup  
Michael Niedermayer 已提交
896 897 898
    if (s->pict_type != B_TYPE) {
        s->last_picture= s->next_picture;
        s->next_picture= s->current_picture;
F
Fabrice Bellard 已提交
899
    }
900 901 902 903 904 905
    
    if(s->pict_type != I_TYPE && s->last_picture.data[0]==NULL){
        fprintf(stderr, "warning: first frame is no keyframe\n");
        assert(s->pict_type != B_TYPE); //these should have been dropped if we dont have a reference
        goto alloc;
    }
M
cleanup  
Michael Niedermayer 已提交
906
   
907 908 909
    s->hurry_up= s->avctx->hurry_up;
    s->error_resilience= avctx->error_resilience;

910 911 912 913 914 915 916 917 918
    /* set dequantizer, we cant do it during init as it might change for mpeg4
       and we cant do it in the header decode as init isnt called for mpeg4 there yet */
    if(s->out_format == FMT_H263){
        if(s->mpeg_quant)
            s->dct_unquantize = s->dct_unquantize_mpeg2;
        else
            s->dct_unquantize = s->dct_unquantize_h263;
    }else 
        s->dct_unquantize = s->dct_unquantize_mpeg1;
919 920

    return 0;
F
Fabrice Bellard 已提交
921
}
922

F
Fabrice Bellard 已提交
923 924 925
/**
 * Generic function for encode/decode, called after a frame has been
 * coded/decoded. Pads the picture edges when needed, records the picture
 * type, copies current_picture back into its slot of s->picture[] and
 * releases every picture that is not marked as reference.
 */
void MPV_frame_end(MpegEncContext *s)
{
    int idx;

    /* draw edge for correct motion prediction if outside */
    if (   s->codec_id != CODEC_ID_SVQ1
        && s->pict_type != B_TYPE
        && !s->intra_only
        && !(s->flags&CODEC_FLAG_EMU_EDGE)) {
        draw_edges(s->current_picture.data[0], s->linesize  , s->h_edge_pos   , s->v_edge_pos   , EDGE_WIDTH  );
        draw_edges(s->current_picture.data[1], s->uvlinesize, s->h_edge_pos>>1, s->v_edge_pos>>1, EDGE_WIDTH/2);
        draw_edges(s->current_picture.data[2], s->uvlinesize, s->h_edge_pos>>1, s->v_edge_pos>>1, EDGE_WIDTH/2);
    }
    emms_c();

    s->last_pict_type = s->pict_type;
    if (s->pict_type != B_TYPE)
        s->last_non_b_pict_type = s->pict_type;

    s->current_picture.quality   = s->qscale; //FIXME get average of qscale_table
    s->current_picture.pict_type = s->pict_type;
    s->current_picture.key_frame = s->pict_type == I_TYPE;

    /* copy back current_picture variables */
    for (idx = 0; idx < MAX_PICTURE_COUNT; idx++) {
        if (s->picture[idx].data[0] != s->current_picture.data[0])
            continue;
        s->picture[idx] = s->current_picture;
        break;
    }
    assert(idx < MAX_PICTURE_COUNT);

    /* release non reference frames */
    for (idx = 0; idx < MAX_PICTURE_COUNT; idx++) {
        Picture *const p = &s->picture[idx];

        if (p->data[0] && !p->reference /*&& p->type!=FF_BUFFER_TYPE_SHARED*/)
            s->avctx->release_buffer(s->avctx, (AVFrame*)p);
    }

    /* optional dump of the macroblock skip table, one digit per macroblock */
    if (s->avctx->debug&FF_DEBUG_SKIP) {
        int mb_x, mb_y;

        for (mb_y = 0; mb_y < s->mb_height; mb_y++) {
            for (mb_x = 0; mb_x < s->mb_width; mb_x++) {
                const int count = s->mbskip_table[mb_x + mb_y*s->mb_width];

                printf(" %1d", count > 9 ? 9 : count);
            }
            printf("\n");
        }
        printf("pict type: %d\n", s->pict_type);
    }
}

974 975
#ifdef CONFIG_ENCODERS

M
Michael Niedermayer 已提交
976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008
/**
 * Sum of absolute differences between every pixel of a 16x16 block and a
 * single reference value.
 * @param src    top left pixel of the block
 * @param ref    value every pixel is compared against
 * @param stride distance in bytes between two lines of src
 */
static int get_sae(uint8_t *src, int ref, int stride){
    int total= 0;
    int row, col;

    for(row=0; row<16; row++){
        const uint8_t *line= src + row*stride;

        for(col=0; col<16; col++)
            total+= ABS(line[col] - ref);
    }

    return total;
}

/**
 * Count the 16x16 blocks for which the deviation from the block mean (SAE)
 * plus 500 is still smaller than the SAD against the co-located block of ref.
 * Only whole blocks inside s->width x s->height are visited.
 * @param src    picture that is examined
 * @param ref    picture it is compared with
 * @param stride line size in bytes, used for both pictures
 */
static int get_intra_count(MpegEncContext *s, uint8_t *src, uint8_t *ref, int stride){
    const int w= s->width &~15;
    const int h= s->height&~15;
    int count= 0;
    int bx, by;

    for(by=0; by<h; by+=16){
        for(bx=0; bx<w; bx+=16){
            uint8_t *cur = src + bx + by*stride;
            uint8_t *prev= ref + bx + by*stride;
            const int sad = s->dsp.pix_abs16x16(cur, prev, stride);
            const int mean= (s->dsp.pix_sum(cur, stride) + 128)>>8;
            const int sae = get_sae(cur, mean, stride);

            if(sae + 500 < sad)
                count++;
        }
    }
    return count;
}

M
Michael Niedermayer 已提交
1009

M
Michael Niedermayer 已提交
1010 1011
/**
 * Take a user supplied frame into the encoder input queue.
 * When the frame can be used directly (line sizes match and either there is
 * no encoding delay or CODEC_FLAG_INPUT_PRESERVED is set) the picture slot
 * just references the user planes; otherwise a picture is allocated and the
 * three planes are copied into it. The picture is then stored at
 * s->input_picture[s->max_b_frames] after the queue has been shifted by one.
 * @return always 0
 */
static int load_input_picture(MpegEncContext *s, AVFrame *pic_arg){
    const int encoding_delay= s->max_b_frames;
    const int direct=    !(encoding_delay && !(s->flags&CODEC_FLAG_INPUT_PRESERVED))
                      && pic_arg->linesize[0] == s->linesize
                      && pic_arg->linesize[1] == s->uvlinesize
                      && pic_arg->linesize[2] == s->uvlinesize;
    AVFrame *pic;
    int i;

    if(direct){
        pic= (AVFrame*)&s->picture[ find_unused_picture(s, 1) ];
        pic->reference= 1;

        /* reference the user planes instead of copying them */
        for(i=0; i<4; i++){
            pic->data[i]    = pic_arg->data[i];
            pic->linesize[i]= pic_arg->linesize[i];
        }
        alloc_picture(s, (Picture*)pic, 1);
    }else{
        pic= (AVFrame*)&s->picture[ find_unused_picture(s, 0) ];
        pic->reference= 1;

        alloc_picture(s, (Picture*)pic, 0);

        /* nothing to copy if the allocated planes already are the user planes */
        if(   pic->data[0] != pic_arg->data[0]
           || pic->data[1] != pic_arg->data[1]
           || pic->data[2] != pic_arg->data[2]){
            int h_chroma_shift, v_chroma_shift;

            avcodec_get_chroma_sub_sample(s->avctx->pix_fmt, &h_chroma_shift, &v_chroma_shift);

            for(i=0; i<3; i++){
                const int chroma    = i != 0;
                const int src_stride= pic_arg->linesize[i];
                const int dst_stride= chroma ? s->uvlinesize : s->linesize;
                const int w= s->width >>(chroma ? h_chroma_shift : 0);
                const int h= s->height>>(chroma ? v_chroma_shift : 0);
                uint8_t *src= pic_arg->data[i];
                uint8_t *dst= pic->data[i];

                if(src_stride==dst_stride){
                    /* identical layout: whole plane in one go */
                    memcpy(dst, src, src_stride*h);
                }else{
                    int line;

                    for(line=0; line<h; line++){
                        memcpy(dst, src, w);
                        dst += dst_stride;
                        src += src_stride;
                    }
                }
            }
        }
    }

    /* per frame parameters supplied by the user */
    pic->quality  = pic_arg->quality;
    pic->pict_type= pic_arg->pict_type;
    pic->pts      = pic_arg->pts;

    /* number the frame after the newest one already queued */
    if(s->input_picture[encoding_delay])
        pic->display_picture_number= s->input_picture[encoding_delay]->display_picture_number + 1;

    /* shift buffer entries */
    for(i=1; i<MAX_PICTURE_COUNT /*s->encoding_delay+1*/; i++)
        s->input_picture[i-1]= s->input_picture[i];

    s->input_picture[encoding_delay]= (Picture*)pic;

    return 0;
}
1088

M
cleanup  
Michael Niedermayer 已提交
1089 1090 1091 1092 1093 1094 1095
/**
 * Choose the next picture to code and set up s->new_picture and
 * s->current_picture for it.
 * The reorder queue is advanced by one entry; if it ran empty and input is
 * available, the head of the input queue is either coded as I frame (no
 * reference yet or intra only) or a number of B frames is decided and the
 * following I/P frame plus those B frames are queued in coding order.
 * When nothing is left to code, s->new_picture is cleared.
 */
static void select_input_picture(MpegEncContext *s){
    int i;
    int coded_pic_num=0;    

    if(s->reordered_input_picture[0])
        coded_pic_num= s->reordered_input_picture[0]->coded_picture_number + 1;

    /* advance the reorder queue by one entry */
    for(i=1; i<MAX_PICTURE_COUNT; i++)
        s->reordered_input_picture[i-1]= s->reordered_input_picture[i];
    s->reordered_input_picture[MAX_PICTURE_COUNT-1]= NULL;

    /* set next picture types & ordering */
    if(s->reordered_input_picture[0]==NULL && s->input_picture[0]){
        if(/*s->picture_in_gop_number >= s->gop_size ||*/ s->next_picture.data[0]==NULL || s->intra_only){
            s->reordered_input_picture[0]= s->input_picture[0];
            s->reordered_input_picture[0]->pict_type= I_TYPE;
            s->reordered_input_picture[0]->coded_picture_number= coded_pic_num;
        }else{
            int b_frames;
            
            if(s->flags&CODEC_FLAG_PASS2){
                /* take the picture types decided by rate control */
                for(i=0; i<s->max_b_frames+1; i++){
                    int pict_num= s->input_picture[0]->display_picture_number + i;

                    /* check the entry index itself, and do so before the
                       table is read (presumably num_entries is the number
                       of elements in entry[]) */
                    if(pict_num >= s->rc_context.num_entries) break;

                    s->input_picture[i]->pict_type= s->rc_context.entry[pict_num].new_pict_type;
                }
            }

            if(s->input_picture[0]->pict_type){
                /* user selected pict_type */
                for(b_frames=0; b_frames<s->max_b_frames+1; b_frames++){
                    if(s->input_picture[b_frames]->pict_type!=B_TYPE) break;
                }
            
                if(b_frames > s->max_b_frames){
                    fprintf(stderr, "warning, too many bframes in a row\n");
                    b_frames = s->max_b_frames;
                }
            }else if(s->b_frame_strategy==0){
                b_frames= s->max_b_frames;
            }else if(s->b_frame_strategy==1){
                /* score every queued picture against its predecessor;
                   the stored score is offset by 1 so that 0 means "not computed" */
                for(i=1; i<s->max_b_frames+1; i++){
                    if(s->input_picture[i]->b_frame_score==0){
                        s->input_picture[i]->b_frame_score= 
                            get_intra_count(s, s->input_picture[i  ]->data[0], 
                                               s->input_picture[i-1]->data[0], s->linesize) + 1;
                    }
                }
                /* stop at the first picture whose score exceeds mb_num/40 */
                for(i=0; i<s->max_b_frames; i++){
                    if(s->input_picture[i]->b_frame_score - 1 > s->mb_num/40) break;
                }
                                
                b_frames= FFMAX(0, i-1);
                
                /* reset scores */
                for(i=0; i<b_frames+1; i++){
                    s->input_picture[i]->b_frame_score=0;
                }
            }else{
                fprintf(stderr, "illegal b frame strategy\n");
                b_frames=0;
            }

            emms_c();
                        
            /* the picture following the B frames is coded first, as I or P */
            s->reordered_input_picture[0]= s->input_picture[b_frames];
            if(   s->picture_in_gop_number + b_frames >= s->gop_size 
               || s->reordered_input_picture[0]->pict_type== I_TYPE)
                s->reordered_input_picture[0]->pict_type= I_TYPE;
            else
                s->reordered_input_picture[0]->pict_type= P_TYPE;
            s->reordered_input_picture[0]->coded_picture_number= coded_pic_num;

            /* then the B frames, in display order */
            for(i=0; i<b_frames; i++){
                coded_pic_num++;
                s->reordered_input_picture[i+1]= s->input_picture[i];
                s->reordered_input_picture[i+1]->pict_type= B_TYPE;
                s->reordered_input_picture[i+1]->coded_picture_number= coded_pic_num;
            }
        }
    }
    
    if(s->reordered_input_picture[0]){
        s->reordered_input_picture[0]->reference= s->reordered_input_picture[0]->pict_type!=B_TYPE;

        if(s->reordered_input_picture[0]->type == FF_BUFFER_TYPE_SHARED){
            /* the input is only borrowed: code into a freshly allocated picture */
            Picture *pic= &s->picture[ find_unused_picture(s, 0) ];

            s->new_picture= *s->reordered_input_picture[0];

            /* mark us unused / free shared pic */
            for(i=0; i<4; i++)
                s->reordered_input_picture[0]->data[i]= NULL;
            s->reordered_input_picture[0]->type= 0;
            
            pic->pict_type = s->reordered_input_picture[0]->pict_type;
            pic->quality   = s->reordered_input_picture[0]->quality;
            pic->coded_picture_number = s->reordered_input_picture[0]->coded_picture_number;
            pic->reference = s->reordered_input_picture[0]->reference;
            
            alloc_picture(s, pic, 0);

            s->current_picture= *pic;
        }else{
            assert(   s->reordered_input_picture[0]->type==FF_BUFFER_TYPE_USER 
                   || s->reordered_input_picture[0]->type==FF_BUFFER_TYPE_INTERNAL);
            
            s->new_picture= *s->reordered_input_picture[0];

            for(i=0; i<4; i++){
                s->reordered_input_picture[0]->data[i]-=16; //FIXME dirty
            }
            s->current_picture= *s->reordered_input_picture[0];
        }
    
        s->picture_number= s->new_picture.display_picture_number;
    }else{
       memset(&s->new_picture, 0, sizeof(Picture));
    }
}

F
Fabrice Bellard 已提交
1217 1218 1219 1220
/**
 * Encode callback: queue one input frame and, if a picture is ready to be
 * coded, write it into buf.
 * @param avctx    codec context, priv_data is the MpegEncContext
 * @param buf      output buffer for the bitstream
 * @param buf_size size of buf in bytes
 * @param data     the input AVFrame
 * @return number of bytes written to buf
 */
int MPV_encode_picture(AVCodecContext *avctx,
                       unsigned char *buf, int buf_size, void *data)
{
    MpegEncContext *s = avctx->priv_data;
    AVFrame *frame = data;
    int plane;

    init_put_bits(&s->pb, buf, buf_size, NULL, NULL);

    s->picture_in_gop_number++;

    /* queue the new frame, then pick what gets coded now */
    load_input_picture(s, frame);
    select_input_picture(s);

    /* output? */
    if (s->new_picture.data[0]) {
        s->pict_type = s->new_picture.pict_type;

        /* the ratecontrol needs the last qscale so we dont touch it for CBR */
        if (s->fixed_qscale) {
            s->qscale = (int)(s->new_picture.quality+0.5);
            assert(s->qscale);
        }

        MPV_frame_start(s, avctx);

        encode_picture(s, s->picture_number);

        /* export the statistics of this picture */
        avctx->real_pict_num = s->picture_number;
        avctx->header_bits   = s->header_bits;
        avctx->mv_bits       = s->mv_bits;
        avctx->misc_bits     = s->misc_bits;
        avctx->i_tex_bits    = s->i_tex_bits;
        avctx->p_tex_bits    = s->p_tex_bits;
        avctx->i_count       = s->i_count;
        avctx->p_count       = s->mb_num - s->i_count - s->skip_count; //FIXME f/b_count in avctx
        avctx->skip_count    = s->skip_count;

        MPV_frame_end(s);

        if (s->out_format == FMT_MJPEG) {
            mjpeg_picture_trailer(s);
        }

        if (s->flags&CODEC_FLAG_PASS1) {
            ff_write_pass1_stats(s);
        }
    }

    s->input_picture_number++;

    flush_put_bits(&s->pb);

    /* bit accounting for this call */
    s->frame_bits     = (pbBufPtr(&s->pb) - s->pb.buf) * 8;
    s->total_bits    += s->frame_bits;
    avctx->frame_bits = s->frame_bits;

    for (plane = 0; plane < 4; plane++)
        avctx->error[plane] += s->current_picture.error[plane];

    return pbBufPtr(&s->pb) - s->pb.buf;
}

1280 1281
#endif //CONFIG_ENCODERS

M
Michael Niedermayer 已提交
1282
/**
 * Motion compensation of one macroblock from s->sprite_offset: row [0] is
 * used for the 16x16 luma block, row [1] for both 8x8 chroma blocks.
 * Fractional offsets go through dsp.gmc1, whole and half pel luma offsets
 * through the put pixels tables. With CODEC_FLAG_EMU_EDGE blocks reaching
 * outside the edge positions are read via ff_emulated_edge_mc().
 * Chroma is skipped when CODEC_FLAG_GRAY is set.
 */
static inline void gmc1_motion(MpegEncContext *s,
                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
                               int dest_offset,
                               uint8_t **ref_picture, int src_offset)
{
    const int accuracy  = s->sprite_warping_accuracy;
    const int linesize  = s->linesize;
    const int uvlinesize= s->uvlinesize;
    const int rounder   = 128 - s->no_rounding;
    uint8_t *ptr;
    int offset, src_x, src_y;
    int motion_x, motion_y;
    int emu=0;

    /* ---- luma ---- */
    motion_x= s->sprite_offset[0][0];
    motion_y= s->sprite_offset[0][1];
    src_x = s->mb_x * 16 + (motion_x >> (accuracy+1));
    src_y = s->mb_y * 16 + (motion_y >> (accuracy+1));
    motion_x<<= 3-accuracy;
    motion_y<<= 3-accuracy;

    /* drop the fractional part when the position got clipped to the far border */
    src_x = clip(src_x, -16, s->width);
    if (src_x == s->width)
        motion_x= 0;
    src_y = clip(src_y, -16, s->height);
    if (src_y == s->height)
        motion_y= 0;

    ptr = ref_picture[0] + (src_y * linesize) + src_x + src_offset;
    dest_y+= dest_offset;

    if(   (s->flags&CODEC_FLAG_EMU_EDGE)
       && (   src_x<0 || src_y<0
           || src_x + 17 >= s->h_edge_pos
           || src_y + 17 >= s->v_edge_pos)){
        ff_emulated_edge_mc(s, ptr, linesize, 17, 17, src_x, src_y, s->h_edge_pos, s->v_edge_pos);
        ptr= s->edge_emu_buffer;
    }

    if((motion_x|motion_y)&7){
        /* two 8 pixel wide halves */
        s->dsp.gmc1(dest_y  , ptr  , linesize, 16, motion_x&15, motion_y&15, rounder);
        s->dsp.gmc1(dest_y+8, ptr+8, linesize, 16, motion_x&15, motion_y&15, rounder);
    }else{
        const int dxy= ((motion_x>>3)&1) | ((motion_y>>2)&2);

        if (s->no_rounding)
            s->dsp.put_no_rnd_pixels_tab[0][dxy](dest_y, ptr, linesize, 16);
        else
            s->dsp.put_pixels_tab       [0][dxy](dest_y, ptr, linesize, 16);
    }

    if(s->flags&CODEC_FLAG_GRAY)
        return;

    /* ---- chroma ---- */
    motion_x= s->sprite_offset[1][0];
    motion_y= s->sprite_offset[1][1];
    src_x = s->mb_x * 8 + (motion_x >> (accuracy+1));
    src_y = s->mb_y * 8 + (motion_y >> (accuracy+1));
    motion_x<<= 3-accuracy;
    motion_y<<= 3-accuracy;

    src_x = clip(src_x, -8, s->width>>1);
    if (src_x == (s->width>>1))
        motion_x= 0;
    src_y = clip(src_y, -8, s->height>>1);
    if (src_y == (s->height>>1))
        motion_y= 0;

    offset = (src_y * uvlinesize) + src_x + (src_offset>>1);

    ptr = ref_picture[1] + offset;
    if(   (s->flags&CODEC_FLAG_EMU_EDGE)
       && (   src_x<0 || src_y<0
           || src_x + 9 >= (s->h_edge_pos>>1)
           || src_y + 9 >= (s->v_edge_pos>>1))){
        ff_emulated_edge_mc(s, ptr, uvlinesize, 9, 9, src_x, src_y, s->h_edge_pos>>1, s->v_edge_pos>>1);
        ptr= s->edge_emu_buffer;
        emu= 1; /* the second chroma plane needs the same treatment */
    }
    s->dsp.gmc1(dest_cb + (dest_offset>>1), ptr, uvlinesize, 8, motion_x&15, motion_y&15, rounder);

    ptr = ref_picture[2] + offset;
    if(emu){
        ff_emulated_edge_mc(s, ptr, uvlinesize, 9, 9, src_x, src_y, s->h_edge_pos>>1, s->v_edge_pos>>1);
        ptr= s->edge_emu_buffer;
    }
    s->dsp.gmc1(dest_cr + (dest_offset>>1), ptr, uvlinesize, 8, motion_x&15, motion_y&15, rounder);
}

1370
/**
 * Motion compensation of one macroblock through dsp.gmc, driven by
 * s->sprite_offset and the 2x2 matrix s->sprite_delta.
 * Luma is done as two 8 pixel wide halves of 16 lines, each chroma plane as
 * one 8x8 block; chroma is skipped when CODEC_FLAG_GRAY is set.
 */
static inline void gmc_motion(MpegEncContext *s,
                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
                               int dest_offset,
                               uint8_t **ref_picture, int src_offset)
{
    const int a         = s->sprite_warping_accuracy;
    const int linesize  = s->linesize;
    const int uvlinesize= s->uvlinesize;
    const int shift     = a+1;
    const int rounder   = (1<<(2*a+1)) - s->no_rounding;
    const int dxx= s->sprite_delta[0][0], dxy= s->sprite_delta[0][1];
    const int dyx= s->sprite_delta[1][0], dyy= s->sprite_delta[1][1];
    uint8_t *ptr;
    int ox, oy;

    /* ---- luma ---- */
    ptr = ref_picture[0] + src_offset;
    dest_y+= dest_offset;

    ox= s->sprite_offset[0][0] + dxx*s->mb_x*16 + dxy*s->mb_y*16;
    oy= s->sprite_offset[0][1] + dyx*s->mb_x*16 + dyy*s->mb_y*16;

    s->dsp.gmc(dest_y, ptr, linesize, 16,
               ox, oy,
               dxx, dxy, dyx, dyy,
               shift, rounder,
               s->h_edge_pos, s->v_edge_pos);
    /* right half: start offset moved on by 8 steps along x */
    s->dsp.gmc(dest_y+8, ptr, linesize, 16,
               ox + dxx*8, oy + dyx*8,
               dxx, dxy, dyx, dyy,
               shift, rounder,
               s->h_edge_pos, s->v_edge_pos);

    if(s->flags&CODEC_FLAG_GRAY)
        return;

    /* ---- chroma ---- */
    dest_cb+= dest_offset>>1;
    dest_cr+= dest_offset>>1;

    ox= s->sprite_offset[1][0] + dxx*s->mb_x*8 + dxy*s->mb_y*8;
    oy= s->sprite_offset[1][1] + dyx*s->mb_x*8 + dyy*s->mb_y*8;

    ptr = ref_picture[1] + (src_offset>>1);
    s->dsp.gmc(dest_cb, ptr, uvlinesize, 8,
               ox, oy,
               dxx, dxy, dyx, dyy,
               shift, rounder,
               s->h_edge_pos>>1, s->v_edge_pos>>1);

    ptr = ref_picture[2] + (src_offset>>1);
    s->dsp.gmc(dest_cr, ptr, uvlinesize, 8,
               ox, oy,
               dxx, dxy, dyx, dyy,
               shift, rounder,
               s->h_edge_pos>>1, s->v_edge_pos>>1);
}


1434
/**
 * Build a block_w x block_h block in s->edge_emu_buffer from a source block
 * that lies partly or completely outside the w x h picture area: the part
 * inside the picture is copied, the rest is filled by replicating the
 * nearest copied line / column.
 * @param src      pointer to the (possibly out of picture) block origin
 * @param linesize line size in bytes, used for src and for the buffer
 * @param src_x    horizontal position of the block origin in the picture
 * @param src_y    vertical position of the block origin in the picture
 * @param w        width of the valid picture area
 * @param h        height of the valid picture area
 */
void ff_emulated_edge_mc(MpegEncContext *s, uint8_t *src, int linesize, int block_w, int block_h, 
                                    int src_x, int src_y, int w, int h){
    uint8_t *const buf= s->edge_emu_buffer;
    int first_row, first_col, row_end, col_end;
    int col, row;

    /* pull blocks that are entirely outside back until one line / column
       overlaps the picture */
    if(src_y>= h){
        src+= (h-1-src_y)*linesize;
        src_y= h-1;
    }else if(src_y<=-block_h){
        src+= (1-block_h-src_y)*linesize;
        src_y= 1-block_h;
    }
    if(src_x>= w){
        src+= (w-1-src_x);
        src_x= w-1;
    }else if(src_x<=-block_w){
        src+= (1-block_w-src_x);
        src_x= 1-block_w;
    }

    /* part of the block that is inside the picture */
    first_row= FFMAX(0, -src_y);
    first_col= FFMAX(0, -src_x);
    row_end  = FFMIN(block_h, h-src_y);
    col_end  = FFMIN(block_w, w-src_x);

    // copy existing part
    for(row=first_row; row<row_end; row++){
        uint8_t *out= buf + row*linesize;
        uint8_t *in = src + row*linesize;

        for(col=first_col; col<col_end; col++)
            out[col]= in[col];
    }

    //top
    for(row=0; row<first_row; row++){
        uint8_t *out = buf + row*linesize;
        uint8_t *from= buf + first_row*linesize;

        for(col=first_col; col<col_end; col++)
            out[col]= from[col];
    }

    //bottom
    for(row=row_end; row<block_h; row++){
        uint8_t *out = buf + row*linesize;
        uint8_t *from= buf + (row_end-1)*linesize;

        for(col=first_col; col<col_end; col++)
            out[col]= from[col];
    }

    for(row=0; row<block_h; row++){
        uint8_t *out= buf + row*linesize;

        //left
        for(col=0; col<first_col; col++)
            out[col]= out[first_col];

        //right
        for(col=col_end; col<block_w; col++)
            out[col]= out[col_end - 1];
    }
}


F
Fabrice Bellard 已提交
1495 1496
/**
 * Applies one mpeg motion vector to the three components.
 *
 * For luma the low bit of motion_x / motion_y selects the entry of pix_op[0]
 * and the remaining bits are the integer displacement; the chroma vector is
 * derived from the luma vector (differently for FMT_H263 and other formats)
 * and uses pix_op[1].
 *
 * @param s           context (position, dimensions, strides, flags)
 * @param dest_y      luma destination of the macroblock
 * @param dest_cb     Cb destination of the macroblock
 * @param dest_cr     Cr destination of the macroblock
 * @param dest_offset added to dest_y; dest_offset>>1 is added to the chroma destinations
 * @param ref_picture the three reference planes
 * @param src_offset  added to the luma source; src_offset>>1 is added to the chroma source
 * @param field_based 1 if strides are doubled and heights halved, 0 otherwise
 * @param pix_op      pixel operation tables, indexed [0] for luma and [1] for chroma
 * @param motion_x    horizontal motion vector component
 * @param motion_y    vertical motion vector component
 * @param h           number of luma lines to process (h>>1 chroma lines)
 */
static inline void mpeg_motion(MpegEncContext *s,
                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
                               int dest_offset,
                               uint8_t **ref_picture, int src_offset,
                               int field_based, op_pixels_func (*pix_op)[4],
                               int motion_x, int motion_y, int h)
{
    uint8_t *ptr;
    int dxy, offset, mx, my, src_x, src_y, height, v_edge_pos, linesize, uvlinesize;
    int emu=0;

    dxy = ((motion_y & 1) << 1) | (motion_x & 1);
    src_x = s->mb_x * 16 + (motion_x >> 1);
    src_y = s->mb_y * (16 >> field_based) + (motion_y >> 1);

    /* WARNING: do not forget half pels */
    height = s->height >> field_based;
    v_edge_pos = s->v_edge_pos >> field_based;
    /* when clipped to the far edge, drop the sub-pel bit of that direction */
    src_x = clip(src_x, -16, s->width);
    if (src_x == s->width)
        dxy &= ~1;
    src_y = clip(src_y, -16, height);
    if (src_y == height)
        dxy &= ~2;
    linesize   = s->linesize << field_based;
    uvlinesize = s->uvlinesize << field_based;
    ptr = ref_picture[0] + (src_y * linesize) + (src_x) + src_offset;
    dest_y += dest_offset;

    if(s->flags&CODEC_FLAG_EMU_EDGE){
        if(src_x<0 || src_y<0 || src_x + (motion_x&1) + 16 > s->h_edge_pos
                              || src_y + (motion_y&1) + h  > v_edge_pos){
            /* the block reaches outside the edge positions: read from the emulated copy */
            ff_emulated_edge_mc(s, ptr - src_offset, s->linesize, 17, 17+field_based,
                             src_x, src_y<<field_based, s->h_edge_pos, s->v_edge_pos);
            ptr= s->edge_emu_buffer + src_offset;
            emu=1;
        }
    }
    pix_op[0][dxy](dest_y, ptr, linesize, h);

    if(s->flags&CODEC_FLAG_GRAY) return;

    if (s->out_format == FMT_H263) {
        dxy = 0;
        if ((motion_x & 3) != 0)
            dxy |= 1;
        if ((motion_y & 3) != 0)
            dxy |= 2;
        mx = motion_x >> 2;
        my = motion_y >> 2;
    } else {
        mx = motion_x / 2;
        my = motion_y / 2;
        dxy = ((my & 1) << 1) | (mx & 1);
        mx >>= 1;
        my >>= 1;
    }

    src_x = s->mb_x * 8 + mx;
    src_y = s->mb_y * (8 >> field_based) + my;
    src_x = clip(src_x, -8, s->width >> 1);
    if (src_x == (s->width >> 1))
        dxy &= ~1;
    src_y = clip(src_y, -8, height >> 1);
    if (src_y == (height >> 1))
        dxy &= ~2;
    /* the same offset is used for both chroma planes */
    offset = (src_y * uvlinesize) + src_x + (src_offset >> 1);
    ptr = ref_picture[1] + offset;
    if(emu){
        ff_emulated_edge_mc(s, ptr - (src_offset >> 1), s->uvlinesize, 9, 9+field_based,
                         src_x, src_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
        ptr= s->edge_emu_buffer + (src_offset >> 1);
    }
    pix_op[1][dxy](dest_cb + (dest_offset >> 1), ptr, uvlinesize, h >> 1);

    ptr = ref_picture[2] + offset;
    if(emu){
        ff_emulated_edge_mc(s, ptr - (src_offset >> 1), s->uvlinesize, 9, 9+field_based,
                         src_x, src_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
        ptr= s->edge_emu_buffer + (src_offset >> 1);
    }
    pix_op[1][dxy](dest_cr + (dest_offset >> 1), ptr, uvlinesize, h >> 1);
}

M
Michael Niedermayer 已提交
1586
/**
 * Applies one motion vector to the three components, using qpix_op for luma
 * and pix_op[1] for chroma.
 *
 * For luma the two low bits of motion_x / motion_y select the entry of the
 * qpix_op table and the remaining bits are the integer displacement. The
 * chroma vector is derived from the luma vector; the derivation depends on
 * field_based and on the FF_BUG_QPEL_CHROMA / FF_BUG_QPEL_CHROMA2 workaround
 * flags.
 *
 * @param s           context (position, dimensions, strides, flags)
 * @param dest_y      luma destination of the macroblock
 * @param dest_cb     Cb destination of the macroblock
 * @param dest_cr     Cr destination of the macroblock
 * @param dest_offset added to dest_y; dest_offset>>1 is added to the chroma destinations
 * @param ref_picture the three reference planes
 * @param src_offset  added to the luma source; src_offset>>1 is added to the chroma source
 * @param field_based 1 if strides are doubled and heights halved, 0 otherwise
 * @param pix_op      pixel operation tables, [1] is used for chroma
 * @param qpix_op     qpel operation tables used for luma
 * @param motion_x    horizontal motion vector component
 * @param motion_y    vertical motion vector component
 * @param h           used for the edge check and, as h>>1, for the chroma height
 */
static inline void qpel_motion(MpegEncContext *s,
                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
                               int dest_offset,
                               uint8_t **ref_picture, int src_offset,
                               int field_based, op_pixels_func (*pix_op)[4],
                               qpel_mc_func (*qpix_op)[16],
                               int motion_x, int motion_y, int h)
{
    uint8_t *ptr;
    int dxy, offset, mx, my, src_x, src_y, height, v_edge_pos, linesize, uvlinesize;
    int emu=0;

    dxy = ((motion_y & 3) << 2) | (motion_x & 3);
    src_x = s->mb_x * 16 + (motion_x >> 2);
    src_y = s->mb_y * (16 >> field_based) + (motion_y >> 2);

    height = s->height >> field_based;
    v_edge_pos = s->v_edge_pos >> field_based;
    /* when clipped to the far edge, drop the sub-pel bits of that direction */
    src_x = clip(src_x, -16, s->width);
    if (src_x == s->width)
        dxy &= ~3;
    src_y = clip(src_y, -16, height);
    if (src_y == height)
        dxy &= ~12;
    linesize = s->linesize << field_based;
    uvlinesize = s->uvlinesize << field_based;
    ptr = ref_picture[0] + (src_y * linesize) + src_x + src_offset;
    dest_y += dest_offset;
//printf("%d %d %d\n", src_x, src_y, dxy);

    if(s->flags&CODEC_FLAG_EMU_EDGE){
        if(src_x<0 || src_y<0 || src_x + (motion_x&3) + 16 > s->h_edge_pos
                              || src_y + (motion_y&3) + h  > v_edge_pos){
            /* the block reaches outside the edge positions: read from the emulated copy */
            ff_emulated_edge_mc(s, ptr - src_offset, s->linesize, 17, 17+field_based,
                             src_x, src_y<<field_based, s->h_edge_pos, s->v_edge_pos);
            ptr= s->edge_emu_buffer + src_offset;
            emu=1;
        }
    }
    if(!field_based)
        qpix_op[0][dxy](dest_y, ptr, linesize);
    else{
        //damn interlaced mode
        //FIXME boundary mirroring is not exactly correct here
        qpix_op[1][dxy](dest_y  , ptr  , linesize);
        qpix_op[1][dxy](dest_y+8, ptr+8, linesize);
    }

    if(s->flags&CODEC_FLAG_GRAY) return;

    /* derive the chroma vector from the luma vector */
    if(field_based){
        mx= motion_x/2;
        my= motion_y>>1;
    }else if(s->workaround_bugs&FF_BUG_QPEL_CHROMA2){
        static const int rtab[8]= {0,0,1,1,0,0,0,1};
        mx= (motion_x>>1) + rtab[motion_x&7];
        my= (motion_y>>1) + rtab[motion_y&7];
    }else if(s->workaround_bugs&FF_BUG_QPEL_CHROMA){
        mx= (motion_x>>1)|(motion_x&1);
        my= (motion_y>>1)|(motion_y&1);
    }else{
        mx= motion_x/2;
        my= motion_y/2;
    }
    mx= (mx>>1)|(mx&1);
    my= (my>>1)|(my&1);

    dxy= (mx&1) | ((my&1)<<1);
    mx>>=1;
    my>>=1;

    src_x = s->mb_x * 8 + mx;
    src_y = s->mb_y * (8 >> field_based) + my;
    src_x = clip(src_x, -8, s->width >> 1);
    if (src_x == (s->width >> 1))
        dxy &= ~1;
    src_y = clip(src_y, -8, height >> 1);
    if (src_y == (height >> 1))
        dxy &= ~2;

    /* the same offset is used for both chroma planes */
    offset = (src_y * uvlinesize) + src_x + (src_offset >> 1);
    ptr = ref_picture[1] + offset;
    if(emu){
        ff_emulated_edge_mc(s, ptr - (src_offset >> 1), s->uvlinesize, 9, 9 + field_based,
                         src_x, src_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
        ptr= s->edge_emu_buffer + (src_offset >> 1);
    }
    pix_op[1][dxy](dest_cb + (dest_offset >> 1), ptr,  uvlinesize, h >> 1);

    ptr = ref_picture[2] + offset;
    if(emu){
        ff_emulated_edge_mc(s, ptr - (src_offset >> 1), s->uvlinesize, 9, 9 + field_based,
                         src_x, src_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
        ptr= s->edge_emu_buffer + (src_offset >> 1);
    }
    pix_op[1][dxy](dest_cr + (dest_offset >> 1), ptr,  uvlinesize, h >> 1);
}

1684 1685 1686 1687 1688 1689 1690 1691
/**
 * Rounds a value with the help of h263_chroma_roundtab.
 * The magnitude of x is mapped to
 * h263_chroma_roundtab[|x| & 0xf] + ((|x| >> 3) & ~1)
 * and the sign of x is applied to the result.
 */
inline int ff_h263_round_chroma(int x){
    const int mag     = x >= 0 ? x : -x;
    const int rounded = h263_chroma_roundtab[mag & 0xf] + ((mag >> 3) & ~1);

    return x >= 0 ? rounded : -rounded;
}
M
Michael Niedermayer 已提交
1692

F
Fabrice Bellard 已提交
1693
static inline void MPV_motion(MpegEncContext *s, 
1694 1695
                              uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
                              int dir, uint8_t **ref_picture, 
M
Michael Niedermayer 已提交
1696
                              op_pixels_func (*pix_op)[4], qpel_mc_func (*qpix_op)[16])
F
Fabrice Bellard 已提交
1697 1698 1699
{
    int dxy, offset, mx, my, src_x, src_y, motion_x, motion_y;
    int mb_x, mb_y, i;
1700
    uint8_t *ptr, *dest;
M
Michael Niedermayer 已提交
1701
    int emu=0;
F
Fabrice Bellard 已提交
1702 1703 1704 1705 1706 1707

    mb_x = s->mb_x;
    mb_y = s->mb_y;

    switch(s->mv_type) {
    case MV_TYPE_16X16:
M
Michael Niedermayer 已提交
1708
#ifdef CONFIG_RISKY
M
Michael Niedermayer 已提交
1709
        if(s->mcsel){
1710 1711 1712 1713 1714 1715 1716
            if(s->real_sprite_warping_points==1){
                gmc1_motion(s, dest_y, dest_cb, dest_cr, 0,
                            ref_picture, 0);
            }else{
                gmc_motion(s, dest_y, dest_cb, dest_cr, 0,
                            ref_picture, 0);
            }
M
Michael Niedermayer 已提交
1717
        }else if(s->quarter_sample){
M
Michael Niedermayer 已提交
1718 1719 1720 1721
            qpel_motion(s, dest_y, dest_cb, dest_cr, 0,
                        ref_picture, 0,
                        0, pix_op, qpix_op,
                        s->mv[dir][0][0], s->mv[dir][0][1], 16);
M
Michael Niedermayer 已提交
1722 1723 1724 1725
        }else if(s->mspel){
            ff_mspel_motion(s, dest_y, dest_cb, dest_cr,
                        ref_picture, pix_op,
                        s->mv[dir][0][0], s->mv[dir][0][1], 16);
M
Michael Niedermayer 已提交
1726 1727 1728
        }else
#endif
        {
M
Michael Niedermayer 已提交
1729 1730 1731 1732 1733
            mpeg_motion(s, dest_y, dest_cb, dest_cr, 0,
                        ref_picture, 0,
                        0, pix_op,
                        s->mv[dir][0][0], s->mv[dir][0][1], 16);
        }           
F
Fabrice Bellard 已提交
1734 1735
        break;
    case MV_TYPE_8X8:
M
Michael Niedermayer 已提交
1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758
        mx = 0;
        my = 0;
        if(s->quarter_sample){
            for(i=0;i<4;i++) {
                motion_x = s->mv[dir][i][0];
                motion_y = s->mv[dir][i][1];

                dxy = ((motion_y & 3) << 2) | (motion_x & 3);
                src_x = mb_x * 16 + (motion_x >> 2) + (i & 1) * 8;
                src_y = mb_y * 16 + (motion_y >> 2) + (i >>1) * 8;
                    
                /* WARNING: do no forget half pels */
                src_x = clip(src_x, -16, s->width);
                if (src_x == s->width)
                    dxy &= ~3;
                src_y = clip(src_y, -16, s->height);
                if (src_y == s->height)
                    dxy &= ~12;
                    
                ptr = ref_picture[0] + (src_y * s->linesize) + (src_x);
                if(s->flags&CODEC_FLAG_EMU_EDGE){
                    if(src_x<0 || src_y<0 || src_x + (motion_x&3) + 8 > s->h_edge_pos
                                          || src_y + (motion_y&3) + 8 > s->v_edge_pos){
M
Michael Niedermayer 已提交
1759
                        ff_emulated_edge_mc(s, ptr, s->linesize, 9, 9, src_x, src_y, s->h_edge_pos, s->v_edge_pos);
M
Michael Niedermayer 已提交
1760 1761 1762 1763 1764 1765 1766 1767 1768 1769 1770 1771 1772
                        ptr= s->edge_emu_buffer;
                    }
                }
                dest = dest_y + ((i & 1) * 8) + (i >> 1) * 8 * s->linesize;
                qpix_op[1][dxy](dest, ptr, s->linesize);

                mx += s->mv[dir][i][0]/2;
                my += s->mv[dir][i][1]/2;
            }
        }else{
            for(i=0;i<4;i++) {
                motion_x = s->mv[dir][i][0];
                motion_y = s->mv[dir][i][1];
F
Fabrice Bellard 已提交
1773

M
Michael Niedermayer 已提交
1774 1775 1776
                dxy = ((motion_y & 1) << 1) | (motion_x & 1);
                src_x = mb_x * 16 + (motion_x >> 1) + (i & 1) * 8;
                src_y = mb_y * 16 + (motion_y >> 1) + (i >>1) * 8;
F
Fabrice Bellard 已提交
1777
                    
M
Michael Niedermayer 已提交
1778 1779 1780 1781 1782 1783 1784
                /* WARNING: do no forget half pels */
                src_x = clip(src_x, -16, s->width);
                if (src_x == s->width)
                    dxy &= ~1;
                src_y = clip(src_y, -16, s->height);
                if (src_y == s->height)
                    dxy &= ~2;
F
Fabrice Bellard 已提交
1785
                    
M
Michael Niedermayer 已提交
1786 1787 1788 1789
                ptr = ref_picture[0] + (src_y * s->linesize) + (src_x);
                if(s->flags&CODEC_FLAG_EMU_EDGE){
                    if(src_x<0 || src_y<0 || src_x + (motion_x&1) + 8 > s->h_edge_pos
                                          || src_y + (motion_y&1) + 8 > s->v_edge_pos){
M
Michael Niedermayer 已提交
1790
                        ff_emulated_edge_mc(s, ptr, s->linesize, 9, 9, src_x, src_y, s->h_edge_pos, s->v_edge_pos);
M
Michael Niedermayer 已提交
1791 1792
                        ptr= s->edge_emu_buffer;
                    }
M
Michael Niedermayer 已提交
1793
                }
M
Michael Niedermayer 已提交
1794 1795 1796 1797 1798
                dest = dest_y + ((i & 1) * 8) + (i >> 1) * 8 * s->linesize;
                pix_op[1][dxy](dest, ptr, s->linesize, 8);

                mx += s->mv[dir][i][0];
                my += s->mv[dir][i][1];
M
Michael Niedermayer 已提交
1799
            }
F
Fabrice Bellard 已提交
1800
        }
M
Michael Niedermayer 已提交
1801

M
Michael Niedermayer 已提交
1802
        if(s->flags&CODEC_FLAG_GRAY) break;
F
Fabrice Bellard 已提交
1803 1804
        /* In case of 8X8, we construct a single chroma motion vector
           with a special rounding */
1805 1806
        mx= ff_h263_round_chroma(mx);
        my= ff_h263_round_chroma(my);
F
Fabrice Bellard 已提交
1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819
        dxy = ((my & 1) << 1) | (mx & 1);
        mx >>= 1;
        my >>= 1;

        src_x = mb_x * 8 + mx;
        src_y = mb_y * 8 + my;
        src_x = clip(src_x, -8, s->width/2);
        if (src_x == s->width/2)
            dxy &= ~1;
        src_y = clip(src_y, -8, s->height/2);
        if (src_y == s->height/2)
            dxy &= ~2;
        
M
Michael Niedermayer 已提交
1820
        offset = (src_y * (s->uvlinesize)) + src_x;
F
Fabrice Bellard 已提交
1821
        ptr = ref_picture[1] + offset;
M
Michael Niedermayer 已提交
1822
        if(s->flags&CODEC_FLAG_EMU_EDGE){
1823 1824
                if(src_x<0 || src_y<0 || src_x + (dxy &1) + 8 > s->h_edge_pos>>1
                                      || src_y + (dxy>>1) + 8 > s->v_edge_pos>>1){
M
Michael Niedermayer 已提交
1825
                    ff_emulated_edge_mc(s, ptr, s->uvlinesize, 9, 9, src_x, src_y, s->h_edge_pos>>1, s->v_edge_pos>>1);
M
Michael Niedermayer 已提交
1826 1827 1828 1829
                    ptr= s->edge_emu_buffer;
                    emu=1;
                }
            }
M
Michael Niedermayer 已提交
1830
        pix_op[1][dxy](dest_cb, ptr, s->uvlinesize, 8);
M
Michael Niedermayer 已提交
1831

F
Fabrice Bellard 已提交
1832
        ptr = ref_picture[2] + offset;
M
Michael Niedermayer 已提交
1833
        if(emu){
M
Michael Niedermayer 已提交
1834
            ff_emulated_edge_mc(s, ptr, s->uvlinesize, 9, 9, src_x, src_y, s->h_edge_pos>>1, s->v_edge_pos>>1);
M
Michael Niedermayer 已提交
1835 1836
            ptr= s->edge_emu_buffer;
        }
M
Michael Niedermayer 已提交
1837
        pix_op[1][dxy](dest_cr, ptr, s->uvlinesize, 8);
F
Fabrice Bellard 已提交
1838 1839 1840
        break;
    case MV_TYPE_FIELD:
        if (s->picture_structure == PICT_FRAME) {
1841 1842 1843 1844 1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863
            if(s->quarter_sample){
                /* top field */
                qpel_motion(s, dest_y, dest_cb, dest_cr, 0,
                            ref_picture, s->field_select[dir][0] ? s->linesize : 0,
                            1, pix_op, qpix_op,
                            s->mv[dir][0][0], s->mv[dir][0][1], 8);
                /* bottom field */
                qpel_motion(s, dest_y, dest_cb, dest_cr, s->linesize,
                            ref_picture, s->field_select[dir][1] ? s->linesize : 0,
                            1, pix_op, qpix_op,
                            s->mv[dir][1][0], s->mv[dir][1][1], 8);
            }else{
                /* top field */       
                mpeg_motion(s, dest_y, dest_cb, dest_cr, 0,
                            ref_picture, s->field_select[dir][0] ? s->linesize : 0,
                            1, pix_op,
                            s->mv[dir][0][0], s->mv[dir][0][1], 8);
                /* bottom field */
                mpeg_motion(s, dest_y, dest_cb, dest_cr, s->linesize,
                            ref_picture, s->field_select[dir][1] ? s->linesize : 0,
                            1, pix_op,
                            s->mv[dir][1][0], s->mv[dir][1][1], 8);
            }
F
Fabrice Bellard 已提交
1864
        } else {
1865 1866 1867 1868 1869 1870 1871
            int offset;
            if(s->picture_structure == s->field_select[dir][0] + 1 || s->pict_type == B_TYPE || s->first_field){
                offset= s->field_select[dir][0] ? s->linesize/2 : 0;
            }else{
                ref_picture= s->current_picture.data;
                offset= s->field_select[dir][0] ? s->linesize/2 : -s->linesize/2; 
            } 
F
Fabrice Bellard 已提交
1872

1873 1874 1875 1876
            mpeg_motion(s, dest_y, dest_cb, dest_cr, 0,
                        ref_picture, offset,
                        0, pix_op,
                        s->mv[dir][0][0], s->mv[dir][0][1], 16);
F
Fabrice Bellard 已提交
1877 1878 1879 1880 1881 1882 1883 1884
        }
        break;
    }
}


/* put block[] to dest[] */
static inline void put_dct(MpegEncContext *s, 
1885
                           DCTELEM *block, int i, uint8_t *dest, int line_size)
F
Fabrice Bellard 已提交
1886
{
1887
    s->dct_unquantize(s, block, i, s->qscale);
1888
    s->dsp.idct_put (dest, line_size, block);
F
Fabrice Bellard 已提交
1889 1890 1891 1892
}

/* add block[] to dest[] */
static inline void add_dct(MpegEncContext *s, 
1893
                           DCTELEM *block, int i, uint8_t *dest, int line_size)
F
Fabrice Bellard 已提交
1894
{
M
Michael Niedermayer 已提交
1895
    if (s->block_last_index[i] >= 0) {
1896
        s->dsp.idct_add (dest, line_size, block);
M
Michael Niedermayer 已提交
1897 1898
    }
}
1899

M
Michael Niedermayer 已提交
1900
static inline void add_dequant_dct(MpegEncContext *s, 
1901
                           DCTELEM *block, int i, uint8_t *dest, int line_size)
M
Michael Niedermayer 已提交
1902
{
F
Fabrice Bellard 已提交
1903
    if (s->block_last_index[i] >= 0) {
M
Michael Niedermayer 已提交
1904
        s->dct_unquantize(s, block, i, s->qscale);
1905

1906
        s->dsp.idct_add (dest, line_size, block);
F
Fabrice Bellard 已提交
1907 1908 1909
    }
}

1910 1911 1912 1913 1914 1915 1916 1917 1918 1919 1920 1921 1922
/**
 * cleans dc, ac, coded_block for the current non intra MB
 *
 * Resets the four luma and the two chroma DC entries of the current
 * macroblock to 1024, zeroes the corresponding AC entries, clears the four
 * coded_block entries when s->msmpeg4_version>=3 and finally clears the
 * macroblock's flag in s->mbintra_table.
 */
void ff_clean_intra_table_entries(MpegEncContext *s)
{
    int wrap = s->block_wrap[0];
    int xy = s->block_index[0];

    /* luma: the 2x2 entries starting at xy */
    s->dc_val[0][xy           ] =
    s->dc_val[0][xy + 1       ] =
    s->dc_val[0][xy     + wrap] =
    s->dc_val[0][xy + 1 + wrap] = 1024;
    /* ac pred */
    memset(s->ac_val[0][xy       ], 0, 32 * sizeof(int16_t));
    memset(s->ac_val[0][xy + wrap], 0, 32 * sizeof(int16_t));
    if (s->msmpeg4_version>=3) {
        s->coded_block[xy           ] =
        s->coded_block[xy + 1       ] =
        s->coded_block[xy     + wrap] =
        s->coded_block[xy + 1 + wrap] = 0;
    }
    /* chroma */
    wrap = s->block_wrap[4];
    xy = s->mb_x + 1 + (s->mb_y + 1) * wrap;
    s->dc_val[1][xy] =
    s->dc_val[2][xy] = 1024;
    /* ac pred */
    memset(s->ac_val[1][xy], 0, 16 * sizeof(int16_t));
    memset(s->ac_val[2][xy], 0, 16 * sizeof(int16_t));

    s->mbintra_table[s->mb_x + s->mb_y*s->mb_width]= 0;
}

F
Fabrice Bellard 已提交
1943 1944 1945 1946 1947 1948 1949 1950 1951 1952 1953 1954
/* generic function called after a macroblock has been parsed by the
   decoder or after it has been encoded by the encoder.

   Important variables used:
   s->mb_intra : true if intra macroblock
   s->mv_dir   : motion vector direction
   s->mv_type  : motion vector type
   s->mv       : motion vector
   s->interlaced_dct : true if interlaced dct used (mpeg2)

   Steps, in order:
   - store the qscale of the macroblock in the current picture
   - update the DC / intra prediction state
   - for FMT_H263 non-B pictures, update motion_val and the co-located tables
   - unless reconstruction is not needed, perform motion compensation and
     add / put the dct blocks into the current picture
 */
void MPV_decode_mb(MpegEncContext *s, DCTELEM block[6][64])
{
    int mb_x, mb_y;
    const int mb_xy = s->mb_y * s->mb_width + s->mb_x;

    mb_x = s->mb_x;
    mb_y = s->mb_y;

    s->current_picture.qscale_table[mb_xy]= s->qscale;

    /* update DC predictors for P macroblocks */
    if (!s->mb_intra) {
        if (s->h263_pred || s->h263_aic) {
            if(s->mbintra_table[mb_xy])
                ff_clean_intra_table_entries(s);
        } else {
            s->last_dc[0] =
            s->last_dc[1] =
            s->last_dc[2] = 128 << s->intra_dc_precision;
        }
    }
    else if (s->h263_pred || s->h263_aic)
        s->mbintra_table[mb_xy]=1;

    /* update motion predictor, not for B-frames as they need the motion_val from the last P/S-Frame */
    if (s->out_format == FMT_H263 && s->pict_type!=B_TYPE) { //FIXME move into h263.c if possible, format specific stuff shouldnt be here
        //FIXME a lot of that is only needed for !low_delay
        const int wrap = s->block_wrap[0];
        const int xy = s->block_index[0];
        const int mb_index= s->mb_x + s->mb_y*s->mb_width;
        if(s->mv_type == MV_TYPE_8X8){
            /* guarded like the intra and 16x16 cases below */
            if(s->co_located_type_table)
                s->co_located_type_table[mb_index]= CO_LOCATED_TYPE_4MV;
        } else {
            int motion_x, motion_y;
            if (s->mb_intra) {
                motion_x = 0;
                motion_y = 0;
                if(s->co_located_type_table)
                    s->co_located_type_table[mb_index]= 0;
            } else if (s->mv_type == MV_TYPE_16X16) {
                motion_x = s->mv[0][0][0];
                motion_y = s->mv[0][0][1];
                if(s->co_located_type_table)
                    s->co_located_type_table[mb_index]= 0;
            } else /*if (s->mv_type == MV_TYPE_FIELD)*/ {
                int i;
                motion_x = s->mv[0][0][0] + s->mv[0][1][0];
                motion_y = s->mv[0][0][1] + s->mv[0][1][1];
                motion_x = (motion_x>>1) | (motion_x&1);
                for(i=0; i<2; i++){
                    s->field_mv_table[mb_index][i][0]= s->mv[0][i][0];
                    s->field_mv_table[mb_index][i][1]= s->mv[0][i][1];
                    s->field_select_table[mb_index][i]= s->field_select[0][i];
                }
                /* guarded like the intra and 16x16 cases above */
                if(s->co_located_type_table)
                    s->co_located_type_table[mb_index]= CO_LOCATED_TYPE_FIELDMV;
            }
            /* no update if 8X8 because it has been done during parsing */
            s->motion_val[xy][0] = motion_x;
            s->motion_val[xy][1] = motion_y;
            s->motion_val[xy + 1][0] = motion_x;
            s->motion_val[xy + 1][1] = motion_y;
            s->motion_val[xy + wrap][0] = motion_x;
            s->motion_val[xy + wrap][1] = motion_y;
            s->motion_val[xy + 1 + wrap][0] = motion_x;
            s->motion_val[xy + 1 + wrap][1] = motion_y;
        }
    }

    if ((s->flags&CODEC_FLAG_PSNR) || !(s->encoding && (s->intra_only || s->pict_type==B_TYPE))) { //FIXME precalc
        uint8_t *dest_y, *dest_cb, *dest_cr;
        int dct_linesize, dct_offset;
        op_pixels_func (*op_pix)[4];
        qpel_mc_func (*op_qpix)[16];

        /* avoid copy if macroblock skipped in last frame too */
        if (s->pict_type != B_TYPE) {
            s->current_picture.mbskip_table[mb_xy]= s->mb_skiped;
        }

        /* skip only during decoding as we might trash the buffers during encoding a bit */
        if(!s->encoding){
            uint8_t *mbskip_ptr = &s->mbskip_table[mb_xy];
            const int age= s->current_picture.age;

            assert(age);

            if (s->mb_skiped) {
                s->mb_skiped= 0;
                assert(s->pict_type!=I_TYPE);

                (*mbskip_ptr) ++; /* indicate that this time we skipped it */
                if(*mbskip_ptr >99) *mbskip_ptr= 99;

                /* if previous was skipped too, then nothing to do !  */
                if (*mbskip_ptr >= age && s->current_picture.reference){
                    return;
                }
            } else if(!s->current_picture.reference){
                (*mbskip_ptr) ++; /* increase counter so the age can be compared cleanly */
                if(*mbskip_ptr >99) *mbskip_ptr= 99;
            } else{
                *mbskip_ptr = 0; /* not skipped */
            }
        }else
            s->mb_skiped= 0;

        if(s->pict_type==B_TYPE && s->avctx->draw_horiz_band && s->picture_structure==PICT_FRAME){ //FIXME precalc
            /* in this case no vertical (mb_y) offset is applied */
            dest_y  = s->current_picture.data[0] + mb_x * 16;
            dest_cb = s->current_picture.data[1] + mb_x * 8;
            dest_cr = s->current_picture.data[2] + mb_x * 8;
        }else{
            dest_y  = s->current_picture.data[0] + (mb_y * 16* s->linesize  ) + mb_x * 16;
            dest_cb = s->current_picture.data[1] + (mb_y * 8 * s->uvlinesize) + mb_x * 8;
            dest_cr = s->current_picture.data[2] + (mb_y * 8 * s->uvlinesize) + mb_x * 8;
        }

        /* with interlaced dct the lower luma blocks start one line below and
           every block uses a doubled stride */
        if (s->interlaced_dct) {
            dct_linesize = s->linesize * 2;
            dct_offset = s->linesize;
        } else {
            dct_linesize = s->linesize;
            dct_offset = s->linesize * 8;
        }

        if (!s->mb_intra) {
            /* motion handling */
            /* decoding or more than one mb_type (MC was already done otherwise) */
            if((!s->encoding) || (s->mb_type[mb_xy]&(s->mb_type[mb_xy]-1))){
                if ((!s->no_rounding) || s->pict_type==B_TYPE){
                    op_pix = s->dsp.put_pixels_tab;
                    op_qpix= s->dsp.put_qpel_pixels_tab;
                }else{
                    op_pix = s->dsp.put_no_rnd_pixels_tab;
                    op_qpix= s->dsp.put_no_rnd_qpel_pixels_tab;
                }

                if (s->mv_dir & MV_DIR_FORWARD) {
                    MPV_motion(s, dest_y, dest_cb, dest_cr, 0, s->last_picture.data, op_pix, op_qpix);
                    /* a following backward prediction uses the avg tables */
                    op_pix = s->dsp.avg_pixels_tab;
                    op_qpix= s->dsp.avg_qpel_pixels_tab;
                }
                if (s->mv_dir & MV_DIR_BACKWARD) {
                    MPV_motion(s, dest_y, dest_cb, dest_cr, 1, s->next_picture.data, op_pix, op_qpix);
                }
            }

            /* skip dequant / idct if we are really late ;) */
            if(s->hurry_up>1) return;

            /* add dct residue */
            if(s->encoding || !(   s->mpeg2 || s->h263_msmpeg4 || s->codec_id==CODEC_ID_MPEG1VIDEO
                                || (s->codec_id==CODEC_ID_MPEG4 && !s->mpeg_quant))){
                add_dequant_dct(s, block[0], 0, dest_y, dct_linesize);
                add_dequant_dct(s, block[1], 1, dest_y + 8, dct_linesize);
                add_dequant_dct(s, block[2], 2, dest_y + dct_offset, dct_linesize);
                add_dequant_dct(s, block[3], 3, dest_y + dct_offset + 8, dct_linesize);

                if(!(s->flags&CODEC_FLAG_GRAY)){
                    add_dequant_dct(s, block[4], 4, dest_cb, s->uvlinesize);
                    add_dequant_dct(s, block[5], 5, dest_cr, s->uvlinesize);
                }
            } else if(s->codec_id != CODEC_ID_WMV2){
                add_dct(s, block[0], 0, dest_y, dct_linesize);
                add_dct(s, block[1], 1, dest_y + 8, dct_linesize);
                add_dct(s, block[2], 2, dest_y + dct_offset, dct_linesize);
                add_dct(s, block[3], 3, dest_y + dct_offset + 8, dct_linesize);

                if(!(s->flags&CODEC_FLAG_GRAY)){
                    add_dct(s, block[4], 4, dest_cb, s->uvlinesize);
                    add_dct(s, block[5], 5, dest_cr, s->uvlinesize);
                }
            }
#ifdef CONFIG_RISKY
            else{
                ff_wmv2_add_mb(s, block, dest_y, dest_cb, dest_cr);
            }
#endif
        } else {
            /* dct only in intra block */
            if(s->encoding || !(s->mpeg2 || s->codec_id==CODEC_ID_MPEG1VIDEO)){
                put_dct(s, block[0], 0, dest_y, dct_linesize);
                put_dct(s, block[1], 1, dest_y + 8, dct_linesize);
                put_dct(s, block[2], 2, dest_y + dct_offset, dct_linesize);
                put_dct(s, block[3], 3, dest_y + dct_offset + 8, dct_linesize);

                if(!(s->flags&CODEC_FLAG_GRAY)){
                    put_dct(s, block[4], 4, dest_cb, s->uvlinesize);
                    put_dct(s, block[5], 5, dest_cr, s->uvlinesize);
                }
            }else{
                /* no dequantization here, the blocks go straight to the idct */
                s->dsp.idct_put(dest_y                 , dct_linesize, block[0]);
                s->dsp.idct_put(dest_y              + 8, dct_linesize, block[1]);
                s->dsp.idct_put(dest_y + dct_offset    , dct_linesize, block[2]);
                s->dsp.idct_put(dest_y + dct_offset + 8, dct_linesize, block[3]);

                if(!(s->flags&CODEC_FLAG_GRAY)){
                    s->dsp.idct_put(dest_cb, s->uvlinesize, block[4]);
                    s->dsp.idct_put(dest_cr, s->uvlinesize, block[5]);
                }
            }
        }
    }
}

2157 2158
#ifdef CONFIG_ENCODERS

2159
/**
 * Clears block n when all it contains are a few scattered +-1 coefficients.
 *
 * The block is walked in s->intra_scantable order up to block_last_index[n].
 * Any coefficient with magnitude above 1 leaves the block untouched. Each +-1
 * coefficient adds tab[zeros seen since the previous scored coefficient] to a
 * score; if the score stays below the threshold the scanned coefficients are
 * zeroed and block_last_index[n] is updated.
 *
 * @param n         index into s->block / s->block_last_index
 * @param threshold score limit; a negative value means "use -threshold and
 *                  also allow the first coefficient to be eliminated",
 *                  otherwise the first coefficient is kept
 */
static inline void dct_single_coeff_elimination(MpegEncContext *s, int n, int threshold)
{
    /* score of a +-1 coefficient, indexed by the zero run in front of it */
    static const char tab[64]=
        {3,2,2,1,1,1,1,1,
         1,1,1,1,1,1,1,1,
         1,1,1,1,1,1,1,1,
         0,0,0,0,0,0,0,0,
         0,0,0,0,0,0,0,0,
         0,0,0,0,0,0,0,0,
         0,0,0,0,0,0,0,0,
         0,0,0,0,0,0,0,0};
    DCTELEM *coeffs= s->block[n];
    const int last= s->block_last_index[n];
    const int keep_first= threshold >= 0;               /* 1: never touch position 0 */
    const int limit= keep_first ? threshold : -threshold;
    int cost= 0;
    int zeros= 0;
    int pos;

    /* is everything we could set to zero already zero? */
    if(last < keep_first) return;

    for(pos=0; pos<=last; pos++){
        const int mag= ABS(coeffs[ s->intra_scantable.permutated[pos] ]);

        if(mag > 1) return;             /* a real coefficient, keep the block */
        if(mag == 0){
            zeros++;
            continue;
        }
        if(keep_first && pos==0) continue;
        cost += tab[zeros];
        zeros= 0;
    }
    if(cost >= limit) return;

    for(pos=keep_first; pos<=last; pos++)
        coeffs[ s->intra_scantable.permutated[pos] ]= 0;

    s->block_last_index[n]= coeffs[0] ? 0 : -1;
}

2208 2209 2210 2211 2212
/**
 * Clamps the quantized coefficients of a block to [s->min_qcoeff, s->max_qcoeff].
 * Coefficients are visited in s->intra_scantable order up to last_index; for
 * intra macroblocks position 0 (the intra DC) is left untouched.
 */
static inline void clip_coeffs(MpegEncContext *s, DCTELEM *block, int last_index)
{
    const int lo= s->min_qcoeff;
    const int hi= s->max_qcoeff;
    int pos= s->mb_intra ? 1 : 0; //skip clipping of intra dc

    while(pos <= last_index){
        DCTELEM *coeff= &block[ s->intra_scantable.permutated[pos] ];

        if     (*coeff > hi) *coeff= hi;
        else if(*coeff < lo) *coeff= lo;
        pos++;
    }
}

#if 0
2231
/**
 * Sum of absolute differences between vertically adjacent pixels of a block
 * 16 pixels wide, taken over 7 row pairs (rows 0..7 at the given stride).
 */
static int pix_vcmp16x8(uint8_t *s, int stride){ //FIXME move to dsputil & optimize
    int total=0;
    int row, col;

    for(row=0; row<7; row++){
        const uint8_t *upper= s + row*stride;
        const uint8_t *lower= upper + stride;

        for(col=0; col<16; col++){
            const int d= upper[col] - lower[col];
            total+= d >= 0 ? d : -d;
        }
    }

    return total;
}

2246
/**
 * Like pix_vcmp16x8 but applied to the difference s1 - s2: sums the absolute
 * vertical gradient of (s1 - s2) over 16 columns and 7 row pairs.
 */
static int pix_diff_vcmp16x8(uint8_t *s1, uint8_t*s2, int stride){ //FIXME move to dsputil & optimize
    int total=0;
    int row, col;

    for(row=0; row<7; row++){
        const uint8_t *a= s1 + row*stride;
        const uint8_t *b= s2 + row*stride;

        for(col=0; col<16; col++){
            const int d= a[col] - b[col] - a[col+stride] + b[col+stride];
            total+= d >= 0 ? d : -d;
        }
    }

    return total;
}
#else
#define SQ(a) ((a)*(a))

2263
/**
 * Sum of squared differences between vertically adjacent pixels of a block
 * 16 pixels wide, taken over 7 row pairs (rows 0..7 at the given stride).
 */
static int pix_vcmp16x8(uint8_t *s, int stride){ //FIXME move to dsputil & optimize
    int total=0;
    int row, col;

    for(row=0; row<7; row++){
        const uint8_t *upper= s + row*stride;
        const uint8_t *lower= upper + stride;

        for(col=0; col<16; col++){
            const int d= upper[col] - lower[col];
            total+= d*d;
        }
    }

    return total;
}

2278
/**
 * Like pix_vcmp16x8 but applied to the difference s1 - s2: sums the squared
 * vertical gradient of (s1 - s2) over 16 columns and 7 row pairs.
 */
static int pix_diff_vcmp16x8(uint8_t *s1, uint8_t*s2, int stride){ //FIXME move to dsputil & optimize
    int total=0;
    int row, col;

    for(row=0; row<7; row++){
        const uint8_t *a= s1 + row*stride;
        const uint8_t *b= s2 + row*stride;

        for(col=0; col<16; col++){
            const int d= a[col] - b[col] - a[col+stride] + b[col+stride];
            total+= d*d;
        }
    }

    return total;
}

#endif
2294

2295 2296
#endif //CONFIG_ENCODERS

2297 2298 2299 2300 2301
/**
 * Passes one horizontal band of picture data to the user supplied
 * avctx->draw_horiz_band callback.
 * Nothing happens when no callback is set, or when there is neither a last
 * picture nor low_delay. The band is taken from current_picture for B frames
 * and in low_delay mode, from last_picture otherwise.
 * @param y row at which the band starts; also forwarded to the callback
 * @param h is the normal height, this will be reduced automatically if needed for the last row
 */
void ff_draw_horiz_band(MpegEncContext *s, int y, int h){
    uint8_t **planes;
    uint8_t *src_ptr[3];
    int offset;

    if(!s->avctx->draw_horiz_band)
        return;
    if(!s->last_picture.data[0] && !s->low_delay)
        return;

    h= FFMIN(h, s->height - y);

    /* frame structured B pictures are handed over from the start of the planes */
    offset= (s->pict_type==B_TYPE && s->picture_structure == PICT_FRAME) ? 0 : y * s->linesize;

    planes= (s->pict_type==B_TYPE || s->low_delay) ? s->current_picture.data
                                                   : s->last_picture.data;

    src_ptr[0] = planes[0] + offset;
    src_ptr[1] = planes[1] + (offset >> 2);  /* chroma uses a quarter of the luma offset */
    src_ptr[2] = planes[2] + (offset >> 2);

    emms_c();

    s->avctx->draw_horiz_band(s->avctx, src_ptr, s->linesize,
                           y, s->width, h);
}

2329 2330
#ifdef CONFIG_ENCODERS

2331
/**
 * Encodes the macroblock at (s->mb_x, s->mb_y).
 *
 * Steps, in order:
 *  - with adaptive quantization, derive s->dquant from the per macroblock
 *    qscale table and update s->qscale and the DC scale factors
 *  - fill s->block[0..5] with the source pixels (intra) or with the difference
 *    between source and motion compensated prediction (inter), optionally
 *    choosing the interlaced DCT layout
 *  - DCT + quantize every block that is not marked in skip_dct[], clip on
 *    overflow, and apply the single coefficient elimination to inter blocks
 *  - call the codec specific macroblock writer
 *
 * @param motion_x forwarded unchanged to the codec specific macroblock writer
 * @param motion_y forwarded unchanged to the codec specific macroblock writer
 */
static void encode_mb(MpegEncContext *s, int motion_x, int motion_y)
{
    const int mb_x= s->mb_x;
    const int mb_y= s->mb_y;
    int i;
    int skip_dct[6];
    int dct_offset   = s->linesize*8; //default for progressive frames

    for(i=0; i<6; i++) skip_dct[i]=0;

    if(s->adaptive_quant){
        s->dquant= s->current_picture.qscale_table[mb_x + mb_y*s->mb_width] - s->qscale;

        if(s->out_format==FMT_H263){
            if     (s->dquant> 2) s->dquant= 2;
            else if(s->dquant<-2) s->dquant=-2;
        }

        if(s->codec_id==CODEC_ID_MPEG4){
            if(!s->mb_intra){
                assert(s->dquant==0 || s->mv_type!=MV_TYPE_8X8);

                if(s->mv_dir&MV_DIRECT)
                    s->dquant=0;
            }
        }
        s->qscale+= s->dquant;
        s->y_dc_scale= s->y_dc_scale_table[ s->qscale ];
        s->c_dc_scale= s->c_dc_scale_table[ s->qscale ];
    }

    if (s->mb_intra) {
        uint8_t *ptr;
        int wrap_y;
        int emu=0;

        wrap_y = s->linesize;
        ptr = s->new_picture.data[0] + (mb_y * 16 * wrap_y) + mb_x * 16;

        /* macroblock reaches beyond the picture: read it through the edge emulation buffer */
        if(mb_x*16+16 > s->width || mb_y*16+16 > s->height){
            ff_emulated_edge_mc(s, ptr, wrap_y, 16, 16, mb_x*16, mb_y*16, s->width, s->height);
            ptr= s->edge_emu_buffer;
            emu=1;
        }

        if(s->flags&CODEC_FLAG_INTERLACED_DCT){
            int progressive_score, interlaced_score;

            progressive_score= pix_vcmp16x8(ptr, wrap_y  ) + pix_vcmp16x8(ptr + wrap_y*8, wrap_y );
            interlaced_score = pix_vcmp16x8(ptr, wrap_y*2) + pix_vcmp16x8(ptr + wrap_y  , wrap_y*2);

            if(progressive_score > interlaced_score + 100){
                s->interlaced_dct=1;

                /* blocks 2/3 start one line down and every block uses every 2nd line */
                dct_offset= wrap_y;
                wrap_y<<=1;
            }else
                s->interlaced_dct=0;
        }

        s->dsp.get_pixels(s->block[0], ptr                 , wrap_y);
        s->dsp.get_pixels(s->block[1], ptr              + 8, wrap_y);
        s->dsp.get_pixels(s->block[2], ptr + dct_offset    , wrap_y);
        s->dsp.get_pixels(s->block[3], ptr + dct_offset + 8, wrap_y);

        if(s->flags&CODEC_FLAG_GRAY){
            skip_dct[4]= 1;
            skip_dct[5]= 1;
        }else{
            int wrap_c = s->uvlinesize;

            /* the edge emulation buffer is reused, so each plane is consumed before the next is fetched */
            ptr = s->new_picture.data[1] + (mb_y * 8 * wrap_c) + mb_x * 8;
            if(emu){
                ff_emulated_edge_mc(s, ptr, wrap_c, 8, 8, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
                ptr= s->edge_emu_buffer;
            }
            s->dsp.get_pixels(s->block[4], ptr, wrap_c);

            ptr = s->new_picture.data[2] + (mb_y * 8 * wrap_c) + mb_x * 8;
            if(emu){
                ff_emulated_edge_mc(s, ptr, wrap_c, 8, 8, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
                ptr= s->edge_emu_buffer;
            }
            s->dsp.get_pixels(s->block[5], ptr, wrap_c);
        }
    }else{
        op_pixels_func (*op_pix)[4];
        qpel_mc_func (*op_qpix)[16];
        uint8_t *dest_y, *dest_cb, *dest_cr;
        uint8_t *ptr_y, *ptr_cb, *ptr_cr;
        int wrap_y, wrap_c;
        int emu=0;
        int pre_quant;

        dest_y  = s->current_picture.data[0] + (mb_y * 16 * s->linesize    ) + mb_x * 16;
        dest_cb = s->current_picture.data[1] + (mb_y * 8  * (s->uvlinesize)) + mb_x * 8;
        dest_cr = s->current_picture.data[2] + (mb_y * 8  * (s->uvlinesize)) + mb_x * 8;
        wrap_y = s->linesize;
        wrap_c = s->uvlinesize;
        ptr_y  = s->new_picture.data[0] + (mb_y * 16 * wrap_y) + mb_x * 16;
        ptr_cb = s->new_picture.data[1] + (mb_y * 8 * wrap_c) + mb_x * 8;
        ptr_cr = s->new_picture.data[2] + (mb_y * 8 * wrap_c) + mb_x * 8;

        if ((!s->no_rounding) || s->pict_type==B_TYPE){
            op_pix = s->dsp.put_pixels_tab;
            op_qpix= s->dsp.put_qpel_pixels_tab;
        }else{
            op_pix = s->dsp.put_no_rnd_pixels_tab;
            op_qpix= s->dsp.put_no_rnd_qpel_pixels_tab;
        }

        /* build the prediction in current_picture; a second direction is averaged in */
        if (s->mv_dir & MV_DIR_FORWARD) {
            MPV_motion(s, dest_y, dest_cb, dest_cr, 0, s->last_picture.data, op_pix, op_qpix);
            op_pix = s->dsp.avg_pixels_tab;
            op_qpix= s->dsp.avg_qpel_pixels_tab;
        }
        if (s->mv_dir & MV_DIR_BACKWARD) {
            MPV_motion(s, dest_y, dest_cb, dest_cr, 1, s->next_picture.data, op_pix, op_qpix);
        }

        if(mb_x*16+16 > s->width || mb_y*16+16 > s->height){
            ff_emulated_edge_mc(s, ptr_y, wrap_y, 16, 16, mb_x*16, mb_y*16, s->width, s->height);
            ptr_y= s->edge_emu_buffer;
            emu=1;
        }

        if(s->flags&CODEC_FLAG_INTERLACED_DCT){
            int progressive_score, interlaced_score;

            progressive_score= pix_diff_vcmp16x8(ptr_y           , dest_y           , wrap_y  )
                             + pix_diff_vcmp16x8(ptr_y + wrap_y*8, dest_y + wrap_y*8, wrap_y  );
            interlaced_score = pix_diff_vcmp16x8(ptr_y           , dest_y           , wrap_y*2)
                             + pix_diff_vcmp16x8(ptr_y + wrap_y  , dest_y + wrap_y  , wrap_y*2);

            if(progressive_score > interlaced_score + 600){
                s->interlaced_dct=1;

                dct_offset= wrap_y;
                wrap_y<<=1;
            }else
                s->interlaced_dct=0;
        }

        /* pre quantization: with a small motion compensated variance, blocks
           whose prediction error is tiny are not transformed at all */
        pre_quant= s->current_picture.mc_mb_var[s->mb_width*mb_y+ mb_x]<2*s->qscale*s->qscale;

        s->dsp.diff_pixels(s->block[0], ptr_y                 , dest_y                 , wrap_y);
        s->dsp.diff_pixels(s->block[1], ptr_y              + 8, dest_y              + 8, wrap_y);
        s->dsp.diff_pixels(s->block[2], ptr_y + dct_offset    , dest_y + dct_offset    , wrap_y);
        s->dsp.diff_pixels(s->block[3], ptr_y + dct_offset + 8, dest_y + dct_offset + 8, wrap_y);

        /* The skip decisions are taken right after each plane is read: for edge
           macroblocks ptr_y, ptr_cb and ptr_cr all point at the one shared
           s->edge_emu_buffer, so the data is only valid until the next plane is
           fetched into it. */
        if(pre_quant){
            //FIXME optimize
            if(s->dsp.pix_abs8x8(ptr_y               , dest_y               , wrap_y) < 20*s->qscale) skip_dct[0]= 1;
            if(s->dsp.pix_abs8x8(ptr_y            + 8, dest_y            + 8, wrap_y) < 20*s->qscale) skip_dct[1]= 1;
            if(s->dsp.pix_abs8x8(ptr_y +dct_offset   , dest_y +dct_offset   , wrap_y) < 20*s->qscale) skip_dct[2]= 1;
            if(s->dsp.pix_abs8x8(ptr_y +dct_offset+ 8, dest_y +dct_offset+ 8, wrap_y) < 20*s->qscale) skip_dct[3]= 1;
        }

        if(s->flags&CODEC_FLAG_GRAY){
            skip_dct[4]= 1;
            skip_dct[5]= 1;
        }else{
            if(emu){
                ff_emulated_edge_mc(s, ptr_cb, wrap_c, 8, 8, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
                ptr_cb= s->edge_emu_buffer;
            }
            s->dsp.diff_pixels(s->block[4], ptr_cb, dest_cb, wrap_c);
            if(pre_quant && s->dsp.pix_abs8x8(ptr_cb, dest_cb, wrap_c) < 20*s->qscale) skip_dct[4]= 1;

            if(emu){
                ff_emulated_edge_mc(s, ptr_cr, wrap_c, 8, 8, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
                ptr_cr= s->edge_emu_buffer;
            }
            s->dsp.diff_pixels(s->block[5], ptr_cr, dest_cr, wrap_c);
            if(pre_quant && s->dsp.pix_abs8x8(ptr_cr, dest_cr, wrap_c) < 20*s->qscale) skip_dct[5]= 1;
        }
    }

    /* DCT & quantize */
    if(s->out_format==FMT_MJPEG){
        /* mjpeg always quantizes with 8 and never skips a block */
        for(i=0;i<6;i++) {
            int overflow;
            s->block_last_index[i] = s->dct_quantize(s, s->block[i], i, 8, &overflow);
            if (overflow) clip_coeffs(s, s->block[i], s->block_last_index[i]);
        }
    }else{
        for(i=0;i<6;i++) {
            if(!skip_dct[i]){
                int overflow;
                s->block_last_index[i] = s->dct_quantize(s, s->block[i], i, s->qscale, &overflow);
            // FIXME we could decide to change to quantizer instead of clipping
            // JS: I don't think that would be a good idea it could lower quality instead
            //     of improve it. Just INTRADC clipping deserves changes in quantizer
                if (overflow) clip_coeffs(s, s->block[i], s->block_last_index[i]);
            }else
                s->block_last_index[i]= -1;
        }
        if(s->luma_elim_threshold && !s->mb_intra)
            for(i=0; i<4; i++)
                dct_single_coeff_elimination(s, i, s->luma_elim_threshold);
        if(s->chroma_elim_threshold && !s->mb_intra)
            for(i=4; i<6; i++)
                dct_single_coeff_elimination(s, i, s->chroma_elim_threshold);
    }

    /* gray intra macroblocks: give both chroma blocks a DC only coefficient derived from 1024 */
    if((s->flags&CODEC_FLAG_GRAY) && s->mb_intra){
        s->block_last_index[4]=
        s->block_last_index[5]= 0;
        s->block[4][0]=
        s->block[5][0]= (1024 + s->c_dc_scale/2)/ s->c_dc_scale;
    }

    /* huffman encode */
    switch(s->codec_id){ //FIXME funct ptr could be slightly faster
    case CODEC_ID_MPEG1VIDEO:
        mpeg1_encode_mb(s, s->block, motion_x, motion_y); break;
#ifdef CONFIG_RISKY
    case CODEC_ID_MPEG4:
        mpeg4_encode_mb(s, s->block, motion_x, motion_y); break;
    case CODEC_ID_MSMPEG4V2:
    case CODEC_ID_MSMPEG4V3:
    case CODEC_ID_WMV1:
        msmpeg4_encode_mb(s, s->block, motion_x, motion_y); break;
    case CODEC_ID_WMV2:
         ff_wmv2_encode_mb(s, s->block, motion_x, motion_y); break;
    case CODEC_ID_H263:
    case CODEC_ID_H263P:
    case CODEC_ID_RV10:
        h263_encode_mb(s, s->block, motion_x, motion_y); break;
#endif
    case CODEC_ID_MJPEG:
        mjpeg_encode_mb(s, s->block); break;
    default:
        assert(0);
    }
}

2592 2593
#endif //CONFIG_ENCODERS

M
cleanup  
Michael Niedermayer 已提交
2594 2595 2596 2597 2598 2599 2600 2601 2602 2603 2604 2605 2606 2607 2608 2609 2610 2611 2612 2613 2614 2615 2616 2617 2618 2619 2620 2621 2622
/**
 * combines the (truncated) bitstream to a complete frame
 *
 * Input that does not yet contain the end of a frame (next == -1) is appended
 * to the parse context buffer. Once the end is known and earlier data has been
 * buffered, the first next bytes (plus padding) are appended and *buf / *buf_size
 * are redirected to the assembled frame in the parse context buffer.
 *
 * @param next     offset of the end of the frame in *buf, or -1 if the frame
 *                 does not end in this input
 * @param buf      in: current input; out: start of the complete frame
 * @param buf_size in: size of the input; out: size of the complete frame
 * @returns -1 if no complete frame could be created (this includes failure to
 *          grow the buffer, in which case the data buffered so far is dropped)
 */
int ff_combine_frame( MpegEncContext *s, int next, uint8_t **buf, int *buf_size){
    ParseContext *pc= &s->parse_context;
    void *new_buffer;

    pc->last_index= pc->index;

    if(next==-1){
        new_buffer= av_fast_realloc(pc->buffer, &pc->buffer_size, (*buf_size) + pc->index + FF_INPUT_BUFFER_PADDING_SIZE);
        if(!new_buffer)
            goto alloc_failed;
        pc->buffer= new_buffer;

        memcpy(&pc->buffer[pc->index], *buf, *buf_size);
        pc->index += *buf_size;
        return -1;
    }

    if(pc->index){
        new_buffer= av_fast_realloc(pc->buffer, &pc->buffer_size, next + pc->index + FF_INPUT_BUFFER_PADDING_SIZE);
        if(!new_buffer)
            goto alloc_failed;
        pc->buffer= new_buffer;

        /* the padding behind the frame is copied too, so the input must provide it */
        memcpy(&pc->buffer[pc->index], *buf, next + FF_INPUT_BUFFER_PADDING_SIZE );
        pc->index = 0;
        *buf= pc->buffer;
        *buf_size= pc->last_index + next;
    }

    return 0;

alloc_failed:
    /* Keep the old pointer so it is not leaked, but forget the buffered data.
       NOTE(review): assumes av_fast_realloc() leaves the old block valid on
       failure (realloc semantics) -- confirm. buffer_size is reset because the
       helper may already have stored the larger size it failed to allocate. */
    pc->buffer_size= 0;
    pc->index= 0;
    return -1;
}

2623
#ifdef CONFIG_ENCODERS
2624
/**
 * Appends the first length bits of src to pb.
 * The source is read as a big-endian bit string: bit 7 of src[0] comes first.
 * Only the bytes that actually hold the requested bits are read, and src needs
 * no particular alignment.
 *
 * @param pb     destination bit writer
 * @param src    source bytes
 * @param length number of bits to copy; values <= 0 copy nothing
 */
void ff_copy_bits(PutBitContext *pb, uint8_t *src, int length)
{
    const int words= length>>4;   /* complete 16 bit units */
    const int bits= length&15;    /* bits left over after them */
    int i;

    if(length<=0) return;

    for(i=0; i<words; i++)
        put_bits(pb, 16, (src[2*i]<<8) | src[2*i+1]);

    if(bits){
        /* take the top 'bits' bits of the next 16 bit unit; the second byte
           is only touched when more than 8 bits remain */
        unsigned int tail= src[2*words]<<8;
        if(bits>8)
            tail|= src[2*words+1];
        put_bits(pb, bits, tail>>(16-bits));
    }
}

2636
/**
 * Copies from s to d the state that has to be restored before a macroblock is
 * trial encoded: motion vector and DC predictors, the bit statistics, the
 * skip flag and the quantizer. d->last_bits is reset to 0.
 * The type argument is not used.
 */
static inline void copy_context_before_encode(MpegEncContext *d, MpegEncContext *s, int type){
    /* predictors */
    memcpy(d->last_mv, s->last_mv, 2*2*2*sizeof(int)); //FIXME is memcpy faster then a loop?
    d->last_dc[0]= s->last_dc[0];
    d->last_dc[1]= s->last_dc[1];
    d->last_dc[2]= s->last_dc[2];

    /* mpeg1 */
    d->mb_incr= s->mb_incr;

    /* statistics */
    d->mv_bits   = s->mv_bits;
    d->i_tex_bits= s->i_tex_bits;
    d->p_tex_bits= s->p_tex_bits;
    d->misc_bits = s->misc_bits;
    d->i_count   = s->i_count;
    d->f_count   = s->f_count;
    d->b_count   = s->b_count;
    d->skip_count= s->skip_count;
    d->last_bits = 0;

    /* macroblock state */
    d->mb_skiped= s->mb_skiped;
    d->qscale   = s->qscale;
}

2661
/**
 * Copies from s to d the result of a macroblock trial encode: motion vectors
 * and predictors, bit statistics, macroblock mode, the bit writers (the
 * partition writers only when data partitioning is on), the block pointer
 * with its last indexes, the interlaced DCT flag and the quantizer.
 * The type argument is not used.
 */
static inline void copy_context_after_encode(MpegEncContext *d, MpegEncContext *s, int type){
    int blk;

    /* motion vectors and predictors */
    memcpy(d->mv, s->mv, 2*4*2*sizeof(int));
    memcpy(d->last_mv, s->last_mv, 2*2*2*sizeof(int)); //FIXME is memcpy faster then a loop?
    d->last_dc[0]= s->last_dc[0];
    d->last_dc[1]= s->last_dc[1];
    d->last_dc[2]= s->last_dc[2];

    /* mpeg1 */
    d->mb_incr= s->mb_incr;

    /* statistics */
    d->mv_bits   = s->mv_bits;
    d->i_tex_bits= s->i_tex_bits;
    d->p_tex_bits= s->p_tex_bits;
    d->misc_bits = s->misc_bits;
    d->i_count   = s->i_count;
    d->f_count   = s->f_count;
    d->b_count   = s->b_count;
    d->skip_count= s->skip_count;

    /* macroblock mode */
    d->mb_intra      = s->mb_intra;
    d->mb_skiped     = s->mb_skiped;
    d->mv_type       = s->mv_type;
    d->mv_dir        = s->mv_dir;
    d->interlaced_dct= s->interlaced_dct;
    d->qscale        = s->qscale;

    /* bit writers */
    d->pb= s->pb;
    if(s->data_partitioning){
        d->pb2   = s->pb2;
        d->tex_pb= s->tex_pb;
    }

    /* coefficients */
    d->block= s->block;
    for(blk=0; blk<6; blk++)
        d->block_last_index[blk]= s->block_last_index[blk];
}

2698 2699 2700 2701 2702 2703 2704 2705 2706 2707 2708 2709 2710 2711 2712 2713 2714 2715 2716 2717 2718 2719 2720 2721 2722 2723 2724 2725 2726 2727
/**
 * Trial encodes the current macroblock with the mode already set up in s and
 * keeps the result if it needs fewer bits than the best candidate so far.
 *
 * The context is first reset from backup, then the macroblock is encoded into
 * the scratch block set and bit writers selected by *next_block. If the bit
 * count is below *dmin, *dmin is updated, *next_block is toggled so the next
 * trial uses the other scratch slot, and the result is stored in best.
 *
 * @param type       forwarded to the context copy helpers
 * @param dmin       in/out: smallest bit count found so far
 * @param next_block in/out: index (0 or 1) of the scratch slot to encode into
 */
static inline void encode_mb_hq(MpegEncContext *s, MpegEncContext *backup, MpegEncContext *best, int type, 
                           PutBitContext pb[2], PutBitContext pb2[2], PutBitContext tex_pb[2],
                           int *dmin, int *next_block, int motion_x, int motion_y)
{
    const int slot= *next_block;
    int cost;

    copy_context_before_encode(s, backup, type);

    s->block= s->blocks[slot];
    s->pb= pb[slot];
    if(s->data_partitioning){
        s->pb2   = pb2   [slot];
        s->tex_pb= tex_pb[slot];
    }

    encode_mb(s, motion_x, motion_y);

    cost= get_bit_count(&s->pb);
    if(s->data_partitioning){
        cost+= get_bit_count(&s->pb2);
        cost+= get_bit_count(&s->tex_pb);
    }

    if(cost >= *dmin)
        return;                 /* not better, the scratch slot gets reused */

    *dmin= cost;
    *next_block= slot ^ 1;
    copy_context_after_encode(best, s, type);
}
2728 2729 2730 2731 2732 2733 2734
                
/**
 * Sum of squared differences between two w x h pixel areas sharing one stride.
 * 16x16 and 8x8 areas are handed to s->dsp.sse[0] / s->dsp.sse[1]; every other
 * size is summed here using the squareTbl lookup table.
 */
static inline int sse(MpegEncContext *s, uint8_t *src1, uint8_t *src2, int w, int h, int stride){
    uint32_t *sq = squareTbl + 256;  /* offset by 256 so it can be indexed with negative differences */
    int total=0;
    int row, col;

    if(w==16 && h==16)
        return s->dsp.sse[0](NULL, src1, src2, stride);
    if(w==8 && h==8)
        return s->dsp.sse[1](NULL, src1, src2, stride);

    for(row=0; row<h; row++){
        const uint8_t *a= src1 + row*stride;
        const uint8_t *b= src2 + row*stride;

        for(col=0; col<w; col++)
            total+= sq[a[col] - b[col]];
    }

    assert(total>=0);

    return total;
}
2749

2750 2751
static void encode_picture(MpegEncContext *s, int picture_number)
{
M
Michael Niedermayer 已提交
2752
    int mb_x, mb_y, pdif = 0;
2753
    int i;
2754
    int bits;
2755
    MpegEncContext best_s, backup_s;
2756 2757 2758
    uint8_t bit_buf[2][3000];
    uint8_t bit_buf2[2][3000];
    uint8_t bit_buf_tex[2][3000];
2759 2760 2761 2762 2763 2764 2765
    PutBitContext pb[2], pb2[2], tex_pb[2];

    for(i=0; i<2; i++){
        init_put_bits(&pb    [i], bit_buf    [i], 3000, NULL, NULL);
        init_put_bits(&pb2   [i], bit_buf2   [i], 3000, NULL, NULL);
        init_put_bits(&tex_pb[i], bit_buf_tex[i], 3000, NULL, NULL);
    }
F
Fabrice Bellard 已提交
2766 2767

    s->picture_number = picture_number;
2768

2769 2770 2771 2772 2773 2774 2775
    s->block_wrap[0]=
    s->block_wrap[1]=
    s->block_wrap[2]=
    s->block_wrap[3]= s->mb_width*2 + 2;
    s->block_wrap[4]=
    s->block_wrap[5]= s->mb_width + 2;
    
2776
    /* Reset the average MB variance */
M
cleanup  
Michael Niedermayer 已提交
2777 2778
    s->current_picture.mb_var_sum = 0;
    s->current_picture.mc_mb_var_sum = 0;
2779

M
Michael Niedermayer 已提交
2780
#ifdef CONFIG_RISKY
2781
    /* we need to initialize some time vars before we can encode b-frames */
2782 2783
    // RAL: Condition added for MPEG1VIDEO
    if (s->codec_id == CODEC_ID_MPEG1VIDEO || (s->h263_pred && !s->h263_msmpeg4))
2784
        ff_set_mpeg4_time(s, s->picture_number); 
M
Michael Niedermayer 已提交
2785 2786
#endif
        
2787
    s->scene_change_score=0;
2788 2789
    
    s->qscale= (int)(s->frame_qscale + 0.5); //FIXME qscale / ... stuff for ME ratedistoration
M
Michael Niedermayer 已提交
2790
    
M
Michael Niedermayer 已提交
2791 2792 2793 2794 2795
    if(s->pict_type==I_TYPE){
        if(s->msmpeg4_version) s->no_rounding=1;
        else                   s->no_rounding=0;
    }else if(s->pict_type!=B_TYPE){
        if(s->flipflop_rounding || s->codec_id == CODEC_ID_H263P || s->codec_id == CODEC_ID_MPEG4)
M
Michael Niedermayer 已提交
2796 2797
            s->no_rounding ^= 1;          
    }
M
Michael Niedermayer 已提交
2798
    
2799
    /* Estimate motion for every MB */
2800
    s->mb_intra=0; //for the rate distoration & bit compare functions
2801
    if(s->pict_type != I_TYPE){
M
Michael Niedermayer 已提交
2802 2803
        if(s->pict_type != B_TYPE){
            if((s->avctx->pre_me && s->last_non_b_pict_type==I_TYPE) || s->avctx->pre_me==2){
2804
                s->me.pre_pass=1;
M
Michael Niedermayer 已提交
2805
                s->me.dia_size= s->avctx->pre_dia_size;
2806

M
Michael Niedermayer 已提交
2807 2808 2809 2810 2811 2812 2813
                for(mb_y=s->mb_height-1; mb_y >=0 ; mb_y--) {
                    for(mb_x=s->mb_width-1; mb_x >=0 ; mb_x--) {
                        s->mb_x = mb_x;
                        s->mb_y = mb_y;
                        ff_pre_estimate_p_frame_motion(s, mb_x, mb_y);
                    }
                }
2814
                s->me.pre_pass=0;
M
Michael Niedermayer 已提交
2815 2816 2817
            }
        }

M
Michael Niedermayer 已提交
2818
        s->me.dia_size= s->avctx->dia_size;
2819 2820 2821 2822 2823 2824 2825 2826 2827 2828 2829 2830
        for(mb_y=0; mb_y < s->mb_height; mb_y++) {
            s->block_index[0]= s->block_wrap[0]*(mb_y*2 + 1) - 1;
            s->block_index[1]= s->block_wrap[0]*(mb_y*2 + 1);
            s->block_index[2]= s->block_wrap[0]*(mb_y*2 + 2) - 1;
            s->block_index[3]= s->block_wrap[0]*(mb_y*2 + 2);
            for(mb_x=0; mb_x < s->mb_width; mb_x++) {
                s->mb_x = mb_x;
                s->mb_y = mb_y;
                s->block_index[0]+=2;
                s->block_index[1]+=2;
                s->block_index[2]+=2;
                s->block_index[3]+=2;
M
Michael Niedermayer 已提交
2831
                
2832
                /* compute motion vector & mb_type and store in context */
2833 2834 2835 2836
                if(s->pict_type==B_TYPE)
                    ff_estimate_b_frame_motion(s, mb_x, mb_y);
                else
                    ff_estimate_p_frame_motion(s, mb_x, mb_y);
2837 2838
            }
        }
2839
    }else /* if(s->pict_type == I_TYPE) */{
2840 2841
        /* I-Frame */
        //FIXME do we need to zero them?
2842 2843 2844
        memset(s->motion_val[0], 0, sizeof(int16_t)*(s->mb_width*2 + 2)*(s->mb_height*2 + 2)*2);
        memset(s->p_mv_table   , 0, sizeof(int16_t)*(s->mb_width+2)*(s->mb_height+2)*2);
        memset(s->mb_type      , MB_TYPE_INTRA, sizeof(uint8_t)*s->mb_width*s->mb_height);
M
Michael Niedermayer 已提交
2845 2846 2847 2848 2849 2850 2851
        
        if(!s->fixed_qscale){
            /* finding spatial complexity for I-frame rate control */
            for(mb_y=0; mb_y < s->mb_height; mb_y++) {
                for(mb_x=0; mb_x < s->mb_width; mb_x++) {
                    int xx = mb_x * 16;
                    int yy = mb_y * 16;
M
cleanup  
Michael Niedermayer 已提交
2852
                    uint8_t *pix = s->new_picture.data[0] + (yy * s->linesize) + xx;
M
Michael Niedermayer 已提交
2853
                    int varc;
2854
		    int sum = s->dsp.pix_sum(pix, s->linesize);
M
Michael Niedermayer 已提交
2855
    
2856
		    varc = (s->dsp.pix_norm1(pix, s->linesize) - (((unsigned)(sum*sum))>>8) + 500 + 128)>>8;
M
Michael Niedermayer 已提交
2857

M
cleanup  
Michael Niedermayer 已提交
2858 2859 2860
                    s->current_picture.mb_var [s->mb_width * mb_y + mb_x] = varc;
                    s->current_picture.mb_mean[s->mb_width * mb_y + mb_x] = (sum+128)>>8;
                    s->current_picture.mb_var_sum    += varc;
M
Michael Niedermayer 已提交
2861 2862 2863
                }
            }
        }
2864
    }
2865 2866
    emms_c();

2867
    if(s->scene_change_score > 0 && s->pict_type == P_TYPE){
M
Michael Niedermayer 已提交
2868
        s->pict_type= I_TYPE;
2869
        memset(s->mb_type   , MB_TYPE_INTRA, sizeof(uint8_t)*s->mb_width*s->mb_height);
M
cleanup  
Michael Niedermayer 已提交
2870
//printf("Scene change detected, encoding as I Frame %d %d\n", s->current_picture.mb_var_sum, s->current_picture.mc_mb_var_sum);
M
Michael Niedermayer 已提交
2871
    }
M
cleanup  
Michael Niedermayer 已提交
2872

M
Michael Niedermayer 已提交
2873
    if(!s->umvplus){
2874 2875
        if(s->pict_type==P_TYPE || s->pict_type==S_TYPE) {
            s->f_code= ff_get_best_fcode(s, s->p_mv_table, MB_TYPE_INTER);
2876
        
2877 2878
            ff_fix_long_p_mvs(s);
        }
2879

2880 2881
        if(s->pict_type==B_TYPE){
            int a, b;
2882

2883 2884 2885
            a = ff_get_best_fcode(s, s->b_forw_mv_table, MB_TYPE_FORWARD);
            b = ff_get_best_fcode(s, s->b_bidir_forw_mv_table, MB_TYPE_BIDIR);
            s->f_code = FFMAX(a, b);
2886

2887 2888 2889
            a = ff_get_best_fcode(s, s->b_back_mv_table, MB_TYPE_BACKWARD);
            b = ff_get_best_fcode(s, s->b_bidir_back_mv_table, MB_TYPE_BIDIR);
            s->b_code = FFMAX(a, b);
2890

2891 2892 2893 2894 2895
            ff_fix_long_b_mvs(s, s->b_forw_mv_table, s->f_code, MB_TYPE_FORWARD);
            ff_fix_long_b_mvs(s, s->b_back_mv_table, s->b_code, MB_TYPE_BACKWARD);
            ff_fix_long_b_mvs(s, s->b_bidir_forw_mv_table, s->f_code, MB_TYPE_BIDIR);
            ff_fix_long_b_mvs(s, s->b_bidir_back_mv_table, s->b_code, MB_TYPE_BIDIR);
        }
2896
    }
2897
    
2898
    if (s->fixed_qscale) 
M
cleanup  
Michael Niedermayer 已提交
2899
        s->frame_qscale = s->current_picture.quality;
2900 2901
    else
        s->frame_qscale = ff_rate_estimate_qscale(s);
2902

2903
    if(s->adaptive_quant){
M
Michael Niedermayer 已提交
2904
#ifdef CONFIG_RISKY
2905 2906 2907 2908 2909 2910 2911 2912 2913
        switch(s->codec_id){
        case CODEC_ID_MPEG4:
            ff_clean_mpeg4_qscales(s);
            break;
        case CODEC_ID_H263:
        case CODEC_ID_H263P:
            ff_clean_h263_qscales(s);
            break;
        }
M
Michael Niedermayer 已提交
2914
#endif
2915

M
cleanup  
Michael Niedermayer 已提交
2916
        s->qscale= s->current_picture.qscale_table[0];
2917
    }else
2918 2919
        s->qscale= (int)(s->frame_qscale + 0.5);
        
F
Fabrice Bellard 已提交
2920 2921
    if (s->out_format == FMT_MJPEG) {
        /* for mjpeg, we do include qscale in the matrix */
2922
        s->intra_matrix[0] = ff_mpeg1_default_intra_matrix[0];
2923
        for(i=1;i<64;i++){
2924
            int j= s->dsp.idct_permutation[i];
2925 2926 2927

            s->intra_matrix[j] = CLAMP_TO_8BIT((ff_mpeg1_default_intra_matrix[i] * s->qscale) >> 3);
        }
2928
        convert_matrix(s, s->q_intra_matrix, s->q_intra_matrix16, 
2929
                       s->q_intra_matrix16_bias, s->intra_matrix, s->intra_quant_bias, 8, 8);
F
Fabrice Bellard 已提交
2930
    }
M
cleanup  
Michael Niedermayer 已提交
2931 2932 2933 2934 2935 2936 2937
    
    //FIXME var duplication
    s->current_picture.key_frame= s->pict_type == I_TYPE;
    s->current_picture.pict_type= s->pict_type;

    if(s->current_picture.key_frame)
        s->picture_in_gop_number=0;
F
Fabrice Bellard 已提交
2938

2939
    s->last_bits= get_bit_count(&s->pb);
F
Fabrice Bellard 已提交
2940 2941 2942 2943
    switch(s->out_format) {
    case FMT_MJPEG:
        mjpeg_picture_header(s);
        break;
M
Michael Niedermayer 已提交
2944
#ifdef CONFIG_RISKY
F
Fabrice Bellard 已提交
2945
    case FMT_H263:
M
Michael Niedermayer 已提交
2946 2947 2948
        if (s->codec_id == CODEC_ID_WMV2) 
            ff_wmv2_encode_picture_header(s, picture_number);
        else if (s->h263_msmpeg4) 
F
Fabrice Bellard 已提交
2949 2950 2951 2952 2953 2954 2955 2956
            msmpeg4_encode_picture_header(s, picture_number);
        else if (s->h263_pred)
            mpeg4_encode_picture_header(s, picture_number);
        else if (s->h263_rv10) 
            rv10_encode_picture_header(s, picture_number);
        else
            h263_encode_picture_header(s, picture_number);
        break;
M
Michael Niedermayer 已提交
2957
#endif
F
Fabrice Bellard 已提交
2958 2959 2960 2961
    case FMT_MPEG1:
        mpeg1_encode_picture_header(s, picture_number);
        break;
    }
2962 2963 2964 2965 2966 2967 2968 2969
    bits= get_bit_count(&s->pb);
    s->header_bits= bits - s->last_bits;
    s->last_bits= bits;
    s->mv_bits=0;
    s->misc_bits=0;
    s->i_tex_bits=0;
    s->p_tex_bits=0;
    s->i_count=0;
2970 2971
    s->f_count=0;
    s->b_count=0;
2972 2973
    s->skip_count=0;

2974 2975 2976 2977 2978 2979 2980
    for(i=0; i<3; i++){
        /* init last dc values */
        /* note: quant matrix value (8) is implied here */
        s->last_dc[i] = 128;
        
        s->current_picture.error[i] = 0;
    }
F
Fabrice Bellard 已提交
2981 2982 2983
    s->mb_incr = 1;
    s->last_mv[0][0][0] = 0;
    s->last_mv[0][0][1] = 0;
2984 2985 2986 2987
    s->last_mv[1][0][0] = 0;
    s->last_mv[1][0][1] = 0;
     
    s->last_mv_dir = 0;
F
Fabrice Bellard 已提交
2988

M
Michael Niedermayer 已提交
2989
#ifdef CONFIG_RISKY
M
Michael Niedermayer 已提交
2990
    if (s->codec_id==CODEC_ID_H263 || s->codec_id==CODEC_ID_H263P)
2991
        s->gob_index = ff_h263_get_gob_height(s);
2992

2993
    if(s->codec_id==CODEC_ID_MPEG4 && s->partitioned_frame)
2994
        ff_mpeg4_init_partitions(s);
M
Michael Niedermayer 已提交
2995
#endif
2996 2997 2998

    s->resync_mb_x=0;
    s->resync_mb_y=0;
2999
    s->first_slice_line = 1;
M
Michael Niedermayer 已提交
3000 3001
    s->ptr_lastgob = s->pb.buf;
    s->ptr_last_mb_line = s->pb.buf;
3002
    for(mb_y=0; mb_y < s->mb_height; mb_y++) {
M
Michael Niedermayer 已提交
3003 3004
        s->y_dc_scale= s->y_dc_scale_table[ s->qscale ];
        s->c_dc_scale= s->c_dc_scale_table[ s->qscale ];
3005
        
M
Michael Niedermayer 已提交
3006 3007 3008 3009 3010 3011
        s->block_index[0]= s->block_wrap[0]*(mb_y*2 + 1) - 1;
        s->block_index[1]= s->block_wrap[0]*(mb_y*2 + 1);
        s->block_index[2]= s->block_wrap[0]*(mb_y*2 + 2) - 1;
        s->block_index[3]= s->block_wrap[0]*(mb_y*2 + 2);
        s->block_index[4]= s->block_wrap[4]*(mb_y + 1)                    + s->block_wrap[0]*(s->mb_height*2 + 2);
        s->block_index[5]= s->block_wrap[4]*(mb_y + 1 + s->mb_height + 2) + s->block_wrap[0]*(s->mb_height*2 + 2);
3012
        for(mb_x=0; mb_x < s->mb_width; mb_x++) {
3013
            int mb_type= s->mb_type[mb_y * s->mb_width + mb_x];
3014
            const int xy= (mb_y+1) * (s->mb_width+2) + mb_x + 1;
3015
//            int d;
3016
            int dmin=10000000;
3017 3018 3019

            s->mb_x = mb_x;
            s->mb_y = mb_y;
M
Michael Niedermayer 已提交
3020 3021 3022 3023 3024 3025
            s->block_index[0]+=2;
            s->block_index[1]+=2;
            s->block_index[2]+=2;
            s->block_index[3]+=2;
            s->block_index[4]++;
            s->block_index[5]++;
M
Michael Niedermayer 已提交
3026 3027

            /* write gob / video packet header  */
M
Michael Niedermayer 已提交
3028
#ifdef CONFIG_RISKY
M
Michael Niedermayer 已提交
3029 3030 3031 3032 3033 3034 3035 3036 3037 3038
            if(s->rtp_mode){
                int current_packet_size, is_gob_start;
                
                current_packet_size= pbBufPtr(&s->pb) - s->ptr_lastgob;
                is_gob_start=0;
                
                if(s->codec_id==CODEC_ID_MPEG4){
                    if(current_packet_size + s->mb_line_avgsize/s->mb_width >= s->rtp_payload_size
                       && s->mb_y + s->mb_x>0){

3039
                        if(s->partitioned_frame){
3040 3041 3042 3043 3044 3045 3046 3047 3048 3049 3050
                            ff_mpeg4_merge_partitions(s);
                            ff_mpeg4_init_partitions(s);
                        }
                        ff_mpeg4_encode_video_packet_header(s);

                        if(s->flags&CODEC_FLAG_PASS1){
                            int bits= get_bit_count(&s->pb);
                            s->misc_bits+= bits - s->last_bits;
                            s->last_bits= bits;
                        }
                        ff_mpeg4_clean_buffers(s);
M
Michael Niedermayer 已提交
3051
                        is_gob_start=1;
3052
                    }
M
Michael Niedermayer 已提交
3053 3054 3055 3056 3057 3058 3059 3060 3061 3062
                }else{
                    if(current_packet_size + s->mb_line_avgsize*s->gob_index >= s->rtp_payload_size
                       && s->mb_x==0 && s->mb_y>0 && s->mb_y%s->gob_index==0){
                       
                        h263_encode_gob_header(s, mb_y);                       
                        is_gob_start=1;
                    }
                }

                if(is_gob_start){
3063 3064 3065 3066 3067
                    s->ptr_lastgob = pbBufPtr(&s->pb);
                    s->first_slice_line=1;
                    s->resync_mb_x=mb_x;
                    s->resync_mb_y=mb_y;
                }
3068
            }
M
Michael Niedermayer 已提交
3069
#endif
3070

3071 3072 3073
            if(  (s->resync_mb_x   == s->mb_x)
               && s->resync_mb_y+1 == s->mb_y){
                s->first_slice_line=0; 
3074 3075
            }

3076
            if(mb_type & (mb_type-1)){ // more than 1 MB type possible
3077
                int next_block=0;
3078
                int pb_bits_count, pb2_bits_count, tex_pb_bits_count;
3079 3080

                copy_context_before_encode(&backup_s, s, -1);
3081 3082
                backup_s.pb= s->pb;
                best_s.data_partitioning= s->data_partitioning;
3083
                best_s.partitioned_frame= s->partitioned_frame;
3084 3085 3086 3087
                if(s->data_partitioning){
                    backup_s.pb2= s->pb2;
                    backup_s.tex_pb= s->tex_pb;
                }
3088

3089
                if(mb_type&MB_TYPE_INTER){
3090
                    s->mv_dir = MV_DIR_FORWARD;
M
Michael Niedermayer 已提交
3091
                    s->mv_type = MV_TYPE_16X16;
3092
                    s->mb_intra= 0;
3093 3094
                    s->mv[0][0][0] = s->p_mv_table[xy][0];
                    s->mv[0][0][1] = s->p_mv_table[xy][1];
3095 3096
                    encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_INTER, pb, pb2, tex_pb, 
                                 &dmin, &next_block, s->mv[0][0][0], s->mv[0][0][1]);
F
Fabrice Bellard 已提交
3097
                }
3098
                if(mb_type&MB_TYPE_INTER4V){                 
3099
                    s->mv_dir = MV_DIR_FORWARD;
M
Michael Niedermayer 已提交
3100 3101 3102 3103 3104 3105
                    s->mv_type = MV_TYPE_8X8;
                    s->mb_intra= 0;
                    for(i=0; i<4; i++){
                        s->mv[0][i][0] = s->motion_val[s->block_index[i]][0];
                        s->mv[0][i][1] = s->motion_val[s->block_index[i]][1];
                    }
3106 3107
                    encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_INTER4V, pb, pb2, tex_pb, 
                                 &dmin, &next_block, 0, 0);
3108 3109 3110 3111 3112 3113 3114
                }
                if(mb_type&MB_TYPE_FORWARD){
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mv_type = MV_TYPE_16X16;
                    s->mb_intra= 0;
                    s->mv[0][0][0] = s->b_forw_mv_table[xy][0];
                    s->mv[0][0][1] = s->b_forw_mv_table[xy][1];
3115 3116
                    encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_FORWARD, pb, pb2, tex_pb, 
                                 &dmin, &next_block, s->mv[0][0][0], s->mv[0][0][1]);
3117 3118 3119 3120 3121 3122 3123
                }
                if(mb_type&MB_TYPE_BACKWARD){
                    s->mv_dir = MV_DIR_BACKWARD;
                    s->mv_type = MV_TYPE_16X16;
                    s->mb_intra= 0;
                    s->mv[1][0][0] = s->b_back_mv_table[xy][0];
                    s->mv[1][0][1] = s->b_back_mv_table[xy][1];
3124 3125
                    encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_BACKWARD, pb, pb2, tex_pb, 
                                 &dmin, &next_block, s->mv[1][0][0], s->mv[1][0][1]);
3126 3127 3128 3129 3130 3131 3132 3133 3134
                }
                if(mb_type&MB_TYPE_BIDIR){
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
                    s->mv_type = MV_TYPE_16X16;
                    s->mb_intra= 0;
                    s->mv[0][0][0] = s->b_bidir_forw_mv_table[xy][0];
                    s->mv[0][0][1] = s->b_bidir_forw_mv_table[xy][1];
                    s->mv[1][0][0] = s->b_bidir_back_mv_table[xy][0];
                    s->mv[1][0][1] = s->b_bidir_back_mv_table[xy][1];
3135 3136
                    encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_BIDIR, pb, pb2, tex_pb, 
                                 &dmin, &next_block, 0, 0);
3137 3138
                }
                if(mb_type&MB_TYPE_DIRECT){
M
Michael Niedermayer 已提交
3139 3140 3141
                    int mx= s->b_direct_mv_table[xy][0];
                    int my= s->b_direct_mv_table[xy][1];
                    
3142 3143
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD | MV_DIRECT;
                    s->mb_intra= 0;
M
Michael Niedermayer 已提交
3144
#ifdef CONFIG_RISKY
M
Michael Niedermayer 已提交
3145
                    ff_mpeg4_set_direct_mv(s, mx, my);
M
Michael Niedermayer 已提交
3146
#endif
3147
                    encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_DIRECT, pb, pb2, tex_pb, 
M
Michael Niedermayer 已提交
3148
                                 &dmin, &next_block, mx, my);
M
Michael Niedermayer 已提交
3149
                }
3150
                if(mb_type&MB_TYPE_INTRA){
3151
                    s->mv_dir = 0;
M
Michael Niedermayer 已提交
3152
                    s->mv_type = MV_TYPE_16X16;
3153 3154 3155
                    s->mb_intra= 1;
                    s->mv[0][0][0] = 0;
                    s->mv[0][0][1] = 0;
3156 3157
                    encode_mb_hq(s, &backup_s, &best_s, MB_TYPE_INTRA, pb, pb2, tex_pb, 
                                 &dmin, &next_block, 0, 0);
3158 3159 3160
                    /* force cleaning of ac/dc pred stuff if needed ... */
                    if(s->h263_pred || s->h263_aic)
                        s->mbintra_table[mb_x + mb_y*s->mb_width]=1;
M
Michael Niedermayer 已提交
3161
                }
3162
                copy_context_after_encode(s, &best_s, -1);
3163 3164 3165 3166 3167 3168 3169 3170 3171 3172 3173 3174 3175 3176 3177 3178 3179
                
                pb_bits_count= get_bit_count(&s->pb);
                flush_put_bits(&s->pb);
                ff_copy_bits(&backup_s.pb, bit_buf[next_block^1], pb_bits_count);
                s->pb= backup_s.pb;
                
                if(s->data_partitioning){
                    pb2_bits_count= get_bit_count(&s->pb2);
                    flush_put_bits(&s->pb2);
                    ff_copy_bits(&backup_s.pb2, bit_buf2[next_block^1], pb2_bits_count);
                    s->pb2= backup_s.pb2;
                    
                    tex_pb_bits_count= get_bit_count(&s->tex_pb);
                    flush_put_bits(&s->tex_pb);
                    ff_copy_bits(&backup_s.tex_pb, bit_buf_tex[next_block^1], tex_pb_bits_count);
                    s->tex_pb= backup_s.tex_pb;
                }
3180
                s->last_bits= get_bit_count(&s->pb);
F
Fabrice Bellard 已提交
3181
            } else {
3182
                int motion_x, motion_y;
3183 3184 3185 3186 3187 3188 3189 3190 3191 3192 3193 3194 3195 3196 3197 3198 3199 3200 3201 3202 3203 3204 3205 3206 3207 3208 3209 3210 3211 3212 3213 3214 3215 3216 3217 3218 3219 3220 3221 3222 3223 3224 3225 3226 3227 3228 3229 3230 3231 3232 3233 3234 3235 3236 3237 3238 3239 3240 3241 3242 3243 3244 3245 3246 3247 3248 3249 3250 3251 3252 3253 3254 3255 3256 3257 3258 3259 3260 3261 3262 3263 3264 3265 3266
                int intra_score;
                int inter_score= s->current_picture.mb_cmp_score[mb_x + mb_y*s->mb_width];
                
              if(!(s->flags&CODEC_FLAG_HQ) && s->pict_type==P_TYPE){
                /* get luma score */
                if((s->avctx->mb_cmp&0xFF)==FF_CMP_SSE){
                    intra_score= (s->current_picture.mb_var[mb_x + mb_y*s->mb_width]<<8) - 500; //FIXME dont scale it down so we dont have to fix it
                }else{
                    uint8_t *dest_y;

                    int mean= s->current_picture.mb_mean[mb_x + mb_y*s->mb_width]; //FIXME
                    mean*= 0x01010101;
                    
                    dest_y  = s->new_picture.data[0] + (mb_y * 16 * s->linesize    ) + mb_x * 16;
                
                    for(i=0; i<16; i++){
                        *(uint32_t*)(&s->me.scratchpad[i*s->linesize+ 0]) = mean;
                        *(uint32_t*)(&s->me.scratchpad[i*s->linesize+ 4]) = mean;
                        *(uint32_t*)(&s->me.scratchpad[i*s->linesize+ 8]) = mean;
                        *(uint32_t*)(&s->me.scratchpad[i*s->linesize+12]) = mean;
                    }

                    s->mb_intra=1;
                    intra_score= s->dsp.mb_cmp[0](s, s->me.scratchpad, dest_y, s->linesize);
                                        
/*                    printf("intra:%7d inter:%7d var:%7d mc_var.%7d\n", intra_score>>8, inter_score>>8, 
                        s->current_picture.mb_var[mb_x + mb_y*s->mb_width],
                        s->current_picture.mc_mb_var[mb_x + mb_y*s->mb_width]);*/
                }
                
                /* get chroma score */
                if(s->avctx->mb_cmp&FF_CMP_CHROMA){
                    int i;
                    
                    s->mb_intra=1;
                    for(i=1; i<3; i++){
                        uint8_t *dest_c;
                        int mean;
                        
                        if(s->out_format == FMT_H263){
                            mean= (s->dc_val[i][mb_x + (mb_y+1)*(s->mb_width+2)] + 4)>>3; //FIXME not exact but simple ;)
                        }else{
                            mean= (s->last_dc[i] + 4)>>3;
                        }
                        dest_c = s->new_picture.data[i] + (mb_y * 8  * (s->uvlinesize)) + mb_x * 8;
                        
                        mean*= 0x01010101;
                        for(i=0; i<8; i++){
                            *(uint32_t*)(&s->me.scratchpad[i*s->uvlinesize+ 0]) = mean;
                            *(uint32_t*)(&s->me.scratchpad[i*s->uvlinesize+ 4]) = mean;
                        }
                        
                        intra_score+= s->dsp.mb_cmp[1](s, s->me.scratchpad, dest_c, s->uvlinesize);
                    }                
                }

                /* bias */
                switch(s->avctx->mb_cmp&0xFF){
                default:
                case FF_CMP_SAD:
                    intra_score+= 32*s->qscale;
                    break;
                case FF_CMP_SSE:
                    intra_score+= 24*s->qscale*s->qscale;
                    break;
                case FF_CMP_SATD:
                    intra_score+= 96*s->qscale;
                    break;
                case FF_CMP_DCT:
                    intra_score+= 48*s->qscale;
                    break;
                case FF_CMP_BIT:
                    intra_score+= 16;
                    break;
                case FF_CMP_PSNR:
                case FF_CMP_RD:
                    intra_score+= (s->qscale*s->qscale*109*8 + 64)>>7;
                    break;
                }

                if(intra_score < inter_score)
                    mb_type= MB_TYPE_INTRA;
              }  
                
3267
                s->mv_type=MV_TYPE_16X16;
3268
                // only one MB-Type possible
3269
                
3270 3271
                switch(mb_type){
                case MB_TYPE_INTRA:
3272
                    s->mv_dir = 0;
3273
                    s->mb_intra= 1;
3274 3275
                    motion_x= s->mv[0][0][0] = 0;
                    motion_y= s->mv[0][0][1] = 0;
3276 3277
                    break;
                case MB_TYPE_INTER:
3278 3279 3280 3281
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mb_intra= 0;
                    motion_x= s->mv[0][0][0] = s->p_mv_table[xy][0];
                    motion_y= s->mv[0][0][1] = s->p_mv_table[xy][1];
3282
                    break;
3283 3284 3285 3286 3287 3288 3289 3290 3291 3292
                case MB_TYPE_INTER4V:
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mv_type = MV_TYPE_8X8;
                    s->mb_intra= 0;
                    for(i=0; i<4; i++){
                        s->mv[0][i][0] = s->motion_val[s->block_index[i]][0];
                        s->mv[0][i][1] = s->motion_val[s->block_index[i]][1];
                    }
                    motion_x= motion_y= 0;
                    break;
3293
                case MB_TYPE_DIRECT:
3294 3295
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD | MV_DIRECT;
                    s->mb_intra= 0;
3296 3297
                    motion_x=s->b_direct_mv_table[xy][0];
                    motion_y=s->b_direct_mv_table[xy][1];
M
Michael Niedermayer 已提交
3298
#ifdef CONFIG_RISKY
M
Michael Niedermayer 已提交
3299
                    ff_mpeg4_set_direct_mv(s, motion_x, motion_y);
M
Michael Niedermayer 已提交
3300
#endif
3301 3302
                    break;
                case MB_TYPE_BIDIR:
3303
                    s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD;
3304
                    s->mb_intra= 0;
3305 3306 3307 3308 3309 3310
                    motion_x=0;
                    motion_y=0;
                    s->mv[0][0][0] = s->b_bidir_forw_mv_table[xy][0];
                    s->mv[0][0][1] = s->b_bidir_forw_mv_table[xy][1];
                    s->mv[1][0][0] = s->b_bidir_back_mv_table[xy][0];
                    s->mv[1][0][1] = s->b_bidir_back_mv_table[xy][1];
3311 3312
                    break;
                case MB_TYPE_BACKWARD:
3313 3314 3315 3316
                    s->mv_dir = MV_DIR_BACKWARD;
                    s->mb_intra= 0;
                    motion_x= s->mv[1][0][0] = s->b_back_mv_table[xy][0];
                    motion_y= s->mv[1][0][1] = s->b_back_mv_table[xy][1];
3317 3318
                    break;
                case MB_TYPE_FORWARD:
3319 3320 3321 3322 3323
                    s->mv_dir = MV_DIR_FORWARD;
                    s->mb_intra= 0;
                    motion_x= s->mv[0][0][0] = s->b_forw_mv_table[xy][0];
                    motion_y= s->mv[0][0][1] = s->b_forw_mv_table[xy][1];
//                    printf(" %d %d ", motion_x, motion_y);
3324 3325
                    break;
                default:
3326 3327
                    motion_x=motion_y=0; //gcc warning fix
                    printf("illegal MB type\n");
3328
                }
3329

3330
                encode_mb(s, motion_x, motion_y);
3331 3332 3333

                // RAL: Update last macroblock type
                s->last_mv_dir = s->mv_dir;
F
Fabrice Bellard 已提交
3334
            }
3335

3336 3337 3338 3339 3340
            /* clean the MV table in IPS frames for direct mode in B frames */
            if(s->mb_intra /* && I,P,S_TYPE */){
                s->p_mv_table[xy][0]=0;
                s->p_mv_table[xy][1]=0;
            }
F
Fabrice Bellard 已提交
3341

3342
            MPV_decode_mb(s, s->block);
3343 3344 3345 3346 3347 3348 3349
            
            if(s->flags&CODEC_FLAG_PSNR){
                int w= 16;
                int h= 16;

                if(s->mb_x*16 + 16 > s->width ) w= s->width - s->mb_x*16;
                if(s->mb_y*16 + 16 > s->height) h= s->height- s->mb_y*16;
M
Michael Niedermayer 已提交
3350

3351 3352 3353 3354 3355 3356 3357 3358 3359 3360 3361 3362 3363 3364 3365 3366
                s->current_picture.error[0] += sse(
                    s,
                    s->new_picture    .data[0] + s->mb_x*16 + s->mb_y*s->linesize*16,
                    s->current_picture.data[0] + s->mb_x*16 + s->mb_y*s->linesize*16,
                    w, h, s->linesize);
                s->current_picture.error[1] += sse(
                    s,
                    s->new_picture    .data[1] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,
                    s->current_picture.data[1] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,
                    w>>1, h>>1, s->uvlinesize);
                s->current_picture.error[2] += sse(
                    s,
                    s->new_picture    .data[2] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,
                    s->current_picture.data[2] + s->mb_x*8  + s->mb_y*s->uvlinesize*8,
                    w>>1, h>>1, s->uvlinesize);
            }
3367
//printf("MB %d %d bits\n", s->mb_x+s->mb_y*s->mb_width, get_bit_count(&s->pb));
F
Fabrice Bellard 已提交
3368
        }
3369 3370


M
Michael Niedermayer 已提交
3371
        /* Obtain average mb_row size for RTP */
3372
        if (s->rtp_mode) {
M
Michael Niedermayer 已提交
3373
            if (mb_y==0)
3374
                s->mb_line_avgsize = pbBufPtr(&s->pb) - s->ptr_last_mb_line;
M
Michael Niedermayer 已提交
3375
            else {    
3376
                s->mb_line_avgsize = (s->mb_line_avgsize + pbBufPtr(&s->pb) - s->ptr_last_mb_line) >> 1;
3377
            }
M
Michael Niedermayer 已提交
3378
            s->ptr_last_mb_line = pbBufPtr(&s->pb);
3379
        }
F
Fabrice Bellard 已提交
3380
    }
3381
    emms_c();
3382

M
Michael Niedermayer 已提交
3383
#ifdef CONFIG_RISKY
3384
    if(s->codec_id==CODEC_ID_MPEG4 && s->partitioned_frame)
3385 3386 3387
        ff_mpeg4_merge_partitions(s);

    if (s->msmpeg4_version && s->msmpeg4_version<4 && s->pict_type == I_TYPE)
M
Michael Niedermayer 已提交
3388 3389
        msmpeg4_encode_ext_header(s);

3390 3391
    if(s->codec_id==CODEC_ID_MPEG4) 
        ff_mpeg4_stuffing(&s->pb);
M
Michael Niedermayer 已提交
3392
#endif
3393

3394 3395
    //if (s->gob_number)
    //    fprintf(stderr,"\nNumber of GOB: %d", s->gob_number);
3396 3397 3398 3399
    
    /* Send the last GOB if RTP */    
    if (s->rtp_mode) {
        flush_put_bits(&s->pb);
3400
        pdif = pbBufPtr(&s->pb) - s->ptr_lastgob;
3401 3402 3403
        /* Call the RTP callback to send the last GOB */
        if (s->rtp_callback)
            s->rtp_callback(s->ptr_lastgob, pdif, s->gob_number);
3404
        s->ptr_lastgob = pbBufPtr(&s->pb);
3405 3406
        //fprintf(stderr,"\nGOB: %2d size: %d (last)", s->gob_number, pdif);
    }
F
Fabrice Bellard 已提交
3407 3408
}

M
Michael Niedermayer 已提交
3409 3410 3411 3412
/**
 * Forward-DCT one 8x8 block and quantize it with a rate-distortion
 * ("trellis") search instead of plain rounding.
 *
 * For every AC coefficient in scan order up to two candidate levels are
 * kept: the rounded quantized level and the level one step closer to zero.
 * A dynamic-programming pass over (run, level) pairs then records, for each
 * scan position, the cheapest way to end a coded coefficient there, where
 *   cost = squared reconstruction error + lambda * length-table entry
 * (esc_length replaces the table entry for levels outside -64..63).
 *
 * @param s        encoder context; mb_intra, out_format, the quantization
 *                 matrices, the DC scales and the AC length tables are read
 * @param block    transformed in place by s->dsp.fdct, then overwritten with
 *                 the chosen levels at their s->dsp.idct_permutation positions
 * @param n        block number; only used to pick y_dc_scale (n < 4) or
 *                 c_dc_scale for the intra DC coefficient
 * @param qscale   quantizer scale
 * @param overflow set to non-zero when the bitwise OR of all rounded
 *                 magnitudes exceeds s->max_qcoeff (overflow may have happened)
 * @return scan index of the last non-zero coefficient; when no AC coefficient
 *         is coded this is 0 for intra blocks and -1 for inter blocks
 */
static int dct_quantize_trellis_c(MpegEncContext *s, 
                        DCTELEM *block, int n,
                        int qscale, int *overflow){
    const int *qmat;
    const uint8_t *scantable= s->intra_scantable.scantable;
    int max=0;
    unsigned int threshold1, threshold2;
    int bias=0;
    int run_tab[65];
    int level_tab[65];
    int score_tab[65];
    int last_run=0;
    int last_level=0;
    int last_score= 0;
    int last_i= 0;
    /* candidate 0: rounded level, candidate 1: one step towards zero */
    int coeff[2][64];
    int coeff_count[64];
    int lambda, qmul, qadd, start_i, last_non_zero, i;
    const int esc_length= s->ac_esc_length;
    uint8_t * length;
    uint8_t * last_length;
    int score_limit=0;
    int left_limit= 0;

    s->dsp.fdct (block);

    qmul= qscale*16;
    qadd= ((qscale-1)|1)*8;

    if (s->mb_intra) {
        int q;
        if (!s->h263_aic) {
            if (n < 4)
                q = s->y_dc_scale;
            else
                q = s->c_dc_scale;
            q = q << 3;
        } else{
            /* For AIC we skip quant/dequant of INTRADC */
            q = 1 << 3;
            qadd=0;
        }

        /* note: block[0] is assumed to be positive */
        block[0] = (block[0] + (q >> 1)) / q;
        start_i = 1;
        last_non_zero = 0;
        qmat = s->q_intra_matrix[qscale];
        if(s->mpeg_quant || s->codec_id== CODEC_ID_MPEG1VIDEO)
            bias= 1<<(QMAT_SHIFT-1);
        length     = s->intra_ac_vlc_length;
        last_length= s->intra_ac_vlc_last_length;
    } else {
        start_i = 0;
        last_non_zero = -1;
        qmat = s->q_inter_matrix[qscale];
        length     = s->inter_ac_vlc_length;
        last_length= s->inter_ac_vlc_last_length;
    }

    threshold1= (1<<QMAT_SHIFT) - bias - 1;
    threshold2= (threshold1<<1);

    /* pass 1: plain quantization, collecting the candidate levels */
    for(i=start_i; i<64; i++) {
        const int j = scantable[i];
        const int k= i-start_i;
        int level = block[j];
        level = level * qmat[j];

        /* single unsigned compare for |level| > threshold1 */
        if(((unsigned)(level+threshold1))>threshold2){
            if(level>0){
                level= (bias + level)>>QMAT_SHIFT;
                coeff[0][k]= level;
                coeff[1][k]= level-1;
            }else{
                level= (bias - level)>>QMAT_SHIFT;
                coeff[0][k]= -level;
                coeff[1][k]= -level+1;
            }
            /* a magnitude of 1 has no non-zero "one step smaller" candidate */
            coeff_count[k]= FFMIN(level, 2);
            max |=level;
            last_non_zero = i;
        }else{
            /* rounds to zero: the only non-zero candidate is +-1 with the
               sign of the coefficient (explicit test avoids shifting a
               negative value) */
            coeff[0][k]= level < 0 ? -1 : 1;
            coeff_count[k]= 1;
        }
    }

    *overflow= s->max_qcoeff < max; //overflow might have happened

    if(last_non_zero < start_i){
        memset(block + start_i, 0, (64-start_i)*sizeof(DCTELEM));
        return last_non_zero;
    }

    lambda= (qscale*qscale*64*105 + 64)>>7; //FIXME finetune

    /* entry 0 stands for "nothing coded yet"; give its run/level a defined
       value because the final selection loop may copy them */
    score_tab[0]= 0;
    run_tab[0]= 0;
    level_tab[0]= 0;

    /* pass 2: dynamic programming over scan positions */
    for(i=0; i<=last_non_zero - start_i; i++){
        int level_index, run, j;
        const int scan_pos= scantable[i + start_i];
        const int perm_pos= s->dsp.idct_permutation[scan_pos];
        const int dct_coeff= block[scan_pos];
        const int zero_distortion= dct_coeff*dct_coeff;
        int best_score=256*256*256*120;

        last_score += zero_distortion;
        for(level_index=0; level_index < coeff_count[i]; level_index++){
            int distortion;
            int level= coeff[level_index][i];
            int unquant_coeff;

            assert(level);

            /* reconstruct the candidate as the dequantizer would */
            if(s->out_format == FMT_H263){
                if(level>0){
                    unquant_coeff= level*qmul + qadd;
                }else{
                    unquant_coeff= level*qmul - qadd;
                }
            }else{ //MPEG1
                if(s->mb_intra){
                    if (level < 0) {
                        unquant_coeff = (int)((-level) * qscale * s->intra_matrix[perm_pos]) >> 3;
                        unquant_coeff = -((unquant_coeff - 1) | 1);
                    } else {
                        unquant_coeff = (int)(  level  * qscale * s->intra_matrix[perm_pos]) >> 3;
                        unquant_coeff =   (unquant_coeff - 1) | 1;
                    }
                }else{
                    if (level < 0) {
                        unquant_coeff = ((((-level) << 1) + 1) * qscale * ((int) s->inter_matrix[perm_pos])) >> 4;
                        unquant_coeff = -((unquant_coeff - 1) | 1);
                    } else {
                        unquant_coeff = (((  level  << 1) + 1) * qscale * ((int) s->inter_matrix[perm_pos])) >> 4;
                        unquant_coeff =   (unquant_coeff - 1) | 1;
                    }
                }
                /* same scale as dct_coeff; multiply instead of <<3 because
                   the value may be negative */
                unquant_coeff *= 8;
            }

            distortion= (unquant_coeff - dct_coeff) * (unquant_coeff - dct_coeff);
            level+=64;
            if((level&(~127)) == 0){
                /* level is inside the range covered by the length tables */
                for(run=0; run<=i - left_limit; run++){
                    int score= distortion + length[UNI_AC_ENC_INDEX(run, level)]*lambda;
                    score += score_tab[i-run];

                    if(score < best_score){
                        best_score= 
                        score_tab[i+1]= score;
                        run_tab[i+1]= run;
                        level_tab[i+1]= level-64;
                    }
                }

                if(s->out_format == FMT_H263){
                    /* H.263 style formats use a separate table for the last
                       coefficient, so track the best "last" choice here */
                    for(run=0; run<=i - left_limit; run++){
                        int score= distortion + last_length[UNI_AC_ENC_INDEX(run, level)]*lambda;
                        score += score_tab[i-run];
                        if(score < last_score){
                            last_score= score;
                            last_run= run;
                            last_level= level-64;
                            last_i= i+1;
                        }
                    }
                }
            }else{
                /* outside the table range: charge the escape length */
                distortion += esc_length*lambda;
                for(run=0; run<=i - left_limit; run++){
                    int score= distortion + score_tab[i-run];

                    if(score < best_score){
                        best_score= 
                        score_tab[i+1]= score;
                        run_tab[i+1]= run;
                        level_tab[i+1]= level-64;
                    }
                }

                if(s->out_format == FMT_H263){
                    for(run=0; run<=i - left_limit; run++){
                        int score= distortion + score_tab[i-run];
                        if(score < last_score){
                            last_score= score;
                            last_run= run;
                            last_level= level-64;
                            last_i= i+1;
                        }
                    }
                }
            }
        }

        /* every path that ends at or before i now also pays for coding
           coefficient i as zero */
        for(j=left_limit; j<=i; j++){
            score_tab[j] += zero_distortion;
        }
        score_limit+= zero_distortion;
        if(score_tab[i+1] < score_limit)
            score_limit= score_tab[i+1];

        //Note: there is a vlc code in mpeg4 which is 1 bit shorter than another one with a shorter run and the same level
        /* hence the lambda slack before a start position is dropped */
        while(score_tab[ left_limit ] > score_limit + lambda) left_limit++;
    }

        //FIXME add some cbp penalty

    if(s->out_format != FMT_H263){
        /* no separate "last" table: pick the best end position afterwards */
        last_score= 256*256*256*120;
        for(i= left_limit; i<=last_non_zero - start_i + 1; i++){
            int score= score_tab[i];
            if(i) score += lambda*2; //FIXME exacter?

            if(score < last_score){
                last_score= score;
                last_i= i;
                last_level= level_tab[i];
                last_run= run_tab[i];
            }
        }
    }

    last_non_zero= last_i - 1 + start_i;
    memset(block + start_i, 0, (64-start_i)*sizeof(DCTELEM));

    if(last_non_zero < start_i)
        return last_non_zero;

    /* walk the chosen path backwards and store the levels */
    i= last_i;
    assert(last_level);
//FIXME use permutated scantable
    block[ s->dsp.idct_permutation[ scantable[last_non_zero] ] ]= last_level;
    i -= last_run + 1;

    for(;i>0 ; i -= run_tab[i] + 1){
        const int j= s->dsp.idct_permutation[ scantable[i - 1 + start_i] ];

        block[j]= level_tab[i];
        assert(block[j]);
    }

    return last_non_zero;
}

M
Michael Niedermayer 已提交
3657
static int dct_quantize_c(MpegEncContext *s, 
F
Fabrice Bellard 已提交
3658
                        DCTELEM *block, int n,
3659
                        int qscale, int *overflow)
F
Fabrice Bellard 已提交
3660 3661 3662
{
    int i, j, level, last_non_zero, q;
    const int *qmat;
3663
    const uint8_t *scantable= s->intra_scantable.scantable;
3664 3665 3666
    int bias;
    int max=0;
    unsigned int threshold1, threshold2;
3667

3668
    s->dsp.fdct (block);
F
Fabrice Bellard 已提交
3669 3670

    if (s->mb_intra) {
3671 3672 3673 3674 3675 3676 3677 3678 3679 3680
        if (!s->h263_aic) {
            if (n < 4)
                q = s->y_dc_scale;
            else
                q = s->c_dc_scale;
            q = q << 3;
        } else
            /* For AIC we skip quant/dequant of INTRADC */
            q = 1 << 3;
            
F
Fabrice Bellard 已提交
3681 3682 3683 3684
        /* note: block[0] is assumed to be positive */
        block[0] = (block[0] + (q >> 1)) / q;
        i = 1;
        last_non_zero = 0;
3685
        qmat = s->q_intra_matrix[qscale];
M
Michael Niedermayer 已提交
3686
        bias= s->intra_quant_bias<<(QMAT_SHIFT - QUANT_BIAS_SHIFT);
F
Fabrice Bellard 已提交
3687 3688 3689
    } else {
        i = 0;
        last_non_zero = -1;
3690
        qmat = s->q_inter_matrix[qscale];
M
Michael Niedermayer 已提交
3691
        bias= s->inter_quant_bias<<(QMAT_SHIFT - QUANT_BIAS_SHIFT);
F
Fabrice Bellard 已提交
3692
    }
M
Michael Niedermayer 已提交
3693 3694
    threshold1= (1<<QMAT_SHIFT) - bias - 1;
    threshold2= (threshold1<<1);
F
Fabrice Bellard 已提交
3695 3696

    for(;i<64;i++) {
M
Michael Niedermayer 已提交
3697
        j = scantable[i];
F
Fabrice Bellard 已提交
3698 3699 3700
        level = block[j];
        level = level * qmat[j];

3701 3702 3703 3704
//        if(   bias+level >= (1<<(QMAT_SHIFT - 3))
//           || bias-level >= (1<<(QMAT_SHIFT - 3))){
        if(((unsigned)(level+threshold1))>threshold2){
            if(level>0){
M
Michael Niedermayer 已提交
3705
                level= (bias + level)>>QMAT_SHIFT;
3706 3707
                block[j]= level;
            }else{
M
Michael Niedermayer 已提交
3708
                level= (bias - level)>>QMAT_SHIFT;
3709 3710 3711
                block[j]= -level;
            }
            max |=level;
F
Fabrice Bellard 已提交
3712
            last_non_zero = i;
3713 3714
        }else{
            block[j]=0;
F
Fabrice Bellard 已提交
3715 3716
        }
    }
3717 3718
    *overflow= s->max_qcoeff < max; //overflow might have happend
    
M
Michael Niedermayer 已提交
3719
    /* we need this permutation so that we correct the IDCT, we only permute the !=0 elements */
3720 3721
    if (s->dsp.idct_permutation_type != FF_NO_IDCT_PERM)
	ff_block_permute(block, s->dsp.idct_permutation, scantable, last_non_zero);
M
Michael Niedermayer 已提交
3722

F
Fabrice Bellard 已提交
3723 3724 3725
    return last_non_zero;
}

3726 3727
#endif //CONFIG_ENCODERS

3728 3729
/**
 * Dequantize one block in place, MPEG-1 style (plain C version).
 *
 * Coefficients are visited in the order given by
 * s->intra_scantable.permutated, up to s->block_last_index[n]. Every
 * non-zero result is forced odd through (x - 1) | 1, applied to the
 * magnitude before the sign is restored.
 *
 * @param s      codec context
 * @param block  coefficients, rewritten in place
 * @param n      block number; values below 4 scale the intra DC with
 *               y_dc_scale, the others with c_dc_scale
 * @param qscale quantizer scale
 */
static void dct_unquantize_mpeg1_c(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale)
{
    const int last = s->block_last_index[n];
    const uint16_t *matrix;
    int pos, level;

    if (s->mb_intra) {
        block[0] = block[0] * ((n < 4) ? s->y_dc_scale : s->c_dc_scale);

        /* XXX: only mpeg1 */
        matrix = s->intra_matrix;
        for (pos = 1; pos <= last; pos++) {
            const int idx  = s->intra_scantable.permutated[pos];
            const int coef = block[idx];
            int mag;

            if (!coef)
                continue;

            /* work on the magnitude, restore the sign afterwards */
            mag = (coef < 0) ? -coef : coef;
            mag = (int)(mag * qscale * matrix[idx]) >> 3;
            mag = (mag - 1) | 1;
            level = (coef < 0) ? -mag : mag;
#ifdef PARANOID
            if (level < -2048 || level > 2047)
                fprintf(stderr, "unquant error %d %d\n", pos, level);
#endif
            block[idx] = level;
        }
    } else {
        matrix = s->inter_matrix;
        for (pos = 0; pos <= last; pos++) {
            const int idx  = s->intra_scantable.permutated[pos];
            const int coef = block[idx];
            int mag;

            if (!coef)
                continue;

            mag = (coef < 0) ? -coef : coef;
            mag = (((mag << 1) + 1) * qscale *
                   ((int) (matrix[idx]))) >> 4;
            mag = (mag - 1) | 1;
            level = (coef < 0) ? -mag : mag;
#ifdef PARANOID
            if (level < -2048 || level > 2047)
                fprintf(stderr, "unquant error %d %d\n", pos, level);
#endif
            block[idx] = level;
        }
    }
}
3790

3791 3792 3793 3794
/**
 * Dequantize one block in place, MPEG-2 style (plain C version).
 *
 * Coefficients are visited in the order given by
 * s->intra_scantable.permutated. With s->alternate_scan set all 64
 * positions are processed, otherwise only those up to
 * s->block_last_index[n]. For non-intra blocks the parity of the
 * dequantized values is tracked and the lowest bit of block[63] is toggled
 * accordingly.
 *
 * @param s      codec context
 * @param block  coefficients, rewritten in place
 * @param n      block number; values below 4 scale the intra DC with
 *               y_dc_scale, the others with c_dc_scale
 * @param qscale quantizer scale
 */
static void dct_unquantize_mpeg2_c(MpegEncContext *s,
                                   DCTELEM *block, int n, int qscale)
{
    const int last = s->alternate_scan ? 63 : s->block_last_index[n];
    const uint16_t *matrix;
    int pos, level;

    if (s->mb_intra) {
        block[0] = block[0] * ((n < 4) ? s->y_dc_scale : s->c_dc_scale);

        matrix = s->intra_matrix;
        for (pos = 1; pos <= last; pos++) {
            const int idx  = s->intra_scantable.permutated[pos];
            const int coef = block[idx];
            int mag;

            if (!coef)
                continue;

            /* work on the magnitude, restore the sign afterwards */
            mag = (coef < 0) ? -coef : coef;
            mag = (int)(mag * qscale * matrix[idx]) >> 3;
            level = (coef < 0) ? -mag : mag;
#ifdef PARANOID
            if (level < -2048 || level > 2047)
                fprintf(stderr, "unquant error %d %d\n", pos, level);
#endif
            block[idx] = level;
        }
    } else {
        /* starts at -1 so that (parity & 1) is set when the sum of the
         * dequantized values is even */
        int parity = -1;

        matrix = s->inter_matrix;
        for (pos = 0; pos <= last; pos++) {
            const int idx  = s->intra_scantable.permutated[pos];
            const int coef = block[idx];
            int mag;

            if (!coef)
                continue;

            mag = (coef < 0) ? -coef : coef;
            mag = (((mag << 1) + 1) * qscale *
                   ((int) (matrix[idx]))) >> 4;
            level = (coef < 0) ? -mag : mag;
#ifdef PARANOID
            if (level < -2048 || level > 2047)
                fprintf(stderr, "unquant error %d %d\n", pos, level);
#endif
            block[idx] = level;
            parity += level;
        }
        block[63] ^= parity & 1;
    }
}


3854 3855 3856 3857
/**
 * Dequantize one block in place, H.263 style (plain C version).
 *
 * Every non-zero coefficient becomes level * qmul +/- qadd, with
 * qmul = 2 * qscale and qadd = (qscale - 1) | 1; qadd is added for positive
 * and subtracted for negative levels. Coefficients are walked in plain
 * index order, not through a scan table.
 *
 * @param s      codec context; s->block_last_index[n] must be >= 0
 * @param block  coefficients, rewritten in place
 * @param n      block number; values below 4 scale the intra DC with
 *               y_dc_scale, the others with c_dc_scale
 * @param qscale quantizer scale
 */
static void dct_unquantize_h263_c(MpegEncContext *s,
                                  DCTELEM *block, int n, int qscale)
{
    const int qmul = qscale << 1;
    int qadd = (qscale - 1) | 1;
    int pos, last;

    assert(s->block_last_index[n]>=0);

    if (s->mb_intra) {
        if (s->h263_aic) {
            /* with AIC the DC is left unscaled and no offset is added */
            qadd = 0;
        } else {
            block[0] = block[0] * ((n < 4) ? s->y_dc_scale : s->c_dc_scale);
        }
        pos  = 1;
        last = 63; /* does not always use the zigzag table */
    } else {
        pos  = 0;
        last = s->inter_scantable.raster_end[ s->block_last_index[n] ];
    }

    for (; pos <= last; pos++) {
        int level = block[pos];

        if (!level)
            continue;

        level = (level < 0) ? level * qmul - qadd
                            : level * qmul + qadd;
#ifdef PARANOID
        if (level < -2048 || level > 2047)
            fprintf(stderr, "unquant error %d %d\n", pos, level);
#endif
        block[pos] = level;
    }
}
F
Fabrice Bellard 已提交
3896

3897

M
Michael Niedermayer 已提交
3898 3899 3900 3901 3902 3903
/**
 * Map a picture type constant to a one-letter tag.
 *
 * @param pict_type one of I_TYPE, P_TYPE, B_TYPE or S_TYPE
 * @return 'I', 'P', 'B' or 'S' for the matching type, '?' for anything else
 */
char ff_get_pict_type_char(int pict_type){
    if (pict_type == I_TYPE)
        return 'I';
    if (pict_type == P_TYPE)
        return 'P';
    if (pict_type == B_TYPE)
        return 'B';
    if (pict_type == S_TYPE)
        return 'S';

    return '?';
}

3908 3909 3910 3911 3912 3913 3914 3915 3916 3917 3918 3919 3920 3921 3922 3923 3924 3925 3926
static const AVOption mpeg4_options[] =
{
    AVOPTION_CODEC_INT("bitrate", "desired video bitrate", bit_rate, 4, 240000000, 800000),
    AVOPTION_CODEC_FLAG("vhq", "very high quality", flags, CODEC_FLAG_HQ, 0),
    AVOPTION_CODEC_INT("ratetol", "number of bits the bitstream is allowed to diverge from the reference"
		       "the reference can be CBR (for CBR pass1) or VBR (for pass2)",
		       bit_rate_tolerance, 4, 240000000, 8000),
    AVOPTION_CODEC_INT("qmin", "minimum quantizer", qmin, 1, 31, 2),
    AVOPTION_CODEC_INT("qmax", "maximum quantizer", qmax, 1, 31, 31),
    AVOPTION_CODEC_STRING("rc_eq", "rate control equation",
			  rc_eq, "tex^qComp,option1,options2", 0),
    AVOPTION_CODEC_INT("rc_minrate", "rate control minimum bitrate",
		       rc_min_rate, 4, 24000000, 0),
    AVOPTION_CODEC_INT("rc_maxrate", "rate control maximum bitrate",
		       rc_max_rate, 4, 24000000, 0),
    AVOPTION_CODEC_FLAG("psnr", "calculate PSNR of compressed frames",
		        flags, CODEC_FLAG_PSNR, 0),
    AVOPTION_CODEC_RCOVERRIDE("rc_override", "ratecontrol override (=startframe,endframe,qscale,quality_factor)",
			      rc_override),
3927
    AVOPTION_SUB(avoptions_common),
3928 3929 3930
    AVOPTION_END()
};

3931 3932
#ifdef CONFIG_ENCODERS

/*
 * Encoder definitions. Every entry is a positional AVCodec initializer
 * holding, in order: the codec name string, CODEC_TYPE_VIDEO, the
 * CODEC_ID_* value, sizeof(MpegEncContext), and the three shared entry
 * points MPV_encode_init, MPV_encode_picture and MPV_encode_end.
 */

AVCodec mpeg1video_encoder = {
    "mpeg1video", CODEC_TYPE_VIDEO, CODEC_ID_MPEG1VIDEO,
    sizeof(MpegEncContext),
    MPV_encode_init, MPV_encode_picture, MPV_encode_end,
};

/* The encoders in this section are only built when CONFIG_RISKY is defined. */
#ifdef CONFIG_RISKY

AVCodec h263_encoder = {
    "h263", CODEC_TYPE_VIDEO, CODEC_ID_H263,
    sizeof(MpegEncContext),
    MPV_encode_init, MPV_encode_picture, MPV_encode_end,
};

AVCodec h263p_encoder = {
    "h263p", CODEC_TYPE_VIDEO, CODEC_ID_H263P,
    sizeof(MpegEncContext),
    MPV_encode_init, MPV_encode_picture, MPV_encode_end,
};

AVCodec rv10_encoder = {
    "rv10", CODEC_TYPE_VIDEO, CODEC_ID_RV10,
    sizeof(MpegEncContext),
    MPV_encode_init, MPV_encode_picture, MPV_encode_end,
};

/* the only entry that also sets an option table */
AVCodec mpeg4_encoder = {
    "mpeg4", CODEC_TYPE_VIDEO, CODEC_ID_MPEG4,
    sizeof(MpegEncContext),
    MPV_encode_init, MPV_encode_picture, MPV_encode_end,
    .options = mpeg4_options,
};

AVCodec msmpeg4v1_encoder = {
    "msmpeg4v1", CODEC_TYPE_VIDEO, CODEC_ID_MSMPEG4V1,
    sizeof(MpegEncContext),
    MPV_encode_init, MPV_encode_picture, MPV_encode_end,
};

AVCodec msmpeg4v2_encoder = {
    "msmpeg4v2", CODEC_TYPE_VIDEO, CODEC_ID_MSMPEG4V2,
    sizeof(MpegEncContext),
    MPV_encode_init, MPV_encode_picture, MPV_encode_end,
};

/* note: the name string is "msmpeg4", without a version suffix */
AVCodec msmpeg4v3_encoder = {
    "msmpeg4", CODEC_TYPE_VIDEO, CODEC_ID_MSMPEG4V3,
    sizeof(MpegEncContext),
    MPV_encode_init, MPV_encode_picture, MPV_encode_end,
};

AVCodec wmv1_encoder = {
    "wmv1", CODEC_TYPE_VIDEO, CODEC_ID_WMV1,
    sizeof(MpegEncContext),
    MPV_encode_init, MPV_encode_picture, MPV_encode_end,
};

#endif /* CONFIG_RISKY */

AVCodec mjpeg_encoder = {
    "mjpeg", CODEC_TYPE_VIDEO, CODEC_ID_MJPEG,
    sizeof(MpegEncContext),
    MPV_encode_init, MPV_encode_picture, MPV_encode_end,
};

#endif //CONFIG_ENCODERS