1/* 2 * The simplest mpeg encoder (well, it was the simplest!) 3 * Copyright (c) 2000,2001 Fabrice Bellard 4 * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at> 5 * 6 * 4MV & hq & B-frame encoding stuff by Michael Niedermayer <michaelni@gmx.at> 7 * 8 * This file is part of FFmpeg. 9 * 10 * FFmpeg is free software; you can redistribute it and/or 11 * modify it under the terms of the GNU Lesser General Public 12 * License as published by the Free Software Foundation; either 13 * version 2.1 of the License, or (at your option) any later version. 14 * 15 * FFmpeg is distributed in the hope that it will be useful, 16 * but WITHOUT ANY WARRANTY; without even the implied warranty of 17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 18 * Lesser General Public License for more details. 19 * 20 * You should have received a copy of the GNU Lesser General Public 21 * License along with FFmpeg; if not, write to the Free Software 22 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 23 */ 24 25/** 26 * @file 27 * The simplest mpeg encoder (well, it was the simplest!). 28 */ 29 30#ifndef AVCODEC_MPEGVIDEO_COMMON_H 31#define AVCODEC_MPEGVIDEO_COMMON_H 32 33#include <string.h> 34#include "avcodec.h" 35#include "dsputil.h" 36#include "mpegvideo.h" 37#include "mjpegenc.h" 38#include "msmpeg4.h" 39#include "faandct.h" 40#include <limits.h> 41 42int dct_quantize_c(MpegEncContext *s, DCTELEM *block, int n, int qscale, int *overflow); 43int dct_quantize_trellis_c(MpegEncContext *s, DCTELEM *block, int n, int qscale, int *overflow); 44void denoise_dct_c(MpegEncContext *s, DCTELEM *block); 45 46/** 47 * allocates a Picture 48 * The pixels are allocated/set by calling get_buffer() if shared=0 49 */ 50int alloc_picture(MpegEncContext *s, Picture *pic, int shared); 51 52/** 53 * sets the given MpegEncContext to common defaults (same for encoding and decoding). 54 * the changed fields will not depend upon the prior state of the MpegEncContext. 55 */ 56void MPV_common_defaults(MpegEncContext *s); 57 58static inline void gmc1_motion(MpegEncContext *s, 59 uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr, 60 uint8_t **ref_picture) 61{ 62 uint8_t *ptr; 63 int offset, src_x, src_y, linesize, uvlinesize; 64 int motion_x, motion_y; 65 int emu=0; 66 67 motion_x= s->sprite_offset[0][0]; 68 motion_y= s->sprite_offset[0][1]; 69 src_x = s->mb_x * 16 + (motion_x >> (s->sprite_warping_accuracy+1)); 70 src_y = s->mb_y * 16 + (motion_y >> (s->sprite_warping_accuracy+1)); 71 motion_x<<=(3-s->sprite_warping_accuracy); 72 motion_y<<=(3-s->sprite_warping_accuracy); 73 src_x = av_clip(src_x, -16, s->width); 74 if (src_x == s->width) 75 motion_x =0; 76 src_y = av_clip(src_y, -16, s->height); 77 if (src_y == s->height) 78 motion_y =0; 79 80 linesize = s->linesize; 81 uvlinesize = s->uvlinesize; 82 83 ptr = ref_picture[0] + (src_y * linesize) + src_x; 84 85 if(s->flags&CODEC_FLAG_EMU_EDGE){ 86 if( (unsigned)src_x >= s->h_edge_pos - 17 87 || (unsigned)src_y >= s->v_edge_pos - 17){ 88 ff_emulated_edge_mc(s->edge_emu_buffer, ptr, linesize, 17, 17, src_x, src_y, s->h_edge_pos, s->v_edge_pos); 89 ptr= s->edge_emu_buffer; 90 } 91 } 92 93 if((motion_x|motion_y)&7){ 94 s->dsp.gmc1(dest_y , ptr , linesize, 16, motion_x&15, motion_y&15, 128 - s->no_rounding); 95 s->dsp.gmc1(dest_y+8, ptr+8, linesize, 16, motion_x&15, motion_y&15, 128 - s->no_rounding); 96 }else{ 97 int dxy; 98 99 dxy= ((motion_x>>3)&1) | ((motion_y>>2)&2); 100 if (s->no_rounding){ 101 s->dsp.put_no_rnd_pixels_tab[0][dxy](dest_y, ptr, linesize, 16); 102 }else{ 103 s->dsp.put_pixels_tab [0][dxy](dest_y, ptr, linesize, 16); 104 } 105 } 106 107 if(CONFIG_GRAY && s->flags&CODEC_FLAG_GRAY) return; 108 109 motion_x= s->sprite_offset[1][0]; 110 motion_y= s->sprite_offset[1][1]; 111 src_x = s->mb_x * 8 + (motion_x >> (s->sprite_warping_accuracy+1)); 112 src_y = s->mb_y * 8 + (motion_y >> (s->sprite_warping_accuracy+1)); 113 motion_x<<=(3-s->sprite_warping_accuracy); 114 motion_y<<=(3-s->sprite_warping_accuracy); 115 src_x = av_clip(src_x, -8, s->width>>1); 116 if (src_x == s->width>>1) 117 motion_x =0; 118 src_y = av_clip(src_y, -8, s->height>>1); 119 if (src_y == s->height>>1) 120 motion_y =0; 121 122 offset = (src_y * uvlinesize) + src_x; 123 ptr = ref_picture[1] + offset; 124 if(s->flags&CODEC_FLAG_EMU_EDGE){ 125 if( (unsigned)src_x >= (s->h_edge_pos>>1) - 9 126 || (unsigned)src_y >= (s->v_edge_pos>>1) - 9){ 127 ff_emulated_edge_mc(s->edge_emu_buffer, ptr, uvlinesize, 9, 9, src_x, src_y, s->h_edge_pos>>1, s->v_edge_pos>>1); 128 ptr= s->edge_emu_buffer; 129 emu=1; 130 } 131 } 132 s->dsp.gmc1(dest_cb, ptr, uvlinesize, 8, motion_x&15, motion_y&15, 128 - s->no_rounding); 133 134 ptr = ref_picture[2] + offset; 135 if(emu){ 136 ff_emulated_edge_mc(s->edge_emu_buffer, ptr, uvlinesize, 9, 9, src_x, src_y, s->h_edge_pos>>1, s->v_edge_pos>>1); 137 ptr= s->edge_emu_buffer; 138 } 139 s->dsp.gmc1(dest_cr, ptr, uvlinesize, 8, motion_x&15, motion_y&15, 128 - s->no_rounding); 140 141 return; 142} 143 144static inline void gmc_motion(MpegEncContext *s, 145 uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr, 146 uint8_t **ref_picture) 147{ 148 uint8_t *ptr; 149 int linesize, uvlinesize; 150 const int a= s->sprite_warping_accuracy; 151 int ox, oy; 152 153 linesize = s->linesize; 154 uvlinesize = s->uvlinesize; 155 156 ptr = ref_picture[0]; 157 158 ox= s->sprite_offset[0][0] + s->sprite_delta[0][0]*s->mb_x*16 + s->sprite_delta[0][1]*s->mb_y*16; 159 oy= s->sprite_offset[0][1] + s->sprite_delta[1][0]*s->mb_x*16 + s->sprite_delta[1][1]*s->mb_y*16; 160 161 s->dsp.gmc(dest_y, ptr, linesize, 16, 162 ox, 163 oy, 164 s->sprite_delta[0][0], s->sprite_delta[0][1], 165 s->sprite_delta[1][0], s->sprite_delta[1][1], 166 a+1, (1<<(2*a+1)) - s->no_rounding, 167 s->h_edge_pos, s->v_edge_pos); 168 s->dsp.gmc(dest_y+8, ptr, linesize, 16, 169 ox + s->sprite_delta[0][0]*8, 170 oy + s->sprite_delta[1][0]*8, 171 s->sprite_delta[0][0], s->sprite_delta[0][1], 172 s->sprite_delta[1][0], s->sprite_delta[1][1], 173 a+1, (1<<(2*a+1)) - s->no_rounding, 174 s->h_edge_pos, s->v_edge_pos); 175 176 if(CONFIG_GRAY && s->flags&CODEC_FLAG_GRAY) return; 177 178 ox= s->sprite_offset[1][0] + s->sprite_delta[0][0]*s->mb_x*8 + s->sprite_delta[0][1]*s->mb_y*8; 179 oy= s->sprite_offset[1][1] + s->sprite_delta[1][0]*s->mb_x*8 + s->sprite_delta[1][1]*s->mb_y*8; 180 181 ptr = ref_picture[1]; 182 s->dsp.gmc(dest_cb, ptr, uvlinesize, 8, 183 ox, 184 oy, 185 s->sprite_delta[0][0], s->sprite_delta[0][1], 186 s->sprite_delta[1][0], s->sprite_delta[1][1], 187 a+1, (1<<(2*a+1)) - s->no_rounding, 188 s->h_edge_pos>>1, s->v_edge_pos>>1); 189 190 ptr = ref_picture[2]; 191 s->dsp.gmc(dest_cr, ptr, uvlinesize, 8, 192 ox, 193 oy, 194 s->sprite_delta[0][0], s->sprite_delta[0][1], 195 s->sprite_delta[1][0], s->sprite_delta[1][1], 196 a+1, (1<<(2*a+1)) - s->no_rounding, 197 s->h_edge_pos>>1, s->v_edge_pos>>1); 198} 199 200static inline int hpel_motion(MpegEncContext *s, 201 uint8_t *dest, uint8_t *src, 202 int field_based, int field_select, 203 int src_x, int src_y, 204 int width, int height, int stride, 205 int h_edge_pos, int v_edge_pos, 206 int w, int h, op_pixels_func *pix_op, 207 int motion_x, int motion_y) 208{ 209 int dxy; 210 int emu=0; 211 212 dxy = ((motion_y & 1) << 1) | (motion_x & 1); 213 src_x += motion_x >> 1; 214 src_y += motion_y >> 1; 215 216 /* WARNING: do no forget half pels */ 217 src_x = av_clip(src_x, -16, width); //FIXME unneeded for emu? 218 if (src_x == width) 219 dxy &= ~1; 220 src_y = av_clip(src_y, -16, height); 221 if (src_y == height) 222 dxy &= ~2; 223 src += src_y * stride + src_x; 224 225 if(s->unrestricted_mv && (s->flags&CODEC_FLAG_EMU_EDGE)){ 226 if( (unsigned)src_x > h_edge_pos - (motion_x&1) - w 227 || (unsigned)src_y > v_edge_pos - (motion_y&1) - h){ 228 ff_emulated_edge_mc(s->edge_emu_buffer, src, s->linesize, w+1, (h+1)<<field_based, 229 src_x, src_y<<field_based, h_edge_pos, s->v_edge_pos); 230 src= s->edge_emu_buffer; 231 emu=1; 232 } 233 } 234 if(field_select) 235 src += s->linesize; 236 pix_op[dxy](dest, src, stride, h); 237 return emu; 238} 239 240static av_always_inline 241void mpeg_motion_internal(MpegEncContext *s, 242 uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr, 243 int field_based, int bottom_field, int field_select, 244 uint8_t **ref_picture, op_pixels_func (*pix_op)[4], 245 int motion_x, int motion_y, int h, int is_mpeg12, int mb_y) 246{ 247 uint8_t *ptr_y, *ptr_cb, *ptr_cr; 248 int dxy, uvdxy, mx, my, src_x, src_y, 249 uvsrc_x, uvsrc_y, v_edge_pos, uvlinesize, linesize; 250 251#if 0 252if(s->quarter_sample) 253{ 254 motion_x>>=1; 255 motion_y>>=1; 256} 257#endif 258 259 v_edge_pos = s->v_edge_pos >> field_based; 260 linesize = s->current_picture.linesize[0] << field_based; 261 uvlinesize = s->current_picture.linesize[1] << field_based; 262 263 dxy = ((motion_y & 1) << 1) | (motion_x & 1); 264 src_x = s->mb_x* 16 + (motion_x >> 1); 265 src_y =( mb_y<<(4-field_based)) + (motion_y >> 1); 266 267 if (!is_mpeg12 && s->out_format == FMT_H263) { 268 if((s->workaround_bugs & FF_BUG_HPEL_CHROMA) && field_based){ 269 mx = (motion_x>>1)|(motion_x&1); 270 my = motion_y >>1; 271 uvdxy = ((my & 1) << 1) | (mx & 1); 272 uvsrc_x = s->mb_x* 8 + (mx >> 1); 273 uvsrc_y =( mb_y<<(3-field_based))+ (my >> 1); 274 }else{ 275 uvdxy = dxy | (motion_y & 2) | ((motion_x & 2) >> 1); 276 uvsrc_x = src_x>>1; 277 uvsrc_y = src_y>>1; 278 } 279 }else if(!is_mpeg12 && s->out_format == FMT_H261){//even chroma mv's are full pel in H261 280 mx = motion_x / 4; 281 my = motion_y / 4; 282 uvdxy = 0; 283 uvsrc_x = s->mb_x*8 + mx; 284 uvsrc_y = mb_y*8 + my; 285 } else { 286 if(s->chroma_y_shift){ 287 mx = motion_x / 2; 288 my = motion_y / 2; 289 uvdxy = ((my & 1) << 1) | (mx & 1); 290 uvsrc_x = s->mb_x* 8 + (mx >> 1); 291 uvsrc_y =( mb_y<<(3-field_based))+ (my >> 1); 292 } else { 293 if(s->chroma_x_shift){ 294 //Chroma422 295 mx = motion_x / 2; 296 uvdxy = ((motion_y & 1) << 1) | (mx & 1); 297 uvsrc_x = s->mb_x* 8 + (mx >> 1); 298 uvsrc_y = src_y; 299 } else { 300 //Chroma444 301 uvdxy = dxy; 302 uvsrc_x = src_x; 303 uvsrc_y = src_y; 304 } 305 } 306 } 307 308 ptr_y = ref_picture[0] + src_y * linesize + src_x; 309 ptr_cb = ref_picture[1] + uvsrc_y * uvlinesize + uvsrc_x; 310 ptr_cr = ref_picture[2] + uvsrc_y * uvlinesize + uvsrc_x; 311 312 if( (unsigned)src_x > s->h_edge_pos - (motion_x&1) - 16 313 || (unsigned)src_y > v_edge_pos - (motion_y&1) - h){ 314 if(is_mpeg12 || s->codec_id == CODEC_ID_MPEG2VIDEO || 315 s->codec_id == CODEC_ID_MPEG1VIDEO){ 316 av_log(s->avctx,AV_LOG_DEBUG, 317 "MPEG motion vector out of boundary (%d %d)\n", src_x, src_y); 318 return; 319 } 320 ff_emulated_edge_mc(s->edge_emu_buffer, ptr_y, s->linesize, 321 17, 17+field_based, 322 src_x, src_y<<field_based, 323 s->h_edge_pos, s->v_edge_pos); 324 ptr_y = s->edge_emu_buffer; 325 if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){ 326 uint8_t *uvbuf= s->edge_emu_buffer+18*s->linesize; 327 ff_emulated_edge_mc(uvbuf , 328 ptr_cb, s->uvlinesize, 329 9, 9+field_based, 330 uvsrc_x, uvsrc_y<<field_based, 331 s->h_edge_pos>>1, s->v_edge_pos>>1); 332 ff_emulated_edge_mc(uvbuf+16, 333 ptr_cr, s->uvlinesize, 334 9, 9+field_based, 335 uvsrc_x, uvsrc_y<<field_based, 336 s->h_edge_pos>>1, s->v_edge_pos>>1); 337 ptr_cb= uvbuf; 338 ptr_cr= uvbuf+16; 339 } 340 } 341 342 if(bottom_field){ //FIXME use this for field pix too instead of the obnoxious hack which changes picture.data 343 dest_y += s->linesize; 344 dest_cb+= s->uvlinesize; 345 dest_cr+= s->uvlinesize; 346 } 347 348 if(field_select){ 349 ptr_y += s->linesize; 350 ptr_cb+= s->uvlinesize; 351 ptr_cr+= s->uvlinesize; 352 } 353 354 pix_op[0][dxy](dest_y, ptr_y, linesize, h); 355 356 if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){ 357 pix_op[s->chroma_x_shift][uvdxy] 358 (dest_cb, ptr_cb, uvlinesize, h >> s->chroma_y_shift); 359 pix_op[s->chroma_x_shift][uvdxy] 360 (dest_cr, ptr_cr, uvlinesize, h >> s->chroma_y_shift); 361 } 362 if(!is_mpeg12 && (CONFIG_H261_ENCODER || CONFIG_H261_DECODER) && 363 s->out_format == FMT_H261){ 364 ff_h261_loop_filter(s); 365 } 366} 367/* apply one mpeg motion vector to the three components */ 368static av_always_inline 369void mpeg_motion(MpegEncContext *s, 370 uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr, 371 int field_based, int bottom_field, int field_select, 372 uint8_t **ref_picture, op_pixels_func (*pix_op)[4], 373 int motion_x, int motion_y, int h, int mb_y) 374{ 375#if !CONFIG_SMALL 376 if(s->out_format == FMT_MPEG1) 377 mpeg_motion_internal(s, dest_y, dest_cb, dest_cr, field_based, 378 bottom_field, field_select, ref_picture, pix_op, 379 motion_x, motion_y, h, 1, mb_y); 380 else 381#endif 382 mpeg_motion_internal(s, dest_y, dest_cb, dest_cr, field_based, 383 bottom_field, field_select, ref_picture, pix_op, 384 motion_x, motion_y, h, 0, mb_y); 385} 386 387//FIXME move to dsputil, avg variant, 16x16 version 388static inline void put_obmc(uint8_t *dst, uint8_t *src[5], int stride){ 389 int x; 390 uint8_t * const top = src[1]; 391 uint8_t * const left = src[2]; 392 uint8_t * const mid = src[0]; 393 uint8_t * const right = src[3]; 394 uint8_t * const bottom= src[4]; 395#define OBMC_FILTER(x, t, l, m, r, b)\ 396 dst[x]= (t*top[x] + l*left[x] + m*mid[x] + r*right[x] + b*bottom[x] + 4)>>3 397#define OBMC_FILTER4(x, t, l, m, r, b)\ 398 OBMC_FILTER(x , t, l, m, r, b);\ 399 OBMC_FILTER(x+1 , t, l, m, r, b);\ 400 OBMC_FILTER(x +stride, t, l, m, r, b);\ 401 OBMC_FILTER(x+1+stride, t, l, m, r, b); 402 403 x=0; 404 OBMC_FILTER (x , 2, 2, 4, 0, 0); 405 OBMC_FILTER (x+1, 2, 1, 5, 0, 0); 406 OBMC_FILTER4(x+2, 2, 1, 5, 0, 0); 407 OBMC_FILTER4(x+4, 2, 0, 5, 1, 0); 408 OBMC_FILTER (x+6, 2, 0, 5, 1, 0); 409 OBMC_FILTER (x+7, 2, 0, 4, 2, 0); 410 x+= stride; 411 OBMC_FILTER (x , 1, 2, 5, 0, 0); 412 OBMC_FILTER (x+1, 1, 2, 5, 0, 0); 413 OBMC_FILTER (x+6, 1, 0, 5, 2, 0); 414 OBMC_FILTER (x+7, 1, 0, 5, 2, 0); 415 x+= stride; 416 OBMC_FILTER4(x , 1, 2, 5, 0, 0); 417 OBMC_FILTER4(x+2, 1, 1, 6, 0, 0); 418 OBMC_FILTER4(x+4, 1, 0, 6, 1, 0); 419 OBMC_FILTER4(x+6, 1, 0, 5, 2, 0); 420 x+= 2*stride; 421 OBMC_FILTER4(x , 0, 2, 5, 0, 1); 422 OBMC_FILTER4(x+2, 0, 1, 6, 0, 1); 423 OBMC_FILTER4(x+4, 0, 0, 6, 1, 1); 424 OBMC_FILTER4(x+6, 0, 0, 5, 2, 1); 425 x+= 2*stride; 426 OBMC_FILTER (x , 0, 2, 5, 0, 1); 427 OBMC_FILTER (x+1, 0, 2, 5, 0, 1); 428 OBMC_FILTER4(x+2, 0, 1, 5, 0, 2); 429 OBMC_FILTER4(x+4, 0, 0, 5, 1, 2); 430 OBMC_FILTER (x+6, 0, 0, 5, 2, 1); 431 OBMC_FILTER (x+7, 0, 0, 5, 2, 1); 432 x+= stride; 433 OBMC_FILTER (x , 0, 2, 4, 0, 2); 434 OBMC_FILTER (x+1, 0, 1, 5, 0, 2); 435 OBMC_FILTER (x+6, 0, 0, 5, 1, 2); 436 OBMC_FILTER (x+7, 0, 0, 4, 2, 2); 437} 438 439/* obmc for 1 8x8 luma block */ 440static inline void obmc_motion(MpegEncContext *s, 441 uint8_t *dest, uint8_t *src, 442 int src_x, int src_y, 443 op_pixels_func *pix_op, 444 int16_t mv[5][2]/* mid top left right bottom*/) 445#define MID 0 446{ 447 int i; 448 uint8_t *ptr[5]; 449 450 assert(s->quarter_sample==0); 451 452 for(i=0; i<5; i++){ 453 if(i && mv[i][0]==mv[MID][0] && mv[i][1]==mv[MID][1]){ 454 ptr[i]= ptr[MID]; 455 }else{ 456 ptr[i]= s->obmc_scratchpad + 8*(i&1) + s->linesize*8*(i>>1); 457 hpel_motion(s, ptr[i], src, 0, 0, 458 src_x, src_y, 459 s->width, s->height, s->linesize, 460 s->h_edge_pos, s->v_edge_pos, 461 8, 8, pix_op, 462 mv[i][0], mv[i][1]); 463 } 464 } 465 466 put_obmc(dest, ptr, s->linesize); 467} 468 469static inline void qpel_motion(MpegEncContext *s, 470 uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr, 471 int field_based, int bottom_field, int field_select, 472 uint8_t **ref_picture, op_pixels_func (*pix_op)[4], 473 qpel_mc_func (*qpix_op)[16], 474 int motion_x, int motion_y, int h) 475{ 476 uint8_t *ptr_y, *ptr_cb, *ptr_cr; 477 int dxy, uvdxy, mx, my, src_x, src_y, uvsrc_x, uvsrc_y, v_edge_pos, linesize, uvlinesize; 478 479 dxy = ((motion_y & 3) << 2) | (motion_x & 3); 480 src_x = s->mb_x * 16 + (motion_x >> 2); 481 src_y = s->mb_y * (16 >> field_based) + (motion_y >> 2); 482 483 v_edge_pos = s->v_edge_pos >> field_based; 484 linesize = s->linesize << field_based; 485 uvlinesize = s->uvlinesize << field_based; 486 487 if(field_based){ 488 mx= motion_x/2; 489 my= motion_y>>1; 490 }else if(s->workaround_bugs&FF_BUG_QPEL_CHROMA2){ 491 static const int rtab[8]= {0,0,1,1,0,0,0,1}; 492 mx= (motion_x>>1) + rtab[motion_x&7]; 493 my= (motion_y>>1) + rtab[motion_y&7]; 494 }else if(s->workaround_bugs&FF_BUG_QPEL_CHROMA){ 495 mx= (motion_x>>1)|(motion_x&1); 496 my= (motion_y>>1)|(motion_y&1); 497 }else{ 498 mx= motion_x/2; 499 my= motion_y/2; 500 } 501 mx= (mx>>1)|(mx&1); 502 my= (my>>1)|(my&1); 503 504 uvdxy= (mx&1) | ((my&1)<<1); 505 mx>>=1; 506 my>>=1; 507 508 uvsrc_x = s->mb_x * 8 + mx; 509 uvsrc_y = s->mb_y * (8 >> field_based) + my; 510 511 ptr_y = ref_picture[0] + src_y * linesize + src_x; 512 ptr_cb = ref_picture[1] + uvsrc_y * uvlinesize + uvsrc_x; 513 ptr_cr = ref_picture[2] + uvsrc_y * uvlinesize + uvsrc_x; 514 515 if( (unsigned)src_x > s->h_edge_pos - (motion_x&3) - 16 516 || (unsigned)src_y > v_edge_pos - (motion_y&3) - h ){ 517 ff_emulated_edge_mc(s->edge_emu_buffer, ptr_y, s->linesize, 518 17, 17+field_based, src_x, src_y<<field_based, 519 s->h_edge_pos, s->v_edge_pos); 520 ptr_y= s->edge_emu_buffer; 521 if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){ 522 uint8_t *uvbuf= s->edge_emu_buffer + 18*s->linesize; 523 ff_emulated_edge_mc(uvbuf, ptr_cb, s->uvlinesize, 524 9, 9 + field_based, 525 uvsrc_x, uvsrc_y<<field_based, 526 s->h_edge_pos>>1, s->v_edge_pos>>1); 527 ff_emulated_edge_mc(uvbuf + 16, ptr_cr, s->uvlinesize, 528 9, 9 + field_based, 529 uvsrc_x, uvsrc_y<<field_based, 530 s->h_edge_pos>>1, s->v_edge_pos>>1); 531 ptr_cb= uvbuf; 532 ptr_cr= uvbuf + 16; 533 } 534 } 535 536 if(!field_based) 537 qpix_op[0][dxy](dest_y, ptr_y, linesize); 538 else{ 539 if(bottom_field){ 540 dest_y += s->linesize; 541 dest_cb+= s->uvlinesize; 542 dest_cr+= s->uvlinesize; 543 } 544 545 if(field_select){ 546 ptr_y += s->linesize; 547 ptr_cb += s->uvlinesize; 548 ptr_cr += s->uvlinesize; 549 } 550 //damn interlaced mode 551 //FIXME boundary mirroring is not exactly correct here 552 qpix_op[1][dxy](dest_y , ptr_y , linesize); 553 qpix_op[1][dxy](dest_y+8, ptr_y+8, linesize); 554 } 555 if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)){ 556 pix_op[1][uvdxy](dest_cr, ptr_cr, uvlinesize, h >> 1); 557 pix_op[1][uvdxy](dest_cb, ptr_cb, uvlinesize, h >> 1); 558 } 559} 560 561/** 562 * h263 chroma 4mv motion compensation. 563 */ 564static inline void chroma_4mv_motion(MpegEncContext *s, 565 uint8_t *dest_cb, uint8_t *dest_cr, 566 uint8_t **ref_picture, 567 op_pixels_func *pix_op, 568 int mx, int my){ 569 int dxy, emu=0, src_x, src_y, offset; 570 uint8_t *ptr; 571 572 /* In case of 8X8, we construct a single chroma motion vector 573 with a special rounding */ 574 mx= ff_h263_round_chroma(mx); 575 my= ff_h263_round_chroma(my); 576 577 dxy = ((my & 1) << 1) | (mx & 1); 578 mx >>= 1; 579 my >>= 1; 580 581 src_x = s->mb_x * 8 + mx; 582 src_y = s->mb_y * 8 + my; 583 src_x = av_clip(src_x, -8, s->width/2); 584 if (src_x == s->width/2) 585 dxy &= ~1; 586 src_y = av_clip(src_y, -8, s->height/2); 587 if (src_y == s->height/2) 588 dxy &= ~2; 589 590 offset = (src_y * (s->uvlinesize)) + src_x; 591 ptr = ref_picture[1] + offset; 592 if(s->flags&CODEC_FLAG_EMU_EDGE){ 593 if( (unsigned)src_x > (s->h_edge_pos>>1) - (dxy &1) - 8 594 || (unsigned)src_y > (s->v_edge_pos>>1) - (dxy>>1) - 8){ 595 ff_emulated_edge_mc(s->edge_emu_buffer, ptr, s->uvlinesize, 596 9, 9, src_x, src_y, 597 s->h_edge_pos>>1, s->v_edge_pos>>1); 598 ptr= s->edge_emu_buffer; 599 emu=1; 600 } 601 } 602 pix_op[dxy](dest_cb, ptr, s->uvlinesize, 8); 603 604 ptr = ref_picture[2] + offset; 605 if(emu){ 606 ff_emulated_edge_mc(s->edge_emu_buffer, ptr, s->uvlinesize, 607 9, 9, src_x, src_y, 608 s->h_edge_pos>>1, s->v_edge_pos>>1); 609 ptr= s->edge_emu_buffer; 610 } 611 pix_op[dxy](dest_cr, ptr, s->uvlinesize, 8); 612} 613 614static inline void prefetch_motion(MpegEncContext *s, uint8_t **pix, int dir){ 615 /* fetch pixels for estimated mv 4 macroblocks ahead 616 * optimized for 64byte cache lines */ 617 const int shift = s->quarter_sample ? 2 : 1; 618 const int mx= (s->mv[dir][0][0]>>shift) + 16*s->mb_x + 8; 619 const int my= (s->mv[dir][0][1]>>shift) + 16*s->mb_y; 620 int off= mx + (my + (s->mb_x&3)*4)*s->linesize + 64; 621 s->dsp.prefetch(pix[0]+off, s->linesize, 4); 622 off= (mx>>1) + ((my>>1) + (s->mb_x&7))*s->uvlinesize + 64; 623 s->dsp.prefetch(pix[1]+off, pix[2]-pix[1], 2); 624} 625 626/** 627 * motion compensation of a single macroblock 628 * @param s context 629 * @param dest_y luma destination pointer 630 * @param dest_cb chroma cb/u destination pointer 631 * @param dest_cr chroma cr/v destination pointer 632 * @param dir direction (0->forward, 1->backward) 633 * @param ref_picture array[3] of pointers to the 3 planes of the reference picture 634 * @param pic_op halfpel motion compensation function (average or put normally) 635 * @param pic_op qpel motion compensation function (average or put normally) 636 * the motion vectors are taken from s->mv and the MV type from s->mv_type 637 */ 638static av_always_inline void MPV_motion_internal(MpegEncContext *s, 639 uint8_t *dest_y, uint8_t *dest_cb, 640 uint8_t *dest_cr, int dir, 641 uint8_t **ref_picture, 642 op_pixels_func (*pix_op)[4], 643 qpel_mc_func (*qpix_op)[16], int is_mpeg12) 644{ 645 int dxy, mx, my, src_x, src_y, motion_x, motion_y; 646 int mb_x, mb_y, i; 647 uint8_t *ptr, *dest; 648 649 mb_x = s->mb_x; 650 mb_y = s->mb_y; 651 652 prefetch_motion(s, ref_picture, dir); 653 654 if(!is_mpeg12 && s->obmc && s->pict_type != FF_B_TYPE){ 655 int16_t mv_cache[4][4][2]; 656 const int xy= s->mb_x + s->mb_y*s->mb_stride; 657 const int mot_stride= s->b8_stride; 658 const int mot_xy= mb_x*2 + mb_y*2*mot_stride; 659 660 assert(!s->mb_skipped); 661 662 memcpy(mv_cache[1][1], s->current_picture.motion_val[0][mot_xy ], sizeof(int16_t)*4); 663 memcpy(mv_cache[2][1], s->current_picture.motion_val[0][mot_xy+mot_stride], sizeof(int16_t)*4); 664 memcpy(mv_cache[3][1], s->current_picture.motion_val[0][mot_xy+mot_stride], sizeof(int16_t)*4); 665 666 if(mb_y==0 || IS_INTRA(s->current_picture.mb_type[xy-s->mb_stride])){ 667 memcpy(mv_cache[0][1], mv_cache[1][1], sizeof(int16_t)*4); 668 }else{ 669 memcpy(mv_cache[0][1], s->current_picture.motion_val[0][mot_xy-mot_stride], sizeof(int16_t)*4); 670 } 671 672 if(mb_x==0 || IS_INTRA(s->current_picture.mb_type[xy-1])){ 673 *(int32_t*)mv_cache[1][0]= *(int32_t*)mv_cache[1][1]; 674 *(int32_t*)mv_cache[2][0]= *(int32_t*)mv_cache[2][1]; 675 }else{ 676 *(int32_t*)mv_cache[1][0]= *(int32_t*)s->current_picture.motion_val[0][mot_xy-1]; 677 *(int32_t*)mv_cache[2][0]= *(int32_t*)s->current_picture.motion_val[0][mot_xy-1+mot_stride]; 678 } 679 680 if(mb_x+1>=s->mb_width || IS_INTRA(s->current_picture.mb_type[xy+1])){ 681 *(int32_t*)mv_cache[1][3]= *(int32_t*)mv_cache[1][2]; 682 *(int32_t*)mv_cache[2][3]= *(int32_t*)mv_cache[2][2]; 683 }else{ 684 *(int32_t*)mv_cache[1][3]= *(int32_t*)s->current_picture.motion_val[0][mot_xy+2]; 685 *(int32_t*)mv_cache[2][3]= *(int32_t*)s->current_picture.motion_val[0][mot_xy+2+mot_stride]; 686 } 687 688 mx = 0; 689 my = 0; 690 for(i=0;i<4;i++) { 691 const int x= (i&1)+1; 692 const int y= (i>>1)+1; 693 int16_t mv[5][2]= { 694 {mv_cache[y][x ][0], mv_cache[y][x ][1]}, 695 {mv_cache[y-1][x][0], mv_cache[y-1][x][1]}, 696 {mv_cache[y][x-1][0], mv_cache[y][x-1][1]}, 697 {mv_cache[y][x+1][0], mv_cache[y][x+1][1]}, 698 {mv_cache[y+1][x][0], mv_cache[y+1][x][1]}}; 699 //FIXME cleanup 700 obmc_motion(s, dest_y + ((i & 1) * 8) + (i >> 1) * 8 * s->linesize, 701 ref_picture[0], 702 mb_x * 16 + (i & 1) * 8, mb_y * 16 + (i >>1) * 8, 703 pix_op[1], 704 mv); 705 706 mx += mv[0][0]; 707 my += mv[0][1]; 708 } 709 if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)) 710 chroma_4mv_motion(s, dest_cb, dest_cr, ref_picture, pix_op[1], mx, my); 711 712 return; 713 } 714 715 switch(s->mv_type) { 716 case MV_TYPE_16X16: 717 if(s->mcsel){ 718 if(s->real_sprite_warping_points==1){ 719 gmc1_motion(s, dest_y, dest_cb, dest_cr, 720 ref_picture); 721 }else{ 722 gmc_motion(s, dest_y, dest_cb, dest_cr, 723 ref_picture); 724 } 725 }else if(!is_mpeg12 && s->quarter_sample){ 726 qpel_motion(s, dest_y, dest_cb, dest_cr, 727 0, 0, 0, 728 ref_picture, pix_op, qpix_op, 729 s->mv[dir][0][0], s->mv[dir][0][1], 16); 730 }else if(!is_mpeg12 && (CONFIG_WMV2_DECODER || CONFIG_WMV2_ENCODER) && s->mspel){ 731 ff_mspel_motion(s, dest_y, dest_cb, dest_cr, 732 ref_picture, pix_op, 733 s->mv[dir][0][0], s->mv[dir][0][1], 16); 734 }else 735 { 736 mpeg_motion(s, dest_y, dest_cb, dest_cr, 737 0, 0, 0, 738 ref_picture, pix_op, 739 s->mv[dir][0][0], s->mv[dir][0][1], 16, mb_y); 740 } 741 break; 742 case MV_TYPE_8X8: 743 if (!is_mpeg12) { 744 mx = 0; 745 my = 0; 746 if(s->quarter_sample){ 747 for(i=0;i<4;i++) { 748 motion_x = s->mv[dir][i][0]; 749 motion_y = s->mv[dir][i][1]; 750 751 dxy = ((motion_y & 3) << 2) | (motion_x & 3); 752 src_x = mb_x * 16 + (motion_x >> 2) + (i & 1) * 8; 753 src_y = mb_y * 16 + (motion_y >> 2) + (i >>1) * 8; 754 755 /* WARNING: do no forget half pels */ 756 src_x = av_clip(src_x, -16, s->width); 757 if (src_x == s->width) 758 dxy &= ~3; 759 src_y = av_clip(src_y, -16, s->height); 760 if (src_y == s->height) 761 dxy &= ~12; 762 763 ptr = ref_picture[0] + (src_y * s->linesize) + (src_x); 764 if(s->flags&CODEC_FLAG_EMU_EDGE){ 765 if( (unsigned)src_x > s->h_edge_pos - (motion_x&3) - 8 766 || (unsigned)src_y > s->v_edge_pos - (motion_y&3) - 8 ){ 767 ff_emulated_edge_mc(s->edge_emu_buffer, ptr, 768 s->linesize, 9, 9, 769 src_x, src_y, 770 s->h_edge_pos, s->v_edge_pos); 771 ptr= s->edge_emu_buffer; 772 } 773 } 774 dest = dest_y + ((i & 1) * 8) + (i >> 1) * 8 * s->linesize; 775 qpix_op[1][dxy](dest, ptr, s->linesize); 776 777 mx += s->mv[dir][i][0]/2; 778 my += s->mv[dir][i][1]/2; 779 } 780 }else{ 781 for(i=0;i<4;i++) { 782 hpel_motion(s, dest_y + ((i & 1) * 8) + (i >> 1) * 8 * s->linesize, 783 ref_picture[0], 0, 0, 784 mb_x * 16 + (i & 1) * 8, mb_y * 16 + (i >>1) * 8, 785 s->width, s->height, s->linesize, 786 s->h_edge_pos, s->v_edge_pos, 787 8, 8, pix_op[1], 788 s->mv[dir][i][0], s->mv[dir][i][1]); 789 790 mx += s->mv[dir][i][0]; 791 my += s->mv[dir][i][1]; 792 } 793 } 794 795 if(!CONFIG_GRAY || !(s->flags&CODEC_FLAG_GRAY)) 796 chroma_4mv_motion(s, dest_cb, dest_cr, ref_picture, pix_op[1], mx, my); 797 } 798 break; 799 case MV_TYPE_FIELD: 800 if (s->picture_structure == PICT_FRAME) { 801 if(!is_mpeg12 && s->quarter_sample){ 802 for(i=0; i<2; i++){ 803 qpel_motion(s, dest_y, dest_cb, dest_cr, 804 1, i, s->field_select[dir][i], 805 ref_picture, pix_op, qpix_op, 806 s->mv[dir][i][0], s->mv[dir][i][1], 8); 807 } 808 }else{ 809 /* top field */ 810 mpeg_motion(s, dest_y, dest_cb, dest_cr, 811 1, 0, s->field_select[dir][0], 812 ref_picture, pix_op, 813 s->mv[dir][0][0], s->mv[dir][0][1], 8, mb_y); 814 /* bottom field */ 815 mpeg_motion(s, dest_y, dest_cb, dest_cr, 816 1, 1, s->field_select[dir][1], 817 ref_picture, pix_op, 818 s->mv[dir][1][0], s->mv[dir][1][1], 8, mb_y); 819 } 820 } else { 821 if(s->picture_structure != s->field_select[dir][0] + 1 && s->pict_type != FF_B_TYPE && !s->first_field){ 822 ref_picture= s->current_picture_ptr->data; 823 } 824 825 mpeg_motion(s, dest_y, dest_cb, dest_cr, 826 0, 0, s->field_select[dir][0], 827 ref_picture, pix_op, 828 s->mv[dir][0][0], s->mv[dir][0][1], 16, mb_y>>1); 829 } 830 break; 831 case MV_TYPE_16X8: 832 for(i=0; i<2; i++){ 833 uint8_t ** ref2picture; 834 835 if(s->picture_structure == s->field_select[dir][i] + 1 836 || s->pict_type == FF_B_TYPE || s->first_field){ 837 ref2picture= ref_picture; 838 }else{ 839 ref2picture= s->current_picture_ptr->data; 840 } 841 842 mpeg_motion(s, dest_y, dest_cb, dest_cr, 843 0, 0, s->field_select[dir][i], 844 ref2picture, pix_op, 845 s->mv[dir][i][0], s->mv[dir][i][1] + 16*i, 8, mb_y>>1); 846 847 dest_y += 16*s->linesize; 848 dest_cb+= (16>>s->chroma_y_shift)*s->uvlinesize; 849 dest_cr+= (16>>s->chroma_y_shift)*s->uvlinesize; 850 } 851 break; 852 case MV_TYPE_DMV: 853 if(s->picture_structure == PICT_FRAME){ 854 for(i=0; i<2; i++){ 855 int j; 856 for(j=0; j<2; j++){ 857 mpeg_motion(s, dest_y, dest_cb, dest_cr, 858 1, j, j^i, 859 ref_picture, pix_op, 860 s->mv[dir][2*i + j][0], s->mv[dir][2*i + j][1], 8, mb_y); 861 } 862 pix_op = s->dsp.avg_pixels_tab; 863 } 864 }else{ 865 for(i=0; i<2; i++){ 866 mpeg_motion(s, dest_y, dest_cb, dest_cr, 867 0, 0, s->picture_structure != i+1, 868 ref_picture, pix_op, 869 s->mv[dir][2*i][0],s->mv[dir][2*i][1],16, mb_y>>1); 870 871 // after put we make avg of the same block 872 pix_op=s->dsp.avg_pixels_tab; 873 874 //opposite parity is always in the same frame if this is second field 875 if(!s->first_field){ 876 ref_picture = s->current_picture_ptr->data; 877 } 878 } 879 } 880 break; 881 default: assert(0); 882 } 883} 884 885static inline void MPV_motion(MpegEncContext *s, 886 uint8_t *dest_y, uint8_t *dest_cb, 887 uint8_t *dest_cr, int dir, 888 uint8_t **ref_picture, 889 op_pixels_func (*pix_op)[4], 890 qpel_mc_func (*qpix_op)[16]) 891{ 892#if !CONFIG_SMALL 893 if(s->out_format == FMT_MPEG1) 894 MPV_motion_internal(s, dest_y, dest_cb, dest_cr, dir, 895 ref_picture, pix_op, qpix_op, 1); 896 else 897#endif 898 MPV_motion_internal(s, dest_y, dest_cb, dest_cr, dir, 899 ref_picture, pix_op, qpix_op, 0); 900} 901#endif /* AVCODEC_MPEGVIDEO_COMMON_H */ 902