/*
 * Generic DCT based hybrid video encoder
 * Copyright (c) 2000, 2001, 2002 Fabrice Bellard
 * Copyright (c) 2002-2004 Michael Niedermayer
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
22
/**
 * @file libavcodec/mpegvideo.h
 * mpegvideo header.
 */
27
28#ifndef AVCODEC_MPEGVIDEO_H
29#define AVCODEC_MPEGVIDEO_H
30
31#include "dsputil.h"
32#include "bitstream.h"
33#include "ratecontrol.h"
34#include "parser.h"
35#include "mpeg12data.h"
36#include "rl.h"
37
#define FRAME_SKIPPED 100 ///< return value for header parsers if frame is not coded
39
/**
 * Output format selector, stored in MpegEncContext.out_format.
 * The enumerators take the implicit values 0..4 in declaration order.
 */
enum OutputFormat {
    FMT_MPEG1,
    FMT_H261,
    FMT_H263,
    FMT_MJPEG,
    FMT_H264,
};
47
/*
 * Compile-time limits and shift amounts used together with the structures
 * declared below. NOTE(review): apart from MAX_MV and MAX_THREADS, the
 * consumers of these constants live outside this header.
 */
#define MPEG_BUF_SIZE (16 * 1024)

#define QMAT_SHIFT_MMX 16
#define QMAT_SHIFT 22

#define MAX_FCODE 7
#define MAX_MV 2048     ///< MotionEstContext.mv_penalty rows hold MAX_MV*2+1 entries

#define MAX_THREADS 8   ///< capacity of MpegEncContext.thread_context[]

#define MAX_PICTURE_COUNT 32

#define ME_MAP_SIZE 64
#define ME_MAP_SHIFT 3
#define ME_MAP_MV_BITS 11

#define MAX_MB_BYTES (30*16*16*3/8 + 120)

#define INPLACE_OFFSET 16
67
/*
 * Start codes.
 * Each value is a full 32-bit word: the 0x000001 prefix in the upper 24 bits
 * followed by the code byte. Slice codes cover the inclusive range
 * SLICE_MIN_START_CODE..SLICE_MAX_START_CODE.
 */
#define SEQ_END_CODE            0x000001b7
#define SEQ_START_CODE          0x000001b3
#define GOP_START_CODE          0x000001b8
#define PICTURE_START_CODE      0x00000100
#define SLICE_MIN_START_CODE    0x00000101
#define SLICE_MAX_START_CODE    0x000001af
#define EXT_START_CODE          0x000001b5
#define USER_START_CODE         0x000001b2
77
78/**
79 * Picture.
80 */
81typedef struct Picture{
82    FF_COMMON_FRAME
83
84    /**
85     * halfpel luma planes.
86     */
87    uint8_t *interpolated[3];
88    int16_t (*motion_val_base[2])[2];
89    uint32_t *mb_type_base;
90#define MB_TYPE_INTRA MB_TYPE_INTRA4x4 //default mb_type if there is just one type
91#define IS_INTRA4x4(a)   ((a)&MB_TYPE_INTRA4x4)
92#define IS_INTRA16x16(a) ((a)&MB_TYPE_INTRA16x16)
93#define IS_PCM(a)        ((a)&MB_TYPE_INTRA_PCM)
94#define IS_INTRA(a)      ((a)&7)
95#define IS_INTER(a)      ((a)&(MB_TYPE_16x16|MB_TYPE_16x8|MB_TYPE_8x16|MB_TYPE_8x8))
96#define IS_SKIP(a)       ((a)&MB_TYPE_SKIP)
97#define IS_INTRA_PCM(a)  ((a)&MB_TYPE_INTRA_PCM)
98#define IS_INTERLACED(a) ((a)&MB_TYPE_INTERLACED)
99#define IS_DIRECT(a)     ((a)&MB_TYPE_DIRECT2)
100#define IS_GMC(a)        ((a)&MB_TYPE_GMC)
101#define IS_16X16(a)      ((a)&MB_TYPE_16x16)
102#define IS_16X8(a)       ((a)&MB_TYPE_16x8)
103#define IS_8X16(a)       ((a)&MB_TYPE_8x16)
104#define IS_8X8(a)        ((a)&MB_TYPE_8x8)
105#define IS_SUB_8X8(a)    ((a)&MB_TYPE_16x16) //note reused
106#define IS_SUB_8X4(a)    ((a)&MB_TYPE_16x8)  //note reused
107#define IS_SUB_4X8(a)    ((a)&MB_TYPE_8x16)  //note reused
108#define IS_SUB_4X4(a)    ((a)&MB_TYPE_8x8)   //note reused
109#define IS_ACPRED(a)     ((a)&MB_TYPE_ACPRED)
110#define IS_QUANT(a)      ((a)&MB_TYPE_QUANT)
111#define IS_DIR(a, part, list) ((a) & (MB_TYPE_P0L0<<((part)+2*(list))))
112#define USES_LIST(a, list) ((a) & ((MB_TYPE_P0L0|MB_TYPE_P1L0)<<(2*(list)))) ///< does this mb use listX, note does not work if subMBs
113#define HAS_CBP(a)        ((a)&MB_TYPE_CBP)
114
115    int field_poc[2];           ///< h264 top/bottom POC
116    int poc;                    ///< h264 frame POC
117    int frame_num;              ///< h264 frame_num (raw frame_num from slice header)
118    int pic_id;                 /**< h264 pic_num (short -> no wrap version of pic_num,
119                                     pic_num & max_pic_num; long -> long_pic_num) */
120    int long_ref;               ///< 1->long term reference 0->short term reference
121    int ref_poc[2][2][16];      ///< h264 POCs of the frames used as reference (FIXME need per slice)
122    int ref_count[2][2];        ///< number of entries in ref_poc              (FIXME need per slice)
123    int mbaff;                  ///< h264 1 -> MBAFF frame 0-> not MBAFF
124
125    int mb_var_sum;             ///< sum of MB variance for current frame
126    int mc_mb_var_sum;          ///< motion compensated MB variance for current frame
127    uint16_t *mb_var;           ///< Table for MB variances
128    uint16_t *mc_mb_var;        ///< Table for motion compensated MB variances
129    uint8_t *mb_mean;           ///< Table for MB luminance
130    int32_t *mb_cmp_score;      ///< Table for MB cmp scores, for mb decision FIXME remove
131    int b_frame_score;          /* */
132} Picture;
133
134struct MpegEncContext;
135
136/**
137 * Motion estimation context.
138 */
139typedef struct MotionEstContext{
140    AVCodecContext *avctx;
141    int skip;                          ///< set if ME is skipped for the current MB
142    int co_located_mv[4][2];           ///< mv from last P-frame for direct mode ME
143    int direct_basis_mv[4][2];
144    uint8_t *scratchpad;               ///< data area for the ME algo, so that the ME does not need to malloc/free
145    uint8_t *best_mb;
146    uint8_t *temp_mb[2];
147    uint8_t *temp;
148    int best_bits;
149    uint32_t *map;                     ///< map to avoid duplicate evaluations
150    uint32_t *score_map;               ///< map to store the scores
151    int map_generation;
152    int pre_penalty_factor;
153    int penalty_factor;                /*!< an estimate of the bits required to
154                                        code a given mv value, e.g. (1,0) takes
155                                        more bits than (0,0). We have to
156                                        estimate whether any reduction in
157                                        residual is worth the extra bits. */
158    int sub_penalty_factor;
159    int mb_penalty_factor;
160    int flags;
161    int sub_flags;
162    int mb_flags;
163    int pre_pass;                      ///< = 1 for the pre pass
164    int dia_size;
165    int xmin;
166    int xmax;
167    int ymin;
168    int ymax;
169    int pred_x;
170    int pred_y;
171    uint8_t *src[4][4];
172    uint8_t *ref[4][4];
173    int stride;
174    int uvstride;
175    /* temp variables for picture complexity calculation */
176    int mc_mb_var_sum_temp;
177    int mb_var_sum_temp;
178    int scene_change_score;
179/*    cmp, chroma_cmp;*/
180    op_pixels_func (*hpel_put)[4];
181    op_pixels_func (*hpel_avg)[4];
182    qpel_mc_func (*qpel_put)[16];
183    qpel_mc_func (*qpel_avg)[16];
184    uint8_t (*mv_penalty)[MAX_MV*2+1];  ///< amount of bits needed to encode a MV
185    uint8_t *current_mv_penalty;
186    int (*sub_motion_search)(struct MpegEncContext * s,
187                                  int *mx_ptr, int *my_ptr, int dmin,
188                                  int src_index, int ref_index,
189                                  int size, int h);
190}MotionEstContext;
191
192/**
193 * MpegEncContext.
194 */
195typedef struct MpegEncContext {
196    struct AVCodecContext *avctx;
197    /* the following parameters must be initialized before encoding */
198    int width, height;///< picture size. must be a multiple of 16
199    int gop_size;
200    int intra_only;   ///< if true, only intra pictures are generated
201    int bit_rate;     ///< wanted bit rate
202    enum OutputFormat out_format; ///< output format
203    int h263_pred;    ///< use mpeg4/h263 ac/dc predictions
204    int pb_frame;     ///< PB frame mode (0 = none, 1 = base, 2 = improved)
205
206/* the following codec id fields are deprecated in favor of codec_id */
207    int h263_plus;    ///< h263 plus headers
208    int h263_msmpeg4; ///< generate MSMPEG4 compatible stream (deprecated, use msmpeg4_version instead)
209    int h263_flv;     ///< use flv h263 header
210
211    enum CodecID codec_id;     /* see CODEC_ID_xxx */
212    int fixed_qscale; ///< fixed qscale if non zero
213    int encoding;     ///< true if we are encoding (vs decoding)
214    int flags;        ///< AVCodecContext.flags (HQ, MV4, ...)
215    int flags2;       ///< AVCodecContext.flags2
216    int max_b_frames; ///< max number of b-frames for encoding
217    int luma_elim_threshold;
218    int chroma_elim_threshold;
219    int strict_std_compliance; ///< strictly follow the std (MPEG4, ...)
220    int workaround_bugs;       ///< workaround bugs in encoders which cannot be detected automatically
221    int codec_tag;             ///< internal codec_tag upper case converted from avctx codec_tag
222    int stream_codec_tag;      ///< internal stream_codec_tag upper case converted from avctx stream_codec_tag
223    /* the following fields are managed internally by the encoder */
224
225    /** bit output */
226    PutBitContext pb;
227
228    /* sequence parameters */
229    int context_initialized;
230    int input_picture_number;  ///< used to set pic->display_picture_number, should not be used for/by anything else
231    int coded_picture_number;  ///< used to set pic->coded_picture_number, should not be used for/by anything else
232    int picture_number;       //FIXME remove, unclear definition
233    int picture_in_gop_number; ///< 0-> first pic in gop, ...
234    int b_frames_since_non_b;  ///< used for encoding, relative to not yet reordered input
235    int64_t user_specified_pts;///< last non zero pts from AVFrame which was passed into avcodec_encode_video()
236    int mb_width, mb_height;   ///< number of MBs horizontally & vertically
237    int mb_stride;             ///< mb_width+1 used for some arrays to allow simple addressing of left & top MBs without sig11
238    int b8_stride;             ///< 2*mb_width+1 used for some 8x8 block arrays to allow simple addressing
239    int b4_stride;             ///< 4*mb_width+1 used for some 4x4 block arrays to allow simple addressing
240    int h_edge_pos, v_edge_pos;///< horizontal / vertical position of the right/bottom edge (pixel replication)
241    int mb_num;                ///< number of MBs of a picture
242    int linesize;              ///< line size, in bytes, may be different from width
243    int uvlinesize;            ///< line size, for chroma in bytes, may be different from width
244    Picture *picture;          ///< main picture buffer
245    Picture **input_picture;   ///< next pictures on display order for encoding
246    Picture **reordered_input_picture; ///< pointer to the next pictures in codedorder for encoding
247
248    int start_mb_y;            ///< start mb_y of this thread (so current thread should process start_mb_y <= row < end_mb_y)
249    int end_mb_y;              ///< end   mb_y of this thread (so current thread should process start_mb_y <= row < end_mb_y)
250    struct MpegEncContext *thread_context[MAX_THREADS];
251
252    /**
253     * copy of the previous picture structure.
254     * note, linesize & data, might not match the previous picture (for field pictures)
255     */
256    Picture last_picture;
257
258    /**
259     * copy of the next picture structure.
260     * note, linesize & data, might not match the next picture (for field pictures)
261     */
262    Picture next_picture;
263
264    /**
265     * copy of the source picture structure for encoding.
266     * note, linesize & data, might not match the source picture (for field pictures)
267     */
268    Picture new_picture;
269
270    /**
271     * copy of the current picture structure.
272     * note, linesize & data, might not match the current picture (for field pictures)
273     */
274    Picture current_picture;    ///< buffer to store the decompressed current picture
275
276    Picture *last_picture_ptr;     ///< pointer to the previous picture.
277    Picture *next_picture_ptr;     ///< pointer to the next picture (for bidir pred)
278    Picture *current_picture_ptr;  ///< pointer to the current picture
279    uint8_t *visualization_buffer[3]; //< temporary buffer vor MV visualization
280    int last_dc[3];                ///< last DC values for MPEG1
281    int16_t *dc_val_base;
282    int16_t *dc_val[3];            ///< used for mpeg4 DC prediction, all 3 arrays must be continuous
283    int16_t dc_cache[4*5];
284    int y_dc_scale, c_dc_scale;
285    const uint8_t *y_dc_scale_table;     ///< qscale -> y_dc_scale table
286    const uint8_t *c_dc_scale_table;     ///< qscale -> c_dc_scale table
287    const uint8_t *chroma_qscale_table;  ///< qscale -> chroma_qscale (h263)
288    uint8_t *coded_block_base;
289    uint8_t *coded_block;          ///< used for coded block pattern prediction (msmpeg4v3, wmv1)
290    int16_t (*ac_val_base)[16];
291    int16_t (*ac_val[3])[16];      ///< used for for mpeg4 AC prediction, all 3 arrays must be continuous
292    int ac_pred;
293    uint8_t *prev_pict_types;     ///< previous picture types in bitstream order, used for mb skip
294#define PREV_PICT_TYPES_BUFFER_SIZE 256
295    int mb_skipped;                ///< MUST BE SET only during DECODING
296    uint8_t *mbskip_table;        /**< used to avoid copy if macroblock skipped (for black regions for example)
297                                   and used for b-frame encoding & decoding (contains skip table of next P Frame) */
298    uint8_t *mbintra_table;       ///< used to avoid setting {ac, dc, cbp}-pred stuff to zero on inter MB decoding
299    uint8_t *cbp_table;           ///< used to store cbp, ac_pred for partitioned decoding
300    uint8_t *pred_dir_table;      ///< used to store pred_dir for partitioned decoding
301    uint8_t *allocated_edge_emu_buffer;
302    uint8_t *edge_emu_buffer;     ///< points into the middle of allocated_edge_emu_buffer
303    uint8_t *rd_scratchpad;       ///< scratchpad for rate distortion mb decision
304    uint8_t *obmc_scratchpad;
305    uint8_t *b_scratchpad;        ///< scratchpad used for writing into write only buffers
306
307    int qscale;                 ///< QP
308    int chroma_qscale;          ///< chroma QP
309    unsigned int lambda;        ///< lagrange multipler used in rate distortion
310    unsigned int lambda2;       ///< (lambda*lambda) >> FF_LAMBDA_SHIFT
311    int *lambda_table;
312    int adaptive_quant;         ///< use adaptive quantization
313    int dquant;                 ///< qscale difference to prev qscale
314    int pict_type;              ///< FF_I_TYPE, FF_P_TYPE, FF_B_TYPE, ...
315    int last_pict_type; //FIXME removes
316    int last_non_b_pict_type;   ///< used for mpeg4 gmc b-frames & ratecontrol
317    int dropable;
318    int frame_rate_index;
319    int last_lambda_for[5];     ///< last lambda for a specific pict type
320    int skipdct;                ///< skip dct and code zero residual
321
322    /* motion compensation */
323    int unrestricted_mv;        ///< mv can point outside of the coded picture
324    int h263_long_vectors;      ///< use horrible h263v1 long vector mode
325    int decode;                 ///< if 0 then decoding will be skipped (for encoding b frames for example)
326
327    DSPContext dsp;             ///< pointers for accelerated dsp functions
328    int f_code;                 ///< forward MV resolution
329    int b_code;                 ///< backward MV resolution for B Frames (mpeg4)
330    int16_t (*p_mv_table_base)[2];
331    int16_t (*b_forw_mv_table_base)[2];
332    int16_t (*b_back_mv_table_base)[2];
333    int16_t (*b_bidir_forw_mv_table_base)[2];
334    int16_t (*b_bidir_back_mv_table_base)[2];
335    int16_t (*b_direct_mv_table_base)[2];
336    int16_t (*p_field_mv_table_base[2][2])[2];
337    int16_t (*b_field_mv_table_base[2][2][2])[2];
338    int16_t (*p_mv_table)[2];            ///< MV table (1MV per MB) p-frame encoding
339    int16_t (*b_forw_mv_table)[2];       ///< MV table (1MV per MB) forward mode b-frame encoding
340    int16_t (*b_back_mv_table)[2];       ///< MV table (1MV per MB) backward mode b-frame encoding
341    int16_t (*b_bidir_forw_mv_table)[2]; ///< MV table (1MV per MB) bidir mode b-frame encoding
342    int16_t (*b_bidir_back_mv_table)[2]; ///< MV table (1MV per MB) bidir mode b-frame encoding
343    int16_t (*b_direct_mv_table)[2];     ///< MV table (1MV per MB) direct mode b-frame encoding
344    int16_t (*p_field_mv_table[2][2])[2];   ///< MV table (2MV per MB) interlaced p-frame encoding
345    int16_t (*b_field_mv_table[2][2][2])[2];///< MV table (4MV per MB) interlaced b-frame encoding
346    uint8_t (*p_field_select_table[2]);
347    uint8_t (*b_field_select_table[2][2]);
348    int me_method;                       ///< ME algorithm
349    int mv_dir;
350#define MV_DIR_FORWARD   1
351#define MV_DIR_BACKWARD  2
352#define MV_DIRECT        4 ///< bidirectional mode where the difference equals the MV of the last P/S/I-Frame (mpeg4)
353    int mv_type;
354#define MV_TYPE_16X16       0   ///< 1 vector for the whole mb
355#define MV_TYPE_8X8         1   ///< 4 vectors (h263, mpeg4 4MV)
356#define MV_TYPE_16X8        2   ///< 2 vectors, one per 16x8 block
357#define MV_TYPE_FIELD       3   ///< 2 vectors, one per field
358#define MV_TYPE_DMV         4   ///< 2 vectors, special mpeg2 Dual Prime Vectors
359    /**motion vectors for a macroblock
360       first coordinate : 0 = forward 1 = backward
361       second "         : depend on type
362       third  "         : 0 = x, 1 = y
363    */
364    int mv[2][4][2];
365    int field_select[2][2];
366    int last_mv[2][2][2];             ///< last MV, used for MV prediction in MPEG1 & B-frame MPEG4
367    uint8_t *fcode_tab;               ///< smallest fcode needed for each MV
368    int16_t direct_scale_mv[2][64];   ///< precomputed to avoid divisions in ff_mpeg4_set_direct_mv
369
370    MotionEstContext me;
371
372    int no_rounding;  /**< apply no rounding to motion compensation (MPEG4, msmpeg4, ...)
373                        for b-frames rounding mode is always 0 */
374
375    int hurry_up;     /**< when set to 1 during decoding, b frames will be skipped
376                         when set to 2 idct/dequant will be skipped too */
377
378    /* macroblock layer */
379    int mb_x, mb_y;
380    int mb_skip_run;
381    int mb_intra;
382    uint16_t *mb_type;           ///< Table for candidate MB types for encoding
383#define CANDIDATE_MB_TYPE_INTRA    0x01
384#define CANDIDATE_MB_TYPE_INTER    0x02
385#define CANDIDATE_MB_TYPE_INTER4V  0x04
386#define CANDIDATE_MB_TYPE_SKIPPED   0x08
387//#define MB_TYPE_GMC      0x10
388
389#define CANDIDATE_MB_TYPE_DIRECT   0x10
390#define CANDIDATE_MB_TYPE_FORWARD  0x20
391#define CANDIDATE_MB_TYPE_BACKWARD 0x40
392#define CANDIDATE_MB_TYPE_BIDIR    0x80
393
394#define CANDIDATE_MB_TYPE_INTER_I    0x100
395#define CANDIDATE_MB_TYPE_FORWARD_I  0x200
396#define CANDIDATE_MB_TYPE_BACKWARD_I 0x400
397#define CANDIDATE_MB_TYPE_BIDIR_I    0x800
398
399#define CANDIDATE_MB_TYPE_DIRECT0    0x1000
400
401    int block_index[6]; ///< index to current MB in block based arrays with edges
402    int block_wrap[6];
403    uint8_t *dest[3];
404
405    int *mb_index2xy;        ///< mb_index -> mb_x + mb_y*mb_stride
406
407    /** matrix transmitted in the bitstream */
408    uint16_t intra_matrix[64];
409    uint16_t chroma_intra_matrix[64];
410    uint16_t inter_matrix[64];
411    uint16_t chroma_inter_matrix[64];
412#define QUANT_BIAS_SHIFT 8
413    int intra_quant_bias;    ///< bias for the quantizer
414    int inter_quant_bias;    ///< bias for the quantizer
415    int min_qcoeff;          ///< minimum encodable coefficient
416    int max_qcoeff;          ///< maximum encodable coefficient
417    int ac_esc_length;       ///< num of bits needed to encode the longest esc
418    uint8_t *intra_ac_vlc_length;
419    uint8_t *intra_ac_vlc_last_length;
420    uint8_t *inter_ac_vlc_length;
421    uint8_t *inter_ac_vlc_last_length;
422    uint8_t *luma_dc_vlc_length;
423    uint8_t *chroma_dc_vlc_length;
424#define UNI_AC_ENC_INDEX(run,level) ((run)*128 + (level))
425
426    int coded_score[8];
427
428    /** precomputed matrix (combine qscale and DCT renorm) */
429    int (*q_intra_matrix)[64];
430    int (*q_inter_matrix)[64];
431    /** identical to the above but for MMX & these are not permutated, second 64 entries are bias*/
432    uint16_t (*q_intra_matrix16)[2][64];
433    uint16_t (*q_inter_matrix16)[2][64];
434    int block_last_index[12];  ///< last non zero coefficient in block
435    /* scantables */
436    DECLARE_ALIGNED_8(ScanTable, intra_scantable);
437    ScanTable intra_h_scantable;
438    ScanTable intra_v_scantable;
439    ScanTable inter_scantable; ///< if inter == intra then intra should be used to reduce tha cache usage
440
441    /* noise reduction */
442    int (*dct_error_sum)[64];
443    int dct_count[2];
444    uint16_t (*dct_offset)[64];
445
446    void *opaque;              ///< private data for the user
447
448    /* bit rate control */
449    int64_t wanted_bits;
450    int64_t total_bits;
451    int frame_bits;                ///< bits used for the current frame
452    int next_lambda;               ///< next lambda used for retrying to encode a frame
453    RateControlContext rc_context; ///< contains stuff only accessed in ratecontrol.c
454
455    /* statistics, used for 2-pass encoding */
456    int mv_bits;
457    int header_bits;
458    int i_tex_bits;
459    int p_tex_bits;
460    int i_count;
461    int f_count;
462    int b_count;
463    int skip_count;
464    int misc_bits; ///< cbp, mb_type
465    int last_bits; ///< temp var used for calculating the above vars
466
467    /* error concealment / resync */
468    int error_count;
469    uint8_t *error_status_table;       ///< table of the error status of each MB
470#define VP_START            1          ///< current MB is the first after a resync marker
471#define AC_ERROR            2
472#define DC_ERROR            4
473#define MV_ERROR            8
474#define AC_END              16
475#define DC_END              32
476#define MV_END              64
477//FIXME some prefix?
478
479    int resync_mb_x;                 ///< x position of last resync marker
480    int resync_mb_y;                 ///< y position of last resync marker
481    GetBitContext last_resync_gb;    ///< used to search for the next resync marker
482    int mb_num_left;                 ///< number of MBs left in this video packet (for partitioned Slices only)
483    int next_p_frame_damaged;        ///< set if the next p frame is damaged, to avoid showing trashed b frames
484    int error_recognition;
485
486    ParseContext parse_context;
487
488    /* H.263 specific */
489    int gob_index;
490    int obmc;                       ///< overlapped block motion compensation
491    int showed_packed_warning;      ///< flag for having shown the warning about divxs invalid b frames
492
493    /* H.263+ specific */
494    int umvplus;                    ///< == H263+ && unrestricted_mv
495    int h263_aic;                   ///< Advanded INTRA Coding (AIC)
496    int h263_aic_dir;               ///< AIC direction: 0 = left, 1 = top
497    int h263_slice_structured;
498    int alt_inter_vlc;              ///< alternative inter vlc
499    int modified_quant;
500    int loop_filter;
501    int custom_pcf;
502
503    /* mpeg4 specific */
504    int time_increment_bits;        ///< number of bits to represent the fractional part of time
505    int last_time_base;
506    int time_base;                  ///< time in seconds of last I,P,S Frame
507    int64_t time;                   ///< time of current frame
508    int64_t last_non_b_time;
509    uint16_t pp_time;               ///< time distance between the last 2 p,s,i frames
510    uint16_t pb_time;               ///< time distance between the last b and p,s,i frame
511    uint16_t pp_field_time;
512    uint16_t pb_field_time;         ///< like above, just for interlaced
513    int shape;
514    int vol_sprite_usage;
515    int sprite_width;
516    int sprite_height;
517    int sprite_left;
518    int sprite_top;
519    int sprite_brightness_change;
520    int num_sprite_warping_points;
521    int real_sprite_warping_points;
522    int sprite_offset[2][2];         ///< sprite offset[isChroma][isMVY]
523    int sprite_delta[2][2];          ///< sprite_delta [isY][isMVY]
524    int sprite_shift[2];             ///< sprite shift [isChroma]
525    int mcsel;
526    int quant_precision;
527    int quarter_sample;              ///< 1->qpel, 0->half pel ME/MC
528    int scalability;
529    int hierachy_type;
530    int enhancement_type;
531    int new_pred;
532    int reduced_res_vop;
533    int aspect_ratio_info; //FIXME remove
534    int sprite_warping_accuracy;
535    int low_latency_sprite;
536    int data_partitioning;           ///< data partitioning flag from header
537    int partitioned_frame;           ///< is current frame partitioned
538    int rvlc;                        ///< reversible vlc
539    int resync_marker;               ///< could this stream contain resync markers
540    int low_delay;                   ///< no reordering needed / has no b-frames
541    int vo_type;
542    int vol_control_parameters;      ///< does the stream contain the low_delay flag, used to workaround buggy encoders
543    int intra_dc_threshold;          ///< QP above whch the ac VLC should be used for intra dc
544    int use_intra_dc_vlc;
545    PutBitContext tex_pb;            ///< used for data partitioned VOPs
546    PutBitContext pb2;               ///< used for data partitioned VOPs
547    int mpeg_quant;
548    int t_frame;                       ///< time distance of first I -> B, used for interlaced b frames
549    int padding_bug_score;             ///< used to detect the VERY common padding bug in MPEG4
550    int cplx_estimation_trash_i;
551    int cplx_estimation_trash_p;
552    int cplx_estimation_trash_b;
553
554    /* divx specific, used to workaround (many) bugs in divx5 */
555    int divx_version;
556    int divx_build;
557    int divx_packed;
558    uint8_t *bitstream_buffer; //Divx 5.01 puts several frames in a single one, this is used to reorder them
559    int bitstream_buffer_size;
560    unsigned int allocated_bitstream_buffer_size;
561
562    int xvid_build;
563
564    /* lavc specific stuff, used to workaround bugs in libavcodec */
565    int lavc_build;
566
567    /* RV10 specific */
568    int rv10_version; ///< RV10 version: 0 or 3
569    int rv10_first_dc_coded[3];
570
571    /* MJPEG specific */
572    struct MJpegContext *mjpeg_ctx;
573    int mjpeg_vsample[3];       ///< vertical sampling factors, default = {2, 1, 1}
574    int mjpeg_hsample[3];       ///< horizontal sampling factors, default = {2, 1, 1}
575
576    /* MSMPEG4 specific */
577    int mv_table_index;
578    int rl_table_index;
579    int rl_chroma_table_index;
580    int dc_table_index;
581    int use_skip_mb_code;
582    int slice_height;      ///< in macroblocks
583    int first_slice_line;  ///< used in mpeg4 too to handle resync markers
584    int flipflop_rounding;
585    int msmpeg4_version;   ///< 0=not msmpeg4, 1=mp41, 2=mp42, 3=mp43/divx3 4=wmv1/7 5=wmv2/8
586    int per_mb_rl_table;
587    int esc3_level_length;
588    int esc3_run_length;
589    /** [mb_intra][isChroma][level][run][last] */
590    int (*ac_stats)[2][MAX_LEVEL+1][MAX_RUN+1][2];
591    int inter_intra_pred;
592    int mspel;
593
594    /* decompression specific */
595    GetBitContext gb;
596
597    /* Mpeg1 specific */
598    int gop_picture_number;  ///< index of the first picture of a GOP based on fake_pic_num & mpeg1 specific
599    int last_mv_dir;         ///< last mv_dir, used for b frame encoding
600    int broken_link;         ///< no_output_of_prior_pics_flag
601    uint8_t *vbv_delay_ptr;  ///< pointer to vbv_delay in the bitstream
602
603    /* MPEG-2-specific - I wished not to have to support this mess. */
604    int progressive_sequence;
605    int mpeg_f_code[2][2];
606    int picture_structure;
607/* picture type */
608#define PICT_TOP_FIELD     1
609#define PICT_BOTTOM_FIELD  2
610#define PICT_FRAME         3
611
612    int intra_dc_precision;
613    int frame_pred_frame_dct;
614    int top_field_first;
615    int concealment_motion_vectors;
616    int q_scale_type;
617    int intra_vlc_format;
618    int alternate_scan;
619    int repeat_first_field;
620    int chroma_420_type;
621    int chroma_format;
622#define CHROMA_420 1
623#define CHROMA_422 2
624#define CHROMA_444 3
625    int chroma_x_shift;//depend on pix_format, that depend on chroma_format
626    int chroma_y_shift;
627
628    int progressive_frame;
629    int full_pel[2];
630    int interlaced_dct;
631    int first_slice;
632    int first_field;         ///< is 1 for the first field of a field picture 0 otherwise
633
634    /* RTP specific */
635    int rtp_mode;
636
637    uint8_t *ptr_lastgob;
638    int swap_uv;             //vcr2 codec is an MPEG-2 variant with U and V swapped
639    DCTELEM (*pblocks[12])[64];
640
641    DCTELEM (*block)[64]; ///< points to one of the following blocks
642    DCTELEM (*blocks)[8][64]; // for HQ mode we need to keep the best block
643    int (*decode_mb)(struct MpegEncContext *s, DCTELEM block[6][64]); // used by some codecs to avoid a switch()
644#define SLICE_OK         0
645#define SLICE_ERROR     -1
646#define SLICE_END       -2 ///<end marker found
647#define SLICE_NOEND     -3 ///<no end marker or error found but mb count exceeded
648
649    void (*dct_unquantize_mpeg1_intra)(struct MpegEncContext *s,
650                           DCTELEM *block/*align 16*/, int n, int qscale);
651    void (*dct_unquantize_mpeg1_inter)(struct MpegEncContext *s,
652                           DCTELEM *block/*align 16*/, int n, int qscale);
653    void (*dct_unquantize_mpeg2_intra)(struct MpegEncContext *s,
654                           DCTELEM *block/*align 16*/, int n, int qscale);
655    void (*dct_unquantize_mpeg2_inter)(struct MpegEncContext *s,
656                           DCTELEM *block/*align 16*/, int n, int qscale);
657    void (*dct_unquantize_h263_intra)(struct MpegEncContext *s,
658                           DCTELEM *block/*align 16*/, int n, int qscale);
659    void (*dct_unquantize_h263_inter)(struct MpegEncContext *s,
660                           DCTELEM *block/*align 16*/, int n, int qscale);
661    void (*dct_unquantize_h261_intra)(struct MpegEncContext *s,
662                           DCTELEM *block/*align 16*/, int n, int qscale);
663    void (*dct_unquantize_h261_inter)(struct MpegEncContext *s,
664                           DCTELEM *block/*align 16*/, int n, int qscale);
665    void (*dct_unquantize_intra)(struct MpegEncContext *s, // unquantizer to use (mpeg4 can use both)
666                           DCTELEM *block/*align 16*/, int n, int qscale);
667    void (*dct_unquantize_inter)(struct MpegEncContext *s, // unquantizer to use (mpeg4 can use both)
668                           DCTELEM *block/*align 16*/, int n, int qscale);
669    int (*dct_quantize)(struct MpegEncContext *s, DCTELEM *block/*align 16*/, int n, int qscale, int *overflow);
670    int (*fast_dct_quantize)(struct MpegEncContext *s, DCTELEM *block/*align 16*/, int n, int qscale, int *overflow);
671    void (*denoise_dct)(struct MpegEncContext *s, DCTELEM *block);
672} MpegEncContext;
673
674
675void MPV_decode_defaults(MpegEncContext *s);
676int MPV_common_init(MpegEncContext *s);
677void MPV_common_end(MpegEncContext *s);
678void MPV_decode_mb(MpegEncContext *s, DCTELEM block[12][64]);
679int MPV_frame_start(MpegEncContext *s, AVCodecContext *avctx);
680void MPV_frame_end(MpegEncContext *s);
681int MPV_encode_init(AVCodecContext *avctx);
682int MPV_encode_end(AVCodecContext *avctx);
683int MPV_encode_picture(AVCodecContext *avctx, unsigned char *buf, int buf_size, void *data);
684void MPV_common_init_mmx(MpegEncContext *s);
685void MPV_common_init_axp(MpegEncContext *s);
686void MPV_common_init_mlib(MpegEncContext *s);
687void MPV_common_init_mmi(MpegEncContext *s);
688void MPV_common_init_arm(MpegEncContext *s);
689void MPV_common_init_altivec(MpegEncContext *s);
690void ff_clean_intra_table_entries(MpegEncContext *s);
691void ff_draw_horiz_band(MpegEncContext *s, int y, int h);
692void ff_mpeg_flush(AVCodecContext *avctx);
693void ff_print_debug_info(MpegEncContext *s, AVFrame *pict);
694void ff_write_quant_matrix(PutBitContext *pb, uint16_t *matrix);
695int ff_find_unused_picture(MpegEncContext *s, int shared);
696void ff_denoise_dct(MpegEncContext *s, DCTELEM *block);
697void ff_update_duplicate_context(MpegEncContext *dst, MpegEncContext *src);
698const uint8_t *ff_find_start_code(const uint8_t *p, const uint8_t *end, uint32_t *state);
699
700void ff_er_frame_start(MpegEncContext *s);
701void ff_er_frame_end(MpegEncContext *s);
702void ff_er_add_slice(MpegEncContext *s, int startx, int starty, int endx, int endy, int status);
703
704int ff_dct_common_init(MpegEncContext *s);
705void ff_convert_matrix(DSPContext *dsp, int (*qmat)[64], uint16_t (*qmat16)[2][64],
706                       const uint16_t *quant_matrix, int bias, int qmin, int qmax, int intra);
707
708void ff_init_block_index(MpegEncContext *s);
709void ff_copy_picture(Picture *dst, Picture *src);
710
711extern const enum PixelFormat ff_pixfmt_list_420[];
712extern const enum PixelFormat ff_hwaccel_pixfmt_list_420[];
713
714static inline void ff_update_block_index(MpegEncContext *s){
715    const int block_size= 8>>s->avctx->lowres;
716
717    s->block_index[0]+=2;
718    s->block_index[1]+=2;
719    s->block_index[2]+=2;
720    s->block_index[3]+=2;
721    s->block_index[4]++;
722    s->block_index[5]++;
723    s->dest[0]+= 2*block_size;
724    s->dest[1]+= block_size;
725    s->dest[2]+= block_size;
726}
727
728static inline int get_bits_diff(MpegEncContext *s){
729    const int bits= put_bits_count(&s->pb);
730    const int last= s->last_bits;
731
732    s->last_bits = bits;
733
734    return bits - last;
735}
736
/**
 * Round a value using the 16-entry H.263 chroma rounding table.
 *
 * The result is (x >> 3) plus a 0/1 correction selected by the low four
 * bits of x.
 *
 * NOTE(review): for negative x the right shift is implementation-defined
 * in C; callers passing negative values presumably expect an arithmetic
 * shift -- confirm for the targeted compilers.
 *
 * @param x value to round
 * @return (x >> 3) + table[x & 0xf]
 */
static inline int ff_h263_round_chroma(int x){
    static const uint8_t round_lut[16] = {
    /*  0  1  2  3  4  5  6  7 */
        0, 0, 0, 1, 1, 1, 1, 1,
    /*  8  9 10 11 12 13 14 15 */
        0, 0, 0, 0, 0, 0, 1, 1,
    };
    const int low_bits = x & 0xf;
    const int shifted  = x >> 3;

    return round_lut[low_bits] + shifted;
}
744
745/* motion_est.c */
746void ff_estimate_p_frame_motion(MpegEncContext * s,
747                             int mb_x, int mb_y);
748void ff_estimate_b_frame_motion(MpegEncContext * s,
749                             int mb_x, int mb_y);
750int ff_get_best_fcode(MpegEncContext * s, int16_t (*mv_table)[2], int type);
751void ff_fix_long_p_mvs(MpegEncContext * s);
752void ff_fix_long_mvs(MpegEncContext * s, uint8_t *field_select_table, int field_select,
753                     int16_t (*mv_table)[2], int f_code, int type, int truncate);
754int ff_init_me(MpegEncContext *s);
755int ff_pre_estimate_p_frame_motion(MpegEncContext * s, int mb_x, int mb_y);
756int ff_epzs_motion_search(MpegEncContext * s, int *mx_ptr, int *my_ptr,
757                             int P[10][2], int src_index, int ref_index, int16_t (*last_mv)[2],
758                             int ref_mv_scale, int size, int h);
759int ff_get_mb_score(MpegEncContext * s, int mx, int my, int src_index,
760                               int ref_index, int size, int h, int add_rate);
761
762/* mpeg12.c */
763extern const uint8_t ff_mpeg1_dc_scale_table[128];
764
765void mpeg1_encode_picture_header(MpegEncContext *s, int picture_number);
766void mpeg1_encode_mb(MpegEncContext *s,
767                     DCTELEM block[6][64],
768                     int motion_x, int motion_y);
769void ff_mpeg1_encode_init(MpegEncContext *s);
770void ff_mpeg1_encode_slice_header(MpegEncContext *s);
771void ff_mpeg1_clean_buffers(MpegEncContext *s);
772int ff_mpeg1_find_frame_end(ParseContext *pc, const uint8_t *buf, int buf_size);
773
/*
 * Constant tables shared between codec files. They are declared here and
 * defined in another translation unit: the uint8_t tables have 32 entries,
 * the two default matrices have 64 int16_t entries.
 */
extern const uint8_t  ff_mpeg4_y_dc_scale_table[32];
extern const uint8_t  ff_mpeg4_c_dc_scale_table[32];
extern const uint8_t  ff_aic_dc_scale_table[32];
extern const int16_t  ff_mpeg4_default_intra_matrix[64];
extern const int16_t  ff_mpeg4_default_non_intra_matrix[64];
extern const uint8_t  ff_h263_chroma_qscale_table[32];
extern const uint8_t  ff_h263_loop_filter_strength[32];
781
782/* h261.c */
783void ff_h261_loop_filter(MpegEncContext *s);
784void ff_h261_reorder_mb_index(MpegEncContext* s);
785void ff_h261_encode_mb(MpegEncContext *s,
786                    DCTELEM block[6][64],
787                    int motion_x, int motion_y);
788void ff_h261_encode_picture_header(MpegEncContext * s, int picture_number);
789void ff_h261_encode_init(MpegEncContext *s);
790int ff_h261_get_picture_format(int width, int height);
791
792
793/* h263.c, h263dec.c */
794int ff_h263_decode_init(AVCodecContext *avctx);
795int ff_h263_decode_frame(AVCodecContext *avctx,
796                             void *data, int *data_size,
797                             const uint8_t *buf, int buf_size);
798int ff_h263_decode_end(AVCodecContext *avctx);
799void h263_encode_mb(MpegEncContext *s,
800                    DCTELEM block[6][64],
801                    int motion_x, int motion_y);
802void mpeg4_encode_mb(MpegEncContext *s,
803                    DCTELEM block[6][64],
804                    int motion_x, int motion_y);
805void h263_encode_picture_header(MpegEncContext *s, int picture_number);
806void ff_flv_encode_picture_header(MpegEncContext *s, int picture_number);
807void h263_encode_gob_header(MpegEncContext * s, int mb_line);
808int16_t *h263_pred_motion(MpegEncContext * s, int block, int dir,
809                        int *px, int *py);
810void mpeg4_pred_ac(MpegEncContext * s, DCTELEM *block, int n,
811                   int dir);
812void ff_set_mpeg4_time(MpegEncContext * s);
813void mpeg4_encode_picture_header(MpegEncContext *s, int picture_number);
814void h263_encode_init(MpegEncContext *s);
815void h263_decode_init_vlc(MpegEncContext *s);
816int h263_decode_picture_header(MpegEncContext *s);
817int ff_h263_decode_gob_header(MpegEncContext *s);
818int ff_mpeg4_decode_picture_header(MpegEncContext * s, GetBitContext *gb);
819void ff_h263_update_motion_val(MpegEncContext * s);
820void ff_h263_loop_filter(MpegEncContext * s);
821void ff_set_qscale(MpegEncContext * s, int qscale);
822int ff_h263_decode_mba(MpegEncContext *s);
823void ff_h263_encode_mba(MpegEncContext *s);
824
825int intel_h263_decode_picture_header(MpegEncContext *s);
826int flv_h263_decode_picture_header(MpegEncContext *s);
827int ff_h263_decode_mb(MpegEncContext *s,
828                      DCTELEM block[6][64]);
829int ff_mpeg4_decode_mb(MpegEncContext *s,
830                      DCTELEM block[6][64]);
831int h263_get_picture_format(int width, int height);
832void ff_mpeg4_encode_video_packet_header(MpegEncContext *s);
833void ff_mpeg4_clean_buffers(MpegEncContext *s);
834void ff_mpeg4_stuffing(PutBitContext * pbc);
835void ff_mpeg4_init_partitions(MpegEncContext *s);
836void ff_mpeg4_merge_partitions(MpegEncContext *s);
837void ff_clean_mpeg4_qscales(MpegEncContext *s);
838void ff_clean_h263_qscales(MpegEncContext *s);
839int ff_mpeg4_decode_partitions(MpegEncContext *s);
840int ff_mpeg4_get_video_packet_prefix_length(MpegEncContext *s);
841int ff_h263_resync(MpegEncContext *s);
842const uint8_t *ff_h263_find_resync_marker(const uint8_t *p, const uint8_t *end);
843int ff_h263_get_gob_height(MpegEncContext *s);
844void ff_mpeg4_init_direct_mv(MpegEncContext *s);
845int ff_mpeg4_set_direct_mv(MpegEncContext *s, int mx, int my);
846void ff_h263_encode_motion(MpegEncContext * s, int val, int f_code);
847
848
849/* rv10.c */
850void rv10_encode_picture_header(MpegEncContext *s, int picture_number);
851int rv_decode_dc(MpegEncContext *s, int n);
852void rv20_encode_picture_header(MpegEncContext *s, int picture_number);
853
854
855/* msmpeg4.c */
856void msmpeg4_encode_picture_header(MpegEncContext * s, int picture_number);
857void msmpeg4_encode_ext_header(MpegEncContext * s);
858void msmpeg4_encode_mb(MpegEncContext * s,
859                       DCTELEM block[6][64],
860                       int motion_x, int motion_y);
861int msmpeg4_decode_picture_header(MpegEncContext * s);
862int msmpeg4_decode_ext_header(MpegEncContext * s, int buf_size);
863int ff_msmpeg4_decode_init(MpegEncContext *s);
864void ff_msmpeg4_encode_init(MpegEncContext *s);
865int ff_wmv2_decode_picture_header(MpegEncContext * s);
866int ff_wmv2_decode_secondary_picture_header(MpegEncContext * s);
867void ff_wmv2_add_mb(MpegEncContext *s, DCTELEM block[6][64], uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr);
868void ff_mspel_motion(MpegEncContext *s,
869                               uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
870                               uint8_t **ref_picture, op_pixels_func (*pix_op)[4],
871                               int motion_x, int motion_y, int h);
872int ff_wmv2_encode_picture_header(MpegEncContext * s, int picture_number);
873void ff_wmv2_encode_mb(MpegEncContext * s,
874                       DCTELEM block[6][64],
875                       int motion_x, int motion_y);
876
877#endif /* AVCODEC_MPEGVIDEO_H */
878
879