mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
501 lines
19 KiB
501 lines
19 KiB
/* |
|
* Generic DCT based hybrid video encoder |
|
* Copyright (c) 2000,2001 Gerard Lantau. |
|
* |
|
* This program is free software; you can redistribute it and/or modify |
|
* it under the terms of the GNU General Public License as published by |
|
* the Free Software Foundation; either version 2 of the License, or |
|
* (at your option) any later version. |
|
* |
|
* This program is distributed in the hope that it will be useful, |
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
|
* GNU General Public License for more details. |
|
* |
|
* You should have received a copy of the GNU General Public License |
|
* along with this program; if not, write to the Free Software |
|
* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. |
|
*/ |
|
|
|
/* Macros for picture code type. */ |
|
#define I_TYPE 1 |
|
#define P_TYPE 2 |
|
#define B_TYPE 3 |
|
#define S_TYPE 4 //S(GMC)-VOP MPEG4 |
|
|
|
#define FRAME_SKIPED 100 // return value for header parsers if frame is not coded |
|
|
|
enum OutputFormat { |
|
FMT_MPEG1, |
|
FMT_H263, |
|
FMT_MJPEG, |
|
}; |
|
|
|
#define MPEG_BUF_SIZE (16 * 1024) |
|
|
|
#define QMAT_SHIFT_MMX 19 |
|
#define QMAT_SHIFT 25 |
|
|
|
#define MAX_FCODE 7 |
|
#define MAX_MV 2048 |
|
#define REORDER_BUFFER_SIZE (FF_MAX_B_FRAMES+2) |
|
|
|
typedef struct Predictor{ |
|
double coeff; |
|
double count; |
|
double decay; |
|
} Predictor; |
|
|
|
typedef struct RateControlEntry{ |
|
int pict_type; |
|
int qscale; |
|
int mv_bits; |
|
int i_tex_bits; |
|
int p_tex_bits; |
|
int misc_bits; |
|
uint64_t expected_bits; |
|
int new_pict_type; |
|
float new_qscale; |
|
}RateControlEntry; |
|
|
|
typedef struct RateControlContext{ |
|
FILE *stats_file; |
|
int num_entries; |
|
RateControlEntry *entry; |
|
}RateControlContext; |
|
|
|
typedef struct ReorderBuffer{ |
|
UINT8 *picture[3]; |
|
int pict_type; |
|
int qscale; |
|
int force_type; |
|
int picture_number; |
|
int picture_in_gop_number; |
|
} ReorderBuffer; |
|
|
|
typedef struct MpegEncContext { |
|
struct AVCodecContext *avctx; |
|
/* the following parameters must be initialized before encoding */ |
|
int width, height; /* picture size. must be a multiple of 16 */ |
|
int gop_size; |
|
int frame_rate; /* number of frames per second */ |
|
int intra_only; /* if true, only intra pictures are generated */ |
|
int bit_rate; /* wanted bit rate */ |
|
int bit_rate_tolerance; /* amount of +- bits (>0)*/ |
|
enum OutputFormat out_format; /* output format */ |
|
int h263_plus; /* h263 plus headers */ |
|
int h263_rv10; /* use RV10 variation for H263 */ |
|
int h263_pred; /* use mpeg4/h263 ac/dc predictions */ |
|
int h263_msmpeg4; /* generate MSMPEG4 compatible stream */ |
|
int h263_intel; /* use I263 intel h263 header */ |
|
int fixed_qscale; /* fixed qscale if non zero */ |
|
float qcompress; /* amount of qscale change between easy & hard scenes (0.0-1.0) */ |
|
float qblur; /* amount of qscale smoothing over time (0.0-1.0) */ |
|
int qmin; /* min qscale */ |
|
int qmax; /* max qscale */ |
|
int max_qdiff; /* max qscale difference between frames */ |
|
int encoding; /* true if we are encoding (vs decoding) */ |
|
int flags; /* AVCodecContext.flags (HQ, MV4, ...) */ |
|
int force_input_type;/* 0= no force, otherwise I_TYPE, P_TYPE, ... */ |
|
int max_b_frames; /* max number of b-frames for encoding */ |
|
float b_quant_factor;/* qscale factor between ips and b frames */ |
|
int rc_strategy; |
|
int b_frame_strategy; |
|
/* the following fields are managed internally by the encoder */ |
|
|
|
/* bit output */ |
|
PutBitContext pb; |
|
|
|
/* sequence parameters */ |
|
int context_initialized; |
|
int input_picture_number; |
|
int input_picture_in_gop_number; /* 0-> first pic in gop, ... */ |
|
int picture_number; |
|
int fake_picture_number; /* picture number at the bitstream frame rate */ |
|
int gop_picture_number; /* index of the first picture of a GOP based on fake_pic_num & mpeg1 specific */ |
|
int picture_in_gop_number; /* 0-> first pic in gop, ... */ |
|
int b_frames_since_non_b; /* used for encoding, relative to not yet reordered input */ |
|
int mb_width, mb_height; /* number of MBs horizontally & vertically */ |
|
int mb_num; /* number of MBs of a picture */ |
|
int linesize; /* line size, in bytes, may be different from width */ |
|
UINT8 *new_picture[3]; /* picture to be compressed */ |
|
UINT8 *picture_buffer[REORDER_BUFFER_SIZE][3]; /* internal buffers used for reordering of input pictures */ |
|
int picture_buffer_index; |
|
ReorderBuffer coded_order[REORDER_BUFFER_SIZE]; |
|
UINT8 *last_picture[3]; /* previous picture */ |
|
UINT8 *last_picture_base[3]; /* real start of the picture */ |
|
UINT8 *next_picture[3]; /* previous picture (for bidir pred) */ |
|
UINT8 *next_picture_base[3]; /* real start of the picture */ |
|
UINT8 *aux_picture[3]; /* aux picture (for B frames only) */ |
|
UINT8 *aux_picture_base[3]; /* real start of the picture */ |
|
UINT8 *current_picture[3]; /* buffer to store the decompressed current picture */ |
|
int last_dc[3]; /* last DC values for MPEG1 */ |
|
INT16 *dc_val[3]; /* used for mpeg4 DC prediction, all 3 arrays must be continuous */ |
|
int y_dc_scale, c_dc_scale; |
|
UINT8 *coded_block; /* used for coded block pattern prediction (msmpeg4v3, wmv1)*/ |
|
INT16 (*ac_val[3])[16]; /* used for for mpeg4 AC prediction, all 3 arrays must be continuous */ |
|
int ac_pred; |
|
int mb_skiped; /* MUST BE SET only during DECODING */ |
|
UINT8 *mbskip_table; /* used to avoid copy if macroblock skipped (for black regions for example) |
|
and used for b-frame encoding & decoding (contains skip table of next P Frame) */ |
|
UINT8 *mbintra_table; /* used to avoid setting {ac, dc, cbp}-pred stuff to zero on inter MB decoding */ |
|
|
|
int input_qscale; /* qscale prior to reordering of frames */ |
|
int input_pict_type; /* pict_type prior to reordering of frames */ |
|
int force_type; /* 0= no force, otherwise I_TYPE, P_TYPE, ... */ |
|
int qscale; /* QP */ |
|
int last_non_b_qscale; /* QP of last non b frame used for b frame qscale*/ |
|
int pict_type; /* I_TYPE, P_TYPE, B_TYPE, ... */ |
|
int last_non_b_pict_type; /* used for mpeg4 gmc b-frames & ratecontrol */ |
|
int frame_rate_index; |
|
/* motion compensation */ |
|
int unrestricted_mv; |
|
int h263_long_vectors; /* use horrible h263v1 long vector mode */ |
|
|
|
int f_code; /* forward MV resolution */ |
|
int b_code; /* backward MV resolution for B Frames (mpeg4) */ |
|
INT16 (*motion_val)[2]; /* used for MV prediction (4MV per MB) */ |
|
INT16 (*p_mv_table)[2]; /* MV table (1MV per MB) p-frame encoding */ |
|
INT16 (*last_p_mv_table)[2]; /* MV table (1MV per MB) p-frame encoding */ |
|
INT16 (*b_forw_mv_table)[2]; /* MV table (1MV per MB) forward mode b-frame encoding */ |
|
INT16 (*b_back_mv_table)[2]; /* MV table (1MV per MB) backward mode b-frame encoding */ |
|
INT16 (*b_bidir_forw_mv_table)[2]; /* MV table (1MV per MB) bidir mode b-frame encoding */ |
|
INT16 (*b_bidir_back_mv_table)[2]; /* MV table (1MV per MB) bidir mode b-frame encoding */ |
|
INT16 (*b_direct_forw_mv_table)[2];/* MV table (1MV per MB) direct mode b-frame encoding */ |
|
INT16 (*b_direct_back_mv_table)[2];/* MV table (1MV per MB) direct mode b-frame encoding */ |
|
INT16 (*b_direct_mv_table)[2]; /* MV table (1MV per MB) direct mode b-frame encoding */ |
|
int me_method; /* ME algorithm */ |
|
uint8_t *me_scratchpad; /* data area for the me algo, so that the ME doesnt need to malloc/free */ |
|
int mv_dir; |
|
#define MV_DIR_BACKWARD 1 |
|
#define MV_DIR_FORWARD 2 |
|
#define MV_DIRECT 4 // bidirectional mode where the difference equals the MV of the last P/S/I-Frame (mpeg4) |
|
int mv_type; |
|
#define MV_TYPE_16X16 0 /* 1 vector for the whole mb */ |
|
#define MV_TYPE_8X8 1 /* 4 vectors (h263, mpeg4 4MV) */ |
|
#define MV_TYPE_16X8 2 /* 2 vectors, one per 16x8 block */ |
|
#define MV_TYPE_FIELD 3 /* 2 vectors, one per field */ |
|
#define MV_TYPE_DMV 4 /* 2 vectors, special mpeg2 Dual Prime Vectors */ |
|
/* motion vectors for a macroblock |
|
first coordinate : 0 = forward 1 = backward |
|
second " : depend on type |
|
third " : 0 = x, 1 = y |
|
*/ |
|
int mv[2][4][2]; |
|
int field_select[2][2]; |
|
int last_mv[2][2][2]; /* last MV, used for MV prediction in MPEG1 & B-frame MPEG4 */ |
|
UINT16 (*mv_penalty)[MAX_MV*2+1]; /* amount of bits needed to encode a MV, used for ME */ |
|
UINT8 *fcode_tab; /* smallest fcode needed for each MV */ |
|
|
|
int has_b_frames; |
|
int no_rounding; /* apply no rounding to motion compensation (MPEG4, msmpeg4, ...) |
|
for b-frames rounding mode is allways 0 */ |
|
|
|
/* macroblock layer */ |
|
int mb_x, mb_y; |
|
int mb_incr; |
|
int mb_intra; |
|
UINT16 *mb_var; /* Table for MB variances */ |
|
UINT8 *mb_type; /* Table for MB type */ |
|
#define MB_TYPE_INTRA 0x01 |
|
#define MB_TYPE_INTER 0x02 |
|
#define MB_TYPE_INTER4V 0x04 |
|
#define MB_TYPE_SKIPED 0x08 |
|
#define MB_TYPE_DIRECT 0x10 |
|
#define MB_TYPE_FORWARD 0x20 |
|
#define MB_TYPE_BACKWARD 0x40 |
|
#define MB_TYPE_BIDIR 0x80 |
|
|
|
int block_index[6]; /* index to current MB in block based arrays with edges*/ |
|
int block_wrap[6]; |
|
|
|
/* matrix transmitted in the bitstream */ |
|
UINT16 intra_matrix[64]; |
|
UINT16 chroma_intra_matrix[64]; |
|
UINT16 non_intra_matrix[64]; |
|
UINT16 chroma_non_intra_matrix[64]; |
|
/* precomputed matrix (combine qscale and DCT renorm) */ |
|
int q_intra_matrix[64]; |
|
int q_non_intra_matrix[64]; |
|
/* identical to the above but for MMX & these are not permutated */ |
|
UINT16 __align8 q_intra_matrix16[64]; |
|
UINT16 __align8 q_non_intra_matrix16[64]; |
|
int block_last_index[6]; /* last non zero coefficient in block */ |
|
|
|
void *opaque; /* private data for the user */ |
|
|
|
/* bit rate control */ |
|
int I_frame_bits; //FIXME used in mpeg12 ... |
|
int avg_mb_var; /* average MB variance for current frame */ |
|
int mc_mb_var; /* motion compensated MB variance for current frame */ |
|
int last_non_b_mc_mb_var;/* motion compensated MB variance for last non b frame */ |
|
INT64 wanted_bits; |
|
INT64 total_bits; |
|
int frame_bits; /* bits used for the current frame */ |
|
int pb_frame_bits; /* bits of the last b...bp group */ |
|
Predictor i_pred; |
|
Predictor p_pred; |
|
double qsum; /* sum of qscales */ |
|
double qcount; /* count of qscales */ |
|
double short_term_qsum; /* sum of recent qscales */ |
|
double short_term_qcount; /* count of recent qscales */ |
|
RateControlContext rc_context; |
|
|
|
/* statistics, used for 2-pass encoding */ |
|
int mv_bits; |
|
int header_bits; |
|
int i_tex_bits; |
|
int p_tex_bits; |
|
int i_count; |
|
int p_count; |
|
int skip_count; |
|
int misc_bits; // cbp, mb_type |
|
int last_bits; //temp var used for calculating the above vars |
|
|
|
/* H.263 specific */ |
|
int gob_number; |
|
int gob_index; |
|
int first_gob_line; |
|
|
|
/* H.263+ specific */ |
|
int umvplus; |
|
int umvplus_dec; |
|
int h263_aic; /* Advanded INTRA Coding (AIC) */ |
|
int h263_aic_dir; /* AIC direction: 0 = left, 1 = top */ |
|
|
|
/* mpeg4 specific */ |
|
int time_increment_resolution; |
|
int time_increment_bits; /* number of bits to represent the fractional part of time */ |
|
int last_time_base; |
|
int time_base; /* time in seconds of last I,P,S Frame */ |
|
int64_t time; /* time of current frame */ |
|
int64_t last_non_b_time; |
|
uint16_t pp_time; /* time distance between the last 2 p,s,i frames */ |
|
uint16_t bp_time; /* time distance between the last b and p,s,i frame */ |
|
int shape; |
|
int vol_sprite_usage; |
|
int sprite_width; |
|
int sprite_height; |
|
int sprite_left; |
|
int sprite_top; |
|
int sprite_brightness_change; |
|
int num_sprite_warping_points; |
|
int real_sprite_warping_points; |
|
int sprite_offset[2][2]; |
|
int sprite_delta[2][2][2]; |
|
int sprite_shift[2][2]; |
|
int mcsel; |
|
int quant_precision; |
|
int quarter_sample; /* 1->qpel, 0->half pel ME/MC */ |
|
int scalability; |
|
int new_pred; |
|
int reduced_res_vop; |
|
int aspect_ratio_info; |
|
int sprite_warping_accuracy; |
|
int low_latency_sprite; |
|
int data_partioning; |
|
int resync_marker; |
|
int resync_x_pos; |
|
int low_delay; /* no reordering needed / has no b-frames */ |
|
int vo_type; |
|
|
|
/* divx specific, used to workaround (many) bugs in divx5 */ |
|
int divx_version; |
|
int divx_build; |
|
#define BITSTREAM_BUFFER_SIZE 1024*256 |
|
uint8_t *bitstream_buffer; //Divx 5.01 puts several frames in a single one, this is used to reorder them |
|
int bitstream_buffer_size; |
|
|
|
/* RV10 specific */ |
|
int rv10_version; /* RV10 version: 0 or 3 */ |
|
int rv10_first_dc_coded[3]; |
|
|
|
/* MJPEG specific */ |
|
struct MJpegContext *mjpeg_ctx; |
|
int mjpeg_vsample[3]; /* vertical sampling factors, default = {2, 1, 1} */ |
|
int mjpeg_hsample[3]; /* horizontal sampling factors, default = {2, 1, 1} */ |
|
int mjpeg_write_tables; /* do we want to have quantisation- and |
|
huffmantables in the jpeg file ? */ |
|
|
|
/* MSMPEG4 specific */ |
|
int mv_table_index; |
|
int rl_table_index; |
|
int rl_chroma_table_index; |
|
int dc_table_index; |
|
int use_skip_mb_code; |
|
int slice_height; /* in macroblocks */ |
|
int first_slice_line; /* used in mpeg4 too to handle resync markers */ |
|
int flipflop_rounding; |
|
int bitrate; |
|
int msmpeg4_version; /* 1=mp41, 2=mp42, 3=mp43/divx3 */ |
|
/* decompression specific */ |
|
GetBitContext gb; |
|
|
|
/* MPEG2 specific - I wish I had not to support this mess. */ |
|
int progressive_sequence; |
|
int mpeg_f_code[2][2]; |
|
int picture_structure; |
|
/* picture type */ |
|
#define PICT_TOP_FIELD 1 |
|
#define PICT_BOTTOM_FIELD 2 |
|
#define PICT_FRAME 3 |
|
|
|
int intra_dc_precision; |
|
int frame_pred_frame_dct; |
|
int top_field_first; |
|
int concealment_motion_vectors; |
|
int q_scale_type; |
|
int intra_vlc_format; |
|
int alternate_scan; |
|
int repeat_first_field; |
|
int chroma_420_type; |
|
int progressive_frame; |
|
int mpeg2; |
|
int full_pel[2]; |
|
int interlaced_dct; |
|
int last_qscale; |
|
int first_slice; |
|
|
|
/* RTP specific */ |
|
/* These are explained on avcodec.h */ |
|
int rtp_mode; |
|
int rtp_payload_size; |
|
void (*rtp_callback)(void *data, int size, int packet_number); |
|
UINT8 *ptr_lastgob; |
|
UINT8 *ptr_last_mb_line; |
|
UINT32 mb_line_avgsize; |
|
|
|
DCTELEM (*block)[64]; /* points to one of the following blocks */ |
|
DCTELEM blocks[2][6][64] __align8; // for HQ mode we need to keep the best block |
|
void (*dct_unquantize_mpeg1)(struct MpegEncContext *s, |
|
DCTELEM *block, int n, int qscale); |
|
void (*dct_unquantize_mpeg2)(struct MpegEncContext *s, |
|
DCTELEM *block, int n, int qscale); |
|
void (*dct_unquantize_h263)(struct MpegEncContext *s, |
|
DCTELEM *block, int n, int qscale); |
|
void (*dct_unquantize)(struct MpegEncContext *s, // unquantizer to use (mpeg4 can use both) |
|
DCTELEM *block, int n, int qscale); |
|
} MpegEncContext; |
|
|
|
int MPV_common_init(MpegEncContext *s); |
|
void MPV_common_end(MpegEncContext *s); |
|
void MPV_decode_mb(MpegEncContext *s, DCTELEM block[6][64]); |
|
void MPV_frame_start(MpegEncContext *s); |
|
void MPV_frame_end(MpegEncContext *s); |
|
#ifdef HAVE_MMX |
|
void MPV_common_init_mmx(MpegEncContext *s); |
|
#endif |
|
|
|
/* motion_est.c */ |
|
void ff_estimate_p_frame_motion(MpegEncContext * s, |
|
int mb_x, int mb_y); |
|
void ff_estimate_b_frame_motion(MpegEncContext * s, |
|
int mb_x, int mb_y); |
|
int ff_get_best_fcode(MpegEncContext * s, int16_t (*mv_table)[2], int type); |
|
void ff_fix_long_p_mvs(MpegEncContext * s); |
|
void ff_fix_long_b_mvs(MpegEncContext * s, int16_t (*mv_table)[2], int f_code, int type); |
|
|
|
/* mpeg12.c */ |
|
extern INT16 default_intra_matrix[64]; |
|
extern INT16 default_non_intra_matrix[64]; |
|
|
|
void mpeg1_encode_picture_header(MpegEncContext *s, int picture_number); |
|
void mpeg1_encode_mb(MpegEncContext *s, |
|
DCTELEM block[6][64], |
|
int motion_x, int motion_y); |
|
void mpeg1_encode_init(MpegEncContext *s); |
|
|
|
/* h263enc.c */ |
|
|
|
/* run length table */ |
|
#define MAX_RUN 64 |
|
#define MAX_LEVEL 64 |
|
|
|
typedef struct RLTable { |
|
int n; /* number of entries of table_vlc minus 1 */ |
|
int last; /* number of values for last = 0 */ |
|
const UINT16 (*table_vlc)[2]; |
|
const INT8 *table_run; |
|
const INT8 *table_level; |
|
UINT8 *index_run[2]; /* encoding only */ |
|
INT8 *max_level[2]; /* encoding & decoding */ |
|
INT8 *max_run[2]; /* encoding & decoding */ |
|
VLC vlc; /* decoding only */ |
|
} RLTable; |
|
|
|
void init_rl(RLTable *rl); |
|
void init_vlc_rl(RLTable *rl); |
|
|
|
static inline int get_rl_index(const RLTable *rl, int last, int run, int level) |
|
{ |
|
int index; |
|
index = rl->index_run[last][run]; |
|
if (index >= rl->n) |
|
return rl->n; |
|
if (level > rl->max_level[last][run]) |
|
return rl->n; |
|
return index + level - 1; |
|
} |
|
|
|
void h263_encode_mb(MpegEncContext *s, |
|
DCTELEM block[6][64], |
|
int motion_x, int motion_y); |
|
void mpeg4_encode_mb(MpegEncContext *s, |
|
DCTELEM block[6][64], |
|
int motion_x, int motion_y); |
|
void h263_encode_picture_header(MpegEncContext *s, int picture_number); |
|
int h263_encode_gob_header(MpegEncContext * s, int mb_line); |
|
void h263_dc_scale(MpegEncContext *s); |
|
INT16 *h263_pred_motion(MpegEncContext * s, int block, |
|
int *px, int *py); |
|
void mpeg4_pred_ac(MpegEncContext * s, INT16 *block, int n, |
|
int dir); |
|
void ff_set_mpeg4_time(MpegEncContext * s, int picture_number); |
|
void mpeg4_encode_picture_header(MpegEncContext *s, int picture_number); |
|
void h263_encode_init(MpegEncContext *s); |
|
|
|
void h263_decode_init_vlc(MpegEncContext *s); |
|
int h263_decode_picture_header(MpegEncContext *s); |
|
int h263_decode_gob_header(MpegEncContext *s); |
|
int mpeg4_decode_picture_header(MpegEncContext * s); |
|
int intel_h263_decode_picture_header(MpegEncContext *s); |
|
int h263_decode_mb(MpegEncContext *s, |
|
DCTELEM block[6][64]); |
|
int h263_get_picture_format(int width, int height); |
|
|
|
/* rv10.c */ |
|
void rv10_encode_picture_header(MpegEncContext *s, int picture_number); |
|
int rv_decode_dc(MpegEncContext *s, int n); |
|
|
|
/* msmpeg4.c */ |
|
void msmpeg4_encode_picture_header(MpegEncContext * s, int picture_number); |
|
void msmpeg4_encode_ext_header(MpegEncContext * s); |
|
void msmpeg4_encode_mb(MpegEncContext * s, |
|
DCTELEM block[6][64], |
|
int motion_x, int motion_y); |
|
void msmpeg4_dc_scale(MpegEncContext * s); |
|
int msmpeg4_decode_picture_header(MpegEncContext * s); |
|
int msmpeg4_decode_ext_header(MpegEncContext * s, int buf_size); |
|
int msmpeg4_decode_mb(MpegEncContext *s, |
|
DCTELEM block[6][64]); |
|
int msmpeg4_decode_init_vlc(MpegEncContext *s); |
|
|
|
/* mjpegenc.c */ |
|
|
|
int mjpeg_init(MpegEncContext *s); |
|
void mjpeg_close(MpegEncContext *s); |
|
void mjpeg_encode_mb(MpegEncContext *s, |
|
DCTELEM block[6][64]); |
|
void mjpeg_picture_header(MpegEncContext *s); |
|
void mjpeg_picture_trailer(MpegEncContext *s); |
|
|
|
/* rate control */ |
|
int ff_rate_control_init(MpegEncContext *s); |
|
int ff_rate_estimate_qscale(MpegEncContext *s); |
|
int ff_rate_estimate_qscale_pass2(MpegEncContext *s); |
|
void ff_write_pass1_stats(MpegEncContext *s); |
|
void ff_rate_control_uninit(MpegEncContext *s); |
|
|
|
|
|
|
|
|
|
|