FFmpeg  1.2.4
mpegvideo.h
Go to the documentation of this file.
1 /*
2  * Generic DCT based hybrid video encoder
3  * Copyright (c) 2000, 2001, 2002 Fabrice Bellard
4  * Copyright (c) 2002-2004 Michael Niedermayer
5  *
6  * This file is part of FFmpeg.
7  *
8  * FFmpeg is free software; you can redistribute it and/or
9  * modify it under the terms of the GNU Lesser General Public
10  * License as published by the Free Software Foundation; either
11  * version 2.1 of the License, or (at your option) any later version.
12  *
13  * FFmpeg is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16  * Lesser General Public License for more details.
17  *
18  * You should have received a copy of the GNU Lesser General Public
19  * License along with FFmpeg; if not, write to the Free Software
20  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21  */
22 
28 #ifndef AVCODEC_MPEGVIDEO_H
29 #define AVCODEC_MPEGVIDEO_H
30 
31 #include "avcodec.h"
32 #include "dsputil.h"
33 #include "error_resilience.h"
34 #include "get_bits.h"
35 #include "h264chroma.h"
36 #include "put_bits.h"
37 #include "ratecontrol.h"
38 #include "parser.h"
39 #include "mpeg12data.h"
40 #include "rl.h"
41 #include "videodsp.h"
42 
43 #include "libavutil/opt.h"
44 #include "libavutil/timecode.h"
45 
46 #define FRAME_SKIPPED 100
47 
54 };
55 
56 #define MPEG_BUF_SIZE (16 * 1024)
57 
58 #define QMAT_SHIFT_MMX 16
59 #define QMAT_SHIFT 21
60 
61 #define MAX_FCODE 7
62 #define MAX_MV 4096
63 
64 #define MAX_THREADS 32
65 #define MAX_PICTURE_COUNT 36
66 
67 #define ME_MAP_SIZE 64
68 #define ME_MAP_SHIFT 3
69 #define ME_MAP_MV_BITS 11
70 
71 #define MAX_MB_BYTES (30*16*16*3/8 + 120)
72 
73 #define INPLACE_OFFSET 16
74 
75 /* Start codes. */
76 #define SEQ_END_CODE 0x000001b7
77 #define SEQ_START_CODE 0x000001b3
78 #define GOP_START_CODE 0x000001b8
79 #define PICTURE_START_CODE 0x00000100
80 #define SLICE_MIN_START_CODE 0x00000101
81 #define SLICE_MAX_START_CODE 0x000001af
82 #define EXT_START_CODE 0x000001b5
83 #define USER_START_CODE 0x000001b2
84 
89 #define DELAYED_PIC_REF 4
90 
91 struct MpegEncContext;
92 
96 typedef struct Picture{
97  struct AVFrame f;
98 
100  int16_t (*motion_val_base[2])[2];
101  uint32_t *mb_type_base;
102 #define MB_TYPE_INTRA MB_TYPE_INTRA4x4 //default mb_type if there is just one type
103 #define IS_INTRA4x4(a) ((a)&MB_TYPE_INTRA4x4)
104 #define IS_INTRA16x16(a) ((a)&MB_TYPE_INTRA16x16)
105 #define IS_PCM(a) ((a)&MB_TYPE_INTRA_PCM)
106 #define IS_INTRA(a) ((a)&7)
107 #define IS_INTER(a) ((a)&(MB_TYPE_16x16|MB_TYPE_16x8|MB_TYPE_8x16|MB_TYPE_8x8))
108 #define IS_SKIP(a) ((a)&MB_TYPE_SKIP)
109 #define IS_INTRA_PCM(a) ((a)&MB_TYPE_INTRA_PCM)
110 #define IS_INTERLACED(a) ((a)&MB_TYPE_INTERLACED)
111 #define IS_DIRECT(a) ((a)&MB_TYPE_DIRECT2)
112 #define IS_GMC(a) ((a)&MB_TYPE_GMC)
113 #define IS_16X16(a) ((a)&MB_TYPE_16x16)
114 #define IS_16X8(a) ((a)&MB_TYPE_16x8)
115 #define IS_8X16(a) ((a)&MB_TYPE_8x16)
116 #define IS_8X8(a) ((a)&MB_TYPE_8x8)
117 #define IS_SUB_8X8(a) ((a)&MB_TYPE_16x16) //note reused
118 #define IS_SUB_8X4(a) ((a)&MB_TYPE_16x8) //note reused
119 #define IS_SUB_4X8(a) ((a)&MB_TYPE_8x16) //note reused
120 #define IS_SUB_4X4(a) ((a)&MB_TYPE_8x8) //note reused
121 #define IS_ACPRED(a) ((a)&MB_TYPE_ACPRED)
122 #define IS_QUANT(a) ((a)&MB_TYPE_QUANT)
123 #define IS_DIR(a, part, list) ((a) & (MB_TYPE_P0L0<<((part)+2*(list))))
124 #define USES_LIST(a, list) ((a) & ((MB_TYPE_P0L0|MB_TYPE_P1L0)<<(2*(list))))
125 #define HAS_CBP(a) ((a)&MB_TYPE_CBP)
126 
127  int field_poc[2];
128  int poc;
129  int frame_num;
131  int pic_id;
133  int long_ref;
134  int ref_poc[2][2][32];
135  int ref_count[2][2];
136  int mbaff;
138  int sync;
139 
142  uint16_t *mb_var;
143  uint16_t *mc_mb_var;
145  int b_frame_score; /* */
146  void *owner2;
149 } Picture;
150 
154 typedef struct MotionEstContext{
156  int skip;
157  int co_located_mv[4][2];
158  int direct_basis_mv[4][2];
164  uint32_t *map;
165  uint32_t *score_map;
166  unsigned map_generation;
175  int flags;
177  int mb_flags;
178  int pre_pass;
179  int dia_size;
180  int xmin;
181  int xmax;
182  int ymin;
183  int ymax;
184  int pred_x;
185  int pred_y;
186  uint8_t *src[4][4];
187  uint8_t *ref[4][4];
188  int stride;
189  int uvstride;
190  /* temp variables for picture complexity calculation */
194 /* cmp, chroma_cmp;*/
202  int *mx_ptr, int *my_ptr, int dmin,
203  int src_index, int ref_index,
204  int size, int h);
206 
210 typedef struct MpegEncContext {
211  AVClass *class;
213  /* the following parameters must be initialized before encoding */
214  int width, height;
215  int gop_size;
217  int bit_rate;
219  int h263_pred;
220  int pb_frame;
221 
222 /* the following codec id fields are deprecated in favor of codec_id */
223  int h263_plus;
224  int h263_flv;
225 
226  enum AVCodecID codec_id; /* see AV_CODEC_ID_xxx */
228  int encoding;
229  int flags;
230  int flags2;
236  int codec_tag;
238  /* the following fields are managed internally by the encoder */
239 
240  /* sequence parameters */
244  int picture_number; //FIXME remove, unclear definition
247  int mb_stride;
248  int b8_stride;
249  int b4_stride;
251  int mb_num;
252  int linesize;
257 
259  int ac_pred;
261  int h263_aic;
262 
263  /* scantables */
268 
269  /* WARNING: changes above this line require updates to hardcoded
270  * offsets used in asm. */
271 
273 
276  int64_t dts_delta;
280  int64_t reordered_pts;
281 
284 
286  int end_mb_y;
289 
295 
301 
307 
313 
320  int last_dc[3];
321  int16_t *dc_val_base;
322  int16_t *dc_val[3];
328  int16_t (*ac_val_base)[16];
329  int16_t (*ac_val[3])[16];
340 
341  int qscale;
343  unsigned int lambda;
344  unsigned int lambda2;
347  int dquant;
349  int pict_type;
351  int last_pict_type; //FIXME removes
357  int skipdct;
358 
359  /* motion compensation */
362 
366  int f_code;
367  int b_code;
368  int16_t (*p_mv_table_base)[2];
369  int16_t (*b_forw_mv_table_base)[2];
370  int16_t (*b_back_mv_table_base)[2];
373  int16_t (*b_direct_mv_table_base)[2];
374  int16_t (*p_field_mv_table_base[2][2])[2];
375  int16_t (*b_field_mv_table_base[2][2][2])[2];
376  int16_t (*p_mv_table)[2];
377  int16_t (*b_forw_mv_table)[2];
378  int16_t (*b_back_mv_table)[2];
379  int16_t (*b_bidir_forw_mv_table)[2];
380  int16_t (*b_bidir_back_mv_table)[2];
381  int16_t (*b_direct_mv_table)[2];
382  int16_t (*p_field_mv_table[2][2])[2];
383  int16_t (*b_field_mv_table[2][2][2])[2];
386  int me_method;
387  int mv_dir;
388 #define MV_DIR_FORWARD 1
389 #define MV_DIR_BACKWARD 2
390 #define MV_DIRECT 4
391  int mv_type;
392 #define MV_TYPE_16X16 0
393 #define MV_TYPE_8X8 1
394 #define MV_TYPE_16X8 2
395 #define MV_TYPE_FIELD 3
396 #define MV_TYPE_DMV 4
397 
402  int mv[2][4][2];
403  int field_select[2][2];
404  int last_mv[2][2][2];
406  int16_t direct_scale_mv[2][64];
407 
409 
413  /* macroblock layer */
414  int mb_x, mb_y;
416  int mb_intra;
417  uint16_t *mb_type;
418 #define CANDIDATE_MB_TYPE_INTRA 0x01
419 #define CANDIDATE_MB_TYPE_INTER 0x02
420 #define CANDIDATE_MB_TYPE_INTER4V 0x04
421 #define CANDIDATE_MB_TYPE_SKIPPED 0x08
422 //#define MB_TYPE_GMC 0x10
423 
424 #define CANDIDATE_MB_TYPE_DIRECT 0x10
425 #define CANDIDATE_MB_TYPE_FORWARD 0x20
426 #define CANDIDATE_MB_TYPE_BACKWARD 0x40
427 #define CANDIDATE_MB_TYPE_BIDIR 0x80
428 
429 #define CANDIDATE_MB_TYPE_INTER_I 0x100
430 #define CANDIDATE_MB_TYPE_FORWARD_I 0x200
431 #define CANDIDATE_MB_TYPE_BACKWARD_I 0x400
432 #define CANDIDATE_MB_TYPE_BIDIR_I 0x800
433 
434 #define CANDIDATE_MB_TYPE_DIRECT0 0x1000
435 
436  int block_index[6];
437  int block_wrap[6];
439 
440  int *mb_index2xy;
441 
443  uint16_t intra_matrix[64];
444  uint16_t chroma_intra_matrix[64];
445  uint16_t inter_matrix[64];
446  uint16_t chroma_inter_matrix[64];
447 #define QUANT_BIAS_SHIFT 8
458 #define UNI_AC_ENC_INDEX(run,level) ((run)*128 + (level))
459 
460  int coded_score[12];
461 
463  int (*q_intra_matrix)[64];
465  int (*q_inter_matrix)[64];
467  uint16_t (*q_intra_matrix16)[2][64];
468  uint16_t (*q_chroma_intra_matrix16)[2][64];
469  uint16_t (*q_inter_matrix16)[2][64];
470 
471  /* noise reduction */
472  int (*dct_error_sum)[64];
473  int dct_count[2];
474  uint16_t (*dct_offset)[64];
475 
476  void *opaque;
477 
478  /* bit rate control */
479  int64_t total_bits;
484 
485  /* statistics, used for 2-pass encoding */
486  int mv_bits;
490  int i_count;
491  int f_count;
492  int b_count;
494  int misc_bits;
495  int last_bits;
496 
497  /* error concealment / resync */
504 
506 
507  /* H.263 specific */
509  int obmc;
511  int mb_info;
515 
516  /* H.263+ specific */
517  int umvplus;
524 
525  /* mpeg4 specific */
528  int time_base;
529  int64_t time;
531  uint16_t pp_time;
532  uint16_t pb_time;
533  uint16_t pp_field_time;
534  uint16_t pb_field_time;
535  int shape;
544  uint16_t sprite_traj[4][2];
545  int sprite_offset[2][2];
546  int sprite_delta[2][2];
547  int sprite_shift[2];
548  int mcsel;
554  int new_pred;
556  int aspect_ratio_info; //FIXME remove
561  int rvlc;
563  int low_delay;
564  int vo_type;
571  int t_frame;
576 
577  /* divx specific, used to workaround (many) bugs in divx5 */
581  uint8_t *bitstream_buffer; //Divx 5.01 puts several frames in a single one, this is used to reorder them
584 
586 
587  /* lavc specific stuff, used to workaround bugs in libavcodec */
589 
590  /* RV10 specific */
594 
595  /* MJPEG specific */
597  int mjpeg_vsample[3];
598  int mjpeg_hsample[3];
599  int esc_pos;
600 
601  /* MSMPEG4 specific */
615  int (*ac_stats)[2][MAX_LEVEL+1][MAX_RUN+1][2];
617  int mspel;
618 
619  /* decompression specific */
621 
622  /* Mpeg1 specific */
627 
628  /* MPEG-2-specific - I wished not to have to support this mess. */
630  int mpeg_f_code[2][2];
632 /* picture type */
633 #define PICT_TOP_FIELD 1
634 #define PICT_BOTTOM_FIELD 2
635 #define PICT_FRAME 3
636 
647 #define CHROMA_420 1
648 #define CHROMA_422 2
649 #define CHROMA_444 3
650  int chroma_x_shift;//depend on pix_format, that depend on chroma_format
652 
654  int full_pel[2];
660 
661  /* RTP specific */
662  int rtp_mode;
663 
664  char *tc_opt_str;
666 
668  int swap_uv; //vcr2 codec is an MPEG-2 variant with U and V swapped
669  int16_t (*pblocks[12])[64];
670 
671  int16_t (*block)[64];
672  int16_t (*blocks)[12][64]; // for HQ mode we need to keep the best block
673  int (*decode_mb)(struct MpegEncContext *s, int16_t block[6][64]); // used by some codecs to avoid a switch()
674 #define SLICE_OK 0
675 #define SLICE_ERROR -1
676 #define SLICE_END -2
677 #define SLICE_NOEND -3
678 
680  int16_t *block/*align 16*/, int n, int qscale);
682  int16_t *block/*align 16*/, int n, int qscale);
684  int16_t *block/*align 16*/, int n, int qscale);
686  int16_t *block/*align 16*/, int n, int qscale);
688  int16_t *block/*align 16*/, int n, int qscale);
690  int16_t *block/*align 16*/, int n, int qscale);
692  int16_t *block/*align 16*/, int n, int qscale);
694  int16_t *block/*align 16*/, int n, int qscale);
695  void (*dct_unquantize_intra)(struct MpegEncContext *s, // unquantizer to use (mpeg4 can use both)
696  int16_t *block/*align 16*/, int n, int qscale);
697  void (*dct_unquantize_inter)(struct MpegEncContext *s, // unquantizer to use (mpeg4 can use both)
698  int16_t *block/*align 16*/, int n, int qscale);
699  int (*dct_quantize)(struct MpegEncContext *s, int16_t *block/*align 16*/, int n, int qscale, int *overflow);
700  int (*fast_dct_quantize)(struct MpegEncContext *s, int16_t *block/*align 16*/, int n, int qscale, int *overflow);
701  void (*denoise_dct)(struct MpegEncContext *s, int16_t *block);
702 
703  int mpv_flags;
705 
706  /* temp buffers for rate control */
707  float *cplx_tab, *bits_tab;
708 
709  /* flag to indicate a reinitialization is required, e.g. after
710  * a frame size change */
712 
715 
/**
 * Map a picture pointer that belongs to one context onto the same slot of
 * another context.
 *
 * Yields &new_ctx->picture[i] when pic points at old_ctx->picture[i] with
 * 0 <= i < old_ctx->picture_count, and NULL when pic is NULL or lies outside
 * that array.
 *
 * Every argument is parenthesized in the expansion so that arbitrary
 * expressions (e.g. `*ctx_ptr` or `cond ? a : b`) can be passed safely.
 * pic and old_ctx are evaluated more than once, so the arguments must be
 * free of side effects.
 */
#define REBASE_PICTURE(pic, new_ctx, old_ctx)                          \
    (((pic) && (pic) >= (old_ctx)->picture &&                          \
      (pic) < (old_ctx)->picture + (old_ctx)->picture_count) ?         \
        &(new_ctx)->picture[(pic) - (old_ctx)->picture] : NULL)
720 
/* mpegvideo_enc common options */

/* Bit values accepted by the "mpv_flags" option (stored in mpv_flags). */
#define FF_MPV_FLAG_SKIP_RD    0x0001
#define FF_MPV_FLAG_STRICT_GOP 0x0002
#define FF_MPV_FLAG_QP_RD      0x0004
#define FF_MPV_FLAG_CBP_RD     0x0008

/* Byte offset of field x inside MpegEncContext, for use in AVOption tables. */
#define FF_MPV_OFFSET(x) offsetof(MpegEncContext, x)
/* Option flags shared by every entry below: video + encoding parameter. */
#define FF_MPV_OPT_FLAGS (AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM)
/*
 * AVOption initializer entries common to the mpegvideo-based encoders.
 * Expands to a comma-terminated list meant to be placed inside an
 * AVOption array initializer.
 */
#define FF_MPV_COMMON_OPTS \
{ "mpv_flags", "Flags common for all mpegvideo-based encoders.", FF_MPV_OFFSET(mpv_flags), AV_OPT_TYPE_FLAGS, { .i64 = 0 }, INT_MIN, INT_MAX, FF_MPV_OPT_FLAGS, "mpv_flags" },\
{ "skip_rd", "RD optimal MB level residual skipping", 0, AV_OPT_TYPE_CONST, { .i64 = FF_MPV_FLAG_SKIP_RD }, 0, 0, FF_MPV_OPT_FLAGS, "mpv_flags" },\
{ "strict_gop", "Strictly enforce gop size", 0, AV_OPT_TYPE_CONST, { .i64 = FF_MPV_FLAG_STRICT_GOP }, 0, 0, FF_MPV_OPT_FLAGS, "mpv_flags" },\
{ "qp_rd", "Use rate distortion optimization for qp selection", 0, AV_OPT_TYPE_CONST, { .i64 = FF_MPV_FLAG_QP_RD }, 0, 0, FF_MPV_OPT_FLAGS, "mpv_flags" },\
{ "cbp_rd", "use rate distortion optimization for CBP", 0, AV_OPT_TYPE_CONST, { .i64 = FF_MPV_FLAG_CBP_RD }, 0, 0, FF_MPV_OPT_FLAGS, "mpv_flags" },\
{ "luma_elim_threshold", "single coefficient elimination threshold for luminance (negative values also consider dc coefficient)",\
 FF_MPV_OFFSET(luma_elim_threshold), AV_OPT_TYPE_INT, { .i64 = 0 }, INT_MIN, INT_MAX, FF_MPV_OPT_FLAGS },\
{ "chroma_elim_threshold", "single coefficient elimination threshold for chrominance (negative values also consider dc coefficient)",\
 FF_MPV_OFFSET(chroma_elim_threshold), AV_OPT_TYPE_INT, { .i64 = 0 }, INT_MIN, INT_MAX, FF_MPV_OPT_FLAGS },\
{ "quantizer_noise_shaping", NULL, FF_MPV_OFFSET(quantizer_noise_shaping), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, FF_MPV_OPT_FLAGS },
740 
741 extern const AVOption ff_mpv_generic_options[];
742 
/**
 * Define a file-local AVClass object called <name>_class whose class_name
 * is the string "<name> encoder" and whose option table is
 * ff_mpv_generic_options.
 *
 * The expansion already ends with a semicolon, so the macro is used as a
 * stand-alone line without a trailing ';'.
 */
#define FF_MPV_GENERIC_CLASS(name) \
static const AVClass name ## _class = {\
    .class_name = #name " encoder",\
    .item_name  = av_default_item_name,\
    .option     = ff_mpv_generic_options,\
    .version    = LIBAVUTIL_VERSION_INT,\
};
750 
757 
763 void ff_MPV_decode_mb(MpegEncContext *s, int16_t block[12][64]);
769  AVFrame *frame, int *got_packet);
778  Picture *last, int y, int h, int picture_structure,
779  int first_field, int draw_edges, int low_delay,
780  int v_edge_pos, int h_edge_pos);
781 void ff_mpeg_draw_horiz_band(MpegEncContext *s, int y, int h);
784 void ff_write_quant_matrix(PutBitContext *pb, uint16_t *matrix);
785 void ff_release_unused_pictures(MpegEncContext *s, int remove_current);
786 int ff_find_unused_picture(MpegEncContext *s, int shared);
787 void ff_denoise_dct(MpegEncContext *s, int16_t *block);
792 const uint8_t *avpriv_mpv_find_start_code(const uint8_t *p, const uint8_t *end, uint32_t *state);
793 void ff_set_qscale(MpegEncContext * s, int qscale);
794 
796 
799 void ff_convert_matrix(DSPContext *dsp, int (*qmat)[64], uint16_t (*qmat16)[2][64],
800  const uint16_t *quant_matrix, int bias, int qmin, int qmax, int intra);
801 int ff_dct_quantize_c(MpegEncContext *s, int16_t *block, int n, int qscale, int *overflow);
802 
804 void ff_copy_picture(Picture *dst, Picture *src);
805 
807  uint8_t *dest_y, uint8_t *dest_cb,
808  uint8_t *dest_cr, int dir,
809  uint8_t **ref_picture,
810  op_pixels_func (*pix_op)[4],
811  qpel_mc_func (*qpix_op)[16]);
812 
817 int ff_alloc_picture(MpegEncContext *s, Picture *pic, int shared);
818 
819 extern const enum AVPixelFormat ff_pixfmt_list_420[];
820 
825 void ff_block_permute(int16_t *block, uint8_t *permutation, const uint8_t *scantable, int last);
826 
827 static inline void ff_update_block_index(MpegEncContext *s){
828  const int block_size= 8 >> s->avctx->lowres;
829 
830  s->block_index[0]+=2;
831  s->block_index[1]+=2;
832  s->block_index[2]+=2;
833  s->block_index[3]+=2;
834  s->block_index[4]++;
835  s->block_index[5]++;
836  s->dest[0]+= 2*block_size;
837  s->dest[1]+= block_size;
838  s->dest[2]+= block_size;
839 }
840 
841 static inline int get_bits_diff(MpegEncContext *s){
842  const int bits= put_bits_count(&s->pb);
843  const int last= s->last_bits;
844 
845  s->last_bits = bits;
846 
847  return bits - last;
848 }
849 
/**
 * Reduce x by a factor of 8 with table-driven rounding.
 *
 * The low four bits of x select a rounding term (0 or 1) from a fixed
 * 16-entry table; that term is added to x >> 3.
 *
 * @param x value to be rounded
 * @return  h263_chroma_roundtab[x & 0xf] + (x >> 3)
 */
static inline int ff_h263_round_chroma(int x){
    static const uint8_t h263_chroma_roundtab[16] = {
    //  0  1  2  3  4  5  6  7  8  9 10 11 12 13 14 15
        0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1,
    };
    return h263_chroma_roundtab[x & 0xf] + (x >> 3);
}
857 
858 /* motion_est.c */
860  int mb_x, int mb_y);
862  int mb_x, int mb_y);
863 int ff_get_best_fcode(MpegEncContext * s, int16_t (*mv_table)[2], int type);
865 void ff_fix_long_mvs(MpegEncContext * s, uint8_t *field_select_table, int field_select,
866  int16_t (*mv_table)[2], int f_code, int type, int truncate);
867 int ff_init_me(MpegEncContext *s);
869 int ff_epzs_motion_search(MpegEncContext * s, int *mx_ptr, int *my_ptr,
870  int P[10][2], int src_index, int ref_index, int16_t (*last_mv)[2],
871  int ref_mv_scale, int size, int h);
872 int ff_get_mb_score(MpegEncContext * s, int mx, int my, int src_index,
873  int ref_index, int size, int h, int add_rate);
874 
875 /* mpeg12.c */
876 extern const uint8_t ff_mpeg1_dc_scale_table[128];
877 extern const uint8_t * const ff_mpeg2_dc_scale_table[4];
878 
881  int16_t block[6][64],
882  int motion_x, int motion_y);
886 int ff_mpeg1_find_frame_end(ParseContext *pc, const uint8_t *buf, int buf_size, AVCodecParserContext *s);
887 
888 extern const uint8_t ff_aic_dc_scale_table[32];
889 extern const uint8_t ff_h263_chroma_qscale_table[32];
890 extern const uint8_t ff_h263_loop_filter_strength[32];
891 
892 /* h261.c */
896  int16_t block[6][64],
897  int motion_x, int motion_y);
901 
902 
903 /* rv10.c */
905 int ff_rv_decode_dc(MpegEncContext *s, int n);
907 
908 
909 /* msmpeg4.c */
913  int16_t block[6][64],
914  int motion_x, int motion_y);
916 int ff_msmpeg4_decode_ext_header(MpegEncContext * s, int buf_size);
921 void ff_wmv2_add_mb(MpegEncContext *s, int16_t block[6][64], uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr);
923  uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
924  uint8_t **ref_picture, op_pixels_func (*pix_op)[4],
925  int motion_x, int motion_y, int h);
928  int16_t block[6][64],
929  int motion_x, int motion_y);
930 
931 #endif /* AVCODEC_MPEGVIDEO_H */