2 * Generic DCT based hybrid video encoder
3 * Copyright (c) 2000,2001 Gerard Lantau.
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
15 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software
17 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
20 /* Macros for picture code type. */
24 #define S_TYPE 4 //S(GMC)-VOP MPEG4
32 #define MPEG_BUF_SIZE (16 * 1024)
34 #define QMAT_SHIFT_MMX 19
37 typedef struct MpegEncContext {
38 struct AVCodecContext *avctx;
39 /* the following parameters must be initialized before encoding */
40 int width, height; /* picture size. must be a multiple of 16 */
42 int frame_rate; /* number of frames per second */
43 int intra_only; /* if true, only intra pictures are generated */
44 int bit_rate; /* wanted bit rate */
45 enum OutputFormat out_format; /* output format */
46 int h263_plus; /* h263 plus headers */
47 int h263_rv10; /* use RV10 variation for H263 */
48 int h263_pred; /* use mpeg4/h263 ac/dc predictions */
49 int h263_msmpeg4; /* generate MSMPEG4 compatible stream */
50 int h263_intel; /* use I263 intel h263 header */
51 int fixed_qscale; /* fixed qscale if non zero */
52 int encoding; /* true if we are encoding (vs decoding) */
53 /* the following fields are managed internally by the encoder */
58 /* sequence parameters */
59 int context_initialized;
61 int fake_picture_number; /* picture number at the bitstream frame rate */
62 int gop_picture_number; /* index of the first picture of a GOP */
63 int mb_width, mb_height;
64 int mb_num; /* number of MBs of a picture */
65 int linesize; /* line size, in bytes, may be different from width */
66 UINT8 *new_picture[3]; /* picture to be compressed */
67 UINT8 *last_picture[3]; /* previous picture */
68 UINT8 *last_picture_base[3]; /* real start of the picture */
69 UINT8 *next_picture[3]; /* next picture (for bidir pred) */
70 UINT8 *next_picture_base[3]; /* real start of the picture */
71 UINT8 *aux_picture[3]; /* aux picture (for B frames only) */
72 UINT8 *aux_picture_base[3]; /* real start of the picture */
73 UINT8 *current_picture[3]; /* buffer to store the decompressed current picture */
74 int last_dc[3]; /* last DC values for MPEG1 */
75 INT16 *dc_val[3]; /* used for mpeg4 DC prediction */
76 int y_dc_scale, c_dc_scale;
77 UINT8 *coded_block; /* used for coded block pattern prediction */
78 INT16 (*ac_val[3])[16]; /* used for mpeg4 AC prediction */
80 int mb_skiped; /* MUST BE SET only during DECODING */
81 UINT8 *mbskip_table; /* used to avoid copy if macroblock
82 skipped (for black regions for example) */
83 UINT8 *mbintra_table; /* used to kill a few memsets */
87 int last_non_b_pict_type; /* used for mpeg4 gmc b-frames */
89 /* motion compensation */
91 int h263_long_vectors; /* use horrible h263v1 long vector mode */
93 int f_code; /* resolution */
94 int b_code; /* backward resolution for B Frames (mpeg4) */
95 INT16 *mv_table[2]; /* MV table (1MV per MB)*/
96 INT16 (*motion_val)[2]; /* used for MV prediction (4MV per MB)*/
99 #define MV_DIR_BACKWARD 1
100 #define MV_DIR_FORWARD 2
101 #define MV_DIRECT 4 // bidirectional mode where the difference equals the MV of the last P/S/I-Frame (mpeg4)
103 #define MV_TYPE_16X16 0 /* 1 vector for the whole mb */
104 #define MV_TYPE_8X8 1 /* 4 vectors (h263) */
105 #define MV_TYPE_16X8 2 /* 2 vectors, one per 16x8 block */
106 #define MV_TYPE_FIELD 3 /* 2 vectors, one per field */
107 #define MV_TYPE_DMV 4 /* 2 vectors, special mpeg2 Dual Prime Vectors */
108 /* motion vectors for a macroblock
109 first coordinate : 0 = forward 1 = backward
110 second " : depends on type
111 third " : 0 = x, 1 = y
114 int field_select[2][2];
115 int last_mv[2][2][2];
118 int no_rounding; /* apply no rounding to motion estimation (MPEG4) */
120 /* macroblock layer */
124 INT16 *mb_var; /* Table for MB variances */
125 char *mb_type; /* Table for MB type */
127 /* matrix transmitted in the bitstream */
128 UINT16 intra_matrix[64];
129 UINT16 chroma_intra_matrix[64];
130 UINT16 non_intra_matrix[64];
131 UINT16 chroma_non_intra_matrix[64];
132 /* precomputed matrix (combine qscale and DCT renorm) */
133 int q_intra_matrix[64];
134 int q_non_intra_matrix[64];
135 /* identical to the above, but for MMX; these are not permuted */
136 UINT16 __align8 q_intra_matrix16[64] ;
137 UINT16 __align8 q_non_intra_matrix16[64];
138 int block_last_index[6]; /* last non zero coefficient in block */
140 void *opaque; /* private data for the user */
142 /* bit rate control */
143 int I_frame_bits; /* wanted number of bits per I frame */
144 int P_frame_bits; /* same for P frame */
145 int avg_mb_var; /* average MB variance for current frame */
154 /* H.263+ specific */
157 int h263_aic; /* Advanced INTRA Coding (AIC) */
158 int h263_aic_dir; /* AIC direction: 0 = left, 1 = top */
161 int time_increment_resolution;
162 int time_increment_bits;
166 int last_non_b_time[2];
168 int vol_sprite_usage;
173 int sprite_brightness_change;
174 int num_sprite_warping_points;
175 int real_sprite_warping_points;
176 int sprite_offset[2][2];
177 int sprite_delta[2][2][2];
178 int sprite_shift[2][2];
185 int aspect_ratio_info;
186 int sprite_warping_accuracy;
187 int low_latency_sprite;
190 /* divx specific, used to work around (many) bugs in divx5 */
195 int rv10_version; /* RV10 version: 0 or 3 */
196 int rv10_first_dc_coded[3];
199 struct MJpegContext *mjpeg_ctx;
200 int mjpeg_vsample[3]; /* vertical sampling factors, default = {2, 1, 1} */
201 int mjpeg_hsample[3]; /* horizontal sampling factors, default = {2, 1, 1} */
202 int mjpeg_write_tables; /* do we want to have quantisation and
203 Huffman tables in the JPEG file? */
205 /* MSMPEG4 specific */
208 int rl_chroma_table_index;
210 int use_skip_mb_code;
211 int slice_height; /* in macroblocks */
212 int first_slice_line;
213 int flipflop_rounding;
215 /* decompression specific */
218 /* MPEG2 specific - I wish I had not to support this mess. */
219 int progressive_sequence;
220 int mpeg_f_code[2][2];
221 int picture_structure;
223 #define PICT_TOP_FIELD 1
224 #define PICT_BOTTOM_FIELD 2
227 int intra_dc_precision;
228 int frame_pred_frame_dct;
230 int concealment_motion_vectors;
232 int intra_vlc_format;
234 int repeat_first_field;
236 int progressive_frame;
244 /* These are explained in avcodec.h */
246 int rtp_payload_size;
247 void (*rtp_callback)(void *data, int size, int packet_number);
249 UINT8 *ptr_last_mb_line;
250 UINT32 mb_line_avgsize;
252 DCTELEM block[6][64] __align8;
253 void (*dct_unquantize)(struct MpegEncContext *s,
254 DCTELEM *block, int n, int qscale);
257 int MPV_common_init(MpegEncContext *s);
258 void MPV_common_end(MpegEncContext *s);
259 void MPV_decode_mb(MpegEncContext *s, DCTELEM block[6][64]);
260 void MPV_frame_start(MpegEncContext *s);
261 void MPV_frame_end(MpegEncContext *s);
263 void MPV_common_init_mmx(MpegEncContext *s);
268 int estimate_motion(MpegEncContext *s,
270 int *mx_ptr, int *my_ptr);
273 extern INT16 default_intra_matrix[64];
274 extern INT16 default_non_intra_matrix[64];
276 void mpeg1_encode_picture_header(MpegEncContext *s, int picture_number);
277 void mpeg1_encode_mb(MpegEncContext *s,
278 DCTELEM block[6][64],
279 int motion_x, int motion_y);
283 /* run length table */
287 typedef struct RLTable {
288 int n; /* number of entries of table_vlc minus 1 */
289 int last; /* number of values for last = 0 */
290 const UINT16 (*table_vlc)[2];
291 const INT8 *table_run;
292 const INT8 *table_level;
293 UINT8 *index_run[2]; /* encoding only */
294 INT8 *max_level[2]; /* encoding & decoding */
295 INT8 *max_run[2]; /* encoding & decoding */
296 VLC vlc; /* decoding only */
299 void init_rl(RLTable *rl);
300 void init_vlc_rl(RLTable *rl);
302 static inline int get_rl_index(const RLTable *rl, int last, int run, int level)
305 index = rl->index_run[last][run];
308 if (level > rl->max_level[last][run])
310 return index + level - 1;
313 void h263_encode_mb(MpegEncContext *s,
314 DCTELEM block[6][64],
315 int motion_x, int motion_y);
316 void mpeg4_encode_mb(MpegEncContext *s,
317 DCTELEM block[6][64],
318 int motion_x, int motion_y);
319 void h263_encode_picture_header(MpegEncContext *s, int picture_number);
320 int h263_encode_gob_header(MpegEncContext * s, int mb_line);
321 void h263_dc_scale(MpegEncContext *s);
322 INT16 *h263_pred_motion(MpegEncContext * s, int block,
324 void mpeg4_pred_ac(MpegEncContext * s, INT16 *block, int n,
326 void mpeg4_encode_picture_header(MpegEncContext *s, int picture_number);
327 void h263_encode_init_vlc(MpegEncContext *s);
329 void h263_decode_init_vlc(MpegEncContext *s);
330 int h263_decode_picture_header(MpegEncContext *s);
331 int h263_decode_gob_header(MpegEncContext *s);
332 int mpeg4_decode_picture_header(MpegEncContext * s);
333 int intel_h263_decode_picture_header(MpegEncContext *s);
334 int h263_decode_mb(MpegEncContext *s,
335 DCTELEM block[6][64]);
336 int h263_get_picture_format(int width, int height);
339 void rv10_encode_picture_header(MpegEncContext *s, int picture_number);
340 int rv_decode_dc(MpegEncContext *s, int n);
343 void msmpeg4_encode_picture_header(MpegEncContext * s, int picture_number);
344 void msmpeg4_encode_ext_header(MpegEncContext * s);
345 void msmpeg4_encode_mb(MpegEncContext * s,
346 DCTELEM block[6][64],
347 int motion_x, int motion_y);
348 void msmpeg4_dc_scale(MpegEncContext * s);
349 int msmpeg4_decode_picture_header(MpegEncContext * s);
350 int msmpeg4_decode_ext_header(MpegEncContext * s, int buf_size);
351 int msmpeg4_decode_mb(MpegEncContext *s,
352 DCTELEM block[6][64]);
353 int msmpeg4_decode_init_vlc(MpegEncContext *s);
357 int mjpeg_init(MpegEncContext *s);
358 void mjpeg_close(MpegEncContext *s);
359 void mjpeg_encode_mb(MpegEncContext *s,
360 DCTELEM block[6][64]);
361 void mjpeg_picture_header(MpegEncContext *s);
362 void mjpeg_picture_trailer(MpegEncContext *s);