2 * VC-1 and WMV3 decoder
3 * Copyright (c) 2006-2007 Konstantin Shishkov
4 * Partly based on vc9.c (c) 2005 Anonymous, Alex Beregszaszi, Michael Niedermayer
6 * This file is part of Libav.
8 * Libav is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
13 * Libav is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with Libav; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
27 #include "h264chroma.h"
28 #include "mpegvideo.h"
34 /** Markers used in VC-1 AP frame data */
37 VC1_CODE_RES0 = 0x00000100,
38 VC1_CODE_ENDOFSEQ = 0x0000010A,
/** True when x, with its low 8 bits cleared, equals VC1_CODE_RES0 (0x00000100), i.e. x has the form 0x000001NN */
47 #define IS_MARKER(x) (((x) & ~0xFF) == VC1_CODE_RES0)
49 /** Available Profiles */
54 PROFILE_COMPLEX, ///< TODO: WMV9 specific
59 /** Sequence quantizer mode */
62 QUANT_FRAME_IMPLICIT, ///< Implicitly specified at frame level
63 QUANT_FRAME_EXPLICIT, ///< Explicitly specified at frame level
64 QUANT_NON_UNIFORM, ///< Non-uniform quant used for all frames
65 QUANT_UNIFORM ///< Uniform quant used for all frames
69 /** Where quant can be changed */
73 DQPROFILE_DOUBLE_EDGES,
74 DQPROFILE_SINGLE_EDGE,
79 /** @name Where quant can be changed
90 /** Which pair of edges is quantized with ALTPQUANT */
93 DQDOUBLE_BEDGE_TOPLEFT,
94 DQDOUBLE_BEDGE_TOPRIGHT,
95 DQDOUBLE_BEDGE_BOTTOMRIGHT,
96 DQDOUBLE_BEDGE_BOTTOMLEFT
100 /** MV modes for P frames */
103 MV_PMODE_1MV_HPEL_BILIN,
107 MV_PMODE_INTENSITY_COMP
111 /** MBMODE for interlaced frame P-picture */
115 MV_PMODE_INTFR_2MV_FIELD,
117 MV_PMODE_INTFR_4MV_FIELD,
119 MV_PMODE_INTFR_INTRA,
123 /** @name MV types for B frames */
128 BMV_TYPE_INTERPOLATED,
133 /** @name Block types for P/B frames */
135 enum TransformTypes {
139 TT_8X4, // both halves
142 TT_4X8, // both halves
148 CS_HIGH_MOT_INTRA = 0,
158 /** @name Overlap conditions for Advanced Profile */
168 * FCM Frame Coding Mode
169 * @note some content might be marked interlaced
170 * but have fcm set to 0 as well (e.g. HD-DVD)
172 enum FrameCodingMode {
173 PROGRESSIVE = 0, ///< in the bitstream is reported as 00b
174 ILACE_FRAME, ///< in the bitstream is reported as 10b
175 ILACE_FIELD ///< in the bitstream is reported as 11b
179 * @todo Change size wherever another size is more efficient
180 * Many members are only used for Advanced Profile
182 typedef struct VC1Context{
185 H264ChromaContext h264chroma;
186 VC1DSPContext vc1dsp;
190 /** Simple/Main Profile sequence header */
192 int res_sprite; ///< reserved, sprite mode
193 int res_y411; ///< reserved, old interlaced mode
194 int res_x8; ///< reserved
195 int multires; ///< frame-level RESPIC syntax element present
196 int res_fasttx; ///< reserved, always 1
197 int res_transtab; ///< reserved, always 0
198 int rangered; ///< RANGEREDFRM (range reduction) syntax element present
200 int res_rtm_flag; ///< reserved, set to 1
201 int reserved; ///< reserved
204 /** Advanced Profile */
206 int level; ///< 3bits, for Advanced/Simple Profile, provided by TS layer
207 int chromaformat; ///< 2bits, 2=4:2:0, only defined
208 int postprocflag; ///< Per-frame processing suggestion flag present
209 int broadcast; ///< TFF/RFF present
210 int interlace; ///< Progressive/interlaced (RPTFTM syntax element)
211 int tfcntrflag; ///< TFCNTR present
212 int panscanflag; ///< NUMPANSCANWIN, TOPLEFT{X,Y}, BOTRIGHT{X,Y} present
213 int refdist_flag; ///< REFDIST syntax element present in II, IP, PI or PP field picture headers
214 int extended_dmv; ///< Additional extended dmv range at P/B frame-level
215 int color_prim; ///< 8bits, chroma coordinates of the color primaries
216 int transfer_char; ///< 8bits, Opto-electronic transfer characteristics
217 int matrix_coef; ///< 8bits, Color primaries->YCbCr transform matrix
218 int hrd_param_flag; ///< Presence of Hypothetical Reference
219 ///< Decoder parameters
220 int psf; ///< Progressive Segmented Frame
223 /** Sequence header data for all Profiles
224 * TODO: choose between ints, uint8_ts and monobit flags
227 int profile; ///< 2bits, Profile
228 int frmrtq_postproc; ///< 3bits,
229 int bitrtq_postproc; ///< 5bits, quantized framerate-based postprocessing strength
230 int fastuvmc; ///< Rounding of qpel vector to hpel ? (not in Simple)
231 int extended_mv; ///< Ext MV in P/B (not in Simple)
232 int dquant; ///< How qscale varies with MBs, 2bits (not in Simple)
233 int vstransform; ///< variable-size [48]x[48] transform type + info
234 int overlap; ///< overlapped transforms in use
235 int quantizer_mode; ///< 2bits, quantizer mode used for sequence, see QUANT_*
236 int finterpflag; ///< INTERPFRM present
239 /** Frame decoding info for all profiles */
241 uint8_t mv_mode; ///< MV coding mode
242 uint8_t mv_mode2; ///< Secondary MV coding mode (B frames)
243 int k_x; ///< Number of bits for MVs (depends on MV range)
244 int k_y; ///< Number of bits for MVs (depends on MV range)
245 int range_x, range_y; ///< MV range
246 uint8_t pq, altpq; ///< Current/alternate frame quantizer scale
247 uint8_t zz_8x8[4][64]; ///< Zigzag table for TT_8x8, permuted for IDCT
248 int left_blk_sh, top_blk_sh; ///< Either 3 or 0, positions of l/t in blk[]
249 const uint8_t* zz_8x4; ///< Zigzag scan table for TT_8x4 coding mode
250 const uint8_t* zz_4x8; ///< Zigzag scan table for TT_4x8 coding mode
251 /** pquant parameters */
258 /** AC coding set indexes
259 * @see 8.1.1.10, p(1)10
262 int c_ac_table_index; ///< Chroma index from ACFRM element
263 int y_ac_table_index; ///< Luma index from AC2FRM element
265 int ttfrm; ///< Transform type info present at frame level
266 uint8_t ttmbf; ///< Transform type flag
267 int *ttblk_base, *ttblk; ///< Transform type at the block level
268 int codingset; ///< index of current table set from 11.8 to use for luma block decoding
269 int codingset2; ///< index of current table set from 11.8 to use for chroma block decoding
270 int pqindex; ///< raw pqindex used in coding set selection
271 int a_avail, c_avail;
272 uint8_t *mb_type_base, *mb_type[3];
275 /** Luma compensation parameters */
280 int16_t bfraction; ///< Relative position % anchors=> how to scale MVs
281 uint8_t halfpq; ///< Uniform quant over image and qp+.5
282 uint8_t respic; ///< Frame-level flag for resized images
283 int buffer_fullness; ///< HRD info
285 * -# 0 -> [-64, 63.f] x [-32, 31.f]
286 * -# 1 -> [-128, 127.f] x [-64, 63.f]
287 * -# 2 -> [-512, 511.f] x [-128, 127.f]
288 * -# 3 -> [-1024, 1023.f] x [-256, 255.f]
290 uint8_t mvrange; ///< Extended MV range flag
291 uint8_t pquantizer; ///< Uniform (over sequence) quantizer in use
292 VLC *cbpcy_vlc; ///< CBPCY VLC table
293 int tt_index; ///< Index for Transform Type tables (to decode TTMB)
294 uint8_t* mv_type_mb_plane; ///< bitplane for mv_type == (4MV)
295 uint8_t* direct_mb_plane; ///< bitplane for "direct" MBs
296 uint8_t* forward_mb_plane; ///< bitplane for "forward" MBs
297 int mv_type_is_raw; ///< mv type mb plane is not coded
298 int dmb_is_raw; ///< direct mb plane is raw
299 int fmb_is_raw; ///< forward mb plane is raw
300 int skip_is_raw; ///< skip mb plane is not coded
301 uint8_t last_luty[2][256], last_lutuv[2][256]; ///< lookup tables used for intensity compensation
302 uint8_t aux_luty[2][256], aux_lutuv[2][256]; ///< lookup tables used for intensity compensation
303 uint8_t next_luty[2][256], next_lutuv[2][256]; ///< lookup tables used for intensity compensation
304 uint8_t (*curr_luty)[256] ,(*curr_lutuv)[256];
305 int last_use_ic, curr_use_ic, next_use_ic, aux_use_ic;
306 int rnd; ///< rounding control
308 /** Frame decoding info for S/M profiles only */
310 uint8_t rangeredfrm; ///< out_sample = CLIP((in_sample-128)*2+128)
314 /** Frame decoding info for Advanced profile */
316 enum FrameCodingMode fcm;
317 uint8_t numpanscanwin;
319 uint8_t rptfrm, tff, rff;
322 uint16_t bottomrightx;
323 uint16_t bottomrighty;
326 int hrd_num_leaky_buckets;
327 uint8_t bit_rate_exponent;
328 uint8_t buffer_size_exponent;
329 uint8_t* acpred_plane; ///< AC prediction flags bitplane
331 uint8_t* over_flags_plane; ///< Overflags bitplane
334 uint16_t *hrd_rate, *hrd_buffer;
335 uint8_t *hrd_fullness;
336 uint8_t range_mapy_flag;
337 uint8_t range_mapuv_flag;
342 /** Frame decoding info for interlaced picture */
343 uint8_t dmvrange; ///< Extended differential MV range flag
346 uint8_t lumscale2; ///< for interlaced field P picture
354 uint8_t* fieldtx_plane;
357 uint8_t *blk_mv_type_base, *blk_mv_type; ///< 0: frame MV, 1: field MV (interlaced frame)
358 uint8_t *mv_f_base, *mv_f[2]; ///< 0: MV obtained from same field, 1: opposite field
359 uint8_t *mv_f_next_base, *mv_f_next[2];
360 int field_mode; ///< 1 for interlaced field pictures
363 int refdist; ///< distance of the current picture from reference
364 int numref; ///< number of past field pictures used as reference
365 // 0 corresponds to 1 and 1 corresponds to 2 references
366 int reffield; ///< if numref = 0 (1 reference) then reffield decides which
367 // field to use among the two fields from previous frame
368 int intcompfield; ///< which of the two fields to be intensity compensated
369 // 0: both fields, 1: bottom field, 2: top field
370 int cur_field_type; ///< 0: top, 1: bottom
371 int ref_field_type[2]; ///< forward and backward reference field type (top or bottom)
372 int blocks_off, mb_off;
373 int qs_last; ///< if qpel has been used in the previous (tr.) picture
375 int frfd, brfd; ///< reference frame distance (forward or backward)
376 int first_pic_header_flag;
379 /** Frame decoding info for sprite modes */
383 AVFrame *sprite_output_frame;
384 int output_width, output_height, sprite_width, sprite_height;
385 uint8_t* sr_rows[2][2]; ///< Sprite resizer line cache
392 int16_t (*block)[6][64];
393 int n_allocated_blks, cur_blk_idx, left_blk_idx, topleft_blk_idx, top_blk_idx;
394 uint32_t *cbp_base, *cbp;
395 uint8_t *is_intra_base, *is_intra;
396 int16_t (*luma_mv_base)[2], (*luma_mv)[2];
397 uint8_t bfraction_lut_index; ///< Index for BFRACTION value (see Table 40, reproduced into ff_vc1_bfraction_lut[])
398 uint8_t broken_link; ///< Broken link flag (BROKEN_LINK syntax element)
399 uint8_t closed_entry; ///< Closed entry point flag (CLOSED_ENTRY syntax element)
401 int end_mb_x; ///< Horizontal macroblock limit (used only by mss2)
403 int parse_only; ///< Context is used within parser
404 int resync_marker; ///< could this stream contain resync markers
407 /** Find VC-1 marker in buffer
408 * @return position where next marker starts or end of buffer if no marker found
410 static av_always_inline const uint8_t* find_next_marker(const uint8_t *src, const uint8_t *end)
412 uint32_t mrk = 0xFFFFFFFF;
417 mrk = (mrk << 8) | *src++;
424 static av_always_inline int vc1_unescape_buffer(const uint8_t *src, int size, uint8_t *dst)
429 for (dsize = 0; dsize < size; dsize++)
433 for (i = 0; i < size; i++, src++) {
434 if (src[0] == 3 && i >= 2 && !src[-1] && !src[-2] && i < size-1 && src[1] < 4) {
435 dst[dsize++] = src[1];
445 * Decode Simple/Main Profiles sequence header
446 * @see Figure 7-8, p16-17
447 * @param avctx Codec context
448 * @param gb GetBit context initialized from Codec context extra_data
451 int ff_vc1_decode_sequence_header(AVCodecContext *avctx, VC1Context *v, GetBitContext *gb);
453 int ff_vc1_decode_entry_point(AVCodecContext *avctx, VC1Context *v, GetBitContext *gb);
455 int ff_vc1_parse_frame_header (VC1Context *v, GetBitContext *gb);
456 int ff_vc1_parse_frame_header_adv(VC1Context *v, GetBitContext *gb);
457 int ff_vc1_init_common(VC1Context *v);
459 int ff_vc1_decode_init_alloc_tables(VC1Context *v);
460 void ff_vc1_init_transposed_scantables(VC1Context *v);
461 int ff_vc1_decode_end(AVCodecContext *avctx);
462 void ff_vc1_decode_blocks(VC1Context *v);
464 #endif /* AVCODEC_VC1_H */