2 * HEVC parameter set parsing
4 * This file is part of FFmpeg.
6 * FFmpeg is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with FFmpeg; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21 #ifndef AVCODEC_HEVC_PS_H
22 #define AVCODEC_HEVC_PS_H
26 #include "libavutil/buffer.h"
27 #include "libavutil/pixfmt.h"
28 #include "libavutil/rational.h"
/* Short-term reference picture set (RPS) description.
 * NOTE(review): only part of this struct is visible in this view; the notes
 * below are limited to what the visible declarations show. */
34 typedef struct ShortTermRPS {
35 unsigned int num_negative_pics;
37 int rps_idx_num_delta_pocs;
38 int32_t delta_poc[32]; ///< up to 32 POC deltas (presumably relative to the current picture -- confirm)
/* Long-term reference picture set (RPS) description.
 * NOTE(review): only part of this struct is visible in this view. */
42 typedef struct LongTermRPS {
44 uint8_t poc_msb_present[32]; ///< one flag per entry, 32 slots (presumably "POC MSB is signalled for this entry" -- confirm)
/* Fields of a parsed slice (segment) header.
 * NOTE(review): several members are not visible in this view; comments below
 * only describe what the visible declarations show. */
49 typedef struct SliceHeader {
52 /// address (in raster order) of the first block in the current slice segment
53 unsigned int slice_segment_addr;
54 /// address (in raster order) of the first block in the current slice
55 unsigned int slice_addr;
57 enum HEVCSliceType slice_type;
59 int pic_order_cnt_lsb;
61 uint8_t first_slice_in_pic_flag;
62 uint8_t dependent_slice_segment_flag;
63 uint8_t pic_output_flag;
64 uint8_t colour_plane_id;
66 /// Short-term RPS fields; an RPS coded in the slice header itself is stored in slice_rps
67 int short_term_ref_pic_set_sps_flag;
68 int short_term_ref_pic_set_size;
69 ShortTermRPS slice_rps; ///< RPS coded in the slice header itself
70 const ShortTermRPS *short_term_rps; ///< RPS in use (presumably &slice_rps or an SPS-level set -- confirm)
71 int long_term_ref_pic_set_size;
72 LongTermRPS long_term_rps;
73 unsigned int list_entry_lx[2][32]; ///< 2 lists x 32 entries
75 uint8_t rpl_modification_flag[2]; ///< one flag per list
76 uint8_t no_output_of_prior_pics_flag;
77 uint8_t slice_temporal_mvp_enabled_flag;
79 unsigned int nb_refs[2]; ///< one count per list
81 uint8_t slice_sample_adaptive_offset_flag[3]; ///< 3 entries (presumably one per colour component -- confirm)
82 uint8_t mvd_l1_zero_flag;
84 uint8_t cabac_init_flag;
85 uint8_t disable_deblocking_filter_flag; ///< slice_header_disable_deblocking_filter_flag
86 uint8_t slice_loop_filter_across_slices_enabled_flag;
87 uint8_t collocated_list;
89 unsigned int collocated_ref_idx;
92 int slice_cb_qp_offset;
93 int slice_cr_qp_offset;
95 uint8_t cu_chroma_qp_offset_enabled_flag;
97 int beta_offset; ///< beta_offset_div2 * 2
98 int tc_offset; ///< tc_offset_div2 * 2
100 unsigned int max_num_merge_cand; ///< 5 - 5_minus_max_num_merge_cand
102 unsigned *entry_point_offset; ///< pointer to entry point offsets (presumably num_entry_point_offsets elements; ownership not visible here -- confirm)
105 int num_entry_point_offsets;
/* Weight/offset tables for lists l0 and l1: 16 entries each, and 2 values per
 * entry for chroma (presumably Cb/Cr, indexed by reference index -- confirm). */
109 uint8_t luma_log2_weight_denom;
110 int16_t chroma_log2_weight_denom;
112 int16_t luma_weight_l0[16];
113 int16_t chroma_weight_l0[16][2];
114 int16_t chroma_weight_l1[16][2];
115 int16_t luma_weight_l1[16];
117 int16_t luma_offset_l0[16];
118 int16_t chroma_offset_l0[16][2];
120 int16_t luma_offset_l1[16];
121 int16_t chroma_offset_l1[16][2];
123 int slice_ctb_addr_rs;
/* Rectangular window described by one offset from each of the four edges.
 * NOTE(review): the unit of the offsets is not visible in this view -- confirm
 * against the parser before relying on it. */
126 typedef struct HEVCWindow {
127 unsigned int left_offset;
128 unsigned int right_offset;
129 unsigned int top_offset;
130 unsigned int bottom_offset;
136 int overscan_info_present_flag;
137 int overscan_appropriate_flag;
139 int video_signal_type_present_flag;
141 int video_full_range_flag;
142 int colour_description_present_flag;
143 uint8_t colour_primaries;
144 uint8_t transfer_characteristic;
145 uint8_t matrix_coeffs;
147 int chroma_loc_info_present_flag;
148 int chroma_sample_loc_type_top_field;
149 int chroma_sample_loc_type_bottom_field;
150 int neutra_chroma_indication_flag;
153 int frame_field_info_present_flag;
155 int default_display_window_flag;
156 HEVCWindow def_disp_win;
158 int vui_timing_info_present_flag;
159 uint32_t vui_num_units_in_tick;
160 uint32_t vui_time_scale;
161 int vui_poc_proportional_to_timing_flag;
162 int vui_num_ticks_poc_diff_one_minus1;
163 int vui_hrd_parameters_present_flag;
165 int bitstream_restriction_flag;
166 int tiles_fixed_structure_flag;
167 int motion_vectors_over_pic_boundaries_flag;
168 int restricted_ref_pic_lists_flag;
169 int min_spatial_segmentation_idc;
170 int max_bytes_per_pic_denom;
171 int max_bits_per_min_cu_denom;
172 int log2_max_mv_length_horizontal;
173 int log2_max_mv_length_vertical;
/* Profile and constraint-flag fields shared by the general entry and the
 * per-sub-layer entries (both are declared with type PTLCommon elsewhere in
 * this header).
 * NOTE(review): some members are not visible in this view. */
176 typedef struct PTLCommon {
177 uint8_t profile_space;
180 uint8_t profile_compatibility_flag[32]; ///< 32 one-byte flags
181 uint8_t progressive_source_flag;
182 uint8_t interlaced_source_flag;
183 uint8_t non_packed_constraint_flag;
184 uint8_t frame_only_constraint_flag;
185 uint8_t max_12bit_constraint_flag;
186 uint8_t max_10bit_constraint_flag;
187 uint8_t max_8bit_constraint_flag;
188 uint8_t max_422chroma_constraint_flag;
189 uint8_t max_420chroma_constraint_flag;
190 uint8_t max_monochrome_constraint_flag;
191 uint8_t intra_constraint_flag;
192 uint8_t one_picture_only_constraint_flag;
193 uint8_t lower_bit_rate_constraint_flag;
194 uint8_t max_14bit_constraint_flag;
200 PTLCommon general_ptl;
201 PTLCommon sub_layer_ptl[HEVC_MAX_SUB_LAYERS];
203 uint8_t sub_layer_profile_present_flag[HEVC_MAX_SUB_LAYERS];
204 uint8_t sub_layer_level_present_flag[HEVC_MAX_SUB_LAYERS];
/* Video parameter set (VPS) fields.
 * Members documented as "x_minus1 + 1" store the coded value plus one.
 * NOTE(review): some members are not visible in this view. */
207 typedef struct HEVCVPS {
208 uint8_t vps_temporal_id_nesting_flag;
210 int vps_max_sub_layers; ///< vps_max_sub_layers_minus1 + 1
213 int vps_sub_layer_ordering_info_present_flag;
/* The three arrays below hold one entry per sub-layer. */
214 unsigned int vps_max_dec_pic_buffering[HEVC_MAX_SUB_LAYERS];
215 unsigned int vps_num_reorder_pics[HEVC_MAX_SUB_LAYERS];
216 unsigned int vps_max_latency_increase[HEVC_MAX_SUB_LAYERS];
217 int vps_max_layer_id;
218 int vps_num_layer_sets; ///< vps_num_layer_sets_minus1 + 1
219 uint8_t vps_timing_info_present_flag;
220 uint32_t vps_num_units_in_tick;
221 uint32_t vps_time_scale;
222 uint8_t vps_poc_proportional_to_timing_flag;
223 int vps_num_ticks_poc_diff_one; ///< vps_num_ticks_poc_diff_one_minus1 + 1
224 int vps_num_hrd_parameters;
/* Scaling-list coefficient storage, sized for the largest case in every dimension. */
230 typedef struct ScalingList {
231 /* This is a little wasteful, since sizeID 0 only needs 8 coeffs,
232 * and sizeID 3 only has 2 arrays, not 6.
 * NOTE(review): the "8" above looks wrong -- a 4x4 list (sizeID 0) should need
 * 16 coeffs per the HEVC scaling_list_data() syntax; confirm before changing. */
233 uint8_t sl[4][6][64]; ///< indexed [sizeID][array][coefficient]
/* Sequence parameter set (SPS) fields.
 * NOTE(review): this view is missing lines. The stray "} temporal_layer[...]"
 * closer and the second bit_depth_chroma member below presumably belong to
 * nested anonymous structs whose opening lines are not visible -- confirm
 * against the full header. */
237 typedef struct HEVCSPS {
239 int chroma_format_idc;
240 uint8_t separate_colour_plane_flag;
242 HEVCWindow output_window;
244 HEVCWindow pic_conf_win;
247 int bit_depth_chroma;
249 enum AVPixelFormat pix_fmt;
251 unsigned int log2_max_poc_lsb;
252 int pcm_enabled_flag;
/* Per-sub-layer limits: one record per sub-layer (HEVC_MAX_SUB_LAYERS records). */
256 int max_dec_pic_buffering;
257 int num_reorder_pics;
258 int max_latency_increase;
259 } temporal_layer[HEVC_MAX_SUB_LAYERS];
260 uint8_t temporal_id_nesting_flag;
265 uint8_t scaling_list_enable_flag;
266 ScalingList scaling_list;
268 unsigned int nb_st_rps; ///< presumably the number of valid entries in st_rps -- confirm
269 ShortTermRPS st_rps[HEVC_MAX_SHORT_TERM_REF_PIC_SETS];
271 uint8_t amp_enabled_flag;
274 uint8_t long_term_ref_pics_present_flag;
275 uint16_t lt_ref_pic_poc_lsb_sps[HEVC_MAX_LONG_TERM_REF_PICS];
276 uint8_t used_by_curr_pic_lt_sps_flag[HEVC_MAX_LONG_TERM_REF_PICS];
277 uint8_t num_long_term_ref_pics_sps;
/* NOTE(review): same name as the int member above; see the note at the top. */
281 uint8_t bit_depth_chroma;
282 unsigned int log2_min_pcm_cb_size;
283 unsigned int log2_max_pcm_cb_size;
284 uint8_t loop_filter_disable_flag;
286 uint8_t sps_temporal_mvp_enabled_flag;
287 uint8_t sps_strong_intra_smoothing_enable_flag;
/* Block-size limits, stored as log2 values. */
289 unsigned int log2_min_cb_size;
290 unsigned int log2_diff_max_min_coding_block_size;
291 unsigned int log2_min_tb_size;
292 unsigned int log2_max_trafo_size;
293 unsigned int log2_ctb_size;
294 unsigned int log2_min_pu_size;
296 int max_transform_hierarchy_depth_inter;
297 int max_transform_hierarchy_depth_intra;
/* The *_flag members below follow sps_range_extension_flag (presumably they
 * are only coded when it is set -- confirm in the parser). */
299 int sps_range_extension_flag;
300 int transform_skip_rotation_enabled_flag;
301 int transform_skip_context_enabled_flag;
302 int implicit_rdpcm_enabled_flag;
303 int explicit_rdpcm_enabled_flag;
304 int extended_precision_processing_flag;
305 int intra_smoothing_disabled_flag;
306 int high_precision_offsets_enabled_flag;
307 int persistent_rice_adaptation_enabled_flag;
308 int cabac_bypass_alignment_enabled_flag;
310 /// coded frame dimension in various units
/* Picture parameter set (PPS) fields, followed by tables derived from them.
 * Members documented as "x_minus1 + 1" / "x_minus2 + 2" store the coded value
 * with the bias already added.
 * NOTE(review): some members are not visible in this view. */
333 typedef struct HEVCPPS {
334 unsigned int sps_id; ///< seq_parameter_set_id
336 uint8_t sign_data_hiding_flag;
338 uint8_t cabac_init_present_flag;
340 int num_ref_idx_l0_default_active; ///< num_ref_idx_l0_default_active_minus1 + 1
341 int num_ref_idx_l1_default_active; ///< num_ref_idx_l1_default_active_minus1 + 1
342 int pic_init_qp_minus26;
344 uint8_t constrained_intra_pred_flag;
345 uint8_t transform_skip_enabled_flag;
347 uint8_t cu_qp_delta_enabled_flag;
348 int diff_cu_qp_delta_depth;
352 uint8_t pic_slice_level_chroma_qp_offsets_present_flag;
353 uint8_t weighted_pred_flag;
354 uint8_t weighted_bipred_flag;
355 uint8_t output_flag_present_flag;
356 uint8_t transquant_bypass_enable_flag;
358 uint8_t dependent_slice_segments_enabled_flag;
359 uint8_t tiles_enabled_flag;
360 uint8_t entropy_coding_sync_enabled_flag;
362 uint16_t num_tile_columns; ///< num_tile_columns_minus1 + 1
363 uint16_t num_tile_rows; ///< num_tile_rows_minus1 + 1
364 uint8_t uniform_spacing_flag;
365 uint8_t loop_filter_across_tiles_enabled_flag;
367 uint8_t seq_loop_filter_across_slices_enabled_flag;
369 uint8_t deblocking_filter_control_present_flag;
370 uint8_t deblocking_filter_override_enabled_flag;
372 int beta_offset; ///< beta_offset_div2 * 2
373 int tc_offset; ///< tc_offset_div2 * 2
375 uint8_t scaling_list_data_present_flag;
376 ScalingList scaling_list;
378 uint8_t lists_modification_present_flag;
379 int log2_parallel_merge_level; ///< log2_parallel_merge_level_minus2 + 2
380 int num_extra_slice_header_bits;
381 uint8_t slice_header_extension_present_flag;
382 uint8_t log2_max_transform_skip_block_size;
383 uint8_t pps_range_extensions_flag;
384 uint8_t cross_component_prediction_enabled_flag;
385 uint8_t chroma_qp_offset_list_enabled_flag;
386 uint8_t diff_cu_chroma_qp_offset_depth;
387 uint8_t chroma_qp_offset_list_len_minus1;
388 int8_t cb_qp_offset_list[6]; ///< room for 6 entries
389 int8_t cr_qp_offset_list[6]; ///< room for 6 entries
390 uint8_t log2_sao_offset_scale_luma;
391 uint8_t log2_sao_offset_scale_chroma;
393 // Inferred parameters
/* The pointers below refer to tables whose allocation and lifetime are not
 * visible in this view (presumably built when the PPS is parsed -- confirm). */
394 unsigned int *column_width; ///< ColumnWidth
395 unsigned int *row_height; ///< RowHeight
396 unsigned int *col_bd; ///< ColBd
397 unsigned int *row_bd; ///< RowBd
400 int *ctb_addr_rs_to_ts; ///< CtbAddrRSToTS
401 int *ctb_addr_ts_to_rs; ///< CtbAddrTSToRS
402 int *tile_id; ///< TileId
403 int *tile_pos_rs; ///< TilePosRS
404 int *min_tb_addr_zs; ///< MinTbAddrZS
405 int *min_tb_addr_zs_tab;///< MinTbAddrZS (NOTE(review): same description as min_tb_addr_zs; relationship between the two is not visible here)
/* Container for the parameter sets known to the decoder: one AVBufferRef slot
 * per possible VPS, SPS and PPS (presumably indexed by the parameter set id,
 * with unused slots left NULL -- confirm).
 * NOTE(review): the members following the last comment are not visible in
 * this view. */
411 typedef struct HEVCParamSets {
412 AVBufferRef *vps_list[HEVC_MAX_VPS_COUNT];
413 AVBufferRef *sps_list[HEVC_MAX_SPS_COUNT];
414 AVBufferRef *pps_list[HEVC_MAX_PPS_COUNT];
416 /* currently active parameter sets */
423 * Parse the SPS from the bitstream into the provided HEVCSPS struct.
425 * @param sps_id the SPS id will be written here
426 * @param apply_defdispwin if set to 1, the default display window from the VUI
427 * will be applied to the video dimensions
428 * @param vps_list if non-NULL, this function will validate that the SPS refers
/* Remaining parameters:
 *   sps   - caller-provided struct that receives the parsed SPS
 *   gb    - bitstream reader positioned on the SPS data
 *   avctx - codec context (presumably used for logging/options -- confirm)
 * NOTE(review): the return convention is not visible here; presumably 0 on
 * success and a negative error code on failure -- confirm. */
431 int ff_hevc_parse_sps(HEVCSPS *sps, GetBitContext *gb, unsigned int *sps_id,
432 int apply_defdispwin, AVBufferRef **vps_list, AVCodecContext *avctx);
/* NAL-level entry points for the three parameter-set types, plus helpers.
 * NOTE(review): the descriptions below are inferred from the names and
 * parameter lists only, and the vps/pps prototypes are truncated in this
 * view -- confirm against the implementation. */
/* Presumably decodes a VPS NAL unit read from gb. */
434 int ff_hevc_decode_nal_vps(GetBitContext *gb, AVCodecContext *avctx,
/* Presumably decodes an SPS NAL unit read from gb and stores it in ps;
 * apply_defdispwin has the meaning documented for ff_hevc_parse_sps(). */
436 int ff_hevc_decode_nal_sps(GetBitContext *gb, AVCodecContext *avctx,
437 HEVCParamSets *ps, int apply_defdispwin);
/* Presumably decodes a PPS NAL unit read from gb. */
438 int ff_hevc_decode_nal_pps(GetBitContext *gb, AVCodecContext *avctx,
/* Presumably releases everything held by ps. */
441 void ff_hevc_ps_uninit(HEVCParamSets *ps);
/* Presumably parses one short-term RPS from gb into rps; is_slice_header
 * distinguishes a set coded in a slice header from one coded in the SPS. */
443 int ff_hevc_decode_short_term_rps(GetBitContext *gb, AVCodecContext *avctx,
444 ShortTermRPS *rps, const HEVCSPS *sps, int is_slice_header);
/* Presumably serialises vps with the given id into buf (capacity buf_size). */
446 int ff_hevc_encode_nal_vps(HEVCVPS *vps, unsigned int id,
447 uint8_t *buf, int buf_size);
450 * Compute POC of the current frame and return it.
/* Parameters (NOTE(review): meanings inferred from names -- confirm):
 *   sps           - active SPS (read-only)
 *   pocTid0       - presumably the POC of the previous picture with temporal id 0
 *   poc_lsb       - POC least-significant bits for the current picture
 *   nal_unit_type - NAL unit type of the current picture */
452 int ff_hevc_compute_poc(const HEVCSPS *sps, int pocTid0, int poc_lsb, int nal_unit_type);
454 #endif /* AVCODEC_HEVC_PS_H */