2 * HEVC Parameter Set decoding
4 * Copyright (C) 2012 - 2013 Guillaume Martres
5 * Copyright (C) 2012 - 2013 Mickael Raulet
6 * Copyright (C) 2012 - 2013 Gildas Cocherel
7 * Copyright (C) 2013 Vittorio Giovara
9 * This file is part of FFmpeg.
11 * FFmpeg is free software; you can redistribute it and/or
12 * modify it under the terms of the GNU Lesser General Public
13 * License as published by the Free Software Foundation; either
14 * version 2.1 of the License, or (at your option) any later version.
16 * FFmpeg is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
19 * Lesser General Public License for more details.
21 * You should have received a copy of the GNU Lesser General Public
22 * License along with FFmpeg; if not, write to the Free Software
23 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
26 #include "libavutil/imgutils.h"
28 #include "hevc_data.h"
/* 64-entry default scaling list for the intra matrices.
 * set_default_scaling_list_data() copies it (64 bytes) into
 * sl->sl[1..3][0..2]. */
31 static const uint8_t default_scaling_list_intra[] = {
32 16, 16, 16, 16, 17, 18, 21, 24,
33 16, 16, 16, 16, 17, 19, 22, 25,
34 16, 16, 17, 18, 20, 22, 25, 29,
35 16, 16, 18, 21, 24, 27, 31, 36,
36 17, 17, 20, 24, 30, 35, 41, 47,
37 18, 19, 22, 27, 35, 44, 54, 65,
38 21, 22, 25, 31, 41, 54, 70, 88,
39 24, 25, 29, 36, 47, 65, 88, 115
/* 64-entry default scaling list for the inter matrices.
 * set_default_scaling_list_data() copies it (64 bytes) into
 * sl->sl[1..3][3..5]. */
42 static const uint8_t default_scaling_list_inter[] = {
43 16, 16, 16, 16, 17, 18, 20, 24,
44 16, 16, 16, 17, 18, 20, 24, 25,
45 16, 16, 17, 18, 20, 24, 25, 28,
46 16, 17, 18, 20, 24, 25, 28, 33,
47 17, 18, 20, 24, 25, 28, 33, 41,
48 18, 20, 24, 25, 28, 33, 41, 54,
49 20, 24, 25, 28, 33, 41, 54, 71,
50 24, 25, 28, 33, 41, 54, 71, 91
/* Table of sample aspect ratios, indexed in decode_vui() by the 8-bit
 * sar_idx read from the bitstream (only when sar_idx is below the table
 * size). NOTE(review): the initializer entries are not visible in this
 * excerpt. */
53 static const AVRational vui_sar[] = {
/*
 * Release the PPS stored in slot `id` of s->pps_list.
 *
 * s   parameter-set container
 * id  index into s->pps_list
 *
 * NOTE(review): the statement guarded by the check below is not visible in
 * this excerpt; presumably it clears s->pps when it points into the buffer
 * being dropped -- confirm against the full file.
 */
73 static void remove_pps(HEVCParamSets *s, int id)
// True when the currently selected PPS lives in the buffer about to be released.
75 if (s->pps_list[id] && s->pps == (const HEVCPPS*)s->pps_list[id]->data)
// Unreference the buffer held in the slot.
77 av_buffer_unref(&s->pps_list[id]);
/*
 * Release the SPS stored in slot `id` of s->sps_list and walk s->pps_list
 * looking for PPS entries whose sps_id equals `id`.
 *
 * s   parameter-set container
 * id  index into s->sps_list
 *
 * NOTE(review): the statements guarded by the two inner `if` conditions are
 * not visible in this excerpt (presumably clearing s->sps and removing the
 * matching PPS) -- confirm against the full file.
 */
80 static void remove_sps(HEVCParamSets *s, int id)
83 if (s->sps_list[id]) {
// True when the currently selected SPS lives in the buffer about to be released.
84 if (s->sps == (const HEVCSPS*)s->sps_list[id]->data)
87 /* drop all PPS that depend on this SPS */
88 for (i = 0; i < FF_ARRAY_ELEMS(s->pps_list); i++)
89 if (s->pps_list[i] && ((HEVCPPS*)s->pps_list[i]->data)->sps_id == id)
// Sanity check: at this point s->sps must no longer point into this slot's buffer.
92 av_assert0(!(s->sps_list[id] && s->sps == (HEVCSPS*)s->sps_list[id]->data));
// Unreference the buffer held in the slot.
94 av_buffer_unref(&s->sps_list[id]);
/*
 * Release the VPS stored in slot `id` of s->vps_list and walk s->sps_list
 * looking for SPS entries whose vps_id equals `id`.
 *
 * s   parameter-set container
 * id  index into s->vps_list
 *
 * NOTE(review): the statements guarded by the two inner `if` conditions are
 * not visible in this excerpt (presumably clearing s->vps and removing the
 * matching SPS) -- confirm against the full file.
 */
97 static void remove_vps(HEVCParamSets *s, int id)
100 if (s->vps_list[id]) {
// True when the currently selected VPS lives in the buffer about to be released.
101 if (s->vps == (const HEVCVPS*)s->vps_list[id]->data)
// Scan every SPS slot for entries that reference this VPS.
104 for (i = 0; i < FF_ARRAY_ELEMS(s->sps_list); i++)
105 if (s->sps_list[i] && ((HEVCSPS*)s->sps_list[i]->data)->vps_id == id)
// Unreference the buffer held in the slot.
108 av_buffer_unref(&s->vps_list[id]);
/*
 * Parse one short-term reference picture set (RPS) from the bitstream.
 *
 * gb               bit reader positioned at the RPS syntax
 * avctx            logging context for the error messages below
 * rps              destination set; compared against sps->st_rps to decide
 *                  whether a prediction flag is coded
 * sps              SPS supplying st_rps[] and nb_st_rps for prediction
 * is_slice_header  non-zero: the reference set is selected by a coded
 *                  delta_idx; zero: the entry just before rps in
 *                  sps->st_rps is used
 *
 * Returns AVERROR_INVALIDDATA when one of the visible range checks fails.
 * NOTE(review): several declarations, `else` lines and the success return
 * are not visible in this excerpt.
 */
111 int ff_hevc_decode_short_term_rps(GetBitContext *gb, AVCodecContext *avctx,
112 ShortTermRPS *rps, const HEVCSPS *sps, int is_slice_header)
114 uint8_t rps_predict = 0;
// The prediction flag is only read when rps is not the first SPS entry
// and the SPS holds at least one set.
121 if (rps != sps->st_rps && sps->nb_st_rps)
122 rps_predict = get_bits1(gb);
// --- Predicted RPS: derive the set from a reference set rps_ridx ---
125 const ShortTermRPS *rps_ridx;
127 unsigned abs_delta_rps;
128 uint8_t use_delta_flag = 0;
129 uint8_t delta_rps_sign;
131 if (is_slice_header) {
// Coded value + 1; must not exceed nb_st_rps so the index below stays >= 0.
132 unsigned int delta_idx = get_ue_golomb_long(gb) + 1;
133 if (delta_idx > sps->nb_st_rps) {
134 av_log(avctx, AV_LOG_ERROR,
135 "Invalid value of delta_idx in slice header RPS: %d > %d.\n",
136 delta_idx, sps->nb_st_rps);
137 return AVERROR_INVALIDDATA;
139 rps_ridx = &sps->st_rps[sps->nb_st_rps - delta_idx];
140 rps->rps_idx_num_delta_pocs = rps_ridx->num_delta_pocs;
// Reference is the entry immediately preceding rps inside sps->st_rps.
142 rps_ridx = &sps->st_rps[rps - sps->st_rps - 1];
// delta_rps = +/- abs_delta_rps; a sign bit of 1 yields a negative value.
144 delta_rps_sign = get_bits1(gb);
145 abs_delta_rps = get_ue_golomb_long(gb) + 1;
// Accepted magnitude range is 1..32768.
146 if (abs_delta_rps < 1 || abs_delta_rps > 32768) {
147 av_log(avctx, AV_LOG_ERROR,
148 "Invalid value of abs_delta_rps: %d\n",
150 return AVERROR_INVALIDDATA;
152 delta_rps = (1 - (delta_rps_sign << 1)) * abs_delta_rps;
// num_delta_pocs + 1 candidates: the reference set's entries plus delta_rps itself.
153 for (i = 0; i <= rps_ridx->num_delta_pocs; i++) {
154 int used = rps->used[k] = get_bits1(gb);
157 use_delta_flag = get_bits1(gb);
// Candidate is kept when either flag is set.
159 if (used || use_delta_flag) {
160 if (i < rps_ridx->num_delta_pocs)
161 delta_poc = delta_rps + rps_ridx->delta_poc[i];
// Last iteration (i == num_delta_pocs): the candidate is delta_rps alone.
163 delta_poc = delta_rps;
164 rps->delta_poc[k] = delta_poc;
// Reject a count that would not fit in rps->used.
173 if (k >= FF_ARRAY_ELEMS(rps->used)) {
174 av_log(avctx, AV_LOG_ERROR,
175 "Invalid num_delta_pocs: %d\n", k);
176 return AVERROR_INVALIDDATA;
179 rps->num_delta_pocs = k;
180 rps->num_negative_pics = k0;
181 // sort in increasing order (smallest first)
182 if (rps->num_delta_pocs != 0) {
// Insertion sort on delta_poc[]; used[] entries are moved alongside.
184 for (i = 1; i < rps->num_delta_pocs; i++) {
185 delta_poc = rps->delta_poc[i];
187 for (k = i - 1; k >= 0; k--) {
188 tmp = rps->delta_poc[k];
189 if (delta_poc < tmp) {
190 rps->delta_poc[k + 1] = tmp;
191 rps->used[k + 1] = rps->used[k];
192 rps->delta_poc[k] = delta_poc;
// Only needed when there are at least two negative entries.
198 if ((rps->num_negative_pics >> 1) != 0) {
200 k = rps->num_negative_pics - 1;
201 // flip the negative values to largest first
202 for (i = 0; i < rps->num_negative_pics >> 1; i++) {
203 delta_poc = rps->delta_poc[i];
205 rps->delta_poc[i] = rps->delta_poc[k];
206 rps->used[i] = rps->used[k];
207 rps->delta_poc[k] = delta_poc;
// --- Explicitly coded RPS ---
213 unsigned int prev, nb_positive_pics;
214 rps->num_negative_pics = get_ue_golomb_long(gb);
215 nb_positive_pics = get_ue_golomb_long(gb);
// Each count must be below HEVC_MAX_REFS.
217 if (rps->num_negative_pics >= HEVC_MAX_REFS ||
218 nb_positive_pics >= HEVC_MAX_REFS) {
219 av_log(avctx, AV_LOG_ERROR, "Too many refs in a short term RPS.\n");
220 return AVERROR_INVALIDDATA;
223 rps->num_delta_pocs = rps->num_negative_pics + nb_positive_pics;
224 if (rps->num_delta_pocs) {
// Negative pictures occupy indices [0, num_negative_pics).
// NOTE(review): how `prev` is initialised/updated from delta_poc is not visible here.
226 for (i = 0; i < rps->num_negative_pics; i++) {
227 delta_poc = get_ue_golomb_long(gb) + 1;
229 rps->delta_poc[i] = prev;
230 rps->used[i] = get_bits1(gb);
// Positive pictures follow, starting at index num_negative_pics.
233 for (i = 0; i < nb_positive_pics; i++) {
234 delta_poc = get_ue_golomb_long(gb) + 1;
236 rps->delta_poc[rps->num_negative_pics + i] = prev;
237 rps->used[rps->num_negative_pics + i] = get_bits1(gb);
/*
 * Read one profile/tier block from gb into ptl (level_idc is read by the
 * caller, see parse_ptl()).
 *
 * gb     bit reader
 * avctx  logging context
 * ptl    destination, used via ptl->... below (its declaration line is not
 *        visible in this excerpt)
 *
 * NOTE(review): the return statements are not visible here; parse_ptl()
 * treats a negative return as failure.
 */
245 static int decode_profile_tier_level(GetBitContext *gb, AVCodecContext *avctx,
// The fields parsed below total 2+1+5+32+4+16+16+12 = 88 bits.
250 if (get_bits_left(gb) < 2+1+5 + 32 + 4 + 16 + 16 + 12)
253 ptl->profile_space = get_bits(gb, 2);
254 ptl->tier_flag = get_bits1(gb);
255 ptl->profile_idc = get_bits(gb, 5);
// Log the recognised profile at debug level; warn on anything else.
256 if (ptl->profile_idc == FF_PROFILE_HEVC_MAIN)
257 av_log(avctx, AV_LOG_DEBUG, "Main profile bitstream\n");
258 else if (ptl->profile_idc == FF_PROFILE_HEVC_MAIN_10)
259 av_log(avctx, AV_LOG_DEBUG, "Main 10 profile bitstream\n");
260 else if (ptl->profile_idc == FF_PROFILE_HEVC_MAIN_STILL_PICTURE)
261 av_log(avctx, AV_LOG_DEBUG, "Main Still Picture profile bitstream\n");
262 else if (ptl->profile_idc == FF_PROFILE_HEVC_REXT)
263 av_log(avctx, AV_LOG_DEBUG, "Range Extension profile bitstream\n");
265 av_log(avctx, AV_LOG_WARNING, "Unknown HEVC profile: %d\n", ptl->profile_idc);
267 for (i = 0; i < 32; i++) {
268 ptl->profile_compatibility_flag[i] = get_bits1(gb);
// When profile_idc was coded as 0, adopt the index of the first set
// compatibility flag with i > 0 (later flags no longer match the == 0 test).
270 if (ptl->profile_idc == 0 && i > 0 && ptl->profile_compatibility_flag[i])
271 ptl->profile_idc = i;
273 ptl->progressive_source_flag = get_bits1(gb);
274 ptl->interlaced_source_flag = get_bits1(gb);
275 ptl->non_packed_constraint_flag = get_bits1(gb);
276 ptl->frame_only_constraint_flag = get_bits1(gb);
// 44 reserved bits, skipped in three steps (16 + 16 + 12).
278 skip_bits(gb, 16); // XXX_reserved_zero_44bits[0..15]
279 skip_bits(gb, 16); // XXX_reserved_zero_44bits[16..31]
280 skip_bits(gb, 12); // XXX_reserved_zero_44bits[32..43]
/*
 * Parse the profile/tier/level structure: the general block followed by the
 * optional per-sub-layer blocks.
 *
 * gb                  bit reader
 * avctx               logging context
 * ptl                 destination structure
 * max_num_sub_layers  number of sub-layers; max_num_sub_layers - 1 entries
 *                     of per-sub-layer flags/data are read
 *
 * NOTE(review): the return statements are not visible in this excerpt;
 * callers in this file treat a negative return as failure.
 */
285 static int parse_ptl(GetBitContext *gb, AVCodecContext *avctx,
286 PTL *ptl, int max_num_sub_layers)
// After the general block, 8 bits of level_idc are needed, plus 16 bits
// (8 pairs of 2-bit fields) whenever at least one sub-layer exists.
289 if (decode_profile_tier_level(gb, avctx, &ptl->general_ptl) < 0 ||
290 get_bits_left(gb) < 8 + (8*2 * (max_num_sub_layers - 1 > 0))) {
291 av_log(avctx, AV_LOG_ERROR, "PTL information too short\n");
295 ptl->general_ptl.level_idc = get_bits(gb, 8);
// Two presence flags per sub-layer.
297 for (i = 0; i < max_num_sub_layers - 1; i++) {
298 ptl->sub_layer_profile_present_flag[i] = get_bits1(gb);
299 ptl->sub_layer_level_present_flag[i] = get_bits1(gb);
// Skip 2 reserved bits for each remaining index up to 8, so the flag area
// is always 8 pairs wide when sub-layers are present.
302 if (max_num_sub_layers - 1> 0)
303 for (i = max_num_sub_layers - 1; i < 8; i++)
304 skip_bits(gb, 2); // reserved_zero_2bits[i]
// Per-sub-layer payload, read only where the matching flag was set.
305 for (i = 0; i < max_num_sub_layers - 1; i++) {
306 if (ptl->sub_layer_profile_present_flag[i] &&
307 decode_profile_tier_level(gb, avctx, &ptl->sub_layer_ptl[i]) < 0) {
308 av_log(avctx, AV_LOG_ERROR,
309 "PTL information for sublayer %i too short\n", i);
312 if (ptl->sub_layer_level_present_flag[i]) {
313 if (get_bits_left(gb) < 8) {
314 av_log(avctx, AV_LOG_ERROR,
315 "Not enough data for sublayer %i level_idc\n", i);
318 ptl->sub_layer_ptl[i].level_idc = get_bits(gb, 8);
/*
 * Consume the per-CPB HRD fields of one sub-layer without storing them.
 *
 * gb                     bit reader
 * nb_cpb                 number of CPB entries to consume
 * subpic_params_present  non-zero: two extra ue(v) fields are read per entry
 */
325 static void decode_sublayer_hrd(GetBitContext *gb, unsigned int nb_cpb,
326 int subpic_params_present)
330 for (i = 0; i < nb_cpb; i++) {
// Values are parsed only to advance the reader; results are discarded.
331 get_ue_golomb_long(gb); // bit_rate_value_minus1
332 get_ue_golomb_long(gb); // cpb_size_value_minus1
334 if (subpic_params_present) {
335 get_ue_golomb_long(gb); // cpb_size_du_value_minus1
336 get_ue_golomb_long(gb); // bit_rate_du_value_minus1
338 skip_bits1(gb); // cbr_flag
/*
 * Walk the HRD parameter syntax, advancing gb; apart from the local flags
 * that steer parsing, no value is stored.
 *
 * gb                  bit reader
 * common_inf_present  non-zero: the common information block is parsed first
 * max_sublayers       number of sub-layer iterations (used by the loop
 *                     below; the rest of the parameter list is not visible
 *                     in this excerpt)
 *
 * Returns AVERROR_INVALIDDATA when nb_cpb is outside 1..32.
 * NOTE(review): the success return and several `if` conditions inside the
 * loop are not visible in this excerpt.
 */
342 static int decode_hrd(GetBitContext *gb, int common_inf_present,
345 int nal_params_present = 0, vcl_params_present = 0;
346 int subpic_params_present = 0;
349 if (common_inf_present) {
350 nal_params_present = get_bits1(gb);
351 vcl_params_present = get_bits1(gb);
// The remaining common fields exist only when NAL or VCL parameters are signalled.
353 if (nal_params_present || vcl_params_present) {
354 subpic_params_present = get_bits1(gb);
356 if (subpic_params_present) {
357 skip_bits(gb, 8); // tick_divisor_minus2
358 skip_bits(gb, 5); // du_cpb_removal_delay_increment_length_minus1
359 skip_bits(gb, 1); // sub_pic_cpb_params_in_pic_timing_sei_flag
360 skip_bits(gb, 5); // dpb_output_delay_du_length_minus1
363 skip_bits(gb, 4); // bit_rate_scale
364 skip_bits(gb, 4); // cpb_size_scale
366 if (subpic_params_present)
367 skip_bits(gb, 4); // cpb_size_du_scale
369 skip_bits(gb, 5); // initial_cpb_removal_delay_length_minus1
370 skip_bits(gb, 5); // au_cpb_removal_delay_length_minus1
371 skip_bits(gb, 5); // dpb_output_delay_length_minus1
// Per-sub-layer section.
375 for (i = 0; i < max_sublayers; i++) {
// Defaults to a single CPB unless a count is read below.
377 unsigned int nb_cpb = 1;
378 int fixed_rate = get_bits1(gb);
// NOTE(review): the conditions guarding the next reads are not visible here.
381 fixed_rate = get_bits1(gb);
384 get_ue_golomb_long(gb); // elemental_duration_in_tc_minus1
386 low_delay = get_bits1(gb);
// Coded value + 1; accepted range is 1..32.
389 nb_cpb = get_ue_golomb_long(gb) + 1;
390 if (nb_cpb < 1 || nb_cpb > 32) {
391 av_log(NULL, AV_LOG_ERROR, "nb_cpb %d invalid\n", nb_cpb);
392 return AVERROR_INVALIDDATA;
// The same per-CPB layout is consumed once for NAL and once for VCL parameters.
396 if (nal_params_present)
397 decode_sublayer_hrd(gb, nb_cpb, subpic_params_present);
398 if (vcl_params_present)
399 decode_sublayer_hrd(gb, nb_cpb, subpic_params_present);
/*
 * Parse a VPS NAL unit into a newly allocated, zero-initialised buffer and
 * install it in ps->vps_list[vps_id].
 *
 * gb     bit reader over the NAL payload
 * avctx  logging context; avctx->err_recognition is consulted for
 *        AV_EF_EXPLODE
 * ps     parameter-set container (used below as ps->vps_list; the rest of
 *        the parameter list is not visible in this excerpt)
 *
 * Returns AVERROR(ENOMEM) on the allocation-failure path and
 * AVERROR_INVALIDDATA from the error exit at the bottom, which also
 * releases the new buffer.
 * NOTE(review): the `goto`/`return` statements after most checks and the
 * success return are not visible in this excerpt.
 */
404 int ff_hevc_decode_nal_vps(GetBitContext *gb, AVCodecContext *avctx,
411 AVBufferRef *vps_buf = av_buffer_allocz(sizeof(*vps));
414 return AVERROR(ENOMEM);
415 vps = (HEVCVPS*)vps_buf->data;
417 av_log(avctx, AV_LOG_DEBUG, "Decoding VPS\n");
// Keep a raw copy of the NAL bytes inside the VPS, clamped to the size of
// vps->data (with a warning when the NAL is larger).
419 nal_size = gb->buffer_end - gb->buffer;
420 if (nal_size > sizeof(vps->data)) {
421 av_log(avctx, AV_LOG_WARNING, "Truncating likely oversized VPS "
422 "(%"PTRDIFF_SPECIFIER" > %"SIZE_SPECIFIER")\n",
423 nal_size, sizeof(vps->data));
424 vps->data_size = sizeof(vps->data);
426 vps->data_size = nal_size;
428 memcpy(vps->data, gb->buffer, vps->data_size);
430 vps_id = get_bits(gb, 4);
431 if (vps_id >= HEVC_MAX_VPS_COUNT) {
432 av_log(avctx, AV_LOG_ERROR, "VPS id out of range: %d\n", vps_id);
// Reserved field must equal 3.
436 if (get_bits(gb, 2) != 3) { // vps_reserved_three_2bits
437 av_log(avctx, AV_LOG_ERROR, "vps_reserved_three_2bits is not three\n");
// Both counts are stored as coded value + 1.
441 vps->vps_max_layers = get_bits(gb, 6) + 1;
442 vps->vps_max_sub_layers = get_bits(gb, 3) + 1;
443 vps->vps_temporal_id_nesting_flag = get_bits1(gb);
// Reserved field must equal 0xffff.
445 if (get_bits(gb, 16) != 0xffff) { // vps_reserved_ffff_16bits
446 av_log(avctx, AV_LOG_ERROR, "vps_reserved_ffff_16bits is not 0xffff\n");
450 if (vps->vps_max_sub_layers > HEVC_MAX_SUB_LAYERS) {
451 av_log(avctx, AV_LOG_ERROR, "vps_max_sub_layers out of range: %d\n",
452 vps->vps_max_sub_layers);
456 if (parse_ptl(gb, avctx, &vps->ptl, vps->vps_max_sub_layers) < 0)
459 vps->vps_sub_layer_ordering_info_present_flag = get_bits1(gb);
// With the flag set, ordering info is read for every sub-layer; otherwise
// only for the last one.
461 i = vps->vps_sub_layer_ordering_info_present_flag ? 0 : vps->vps_max_sub_layers - 1;
462 for (; i < vps->vps_max_sub_layers; i++) {
463 vps->vps_max_dec_pic_buffering[i] = get_ue_golomb_long(gb) + 1;
464 vps->vps_num_reorder_pics[i] = get_ue_golomb_long(gb);
465 vps->vps_max_latency_increase[i] = get_ue_golomb_long(gb) - 1;
// DPB size must be non-zero and at most HEVC_MAX_DPB_SIZE.
467 if (vps->vps_max_dec_pic_buffering[i] > HEVC_MAX_DPB_SIZE || !vps->vps_max_dec_pic_buffering[i]) {
468 av_log(avctx, AV_LOG_ERROR, "vps_max_dec_pic_buffering_minus1 out of range: %d\n",
469 vps->vps_max_dec_pic_buffering[i] - 1);
// A reorder count above DPB size - 1 only warns; AV_EF_EXPLODE is tested next.
472 if (vps->vps_num_reorder_pics[i] > vps->vps_max_dec_pic_buffering[i] - 1) {
473 av_log(avctx, AV_LOG_WARNING, "vps_max_num_reorder_pics out of range: %d\n",
474 vps->vps_num_reorder_pics[i]);
475 if (avctx->err_recognition & AV_EF_EXPLODE)
480 vps->vps_max_layer_id = get_bits(gb, 6);
481 vps->vps_num_layer_sets = get_ue_golomb_long(gb) + 1;
// Layer-set count must be in 1..1024 and the flag bits it implies
// ((sets - 1) * (max_layer_id + 1)) must fit in the remaining data.
482 if (vps->vps_num_layer_sets < 1 || vps->vps_num_layer_sets > 1024 ||
483 (vps->vps_num_layer_sets - 1LL) * (vps->vps_max_layer_id + 1LL) > get_bits_left(gb)) {
484 av_log(avctx, AV_LOG_ERROR, "too many layer_id_included_flags\n");
// The flags themselves are skipped, not stored.
488 for (i = 1; i < vps->vps_num_layer_sets; i++)
489 for (j = 0; j <= vps->vps_max_layer_id; j++)
490 skip_bits(gb, 1); // layer_id_included_flag[i][j]
492 vps->vps_timing_info_present_flag = get_bits1(gb);
493 if (vps->vps_timing_info_present_flag) {
494 vps->vps_num_units_in_tick = get_bits_long(gb, 32);
495 vps->vps_time_scale = get_bits_long(gb, 32);
496 vps->vps_poc_proportional_to_timing_flag = get_bits1(gb);
497 if (vps->vps_poc_proportional_to_timing_flag)
498 vps->vps_num_ticks_poc_diff_one = get_ue_golomb_long(gb) + 1;
499 vps->vps_num_hrd_parameters = get_ue_golomb_long(gb);
// The HRD parameter count may not exceed the number of layer sets.
500 if (vps->vps_num_hrd_parameters > (unsigned)vps->vps_num_layer_sets) {
501 av_log(avctx, AV_LOG_ERROR,
502 "vps_num_hrd_parameters %d is invalid\n", vps->vps_num_hrd_parameters);
505 for (i = 0; i < vps->vps_num_hrd_parameters; i++) {
506 int common_inf_present = 1;
508 get_ue_golomb_long(gb); // hrd_layer_set_idx
// NOTE(review): the condition guarding this read is not visible here.
510 common_inf_present = get_bits1(gb);
// The return value of decode_hrd() is not checked on this line.
511 decode_hrd(gb, common_inf_present, vps->vps_max_sub_layers);
514 get_bits1(gb); /* vps_extension_flag */
// A negative bits-left count means parsing ran past the end of the NAL.
516 if (get_bits_left(gb) < 0) {
517 av_log(avctx, AV_LOG_ERROR,
518 "Overread VPS by %d bits\n", -get_bits_left(gb));
519 if (ps->vps_list[vps_id])
// If the stored VPS is byte-identical to the new one, drop the new buffer;
// otherwise evict the old entry via remove_vps() and store the new buffer.
523 if (ps->vps_list[vps_id] &&
524 !memcmp(ps->vps_list[vps_id]->data, vps_buf->data, vps_buf->size)) {
525 av_buffer_unref(&vps_buf);
527 remove_vps(ps, vps_id);
528 ps->vps_list[vps_id] = vps_buf;
// Error exit: release the new buffer and report invalid data.
534 av_buffer_unref(&vps_buf);
535 return AVERROR_INVALIDDATA;
/*
 * Parse the VUI (video usability information) syntax into sps->vui.
 * Besides filling the VUI fields, this may change sps->pix_fmt (full-range
 * 4:2:0 and RGB-matrix cases below).
 *
 * gb                bit reader
 * avctx             logging context; avctx->flags2 is tested for
 *                   AV_CODEC_FLAG2_IGNORE_CROP
 * apply_defdispwin  tested together with AV_CODEC_FLAG2_IGNORE_CROP before
 *                   the default display window offsets are discarded
 * sps               SPS being filled
 *
 * NOTE(review): several `if`/`else`/`break` lines are not visible in this
 * excerpt, so the exact nesting of some statements cannot be confirmed here.
 */
538 static void decode_vui(GetBitContext *gb, AVCodecContext *avctx,
539 int apply_defdispwin, HEVCSPS *sps)
541 VUI *vui = &sps->vui;
542 GetBitContext backup;
543 int sar_present, alt = 0;
545 av_log(avctx, AV_LOG_DEBUG, "Decoding VUI\n");
547 sar_present = get_bits1(gb);
// Aspect ratio: table lookup for indices inside vui_sar, explicit 16-bit
// num/den when the index is 255, otherwise a warning.
549 uint8_t sar_idx = get_bits(gb, 8);
550 if (sar_idx < FF_ARRAY_ELEMS(vui_sar))
551 vui->sar = vui_sar[sar_idx];
552 else if (sar_idx == 255) {
553 vui->sar.num = get_bits(gb, 16);
554 vui->sar.den = get_bits(gb, 16);
556 av_log(avctx, AV_LOG_WARNING,
557 "Unknown SAR index: %u.\n", sar_idx);
560 vui->overscan_info_present_flag = get_bits1(gb);
561 if (vui->overscan_info_present_flag)
562 vui->overscan_appropriate_flag = get_bits1(gb);
564 vui->video_signal_type_present_flag = get_bits1(gb);
565 if (vui->video_signal_type_present_flag) {
566 vui->video_format = get_bits(gb, 3);
567 vui->video_full_range_flag = get_bits1(gb);
568 vui->colour_description_present_flag = get_bits1(gb);
// Full-range 8-bit 4:2:0 is mapped to the "J" pixel format.
569 if (vui->video_full_range_flag && sps->pix_fmt == AV_PIX_FMT_YUV420P)
570 sps->pix_fmt = AV_PIX_FMT_YUVJ420P;
571 if (vui->colour_description_present_flag) {
572 vui->colour_primaries = get_bits(gb, 8);
573 vui->transfer_characteristic = get_bits(gb, 8);
574 vui->matrix_coeffs = get_bits(gb, 8);
576 // Set invalid values to "unspecified"
577 if (!av_color_primaries_name(vui->colour_primaries))
578 vui->colour_primaries = AVCOL_PRI_UNSPECIFIED;
579 if (!av_color_transfer_name(vui->transfer_characteristic))
580 vui->transfer_characteristic = AVCOL_TRC_UNSPECIFIED;
581 if (!av_color_space_name(vui->matrix_coeffs))
582 vui->matrix_coeffs = AVCOL_SPC_UNSPECIFIED;
// An RGB matrix switches the 4:4:4 YUV formats to their GBR counterparts.
583 if (vui->matrix_coeffs == AVCOL_SPC_RGB) {
584 switch (sps->pix_fmt) {
585 case AV_PIX_FMT_YUV444P:
586 sps->pix_fmt = AV_PIX_FMT_GBRP;
588 case AV_PIX_FMT_YUV444P10:
589 sps->pix_fmt = AV_PIX_FMT_GBRP10;
591 case AV_PIX_FMT_YUV444P12:
592 sps->pix_fmt = AV_PIX_FMT_GBRP12;
599 vui->chroma_loc_info_present_flag = get_bits1(gb);
600 if (vui->chroma_loc_info_present_flag) {
601 vui->chroma_sample_loc_type_top_field = get_ue_golomb_long(gb);
602 vui->chroma_sample_loc_type_bottom_field = get_ue_golomb_long(gb);
605 vui->neutra_chroma_indication_flag = get_bits1(gb);
606 vui->field_seq_flag = get_bits1(gb);
607 vui->frame_field_info_present_flag = get_bits1(gb);
// Heuristic: with at least 68 bits left and the next 21 bits equal to
// 0x100000, the default display window is treated as absent and a warning
// is logged.
609 if (get_bits_left(gb) >= 68 && show_bits_long(gb, 21) == 0x100000) {
610 vui->default_display_window_flag = 0;
611 av_log(avctx, AV_LOG_WARNING, "Invalid default display window\n");
613 vui->default_display_window_flag = get_bits1(gb);
614 // Backup context in case an alternate header is detected
615 memcpy(&backup, gb, sizeof(backup));
617 if (vui->default_display_window_flag) {
// Offset multipliers: vertical is 2 when chroma_format_idc < 2,
// horizontal is 2 when chroma_format_idc < 3; otherwise 1.
618 int vert_mult = 1 + (sps->chroma_format_idc < 2);
619 int horiz_mult = 1 + (sps->chroma_format_idc < 3);
620 vui->def_disp_win.left_offset = get_ue_golomb_long(gb) * horiz_mult;
621 vui->def_disp_win.right_offset = get_ue_golomb_long(gb) * horiz_mult;
622 vui->def_disp_win.top_offset = get_ue_golomb_long(gb) * vert_mult;
623 vui->def_disp_win.bottom_offset = get_ue_golomb_long(gb) * vert_mult;
// When cropping is to be ignored, log the parsed offsets and zero them.
625 if (apply_defdispwin &&
626 avctx->flags2 & AV_CODEC_FLAG2_IGNORE_CROP) {
627 av_log(avctx, AV_LOG_DEBUG,
628 "discarding vui default display window, "
629 "original values are l:%u r:%u t:%u b:%u\n",
630 vui->def_disp_win.left_offset,
631 vui->def_disp_win.right_offset,
632 vui->def_disp_win.top_offset,
633 vui->def_disp_win.bottom_offset);
635 vui->def_disp_win.left_offset =
636 vui->def_disp_win.right_offset =
637 vui->def_disp_win.top_offset =
638 vui->def_disp_win.bottom_offset = 0;
642 vui->vui_timing_info_present_flag = get_bits1(gb);
644 if (vui->vui_timing_info_present_flag) {
// Fewer than 66 bits left: rewind to the saved reader state and re-read
// the timing info with the display window cleared.
645 if( get_bits_left(gb) < 66) {
646 // The alternate syntax seems to have the timing info located
647 // where def_disp_win is normally located
648 av_log(avctx, AV_LOG_WARNING,
649 "Strange VUI timing information, retrying...\n");
650 vui->default_display_window_flag = 0;
651 memset(&vui->def_disp_win, 0, sizeof(vui->def_disp_win));
652 memcpy(gb, &backup, sizeof(backup));
655 vui->vui_num_units_in_tick = get_bits_long(gb, 32);
656 vui->vui_time_scale = get_bits_long(gb, 32);
// NOTE(review): the condition guarding this log call is not visible here.
658 av_log(avctx, AV_LOG_INFO, "Retry got %"PRIu32"/%"PRIu32" fps\n",
659 vui->vui_time_scale, vui->vui_num_units_in_tick);
661 vui->vui_poc_proportional_to_timing_flag = get_bits1(gb);
662 if (vui->vui_poc_proportional_to_timing_flag)
663 vui->vui_num_ticks_poc_diff_one_minus1 = get_ue_golomb_long(gb);
664 vui->vui_hrd_parameters_present_flag = get_bits1(gb);
// HRD data is parsed only to advance the reader; the return value of
// decode_hrd() is not checked on this line.
665 if (vui->vui_hrd_parameters_present_flag)
666 decode_hrd(gb, 1, sps->max_sub_layers);
669 vui->bitstream_restriction_flag = get_bits1(gb);
670 if (vui->bitstream_restriction_flag) {
671 vui->tiles_fixed_structure_flag = get_bits1(gb);
672 vui->motion_vectors_over_pic_boundaries_flag = get_bits1(gb);
673 vui->restricted_ref_pic_lists_flag = get_bits1(gb);
674 vui->min_spatial_segmentation_idc = get_ue_golomb_long(gb);
675 vui->max_bytes_per_pic_denom = get_ue_golomb_long(gb);
676 vui->max_bits_per_min_cu_denom = get_ue_golomb_long(gb);
677 vui->log2_max_mv_length_horizontal = get_ue_golomb_long(gb);
678 vui->log2_max_mv_length_vertical = get_ue_golomb_long(gb);
/*
 * Fill a ScalingList with default values.
 *
 * sl  destination: sl->sl[0][*] gets the flat value 16 (16 bytes each),
 *     both sl->sl_dc rows get 16, and sl->sl[1..3][*] get the intra table
 *     for matrices 0..2 and the inter table for matrices 3..5.
 */
682 static void set_default_scaling_list_data(ScalingList *sl)
686 for (matrixId = 0; matrixId < 6; matrixId++) {
// Size 0 lists: 16 entries, all set to 16.
688 memset(sl->sl[0][matrixId], 16, 16);
689 sl->sl_dc[0][matrixId] = 16; // default for 16x16
690 sl->sl_dc[1][matrixId] = 16; // default for 32x32
// Size 1: matrices 0..2 intra, 3..5 inter (64 bytes each).
692 memcpy(sl->sl[1][0], default_scaling_list_intra, 64);
693 memcpy(sl->sl[1][1], default_scaling_list_intra, 64);
694 memcpy(sl->sl[1][2], default_scaling_list_intra, 64);
695 memcpy(sl->sl[1][3], default_scaling_list_inter, 64);
696 memcpy(sl->sl[1][4], default_scaling_list_inter, 64);
697 memcpy(sl->sl[1][5], default_scaling_list_inter, 64);
// Size 2: same pattern.
698 memcpy(sl->sl[2][0], default_scaling_list_intra, 64);
699 memcpy(sl->sl[2][1], default_scaling_list_intra, 64);
700 memcpy(sl->sl[2][2], default_scaling_list_intra, 64);
701 memcpy(sl->sl[2][3], default_scaling_list_inter, 64);
702 memcpy(sl->sl[2][4], default_scaling_list_inter, 64);
703 memcpy(sl->sl[2][5], default_scaling_list_inter, 64);
// Size 3: same pattern.
704 memcpy(sl->sl[3][0], default_scaling_list_intra, 64);
705 memcpy(sl->sl[3][1], default_scaling_list_intra, 64);
706 memcpy(sl->sl[3][2], default_scaling_list_intra, 64);
707 memcpy(sl->sl[3][3], default_scaling_list_inter, 64);
708 memcpy(sl->sl[3][4], default_scaling_list_inter, 64);
709 memcpy(sl->sl[3][5], default_scaling_list_inter, 64);
/*
 * Parse explicitly coded scaling lists from gb into sl.
 *
 * gb     bit reader
 * avctx  logging context
 * sl     destination; expected to already hold defaults (see the comment
 *        on zero delta below)
 * sps    only sps->chroma_format_idc is read, for the final copy step
 *
 * Returns AVERROR_INVALIDDATA when a reference delta exceeds matrix_id.
 * NOTE(review): several `if`/`else` lines and the success return are not
 * visible in this excerpt.
 */
712 static int scaling_list_data(GetBitContext *gb, AVCodecContext *avctx, ScalingList *sl, HEVCSPS *sps)
714 uint8_t scaling_list_pred_mode_flag;
715 int32_t scaling_list_dc_coef[2][6];
716 int size_id, matrix_id, pos;
// Four sizes; for size_id 3 only matrices 0 and 3 are coded (step of 3).
719 for (size_id = 0; size_id < 4; size_id++)
720 for (matrix_id = 0; matrix_id < 6; matrix_id += ((size_id == 3) ? 3 : 1)) {
721 scaling_list_pred_mode_flag = get_bits1(gb);
// Flag 0: the list is predicted from an earlier matrix of the same size.
722 if (!scaling_list_pred_mode_flag) {
723 unsigned int delta = get_ue_golomb_long(gb);
724 /* Only need to handle non-zero delta. Zero means default,
725 * which should already be in the arrays. */
727 // Copy from previous array.
// The reference index matrix_id - delta must not go below 0.
728 if (matrix_id < delta) {
729 av_log(avctx, AV_LOG_ERROR,
730 "Invalid delta in scaling list data: %d.\n", delta);
731 return AVERROR_INVALIDDATA;
// 16 entries for size_id 0, 64 for the larger sizes.
734 memcpy(sl->sl[size_id][matrix_id],
735 sl->sl[size_id][matrix_id - delta],
736 size_id > 0 ? 64 : 16);
// DC value is copied too; sl_dc is indexed by size_id - 2.
// NOTE(review): the guard on size_id for this line is not visible here.
738 sl->sl_dc[size_id - 2][matrix_id] = sl->sl_dc[size_id - 2][matrix_id - delta];
// Flag 1: coefficients are coded explicitly as deltas.
741 int next_coef, coef_num;
742 int32_t scaling_list_delta_coef;
// 16 coefficients for size_id 0, capped at 64 for all larger sizes.
745 coef_num = FFMIN(64, 1 << (4 + (size_id << 1)));
// DC coefficient is coded as se(v) + 8 and seeds next_coef.
747 scaling_list_dc_coef[size_id - 2][matrix_id] = get_se_golomb(gb) + 8;
748 next_coef = scaling_list_dc_coef[size_id - 2][matrix_id];
749 sl->sl_dc[size_id - 2][matrix_id] = next_coef;
751 for (i = 0; i < coef_num; i++) {
// Map the coded order to a raster position via the diagonal scan tables
// (4-wide or 8-wide rows).
753 pos = 4 * ff_hevc_diag_scan4x4_y[i] +
754 ff_hevc_diag_scan4x4_x[i];
756 pos = 8 * ff_hevc_diag_scan8x8_y[i] +
757 ff_hevc_diag_scan8x8_x[i];
759 scaling_list_delta_coef = get_se_golomb(gb);
// Running sum kept in 0..255; the 256U operand makes the arithmetic unsigned.
760 next_coef = (next_coef + 256U + scaling_list_delta_coef) % 256;
761 sl->sl[size_id][matrix_id][pos] = next_coef;
// For chroma_format_idc 3, the size 3 matrices 1, 2, 4 and 5 (not coded
// above) are taken from size 2, including their DC values.
766 if (sps->chroma_format_idc == 3) {
767 for (i = 0; i < 64; i++) {
768 sl->sl[3][1][i] = sl->sl[2][1][i];
769 sl->sl[3][2][i] = sl->sl[2][2][i];
770 sl->sl[3][4][i] = sl->sl[2][4][i];
771 sl->sl[3][5][i] = sl->sl[2][5][i];
773 sl->sl_dc[1][1] = sl->sl_dc[0][1];
774 sl->sl_dc[1][2] = sl->sl_dc[0][2];
775 sl->sl_dc[1][4] = sl->sl_dc[0][4];
776 sl->sl_dc[1][5] = sl->sl_dc[0][5];
/*
 * Derive sps->pix_fmt from sps->bit_depth and sps->chroma_format_idc, then
 * fill the per-plane chroma shifts and sps->pixel_shift.
 *
 * avctx  logging context
 * sps    reads bit_depth and chroma_format_idc; writes pix_fmt, hshift[],
 *        vshift[] and pixel_shift
 *
 * Returns AVERROR_INVALIDDATA for an unsupported bit depth and
 * AVERROR(EINVAL) on the descriptor-lookup failure path.
 * NOTE(review): the `case` labels, `break`s and the success return are not
 * visible in this excerpt; the groups below presumably correspond to 8, 9,
 * 10 and 12 bits, matching the error message -- confirm against the full
 * file.
 */
783 static int map_pixel_format(AVCodecContext *avctx, HEVCSPS *sps)
785 const AVPixFmtDescriptor *desc;
786 switch (sps->bit_depth) {
// 8-bit formats: gray, 4:2:0, 4:2:2, 4:4:4 by chroma_format_idc 0..3.
788 if (sps->chroma_format_idc == 0) sps->pix_fmt = AV_PIX_FMT_GRAY8;
789 if (sps->chroma_format_idc == 1) sps->pix_fmt = AV_PIX_FMT_YUV420P;
790 if (sps->chroma_format_idc == 2) sps->pix_fmt = AV_PIX_FMT_YUV422P;
791 if (sps->chroma_format_idc == 3) sps->pix_fmt = AV_PIX_FMT_YUV444P;
// 9-bit YUV formats; the gray case uses GRAY16.
794 if (sps->chroma_format_idc == 0) sps->pix_fmt = AV_PIX_FMT_GRAY16;
795 if (sps->chroma_format_idc == 1) sps->pix_fmt = AV_PIX_FMT_YUV420P9;
796 if (sps->chroma_format_idc == 2) sps->pix_fmt = AV_PIX_FMT_YUV422P9;
797 if (sps->chroma_format_idc == 3) sps->pix_fmt = AV_PIX_FMT_YUV444P9;
// 10-bit formats.
800 if (sps->chroma_format_idc == 0) sps->pix_fmt = AV_PIX_FMT_GRAY10;
801 if (sps->chroma_format_idc == 1) sps->pix_fmt = AV_PIX_FMT_YUV420P10;
802 if (sps->chroma_format_idc == 2) sps->pix_fmt = AV_PIX_FMT_YUV422P10;
803 if (sps->chroma_format_idc == 3) sps->pix_fmt = AV_PIX_FMT_YUV444P10;
// 12-bit formats.
806 if (sps->chroma_format_idc == 0) sps->pix_fmt = AV_PIX_FMT_GRAY12;
807 if (sps->chroma_format_idc == 1) sps->pix_fmt = AV_PIX_FMT_YUV420P12;
808 if (sps->chroma_format_idc == 2) sps->pix_fmt = AV_PIX_FMT_YUV422P12;
809 if (sps->chroma_format_idc == 3) sps->pix_fmt = AV_PIX_FMT_YUV444P12;
// Any other bit depth is rejected.
812 av_log(avctx, AV_LOG_ERROR,
813 "The following bit-depths are currently specified: 8, 9, 10 and 12 bits, "
814 "chroma_format_idc is %d, depth is %d\n",
815 sps->chroma_format_idc, sps->bit_depth);
816 return AVERROR_INVALIDDATA;
// Look up the descriptor of the chosen format to obtain the chroma shifts.
819 desc = av_pix_fmt_desc_get(sps->pix_fmt);
821 return AVERROR(EINVAL);
// Plane 0 has no shift; planes 1 and 2 share the descriptor's chroma shifts.
823 sps->hshift[0] = sps->vshift[0] = 0;
824 sps->hshift[2] = sps->hshift[1] = desc->log2_chroma_w;
825 sps->vshift[2] = sps->vshift[1] = desc->log2_chroma_h;
// 1 when bit_depth exceeds 8, else 0.
827 sps->pixel_shift = sps->bit_depth > 8;
832 int ff_hevc_parse_sps(HEVCSPS *sps, GetBitContext *gb, unsigned int *sps_id,
833 int apply_defdispwin, AVBufferRef **vps_list, AVCodecContext *avctx)
837 int log2_diff_max_min_transform_block_size;
838 int bit_depth_chroma, start, vui_present, sublayer_ordering_info;
843 sps->vps_id = get_bits(gb, 4);
844 if (sps->vps_id >= HEVC_MAX_VPS_COUNT) {
845 av_log(avctx, AV_LOG_ERROR, "VPS id out of range: %d\n", sps->vps_id);
846 return AVERROR_INVALIDDATA;
849 if (vps_list && !vps_list[sps->vps_id]) {
850 av_log(avctx, AV_LOG_ERROR, "VPS %d does not exist\n",
852 return AVERROR_INVALIDDATA;
855 sps->max_sub_layers = get_bits(gb, 3) + 1;
856 if (sps->max_sub_layers > HEVC_MAX_SUB_LAYERS) {
857 av_log(avctx, AV_LOG_ERROR, "sps_max_sub_layers out of range: %d\n",
858 sps->max_sub_layers);
859 return AVERROR_INVALIDDATA;
862 skip_bits1(gb); // temporal_id_nesting_flag
864 if ((ret = parse_ptl(gb, avctx, &sps->ptl, sps->max_sub_layers)) < 0)
867 *sps_id = get_ue_golomb_long(gb);
868 if (*sps_id >= HEVC_MAX_SPS_COUNT) {
869 av_log(avctx, AV_LOG_ERROR, "SPS id out of range: %d\n", *sps_id);
870 return AVERROR_INVALIDDATA;
873 sps->chroma_format_idc = get_ue_golomb_long(gb);
874 if (sps->chroma_format_idc > 3U) {
875 av_log(avctx, AV_LOG_ERROR, "chroma_format_idc %d is invalid\n", sps->chroma_format_idc);
876 return AVERROR_INVALIDDATA;
879 if (sps->chroma_format_idc == 3)
880 sps->separate_colour_plane_flag = get_bits1(gb);
882 if (sps->separate_colour_plane_flag)
883 sps->chroma_format_idc = 0;
885 sps->width = get_ue_golomb_long(gb);
886 sps->height = get_ue_golomb_long(gb);
887 if ((ret = av_image_check_size(sps->width,
888 sps->height, 0, avctx)) < 0)
891 if (get_bits1(gb)) { // pic_conformance_flag
892 int vert_mult = 1 + (sps->chroma_format_idc < 2);
893 int horiz_mult = 1 + (sps->chroma_format_idc < 3);
894 sps->pic_conf_win.left_offset = get_ue_golomb_long(gb) * horiz_mult;
895 sps->pic_conf_win.right_offset = get_ue_golomb_long(gb) * horiz_mult;
896 sps->pic_conf_win.top_offset = get_ue_golomb_long(gb) * vert_mult;
897 sps->pic_conf_win.bottom_offset = get_ue_golomb_long(gb) * vert_mult;
899 if (avctx->flags2 & AV_CODEC_FLAG2_IGNORE_CROP) {
900 av_log(avctx, AV_LOG_DEBUG,
901 "discarding sps conformance window, "
902 "original values are l:%u r:%u t:%u b:%u\n",
903 sps->pic_conf_win.left_offset,
904 sps->pic_conf_win.right_offset,
905 sps->pic_conf_win.top_offset,
906 sps->pic_conf_win.bottom_offset);
908 sps->pic_conf_win.left_offset =
909 sps->pic_conf_win.right_offset =
910 sps->pic_conf_win.top_offset =
911 sps->pic_conf_win.bottom_offset = 0;
913 sps->output_window = sps->pic_conf_win;
916 sps->bit_depth = get_ue_golomb_long(gb) + 8;
917 bit_depth_chroma = get_ue_golomb_long(gb) + 8;
918 if (sps->chroma_format_idc && bit_depth_chroma != sps->bit_depth) {
919 av_log(avctx, AV_LOG_ERROR,
920 "Luma bit depth (%d) is different from chroma bit depth (%d), "
921 "this is unsupported.\n",
922 sps->bit_depth, bit_depth_chroma);
923 return AVERROR_INVALIDDATA;
926 ret = map_pixel_format(avctx, sps);
930 sps->log2_max_poc_lsb = get_ue_golomb_long(gb) + 4;
931 if (sps->log2_max_poc_lsb > 16) {
932 av_log(avctx, AV_LOG_ERROR, "log2_max_pic_order_cnt_lsb_minus4 out range: %d\n",
933 sps->log2_max_poc_lsb - 4);
934 return AVERROR_INVALIDDATA;
937 sublayer_ordering_info = get_bits1(gb);
938 start = sublayer_ordering_info ? 0 : sps->max_sub_layers - 1;
939 for (i = start; i < sps->max_sub_layers; i++) {
940 sps->temporal_layer[i].max_dec_pic_buffering = get_ue_golomb_long(gb) + 1;
941 sps->temporal_layer[i].num_reorder_pics = get_ue_golomb_long(gb);
942 sps->temporal_layer[i].max_latency_increase = get_ue_golomb_long(gb) - 1;
943 if (sps->temporal_layer[i].max_dec_pic_buffering > HEVC_MAX_DPB_SIZE) {
944 av_log(avctx, AV_LOG_ERROR, "sps_max_dec_pic_buffering_minus1 out of range: %d\n",
945 sps->temporal_layer[i].max_dec_pic_buffering - 1);
946 return AVERROR_INVALIDDATA;
948 if (sps->temporal_layer[i].num_reorder_pics > sps->temporal_layer[i].max_dec_pic_buffering - 1) {
949 av_log(avctx, AV_LOG_WARNING, "sps_max_num_reorder_pics out of range: %d\n",
950 sps->temporal_layer[i].num_reorder_pics);
951 if (avctx->err_recognition & AV_EF_EXPLODE ||
952 sps->temporal_layer[i].num_reorder_pics > HEVC_MAX_DPB_SIZE - 1) {
953 return AVERROR_INVALIDDATA;
955 sps->temporal_layer[i].max_dec_pic_buffering = sps->temporal_layer[i].num_reorder_pics + 1;
959 if (!sublayer_ordering_info) {
960 for (i = 0; i < start; i++) {
961 sps->temporal_layer[i].max_dec_pic_buffering = sps->temporal_layer[start].max_dec_pic_buffering;
962 sps->temporal_layer[i].num_reorder_pics = sps->temporal_layer[start].num_reorder_pics;
963 sps->temporal_layer[i].max_latency_increase = sps->temporal_layer[start].max_latency_increase;
967 sps->log2_min_cb_size = get_ue_golomb_long(gb) + 3;
968 sps->log2_diff_max_min_coding_block_size = get_ue_golomb_long(gb);
969 sps->log2_min_tb_size = get_ue_golomb_long(gb) + 2;
970 log2_diff_max_min_transform_block_size = get_ue_golomb_long(gb);
971 sps->log2_max_trafo_size = log2_diff_max_min_transform_block_size +
972 sps->log2_min_tb_size;
974 if (sps->log2_min_cb_size < 3 || sps->log2_min_cb_size > 30) {
975 av_log(avctx, AV_LOG_ERROR, "Invalid value %d for log2_min_cb_size", sps->log2_min_cb_size);
976 return AVERROR_INVALIDDATA;
979 if (sps->log2_diff_max_min_coding_block_size > 30) {
980 av_log(avctx, AV_LOG_ERROR, "Invalid value %d for log2_diff_max_min_coding_block_size", sps->log2_diff_max_min_coding_block_size);
981 return AVERROR_INVALIDDATA;
984 if (sps->log2_min_tb_size >= sps->log2_min_cb_size || sps->log2_min_tb_size < 2) {
985 av_log(avctx, AV_LOG_ERROR, "Invalid value for log2_min_tb_size");
986 return AVERROR_INVALIDDATA;
989 if (log2_diff_max_min_transform_block_size < 0 || log2_diff_max_min_transform_block_size > 30) {
990 av_log(avctx, AV_LOG_ERROR, "Invalid value %d for log2_diff_max_min_transform_block_size", log2_diff_max_min_transform_block_size);
991 return AVERROR_INVALIDDATA;
994 sps->max_transform_hierarchy_depth_inter = get_ue_golomb_long(gb);
995 sps->max_transform_hierarchy_depth_intra = get_ue_golomb_long(gb);
997 sps->scaling_list_enable_flag = get_bits1(gb);
998 if (sps->scaling_list_enable_flag) {
999 set_default_scaling_list_data(&sps->scaling_list);
1001 if (get_bits1(gb)) {
1002 ret = scaling_list_data(gb, avctx, &sps->scaling_list, sps);
1008 sps->amp_enabled_flag = get_bits1(gb);
1009 sps->sao_enabled = get_bits1(gb);
1011 sps->pcm_enabled_flag = get_bits1(gb);
1012 if (sps->pcm_enabled_flag) {
1013 sps->pcm.bit_depth = get_bits(gb, 4) + 1;
1014 sps->pcm.bit_depth_chroma = get_bits(gb, 4) + 1;
1015 sps->pcm.log2_min_pcm_cb_size = get_ue_golomb_long(gb) + 3;
1016 sps->pcm.log2_max_pcm_cb_size = sps->pcm.log2_min_pcm_cb_size +
1017 get_ue_golomb_long(gb);
1018 if (sps->pcm.bit_depth > sps->bit_depth) {
1019 av_log(avctx, AV_LOG_ERROR,
1020 "PCM bit depth (%d) is greater than normal bit depth (%d)\n",
1021 sps->pcm.bit_depth, sps->bit_depth);
1022 return AVERROR_INVALIDDATA;
1025 sps->pcm.loop_filter_disable_flag = get_bits1(gb);
1028 sps->nb_st_rps = get_ue_golomb_long(gb);
1029 if (sps->nb_st_rps > HEVC_MAX_SHORT_TERM_RPS_COUNT) {
1030 av_log(avctx, AV_LOG_ERROR, "Too many short term RPS: %d.\n",
1032 return AVERROR_INVALIDDATA;
1034 for (i = 0; i < sps->nb_st_rps; i++) {
1035 if ((ret = ff_hevc_decode_short_term_rps(gb, avctx, &sps->st_rps[i],
1040 sps->long_term_ref_pics_present_flag = get_bits1(gb);
1041 if (sps->long_term_ref_pics_present_flag) {
1042 sps->num_long_term_ref_pics_sps = get_ue_golomb_long(gb);
1043 if (sps->num_long_term_ref_pics_sps > 31U) {
1044 av_log(avctx, AV_LOG_ERROR, "num_long_term_ref_pics_sps %d is out of range.\n",
1045 sps->num_long_term_ref_pics_sps);
1046 return AVERROR_INVALIDDATA;
1048 for (i = 0; i < sps->num_long_term_ref_pics_sps; i++) {
1049 sps->lt_ref_pic_poc_lsb_sps[i] = get_bits(gb, sps->log2_max_poc_lsb);
1050 sps->used_by_curr_pic_lt_sps_flag[i] = get_bits1(gb);
1054 sps->sps_temporal_mvp_enabled_flag = get_bits1(gb);
1055 sps->sps_strong_intra_smoothing_enable_flag = get_bits1(gb);
1056 sps->vui.sar = (AVRational){0, 1};
1057 vui_present = get_bits1(gb);
1059 decode_vui(gb, avctx, apply_defdispwin, sps);
1061 if (get_bits1(gb)) { // sps_extension_flag
1062 int sps_extension_flag[1];
1063 for (i = 0; i < 1; i++)
1064 sps_extension_flag[i] = get_bits1(gb);
1065 skip_bits(gb, 7); //sps_extension_7bits = get_bits(gb, 7);
1066 if (sps_extension_flag[0]) {
1067 int extended_precision_processing_flag;
1068 int high_precision_offsets_enabled_flag;
1069 int cabac_bypass_alignment_enabled_flag;
1071 sps->transform_skip_rotation_enabled_flag = get_bits1(gb);
1072 sps->transform_skip_context_enabled_flag = get_bits1(gb);
1073 sps->implicit_rdpcm_enabled_flag = get_bits1(gb);
1075 sps->explicit_rdpcm_enabled_flag = get_bits1(gb);
1077 extended_precision_processing_flag = get_bits1(gb);
1078 if (extended_precision_processing_flag)
1079 av_log(avctx, AV_LOG_WARNING,
1080 "extended_precision_processing_flag not yet implemented\n");
1082 sps->intra_smoothing_disabled_flag = get_bits1(gb);
1083 high_precision_offsets_enabled_flag = get_bits1(gb);
1084 if (high_precision_offsets_enabled_flag)
1085 av_log(avctx, AV_LOG_WARNING,
1086 "high_precision_offsets_enabled_flag not yet implemented\n");
1088 sps->persistent_rice_adaptation_enabled_flag = get_bits1(gb);
1090 cabac_bypass_alignment_enabled_flag = get_bits1(gb);
1091 if (cabac_bypass_alignment_enabled_flag)
1092 av_log(avctx, AV_LOG_WARNING,
1093 "cabac_bypass_alignment_enabled_flag not yet implemented\n");
1096 if (apply_defdispwin) {
1097 sps->output_window.left_offset += sps->vui.def_disp_win.left_offset;
1098 sps->output_window.right_offset += sps->vui.def_disp_win.right_offset;
1099 sps->output_window.top_offset += sps->vui.def_disp_win.top_offset;
1100 sps->output_window.bottom_offset += sps->vui.def_disp_win.bottom_offset;
1103 ow = &sps->output_window;
1104 if (ow->left_offset >= INT_MAX - ow->right_offset ||
1105 ow->top_offset >= INT_MAX - ow->bottom_offset ||
1106 ow->left_offset + ow->right_offset >= sps->width ||
1107 ow->top_offset + ow->bottom_offset >= sps->height) {
1108 av_log(avctx, AV_LOG_WARNING, "Invalid cropping offsets: %u/%u/%u/%u\n",
1109 ow->left_offset, ow->right_offset, ow->top_offset, ow->bottom_offset);
1110 if (avctx->err_recognition & AV_EF_EXPLODE) {
1111 return AVERROR_INVALIDDATA;
1113 av_log(avctx, AV_LOG_WARNING,
1114 "Displaying the whole video surface.\n");
1115 memset(ow, 0, sizeof(*ow));
1116 memset(&sps->pic_conf_win, 0, sizeof(sps->pic_conf_win));
1119 // Inferred parameters
1120 sps->log2_ctb_size = sps->log2_min_cb_size +
1121 sps->log2_diff_max_min_coding_block_size;
1122 sps->log2_min_pu_size = sps->log2_min_cb_size - 1;
1124 if (sps->log2_ctb_size > HEVC_MAX_LOG2_CTB_SIZE) {
1125 av_log(avctx, AV_LOG_ERROR, "CTB size out of range: 2^%d\n", sps->log2_ctb_size);
1126 return AVERROR_INVALIDDATA;
1128 if (sps->log2_ctb_size < 4) {
1131 "log2_ctb_size %d differs from the bounds of any known profile\n",
1132 sps->log2_ctb_size);
1133 avpriv_request_sample(avctx, "log2_ctb_size %d", sps->log2_ctb_size);
1134 return AVERROR_INVALIDDATA;
1137 sps->ctb_width = (sps->width + (1 << sps->log2_ctb_size) - 1) >> sps->log2_ctb_size;
1138 sps->ctb_height = (sps->height + (1 << sps->log2_ctb_size) - 1) >> sps->log2_ctb_size;
1139 sps->ctb_size = sps->ctb_width * sps->ctb_height;
1141 sps->min_cb_width = sps->width >> sps->log2_min_cb_size;
1142 sps->min_cb_height = sps->height >> sps->log2_min_cb_size;
1143 sps->min_tb_width = sps->width >> sps->log2_min_tb_size;
1144 sps->min_tb_height = sps->height >> sps->log2_min_tb_size;
1145 sps->min_pu_width = sps->width >> sps->log2_min_pu_size;
1146 sps->min_pu_height = sps->height >> sps->log2_min_pu_size;
1147 sps->tb_mask = (1 << (sps->log2_ctb_size - sps->log2_min_tb_size)) - 1;
1149 sps->qp_bd_offset = 6 * (sps->bit_depth - 8);
1151 if (av_mod_uintp2(sps->width, sps->log2_min_cb_size) ||
1152 av_mod_uintp2(sps->height, sps->log2_min_cb_size)) {
1153 av_log(avctx, AV_LOG_ERROR, "Invalid coded frame dimensions.\n");
1154 return AVERROR_INVALIDDATA;
1157 if (sps->max_transform_hierarchy_depth_inter > sps->log2_ctb_size - sps->log2_min_tb_size) {
1158 av_log(avctx, AV_LOG_ERROR, "max_transform_hierarchy_depth_inter out of range: %d\n",
1159 sps->max_transform_hierarchy_depth_inter);
1160 return AVERROR_INVALIDDATA;
1162 if (sps->max_transform_hierarchy_depth_intra > sps->log2_ctb_size - sps->log2_min_tb_size) {
1163 av_log(avctx, AV_LOG_ERROR, "max_transform_hierarchy_depth_intra out of range: %d\n",
1164 sps->max_transform_hierarchy_depth_intra);
1165 return AVERROR_INVALIDDATA;
1167 if (sps->log2_max_trafo_size > FFMIN(sps->log2_ctb_size, 5)) {
1168 av_log(avctx, AV_LOG_ERROR,
1169 "max transform block size out of range: %d\n",
1170 sps->log2_max_trafo_size);
1171 return AVERROR_INVALIDDATA;
1174 if (get_bits_left(gb) < 0) {
1175 av_log(avctx, AV_LOG_ERROR,
1176 "Overread SPS by %d bits\n", -get_bits_left(gb));
1177 return AVERROR_INVALIDDATA;
1183 int ff_hevc_decode_nal_sps(GetBitContext *gb, AVCodecContext *avctx,
1184 HEVCParamSets *ps, int apply_defdispwin)
1187 AVBufferRef *sps_buf = av_buffer_allocz(sizeof(*sps));
1188 unsigned int sps_id;
1193 return AVERROR(ENOMEM);
1194 sps = (HEVCSPS*)sps_buf->data;
1196 av_log(avctx, AV_LOG_DEBUG, "Decoding SPS\n");
1198 nal_size = gb->buffer_end - gb->buffer;
1199 if (nal_size > sizeof(sps->data)) {
1200 av_log(avctx, AV_LOG_WARNING, "Truncating likely oversized SPS "
1201 "(%"PTRDIFF_SPECIFIER" > %"SIZE_SPECIFIER")\n",
1202 nal_size, sizeof(sps->data));
1203 sps->data_size = sizeof(sps->data);
1205 sps->data_size = nal_size;
1207 memcpy(sps->data, gb->buffer, sps->data_size);
1209 ret = ff_hevc_parse_sps(sps, gb, &sps_id,
1211 ps->vps_list, avctx);
1213 av_buffer_unref(&sps_buf);
1217 if (avctx->debug & FF_DEBUG_BITSTREAM) {
1218 av_log(avctx, AV_LOG_DEBUG,
1219 "Parsed SPS: id %d; coded wxh: %dx%d; "
1220 "cropped wxh: %dx%d; pix_fmt: %s.\n",
1221 sps_id, sps->width, sps->height,
1222 sps->width - (sps->output_window.left_offset + sps->output_window.right_offset),
1223 sps->height - (sps->output_window.top_offset + sps->output_window.bottom_offset),
1224 av_get_pix_fmt_name(sps->pix_fmt));
1227 /* check if this is a repeat of an already parsed SPS, then keep the
1229 * otherwise drop all PPSes that depend on it */
1230 if (ps->sps_list[sps_id] &&
1231 !memcmp(ps->sps_list[sps_id]->data, sps_buf->data, sps_buf->size)) {
1232 av_buffer_unref(&sps_buf);
1234 remove_sps(ps, sps_id);
1235 ps->sps_list[sps_id] = sps_buf;
1241 static void hevc_pps_free(void *opaque, uint8_t *data)
1243 HEVCPPS *pps = (HEVCPPS*)data;
1245 av_freep(&pps->column_width);
1246 av_freep(&pps->row_height);
1247 av_freep(&pps->col_bd);
1248 av_freep(&pps->row_bd);
1249 av_freep(&pps->col_idxX);
1250 av_freep(&pps->ctb_addr_rs_to_ts);
1251 av_freep(&pps->ctb_addr_ts_to_rs);
1252 av_freep(&pps->tile_pos_rs);
1253 av_freep(&pps->tile_id);
1254 av_freep(&pps->min_tb_addr_zs_tab);
1259 static int pps_range_extensions(GetBitContext *gb, AVCodecContext *avctx,
1260 HEVCPPS *pps, HEVCSPS *sps) {
1263 if (pps->transform_skip_enabled_flag) {
1264 pps->log2_max_transform_skip_block_size = get_ue_golomb_long(gb) + 2;
1266 pps->cross_component_prediction_enabled_flag = get_bits1(gb);
1267 pps->chroma_qp_offset_list_enabled_flag = get_bits1(gb);
1268 if (pps->chroma_qp_offset_list_enabled_flag) {
1269 pps->diff_cu_chroma_qp_offset_depth = get_ue_golomb_long(gb);
1270 pps->chroma_qp_offset_list_len_minus1 = get_ue_golomb_long(gb);
1271 if (pps->chroma_qp_offset_list_len_minus1 && pps->chroma_qp_offset_list_len_minus1 >= 5) {
1272 av_log(avctx, AV_LOG_ERROR,
1273 "chroma_qp_offset_list_len_minus1 shall be in the range [0, 5].\n");
1274 return AVERROR_INVALIDDATA;
1276 for (i = 0; i <= pps->chroma_qp_offset_list_len_minus1; i++) {
1277 pps->cb_qp_offset_list[i] = get_se_golomb_long(gb);
1278 if (pps->cb_qp_offset_list[i]) {
1279 av_log(avctx, AV_LOG_WARNING,
1280 "cb_qp_offset_list not tested yet.\n");
1282 pps->cr_qp_offset_list[i] = get_se_golomb_long(gb);
1283 if (pps->cr_qp_offset_list[i]) {
1284 av_log(avctx, AV_LOG_WARNING,
1285 "cb_qp_offset_list not tested yet.\n");
1289 pps->log2_sao_offset_scale_luma = get_ue_golomb_long(gb);
1290 pps->log2_sao_offset_scale_chroma = get_ue_golomb_long(gb);
/*
 * Derive the per-PPS lookup tables from the parsed PPS and its SPS:
 * tile column/row boundaries, the CTB-column-to-tile-column map, the
 * raster-scan <-> tile-scan CTB address maps, the tile id of every CTB,
 * the raster address of each tile's first CTB, and the z-scan address
 * table for minimum transform blocks.
 *
 * Returns AVERROR(ENOMEM) when any table cannot be allocated. Nothing is
 * freed here on failure; the tables stay attached to pps.
 *
 * NOTE(review): several short lines of this function (braces, a few
 * initialisations and the final return) are not visible in this excerpt;
 * the comments below describe only what the visible lines do.
 */
1295 static inline int setup_pps(AVCodecContext *avctx, GetBitContext *gb,
1296 HEVCPPS *pps, HEVCSPS *sps)
1299 int pic_area_in_ctbs;
1300 int i, j, x, y, ctb_addr_rs, tile_id;
1302 // Inferred parameters
/* Boundary arrays hold one more entry than there are tile columns/rows. */
1303 pps->col_bd = av_malloc_array(pps->num_tile_columns + 1, sizeof(*pps->col_bd));
1304 pps->row_bd = av_malloc_array(pps->num_tile_rows + 1, sizeof(*pps->row_bd));
1305 pps->col_idxX = av_malloc_array(sps->ctb_width, sizeof(*pps->col_idxX));
1306 if (!pps->col_bd || !pps->row_bd || !pps->col_idxX)
1307 return AVERROR(ENOMEM);
/* With uniform spacing the tile sizes are computed here; the size arrays
 * are allocated only if the caller has not already done so. */
1309 if (pps->uniform_spacing_flag) {
1310 if (!pps->column_width) {
1311 pps->column_width = av_malloc_array(pps->num_tile_columns, sizeof(*pps->column_width));
1312 pps->row_height = av_malloc_array(pps->num_tile_rows, sizeof(*pps->row_height));
1314 if (!pps->column_width || !pps->row_height)
1315 return AVERROR(ENOMEM);
/* Split ctb_width / ctb_height as evenly as integer division allows. */
1317 for (i = 0; i < pps->num_tile_columns; i++) {
1318 pps->column_width[i] = ((i + 1) * sps->ctb_width) / pps->num_tile_columns -
1319 (i * sps->ctb_width) / pps->num_tile_columns;
1322 for (i = 0; i < pps->num_tile_rows; i++) {
1323 pps->row_height[i] = ((i + 1) * sps->ctb_height) / pps->num_tile_rows -
1324 (i * sps->ctb_height) / pps->num_tile_rows;
/* Boundaries are running sums of the tile widths / heights. */
1329 for (i = 0; i < pps->num_tile_columns; i++)
1330 pps->col_bd[i + 1] = pps->col_bd[i] + pps->column_width[i];
1333 for (i = 0; i < pps->num_tile_rows; i++)
1334 pps->row_bd[i + 1] = pps->row_bd[i] + pps->row_height[i];
/* Record an index j for every CTB column, compared against col_bd[j]. */
1336 for (i = 0, j = 0; i < sps->ctb_width; i++) {
1337 if (i > pps->col_bd[j])
1339 pps->col_idxX[i] = j;
1345 pic_area_in_ctbs = sps->ctb_width * sps->ctb_height;
1347 pps->ctb_addr_rs_to_ts = av_malloc_array(pic_area_in_ctbs, sizeof(*pps->ctb_addr_rs_to_ts));
1348 pps->ctb_addr_ts_to_rs = av_malloc_array(pic_area_in_ctbs, sizeof(*pps->ctb_addr_ts_to_rs));
1349 pps->tile_id = av_malloc_array(pic_area_in_ctbs, sizeof(*pps->tile_id));
/* The z-scan table is (tb_mask + 2) entries wide and high. */
1350 pps->min_tb_addr_zs_tab = av_malloc_array((sps->tb_mask+2) * (sps->tb_mask+2), sizeof(*pps->min_tb_addr_zs_tab));
1351 if (!pps->ctb_addr_rs_to_ts || !pps->ctb_addr_ts_to_rs ||
1352 !pps->tile_id || !pps->min_tb_addr_zs_tab) {
1353 return AVERROR(ENOMEM);
/* For every CTB in raster order, work out its address in tile-scan order
 * (val) and fill both directions of the mapping. */
1356 for (ctb_addr_rs = 0; ctb_addr_rs < pic_area_in_ctbs; ctb_addr_rs++) {
1357 int tb_x = ctb_addr_rs % sps->ctb_width;
1358 int tb_y = ctb_addr_rs / sps->ctb_width;
/* Find the tile column / row whose boundary range contains this CTB. */
1363 for (i = 0; i < pps->num_tile_columns; i++) {
1364 if (tb_x < pps->col_bd[i + 1]) {
1370 for (i = 0; i < pps->num_tile_rows; i++) {
1371 if (tb_y < pps->row_bd[i + 1]) {
/* CTBs in tiles to the left within the same tile row ... */
1377 for (i = 0; i < tile_x; i++)
1378 val += pps->row_height[tile_y] * pps->column_width[i];
/* ... plus all CTBs in the tile rows above ... */
1379 for (i = 0; i < tile_y; i++)
1380 val += sps->ctb_width * pps->row_height[i];
/* ... plus the raster offset of the CTB inside its own tile. */
1382 val += (tb_y - pps->row_bd[tile_y]) * pps->column_width[tile_x] +
1383 tb_x - pps->col_bd[tile_x];
1385 pps->ctb_addr_rs_to_ts[ctb_addr_rs] = val;
1386 pps->ctb_addr_ts_to_rs[val] = ctb_addr_rs;
/* Tiles are numbered row by row; tile_id[] is indexed by tile-scan address. */
1389 for (j = 0, tile_id = 0; j < pps->num_tile_rows; j++)
1390 for (i = 0; i < pps->num_tile_columns; i++, tile_id++)
1391 for (y = pps->row_bd[j]; y < pps->row_bd[j + 1]; y++)
1392 for (x = pps->col_bd[i]; x < pps->col_bd[i + 1]; x++)
1393 pps->tile_id[pps->ctb_addr_rs_to_ts[y * sps->ctb_width + x]] = tile_id;
/* After the loops above tile_id equals the number of tiles. */
1395 pps->tile_pos_rs = av_malloc_array(tile_id, sizeof(*pps->tile_pos_rs));
1396 if (!pps->tile_pos_rs)
1397 return AVERROR(ENOMEM);
/* Raster-scan address of the top-left CTB of each tile. */
1399 for (j = 0; j < pps->num_tile_rows; j++)
1400 for (i = 0; i < pps->num_tile_columns; i++)
1401 pps->tile_pos_rs[j * pps->num_tile_columns + i] =
1402 pps->row_bd[j] * sps->ctb_width + pps->col_bd[i];
1404 log2_diff = sps->log2_ctb_size - sps->log2_min_tb_size;
/* min_tb_addr_zs points one row and one column into the table, so that
 * index -1 in either direction lands on the border filled with -1 below. */
1405 pps->min_tb_addr_zs = &pps->min_tb_addr_zs_tab[1*(sps->tb_mask+2)+1];
1406 for (y = 0; y < sps->tb_mask+2; y++) {
1407 pps->min_tb_addr_zs_tab[y*(sps->tb_mask+2)] = -1;
1408 pps->min_tb_addr_zs_tab[y] = -1;
/* Fill the interior: the CTB's tile-scan address goes in the high bits,
 * the bits of x and y are accumulated into the low bits. */
1410 for (y = 0; y < sps->tb_mask+1; y++) {
1411 for (x = 0; x < sps->tb_mask+1; x++) {
1412 int tb_x = x >> log2_diff;
1413 int tb_y = y >> log2_diff;
1414 int rs = sps->ctb_width * tb_y + tb_x;
1415 int val = pps->ctb_addr_rs_to_ts[rs] << (log2_diff * 2);
1416 for (i = 0; i < log2_diff; i++) {
/* x contributes m*m and y contributes 2*m*m for each set bit m. */
1418 val += (m & x ? m * m : 0) + (m & y ? 2 * m * m : 0);
1420 pps->min_tb_addr_zs[y * (sps->tb_mask+2) + x] = val;
/*
 * Decode one PPS NAL unit and store it in ps->pps_list[pps_id].
 *
 * A zeroed HEVCPPS is allocated and wrapped in an AVBufferRef whose free
 * callback is hevc_pps_free(). The raw payload is copied into pps->data
 * (clipped to its size), defaults are set, the syntax elements are read in
 * bitstream order and range-checked against the referenced SPS, and
 * setup_pps() builds the derived tables. On success any previous PPS with
 * the same id is removed via remove_pps() and replaced.
 *
 * Returns AVERROR(ENOMEM) on allocation failure; validation failures set
 * ret to AVERROR_INVALIDDATA.
 *
 * NOTE(review): the error label, the jumps to it and the final return are
 * not visible in this excerpt; presumably every failure path ends at the
 * av_buffer_unref(&pps_buf) on the last line - confirm against the full
 * file.
 */
1427 int ff_hevc_decode_nal_pps(GetBitContext *gb, AVCodecContext *avctx,
1430 HEVCSPS *sps = NULL;
1432 unsigned int pps_id = 0;
1435 AVBufferRef *pps_buf;
1436 HEVCPPS *pps = av_mallocz(sizeof(*pps));
1439 return AVERROR(ENOMEM);
/* Hand ownership of pps to a refcounted buffer freed by hevc_pps_free(). */
1441 pps_buf = av_buffer_create((uint8_t *)pps, sizeof(*pps),
1442 hevc_pps_free, NULL, 0);
1445 return AVERROR(ENOMEM);
1448 av_log(avctx, AV_LOG_DEBUG, "Decoding PPS\n");
/* Keep a copy of the raw NAL payload, clipped to sizeof(pps->data). */
1450 nal_size = gb->buffer_end - gb->buffer;
1451 if (nal_size > sizeof(pps->data)) {
1452 av_log(avctx, AV_LOG_WARNING, "Truncating likely oversized PPS "
1453 "(%"PTRDIFF_SPECIFIER" > %"SIZE_SPECIFIER")\n",
1454 nal_size, sizeof(pps->data));
1455 pps->data_size = sizeof(pps->data);
1457 pps->data_size = nal_size;
1459 memcpy(pps->data, gb->buffer, pps->data_size);
/* Values used when the corresponding syntax elements are absent. */
1462 pps->loop_filter_across_tiles_enabled_flag = 1;
1463 pps->num_tile_columns = 1;
1464 pps->num_tile_rows = 1;
1465 pps->uniform_spacing_flag = 1;
1466 pps->disable_dbf = 0;
1467 pps->beta_offset = 0;
1469 pps->log2_max_transform_skip_block_size = 2;
/* Syntax elements, in bitstream order. The ids are range-checked before
 * they are used as indices into the parameter-set lists. */
1472 pps_id = get_ue_golomb_long(gb);
1473 if (pps_id >= HEVC_MAX_PPS_COUNT) {
1474 av_log(avctx, AV_LOG_ERROR, "PPS id out of range: %d\n", pps_id);
1475 ret = AVERROR_INVALIDDATA;
1478 pps->sps_id = get_ue_golomb_long(gb);
1479 if (pps->sps_id >= HEVC_MAX_SPS_COUNT) {
1480 av_log(avctx, AV_LOG_ERROR, "SPS id out of range: %d\n", pps->sps_id);
1481 ret = AVERROR_INVALIDDATA;
/* The referenced SPS must already have been decoded. */
1484 if (!ps->sps_list[pps->sps_id]) {
1485 av_log(avctx, AV_LOG_ERROR, "SPS %u does not exist.\n", pps->sps_id);
1486 ret = AVERROR_INVALIDDATA;
1489 sps = (HEVCSPS *)ps->sps_list[pps->sps_id]->data;
1491 pps->dependent_slice_segments_enabled_flag = get_bits1(gb);
1492 pps->output_flag_present_flag = get_bits1(gb);
1493 pps->num_extra_slice_header_bits = get_bits(gb, 3);
1495 pps->sign_data_hiding_flag = get_bits1(gb);
1497 pps->cabac_init_present_flag = get_bits1(gb);
/* Coded as "minus 1" values, hence the + 1. */
1499 pps->num_ref_idx_l0_default_active = get_ue_golomb_long(gb) + 1;
1500 pps->num_ref_idx_l1_default_active = get_ue_golomb_long(gb) + 1;
1502 pps->pic_init_qp_minus26 = get_se_golomb(gb);
1504 pps->constrained_intra_pred_flag = get_bits1(gb);
1505 pps->transform_skip_enabled_flag = get_bits1(gb);
1507 pps->cu_qp_delta_enabled_flag = get_bits1(gb);
1508 pps->diff_cu_qp_delta_depth = 0;
1509 if (pps->cu_qp_delta_enabled_flag)
1510 pps->diff_cu_qp_delta_depth = get_ue_golomb_long(gb);
/* The depth may not exceed the SPS coding-block size difference. */
1512 if (pps->diff_cu_qp_delta_depth < 0 ||
1513 pps->diff_cu_qp_delta_depth > sps->log2_diff_max_min_coding_block_size) {
1514 av_log(avctx, AV_LOG_ERROR, "diff_cu_qp_delta_depth %d is invalid\n",
1515 pps->diff_cu_qp_delta_depth);
1516 ret = AVERROR_INVALIDDATA;
/* Chroma QP offsets are accepted only within [-12, 12]. */
1520 pps->cb_qp_offset = get_se_golomb(gb);
1521 if (pps->cb_qp_offset < -12 || pps->cb_qp_offset > 12) {
1522 av_log(avctx, AV_LOG_ERROR, "pps_cb_qp_offset out of range: %d\n",
1524 ret = AVERROR_INVALIDDATA;
1527 pps->cr_qp_offset = get_se_golomb(gb);
1528 if (pps->cr_qp_offset < -12 || pps->cr_qp_offset > 12) {
1529 av_log(avctx, AV_LOG_ERROR, "pps_cr_qp_offset out of range: %d\n",
1531 ret = AVERROR_INVALIDDATA;
1534 pps->pic_slice_level_chroma_qp_offsets_present_flag = get_bits1(gb);
1536 pps->weighted_pred_flag = get_bits1(gb);
1537 pps->weighted_bipred_flag = get_bits1(gb);
1539 pps->transquant_bypass_enable_flag = get_bits1(gb);
1540 pps->tiles_enabled_flag = get_bits1(gb);
1541 pps->entropy_coding_sync_enabled_flag = get_bits1(gb);
/* Tile layout: counts first, then either uniform spacing or explicit
 * sizes for all but the last column/row. */
1543 if (pps->tiles_enabled_flag) {
1544 pps->num_tile_columns = get_ue_golomb_long(gb) + 1;
1545 pps->num_tile_rows = get_ue_golomb_long(gb) + 1;
/* NOTE(review): the counts are bounded by the picture size in samples
 * (sps->width / sps->height), not by the size in CTBs. */
1546 if (pps->num_tile_columns <= 0 ||
1547 pps->num_tile_columns >= sps->width) {
1548 av_log(avctx, AV_LOG_ERROR, "num_tile_columns_minus1 out of range: %d\n",
1549 pps->num_tile_columns - 1);
1550 ret = AVERROR_INVALIDDATA;
1553 if (pps->num_tile_rows <= 0 ||
1554 pps->num_tile_rows >= sps->height) {
1555 av_log(avctx, AV_LOG_ERROR, "num_tile_rows_minus1 out of range: %d\n",
1556 pps->num_tile_rows - 1);
1557 ret = AVERROR_INVALIDDATA;
1561 pps->column_width = av_malloc_array(pps->num_tile_columns, sizeof(*pps->column_width));
1562 pps->row_height = av_malloc_array(pps->num_tile_rows, sizeof(*pps->row_height));
1563 if (!pps->column_width || !pps->row_height) {
1564 ret = AVERROR(ENOMEM);
1568 pps->uniform_spacing_flag = get_bits1(gb);
1569 if (!pps->uniform_spacing_flag) {
/* Explicit widths: the last column takes whatever is left of ctb_width,
 * so the sum of the coded ones must stay strictly below it. */
1571 for (i = 0; i < pps->num_tile_columns - 1; i++) {
1572 pps->column_width[i] = get_ue_golomb_long(gb) + 1;
1573 sum += pps->column_width[i];
1575 if (sum >= sps->ctb_width) {
1576 av_log(avctx, AV_LOG_ERROR, "Invalid tile widths.\n");
1577 ret = AVERROR_INVALIDDATA;
1580 pps->column_width[pps->num_tile_columns - 1] = sps->ctb_width - sum;
/* Same scheme for the row heights against ctb_height. */
1583 for (i = 0; i < pps->num_tile_rows - 1; i++) {
1584 pps->row_height[i] = get_ue_golomb_long(gb) + 1;
1585 sum += pps->row_height[i];
1587 if (sum >= sps->ctb_height) {
1588 av_log(avctx, AV_LOG_ERROR, "Invalid tile heights.\n");
1589 ret = AVERROR_INVALIDDATA;
1592 pps->row_height[pps->num_tile_rows - 1] = sps->ctb_height - sum;
1594 pps->loop_filter_across_tiles_enabled_flag = get_bits1(gb);
1597 pps->seq_loop_filter_across_slices_enabled_flag = get_bits1(gb);
/* Deblocking control: offsets are coded divided by two and stored
 * doubled; the coded value must lie in [-6, 6]. */
1599 pps->deblocking_filter_control_present_flag = get_bits1(gb);
1600 if (pps->deblocking_filter_control_present_flag) {
1601 pps->deblocking_filter_override_enabled_flag = get_bits1(gb);
1602 pps->disable_dbf = get_bits1(gb);
1603 if (!pps->disable_dbf) {
1604 pps->beta_offset = get_se_golomb(gb) * 2;
1605 pps->tc_offset = get_se_golomb(gb) * 2;
1606 if (pps->beta_offset/2 < -6 || pps->beta_offset/2 > 6) {
1607 av_log(avctx, AV_LOG_ERROR, "pps_beta_offset_div2 out of range: %d\n",
1608 pps->beta_offset/2);
1609 ret = AVERROR_INVALIDDATA;
1612 if (pps->tc_offset/2 < -6 || pps->tc_offset/2 > 6) {
1613 av_log(avctx, AV_LOG_ERROR, "pps_tc_offset_div2 out of range: %d\n",
1615 ret = AVERROR_INVALIDDATA;
/* PPS-level scaling lists start from the defaults and are then
 * overwritten by the coded data. */
1621 pps->scaling_list_data_present_flag = get_bits1(gb);
1622 if (pps->scaling_list_data_present_flag) {
1623 set_default_scaling_list_data(&pps->scaling_list);
1624 ret = scaling_list_data(gb, avctx, &pps->scaling_list, sps);
1628 pps->lists_modification_present_flag = get_bits1(gb);
/* Coded as "minus 2"; may not exceed the CTB size. */
1629 pps->log2_parallel_merge_level = get_ue_golomb_long(gb) + 2;
1630 if (pps->log2_parallel_merge_level > sps->log2_ctb_size) {
1631 av_log(avctx, AV_LOG_ERROR, "log2_parallel_merge_level_minus2 out of range: %d\n",
1632 pps->log2_parallel_merge_level - 2);
1633 ret = AVERROR_INVALIDDATA;
1637 pps->slice_header_extension_present_flag = get_bits1(gb);
/* Extensions: only the range extension is parsed, and only when the SPS
 * signals the RExt profile. */
1639 if (get_bits1(gb)) { // pps_extension_present_flag
1640 int pps_range_extensions_flag = get_bits1(gb);
1641 /* int pps_extension_7bits = */ get_bits(gb, 7);
1642 if (sps->ptl.general_ptl.profile_idc == FF_PROFILE_HEVC_REXT && pps_range_extensions_flag) {
1643 if ((ret = pps_range_extensions(gb, avctx, pps, sps)) < 0)
/* Build the derived tile and scan-order tables. */
1648 ret = setup_pps(avctx, gb, pps, sps);
/* Reading past the end of the NAL unit is reported as an error. */
1652 if (get_bits_left(gb) < 0) {
1653 av_log(avctx, AV_LOG_ERROR,
1654 "Overread PPS by %d bits\n", -get_bits_left(gb));
/* Success: replace any existing PPS stored under this id. */
1658 remove_pps(ps, pps_id);
1659 ps->pps_list[pps_id] = pps_buf;
/* Dropping the reference runs hevc_pps_free() on the partially built PPS. */
1664 av_buffer_unref(&pps_buf);
1668 int ff_hevc_compute_poc(const HEVCSPS *sps, int pocTid0, int poc_lsb, int nal_unit_type)
1670 int max_poc_lsb = 1 << sps->log2_max_poc_lsb;
1671 int prev_poc_lsb = pocTid0 % max_poc_lsb;
1672 int prev_poc_msb = pocTid0 - prev_poc_lsb;
1675 if (poc_lsb < prev_poc_lsb && prev_poc_lsb - poc_lsb >= max_poc_lsb / 2)
1676 poc_msb = prev_poc_msb + max_poc_lsb;
1677 else if (poc_lsb > prev_poc_lsb && poc_lsb - prev_poc_lsb > max_poc_lsb / 2)
1678 poc_msb = prev_poc_msb - max_poc_lsb;
1680 poc_msb = prev_poc_msb;
1682 // For BLA picture types, POCmsb is set to 0.
1683 if (nal_unit_type == HEVC_NAL_BLA_W_LP ||
1684 nal_unit_type == HEVC_NAL_BLA_W_RADL ||
1685 nal_unit_type == HEVC_NAL_BLA_N_LP)
1688 return poc_msb + poc_lsb;