/*
 * This file is part of Libav.
 *
 * Libav is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * Libav is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with Libav; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
19 #include "bytestream.h"
23 #include "h264_parse.h"
25 int ff_h264_pred_weight_table(GetBitContext *gb, const SPS *sps,
26 const int *ref_count, int slice_type_nos,
27 H264PredWeightTable *pwt)
30 int luma_def, chroma_def;
33 pwt->use_weight_chroma = 0;
34 pwt->luma_log2_weight_denom = get_ue_golomb(gb);
35 if (sps->chroma_format_idc)
36 pwt->chroma_log2_weight_denom = get_ue_golomb(gb);
37 luma_def = 1 << pwt->luma_log2_weight_denom;
38 chroma_def = 1 << pwt->chroma_log2_weight_denom;
40 for (list = 0; list < 2; list++) {
41 pwt->luma_weight_flag[list] = 0;
42 pwt->chroma_weight_flag[list] = 0;
43 for (i = 0; i < ref_count[list]; i++) {
44 int luma_weight_flag, chroma_weight_flag;
46 luma_weight_flag = get_bits1(gb);
47 if (luma_weight_flag) {
48 pwt->luma_weight[i][list][0] = get_se_golomb(gb);
49 pwt->luma_weight[i][list][1] = get_se_golomb(gb);
50 if (pwt->luma_weight[i][list][0] != luma_def ||
51 pwt->luma_weight[i][list][1] != 0) {
53 pwt->luma_weight_flag[list] = 1;
56 pwt->luma_weight[i][list][0] = luma_def;
57 pwt->luma_weight[i][list][1] = 0;
60 if (sps->chroma_format_idc) {
61 chroma_weight_flag = get_bits1(gb);
62 if (chroma_weight_flag) {
64 for (j = 0; j < 2; j++) {
65 pwt->chroma_weight[i][list][j][0] = get_se_golomb(gb);
66 pwt->chroma_weight[i][list][j][1] = get_se_golomb(gb);
67 if (pwt->chroma_weight[i][list][j][0] != chroma_def ||
68 pwt->chroma_weight[i][list][j][1] != 0) {
69 pwt->use_weight_chroma = 1;
70 pwt->chroma_weight_flag[list] = 1;
75 for (j = 0; j < 2; j++) {
76 pwt->chroma_weight[i][list][j][0] = chroma_def;
77 pwt->chroma_weight[i][list][j][1] = 0;
83 pwt->luma_weight[16 + 2 * i][list][0] = pwt->luma_weight[16 + 2 * i + 1][list][0] = pwt->luma_weight[i][list][0];
84 pwt->luma_weight[16 + 2 * i][list][1] = pwt->luma_weight[16 + 2 * i + 1][list][1] = pwt->luma_weight[i][list][1];
85 for (j = 0; j < 2; j++) {
86 pwt->chroma_weight[16 + 2 * i][list][j][0] = pwt->chroma_weight[16 + 2 * i + 1][list][j][0] = pwt->chroma_weight[i][list][j][0];
87 pwt->chroma_weight[16 + 2 * i][list][j][1] = pwt->chroma_weight[16 + 2 * i + 1][list][j][1] = pwt->chroma_weight[i][list][j][1];
90 if (slice_type_nos != AV_PICTURE_TYPE_B)
93 pwt->use_weight = pwt->use_weight || pwt->use_weight_chroma;
98 * Check if the top & left blocks are available if needed and
99 * change the dc mode so it only uses the available blocks.
101 int ff_h264_check_intra4x4_pred_mode(int8_t *pred_mode_cache, void *logctx,
102 int top_samples_available, int left_samples_available)
104 static const int8_t top[12] = {
105 -1, 0, LEFT_DC_PRED, -1, -1, -1, -1, -1, 0
107 static const int8_t left[12] = {
108 0, -1, TOP_DC_PRED, 0, -1, -1, -1, 0, -1, DC_128_PRED
112 if (!(top_samples_available & 0x8000)) {
113 for (i = 0; i < 4; i++) {
114 int status = top[pred_mode_cache[scan8[0] + i]];
116 av_log(logctx, AV_LOG_ERROR,
117 "top block unavailable for requested intra4x4 mode %d\n",
119 return AVERROR_INVALIDDATA;
121 pred_mode_cache[scan8[0] + i] = status;
126 if ((left_samples_available & 0x8888) != 0x8888) {
127 static const int mask[4] = { 0x8000, 0x2000, 0x80, 0x20 };
128 for (i = 0; i < 4; i++)
129 if (!(left_samples_available & mask[i])) {
130 int status = left[pred_mode_cache[scan8[0] + 8 * i]];
132 av_log(logctx, AV_LOG_ERROR,
133 "left block unavailable for requested intra4x4 mode %d\n",
135 return AVERROR_INVALIDDATA;
137 pred_mode_cache[scan8[0] + 8 * i] = status;
146 * Check if the top & left blocks are available if needed and
147 * change the dc mode so it only uses the available blocks.
149 int ff_h264_check_intra_pred_mode(void *logctx, int top_samples_available,
150 int left_samples_available,
151 int mode, int is_chroma)
153 static const int8_t top[4] = { LEFT_DC_PRED8x8, 1, -1, -1 };
154 static const int8_t left[5] = { TOP_DC_PRED8x8, -1, 2, -1, DC_128_PRED8x8 };
157 av_log(logctx, AV_LOG_ERROR,
158 "out of range intra chroma pred mode\n");
159 return AVERROR_INVALIDDATA;
162 if (!(top_samples_available & 0x8000)) {
165 av_log(logctx, AV_LOG_ERROR,
166 "top block unavailable for requested intra mode\n");
167 return AVERROR_INVALIDDATA;
171 if ((left_samples_available & 0x8080) != 0x8080) {
173 if (is_chroma && (left_samples_available & 0x8080)) {
174 // mad cow disease mode, aka MBAFF + constrained_intra_pred
175 mode = ALZHEIMER_DC_L0T_PRED8x8 +
176 (!(left_samples_available & 0x8000)) +
177 2 * (mode == DC_128_PRED8x8);
180 av_log(logctx, AV_LOG_ERROR,
181 "left block unavailable for requested intra mode\n");
182 return AVERROR_INVALIDDATA;
189 int ff_h264_parse_ref_count(int *plist_count, int ref_count[2],
190 GetBitContext *gb, const PPS *pps,
191 int slice_type_nos, int picture_structure)
194 int num_ref_idx_active_override_flag, max_refs;
196 // set defaults, might be overridden a few lines later
197 ref_count[0] = pps->ref_count[0];
198 ref_count[1] = pps->ref_count[1];
200 if (slice_type_nos != AV_PICTURE_TYPE_I) {
201 num_ref_idx_active_override_flag = get_bits1(gb);
203 if (num_ref_idx_active_override_flag) {
204 ref_count[0] = get_ue_golomb(gb) + 1;
205 if (ref_count[0] < 1)
207 if (slice_type_nos == AV_PICTURE_TYPE_B) {
208 ref_count[1] = get_ue_golomb(gb) + 1;
209 if (ref_count[1] < 1)
214 if (slice_type_nos == AV_PICTURE_TYPE_B)
220 ref_count[0] = ref_count[1] = 0;
223 max_refs = picture_structure == PICT_FRAME ? 16 : 32;
225 if (ref_count[0] > max_refs || ref_count[1] > max_refs)
228 *plist_count = list_count;
235 return AVERROR_INVALIDDATA;
238 int ff_h264_init_poc(int pic_field_poc[2], int *pic_poc,
239 const SPS *sps, H264POCContext *pc,
240 int picture_structure, int nal_ref_idc)
242 const int max_frame_num = 1 << sps->log2_max_frame_num;
245 pc->frame_num_offset = pc->prev_frame_num_offset;
246 if (pc->frame_num < pc->prev_frame_num)
247 pc->frame_num_offset += max_frame_num;
249 if (sps->poc_type == 0) {
250 const int max_poc_lsb = 1 << sps->log2_max_poc_lsb;
252 if (pc->poc_lsb < pc->prev_poc_lsb &&
253 pc->prev_poc_lsb - pc->poc_lsb >= max_poc_lsb / 2)
254 pc->poc_msb = pc->prev_poc_msb + max_poc_lsb;
255 else if (pc->poc_lsb > pc->prev_poc_lsb &&
256 pc->prev_poc_lsb - pc->poc_lsb < -max_poc_lsb / 2)
257 pc->poc_msb = pc->prev_poc_msb - max_poc_lsb;
259 pc->poc_msb = pc->prev_poc_msb;
261 field_poc[1] = pc->poc_msb + pc->poc_lsb;
262 if (picture_structure == PICT_FRAME)
263 field_poc[1] += pc->delta_poc_bottom;
264 } else if (sps->poc_type == 1) {
265 int abs_frame_num, expected_delta_per_poc_cycle, expectedpoc;
268 if (sps->poc_cycle_length != 0)
269 abs_frame_num = pc->frame_num_offset + pc->frame_num;
273 if (nal_ref_idc == 0 && abs_frame_num > 0)
276 expected_delta_per_poc_cycle = 0;
277 for (i = 0; i < sps->poc_cycle_length; i++)
278 // FIXME integrate during sps parse
279 expected_delta_per_poc_cycle += sps->offset_for_ref_frame[i];
281 if (abs_frame_num > 0) {
282 int poc_cycle_cnt = (abs_frame_num - 1) / sps->poc_cycle_length;
283 int frame_num_in_poc_cycle = (abs_frame_num - 1) % sps->poc_cycle_length;
285 expectedpoc = poc_cycle_cnt * expected_delta_per_poc_cycle;
286 for (i = 0; i <= frame_num_in_poc_cycle; i++)
287 expectedpoc = expectedpoc + sps->offset_for_ref_frame[i];
291 if (nal_ref_idc == 0)
292 expectedpoc = expectedpoc + sps->offset_for_non_ref_pic;
294 field_poc[0] = expectedpoc + pc->delta_poc[0];
295 field_poc[1] = field_poc[0] + sps->offset_for_top_to_bottom_field;
297 if (picture_structure == PICT_FRAME)
298 field_poc[1] += pc->delta_poc[1];
300 int poc = 2 * (pc->frame_num_offset + pc->frame_num);
309 if (picture_structure != PICT_BOTTOM_FIELD)
310 pic_field_poc[0] = field_poc[0];
311 if (picture_structure != PICT_TOP_FIELD)
312 pic_field_poc[1] = field_poc[1];
313 *pic_poc = FFMIN(pic_field_poc[0], pic_field_poc[1]);
318 static int decode_extradata_ps(const uint8_t *data, int size, H264ParamSets *ps,
319 int is_avc, void *logctx)
321 H2645Packet pkt = { 0 };
324 ret = ff_h2645_packet_split(&pkt, data, size, logctx, is_avc, 2, AV_CODEC_ID_H264);
328 for (i = 0; i < pkt.nb_nals; i++) {
329 H2645NAL *nal = &pkt.nals[i];
332 ret = ff_h264_decode_seq_parameter_set(&nal->gb, logctx, ps);
337 ret = ff_h264_decode_picture_parameter_set(&nal->gb, logctx, ps,
343 av_log(logctx, AV_LOG_VERBOSE, "Ignoring NAL type %d in extradata\n",
350 ff_h2645_packet_uninit(&pkt);
354 /* There are (invalid) samples in the wild with mp4-style extradata, where the
355 * parameter sets are stored unescaped (i.e. as RBSP).
356 * This function catches the parameter set decoding failure and tries again
357 * after escaping it */
358 static int decode_extradata_ps_mp4(const uint8_t *buf, int buf_size, H264ParamSets *ps,
359 int err_recognition, void *logctx)
363 ret = decode_extradata_ps(buf, buf_size, ps, 1, logctx);
364 if (ret < 0 && !(err_recognition & AV_EF_EXPLODE)) {
367 uint8_t *escaped_buf;
368 int escaped_buf_size;
370 av_log(logctx, AV_LOG_WARNING,
371 "SPS decoding failure, trying again after escaping the NAL\n");
373 if (buf_size / 2 >= (INT16_MAX - AV_INPUT_BUFFER_PADDING_SIZE) / 3)
374 return AVERROR(ERANGE);
375 escaped_buf_size = buf_size * 3 / 2 + AV_INPUT_BUFFER_PADDING_SIZE;
376 escaped_buf = av_mallocz(escaped_buf_size);
378 return AVERROR(ENOMEM);
380 bytestream2_init(&gbc, buf, buf_size);
381 bytestream2_init_writer(&pbc, escaped_buf, escaped_buf_size);
383 while (bytestream2_get_bytes_left(&gbc)) {
384 if (bytestream2_get_bytes_left(&gbc) >= 3 &&
385 bytestream2_peek_be24(&gbc) <= 3) {
386 bytestream2_put_be24(&pbc, 3);
387 bytestream2_skip(&gbc, 2);
389 bytestream2_put_byte(&pbc, bytestream2_get_byte(&gbc));
392 escaped_buf_size = bytestream2_tell_p(&pbc);
393 AV_WB16(escaped_buf, escaped_buf_size - 2);
395 ret = decode_extradata_ps(escaped_buf, escaped_buf_size, ps, 1, logctx);
396 av_freep(&escaped_buf);
404 int ff_h264_decode_extradata(const uint8_t *data, int size, H264ParamSets *ps,
405 int *is_avc, int *nal_length_size,
406 int err_recognition, void *logctx)
412 const uint8_t *p = data;
417 av_log(logctx, AV_LOG_ERROR, "avcC %d too short\n", size);
418 return AVERROR_INVALIDDATA;
421 // Decode sps from avcC
422 cnt = *(p + 5) & 0x1f; // Number of sps
424 for (i = 0; i < cnt; i++) {
425 nalsize = AV_RB16(p) + 2;
426 if (p - data + nalsize > size)
427 return AVERROR_INVALIDDATA;
428 ret = decode_extradata_ps_mp4(p, nalsize, ps, err_recognition, logctx);
430 av_log(logctx, AV_LOG_ERROR,
431 "Decoding sps %d from avcC failed\n", i);
436 // Decode pps from avcC
437 cnt = *(p++); // Number of pps
438 for (i = 0; i < cnt; i++) {
439 nalsize = AV_RB16(p) + 2;
440 if (p - data + nalsize > size)
441 return AVERROR_INVALIDDATA;
442 ret = decode_extradata_ps_mp4(p, nalsize, ps, err_recognition, logctx);
444 av_log(logctx, AV_LOG_ERROR,
445 "Decoding pps %d from avcC failed\n", i);
450 // Store right nal length size that will be used to parse all other nals
451 *nal_length_size = (data[4] & 0x03) + 1;
454 ret = decode_extradata_ps(data, size, ps, 0, logctx);
462 * Compute profile from profile_idc and constraint_set?_flags.
466 * @return profile as defined by FF_PROFILE_H264_*
468 int ff_h264_get_profile(const SPS *sps)
470 int profile = sps->profile_idc;
472 switch (sps->profile_idc) {
473 case FF_PROFILE_H264_BASELINE:
474 // constraint_set1_flag set to 1
475 profile |= (sps->constraint_set_flags & 1 << 1) ? FF_PROFILE_H264_CONSTRAINED : 0;
477 case FF_PROFILE_H264_HIGH_10:
478 case FF_PROFILE_H264_HIGH_422:
479 case FF_PROFILE_H264_HIGH_444_PREDICTIVE:
480 // constraint_set3_flag set to 1
481 profile |= (sps->constraint_set_flags & 1 << 3) ? FF_PROFILE_H264_INTRA : 0;