git.sesse.net Git - ffmpeg/blob - libavcodec/h264_parse.c

   1 /*
   2  * This file is part of FFmpeg.
   3  *
   4  * FFmpeg is free software; you can redistribute it and/or
   5  * modify it under the terms of the GNU Lesser General Public
   6  * License as published by the Free Software Foundation; either
   7  * version 2.1 of the License, or (at your option) any later version.
   8  *
   9  * FFmpeg is distributed in the hope that it will be useful,
  10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  12  * Lesser General Public License for more details.
  13  *
  14  * You should have received a copy of the GNU Lesser General Public
  15  * License along with FFmpeg; if not, write to the Free Software
  16  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  17  */
  18
  19 #include "bytestream.h"
  20 #include "get_bits.h"
  21 #include "golomb.h"
  22 #include "h264.h"
  23 #include "h264dec.h"
  24 #include "h264_parse.h"
  25 #include "h264_ps.h"
  26
  27 int ff_h264_pred_weight_table(GetBitContext *gb, const SPS *sps,
  28                               const int *ref_count, int slice_type_nos,
  29                               H264PredWeightTable *pwt,
  30                               int picture_structure, void *logctx)
  31 {
  32     int list, i, j;
  33     int luma_def, chroma_def;
  34
  35     pwt->use_weight             = 0;
  36     pwt->use_weight_chroma      = 0;
  37
  38     pwt->luma_log2_weight_denom = get_ue_golomb(gb);
  39     if (pwt->luma_log2_weight_denom > 7U) {
  40         av_log(logctx, AV_LOG_ERROR, "luma_log2_weight_denom %d is out of range\n", pwt->luma_log2_weight_denom);
  41         pwt->luma_log2_weight_denom = 0;
  42     }
  43     luma_def = 1 << pwt->luma_log2_weight_denom;
  44
  45     if (sps->chroma_format_idc) {
  46         pwt->chroma_log2_weight_denom = get_ue_golomb(gb);
  47         if (pwt->chroma_log2_weight_denom > 7U) {
  48             av_log(logctx, AV_LOG_ERROR, "chroma_log2_weight_denom %d is out of range\n", pwt->chroma_log2_weight_denom);
  49             pwt->chroma_log2_weight_denom = 0;
  50         }
  51         chroma_def = 1 << pwt->chroma_log2_weight_denom;
  52     }
  53
  54     for (list = 0; list < 2; list++) {
  55         pwt->luma_weight_flag[list]   = 0;
  56         pwt->chroma_weight_flag[list] = 0;
  57         for (i = 0; i < ref_count[list]; i++) {
  58             int luma_weight_flag, chroma_weight_flag;
  59
  60             luma_weight_flag = get_bits1(gb);
  61             if (luma_weight_flag) {
  62                 pwt->luma_weight[i][list][0] = get_se_golomb(gb);
  63                 pwt->luma_weight[i][list][1] = get_se_golomb(gb);
  64                 if ((int8_t)pwt->luma_weight[i][list][0] != pwt->luma_weight[i][list][0] ||
  65                     (int8_t)pwt->luma_weight[i][list][1] != pwt->luma_weight[i][list][1])
  66                     goto out_range_weight;
  67                 if (pwt->luma_weight[i][list][0] != luma_def ||
  68                     pwt->luma_weight[i][list][1] != 0) {
  69                     pwt->use_weight             = 1;
  70                     pwt->luma_weight_flag[list] = 1;
  71                 }
  72             } else {
  73                 pwt->luma_weight[i][list][0] = luma_def;
  74                 pwt->luma_weight[i][list][1] = 0;
  75             }
  76
  77             if (sps->chroma_format_idc) {
  78                 chroma_weight_flag = get_bits1(gb);
  79                 if (chroma_weight_flag) {
  80                     int j;
  81                     for (j = 0; j < 2; j++) {
  82                         pwt->chroma_weight[i][list][j][0] = get_se_golomb(gb);
  83                         pwt->chroma_weight[i][list][j][1] = get_se_golomb(gb);
  84                         if ((int8_t)pwt->chroma_weight[i][list][j][0] != pwt->chroma_weight[i][list][j][0] ||
  85                             (int8_t)pwt->chroma_weight[i][list][j][1] != pwt->chroma_weight[i][list][j][1])
  86                             goto out_range_weight;
  87                         if (pwt->chroma_weight[i][list][j][0] != chroma_def ||
  88                             pwt->chroma_weight[i][list][j][1] != 0) {
  89                             pwt->use_weight_chroma        = 1;
  90                             pwt->chroma_weight_flag[list] = 1;
  91                         }
  92                     }
  93                 } else {
  94                     int j;
  95                     for (j = 0; j < 2; j++) {
  96                         pwt->chroma_weight[i][list][j][0] = chroma_def;
  97                         pwt->chroma_weight[i][list][j][1] = 0;
  98                     }
  99                 }
 100             }
 101
 102             // for MBAFF
 103             if (picture_structure == PICT_FRAME) {
 104                 pwt->luma_weight[16 + 2 * i][list][0] = pwt->luma_weight[16 + 2 * i + 1][list][0] = pwt->luma_weight[i][list][0];
 105                 pwt->luma_weight[16 + 2 * i][list][1] = pwt->luma_weight[16 + 2 * i + 1][list][1] = pwt->luma_weight[i][list][1];
 106                 if (sps->chroma_format_idc) {
 107                     for (j = 0; j < 2; j++) {
 108                         pwt->chroma_weight[16 + 2 * i][list][j][0] = pwt->chroma_weight[16 + 2 * i + 1][list][j][0] = pwt->chroma_weight[i][list][j][0];
 109                         pwt->chroma_weight[16 + 2 * i][list][j][1] = pwt->chroma_weight[16 + 2 * i + 1][list][j][1] = pwt->chroma_weight[i][list][j][1];
 110                     }
 111                 }
 112             }
 113         }
 114         if (slice_type_nos != AV_PICTURE_TYPE_B)
 115             break;
 116     }
 117     pwt->use_weight = pwt->use_weight || pwt->use_weight_chroma;
 118     return 0;
 119 out_range_weight:
 120     avpriv_request_sample(logctx, "Out of range weight\n");
 121     return AVERROR_INVALIDDATA;
 122 }
 123
 124 /**
 125  * Check if the top & left blocks are available if needed and
 126  * change the dc mode so it only uses the available blocks.
 127  */
 128 int ff_h264_check_intra4x4_pred_mode(int8_t *pred_mode_cache, void *logctx,
 129                                      int top_samples_available, int left_samples_available)
 130 {
 131     static const int8_t top[12] = {
 132         -1, 0, LEFT_DC_PRED, -1, -1, -1, -1, -1, 0
 133     };
 134     static const int8_t left[12] = {
 135         0, -1, TOP_DC_PRED, 0, -1, -1, -1, 0, -1, DC_128_PRED
 136     };
 137     int i;
 138
 139     if (!(top_samples_available & 0x8000)) {
 140         for (i = 0; i < 4; i++) {
 141             int status = top[pred_mode_cache[scan8[0] + i]];
 142             if (status < 0) {
 143                 av_log(logctx, AV_LOG_ERROR,
 144                        "top block unavailable for requested intra mode %d\n",
 145                        status);
 146                 return AVERROR_INVALIDDATA;
 147             } else if (status) {
 148                 pred_mode_cache[scan8[0] + i] = status;
 149             }
 150         }
 151     }
 152
 153     if ((left_samples_available & 0x8888) != 0x8888) {
 154         static const int mask[4] = { 0x8000, 0x2000, 0x80, 0x20 };
 155         for (i = 0; i < 4; i++)
 156             if (!(left_samples_available & mask[i])) {
 157                 int status = left[pred_mode_cache[scan8[0] + 8 * i]];
 158                 if (status < 0) {
 159                     av_log(logctx, AV_LOG_ERROR,
 160                            "left block unavailable for requested intra4x4 mode %d\n",
 161                            status);
 162                     return AVERROR_INVALIDDATA;
 163                 } else if (status) {
 164                     pred_mode_cache[scan8[0] + 8 * i] = status;
 165                 }
 166             }
 167     }
 168
 169     return 0;
 170 }
 171
 172 /**
 173  * Check if the top & left blocks are available if needed and
 174  * change the dc mode so it only uses the available blocks.
 175  */
 176 int ff_h264_check_intra_pred_mode(void *logctx, int top_samples_available,
 177                                   int left_samples_available,
 178                                   int mode, int is_chroma)
 179 {
 180     static const int8_t top[4]  = { LEFT_DC_PRED8x8, 1, -1, -1 };
 181     static const int8_t left[5] = { TOP_DC_PRED8x8, -1,  2, -1, DC_128_PRED8x8 };
 182
 183     if (mode > 3U) {
 184         av_log(logctx, AV_LOG_ERROR,
 185                "out of range intra chroma pred mode\n");
 186         return AVERROR_INVALIDDATA;
 187     }
 188
 189     if (!(top_samples_available & 0x8000)) {
 190         mode = top[mode];
 191         if (mode < 0) {
 192             av_log(logctx, AV_LOG_ERROR,
 193                    "top block unavailable for requested intra mode\n");
 194             return AVERROR_INVALIDDATA;
 195         }
 196     }
 197
 198     if ((left_samples_available & 0x8080) != 0x8080) {
 199         mode = left[mode];
 200         if (mode < 0) {
 201             av_log(logctx, AV_LOG_ERROR,
 202                    "left block unavailable for requested intra mode\n");
 203             return AVERROR_INVALIDDATA;
 204         }
 205         if (is_chroma && (left_samples_available & 0x8080)) {
 206             // mad cow disease mode, aka MBAFF + constrained_intra_pred
 207             mode = ALZHEIMER_DC_L0T_PRED8x8 +
 208                    (!(left_samples_available & 0x8000)) +
 209                    2 * (mode == DC_128_PRED8x8);
 210         }
 211     }
 212
 213     return mode;
 214 }
 215
 216 int ff_h264_parse_ref_count(int *plist_count, int ref_count[2],
 217                             GetBitContext *gb, const PPS *pps,
 218                             int slice_type_nos, int picture_structure, void *logctx)
 219 {
 220     int list_count;
 221     int num_ref_idx_active_override_flag;
 222
 223     // set defaults, might be overridden a few lines later
 224     ref_count[0] = pps->ref_count[0];
 225     ref_count[1] = pps->ref_count[1];
 226
 227     if (slice_type_nos != AV_PICTURE_TYPE_I) {
 228         unsigned max[2];
 229         max[0] = max[1] = picture_structure == PICT_FRAME ? 15 : 31;
 230
 231         num_ref_idx_active_override_flag = get_bits1(gb);
 232
 233         if (num_ref_idx_active_override_flag) {
 234             ref_count[0] = get_ue_golomb(gb) + 1;
 235             if (slice_type_nos == AV_PICTURE_TYPE_B) {
 236                 ref_count[1] = get_ue_golomb(gb) + 1;
 237             } else
 238                 // full range is spec-ok in this case, even for frames
 239                 ref_count[1] = 1;
 240         }
 241
 242         if (ref_count[0] - 1 > max[0] || ref_count[1] - 1 > max[1]) {
 243             av_log(logctx, AV_LOG_ERROR, "reference overflow %u > %u or %u > %u\n",
 244                    ref_count[0] - 1, max[0], ref_count[1] - 1, max[1]);
 245             ref_count[0] = ref_count[1] = 0;
 246             *plist_count = 0;
 247             goto fail;
 248         }
 249
 250         if (slice_type_nos == AV_PICTURE_TYPE_B)
 251             list_count = 2;
 252         else
 253             list_count = 1;
 254     } else {
 255         list_count   = 0;
 256         ref_count[0] = ref_count[1] = 0;
 257     }
 258
 259     *plist_count = list_count;
 260
 261     return 0;
 262 fail:
 263     *plist_count = 0;
 264     ref_count[0] = 0;
 265     ref_count[1] = 0;
 266     return AVERROR_INVALIDDATA;
 267 }
 268
 269 int ff_h264_init_poc(int pic_field_poc[2], int *pic_poc,
 270                      const SPS *sps, H264POCContext *pc,
 271                      int picture_structure, int nal_ref_idc)
 272 {
 273     const int max_frame_num = 1 << sps->log2_max_frame_num;
 274     int field_poc[2];
 275
 276     pc->frame_num_offset = pc->prev_frame_num_offset;
 277     if (pc->frame_num < pc->prev_frame_num)
 278         pc->frame_num_offset += max_frame_num;
 279
 280     if (sps->poc_type == 0) {
 281         const int max_poc_lsb = 1 << sps->log2_max_poc_lsb;
 282
 283         if (pc->poc_lsb < pc->prev_poc_lsb &&
 284             pc->prev_poc_lsb - pc->poc_lsb >= max_poc_lsb / 2)
 285             pc->poc_msb = pc->prev_poc_msb + max_poc_lsb;
 286         else if (pc->poc_lsb > pc->prev_poc_lsb &&
 287                  pc->prev_poc_lsb - pc->poc_lsb < -max_poc_lsb / 2)
 288             pc->poc_msb = pc->prev_poc_msb - max_poc_lsb;
 289         else
 290             pc->poc_msb = pc->prev_poc_msb;
 291         field_poc[0] =
 292         field_poc[1] = pc->poc_msb + pc->poc_lsb;
 293         if (picture_structure == PICT_FRAME)
 294             field_poc[1] += pc->delta_poc_bottom;
 295     } else if (sps->poc_type == 1) {
 296         int abs_frame_num, expected_delta_per_poc_cycle, expectedpoc;
 297         int i;
 298
 299         if (sps->poc_cycle_length != 0)
 300             abs_frame_num = pc->frame_num_offset + pc->frame_num;
 301         else
 302             abs_frame_num = 0;
 303
 304         if (nal_ref_idc == 0 && abs_frame_num > 0)
 305             abs_frame_num--;
 306
 307         expected_delta_per_poc_cycle = 0;
 308         for (i = 0; i < sps->poc_cycle_length; i++)
 309             // FIXME integrate during sps parse
 310             expected_delta_per_poc_cycle += sps->offset_for_ref_frame[i];
 311
 312         if (abs_frame_num > 0) {
 313             int poc_cycle_cnt          = (abs_frame_num - 1) / sps->poc_cycle_length;
 314             int frame_num_in_poc_cycle = (abs_frame_num - 1) % sps->poc_cycle_length;
 315
 316             expectedpoc = poc_cycle_cnt * expected_delta_per_poc_cycle;
 317             for (i = 0; i <= frame_num_in_poc_cycle; i++)
 318                 expectedpoc = expectedpoc + sps->offset_for_ref_frame[i];
 319         } else
 320             expectedpoc = 0;
 321
 322         if (nal_ref_idc == 0)
 323             expectedpoc = expectedpoc + sps->offset_for_non_ref_pic;
 324
 325         field_poc[0] = expectedpoc + pc->delta_poc[0];
 326         field_poc[1] = field_poc[0] + sps->offset_for_top_to_bottom_field;
 327
 328         if (picture_structure == PICT_FRAME)
 329             field_poc[1] += pc->delta_poc[1];
 330     } else {
 331         int poc = 2 * (pc->frame_num_offset + pc->frame_num);
 332
 333         if (!nal_ref_idc)
 334             poc--;
 335
 336         field_poc[0] = poc;
 337         field_poc[1] = poc;
 338     }
 339
 340     if (picture_structure != PICT_BOTTOM_FIELD)
 341         pic_field_poc[0] = field_poc[0];
 342     if (picture_structure != PICT_TOP_FIELD)
 343         pic_field_poc[1] = field_poc[1];
 344     *pic_poc = FFMIN(pic_field_poc[0], pic_field_poc[1]);
 345
 346     return 0;
 347 }
 348
 349 static int decode_extradata_ps(const uint8_t *data, int size, H264ParamSets *ps,
 350                                int is_avc, void *logctx)
 351 {
 352     H2645Packet pkt = { 0 };
 353     int i, ret = 0;
 354
 355     ret = ff_h2645_packet_split(&pkt, data, size, logctx, is_avc, 2, AV_CODEC_ID_H264, 1);
 356     if (ret < 0) {
 357         ret = 0;
 358         goto fail;
 359     }
 360
 361     for (i = 0; i < pkt.nb_nals; i++) {
 362         H2645NAL *nal = &pkt.nals[i];
 363         switch (nal->type) {
 364         case H264_NAL_SPS:
 365             ret = ff_h264_decode_seq_parameter_set(&nal->gb, logctx, ps, 0);
 366             if (ret < 0)
 367                 goto fail;
 368             break;
 369         case H264_NAL_PPS:
 370             ret = ff_h264_decode_picture_parameter_set(&nal->gb, logctx, ps,
 371                                                        nal->size_bits);
 372             if (ret < 0)
 373                 goto fail;
 374             break;
 375         default:
 376             av_log(logctx, AV_LOG_VERBOSE, "Ignoring NAL type %d in extradata\n",
 377                    nal->type);
 378             break;
 379         }
 380     }
 381
 382 fail:
 383     ff_h2645_packet_uninit(&pkt);
 384     return ret;
 385 }
 386
 387 /* There are (invalid) samples in the wild with mp4-style extradata, where the
 388  * parameter sets are stored unescaped (i.e. as RBSP).
 389  * This function catches the parameter set decoding failure and tries again
 390  * after escaping it */
 391 static int decode_extradata_ps_mp4(const uint8_t *buf, int buf_size, H264ParamSets *ps,
 392                                    int err_recognition, void *logctx)
 393 {
 394     int ret;
 395
 396     ret = decode_extradata_ps(buf, buf_size, ps, 1, logctx);
 397     if (ret < 0 && !(err_recognition & AV_EF_EXPLODE)) {
 398         GetByteContext gbc;
 399         PutByteContext pbc;
 400         uint8_t *escaped_buf;
 401         int escaped_buf_size;
 402
 403         av_log(logctx, AV_LOG_WARNING,
 404                "SPS decoding failure, trying again after escaping the NAL\n");
 405
 406         if (buf_size / 2 >= (INT16_MAX - AV_INPUT_BUFFER_PADDING_SIZE) / 3)
 407             return AVERROR(ERANGE);
 408         escaped_buf_size = buf_size * 3 / 2 + AV_INPUT_BUFFER_PADDING_SIZE;
 409         escaped_buf = av_mallocz(escaped_buf_size);
 410         if (!escaped_buf)
 411             return AVERROR(ENOMEM);
 412
 413         bytestream2_init(&gbc, buf, buf_size);
 414         bytestream2_init_writer(&pbc, escaped_buf, escaped_buf_size);
 415
 416         while (bytestream2_get_bytes_left(&gbc)) {
 417             if (bytestream2_get_bytes_left(&gbc) >= 3 &&
 418                 bytestream2_peek_be24(&gbc) <= 3) {
 419                 bytestream2_put_be24(&pbc, 3);
 420                 bytestream2_skip(&gbc, 2);
 421             } else
 422                 bytestream2_put_byte(&pbc, bytestream2_get_byte(&gbc));
 423         }
 424
 425         escaped_buf_size = bytestream2_tell_p(&pbc);
 426         AV_WB16(escaped_buf, escaped_buf_size - 2);
 427
 428         ret = decode_extradata_ps(escaped_buf, escaped_buf_size, ps, 1, logctx);
 429         av_freep(&escaped_buf);
 430         if (ret < 0)
 431             return ret;
 432     }
 433
 434     return 0;
 435 }
 436
 437 int ff_h264_decode_extradata(const uint8_t *data, int size, H264ParamSets *ps,
 438                              int *is_avc, int *nal_length_size,
 439                              int err_recognition, void *logctx)
 440 {
 441     int ret;
 442
 443     if (!data || size <= 0)
 444         return -1;
 445
 446     if (data[0] == 1) {
 447         int i, cnt, nalsize;
 448         const uint8_t *p = data;
 449
 450         *is_avc = 1;
 451
 452         if (size < 7) {
 453             av_log(logctx, AV_LOG_ERROR, "avcC %d too short\n", size);
 454             return AVERROR_INVALIDDATA;
 455         }
 456
 457         // Decode sps from avcC
 458         cnt = *(p + 5) & 0x1f; // Number of sps
 459         p  += 6;
 460         for (i = 0; i < cnt; i++) {
 461             nalsize = AV_RB16(p) + 2;
 462             if (nalsize > size - (p - data))
 463                 return AVERROR_INVALIDDATA;
 464             ret = decode_extradata_ps_mp4(p, nalsize, ps, err_recognition, logctx);
 465             if (ret < 0) {
 466                 av_log(logctx, AV_LOG_ERROR,
 467                        "Decoding sps %d from avcC failed\n", i);
 468                 return ret;
 469             }
 470             p += nalsize;
 471         }
 472         // Decode pps from avcC
 473         cnt = *(p++); // Number of pps
 474         for (i = 0; i < cnt; i++) {
 475             nalsize = AV_RB16(p) + 2;
 476             if (nalsize > size - (p - data))
 477                 return AVERROR_INVALIDDATA;
 478             ret = decode_extradata_ps_mp4(p, nalsize, ps, err_recognition, logctx);
 479             if (ret < 0) {
 480                 av_log(logctx, AV_LOG_ERROR,
 481                        "Decoding pps %d from avcC failed\n", i);
 482                 return ret;
 483             }
 484             p += nalsize;
 485         }
 486         // Store right nal length size that will be used to parse all other nals
 487         *nal_length_size = (data[4] & 0x03) + 1;
 488     } else {
 489         *is_avc = 0;
 490         ret = decode_extradata_ps(data, size, ps, 0, logctx);
 491         if (ret < 0)
 492             return ret;
 493     }
 494     return size;
 495 }
 496
 497 /**
 498  * Compute profile from profile_idc and constraint_set?_flags.
 499  *
 500  * @param sps SPS
 501  *
 502  * @return profile as defined by FF_PROFILE_H264_*
 503  */
 504 int ff_h264_get_profile(const SPS *sps)
 505 {
 506     int profile = sps->profile_idc;
 507
 508     switch (sps->profile_idc) {
 509     case FF_PROFILE_H264_BASELINE:
 510         // constraint_set1_flag set to 1
 511         profile |= (sps->constraint_set_flags & 1 << 1) ? FF_PROFILE_H264_CONSTRAINED : 0;
 512         break;
 513     case FF_PROFILE_H264_HIGH_10:
 514     case FF_PROFILE_H264_HIGH_422:
 515     case FF_PROFILE_H264_HIGH_444_PREDICTIVE:
 516         // constraint_set3_flag set to 1
 517         profile |= (sps->constraint_set_flags & 1 << 3) ? FF_PROFILE_H264_INTRA : 0;
 518         break;
 519     }
 520
 521     return profile;
 522 }