git.sesse.net Git - ffmpeg/blob - libavcodec/proresdec2.c

   1 /*
   2  * Copyright (c) 2010-2011 Maxim Poliakovski
   3  * Copyright (c) 2010-2011 Elvis Presley
   4  *
   5  * This file is part of FFmpeg.
   6  *
   7  * FFmpeg is free software; you can redistribute it and/or
   8  * modify it under the terms of the GNU Lesser General Public
   9  * License as published by the Free Software Foundation; either
  10  * version 2.1 of the License, or (at your option) any later version.
  11  *
  12  * FFmpeg is distributed in the hope that it will be useful,
  13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  15  * Lesser General Public License for more details.
  16  *
  17  * You should have received a copy of the GNU Lesser General Public
  18  * License along with FFmpeg; if not, write to the Free Software
  19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20  */
  21
  22 /**
  23  * @file
  24  * Known FOURCCs: 'apch' (HQ), 'apcn' (SD), 'apcs' (LT), 'acpo' (Proxy), 'ap4h' (4444)
  25  */
  26
  27 //#define DEBUG
  28
  29 #define LONG_BITSTREAM_READER
  30
  31 #include "libavutil/internal.h"
  32 #include "avcodec.h"
  33 #include "get_bits.h"
  34 #include "idctdsp.h"
  35 #include "internal.h"
  36 #include "profiles.h"
  37 #include "simple_idct.h"
  38 #include "proresdec.h"
  39 #include "proresdata.h"
  40 #include "thread.h"
  41
  42 static void permute(uint8_t *dst, const uint8_t *src, const uint8_t permutation[64])
  43 {
  44     int i;
  45     for (i = 0; i < 64; i++)
  46         dst[i] = permutation[src[i]];
  47 }
  48
  49 #define ALPHA_SHIFT_16_TO_10(alpha_val) (alpha_val >> 6)
  50 #define ALPHA_SHIFT_8_TO_10(alpha_val)  ((alpha_val << 2) | (alpha_val >> 6))
  51 #define ALPHA_SHIFT_16_TO_12(alpha_val) (alpha_val >> 4)
  52 #define ALPHA_SHIFT_8_TO_12(alpha_val)  ((alpha_val << 4) | (alpha_val >> 4))
  53
  54 static void inline unpack_alpha(GetBitContext *gb, uint16_t *dst, int num_coeffs,
  55                                 const int num_bits, const int decode_precision) {
  56     const int mask = (1 << num_bits) - 1;
  57     int i, idx, val, alpha_val;
  58
  59     idx       = 0;
  60     alpha_val = mask;
  61     do {
  62         do {
  63             if (get_bits1(gb)) {
  64                 val = get_bits(gb, num_bits);
  65             } else {
  66                 int sign;
  67                 val  = get_bits(gb, num_bits == 16 ? 7 : 4);
  68                 sign = val & 1;
  69                 val  = (val + 2) >> 1;
  70                 if (sign)
  71                     val = -val;
  72             }
  73             alpha_val = (alpha_val + val) & mask;
  74             if (num_bits == 16) {
  75                 if (decode_precision == 10) {
  76                     dst[idx++] = ALPHA_SHIFT_16_TO_10(alpha_val);
  77                 } else { /* 12b */
  78                     dst[idx++] = ALPHA_SHIFT_16_TO_12(alpha_val);
  79                 }
  80             } else {
  81                 if (decode_precision == 10) {
  82                     dst[idx++] = ALPHA_SHIFT_8_TO_10(alpha_val);
  83                 } else { /* 12b */
  84                     dst[idx++] = ALPHA_SHIFT_8_TO_12(alpha_val);
  85                 }
  86             }
  87             if (idx >= num_coeffs)
  88                 break;
  89         } while (get_bits_left(gb)>0 && get_bits1(gb));
  90         val = get_bits(gb, 4);
  91         if (!val)
  92             val = get_bits(gb, 11);
  93         if (idx + val > num_coeffs)
  94             val = num_coeffs - idx;
  95         if (num_bits == 16) {
  96             for (i = 0; i < val; i++) {
  97                 if (decode_precision == 10) {
  98                     dst[idx++] = ALPHA_SHIFT_16_TO_10(alpha_val);
  99                 } else { /* 12b */
 100                     dst[idx++] = ALPHA_SHIFT_16_TO_12(alpha_val);
 101                 }
 102             }
 103         } else {
 104             for (i = 0; i < val; i++) {
 105                 if (decode_precision == 10) {
 106                     dst[idx++] = ALPHA_SHIFT_8_TO_10(alpha_val);
 107                 } else { /* 12b */
 108                     dst[idx++] = ALPHA_SHIFT_8_TO_12(alpha_val);
 109                 }
 110             }
 111         }
 112     } while (idx < num_coeffs);
 113 }
 114
 115 static void unpack_alpha_10(GetBitContext *gb, uint16_t *dst, int num_coeffs,
 116                             const int num_bits)
 117 {
 118     if (num_bits == 16) {
 119         unpack_alpha(gb, dst, num_coeffs, 16, 10);
 120     } else { /* 8 bits alpha */
 121         unpack_alpha(gb, dst, num_coeffs, 8, 10);
 122     }
 123 }
 124
 125 static void unpack_alpha_12(GetBitContext *gb, uint16_t *dst, int num_coeffs,
 126                             const int num_bits)
 127 {
 128     if (num_bits == 16) {
 129         unpack_alpha(gb, dst, num_coeffs, 16, 12);
 130     } else { /* 8 bits alpha */
 131         unpack_alpha(gb, dst, num_coeffs, 8, 12);
 132     }
 133 }
 134
 135 static av_cold int decode_init(AVCodecContext *avctx)
 136 {
 137     int ret = 0;
 138     ProresContext *ctx = avctx->priv_data;
 139     uint8_t idct_permutation[64];
 140
 141     avctx->bits_per_raw_sample = 10;
 142
 143     switch (avctx->codec_tag) {
 144     case MKTAG('a','p','c','o'):
 145         avctx->profile = FF_PROFILE_PRORES_PROXY;
 146         break;
 147     case MKTAG('a','p','c','s'):
 148         avctx->profile = FF_PROFILE_PRORES_LT;
 149         break;
 150     case MKTAG('a','p','c','n'):
 151         avctx->profile = FF_PROFILE_PRORES_STANDARD;
 152         break;
 153     case MKTAG('a','p','c','h'):
 154         avctx->profile = FF_PROFILE_PRORES_HQ;
 155         break;
 156     case MKTAG('a','p','4','h'):
 157         avctx->profile = FF_PROFILE_PRORES_4444;
 158         break;
 159     case MKTAG('a','p','4','x'):
 160         avctx->profile = FF_PROFILE_PRORES_XQ;
 161         break;
 162     default:
 163         avctx->profile = FF_PROFILE_UNKNOWN;
 164         av_log(avctx, AV_LOG_WARNING, "Unknown prores profile %d\n", avctx->codec_tag);
 165     }
 166
 167     ff_blockdsp_init(&ctx->bdsp, avctx);
 168     ret = ff_proresdsp_init(&ctx->prodsp, avctx);
 169     if (ret < 0) {
 170         av_log(avctx, AV_LOG_ERROR, "Fail to init proresdsp for bits per raw sample %d\n", avctx->bits_per_raw_sample);
 171         return ret;
 172     }
 173
 174     ff_init_scantable_permutation(idct_permutation,
 175                                   ctx->prodsp.idct_permutation_type);
 176
 177     permute(ctx->progressive_scan, ff_prores_progressive_scan, idct_permutation);
 178     permute(ctx->interlaced_scan, ff_prores_interlaced_scan, idct_permutation);
 179
 180     if (avctx->bits_per_raw_sample == 10){
 181         ctx->unpack_alpha = unpack_alpha_10;
 182     } else if (avctx->bits_per_raw_sample == 12){
 183         ctx->unpack_alpha = unpack_alpha_12;
 184     } else {
 185         av_log(avctx, AV_LOG_ERROR, "Fail to set unpack_alpha for bits per raw sample %d\n", avctx->bits_per_raw_sample);
 186         return AVERROR_BUG;
 187     }
 188     return ret;
 189 }
 190
 191 static int decode_frame_header(ProresContext *ctx, const uint8_t *buf,
 192                                const int data_size, AVCodecContext *avctx)
 193 {
 194     int hdr_size, width, height, flags;
 195     int version;
 196     const uint8_t *ptr;
 197
 198     hdr_size = AV_RB16(buf);
 199     ff_dlog(avctx, "header size %d\n", hdr_size);
 200     if (hdr_size > data_size) {
 201         av_log(avctx, AV_LOG_ERROR, "error, wrong header size\n");
 202         return AVERROR_INVALIDDATA;
 203     }
 204
 205     version = AV_RB16(buf + 2);
 206     ff_dlog(avctx, "%.4s version %d\n", buf+4, version);
 207     if (version > 1) {
 208         av_log(avctx, AV_LOG_ERROR, "unsupported version: %d\n", version);
 209         return AVERROR_PATCHWELCOME;
 210     }
 211
 212     width  = AV_RB16(buf + 8);
 213     height = AV_RB16(buf + 10);
 214     if (width != avctx->width || height != avctx->height) {
 215         av_log(avctx, AV_LOG_ERROR, "picture resolution change: %dx%d -> %dx%d\n",
 216                avctx->width, avctx->height, width, height);
 217         return AVERROR_PATCHWELCOME;
 218     }
 219
 220     ctx->frame_type = (buf[12] >> 2) & 3;
 221     ctx->alpha_info = buf[17] & 0xf;
 222
 223     if (ctx->alpha_info > 2) {
 224         av_log(avctx, AV_LOG_ERROR, "Invalid alpha mode %d\n", ctx->alpha_info);
 225         return AVERROR_INVALIDDATA;
 226     }
 227     if (avctx->skip_alpha) ctx->alpha_info = 0;
 228
 229     ff_dlog(avctx, "frame type %d\n", ctx->frame_type);
 230
 231     if (ctx->frame_type == 0) {
 232         ctx->scan = ctx->progressive_scan; // permuted
 233     } else {
 234         ctx->scan = ctx->interlaced_scan; // permuted
 235         ctx->frame->interlaced_frame = 1;
 236         ctx->frame->top_field_first = ctx->frame_type == 1;
 237     }
 238
 239     if (ctx->alpha_info) {
 240         avctx->pix_fmt = (buf[12] & 0xC0) == 0xC0 ? AV_PIX_FMT_YUVA444P10 : AV_PIX_FMT_YUVA422P10;
 241     } else {
 242         avctx->pix_fmt = (buf[12] & 0xC0) == 0xC0 ? AV_PIX_FMT_YUV444P10 : AV_PIX_FMT_YUV422P10;
 243     }
 244
 245     avctx->color_primaries = buf[14];
 246     avctx->color_trc       = buf[15];
 247     avctx->colorspace      = buf[16];
 248     avctx->color_range     = AVCOL_RANGE_MPEG;
 249
 250     ptr   = buf + 20;
 251     flags = buf[19];
 252     ff_dlog(avctx, "flags %x\n", flags);
 253
 254     if (flags & 2) {
 255         if(buf + data_size - ptr < 64) {
 256             av_log(avctx, AV_LOG_ERROR, "Header truncated\n");
 257             return AVERROR_INVALIDDATA;
 258         }
 259         permute(ctx->qmat_luma, ctx->prodsp.idct_permutation, ptr);
 260         ptr += 64;
 261     } else {
 262         memset(ctx->qmat_luma, 4, 64);
 263     }
 264
 265     if (flags & 1) {
 266         if(buf + data_size - ptr < 64) {
 267             av_log(avctx, AV_LOG_ERROR, "Header truncated\n");
 268             return AVERROR_INVALIDDATA;
 269         }
 270         permute(ctx->qmat_chroma, ctx->prodsp.idct_permutation, ptr);
 271     } else {
 272         memset(ctx->qmat_chroma, 4, 64);
 273     }
 274
 275     return hdr_size;
 276 }
 277
 278 static int decode_picture_header(AVCodecContext *avctx, const uint8_t *buf, const int buf_size)
 279 {
 280     ProresContext *ctx = avctx->priv_data;
 281     int i, hdr_size, slice_count;
 282     unsigned pic_data_size;
 283     int log2_slice_mb_width, log2_slice_mb_height;
 284     int slice_mb_count, mb_x, mb_y;
 285     const uint8_t *data_ptr, *index_ptr;
 286
 287     hdr_size = buf[0] >> 3;
 288     if (hdr_size < 8 || hdr_size > buf_size) {
 289         av_log(avctx, AV_LOG_ERROR, "error, wrong picture header size\n");
 290         return AVERROR_INVALIDDATA;
 291     }
 292
 293     pic_data_size = AV_RB32(buf + 1);
 294     if (pic_data_size > buf_size) {
 295         av_log(avctx, AV_LOG_ERROR, "error, wrong picture data size\n");
 296         return AVERROR_INVALIDDATA;
 297     }
 298
 299     log2_slice_mb_width  = buf[7] >> 4;
 300     log2_slice_mb_height = buf[7] & 0xF;
 301     if (log2_slice_mb_width > 3 || log2_slice_mb_height) {
 302         av_log(avctx, AV_LOG_ERROR, "unsupported slice resolution: %dx%d\n",
 303                1 << log2_slice_mb_width, 1 << log2_slice_mb_height);
 304         return AVERROR_INVALIDDATA;
 305     }
 306
 307     ctx->mb_width  = (avctx->width  + 15) >> 4;
 308     if (ctx->frame_type)
 309         ctx->mb_height = (avctx->height + 31) >> 5;
 310     else
 311         ctx->mb_height = (avctx->height + 15) >> 4;
 312
 313     // QT ignores the written value
 314     // slice_count = AV_RB16(buf + 5);
 315     slice_count = ctx->mb_height * ((ctx->mb_width >> log2_slice_mb_width) +
 316                                     av_popcount(ctx->mb_width & (1 << log2_slice_mb_width) - 1));
 317
 318     if (ctx->slice_count != slice_count || !ctx->slices) {
 319         av_freep(&ctx->slices);
 320         ctx->slice_count = 0;
 321         ctx->slices = av_mallocz_array(slice_count, sizeof(*ctx->slices));
 322         if (!ctx->slices)
 323             return AVERROR(ENOMEM);
 324         ctx->slice_count = slice_count;
 325     }
 326
 327     if (!slice_count)
 328         return AVERROR(EINVAL);
 329
 330     if (hdr_size + slice_count*2 > buf_size) {
 331         av_log(avctx, AV_LOG_ERROR, "error, wrong slice count\n");
 332         return AVERROR_INVALIDDATA;
 333     }
 334
 335     // parse slice information
 336     index_ptr = buf + hdr_size;
 337     data_ptr  = index_ptr + slice_count*2;
 338
 339     slice_mb_count = 1 << log2_slice_mb_width;
 340     mb_x = 0;
 341     mb_y = 0;
 342
 343     for (i = 0; i < slice_count; i++) {
 344         SliceContext *slice = &ctx->slices[i];
 345
 346         slice->data = data_ptr;
 347         data_ptr += AV_RB16(index_ptr + i*2);
 348
 349         while (ctx->mb_width - mb_x < slice_mb_count)
 350             slice_mb_count >>= 1;
 351
 352         slice->mb_x = mb_x;
 353         slice->mb_y = mb_y;
 354         slice->mb_count = slice_mb_count;
 355         slice->data_size = data_ptr - slice->data;
 356
 357         if (slice->data_size < 6) {
 358             av_log(avctx, AV_LOG_ERROR, "error, wrong slice data size\n");
 359             return AVERROR_INVALIDDATA;
 360         }
 361
 362         mb_x += slice_mb_count;
 363         if (mb_x == ctx->mb_width) {
 364             slice_mb_count = 1 << log2_slice_mb_width;
 365             mb_x = 0;
 366             mb_y++;
 367         }
 368         if (data_ptr > buf + buf_size) {
 369             av_log(avctx, AV_LOG_ERROR, "error, slice out of bounds\n");
 370             return AVERROR_INVALIDDATA;
 371         }
 372     }
 373
 374     if (mb_x || mb_y != ctx->mb_height) {
 375         av_log(avctx, AV_LOG_ERROR, "error wrong mb count y %d h %d\n",
 376                mb_y, ctx->mb_height);
 377         return AVERROR_INVALIDDATA;
 378     }
 379
 380     return pic_data_size;
 381 }
 382
 383 #define DECODE_CODEWORD(val, codebook, SKIP)                            \
 384     do {                                                                \
 385         unsigned int rice_order, exp_order, switch_bits;                \
 386         unsigned int q, buf, bits;                                      \
 387                                                                         \
 388         UPDATE_CACHE(re, gb);                                           \
 389         buf = GET_CACHE(re, gb);                                        \
 390                                                                         \
 391         /* number of bits to switch between rice and exp golomb */      \
 392         switch_bits =  codebook & 3;                                    \
 393         rice_order  =  codebook >> 5;                                   \
 394         exp_order   = (codebook >> 2) & 7;                              \
 395                                                                         \
 396         q = 31 - av_log2(buf);                                          \
 397                                                                         \
 398         if (q > switch_bits) { /* exp golomb */                         \
 399             bits = exp_order - switch_bits + (q<<1);                    \
 400             if (bits > FFMIN(MIN_CACHE_BITS, 31))                       \
 401                 return AVERROR_INVALIDDATA;                             \
 402             val = SHOW_UBITS(re, gb, bits) - (1 << exp_order) +         \
 403                 ((switch_bits + 1) << rice_order);                      \
 404             SKIP(re, gb, bits);                                         \
 405         } else if (rice_order) {                                        \
 406             SKIP_BITS(re, gb, q+1);                                     \
 407             val = (q << rice_order) + SHOW_UBITS(re, gb, rice_order);   \
 408             SKIP(re, gb, rice_order);                                   \
 409         } else {                                                        \
 410             val = q;                                                    \
 411             SKIP(re, gb, q+1);                                          \
 412         }                                                               \
 413     } while (0)
 414
 415 #define TOSIGNED(x) (((x) >> 1) ^ (-((x) & 1)))
 416
 417 #define FIRST_DC_CB 0xB8
 418
 419 static const uint8_t dc_codebook[7] = { 0x04, 0x28, 0x28, 0x4D, 0x4D, 0x70, 0x70};
 420
 421 static av_always_inline int decode_dc_coeffs(GetBitContext *gb, int16_t *out,
 422                                               int blocks_per_slice)
 423 {
 424     int16_t prev_dc;
 425     int code, i, sign;
 426
 427     OPEN_READER(re, gb);
 428
 429     DECODE_CODEWORD(code, FIRST_DC_CB, LAST_SKIP_BITS);
 430     prev_dc = TOSIGNED(code);
 431     out[0] = prev_dc;
 432
 433     out += 64; // dc coeff for the next block
 434
 435     code = 5;
 436     sign = 0;
 437     for (i = 1; i < blocks_per_slice; i++, out += 64) {
 438         DECODE_CODEWORD(code, dc_codebook[FFMIN(code, 6U)], LAST_SKIP_BITS);
 439         if(code) sign ^= -(code & 1);
 440         else     sign  = 0;
 441         prev_dc += (((code + 1) >> 1) ^ sign) - sign;
 442         out[0] = prev_dc;
 443     }
 444     CLOSE_READER(re, gb);
 445     return 0;
 446 }
 447
 448 // adaptive codebook switching lut according to previous run/level values
 449 static const uint8_t run_to_cb[16] = { 0x06, 0x06, 0x05, 0x05, 0x04, 0x29, 0x29, 0x29, 0x29, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x4C };
 450 static const uint8_t lev_to_cb[10] = { 0x04, 0x0A, 0x05, 0x06, 0x04, 0x28, 0x28, 0x28, 0x28, 0x4C };
 451
 452 static av_always_inline int decode_ac_coeffs(AVCodecContext *avctx, GetBitContext *gb,
 453                                              int16_t *out, int blocks_per_slice)
 454 {
 455     ProresContext *ctx = avctx->priv_data;
 456     int block_mask, sign;
 457     unsigned pos, run, level;
 458     int max_coeffs, i, bits_left;
 459     int log2_block_count = av_log2(blocks_per_slice);
 460
 461     OPEN_READER(re, gb);
 462     UPDATE_CACHE(re, gb);                                           \
 463     run   = 4;
 464     level = 2;
 465
 466     max_coeffs = 64 << log2_block_count;
 467     block_mask = blocks_per_slice - 1;
 468
 469     for (pos = block_mask;;) {
 470         bits_left = gb->size_in_bits - re_index;
 471         if (!bits_left || (bits_left < 32 && !SHOW_UBITS(re, gb, bits_left)))
 472             break;
 473
 474         DECODE_CODEWORD(run, run_to_cb[FFMIN(run,  15)], LAST_SKIP_BITS);
 475         pos += run + 1;
 476         if (pos >= max_coeffs) {
 477             av_log(avctx, AV_LOG_ERROR, "ac tex damaged %d, %d\n", pos, max_coeffs);
 478             return AVERROR_INVALIDDATA;
 479         }
 480
 481         DECODE_CODEWORD(level, lev_to_cb[FFMIN(level, 9)], SKIP_BITS);
 482         level += 1;
 483
 484         i = pos >> log2_block_count;
 485
 486         sign = SHOW_SBITS(re, gb, 1);
 487         SKIP_BITS(re, gb, 1);
 488         out[((pos & block_mask) << 6) + ctx->scan[i]] = ((level ^ sign) - sign);
 489     }
 490
 491     CLOSE_READER(re, gb);
 492     return 0;
 493 }
 494
 495 static int decode_slice_luma(AVCodecContext *avctx, SliceContext *slice,
 496                              uint16_t *dst, int dst_stride,
 497                              const uint8_t *buf, unsigned buf_size,
 498                              const int16_t *qmat)
 499 {
 500     ProresContext *ctx = avctx->priv_data;
 501     LOCAL_ALIGNED_32(int16_t, blocks, [8*4*64]);
 502     int16_t *block;
 503     GetBitContext gb;
 504     int i, blocks_per_slice = slice->mb_count<<2;
 505     int ret;
 506
 507     for (i = 0; i < blocks_per_slice; i++)
 508         ctx->bdsp.clear_block(blocks+(i<<6));
 509
 510     init_get_bits(&gb, buf, buf_size << 3);
 511
 512     if ((ret = decode_dc_coeffs(&gb, blocks, blocks_per_slice)) < 0)
 513         return ret;
 514     if ((ret = decode_ac_coeffs(avctx, &gb, blocks, blocks_per_slice)) < 0)
 515         return ret;
 516
 517     block = blocks;
 518     for (i = 0; i < slice->mb_count; i++) {
 519         ctx->prodsp.idct_put(dst, dst_stride, block+(0<<6), qmat);
 520         ctx->prodsp.idct_put(dst             +8, dst_stride, block+(1<<6), qmat);
 521         ctx->prodsp.idct_put(dst+4*dst_stride  , dst_stride, block+(2<<6), qmat);
 522         ctx->prodsp.idct_put(dst+4*dst_stride+8, dst_stride, block+(3<<6), qmat);
 523         block += 4*64;
 524         dst += 16;
 525     }
 526     return 0;
 527 }
 528
 529 static int decode_slice_chroma(AVCodecContext *avctx, SliceContext *slice,
 530                                uint16_t *dst, int dst_stride,
 531                                const uint8_t *buf, unsigned buf_size,
 532                                const int16_t *qmat, int log2_blocks_per_mb)
 533 {
 534     ProresContext *ctx = avctx->priv_data;
 535     LOCAL_ALIGNED_32(int16_t, blocks, [8*4*64]);
 536     int16_t *block;
 537     GetBitContext gb;
 538     int i, j, blocks_per_slice = slice->mb_count << log2_blocks_per_mb;
 539     int ret;
 540
 541     for (i = 0; i < blocks_per_slice; i++)
 542         ctx->bdsp.clear_block(blocks+(i<<6));
 543
 544     init_get_bits(&gb, buf, buf_size << 3);
 545
 546     if ((ret = decode_dc_coeffs(&gb, blocks, blocks_per_slice)) < 0)
 547         return ret;
 548     if ((ret = decode_ac_coeffs(avctx, &gb, blocks, blocks_per_slice)) < 0)
 549         return ret;
 550
 551     block = blocks;
 552     for (i = 0; i < slice->mb_count; i++) {
 553         for (j = 0; j < log2_blocks_per_mb; j++) {
 554             ctx->prodsp.idct_put(dst,              dst_stride, block+(0<<6), qmat);
 555             ctx->prodsp.idct_put(dst+4*dst_stride, dst_stride, block+(1<<6), qmat);
 556             block += 2*64;
 557             dst += 8;
 558         }
 559     }
 560     return 0;
 561 }
 562
 563 /**
 564  * Decode alpha slice plane.
 565  */
 566 static void decode_slice_alpha(ProresContext *ctx,
 567                                uint16_t *dst, int dst_stride,
 568                                const uint8_t *buf, int buf_size,
 569                                int blocks_per_slice)
 570 {
 571     GetBitContext gb;
 572     int i;
 573     LOCAL_ALIGNED_32(int16_t, blocks, [8*4*64]);
 574     int16_t *block;
 575
 576     for (i = 0; i < blocks_per_slice<<2; i++)
 577         ctx->bdsp.clear_block(blocks+(i<<6));
 578
 579     init_get_bits(&gb, buf, buf_size << 3);
 580
 581     if (ctx->alpha_info == 2) {
 582         ctx->unpack_alpha(&gb, blocks, blocks_per_slice * 4 * 64, 16);
 583     } else {
 584         ctx->unpack_alpha(&gb, blocks, blocks_per_slice * 4 * 64, 8);
 585     }
 586
 587     block = blocks;
 588     for (i = 0; i < 16; i++) {
 589         memcpy(dst, block, 16 * blocks_per_slice * sizeof(*dst));
 590         dst   += dst_stride >> 1;
 591         block += 16 * blocks_per_slice;
 592     }
 593 }
 594
 595 static int decode_slice_thread(AVCodecContext *avctx, void *arg, int jobnr, int threadnr)
 596 {
 597     ProresContext *ctx = avctx->priv_data;
 598     SliceContext *slice = &ctx->slices[jobnr];
 599     const uint8_t *buf = slice->data;
 600     AVFrame *pic = ctx->frame;
 601     int i, hdr_size, qscale, log2_chroma_blocks_per_mb;
 602     int luma_stride, chroma_stride;
 603     int y_data_size, u_data_size, v_data_size, a_data_size;
 604     uint8_t *dest_y, *dest_u, *dest_v, *dest_a;
 605     LOCAL_ALIGNED_16(int16_t, qmat_luma_scaled,  [64]);
 606     LOCAL_ALIGNED_16(int16_t, qmat_chroma_scaled,[64]);
 607     int mb_x_shift;
 608     int ret;
 609
 610     slice->ret = -1;
 611     //av_log(avctx, AV_LOG_INFO, "slice %d mb width %d mb x %d y %d\n",
 612     //       jobnr, slice->mb_count, slice->mb_x, slice->mb_y);
 613
 614     // slice header
 615     hdr_size = buf[0] >> 3;
 616     qscale = av_clip(buf[1], 1, 224);
 617     qscale = qscale > 128 ? qscale - 96 << 2: qscale;
 618     y_data_size = AV_RB16(buf + 2);
 619     u_data_size = AV_RB16(buf + 4);
 620     v_data_size = slice->data_size - y_data_size - u_data_size - hdr_size;
 621     if (hdr_size > 7) v_data_size = AV_RB16(buf + 6);
 622     a_data_size = slice->data_size - y_data_size - u_data_size -
 623                   v_data_size - hdr_size;
 624
 625     if (y_data_size < 0 || u_data_size < 0 || v_data_size < 0
 626         || hdr_size+y_data_size+u_data_size+v_data_size > slice->data_size){
 627         av_log(avctx, AV_LOG_ERROR, "invalid plane data size\n");
 628         return AVERROR_INVALIDDATA;
 629     }
 630
 631     buf += hdr_size;
 632
 633     for (i = 0; i < 64; i++) {
 634         qmat_luma_scaled  [i] = ctx->qmat_luma  [i] * qscale;
 635         qmat_chroma_scaled[i] = ctx->qmat_chroma[i] * qscale;
 636     }
 637
 638     if (ctx->frame_type == 0) {
 639         luma_stride   = pic->linesize[0];
 640         chroma_stride = pic->linesize[1];
 641     } else {
 642         luma_stride   = pic->linesize[0] << 1;
 643         chroma_stride = pic->linesize[1] << 1;
 644     }
 645
 646     if (avctx->pix_fmt == AV_PIX_FMT_YUV444P10 || avctx->pix_fmt == AV_PIX_FMT_YUVA444P10) {
 647         mb_x_shift = 5;
 648         log2_chroma_blocks_per_mb = 2;
 649     } else {
 650         mb_x_shift = 4;
 651         log2_chroma_blocks_per_mb = 1;
 652     }
 653
 654     dest_y = pic->data[0] + (slice->mb_y << 4) * luma_stride + (slice->mb_x << 5);
 655     dest_u = pic->data[1] + (slice->mb_y << 4) * chroma_stride + (slice->mb_x << mb_x_shift);
 656     dest_v = pic->data[2] + (slice->mb_y << 4) * chroma_stride + (slice->mb_x << mb_x_shift);
 657     dest_a = pic->data[3] + (slice->mb_y << 4) * luma_stride + (slice->mb_x << 5);
 658
 659     if (ctx->frame_type && ctx->first_field ^ ctx->frame->top_field_first) {
 660         dest_y += pic->linesize[0];
 661         dest_u += pic->linesize[1];
 662         dest_v += pic->linesize[2];
 663         dest_a += pic->linesize[3];
 664     }
 665
 666     ret = decode_slice_luma(avctx, slice, (uint16_t*)dest_y, luma_stride,
 667                             buf, y_data_size, qmat_luma_scaled);
 668     if (ret < 0)
 669         return ret;
 670
 671     if (!(avctx->flags & AV_CODEC_FLAG_GRAY) && (u_data_size + v_data_size) > 0) {
 672         ret = decode_slice_chroma(avctx, slice, (uint16_t*)dest_u, chroma_stride,
 673                                   buf + y_data_size, u_data_size,
 674                                   qmat_chroma_scaled, log2_chroma_blocks_per_mb);
 675         if (ret < 0)
 676             return ret;
 677
 678         ret = decode_slice_chroma(avctx, slice, (uint16_t*)dest_v, chroma_stride,
 679                                   buf + y_data_size + u_data_size, v_data_size,
 680                                   qmat_chroma_scaled, log2_chroma_blocks_per_mb);
 681         if (ret < 0)
 682             return ret;
 683     }
 684     else {
 685         size_t mb_max_x = slice->mb_count << (mb_x_shift - 1);
 686         size_t i, j;
 687         for (i = 0; i < 16; ++i)
 688             for (j = 0; j < mb_max_x; ++j) {
 689                 *(uint16_t*)(dest_u + (i * chroma_stride) + (j << 1)) = 511;
 690                 *(uint16_t*)(dest_v + (i * chroma_stride) + (j << 1)) = 511;
 691             }
 692     }
 693
 694     /* decode alpha plane if available */
 695     if (ctx->alpha_info && pic->data[3] && a_data_size)
 696         decode_slice_alpha(ctx, (uint16_t*)dest_a, luma_stride,
 697                            buf + y_data_size + u_data_size + v_data_size,
 698                            a_data_size, slice->mb_count);
 699
 700     slice->ret = 0;
 701     return 0;
 702 }
 703
 704 static int decode_picture(AVCodecContext *avctx)
 705 {
 706     ProresContext *ctx = avctx->priv_data;
 707     int i;
 708     int error = 0;
 709
 710     avctx->execute2(avctx, decode_slice_thread, NULL, NULL, ctx->slice_count);
 711
 712     for (i = 0; i < ctx->slice_count; i++)
 713         error += ctx->slices[i].ret < 0;
 714
 715     if (error)
 716         ctx->frame->decode_error_flags = FF_DECODE_ERROR_INVALID_BITSTREAM;
 717     if (error < ctx->slice_count)
 718         return 0;
 719
 720     return ctx->slices[0].ret;
 721 }
 722
 723 static int decode_frame(AVCodecContext *avctx, void *data, int *got_frame,
 724                         AVPacket *avpkt)
 725 {
 726     ProresContext *ctx = avctx->priv_data;
 727     ThreadFrame tframe = { .f = data };
 728     AVFrame *frame = data;
 729     const uint8_t *buf = avpkt->data;
 730     int buf_size = avpkt->size;
 731     int frame_hdr_size, pic_size, ret;
 732
 733     if (buf_size < 28 || AV_RL32(buf + 4) != AV_RL32("icpf")) {
 734         av_log(avctx, AV_LOG_ERROR, "invalid frame header\n");
 735         return AVERROR_INVALIDDATA;
 736     }
 737
 738     ctx->frame = frame;
 739     ctx->frame->pict_type = AV_PICTURE_TYPE_I;
 740     ctx->frame->key_frame = 1;
 741     ctx->first_field = 1;
 742
 743     buf += 8;
 744     buf_size -= 8;
 745
 746     frame_hdr_size = decode_frame_header(ctx, buf, buf_size, avctx);
 747     if (frame_hdr_size < 0)
 748         return frame_hdr_size;
 749
 750     buf += frame_hdr_size;
 751     buf_size -= frame_hdr_size;
 752
 753     if ((ret = ff_thread_get_buffer(avctx, &tframe, 0)) < 0)
 754         return ret;
 755
 756  decode_picture:
 757     pic_size = decode_picture_header(avctx, buf, buf_size);
 758     if (pic_size < 0) {
 759         av_log(avctx, AV_LOG_ERROR, "error decoding picture header\n");
 760         return pic_size;
 761     }
 762
 763     if ((ret = decode_picture(avctx)) < 0) {
 764         av_log(avctx, AV_LOG_ERROR, "error decoding picture\n");
 765         return ret;
 766     }
 767
 768     buf += pic_size;
 769     buf_size -= pic_size;
 770
 771     if (ctx->frame_type && buf_size > 0 && ctx->first_field) {
 772         ctx->first_field = 0;
 773         goto decode_picture;
 774     }
 775
 776     *got_frame      = 1;
 777
 778     return avpkt->size;
 779 }
 780
 781 #if HAVE_THREADS
 782 static int decode_init_thread_copy(AVCodecContext *avctx)
 783 {
 784     ProresContext *ctx = avctx->priv_data;
 785
 786     ctx->slices = NULL;
 787
 788     return 0;
 789 }
 790 #endif
 791
 792 static av_cold int decode_close(AVCodecContext *avctx)
 793 {
 794     ProresContext *ctx = avctx->priv_data;
 795
 796     av_freep(&ctx->slices);
 797
 798     return 0;
 799 }
 800
 801 AVCodec ff_prores_decoder = {
 802     .name           = "prores",
 803     .long_name      = NULL_IF_CONFIG_SMALL("ProRes (iCodec Pro)"),
 804     .type           = AVMEDIA_TYPE_VIDEO,
 805     .id             = AV_CODEC_ID_PRORES,
 806     .priv_data_size = sizeof(ProresContext),
 807     .init           = decode_init,
 808     .init_thread_copy = ONLY_IF_THREADS_ENABLED(decode_init_thread_copy),
 809     .close          = decode_close,
 810     .decode         = decode_frame,
 811     .capabilities   = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_SLICE_THREADS | AV_CODEC_CAP_FRAME_THREADS,
 812     .profiles       = NULL_IF_CONFIG_SMALL(ff_prores_profiles),
 813 };