git.sesse.net Git - ffmpeg/blob - libavcodec/proresdec2.c

   1 /*
   2  * Copyright (c) 2010-2011 Maxim Poliakovski
   3  * Copyright (c) 2010-2011 Elvis Presley
   4  *
   5  * This file is part of FFmpeg.
   6  *
   7  * FFmpeg is free software; you can redistribute it and/or
   8  * modify it under the terms of the GNU Lesser General Public
   9  * License as published by the Free Software Foundation; either
  10  * version 2.1 of the License, or (at your option) any later version.
  11  *
  12  * FFmpeg is distributed in the hope that it will be useful,
  13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  15  * Lesser General Public License for more details.
  16  *
  17  * You should have received a copy of the GNU Lesser General Public
  18  * License along with FFmpeg; if not, write to the Free Software
  19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20  */
  21
  22 /**
  23  * @file
 * Known FOURCCs: 'apch' (HQ), 'apcn' (SD), 'apcs' (LT), 'apco' (Proxy), 'ap4h' (4444), 'ap4x' (XQ)
  25  */
  26
  27 //#define DEBUG
  28
  29 #define LONG_BITSTREAM_READER
  30
  31 #include "libavutil/internal.h"
  32 #include "avcodec.h"
  33 #include "get_bits.h"
  34 #include "idctdsp.h"
  35 #include "internal.h"
  36 #include "profiles.h"
  37 #include "simple_idct.h"
  38 #include "proresdec.h"
  39 #include "proresdata.h"
  40 #include "thread.h"
  41
  42 static void permute(uint8_t *dst, const uint8_t *src, const uint8_t permutation[64])
  43 {
  44     int i;
  45     for (i = 0; i < 64; i++)
  46         dst[i] = permutation[src[i]];
  47 }
  48
  49 #define ALPHA_SHIFT_16_TO_10(alpha_val) (alpha_val >> 6)
  50 #define ALPHA_SHIFT_8_TO_10(alpha_val)  ((alpha_val << 2) | (alpha_val >> 6))
  51 #define ALPHA_SHIFT_16_TO_12(alpha_val) (alpha_val >> 4)
  52 #define ALPHA_SHIFT_8_TO_12(alpha_val)  ((alpha_val << 4) | (alpha_val >> 4))
  53
  54 static void inline unpack_alpha(GetBitContext *gb, uint16_t *dst, int num_coeffs,
  55                                 const int num_bits, const int decode_precision) {
  56     const int mask = (1 << num_bits) - 1;
  57     int i, idx, val, alpha_val;
  58
  59     idx       = 0;
  60     alpha_val = mask;
  61     do {
  62         do {
  63             if (get_bits1(gb)) {
  64                 val = get_bits(gb, num_bits);
  65             } else {
  66                 int sign;
  67                 val  = get_bits(gb, num_bits == 16 ? 7 : 4);
  68                 sign = val & 1;
  69                 val  = (val + 2) >> 1;
  70                 if (sign)
  71                     val = -val;
  72             }
  73             alpha_val = (alpha_val + val) & mask;
  74             if (num_bits == 16) {
  75                 if (decode_precision == 10) {
  76                     dst[idx++] = ALPHA_SHIFT_16_TO_10(alpha_val);
  77                 } else { /* 12b */
  78                     dst[idx++] = ALPHA_SHIFT_16_TO_12(alpha_val);
  79                 }
  80             } else {
  81                 if (decode_precision == 10) {
  82                     dst[idx++] = ALPHA_SHIFT_8_TO_10(alpha_val);
  83                 } else { /* 12b */
  84                     dst[idx++] = ALPHA_SHIFT_8_TO_12(alpha_val);
  85                 }
  86             }
  87             if (idx >= num_coeffs)
  88                 break;
  89         } while (get_bits_left(gb)>0 && get_bits1(gb));
  90         val = get_bits(gb, 4);
  91         if (!val)
  92             val = get_bits(gb, 11);
  93         if (idx + val > num_coeffs)
  94             val = num_coeffs - idx;
  95         if (num_bits == 16) {
  96             for (i = 0; i < val; i++) {
  97                 if (decode_precision == 10) {
  98                     dst[idx++] = ALPHA_SHIFT_16_TO_10(alpha_val);
  99                 } else { /* 12b */
 100                     dst[idx++] = ALPHA_SHIFT_16_TO_12(alpha_val);
 101                 }
 102             }
 103         } else {
 104             for (i = 0; i < val; i++) {
 105                 if (decode_precision == 10) {
 106                     dst[idx++] = ALPHA_SHIFT_8_TO_10(alpha_val);
 107                 } else { /* 12b */
 108                     dst[idx++] = ALPHA_SHIFT_8_TO_12(alpha_val);
 109                 }
 110             }
 111         }
 112     } while (idx < num_coeffs);
 113 }
 114
 115 static void unpack_alpha_10(GetBitContext *gb, uint16_t *dst, int num_coeffs,
 116                             const int num_bits)
 117 {
 118     if (num_bits == 16) {
 119         unpack_alpha(gb, dst, num_coeffs, 16, 10);
 120     } else { /* 8 bits alpha */
 121         unpack_alpha(gb, dst, num_coeffs, 8, 10);
 122     }
 123 }
 124
 125 static void unpack_alpha_12(GetBitContext *gb, uint16_t *dst, int num_coeffs,
 126                             const int num_bits)
 127 {
 128     if (num_bits == 16) {
 129         unpack_alpha(gb, dst, num_coeffs, 16, 12);
 130     } else { /* 8 bits alpha */
 131         unpack_alpha(gb, dst, num_coeffs, 8, 12);
 132     }
 133 }
 134
 135 static av_cold int decode_init(AVCodecContext *avctx)
 136 {
 137     int ret = 0;
 138     ProresContext *ctx = avctx->priv_data;
 139     uint8_t idct_permutation[64];
 140
 141     avctx->bits_per_raw_sample = 10;
 142
 143     switch (avctx->codec_tag) {
 144     case MKTAG('a','p','c','o'):
 145         avctx->profile = FF_PROFILE_PRORES_PROXY;
 146         break;
 147     case MKTAG('a','p','c','s'):
 148         avctx->profile = FF_PROFILE_PRORES_LT;
 149         break;
 150     case MKTAG('a','p','c','n'):
 151         avctx->profile = FF_PROFILE_PRORES_STANDARD;
 152         break;
 153     case MKTAG('a','p','c','h'):
 154         avctx->profile = FF_PROFILE_PRORES_HQ;
 155         break;
 156     case MKTAG('a','p','4','h'):
 157         avctx->profile = FF_PROFILE_PRORES_4444;
 158         avctx->bits_per_raw_sample = 12;
 159         break;
 160     case MKTAG('a','p','4','x'):
 161         avctx->profile = FF_PROFILE_PRORES_XQ;
 162         avctx->bits_per_raw_sample = 12;
 163         break;
 164     default:
 165         avctx->profile = FF_PROFILE_UNKNOWN;
 166         av_log(avctx, AV_LOG_WARNING, "Unknown prores profile %d\n", avctx->codec_tag);
 167     }
 168
 169     if (avctx->bits_per_raw_sample == 10) {
 170         av_log(avctx, AV_LOG_DEBUG, "Auto bitdepth precision. Use 10b decoding based on codec tag.\n");
 171     } else { /* 12b */
 172         av_log(avctx, AV_LOG_DEBUG, "Auto bitdepth precision. Use 12b decoding based on codec tag.\n");
 173     }
 174
 175     ff_blockdsp_init(&ctx->bdsp, avctx);
 176     ret = ff_proresdsp_init(&ctx->prodsp, avctx);
 177     if (ret < 0) {
 178         av_log(avctx, AV_LOG_ERROR, "Fail to init proresdsp for bits per raw sample %d\n", avctx->bits_per_raw_sample);
 179         return ret;
 180     }
 181
 182     ff_init_scantable_permutation(idct_permutation,
 183                                   ctx->prodsp.idct_permutation_type);
 184
 185     permute(ctx->progressive_scan, ff_prores_progressive_scan, idct_permutation);
 186     permute(ctx->interlaced_scan, ff_prores_interlaced_scan, idct_permutation);
 187
 188     if (avctx->bits_per_raw_sample == 10){
 189         ctx->unpack_alpha = unpack_alpha_10;
 190     } else if (avctx->bits_per_raw_sample == 12){
 191         ctx->unpack_alpha = unpack_alpha_12;
 192     } else {
 193         av_log(avctx, AV_LOG_ERROR, "Fail to set unpack_alpha for bits per raw sample %d\n", avctx->bits_per_raw_sample);
 194         return AVERROR_BUG;
 195     }
 196     return ret;
 197 }
 198
 199 static int decode_frame_header(ProresContext *ctx, const uint8_t *buf,
 200                                const int data_size, AVCodecContext *avctx)
 201 {
 202     int hdr_size, width, height, flags;
 203     int version;
 204     const uint8_t *ptr;
 205
 206     hdr_size = AV_RB16(buf);
 207     ff_dlog(avctx, "header size %d\n", hdr_size);
 208     if (hdr_size > data_size) {
 209         av_log(avctx, AV_LOG_ERROR, "error, wrong header size\n");
 210         return AVERROR_INVALIDDATA;
 211     }
 212
 213     version = AV_RB16(buf + 2);
 214     ff_dlog(avctx, "%.4s version %d\n", buf+4, version);
 215     if (version > 1) {
 216         av_log(avctx, AV_LOG_ERROR, "unsupported version: %d\n", version);
 217         return AVERROR_PATCHWELCOME;
 218     }
 219
 220     width  = AV_RB16(buf + 8);
 221     height = AV_RB16(buf + 10);
 222
 223     if (width != avctx->width || height != avctx->height) {
 224         av_log(avctx, AV_LOG_ERROR, "picture resolution change: %dx%d -> %dx%d\n",
 225                avctx->width, avctx->height, width, height);
 226         return AVERROR_PATCHWELCOME;
 227     }
 228
 229     ctx->frame_type = (buf[12] >> 2) & 3;
 230     ctx->alpha_info = buf[17] & 0xf;
 231
 232     if (ctx->alpha_info > 2) {
 233         av_log(avctx, AV_LOG_ERROR, "Invalid alpha mode %d\n", ctx->alpha_info);
 234         return AVERROR_INVALIDDATA;
 235     }
 236     if (avctx->skip_alpha) ctx->alpha_info = 0;
 237
 238     ff_dlog(avctx, "frame type %d\n", ctx->frame_type);
 239
 240     if (ctx->frame_type == 0) {
 241         ctx->scan = ctx->progressive_scan; // permuted
 242     } else {
 243         ctx->scan = ctx->interlaced_scan; // permuted
 244         ctx->frame->interlaced_frame = 1;
 245         ctx->frame->top_field_first = ctx->frame_type == 1;
 246     }
 247
 248     if (ctx->alpha_info) {
 249         if (avctx->bits_per_raw_sample == 10) {
 250             avctx->pix_fmt = (buf[12] & 0xC0) == 0xC0 ? AV_PIX_FMT_YUVA444P10 : AV_PIX_FMT_YUVA422P10;
 251         } else { /* 12b */
 252             avctx->pix_fmt = (buf[12] & 0xC0) == 0xC0 ? AV_PIX_FMT_YUVA444P12 : AV_PIX_FMT_YUVA422P12;
 253         }
 254     } else {
 255         if (avctx->bits_per_raw_sample == 10) {
 256             avctx->pix_fmt = (buf[12] & 0xC0) == 0xC0 ? AV_PIX_FMT_YUV444P10 : AV_PIX_FMT_YUV422P10;
 257         } else { /* 12b */
 258             avctx->pix_fmt = (buf[12] & 0xC0) == 0xC0 ? AV_PIX_FMT_YUV444P12 : AV_PIX_FMT_YUV422P12;
 259         }
 260     }
 261
 262     avctx->color_primaries = buf[14];
 263     avctx->color_trc       = buf[15];
 264     avctx->colorspace      = buf[16];
 265     avctx->color_range     = AVCOL_RANGE_MPEG;
 266
 267     ptr   = buf + 20;
 268     flags = buf[19];
 269     ff_dlog(avctx, "flags %x\n", flags);
 270
 271     if (flags & 2) {
 272         if(buf + data_size - ptr < 64) {
 273             av_log(avctx, AV_LOG_ERROR, "Header truncated\n");
 274             return AVERROR_INVALIDDATA;
 275         }
 276         permute(ctx->qmat_luma, ctx->prodsp.idct_permutation, ptr);
 277         ptr += 64;
 278     } else {
 279         memset(ctx->qmat_luma, 4, 64);
 280     }
 281
 282     if (flags & 1) {
 283         if(buf + data_size - ptr < 64) {
 284             av_log(avctx, AV_LOG_ERROR, "Header truncated\n");
 285             return AVERROR_INVALIDDATA;
 286         }
 287         permute(ctx->qmat_chroma, ctx->prodsp.idct_permutation, ptr);
 288     } else {
 289         memset(ctx->qmat_chroma, 4, 64);
 290     }
 291
 292     return hdr_size;
 293 }
 294
 295 static int decode_picture_header(AVCodecContext *avctx, const uint8_t *buf, const int buf_size)
 296 {
 297     ProresContext *ctx = avctx->priv_data;
 298     int i, hdr_size, slice_count;
 299     unsigned pic_data_size;
 300     int log2_slice_mb_width, log2_slice_mb_height;
 301     int slice_mb_count, mb_x, mb_y;
 302     const uint8_t *data_ptr, *index_ptr;
 303
 304     hdr_size = buf[0] >> 3;
 305     if (hdr_size < 8 || hdr_size > buf_size) {
 306         av_log(avctx, AV_LOG_ERROR, "error, wrong picture header size\n");
 307         return AVERROR_INVALIDDATA;
 308     }
 309
 310     pic_data_size = AV_RB32(buf + 1);
 311     if (pic_data_size > buf_size) {
 312         av_log(avctx, AV_LOG_ERROR, "error, wrong picture data size\n");
 313         return AVERROR_INVALIDDATA;
 314     }
 315
 316     log2_slice_mb_width  = buf[7] >> 4;
 317     log2_slice_mb_height = buf[7] & 0xF;
 318     if (log2_slice_mb_width > 3 || log2_slice_mb_height) {
 319         av_log(avctx, AV_LOG_ERROR, "unsupported slice resolution: %dx%d\n",
 320                1 << log2_slice_mb_width, 1 << log2_slice_mb_height);
 321         return AVERROR_INVALIDDATA;
 322     }
 323
 324     ctx->mb_width  = (avctx->width  + 15) >> 4;
 325     if (ctx->frame_type)
 326         ctx->mb_height = (avctx->height + 31) >> 5;
 327     else
 328         ctx->mb_height = (avctx->height + 15) >> 4;
 329
 330     // QT ignores the written value
 331     // slice_count = AV_RB16(buf + 5);
 332     slice_count = ctx->mb_height * ((ctx->mb_width >> log2_slice_mb_width) +
 333                                     av_popcount(ctx->mb_width & (1 << log2_slice_mb_width) - 1));
 334
 335     if (ctx->slice_count != slice_count || !ctx->slices) {
 336         av_freep(&ctx->slices);
 337         ctx->slice_count = 0;
 338         ctx->slices = av_mallocz_array(slice_count, sizeof(*ctx->slices));
 339         if (!ctx->slices)
 340             return AVERROR(ENOMEM);
 341         ctx->slice_count = slice_count;
 342     }
 343
 344     if (!slice_count)
 345         return AVERROR(EINVAL);
 346
 347     if (hdr_size + slice_count*2 > buf_size) {
 348         av_log(avctx, AV_LOG_ERROR, "error, wrong slice count\n");
 349         return AVERROR_INVALIDDATA;
 350     }
 351
 352     // parse slice information
 353     index_ptr = buf + hdr_size;
 354     data_ptr  = index_ptr + slice_count*2;
 355
 356     slice_mb_count = 1 << log2_slice_mb_width;
 357     mb_x = 0;
 358     mb_y = 0;
 359
 360     for (i = 0; i < slice_count; i++) {
 361         SliceContext *slice = &ctx->slices[i];
 362
 363         slice->data = data_ptr;
 364         data_ptr += AV_RB16(index_ptr + i*2);
 365
 366         while (ctx->mb_width - mb_x < slice_mb_count)
 367             slice_mb_count >>= 1;
 368
 369         slice->mb_x = mb_x;
 370         slice->mb_y = mb_y;
 371         slice->mb_count = slice_mb_count;
 372         slice->data_size = data_ptr - slice->data;
 373
 374         if (slice->data_size < 6) {
 375             av_log(avctx, AV_LOG_ERROR, "error, wrong slice data size\n");
 376             return AVERROR_INVALIDDATA;
 377         }
 378
 379         mb_x += slice_mb_count;
 380         if (mb_x == ctx->mb_width) {
 381             slice_mb_count = 1 << log2_slice_mb_width;
 382             mb_x = 0;
 383             mb_y++;
 384         }
 385         if (data_ptr > buf + buf_size) {
 386             av_log(avctx, AV_LOG_ERROR, "error, slice out of bounds\n");
 387             return AVERROR_INVALIDDATA;
 388         }
 389     }
 390
 391     if (mb_x || mb_y != ctx->mb_height) {
 392         av_log(avctx, AV_LOG_ERROR, "error wrong mb count y %d h %d\n",
 393                mb_y, ctx->mb_height);
 394         return AVERROR_INVALIDDATA;
 395     }
 396
 397     return pic_data_size;
 398 }
 399
/**
 * Read one variable-length codeword from the bitstream into val.
 *
 * Must be expanded inside a function that has an open reader named "re" on
 * a GetBitContext named "gb"; the macro refreshes the cache itself.
 *
 * The codebook byte is split into three fields:
 *   - bits 0-1: switch_bits, the prefix length at which coding switches
 *               from Rice to exp-Golomb
 *   - bits 2-4: exp_order
 *   - bits 5+ : rice_order
 *
 * q is 31 - av_log2() of the cached bits, presumably the number of leading
 * zero bits in the 32-bit cache word. When q exceeds switch_bits the
 * exp-Golomb branch is taken; otherwise the value is Rice coded, or plain
 * unary when rice_order is 0.
 *
 * @param val      lvalue receiving the decoded value
 * @param codebook codebook descriptor byte as described above
 * @param SKIP     name of the skip macro used for the final bit skip of the
 *                 codeword (callers pass SKIP_BITS or LAST_SKIP_BITS)
 *
 * NOTE: the macro contains a return statement: the enclosing function
 * returns AVERROR_INVALIDDATA when an exp-Golomb codeword would be longer
 * than FFMIN(MIN_CACHE_BITS, 31) bits. It also declares locals named
 * rice_order, exp_order, switch_bits, q, buf and bits, so val and codebook
 * must not refer to caller variables with those names.
 */
#define DECODE_CODEWORD(val, codebook, SKIP)                            \
    do {                                                                \
        unsigned int rice_order, exp_order, switch_bits;                \
        unsigned int q, buf, bits;                                      \
                                                                        \
        UPDATE_CACHE(re, gb);                                           \
        buf = GET_CACHE(re, gb);                                        \
                                                                        \
        /* number of bits to switch between rice and exp golomb */      \
        switch_bits =  codebook & 3;                                    \
        rice_order  =  codebook >> 5;                                   \
        exp_order   = (codebook >> 2) & 7;                              \
                                                                        \
        q = 31 - av_log2(buf);                                          \
                                                                        \
        if (q > switch_bits) { /* exp golomb */                         \
            bits = exp_order - switch_bits + (q<<1);                    \
            if (bits > FFMIN(MIN_CACHE_BITS, 31))                       \
                return AVERROR_INVALIDDATA;                             \
            val = SHOW_UBITS(re, gb, bits) - (1 << exp_order) +         \
                ((switch_bits + 1) << rice_order);                      \
            SKIP(re, gb, bits);                                         \
        } else if (rice_order) {                                        \
            SKIP_BITS(re, gb, q+1);                                     \
            val = (q << rice_order) + SHOW_UBITS(re, gb, rice_order);   \
            SKIP(re, gb, rice_order);                                   \
        } else {                                                        \
            val = q;                                                    \
            SKIP(re, gb, q+1);                                          \
        }                                                               \
    } while (0)
 431
/* Map an unsigned code to a signed value: even x -> x/2, odd x -> -(x+1)/2. */
#define TOSIGNED(x) (((x) >> 1) ^ (-((x) & 1)))

/* Codebook descriptor used for the first DC coefficient of a slice. */
#define FIRST_DC_CB 0xB8

/* Codebook descriptors for the following DC differences, indexed by the
 * previously decoded code clamped to 6 (see decode_dc_coeffs()). */
static const uint8_t dc_codebook[7] = { 0x04, 0x28, 0x28, 0x4D, 0x4D, 0x70, 0x70};
 437
/**
 * Decode the DC coefficients of all blocks in a slice plane.
 *
 * The first DC is coded directly with FIRST_DC_CB; every following DC is
 * coded as a difference from the previous one, using a codebook chosen from
 * the previous code value.
 *
 * @param gb               bit reader positioned at the start of the plane data
 * @param out              coefficient storage; the DC of block n is written
 *                         to out[n * 64]
 * @param blocks_per_slice number of blocks to decode
 * @return 0 on success; AVERROR_INVALIDDATA is returned from inside
 *         DECODE_CODEWORD when a codeword is too long
 */
static av_always_inline int decode_dc_coeffs(GetBitContext *gb, int16_t *out,
                                              int blocks_per_slice)
{
    int16_t prev_dc;
    int code, i, sign;

    OPEN_READER(re, gb);

    /* first DC: coded as an absolute, sign-folded value */
    DECODE_CODEWORD(code, FIRST_DC_CB, LAST_SKIP_BITS);
    prev_dc = TOSIGNED(code);
    out[0] = prev_dc;

    out += 64; // dc coeff for the next block

    /* initial state: picks dc_codebook[5] for the first difference */
    code = 5;
    sign = 0;
    for (i = 1; i < blocks_per_slice; i++, out += 64) {
        DECODE_CODEWORD(code, dc_codebook[FFMIN(code, 6U)], LAST_SKIP_BITS);
        /* sign is 0 or -1: an odd code flips it relative to the previous
         * difference, a zero code resets it */
        if(code) sign ^= -(code & 1);
        else     sign  = 0;
        /* magnitude is (code + 1) / 2, negated when sign is -1 */
        prev_dc += (((code + 1) >> 1) ^ sign) - sign;
        out[0] = prev_dc;
    }
    CLOSE_READER(re, gb);
    return 0;
}
 464
// Adaptive codebook selection tables for AC decoding: the codebook descriptor
// for the next run is run_to_cb[min(previous run, 15)] and for the next level
// lev_to_cb[min(previous level, 9)] (see decode_ac_coeffs()).
static const uint8_t run_to_cb[16] = { 0x06, 0x06, 0x05, 0x05, 0x04, 0x29, 0x29, 0x29, 0x29, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x4C };
static const uint8_t lev_to_cb[10] = { 0x04, 0x0A, 0x05, 0x06, 0x04, 0x28, 0x28, 0x28, 0x28, 0x4C };
 468
 469 static av_always_inline int decode_ac_coeffs(AVCodecContext *avctx, GetBitContext *gb,
 470                                              int16_t *out, int blocks_per_slice)
 471 {
 472     ProresContext *ctx = avctx->priv_data;
 473     int block_mask, sign;
 474     unsigned pos, run, level;
 475     int max_coeffs, i, bits_left;
 476     int log2_block_count = av_log2(blocks_per_slice);
 477
 478     OPEN_READER(re, gb);
 479     UPDATE_CACHE(re, gb);                                           \
 480     run   = 4;
 481     level = 2;
 482
 483     max_coeffs = 64 << log2_block_count;
 484     block_mask = blocks_per_slice - 1;
 485
 486     for (pos = block_mask;;) {
 487         bits_left = gb->size_in_bits - re_index;
 488         if (!bits_left || (bits_left < 32 && !SHOW_UBITS(re, gb, bits_left)))
 489             break;
 490
 491         DECODE_CODEWORD(run, run_to_cb[FFMIN(run,  15)], LAST_SKIP_BITS);
 492         pos += run + 1;
 493         if (pos >= max_coeffs) {
 494             av_log(avctx, AV_LOG_ERROR, "ac tex damaged %d, %d\n", pos, max_coeffs);
 495             return AVERROR_INVALIDDATA;
 496         }
 497
 498         DECODE_CODEWORD(level, lev_to_cb[FFMIN(level, 9)], SKIP_BITS);
 499         level += 1;
 500
 501         i = pos >> log2_block_count;
 502
 503         sign = SHOW_SBITS(re, gb, 1);
 504         SKIP_BITS(re, gb, 1);
 505         out[((pos & block_mask) << 6) + ctx->scan[i]] = ((level ^ sign) - sign);
 506     }
 507
 508     CLOSE_READER(re, gb);
 509     return 0;
 510 }
 511
 512 static int decode_slice_luma(AVCodecContext *avctx, SliceContext *slice,
 513                              uint16_t *dst, int dst_stride,
 514                              const uint8_t *buf, unsigned buf_size,
 515                              const int16_t *qmat)
 516 {
 517     ProresContext *ctx = avctx->priv_data;
 518     LOCAL_ALIGNED_32(int16_t, blocks, [8*4*64]);
 519     int16_t *block;
 520     GetBitContext gb;
 521     int i, blocks_per_slice = slice->mb_count<<2;
 522     int ret;
 523
 524     for (i = 0; i < blocks_per_slice; i++)
 525         ctx->bdsp.clear_block(blocks+(i<<6));
 526
 527     init_get_bits(&gb, buf, buf_size << 3);
 528
 529     if ((ret = decode_dc_coeffs(&gb, blocks, blocks_per_slice)) < 0)
 530         return ret;
 531     if ((ret = decode_ac_coeffs(avctx, &gb, blocks, blocks_per_slice)) < 0)
 532         return ret;
 533
 534     block = blocks;
 535     for (i = 0; i < slice->mb_count; i++) {
 536         ctx->prodsp.idct_put(dst, dst_stride, block+(0<<6), qmat);
 537         ctx->prodsp.idct_put(dst             +8, dst_stride, block+(1<<6), qmat);
 538         ctx->prodsp.idct_put(dst+4*dst_stride  , dst_stride, block+(2<<6), qmat);
 539         ctx->prodsp.idct_put(dst+4*dst_stride+8, dst_stride, block+(3<<6), qmat);
 540         block += 4*64;
 541         dst += 16;
 542     }
 543     return 0;
 544 }
 545
 546 static int decode_slice_chroma(AVCodecContext *avctx, SliceContext *slice,
 547                                uint16_t *dst, int dst_stride,
 548                                const uint8_t *buf, unsigned buf_size,
 549                                const int16_t *qmat, int log2_blocks_per_mb)
 550 {
 551     ProresContext *ctx = avctx->priv_data;
 552     LOCAL_ALIGNED_32(int16_t, blocks, [8*4*64]);
 553     int16_t *block;
 554     GetBitContext gb;
 555     int i, j, blocks_per_slice = slice->mb_count << log2_blocks_per_mb;
 556     int ret;
 557
 558     for (i = 0; i < blocks_per_slice; i++)
 559         ctx->bdsp.clear_block(blocks+(i<<6));
 560
 561     init_get_bits(&gb, buf, buf_size << 3);
 562
 563     if ((ret = decode_dc_coeffs(&gb, blocks, blocks_per_slice)) < 0)
 564         return ret;
 565     if ((ret = decode_ac_coeffs(avctx, &gb, blocks, blocks_per_slice)) < 0)
 566         return ret;
 567
 568     block = blocks;
 569     for (i = 0; i < slice->mb_count; i++) {
 570         for (j = 0; j < log2_blocks_per_mb; j++) {
 571             ctx->prodsp.idct_put(dst,              dst_stride, block+(0<<6), qmat);
 572             ctx->prodsp.idct_put(dst+4*dst_stride, dst_stride, block+(1<<6), qmat);
 573             block += 2*64;
 574             dst += 8;
 575         }
 576     }
 577     return 0;
 578 }
 579
 580 /**
 581  * Decode alpha slice plane.
 582  */
 583 static void decode_slice_alpha(ProresContext *ctx,
 584                                uint16_t *dst, int dst_stride,
 585                                const uint8_t *buf, int buf_size,
 586                                int blocks_per_slice)
 587 {
 588     GetBitContext gb;
 589     int i;
 590     LOCAL_ALIGNED_32(int16_t, blocks, [8*4*64]);
 591     int16_t *block;
 592
 593     for (i = 0; i < blocks_per_slice<<2; i++)
 594         ctx->bdsp.clear_block(blocks+(i<<6));
 595
 596     init_get_bits(&gb, buf, buf_size << 3);
 597
 598     if (ctx->alpha_info == 2) {
 599         ctx->unpack_alpha(&gb, blocks, blocks_per_slice * 4 * 64, 16);
 600     } else {
 601         ctx->unpack_alpha(&gb, blocks, blocks_per_slice * 4 * 64, 8);
 602     }
 603
 604     block = blocks;
 605
 606     for (i = 0; i < 16; i++) {
 607         memcpy(dst, block, 16 * blocks_per_slice * sizeof(*dst));
 608         dst   += dst_stride >> 1;
 609         block += 16 * blocks_per_slice;
 610     }
 611 }
 612
/**
 * Decode one slice; job callback run through avctx->execute2().
 *
 * Parses the slice header, scales the quantisation matrices by the slice's
 * quantiser, computes the destination pointers inside the output frame and
 * decodes the luma, chroma and (if present) alpha planes.
 *
 * @param avctx    codec context
 * @param arg      unused
 * @param jobnr    index of the slice in ctx->slices
 * @param threadnr unused
 * @return 0 on success, a negative AVERROR code on failure. slice->ret is
 *         set to -1 on entry and to 0 only when the whole slice decoded, so
 *         it stays negative on every error path.
 */
static int decode_slice_thread(AVCodecContext *avctx, void *arg, int jobnr, int threadnr)
{
    ProresContext *ctx = avctx->priv_data;
    SliceContext *slice = &ctx->slices[jobnr];
    const uint8_t *buf = slice->data;
    AVFrame *pic = ctx->frame;
    int i, hdr_size, qscale, log2_chroma_blocks_per_mb;
    int luma_stride, chroma_stride;
    int y_data_size, u_data_size, v_data_size, a_data_size;
    uint8_t *dest_y, *dest_u, *dest_v, *dest_a;
    LOCAL_ALIGNED_16(int16_t, qmat_luma_scaled,  [64]);
    LOCAL_ALIGNED_16(int16_t, qmat_chroma_scaled,[64]);
    int mb_x_shift;
    int ret;
    uint16_t val_no_chroma;

    /* pessimistic default; decode_picture() counts slices with ret < 0 */
    slice->ret = -1;
    //av_log(avctx, AV_LOG_INFO, "slice %d mb width %d mb x %d y %d\n",
    //       jobnr, slice->mb_count, slice->mb_x, slice->mb_y);

    // slice header
    hdr_size = buf[0] >> 3;
    /* quantiser is clipped to 1..224; values above 128 are remapped to
     * (qscale - 96) * 4 */
    qscale = av_clip(buf[1], 1, 224);
    qscale = qscale > 128 ? qscale - 96 << 2: qscale;
    y_data_size = AV_RB16(buf + 2);
    u_data_size = AV_RB16(buf + 4);
    /* V size defaults to whatever remains; a header longer than 7 bytes
     * carries it explicitly, and the remainder after it is alpha data */
    v_data_size = slice->data_size - y_data_size - u_data_size - hdr_size;
    if (hdr_size > 7) v_data_size = AV_RB16(buf + 6);
    a_data_size = slice->data_size - y_data_size - u_data_size -
                  v_data_size - hdr_size;

    if (y_data_size < 0 || u_data_size < 0 || v_data_size < 0
        || hdr_size+y_data_size+u_data_size+v_data_size > slice->data_size){
        av_log(avctx, AV_LOG_ERROR, "invalid plane data size\n");
        return AVERROR_INVALIDDATA;
    }

    buf += hdr_size;

    /* per-slice quantisation matrices */
    for (i = 0; i < 64; i++) {
        qmat_luma_scaled  [i] = ctx->qmat_luma  [i] * qscale;
        qmat_chroma_scaled[i] = ctx->qmat_chroma[i] * qscale;
    }

    /* a non-zero frame type is interlaced: each field uses every second
     * line, hence the doubled strides */
    if (ctx->frame_type == 0) {
        luma_stride   = pic->linesize[0];
        chroma_stride = pic->linesize[1];
    } else {
        luma_stride   = pic->linesize[0] << 1;
        chroma_stride = pic->linesize[1] << 1;
    }

    /* byte offset per macroblock in the chroma planes: 32 bytes (16 16-bit
     * samples) for 4:4:4, 16 bytes (8 samples) for 4:2:2 */
    if (avctx->pix_fmt == AV_PIX_FMT_YUV444P10 || avctx->pix_fmt == AV_PIX_FMT_YUVA444P10 ||
        avctx->pix_fmt == AV_PIX_FMT_YUV444P12 || avctx->pix_fmt == AV_PIX_FMT_YUVA444P12) {
        mb_x_shift = 5;
        log2_chroma_blocks_per_mb = 2;
    } else {
        mb_x_shift = 4;
        log2_chroma_blocks_per_mb = 1;
    }

    /* top-left of the slice: 16 lines per macroblock row, 32 bytes per
     * macroblock column in the luma and alpha planes */
    dest_y = pic->data[0] + (slice->mb_y << 4) * luma_stride + (slice->mb_x << 5);
    dest_u = pic->data[1] + (slice->mb_y << 4) * chroma_stride + (slice->mb_x << mb_x_shift);
    dest_v = pic->data[2] + (slice->mb_y << 4) * chroma_stride + (slice->mb_x << mb_x_shift);
    dest_a = pic->data[3] + (slice->mb_y << 4) * luma_stride + (slice->mb_x << 5);

    /* interlaced: start one line down when this picture is the bottom field
     * (second field of a TFF frame or first field of a BFF frame) */
    if (ctx->frame_type && ctx->first_field ^ ctx->frame->top_field_first) {
        dest_y += pic->linesize[0];
        dest_u += pic->linesize[1];
        dest_v += pic->linesize[2];
        dest_a += pic->linesize[3];
    }

    ret = decode_slice_luma(avctx, slice, (uint16_t*)dest_y, luma_stride,
                            buf, y_data_size, qmat_luma_scaled);
    if (ret < 0)
        return ret;

    if (!(avctx->flags & AV_CODEC_FLAG_GRAY) && (u_data_size + v_data_size) > 0) {
        ret = decode_slice_chroma(avctx, slice, (uint16_t*)dest_u, chroma_stride,
                                  buf + y_data_size, u_data_size,
                                  qmat_chroma_scaled, log2_chroma_blocks_per_mb);
        if (ret < 0)
            return ret;

        ret = decode_slice_chroma(avctx, slice, (uint16_t*)dest_v, chroma_stride,
                                  buf + y_data_size + u_data_size, v_data_size,
                                  qmat_chroma_scaled, log2_chroma_blocks_per_mb);
        if (ret < 0)
            return ret;
    }
    else {
        /* gray decoding requested or no chroma data: fill the slice's chroma
         * area (16 lines) with a constant value */
        /* number of chroma samples per line covered by this slice */
        size_t mb_max_x = slice->mb_count << (mb_x_shift - 1);
        size_t i, j;
        if (avctx->bits_per_raw_sample == 10) {
            val_no_chroma = 511;
        } else { /* 12b */
            val_no_chroma = 511 * 4;
        }
        for (i = 0; i < 16; ++i)
            for (j = 0; j < mb_max_x; ++j) {
                *(uint16_t*)(dest_u + (i * chroma_stride) + (j << 1)) = val_no_chroma;
                *(uint16_t*)(dest_v + (i * chroma_stride) + (j << 1)) = val_no_chroma;
            }
    }

    /* decode alpha plane if available */
    if (ctx->alpha_info && pic->data[3] && a_data_size)
        decode_slice_alpha(ctx, (uint16_t*)dest_a, luma_stride,
                           buf + y_data_size + u_data_size + v_data_size,
                           a_data_size, slice->mb_count);

    slice->ret = 0;
    return 0;
}
 728
 729 static int decode_picture(AVCodecContext *avctx)
 730 {
 731     ProresContext *ctx = avctx->priv_data;
 732     int i;
 733     int error = 0;
 734
 735     avctx->execute2(avctx, decode_slice_thread, NULL, NULL, ctx->slice_count);
 736
 737     for (i = 0; i < ctx->slice_count; i++)
 738         error += ctx->slices[i].ret < 0;
 739
 740     if (error)
 741         ctx->frame->decode_error_flags = FF_DECODE_ERROR_INVALID_BITSTREAM;
 742     if (error < ctx->slice_count)
 743         return 0;
 744
 745     return ctx->slices[0].ret;
 746 }
 747
 748 static int decode_frame(AVCodecContext *avctx, void *data, int *got_frame,
 749                         AVPacket *avpkt)
 750 {
 751     ProresContext *ctx = avctx->priv_data;
 752     ThreadFrame tframe = { .f = data };
 753     AVFrame *frame = data;
 754     const uint8_t *buf = avpkt->data;
 755     int buf_size = avpkt->size;
 756     int frame_hdr_size, pic_size, ret;
 757
 758     if (buf_size < 28 || AV_RL32(buf + 4) != AV_RL32("icpf")) {
 759         av_log(avctx, AV_LOG_ERROR, "invalid frame header\n");
 760         return AVERROR_INVALIDDATA;
 761     }
 762
 763     ctx->frame = frame;
 764     ctx->frame->pict_type = AV_PICTURE_TYPE_I;
 765     ctx->frame->key_frame = 1;
 766     ctx->first_field = 1;
 767
 768     buf += 8;
 769     buf_size -= 8;
 770
 771     frame_hdr_size = decode_frame_header(ctx, buf, buf_size, avctx);
 772     if (frame_hdr_size < 0)
 773         return frame_hdr_size;
 774
 775     buf += frame_hdr_size;
 776     buf_size -= frame_hdr_size;
 777
 778     if ((ret = ff_thread_get_buffer(avctx, &tframe, 0)) < 0)
 779         return ret;
 780
 781  decode_picture:
 782     pic_size = decode_picture_header(avctx, buf, buf_size);
 783     if (pic_size < 0) {
 784         av_log(avctx, AV_LOG_ERROR, "error decoding picture header\n");
 785         return pic_size;
 786     }
 787
 788     if ((ret = decode_picture(avctx)) < 0) {
 789         av_log(avctx, AV_LOG_ERROR, "error decoding picture\n");
 790         return ret;
 791     }
 792
 793     buf += pic_size;
 794     buf_size -= pic_size;
 795
 796     if (ctx->frame_type && buf_size > 0 && ctx->first_field) {
 797         ctx->first_field = 0;
 798         goto decode_picture;
 799     }
 800
 801     *got_frame      = 1;
 802
 803     return avpkt->size;
 804 }
 805
 806 #if HAVE_THREADS
 807 static int decode_init_thread_copy(AVCodecContext *avctx)
 808 {
 809     ProresContext *ctx = avctx->priv_data;
 810
 811     ctx->slices = NULL;
 812
 813     return 0;
 814 }
 815 #endif
 816
 817 static av_cold int decode_close(AVCodecContext *avctx)
 818 {
 819     ProresContext *ctx = avctx->priv_data;
 820
 821     av_freep(&ctx->slices);
 822
 823     return 0;
 824 }
 825
/**
 * Codec registration entry for the ProRes decoder.
 *
 * Advertises direct rendering (DR1) plus both slice- and frame-level
 * threading; the thread-copy initialiser is only wired in when threads are
 * enabled.
 */
AVCodec ff_prores_decoder = {
    .name           = "prores",
    .long_name      = NULL_IF_CONFIG_SMALL("ProRes (iCodec Pro)"),
    .type           = AVMEDIA_TYPE_VIDEO,
    .id             = AV_CODEC_ID_PRORES,
    .priv_data_size = sizeof(ProresContext),
    .init           = decode_init,
    .init_thread_copy = ONLY_IF_THREADS_ENABLED(decode_init_thread_copy),
    .close          = decode_close,
    .decode         = decode_frame,
    .capabilities   = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_SLICE_THREADS | AV_CODEC_CAP_FRAME_THREADS,
    .profiles       = NULL_IF_CONFIG_SMALL(ff_prores_profiles),
};